diff --git a/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/eval_dior/parsed_answers_test/eval_liqingyun@SH-IDC1-10-140-37-21_device0_rank0.log b/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/eval_dior/parsed_answers_test/eval_liqingyun@SH-IDC1-10-140-37-21_device0_rank0.log
new file mode 100644
index 0000000000000000000000000000000000000000..c512f6ea7abf7d56a153b50afea69c48cd5a9770
--- /dev/null
+++ b/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/eval_dior/parsed_answers_test/eval_liqingyun@SH-IDC1-10-140-37-21_device0_rank0.log
@@ -0,0 +1,42 @@
+2025/01/04 02:50:07 - dior test Evaluation - INFO - --------------------
+2025/01/04 02:50:09 - dior test Evaluation - INFO - Fuzzy matched vehicleicle to vehicle
+2025/01/04 02:50:10 - dior test Evaluation - INFO - Fuzzy matched vehicleicle to vehicle
+2025/01/04 02:50:11 - dior test Evaluation - INFO - Fuzzy matched groundtrackstation to trainstation
+2025/01/04 02:50:12 - dior test Evaluation - INFO - Fuzzy matched tennicle to vehicle
+2025/01/04 02:50:13 - dior test Evaluation - INFO - Fuzzy matched tennourt to tenniscourt
+2025/01/04 02:50:15 - dior test Evaluation - INFO - Fuzzy matched storgetank to storagetank
+2025/01/04 02:50:16 - dior test Evaluation - INFO - Fuzzy matched trainstationstationstation to trainstation
+2025/01/04 02:50:16 - dior test Evaluation - INFO - Fuzzy matched storank to storagetank
+2025/01/04 02:50:18 - dior test Evaluation - INFO - Fuzzy matched stadiumadiumadium to stadium
+2025/01/04 02:50:19 - dior test Evaluation - INFO - Fuzzy matched storadium to stadium
+2025/01/04 02:50:22 - dior test Evaluation - INFO -
+---------------iou_thr: 0.5---------------
+2025/01/04 02:51:06 - dior test Evaluation - INFO -
++-------------------------+-------+-------+--------+-------+
+| class | gts | dets | recall | ap |
++-------------------------+-------+-------+--------+-------+
+| airplane | 8212 | 7661 | 0.827 | 0.746 |
+| airport | 666 | 691 | 0.581 | 0.346 |
+| baseballfield | 3434 | 2940 | 0.791 | 0.682 |
+| basketballcourt | 2146 | 1951 | 0.832 | 0.758 |
+| bridge | 2589 | 2178 | 0.421 | 0.277 |
+| chimney | 1031 | 884 | 0.799 | 0.687 |
+| expressway-service-area | 1085 | 1063 | 0.846 | 0.722 |
+| expressway-toll-station | 688 | 685 | 0.749 | 0.570 |
+| dam | 538 | 590 | 0.398 | 0.195 |
+| golffield | 575 | 642 | 0.823 | 0.644 |
+| groundtrackfield | 1885 | 2179 | 0.836 | 0.636 |
+| harbor | 3105 | 3584 | 0.437 | 0.250 |
+| overpass | 1782 | 1516 | 0.552 | 0.364 |
+| ship | 35184 | 29010 | 0.677 | 0.543 |
+| stadium | 672 | 517 | 0.564 | 0.478 |
+| storagetank | 23361 | 17806 | 0.627 | 0.544 |
+| tenniscourt | 7343 | 6754 | 0.849 | 0.775 |
+| trainstation | 509 | 548 | 0.670 | 0.431 |
+| vehicle | 26640 | 17384 | 0.471 | 0.355 |
+| windmill | 2998 | 3007 | 0.780 | 0.598 |
++-------------------------+-------+-------+--------+-------+
+| mAP | | | | 0.530 |
++-------------------------+-------+-------+--------+-------+
+2025/01/04 02:51:06 - dior test Evaluation - INFO - --------------------
+
diff --git a/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/trainer_state.json b/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..446a809a3e05e780d23a05a509fa8534b9104b68
--- /dev/null
+++ b/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/trainer_state.json
@@ -0,0 +1,256942 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 100.0,
+ "eval_steps": 200.0,
+ "global_step": 36700,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [
+ {
+ "epoch": 0.0027247956403269754,
+ "grad_norm": 40.78464126586914,
+ "learning_rate": 1.8165304268846506e-08,
+ "loss": 6.8438,
+ "step": 1
+ },
+ {
+ "epoch": 0.005449591280653951,
+ "grad_norm": 44.312137603759766,
+ "learning_rate": 3.633060853769301e-08,
+ "loss": 6.8809,
+ "step": 2
+ },
+ {
+ "epoch": 0.008174386920980926,
+ "grad_norm": 44.27949523925781,
+ "learning_rate": 5.449591280653951e-08,
+ "loss": 6.8516,
+ "step": 3
+ },
+ {
+ "epoch": 0.010899182561307902,
+ "grad_norm": 40.63651657104492,
+ "learning_rate": 7.266121707538602e-08,
+ "loss": 7.0879,
+ "step": 4
+ },
+ {
+ "epoch": 0.013623978201634877,
+ "grad_norm": 39.83088302612305,
+ "learning_rate": 9.082652134423253e-08,
+ "loss": 6.8555,
+ "step": 5
+ },
+ {
+ "epoch": 0.01634877384196185,
+ "grad_norm": 38.950218200683594,
+ "learning_rate": 1.0899182561307902e-07,
+ "loss": 6.9551,
+ "step": 6
+ },
+ {
+ "epoch": 0.01907356948228883,
+ "grad_norm": 40.39432144165039,
+ "learning_rate": 1.2715712988192554e-07,
+ "loss": 6.9512,
+ "step": 7
+ },
+ {
+ "epoch": 0.021798365122615803,
+ "grad_norm": 48.991764068603516,
+ "learning_rate": 1.4532243415077205e-07,
+ "loss": 7.0898,
+ "step": 8
+ },
+ {
+ "epoch": 0.02452316076294278,
+ "grad_norm": 49.33735275268555,
+ "learning_rate": 1.6348773841961852e-07,
+ "loss": 6.8613,
+ "step": 9
+ },
+ {
+ "epoch": 0.027247956403269755,
+ "grad_norm": 61.31592559814453,
+ "learning_rate": 1.8165304268846506e-07,
+ "loss": 6.8047,
+ "step": 10
+ },
+ {
+ "epoch": 0.02997275204359673,
+ "grad_norm": 39.412933349609375,
+ "learning_rate": 1.9981834695731156e-07,
+ "loss": 6.9297,
+ "step": 11
+ },
+ {
+ "epoch": 0.0326975476839237,
+ "grad_norm": 39.78142166137695,
+ "learning_rate": 2.1798365122615804e-07,
+ "loss": 7.0254,
+ "step": 12
+ },
+ {
+ "epoch": 0.035422343324250684,
+ "grad_norm": 38.37565994262695,
+ "learning_rate": 2.3614895549500455e-07,
+ "loss": 6.9766,
+ "step": 13
+ },
+ {
+ "epoch": 0.03814713896457766,
+ "grad_norm": 51.07477951049805,
+ "learning_rate": 2.543142597638511e-07,
+ "loss": 6.9414,
+ "step": 14
+ },
+ {
+ "epoch": 0.04087193460490463,
+ "grad_norm": 38.784751892089844,
+ "learning_rate": 2.7247956403269756e-07,
+ "loss": 6.8379,
+ "step": 15
+ },
+ {
+ "epoch": 0.043596730245231606,
+ "grad_norm": 38.25511932373047,
+ "learning_rate": 2.906448683015441e-07,
+ "loss": 6.8965,
+ "step": 16
+ },
+ {
+ "epoch": 0.04632152588555858,
+ "grad_norm": 32.41145324707031,
+ "learning_rate": 3.0881017257039057e-07,
+ "loss": 6.9238,
+ "step": 17
+ },
+ {
+ "epoch": 0.04904632152588556,
+ "grad_norm": 35.66207504272461,
+ "learning_rate": 3.2697547683923705e-07,
+ "loss": 6.9258,
+ "step": 18
+ },
+ {
+ "epoch": 0.051771117166212535,
+ "grad_norm": 57.06675720214844,
+ "learning_rate": 3.4514078110808363e-07,
+ "loss": 6.8262,
+ "step": 19
+ },
+ {
+ "epoch": 0.05449591280653951,
+ "grad_norm": 36.9990119934082,
+ "learning_rate": 3.633060853769301e-07,
+ "loss": 6.9121,
+ "step": 20
+ },
+ {
+ "epoch": 0.05722070844686648,
+ "grad_norm": 56.178890228271484,
+ "learning_rate": 3.814713896457766e-07,
+ "loss": 7.1934,
+ "step": 21
+ },
+ {
+ "epoch": 0.05994550408719346,
+ "grad_norm": 44.32059097290039,
+ "learning_rate": 3.996366939146231e-07,
+ "loss": 6.8652,
+ "step": 22
+ },
+ {
+ "epoch": 0.06267029972752043,
+ "grad_norm": 46.04462432861328,
+ "learning_rate": 4.178019981834696e-07,
+ "loss": 7.0117,
+ "step": 23
+ },
+ {
+ "epoch": 0.0653950953678474,
+ "grad_norm": 57.29674530029297,
+ "learning_rate": 4.359673024523161e-07,
+ "loss": 6.8086,
+ "step": 24
+ },
+ {
+ "epoch": 0.0681198910081744,
+ "grad_norm": 34.19939041137695,
+ "learning_rate": 4.541326067211626e-07,
+ "loss": 6.5684,
+ "step": 25
+ },
+ {
+ "epoch": 0.07084468664850137,
+ "grad_norm": 36.27748107910156,
+ "learning_rate": 4.722979109900091e-07,
+ "loss": 6.9805,
+ "step": 26
+ },
+ {
+ "epoch": 0.07356948228882834,
+ "grad_norm": 33.618751525878906,
+ "learning_rate": 4.904632152588557e-07,
+ "loss": 6.873,
+ "step": 27
+ },
+ {
+ "epoch": 0.07629427792915532,
+ "grad_norm": 38.21268844604492,
+ "learning_rate": 5.086285195277022e-07,
+ "loss": 6.7188,
+ "step": 28
+ },
+ {
+ "epoch": 0.07901907356948229,
+ "grad_norm": 40.83243942260742,
+ "learning_rate": 5.267938237965486e-07,
+ "loss": 6.8965,
+ "step": 29
+ },
+ {
+ "epoch": 0.08174386920980926,
+ "grad_norm": 34.49842071533203,
+ "learning_rate": 5.449591280653951e-07,
+ "loss": 7.0137,
+ "step": 30
+ },
+ {
+ "epoch": 0.08446866485013624,
+ "grad_norm": 41.635982513427734,
+ "learning_rate": 5.631244323342416e-07,
+ "loss": 7.0996,
+ "step": 31
+ },
+ {
+ "epoch": 0.08719346049046321,
+ "grad_norm": 53.25373458862305,
+ "learning_rate": 5.812897366030882e-07,
+ "loss": 7.1289,
+ "step": 32
+ },
+ {
+ "epoch": 0.08991825613079019,
+ "grad_norm": 31.06708526611328,
+ "learning_rate": 5.994550408719347e-07,
+ "loss": 6.5547,
+ "step": 33
+ },
+ {
+ "epoch": 0.09264305177111716,
+ "grad_norm": 53.0910530090332,
+ "learning_rate": 6.176203451407811e-07,
+ "loss": 6.9785,
+ "step": 34
+ },
+ {
+ "epoch": 0.09536784741144415,
+ "grad_norm": 38.88106918334961,
+ "learning_rate": 6.357856494096276e-07,
+ "loss": 6.8457,
+ "step": 35
+ },
+ {
+ "epoch": 0.09809264305177112,
+ "grad_norm": 37.74711608886719,
+ "learning_rate": 6.539509536784741e-07,
+ "loss": 6.7148,
+ "step": 36
+ },
+ {
+ "epoch": 0.1008174386920981,
+ "grad_norm": 63.326045989990234,
+ "learning_rate": 6.721162579473206e-07,
+ "loss": 6.7129,
+ "step": 37
+ },
+ {
+ "epoch": 0.10354223433242507,
+ "grad_norm": 33.27577209472656,
+ "learning_rate": 6.902815622161673e-07,
+ "loss": 6.7168,
+ "step": 38
+ },
+ {
+ "epoch": 0.10626702997275204,
+ "grad_norm": 31.722137451171875,
+ "learning_rate": 7.084468664850137e-07,
+ "loss": 6.7754,
+ "step": 39
+ },
+ {
+ "epoch": 0.10899182561307902,
+ "grad_norm": 44.16450881958008,
+ "learning_rate": 7.266121707538602e-07,
+ "loss": 6.8105,
+ "step": 40
+ },
+ {
+ "epoch": 0.11171662125340599,
+ "grad_norm": 38.69147491455078,
+ "learning_rate": 7.447774750227067e-07,
+ "loss": 6.6855,
+ "step": 41
+ },
+ {
+ "epoch": 0.11444141689373297,
+ "grad_norm": 27.381261825561523,
+ "learning_rate": 7.629427792915532e-07,
+ "loss": 6.623,
+ "step": 42
+ },
+ {
+ "epoch": 0.11716621253405994,
+ "grad_norm": 33.229217529296875,
+ "learning_rate": 7.811080835603997e-07,
+ "loss": 6.6211,
+ "step": 43
+ },
+ {
+ "epoch": 0.11989100817438691,
+ "grad_norm": 42.80620193481445,
+ "learning_rate": 7.992733878292462e-07,
+ "loss": 6.8574,
+ "step": 44
+ },
+ {
+ "epoch": 0.1226158038147139,
+ "grad_norm": 33.26158905029297,
+ "learning_rate": 8.174386920980927e-07,
+ "loss": 6.375,
+ "step": 45
+ },
+ {
+ "epoch": 0.12534059945504086,
+ "grad_norm": 26.46646499633789,
+ "learning_rate": 8.356039963669392e-07,
+ "loss": 6.3516,
+ "step": 46
+ },
+ {
+ "epoch": 0.12806539509536785,
+ "grad_norm": 32.222042083740234,
+ "learning_rate": 8.537693006357857e-07,
+ "loss": 6.4531,
+ "step": 47
+ },
+ {
+ "epoch": 0.1307901907356948,
+ "grad_norm": 38.365352630615234,
+ "learning_rate": 8.719346049046322e-07,
+ "loss": 6.6836,
+ "step": 48
+ },
+ {
+ "epoch": 0.1335149863760218,
+ "grad_norm": 28.54322052001953,
+ "learning_rate": 8.900999091734786e-07,
+ "loss": 6.498,
+ "step": 49
+ },
+ {
+ "epoch": 0.1362397820163488,
+ "grad_norm": 28.877483367919922,
+ "learning_rate": 9.082652134423252e-07,
+ "loss": 6.4141,
+ "step": 50
+ },
+ {
+ "epoch": 0.13896457765667575,
+ "grad_norm": 27.959054946899414,
+ "learning_rate": 9.264305177111717e-07,
+ "loss": 6.2188,
+ "step": 51
+ },
+ {
+ "epoch": 0.14168937329700274,
+ "grad_norm": 23.965312957763672,
+ "learning_rate": 9.445958219800182e-07,
+ "loss": 6.3184,
+ "step": 52
+ },
+ {
+ "epoch": 0.1444141689373297,
+ "grad_norm": 59.07518768310547,
+ "learning_rate": 9.627611262488648e-07,
+ "loss": 6.5605,
+ "step": 53
+ },
+ {
+ "epoch": 0.14713896457765668,
+ "grad_norm": 29.662635803222656,
+ "learning_rate": 9.809264305177114e-07,
+ "loss": 6.2461,
+ "step": 54
+ },
+ {
+ "epoch": 0.14986376021798364,
+ "grad_norm": 29.20414161682129,
+ "learning_rate": 9.990917347865577e-07,
+ "loss": 6.3477,
+ "step": 55
+ },
+ {
+ "epoch": 0.15258855585831063,
+ "grad_norm": 37.64859390258789,
+ "learning_rate": 1.0172570390554043e-06,
+ "loss": 6.0879,
+ "step": 56
+ },
+ {
+ "epoch": 0.1553133514986376,
+ "grad_norm": 30.13629150390625,
+ "learning_rate": 1.0354223433242507e-06,
+ "loss": 6.293,
+ "step": 57
+ },
+ {
+ "epoch": 0.15803814713896458,
+ "grad_norm": 21.255197525024414,
+ "learning_rate": 1.0535876475930973e-06,
+ "loss": 6.3887,
+ "step": 58
+ },
+ {
+ "epoch": 0.16076294277929154,
+ "grad_norm": 29.932714462280273,
+ "learning_rate": 1.0717529518619439e-06,
+ "loss": 6.1172,
+ "step": 59
+ },
+ {
+ "epoch": 0.16348773841961853,
+ "grad_norm": 23.474641799926758,
+ "learning_rate": 1.0899182561307902e-06,
+ "loss": 6.1816,
+ "step": 60
+ },
+ {
+ "epoch": 0.16621253405994552,
+ "grad_norm": 22.93517303466797,
+ "learning_rate": 1.1080835603996368e-06,
+ "loss": 6.3008,
+ "step": 61
+ },
+ {
+ "epoch": 0.16893732970027248,
+ "grad_norm": 19.647396087646484,
+ "learning_rate": 1.1262488646684832e-06,
+ "loss": 6.0918,
+ "step": 62
+ },
+ {
+ "epoch": 0.17166212534059946,
+ "grad_norm": 25.928668975830078,
+ "learning_rate": 1.1444141689373298e-06,
+ "loss": 5.9766,
+ "step": 63
+ },
+ {
+ "epoch": 0.17438692098092642,
+ "grad_norm": 23.329084396362305,
+ "learning_rate": 1.1625794732061764e-06,
+ "loss": 5.9316,
+ "step": 64
+ },
+ {
+ "epoch": 0.1771117166212534,
+ "grad_norm": 28.719526290893555,
+ "learning_rate": 1.1807447774750227e-06,
+ "loss": 5.9121,
+ "step": 65
+ },
+ {
+ "epoch": 0.17983651226158037,
+ "grad_norm": 23.34282112121582,
+ "learning_rate": 1.1989100817438693e-06,
+ "loss": 5.7422,
+ "step": 66
+ },
+ {
+ "epoch": 0.18256130790190736,
+ "grad_norm": 23.170896530151367,
+ "learning_rate": 1.217075386012716e-06,
+ "loss": 5.7812,
+ "step": 67
+ },
+ {
+ "epoch": 0.18528610354223432,
+ "grad_norm": 17.787656784057617,
+ "learning_rate": 1.2352406902815623e-06,
+ "loss": 5.9316,
+ "step": 68
+ },
+ {
+ "epoch": 0.1880108991825613,
+ "grad_norm": 28.331361770629883,
+ "learning_rate": 1.2534059945504087e-06,
+ "loss": 5.6387,
+ "step": 69
+ },
+ {
+ "epoch": 0.1907356948228883,
+ "grad_norm": 20.090055465698242,
+ "learning_rate": 1.2715712988192552e-06,
+ "loss": 5.7715,
+ "step": 70
+ },
+ {
+ "epoch": 0.19346049046321526,
+ "grad_norm": 20.68782615661621,
+ "learning_rate": 1.2897366030881018e-06,
+ "loss": 5.457,
+ "step": 71
+ },
+ {
+ "epoch": 0.19618528610354224,
+ "grad_norm": 16.90093421936035,
+ "learning_rate": 1.3079019073569482e-06,
+ "loss": 5.6348,
+ "step": 72
+ },
+ {
+ "epoch": 0.1989100817438692,
+ "grad_norm": 50.501258850097656,
+ "learning_rate": 1.3260672116257948e-06,
+ "loss": 5.5293,
+ "step": 73
+ },
+ {
+ "epoch": 0.2016348773841962,
+ "grad_norm": 18.65361213684082,
+ "learning_rate": 1.3442325158946412e-06,
+ "loss": 5.4395,
+ "step": 74
+ },
+ {
+ "epoch": 0.20435967302452315,
+ "grad_norm": 32.909339904785156,
+ "learning_rate": 1.362397820163488e-06,
+ "loss": 5.5742,
+ "step": 75
+ },
+ {
+ "epoch": 0.20708446866485014,
+ "grad_norm": 17.824298858642578,
+ "learning_rate": 1.3805631244323345e-06,
+ "loss": 5.6914,
+ "step": 76
+ },
+ {
+ "epoch": 0.2098092643051771,
+ "grad_norm": 20.759225845336914,
+ "learning_rate": 1.398728428701181e-06,
+ "loss": 5.418,
+ "step": 77
+ },
+ {
+ "epoch": 0.2125340599455041,
+ "grad_norm": 20.385583877563477,
+ "learning_rate": 1.4168937329700275e-06,
+ "loss": 5.3809,
+ "step": 78
+ },
+ {
+ "epoch": 0.21525885558583105,
+ "grad_norm": 16.89611053466797,
+ "learning_rate": 1.4350590372388739e-06,
+ "loss": 5.4844,
+ "step": 79
+ },
+ {
+ "epoch": 0.21798365122615804,
+ "grad_norm": 22.670808792114258,
+ "learning_rate": 1.4532243415077205e-06,
+ "loss": 5.3105,
+ "step": 80
+ },
+ {
+ "epoch": 0.22070844686648503,
+ "grad_norm": 20.921186447143555,
+ "learning_rate": 1.471389645776567e-06,
+ "loss": 5.2852,
+ "step": 81
+ },
+ {
+ "epoch": 0.22343324250681199,
+ "grad_norm": 18.31825065612793,
+ "learning_rate": 1.4895549500454134e-06,
+ "loss": 5.4473,
+ "step": 82
+ },
+ {
+ "epoch": 0.22615803814713897,
+ "grad_norm": 17.247661590576172,
+ "learning_rate": 1.50772025431426e-06,
+ "loss": 5.2773,
+ "step": 83
+ },
+ {
+ "epoch": 0.22888283378746593,
+ "grad_norm": 26.34626579284668,
+ "learning_rate": 1.5258855585831064e-06,
+ "loss": 5.291,
+ "step": 84
+ },
+ {
+ "epoch": 0.23160762942779292,
+ "grad_norm": 21.106550216674805,
+ "learning_rate": 1.544050862851953e-06,
+ "loss": 5.4531,
+ "step": 85
+ },
+ {
+ "epoch": 0.23433242506811988,
+ "grad_norm": 25.7116756439209,
+ "learning_rate": 1.5622161671207993e-06,
+ "loss": 5.2168,
+ "step": 86
+ },
+ {
+ "epoch": 0.23705722070844687,
+ "grad_norm": 21.119768142700195,
+ "learning_rate": 1.580381471389646e-06,
+ "loss": 5.3438,
+ "step": 87
+ },
+ {
+ "epoch": 0.23978201634877383,
+ "grad_norm": 20.929882049560547,
+ "learning_rate": 1.5985467756584925e-06,
+ "loss": 5.1504,
+ "step": 88
+ },
+ {
+ "epoch": 0.24250681198910082,
+ "grad_norm": 29.220802307128906,
+ "learning_rate": 1.6167120799273389e-06,
+ "loss": 4.918,
+ "step": 89
+ },
+ {
+ "epoch": 0.2452316076294278,
+ "grad_norm": 35.418941497802734,
+ "learning_rate": 1.6348773841961855e-06,
+ "loss": 5.0137,
+ "step": 90
+ },
+ {
+ "epoch": 0.24795640326975477,
+ "grad_norm": 16.804855346679688,
+ "learning_rate": 1.6530426884650318e-06,
+ "loss": 5.1211,
+ "step": 91
+ },
+ {
+ "epoch": 0.2506811989100817,
+ "grad_norm": 17.878726959228516,
+ "learning_rate": 1.6712079927338784e-06,
+ "loss": 5.1953,
+ "step": 92
+ },
+ {
+ "epoch": 0.25340599455040874,
+ "grad_norm": 18.441425323486328,
+ "learning_rate": 1.689373297002725e-06,
+ "loss": 4.7861,
+ "step": 93
+ },
+ {
+ "epoch": 0.2561307901907357,
+ "grad_norm": 21.388906478881836,
+ "learning_rate": 1.7075386012715714e-06,
+ "loss": 4.8379,
+ "step": 94
+ },
+ {
+ "epoch": 0.25885558583106266,
+ "grad_norm": 19.879146575927734,
+ "learning_rate": 1.725703905540418e-06,
+ "loss": 4.7842,
+ "step": 95
+ },
+ {
+ "epoch": 0.2615803814713896,
+ "grad_norm": 24.641145706176758,
+ "learning_rate": 1.7438692098092643e-06,
+ "loss": 4.9785,
+ "step": 96
+ },
+ {
+ "epoch": 0.26430517711171664,
+ "grad_norm": 13.113323211669922,
+ "learning_rate": 1.762034514078111e-06,
+ "loss": 4.6279,
+ "step": 97
+ },
+ {
+ "epoch": 0.2670299727520436,
+ "grad_norm": 16.05596923828125,
+ "learning_rate": 1.7801998183469573e-06,
+ "loss": 4.3711,
+ "step": 98
+ },
+ {
+ "epoch": 0.26975476839237056,
+ "grad_norm": 14.967947006225586,
+ "learning_rate": 1.7983651226158039e-06,
+ "loss": 4.376,
+ "step": 99
+ },
+ {
+ "epoch": 0.2724795640326976,
+ "grad_norm": 15.026629447937012,
+ "learning_rate": 1.8165304268846505e-06,
+ "loss": 5.0801,
+ "step": 100
+ },
+ {
+ "epoch": 0.27520435967302453,
+ "grad_norm": 15.951396942138672,
+ "learning_rate": 1.8346957311534968e-06,
+ "loss": 4.8525,
+ "step": 101
+ },
+ {
+ "epoch": 0.2779291553133515,
+ "grad_norm": 13.121307373046875,
+ "learning_rate": 1.8528610354223434e-06,
+ "loss": 4.4746,
+ "step": 102
+ },
+ {
+ "epoch": 0.28065395095367845,
+ "grad_norm": 14.952683448791504,
+ "learning_rate": 1.8710263396911898e-06,
+ "loss": 4.665,
+ "step": 103
+ },
+ {
+ "epoch": 0.28337874659400547,
+ "grad_norm": 13.740148544311523,
+ "learning_rate": 1.8891916439600364e-06,
+ "loss": 4.3633,
+ "step": 104
+ },
+ {
+ "epoch": 0.28610354223433243,
+ "grad_norm": 15.738082885742188,
+ "learning_rate": 1.907356948228883e-06,
+ "loss": 4.5303,
+ "step": 105
+ },
+ {
+ "epoch": 0.2888283378746594,
+ "grad_norm": 12.909492492675781,
+ "learning_rate": 1.9255222524977295e-06,
+ "loss": 4.3691,
+ "step": 106
+ },
+ {
+ "epoch": 0.29155313351498635,
+ "grad_norm": 15.026860237121582,
+ "learning_rate": 1.943687556766576e-06,
+ "loss": 4.6152,
+ "step": 107
+ },
+ {
+ "epoch": 0.29427792915531337,
+ "grad_norm": 13.496101379394531,
+ "learning_rate": 1.9618528610354227e-06,
+ "loss": 4.2588,
+ "step": 108
+ },
+ {
+ "epoch": 0.2970027247956403,
+ "grad_norm": 14.526864051818848,
+ "learning_rate": 1.9800181653042693e-06,
+ "loss": 4.4912,
+ "step": 109
+ },
+ {
+ "epoch": 0.2997275204359673,
+ "grad_norm": 12.712934494018555,
+ "learning_rate": 1.9981834695731155e-06,
+ "loss": 4.4111,
+ "step": 110
+ },
+ {
+ "epoch": 0.3024523160762943,
+ "grad_norm": 11.968435287475586,
+ "learning_rate": 2.016348773841962e-06,
+ "loss": 4.4316,
+ "step": 111
+ },
+ {
+ "epoch": 0.30517711171662126,
+ "grad_norm": 13.326701164245605,
+ "learning_rate": 2.0345140781108086e-06,
+ "loss": 4.5,
+ "step": 112
+ },
+ {
+ "epoch": 0.3079019073569482,
+ "grad_norm": 16.02067756652832,
+ "learning_rate": 2.0526793823796552e-06,
+ "loss": 4.124,
+ "step": 113
+ },
+ {
+ "epoch": 0.3106267029972752,
+ "grad_norm": 13.210917472839355,
+ "learning_rate": 2.0708446866485014e-06,
+ "loss": 4.3545,
+ "step": 114
+ },
+ {
+ "epoch": 0.3133514986376022,
+ "grad_norm": 12.205485343933105,
+ "learning_rate": 2.089009990917348e-06,
+ "loss": 4.6543,
+ "step": 115
+ },
+ {
+ "epoch": 0.31607629427792916,
+ "grad_norm": 11.650239944458008,
+ "learning_rate": 2.1071752951861945e-06,
+ "loss": 4.3682,
+ "step": 116
+ },
+ {
+ "epoch": 0.3188010899182561,
+ "grad_norm": 11.849342346191406,
+ "learning_rate": 2.125340599455041e-06,
+ "loss": 4.4482,
+ "step": 117
+ },
+ {
+ "epoch": 0.3215258855585831,
+ "grad_norm": 10.80008316040039,
+ "learning_rate": 2.1435059037238877e-06,
+ "loss": 3.9756,
+ "step": 118
+ },
+ {
+ "epoch": 0.3242506811989101,
+ "grad_norm": 12.67882251739502,
+ "learning_rate": 2.161671207992734e-06,
+ "loss": 4.2832,
+ "step": 119
+ },
+ {
+ "epoch": 0.32697547683923706,
+ "grad_norm": 10.75010871887207,
+ "learning_rate": 2.1798365122615805e-06,
+ "loss": 4.3525,
+ "step": 120
+ },
+ {
+ "epoch": 0.329700272479564,
+ "grad_norm": 10.905150413513184,
+ "learning_rate": 2.198001816530427e-06,
+ "loss": 4.3975,
+ "step": 121
+ },
+ {
+ "epoch": 0.33242506811989103,
+ "grad_norm": 12.39403247833252,
+ "learning_rate": 2.2161671207992736e-06,
+ "loss": 4.5381,
+ "step": 122
+ },
+ {
+ "epoch": 0.335149863760218,
+ "grad_norm": 13.479368209838867,
+ "learning_rate": 2.2343324250681202e-06,
+ "loss": 3.8682,
+ "step": 123
+ },
+ {
+ "epoch": 0.33787465940054495,
+ "grad_norm": 13.995524406433105,
+ "learning_rate": 2.2524977293369664e-06,
+ "loss": 4.3496,
+ "step": 124
+ },
+ {
+ "epoch": 0.3405994550408719,
+ "grad_norm": 12.977371215820312,
+ "learning_rate": 2.270663033605813e-06,
+ "loss": 4.0049,
+ "step": 125
+ },
+ {
+ "epoch": 0.34332425068119893,
+ "grad_norm": 11.538091659545898,
+ "learning_rate": 2.2888283378746596e-06,
+ "loss": 4.4365,
+ "step": 126
+ },
+ {
+ "epoch": 0.3460490463215259,
+ "grad_norm": 12.014766693115234,
+ "learning_rate": 2.306993642143506e-06,
+ "loss": 4.0898,
+ "step": 127
+ },
+ {
+ "epoch": 0.34877384196185285,
+ "grad_norm": 10.364009857177734,
+ "learning_rate": 2.3251589464123527e-06,
+ "loss": 4.292,
+ "step": 128
+ },
+ {
+ "epoch": 0.35149863760217986,
+ "grad_norm": 10.310364723205566,
+ "learning_rate": 2.343324250681199e-06,
+ "loss": 3.9658,
+ "step": 129
+ },
+ {
+ "epoch": 0.3542234332425068,
+ "grad_norm": 14.921072959899902,
+ "learning_rate": 2.3614895549500455e-06,
+ "loss": 3.9932,
+ "step": 130
+ },
+ {
+ "epoch": 0.3569482288828338,
+ "grad_norm": 11.562774658203125,
+ "learning_rate": 2.379654859218892e-06,
+ "loss": 4.292,
+ "step": 131
+ },
+ {
+ "epoch": 0.35967302452316074,
+ "grad_norm": 12.198079109191895,
+ "learning_rate": 2.3978201634877386e-06,
+ "loss": 4.2441,
+ "step": 132
+ },
+ {
+ "epoch": 0.36239782016348776,
+ "grad_norm": 12.380412101745605,
+ "learning_rate": 2.415985467756585e-06,
+ "loss": 4.2373,
+ "step": 133
+ },
+ {
+ "epoch": 0.3651226158038147,
+ "grad_norm": 11.048654556274414,
+ "learning_rate": 2.434150772025432e-06,
+ "loss": 3.998,
+ "step": 134
+ },
+ {
+ "epoch": 0.3678474114441417,
+ "grad_norm": 17.524181365966797,
+ "learning_rate": 2.4523160762942784e-06,
+ "loss": 4.0967,
+ "step": 135
+ },
+ {
+ "epoch": 0.37057220708446864,
+ "grad_norm": 12.678315162658691,
+ "learning_rate": 2.4704813805631246e-06,
+ "loss": 4.1025,
+ "step": 136
+ },
+ {
+ "epoch": 0.37329700272479566,
+ "grad_norm": 10.025920867919922,
+ "learning_rate": 2.488646684831971e-06,
+ "loss": 4.0293,
+ "step": 137
+ },
+ {
+ "epoch": 0.3760217983651226,
+ "grad_norm": 14.001442909240723,
+ "learning_rate": 2.5068119891008173e-06,
+ "loss": 4.0107,
+ "step": 138
+ },
+ {
+ "epoch": 0.3787465940054496,
+ "grad_norm": 13.694280624389648,
+ "learning_rate": 2.5249772933696643e-06,
+ "loss": 3.9805,
+ "step": 139
+ },
+ {
+ "epoch": 0.3814713896457766,
+ "grad_norm": 10.68122673034668,
+ "learning_rate": 2.5431425976385105e-06,
+ "loss": 3.8984,
+ "step": 140
+ },
+ {
+ "epoch": 0.38419618528610355,
+ "grad_norm": 17.292200088500977,
+ "learning_rate": 2.561307901907357e-06,
+ "loss": 3.8594,
+ "step": 141
+ },
+ {
+ "epoch": 0.3869209809264305,
+ "grad_norm": 11.216814041137695,
+ "learning_rate": 2.5794732061762036e-06,
+ "loss": 3.9932,
+ "step": 142
+ },
+ {
+ "epoch": 0.3896457765667575,
+ "grad_norm": 11.111741065979004,
+ "learning_rate": 2.5976385104450502e-06,
+ "loss": 3.8643,
+ "step": 143
+ },
+ {
+ "epoch": 0.3923705722070845,
+ "grad_norm": 12.438227653503418,
+ "learning_rate": 2.6158038147138964e-06,
+ "loss": 3.7656,
+ "step": 144
+ },
+ {
+ "epoch": 0.39509536784741145,
+ "grad_norm": 11.749055862426758,
+ "learning_rate": 2.6339691189827434e-06,
+ "loss": 3.8945,
+ "step": 145
+ },
+ {
+ "epoch": 0.3978201634877384,
+ "grad_norm": 12.600846290588379,
+ "learning_rate": 2.6521344232515896e-06,
+ "loss": 4.1074,
+ "step": 146
+ },
+ {
+ "epoch": 0.40054495912806537,
+ "grad_norm": 10.880453109741211,
+ "learning_rate": 2.670299727520436e-06,
+ "loss": 4.0225,
+ "step": 147
+ },
+ {
+ "epoch": 0.4032697547683924,
+ "grad_norm": 10.751895904541016,
+ "learning_rate": 2.6884650317892823e-06,
+ "loss": 4.0391,
+ "step": 148
+ },
+ {
+ "epoch": 0.40599455040871935,
+ "grad_norm": 12.65353775024414,
+ "learning_rate": 2.7066303360581293e-06,
+ "loss": 4.0244,
+ "step": 149
+ },
+ {
+ "epoch": 0.4087193460490463,
+ "grad_norm": 13.534128189086914,
+ "learning_rate": 2.724795640326976e-06,
+ "loss": 3.7412,
+ "step": 150
+ },
+ {
+ "epoch": 0.4114441416893733,
+ "grad_norm": 13.41270923614502,
+ "learning_rate": 2.742960944595822e-06,
+ "loss": 3.8105,
+ "step": 151
+ },
+ {
+ "epoch": 0.4141689373297003,
+ "grad_norm": 11.690704345703125,
+ "learning_rate": 2.761126248864669e-06,
+ "loss": 4.0684,
+ "step": 152
+ },
+ {
+ "epoch": 0.41689373297002724,
+ "grad_norm": 12.114771842956543,
+ "learning_rate": 2.7792915531335152e-06,
+ "loss": 3.751,
+ "step": 153
+ },
+ {
+ "epoch": 0.4196185286103542,
+ "grad_norm": 46.29283142089844,
+ "learning_rate": 2.797456857402362e-06,
+ "loss": 3.875,
+ "step": 154
+ },
+ {
+ "epoch": 0.4223433242506812,
+ "grad_norm": 15.252677917480469,
+ "learning_rate": 2.815622161671208e-06,
+ "loss": 3.8926,
+ "step": 155
+ },
+ {
+ "epoch": 0.4250681198910082,
+ "grad_norm": 9.994403839111328,
+ "learning_rate": 2.833787465940055e-06,
+ "loss": 3.6943,
+ "step": 156
+ },
+ {
+ "epoch": 0.42779291553133514,
+ "grad_norm": 12.046945571899414,
+ "learning_rate": 2.851952770208901e-06,
+ "loss": 3.8477,
+ "step": 157
+ },
+ {
+ "epoch": 0.4305177111716621,
+ "grad_norm": 10.81486701965332,
+ "learning_rate": 2.8701180744777477e-06,
+ "loss": 3.9033,
+ "step": 158
+ },
+ {
+ "epoch": 0.4332425068119891,
+ "grad_norm": 10.982769966125488,
+ "learning_rate": 2.8882833787465943e-06,
+ "loss": 3.707,
+ "step": 159
+ },
+ {
+ "epoch": 0.4359673024523161,
+ "grad_norm": 21.560009002685547,
+ "learning_rate": 2.906448683015441e-06,
+ "loss": 3.709,
+ "step": 160
+ },
+ {
+ "epoch": 0.43869209809264303,
+ "grad_norm": 10.339600563049316,
+ "learning_rate": 2.924613987284287e-06,
+ "loss": 3.6982,
+ "step": 161
+ },
+ {
+ "epoch": 0.44141689373297005,
+ "grad_norm": 12.688766479492188,
+ "learning_rate": 2.942779291553134e-06,
+ "loss": 3.7021,
+ "step": 162
+ },
+ {
+ "epoch": 0.444141689373297,
+ "grad_norm": 13.196794509887695,
+ "learning_rate": 2.9609445958219802e-06,
+ "loss": 3.5156,
+ "step": 163
+ },
+ {
+ "epoch": 0.44686648501362397,
+ "grad_norm": 11.564620971679688,
+ "learning_rate": 2.979109900090827e-06,
+ "loss": 3.8828,
+ "step": 164
+ },
+ {
+ "epoch": 0.44959128065395093,
+ "grad_norm": 10.873297691345215,
+ "learning_rate": 2.997275204359673e-06,
+ "loss": 3.7412,
+ "step": 165
+ },
+ {
+ "epoch": 0.45231607629427795,
+ "grad_norm": 11.341376304626465,
+ "learning_rate": 3.01544050862852e-06,
+ "loss": 3.7471,
+ "step": 166
+ },
+ {
+ "epoch": 0.4550408719346049,
+ "grad_norm": 12.239847183227539,
+ "learning_rate": 3.033605812897366e-06,
+ "loss": 3.6182,
+ "step": 167
+ },
+ {
+ "epoch": 0.45776566757493187,
+ "grad_norm": 10.07335376739502,
+ "learning_rate": 3.0517711171662127e-06,
+ "loss": 3.5586,
+ "step": 168
+ },
+ {
+ "epoch": 0.4604904632152589,
+ "grad_norm": 12.485919952392578,
+ "learning_rate": 3.069936421435059e-06,
+ "loss": 3.7471,
+ "step": 169
+ },
+ {
+ "epoch": 0.46321525885558584,
+ "grad_norm": 13.17069149017334,
+ "learning_rate": 3.088101725703906e-06,
+ "loss": 3.79,
+ "step": 170
+ },
+ {
+ "epoch": 0.4659400544959128,
+ "grad_norm": 10.066970825195312,
+ "learning_rate": 3.106267029972752e-06,
+ "loss": 3.8877,
+ "step": 171
+ },
+ {
+ "epoch": 0.46866485013623976,
+ "grad_norm": 10.02057933807373,
+ "learning_rate": 3.1244323342415987e-06,
+ "loss": 3.8125,
+ "step": 172
+ },
+ {
+ "epoch": 0.4713896457765668,
+ "grad_norm": 9.856107711791992,
+ "learning_rate": 3.1425976385104452e-06,
+ "loss": 3.46,
+ "step": 173
+ },
+ {
+ "epoch": 0.47411444141689374,
+ "grad_norm": 9.71706771850586,
+ "learning_rate": 3.160762942779292e-06,
+ "loss": 3.7637,
+ "step": 174
+ },
+ {
+ "epoch": 0.4768392370572207,
+ "grad_norm": 10.88630199432373,
+ "learning_rate": 3.178928247048138e-06,
+ "loss": 3.6582,
+ "step": 175
+ },
+ {
+ "epoch": 0.47956403269754766,
+ "grad_norm": 14.558564186096191,
+ "learning_rate": 3.197093551316985e-06,
+ "loss": 3.7422,
+ "step": 176
+ },
+ {
+ "epoch": 0.4822888283378747,
+ "grad_norm": 16.139097213745117,
+ "learning_rate": 3.215258855585831e-06,
+ "loss": 3.7441,
+ "step": 177
+ },
+ {
+ "epoch": 0.48501362397820164,
+ "grad_norm": 9.087676048278809,
+ "learning_rate": 3.2334241598546777e-06,
+ "loss": 3.6074,
+ "step": 178
+ },
+ {
+ "epoch": 0.4877384196185286,
+ "grad_norm": 11.948226928710938,
+ "learning_rate": 3.2515894641235247e-06,
+ "loss": 3.5625,
+ "step": 179
+ },
+ {
+ "epoch": 0.4904632152588556,
+ "grad_norm": 10.44946002960205,
+ "learning_rate": 3.269754768392371e-06,
+ "loss": 3.6328,
+ "step": 180
+ },
+ {
+ "epoch": 0.49318801089918257,
+ "grad_norm": 13.133516311645508,
+ "learning_rate": 3.2879200726612175e-06,
+ "loss": 3.7539,
+ "step": 181
+ },
+ {
+ "epoch": 0.49591280653950953,
+ "grad_norm": 9.692259788513184,
+ "learning_rate": 3.3060853769300637e-06,
+ "loss": 3.4502,
+ "step": 182
+ },
+ {
+ "epoch": 0.4986376021798365,
+ "grad_norm": 14.369646072387695,
+ "learning_rate": 3.3242506811989107e-06,
+ "loss": 3.4297,
+ "step": 183
+ },
+ {
+ "epoch": 0.5013623978201635,
+ "grad_norm": 14.707884788513184,
+ "learning_rate": 3.342415985467757e-06,
+ "loss": 3.4756,
+ "step": 184
+ },
+ {
+ "epoch": 0.5040871934604905,
+ "grad_norm": 11.313895225524902,
+ "learning_rate": 3.3605812897366034e-06,
+ "loss": 3.7871,
+ "step": 185
+ },
+ {
+ "epoch": 0.5068119891008175,
+ "grad_norm": 12.058860778808594,
+ "learning_rate": 3.37874659400545e-06,
+ "loss": 3.4521,
+ "step": 186
+ },
+ {
+ "epoch": 0.5095367847411444,
+ "grad_norm": 9.204839706420898,
+ "learning_rate": 3.3969118982742966e-06,
+ "loss": 3.623,
+ "step": 187
+ },
+ {
+ "epoch": 0.5122615803814714,
+ "grad_norm": 16.05647087097168,
+ "learning_rate": 3.4150772025431427e-06,
+ "loss": 3.5137,
+ "step": 188
+ },
+ {
+ "epoch": 0.5149863760217984,
+ "grad_norm": 11.145015716552734,
+ "learning_rate": 3.4332425068119898e-06,
+ "loss": 3.5723,
+ "step": 189
+ },
+ {
+ "epoch": 0.5177111716621253,
+ "grad_norm": 10.855523109436035,
+ "learning_rate": 3.451407811080836e-06,
+ "loss": 3.2344,
+ "step": 190
+ },
+ {
+ "epoch": 0.5204359673024523,
+ "grad_norm": 10.985532760620117,
+ "learning_rate": 3.4695731153496825e-06,
+ "loss": 3.6309,
+ "step": 191
+ },
+ {
+ "epoch": 0.5231607629427792,
+ "grad_norm": 12.266671180725098,
+ "learning_rate": 3.4877384196185287e-06,
+ "loss": 3.3369,
+ "step": 192
+ },
+ {
+ "epoch": 0.5258855585831063,
+ "grad_norm": 10.597880363464355,
+ "learning_rate": 3.5059037238873757e-06,
+ "loss": 3.4443,
+ "step": 193
+ },
+ {
+ "epoch": 0.5286103542234333,
+ "grad_norm": 19.650754928588867,
+ "learning_rate": 3.524069028156222e-06,
+ "loss": 3.5801,
+ "step": 194
+ },
+ {
+ "epoch": 0.5313351498637602,
+ "grad_norm": 11.14974308013916,
+ "learning_rate": 3.5422343324250684e-06,
+ "loss": 3.4766,
+ "step": 195
+ },
+ {
+ "epoch": 0.5340599455040872,
+ "grad_norm": 11.0927734375,
+ "learning_rate": 3.5603996366939146e-06,
+ "loss": 3.3281,
+ "step": 196
+ },
+ {
+ "epoch": 0.5367847411444142,
+ "grad_norm": 10.628003120422363,
+ "learning_rate": 3.5785649409627616e-06,
+ "loss": 3.293,
+ "step": 197
+ },
+ {
+ "epoch": 0.5395095367847411,
+ "grad_norm": 10.564107894897461,
+ "learning_rate": 3.5967302452316077e-06,
+ "loss": 3.1475,
+ "step": 198
+ },
+ {
+ "epoch": 0.5422343324250681,
+ "grad_norm": 13.25076961517334,
+ "learning_rate": 3.6148955495004543e-06,
+ "loss": 3.4648,
+ "step": 199
+ },
+ {
+ "epoch": 0.5449591280653951,
+ "grad_norm": 14.788480758666992,
+ "learning_rate": 3.633060853769301e-06,
+ "loss": 3.4941,
+ "step": 200
+ },
+ {
+ "epoch": 0.547683923705722,
+ "grad_norm": 9.797980308532715,
+ "learning_rate": 3.6512261580381475e-06,
+ "loss": 3.1133,
+ "step": 201
+ },
+ {
+ "epoch": 0.5504087193460491,
+ "grad_norm": 13.813182830810547,
+ "learning_rate": 3.6693914623069937e-06,
+ "loss": 3.3164,
+ "step": 202
+ },
+ {
+ "epoch": 0.553133514986376,
+ "grad_norm": 15.10222053527832,
+ "learning_rate": 3.6875567665758407e-06,
+ "loss": 3.5234,
+ "step": 203
+ },
+ {
+ "epoch": 0.555858310626703,
+ "grad_norm": 12.306085586547852,
+ "learning_rate": 3.705722070844687e-06,
+ "loss": 3.334,
+ "step": 204
+ },
+ {
+ "epoch": 0.55858310626703,
+ "grad_norm": 9.715800285339355,
+ "learning_rate": 3.7238873751135334e-06,
+ "loss": 3.4756,
+ "step": 205
+ },
+ {
+ "epoch": 0.5613079019073569,
+ "grad_norm": 12.598706245422363,
+ "learning_rate": 3.7420526793823796e-06,
+ "loss": 3.4111,
+ "step": 206
+ },
+ {
+ "epoch": 0.5640326975476839,
+ "grad_norm": 8.66494369506836,
+ "learning_rate": 3.7602179836512266e-06,
+ "loss": 3.4951,
+ "step": 207
+ },
+ {
+ "epoch": 0.5667574931880109,
+ "grad_norm": 9.56230354309082,
+ "learning_rate": 3.7783832879200728e-06,
+ "loss": 3.624,
+ "step": 208
+ },
+ {
+ "epoch": 0.5694822888283378,
+ "grad_norm": 10.649101257324219,
+ "learning_rate": 3.7965485921889193e-06,
+ "loss": 3.3105,
+ "step": 209
+ },
+ {
+ "epoch": 0.5722070844686649,
+ "grad_norm": 12.988601684570312,
+ "learning_rate": 3.814713896457766e-06,
+ "loss": 3.1914,
+ "step": 210
+ },
+ {
+ "epoch": 0.5749318801089919,
+ "grad_norm": 10.908307075500488,
+ "learning_rate": 3.832879200726612e-06,
+ "loss": 3.752,
+ "step": 211
+ },
+ {
+ "epoch": 0.5776566757493188,
+ "grad_norm": 20.07297706604004,
+ "learning_rate": 3.851044504995459e-06,
+ "loss": 3.5322,
+ "step": 212
+ },
+ {
+ "epoch": 0.5803814713896458,
+ "grad_norm": 11.026345252990723,
+ "learning_rate": 3.869209809264305e-06,
+ "loss": 3.6133,
+ "step": 213
+ },
+ {
+ "epoch": 0.5831062670299727,
+ "grad_norm": 11.130549430847168,
+ "learning_rate": 3.887375113533152e-06,
+ "loss": 3.3799,
+ "step": 214
+ },
+ {
+ "epoch": 0.5858310626702997,
+ "grad_norm": 12.440305709838867,
+ "learning_rate": 3.9055404178019984e-06,
+ "loss": 3.1426,
+ "step": 215
+ },
+ {
+ "epoch": 0.5885558583106267,
+ "grad_norm": 10.083247184753418,
+ "learning_rate": 3.9237057220708454e-06,
+ "loss": 3.4043,
+ "step": 216
+ },
+ {
+ "epoch": 0.5912806539509536,
+ "grad_norm": 10.952589988708496,
+ "learning_rate": 3.941871026339692e-06,
+ "loss": 3.7031,
+ "step": 217
+ },
+ {
+ "epoch": 0.5940054495912807,
+ "grad_norm": 12.696151733398438,
+ "learning_rate": 3.960036330608539e-06,
+ "loss": 3.3369,
+ "step": 218
+ },
+ {
+ "epoch": 0.5967302452316077,
+ "grad_norm": 11.99606990814209,
+ "learning_rate": 3.978201634877385e-06,
+ "loss": 3.4512,
+ "step": 219
+ },
+ {
+ "epoch": 0.5994550408719346,
+ "grad_norm": 10.46695613861084,
+ "learning_rate": 3.996366939146231e-06,
+ "loss": 3.3955,
+ "step": 220
+ },
+ {
+ "epoch": 0.6021798365122616,
+ "grad_norm": 10.558157920837402,
+ "learning_rate": 4.014532243415077e-06,
+ "loss": 3.4482,
+ "step": 221
+ },
+ {
+ "epoch": 0.6049046321525886,
+ "grad_norm": 8.639076232910156,
+ "learning_rate": 4.032697547683924e-06,
+ "loss": 3.1802,
+ "step": 222
+ },
+ {
+ "epoch": 0.6076294277929155,
+ "grad_norm": 9.703048706054688,
+ "learning_rate": 4.05086285195277e-06,
+ "loss": 3.374,
+ "step": 223
+ },
+ {
+ "epoch": 0.6103542234332425,
+ "grad_norm": 14.701447486877441,
+ "learning_rate": 4.069028156221617e-06,
+ "loss": 3.2822,
+ "step": 224
+ },
+ {
+ "epoch": 0.6130790190735694,
+ "grad_norm": 12.3848237991333,
+ "learning_rate": 4.0871934604904634e-06,
+ "loss": 3.2939,
+ "step": 225
+ },
+ {
+ "epoch": 0.6158038147138964,
+ "grad_norm": 9.180680274963379,
+ "learning_rate": 4.1053587647593104e-06,
+ "loss": 3.4766,
+ "step": 226
+ },
+ {
+ "epoch": 0.6185286103542235,
+ "grad_norm": 10.701723098754883,
+ "learning_rate": 4.123524069028157e-06,
+ "loss": 3.2617,
+ "step": 227
+ },
+ {
+ "epoch": 0.6212534059945504,
+ "grad_norm": 9.880071640014648,
+ "learning_rate": 4.141689373297003e-06,
+ "loss": 3.5107,
+ "step": 228
+ },
+ {
+ "epoch": 0.6239782016348774,
+ "grad_norm": 9.402396202087402,
+ "learning_rate": 4.15985467756585e-06,
+ "loss": 3.0391,
+ "step": 229
+ },
+ {
+ "epoch": 0.6267029972752044,
+ "grad_norm": 12.24167251586914,
+ "learning_rate": 4.178019981834696e-06,
+ "loss": 3.1533,
+ "step": 230
+ },
+ {
+ "epoch": 0.6294277929155313,
+ "grad_norm": 12.463957786560059,
+ "learning_rate": 4.196185286103542e-06,
+ "loss": 3.4404,
+ "step": 231
+ },
+ {
+ "epoch": 0.6321525885558583,
+ "grad_norm": 9.269294738769531,
+ "learning_rate": 4.214350590372389e-06,
+ "loss": 3.3408,
+ "step": 232
+ },
+ {
+ "epoch": 0.6348773841961853,
+ "grad_norm": 10.651533126831055,
+ "learning_rate": 4.232515894641235e-06,
+ "loss": 3.4043,
+ "step": 233
+ },
+ {
+ "epoch": 0.6376021798365122,
+ "grad_norm": 10.966300010681152,
+ "learning_rate": 4.250681198910082e-06,
+ "loss": 3.4717,
+ "step": 234
+ },
+ {
+ "epoch": 0.6403269754768393,
+ "grad_norm": 8.606398582458496,
+ "learning_rate": 4.2688465031789284e-06,
+ "loss": 3.2646,
+ "step": 235
+ },
+ {
+ "epoch": 0.6430517711171662,
+ "grad_norm": 11.82869815826416,
+ "learning_rate": 4.2870118074477754e-06,
+ "loss": 3.1846,
+ "step": 236
+ },
+ {
+ "epoch": 0.6457765667574932,
+ "grad_norm": 11.79569149017334,
+ "learning_rate": 4.305177111716622e-06,
+ "loss": 3.2842,
+ "step": 237
+ },
+ {
+ "epoch": 0.6485013623978202,
+ "grad_norm": 11.205436706542969,
+ "learning_rate": 4.323342415985468e-06,
+ "loss": 3.4346,
+ "step": 238
+ },
+ {
+ "epoch": 0.6512261580381471,
+ "grad_norm": 8.987303733825684,
+ "learning_rate": 4.341507720254315e-06,
+ "loss": 3.0576,
+ "step": 239
+ },
+ {
+ "epoch": 0.6539509536784741,
+ "grad_norm": 9.633455276489258,
+ "learning_rate": 4.359673024523161e-06,
+ "loss": 3.2197,
+ "step": 240
+ },
+ {
+ "epoch": 0.6566757493188011,
+ "grad_norm": 11.276183128356934,
+ "learning_rate": 4.377838328792008e-06,
+ "loss": 3.04,
+ "step": 241
+ },
+ {
+ "epoch": 0.659400544959128,
+ "grad_norm": 11.363617897033691,
+ "learning_rate": 4.396003633060854e-06,
+ "loss": 3.2559,
+ "step": 242
+ },
+ {
+ "epoch": 0.662125340599455,
+ "grad_norm": 11.577837944030762,
+ "learning_rate": 4.414168937329701e-06,
+ "loss": 3.2891,
+ "step": 243
+ },
+ {
+ "epoch": 0.6648501362397821,
+ "grad_norm": 8.874040603637695,
+ "learning_rate": 4.432334241598547e-06,
+ "loss": 3.1104,
+ "step": 244
+ },
+ {
+ "epoch": 0.667574931880109,
+ "grad_norm": 10.832159042358398,
+ "learning_rate": 4.4504995458673934e-06,
+ "loss": 3.0151,
+ "step": 245
+ },
+ {
+ "epoch": 0.670299727520436,
+ "grad_norm": 11.228150367736816,
+ "learning_rate": 4.4686648501362404e-06,
+ "loss": 3.2842,
+ "step": 246
+ },
+ {
+ "epoch": 0.6730245231607629,
+ "grad_norm": 9.785909652709961,
+ "learning_rate": 4.486830154405087e-06,
+ "loss": 3.4727,
+ "step": 247
+ },
+ {
+ "epoch": 0.6757493188010899,
+ "grad_norm": 9.006978034973145,
+ "learning_rate": 4.504995458673933e-06,
+ "loss": 3.3057,
+ "step": 248
+ },
+ {
+ "epoch": 0.6784741144414169,
+ "grad_norm": 9.31069278717041,
+ "learning_rate": 4.52316076294278e-06,
+ "loss": 3.1445,
+ "step": 249
+ },
+ {
+ "epoch": 0.6811989100817438,
+ "grad_norm": 14.589471817016602,
+ "learning_rate": 4.541326067211626e-06,
+ "loss": 3.0654,
+ "step": 250
+ },
+ {
+ "epoch": 0.6839237057220708,
+ "grad_norm": 9.290428161621094,
+ "learning_rate": 4.559491371480473e-06,
+ "loss": 3.127,
+ "step": 251
+ },
+ {
+ "epoch": 0.6866485013623979,
+ "grad_norm": 10.998537063598633,
+ "learning_rate": 4.577656675749319e-06,
+ "loss": 2.8945,
+ "step": 252
+ },
+ {
+ "epoch": 0.6893732970027248,
+ "grad_norm": 13.25707721710205,
+ "learning_rate": 4.595821980018166e-06,
+ "loss": 3.3193,
+ "step": 253
+ },
+ {
+ "epoch": 0.6920980926430518,
+ "grad_norm": 9.896824836730957,
+ "learning_rate": 4.613987284287012e-06,
+ "loss": 3.3301,
+ "step": 254
+ },
+ {
+ "epoch": 0.6948228882833788,
+ "grad_norm": 10.812071800231934,
+ "learning_rate": 4.6321525885558584e-06,
+ "loss": 3.2236,
+ "step": 255
+ },
+ {
+ "epoch": 0.6975476839237057,
+ "grad_norm": 10.396222114562988,
+ "learning_rate": 4.6503178928247054e-06,
+ "loss": 3.1211,
+ "step": 256
+ },
+ {
+ "epoch": 0.7002724795640327,
+ "grad_norm": 9.00611686706543,
+ "learning_rate": 4.668483197093552e-06,
+ "loss": 3.2051,
+ "step": 257
+ },
+ {
+ "epoch": 0.7029972752043597,
+ "grad_norm": 9.797375679016113,
+ "learning_rate": 4.686648501362398e-06,
+ "loss": 3.1797,
+ "step": 258
+ },
+ {
+ "epoch": 0.7057220708446866,
+ "grad_norm": 10.615898132324219,
+ "learning_rate": 4.704813805631245e-06,
+ "loss": 2.9658,
+ "step": 259
+ },
+ {
+ "epoch": 0.7084468664850136,
+ "grad_norm": 11.570025444030762,
+ "learning_rate": 4.722979109900091e-06,
+ "loss": 3.0869,
+ "step": 260
+ },
+ {
+ "epoch": 0.7111716621253406,
+ "grad_norm": 11.155060768127441,
+ "learning_rate": 4.741144414168938e-06,
+ "loss": 3.3213,
+ "step": 261
+ },
+ {
+ "epoch": 0.7138964577656676,
+ "grad_norm": 13.674558639526367,
+ "learning_rate": 4.759309718437784e-06,
+ "loss": 3.5439,
+ "step": 262
+ },
+ {
+ "epoch": 0.7166212534059946,
+ "grad_norm": 10.254398345947266,
+ "learning_rate": 4.777475022706631e-06,
+ "loss": 3.3672,
+ "step": 263
+ },
+ {
+ "epoch": 0.7193460490463215,
+ "grad_norm": 10.633976936340332,
+ "learning_rate": 4.795640326975477e-06,
+ "loss": 3.1436,
+ "step": 264
+ },
+ {
+ "epoch": 0.7220708446866485,
+ "grad_norm": 13.250679016113281,
+ "learning_rate": 4.8138056312443234e-06,
+ "loss": 3.0303,
+ "step": 265
+ },
+ {
+ "epoch": 0.7247956403269755,
+ "grad_norm": 10.197409629821777,
+ "learning_rate": 4.83197093551317e-06,
+ "loss": 3.0986,
+ "step": 266
+ },
+ {
+ "epoch": 0.7275204359673024,
+ "grad_norm": 12.010652542114258,
+ "learning_rate": 4.850136239782017e-06,
+ "loss": 3.0781,
+ "step": 267
+ },
+ {
+ "epoch": 0.7302452316076294,
+ "grad_norm": 10.654179573059082,
+ "learning_rate": 4.868301544050864e-06,
+ "loss": 3.2129,
+ "step": 268
+ },
+ {
+ "epoch": 0.7329700272479565,
+ "grad_norm": 10.578466415405273,
+ "learning_rate": 4.88646684831971e-06,
+ "loss": 3.3418,
+ "step": 269
+ },
+ {
+ "epoch": 0.7356948228882834,
+ "grad_norm": 11.487197875976562,
+ "learning_rate": 4.904632152588557e-06,
+ "loss": 3.1787,
+ "step": 270
+ },
+ {
+ "epoch": 0.7384196185286104,
+ "grad_norm": 8.67462158203125,
+ "learning_rate": 4.922797456857403e-06,
+ "loss": 3.0166,
+ "step": 271
+ },
+ {
+ "epoch": 0.7411444141689373,
+ "grad_norm": 10.115763664245605,
+ "learning_rate": 4.940962761126249e-06,
+ "loss": 2.9932,
+ "step": 272
+ },
+ {
+ "epoch": 0.7438692098092643,
+ "grad_norm": 10.159469604492188,
+ "learning_rate": 4.959128065395096e-06,
+ "loss": 3.0356,
+ "step": 273
+ },
+ {
+ "epoch": 0.7465940054495913,
+ "grad_norm": 10.377588272094727,
+ "learning_rate": 4.977293369663942e-06,
+ "loss": 3.043,
+ "step": 274
+ },
+ {
+ "epoch": 0.7493188010899182,
+ "grad_norm": 11.266051292419434,
+ "learning_rate": 4.9954586739327884e-06,
+ "loss": 3.1914,
+ "step": 275
+ },
+ {
+ "epoch": 0.7520435967302452,
+ "grad_norm": 12.121461868286133,
+ "learning_rate": 5.013623978201635e-06,
+ "loss": 2.8984,
+ "step": 276
+ },
+ {
+ "epoch": 0.7547683923705722,
+ "grad_norm": 10.40197467803955,
+ "learning_rate": 5.031789282470482e-06,
+ "loss": 2.6602,
+ "step": 277
+ },
+ {
+ "epoch": 0.7574931880108992,
+ "grad_norm": 10.558917999267578,
+ "learning_rate": 5.049954586739329e-06,
+ "loss": 3.043,
+ "step": 278
+ },
+ {
+ "epoch": 0.7602179836512262,
+ "grad_norm": 9.786828994750977,
+ "learning_rate": 5.068119891008176e-06,
+ "loss": 3.1069,
+ "step": 279
+ },
+ {
+ "epoch": 0.7629427792915532,
+ "grad_norm": 11.263306617736816,
+ "learning_rate": 5.086285195277021e-06,
+ "loss": 3.0688,
+ "step": 280
+ },
+ {
+ "epoch": 0.7656675749318801,
+ "grad_norm": 8.676852226257324,
+ "learning_rate": 5.104450499545868e-06,
+ "loss": 2.9199,
+ "step": 281
+ },
+ {
+ "epoch": 0.7683923705722071,
+ "grad_norm": 10.780664443969727,
+ "learning_rate": 5.122615803814714e-06,
+ "loss": 3.0317,
+ "step": 282
+ },
+ {
+ "epoch": 0.771117166212534,
+ "grad_norm": 12.283220291137695,
+ "learning_rate": 5.140781108083561e-06,
+ "loss": 3.1592,
+ "step": 283
+ },
+ {
+ "epoch": 0.773841961852861,
+ "grad_norm": 9.572271347045898,
+ "learning_rate": 5.158946412352407e-06,
+ "loss": 3.1748,
+ "step": 284
+ },
+ {
+ "epoch": 0.776566757493188,
+ "grad_norm": 13.599047660827637,
+ "learning_rate": 5.1771117166212534e-06,
+ "loss": 2.9395,
+ "step": 285
+ },
+ {
+ "epoch": 0.779291553133515,
+ "grad_norm": 12.397294998168945,
+ "learning_rate": 5.1952770208901005e-06,
+ "loss": 3.0732,
+ "step": 286
+ },
+ {
+ "epoch": 0.782016348773842,
+ "grad_norm": 10.11894416809082,
+ "learning_rate": 5.2134423251589475e-06,
+ "loss": 3.2109,
+ "step": 287
+ },
+ {
+ "epoch": 0.784741144414169,
+ "grad_norm": 9.713980674743652,
+ "learning_rate": 5.231607629427793e-06,
+ "loss": 3.002,
+ "step": 288
+ },
+ {
+ "epoch": 0.7874659400544959,
+ "grad_norm": 12.788566589355469,
+ "learning_rate": 5.24977293369664e-06,
+ "loss": 3.125,
+ "step": 289
+ },
+ {
+ "epoch": 0.7901907356948229,
+ "grad_norm": 10.20035171508789,
+ "learning_rate": 5.267938237965487e-06,
+ "loss": 3.1172,
+ "step": 290
+ },
+ {
+ "epoch": 0.7929155313351499,
+ "grad_norm": 9.050313949584961,
+ "learning_rate": 5.286103542234333e-06,
+ "loss": 3.1074,
+ "step": 291
+ },
+ {
+ "epoch": 0.7956403269754768,
+ "grad_norm": 12.593305587768555,
+ "learning_rate": 5.304268846503179e-06,
+ "loss": 3.2715,
+ "step": 292
+ },
+ {
+ "epoch": 0.7983651226158038,
+ "grad_norm": 9.735793113708496,
+ "learning_rate": 5.322434150772025e-06,
+ "loss": 3.1445,
+ "step": 293
+ },
+ {
+ "epoch": 0.8010899182561307,
+ "grad_norm": 13.674619674682617,
+ "learning_rate": 5.340599455040872e-06,
+ "loss": 3.1611,
+ "step": 294
+ },
+ {
+ "epoch": 0.8038147138964578,
+ "grad_norm": 11.066041946411133,
+ "learning_rate": 5.358764759309719e-06,
+ "loss": 2.8115,
+ "step": 295
+ },
+ {
+ "epoch": 0.8065395095367848,
+ "grad_norm": 10.592111587524414,
+ "learning_rate": 5.376930063578565e-06,
+ "loss": 2.9028,
+ "step": 296
+ },
+ {
+ "epoch": 0.8092643051771117,
+ "grad_norm": 10.814714431762695,
+ "learning_rate": 5.395095367847412e-06,
+ "loss": 2.8428,
+ "step": 297
+ },
+ {
+ "epoch": 0.8119891008174387,
+ "grad_norm": 9.773011207580566,
+ "learning_rate": 5.413260672116259e-06,
+ "loss": 2.8975,
+ "step": 298
+ },
+ {
+ "epoch": 0.8147138964577657,
+ "grad_norm": 9.989364624023438,
+ "learning_rate": 5.431425976385105e-06,
+ "loss": 2.8833,
+ "step": 299
+ },
+ {
+ "epoch": 0.8174386920980926,
+ "grad_norm": 10.806577682495117,
+ "learning_rate": 5.449591280653952e-06,
+ "loss": 3.3301,
+ "step": 300
+ },
+ {
+ "epoch": 0.8201634877384196,
+ "grad_norm": 11.721353530883789,
+ "learning_rate": 5.467756584922798e-06,
+ "loss": 3.0889,
+ "step": 301
+ },
+ {
+ "epoch": 0.8228882833787466,
+ "grad_norm": 11.272564888000488,
+ "learning_rate": 5.485921889191644e-06,
+ "loss": 3.25,
+ "step": 302
+ },
+ {
+ "epoch": 0.8256130790190735,
+ "grad_norm": 9.646610260009766,
+ "learning_rate": 5.504087193460491e-06,
+ "loss": 3.0498,
+ "step": 303
+ },
+ {
+ "epoch": 0.8283378746594006,
+ "grad_norm": 10.122640609741211,
+ "learning_rate": 5.522252497729338e-06,
+ "loss": 2.8525,
+ "step": 304
+ },
+ {
+ "epoch": 0.8310626702997275,
+ "grad_norm": 11.975621223449707,
+ "learning_rate": 5.5404178019981835e-06,
+ "loss": 2.98,
+ "step": 305
+ },
+ {
+ "epoch": 0.8337874659400545,
+ "grad_norm": 9.96011734008789,
+ "learning_rate": 5.5585831062670305e-06,
+ "loss": 3.1787,
+ "step": 306
+ },
+ {
+ "epoch": 0.8365122615803815,
+ "grad_norm": 11.059173583984375,
+ "learning_rate": 5.5767484105358775e-06,
+ "loss": 3.2861,
+ "step": 307
+ },
+ {
+ "epoch": 0.8392370572207084,
+ "grad_norm": 10.573100090026855,
+ "learning_rate": 5.594913714804724e-06,
+ "loss": 2.9976,
+ "step": 308
+ },
+ {
+ "epoch": 0.8419618528610354,
+ "grad_norm": 11.470596313476562,
+ "learning_rate": 5.61307901907357e-06,
+ "loss": 2.9238,
+ "step": 309
+ },
+ {
+ "epoch": 0.8446866485013624,
+ "grad_norm": 11.162026405334473,
+ "learning_rate": 5.631244323342416e-06,
+ "loss": 3.2871,
+ "step": 310
+ },
+ {
+ "epoch": 0.8474114441416893,
+ "grad_norm": 10.692909240722656,
+ "learning_rate": 5.649409627611263e-06,
+ "loss": 3.252,
+ "step": 311
+ },
+ {
+ "epoch": 0.8501362397820164,
+ "grad_norm": 11.107943534851074,
+ "learning_rate": 5.66757493188011e-06,
+ "loss": 3.2139,
+ "step": 312
+ },
+ {
+ "epoch": 0.8528610354223434,
+ "grad_norm": 9.772025108337402,
+ "learning_rate": 5.685740236148955e-06,
+ "loss": 2.8848,
+ "step": 313
+ },
+ {
+ "epoch": 0.8555858310626703,
+ "grad_norm": 10.775506019592285,
+ "learning_rate": 5.703905540417802e-06,
+ "loss": 3.0908,
+ "step": 314
+ },
+ {
+ "epoch": 0.8583106267029973,
+ "grad_norm": 14.792106628417969,
+ "learning_rate": 5.722070844686649e-06,
+ "loss": 2.8691,
+ "step": 315
+ },
+ {
+ "epoch": 0.8610354223433242,
+ "grad_norm": 10.167881965637207,
+ "learning_rate": 5.7402361489554955e-06,
+ "loss": 3.0137,
+ "step": 316
+ },
+ {
+ "epoch": 0.8637602179836512,
+ "grad_norm": 11.682990074157715,
+ "learning_rate": 5.758401453224342e-06,
+ "loss": 3.2441,
+ "step": 317
+ },
+ {
+ "epoch": 0.8664850136239782,
+ "grad_norm": 10.642148971557617,
+ "learning_rate": 5.776566757493189e-06,
+ "loss": 2.9629,
+ "step": 318
+ },
+ {
+ "epoch": 0.8692098092643051,
+ "grad_norm": 13.177349090576172,
+ "learning_rate": 5.794732061762035e-06,
+ "loss": 3.1973,
+ "step": 319
+ },
+ {
+ "epoch": 0.8719346049046321,
+ "grad_norm": 10.01991081237793,
+ "learning_rate": 5.812897366030882e-06,
+ "loss": 2.9751,
+ "step": 320
+ },
+ {
+ "epoch": 0.8746594005449592,
+ "grad_norm": 11.585193634033203,
+ "learning_rate": 5.831062670299727e-06,
+ "loss": 3.249,
+ "step": 321
+ },
+ {
+ "epoch": 0.8773841961852861,
+ "grad_norm": 9.34164047241211,
+ "learning_rate": 5.849227974568574e-06,
+ "loss": 2.9863,
+ "step": 322
+ },
+ {
+ "epoch": 0.8801089918256131,
+ "grad_norm": 10.178692817687988,
+ "learning_rate": 5.867393278837421e-06,
+ "loss": 2.9072,
+ "step": 323
+ },
+ {
+ "epoch": 0.8828337874659401,
+ "grad_norm": 10.652539253234863,
+ "learning_rate": 5.885558583106268e-06,
+ "loss": 2.9502,
+ "step": 324
+ },
+ {
+ "epoch": 0.885558583106267,
+ "grad_norm": 9.648669242858887,
+ "learning_rate": 5.9037238873751135e-06,
+ "loss": 3.0527,
+ "step": 325
+ },
+ {
+ "epoch": 0.888283378746594,
+ "grad_norm": 8.94349193572998,
+ "learning_rate": 5.9218891916439605e-06,
+ "loss": 3.1143,
+ "step": 326
+ },
+ {
+ "epoch": 0.8910081743869209,
+ "grad_norm": 9.749101638793945,
+ "learning_rate": 5.940054495912807e-06,
+ "loss": 2.957,
+ "step": 327
+ },
+ {
+ "epoch": 0.8937329700272479,
+ "grad_norm": 10.487102508544922,
+ "learning_rate": 5.958219800181654e-06,
+ "loss": 2.7764,
+ "step": 328
+ },
+ {
+ "epoch": 0.896457765667575,
+ "grad_norm": 11.558155059814453,
+ "learning_rate": 5.976385104450501e-06,
+ "loss": 3.0679,
+ "step": 329
+ },
+ {
+ "epoch": 0.8991825613079019,
+ "grad_norm": 8.687368392944336,
+ "learning_rate": 5.994550408719346e-06,
+ "loss": 2.8779,
+ "step": 330
+ },
+ {
+ "epoch": 0.9019073569482289,
+ "grad_norm": 11.50344181060791,
+ "learning_rate": 6.012715712988193e-06,
+ "loss": 2.8945,
+ "step": 331
+ },
+ {
+ "epoch": 0.9046321525885559,
+ "grad_norm": 8.328307151794434,
+ "learning_rate": 6.03088101725704e-06,
+ "loss": 2.8618,
+ "step": 332
+ },
+ {
+ "epoch": 0.9073569482288828,
+ "grad_norm": 10.823127746582031,
+ "learning_rate": 6.049046321525886e-06,
+ "loss": 3.085,
+ "step": 333
+ },
+ {
+ "epoch": 0.9100817438692098,
+ "grad_norm": 9.42167854309082,
+ "learning_rate": 6.067211625794732e-06,
+ "loss": 2.7568,
+ "step": 334
+ },
+ {
+ "epoch": 0.9128065395095368,
+ "grad_norm": 9.684298515319824,
+ "learning_rate": 6.085376930063579e-06,
+ "loss": 2.9136,
+ "step": 335
+ },
+ {
+ "epoch": 0.9155313351498637,
+ "grad_norm": 10.575213432312012,
+ "learning_rate": 6.1035422343324255e-06,
+ "loss": 3.1797,
+ "step": 336
+ },
+ {
+ "epoch": 0.9182561307901907,
+ "grad_norm": 9.206254959106445,
+ "learning_rate": 6.1217075386012725e-06,
+ "loss": 3.084,
+ "step": 337
+ },
+ {
+ "epoch": 0.9209809264305178,
+ "grad_norm": 10.56982135772705,
+ "learning_rate": 6.139872842870118e-06,
+ "loss": 2.7876,
+ "step": 338
+ },
+ {
+ "epoch": 0.9237057220708447,
+ "grad_norm": 9.894237518310547,
+ "learning_rate": 6.158038147138965e-06,
+ "loss": 2.9077,
+ "step": 339
+ },
+ {
+ "epoch": 0.9264305177111717,
+ "grad_norm": 8.02868366241455,
+ "learning_rate": 6.176203451407812e-06,
+ "loss": 2.8062,
+ "step": 340
+ },
+ {
+ "epoch": 0.9291553133514986,
+ "grad_norm": 8.86514663696289,
+ "learning_rate": 6.194368755676659e-06,
+ "loss": 2.9062,
+ "step": 341
+ },
+ {
+ "epoch": 0.9318801089918256,
+ "grad_norm": 15.095792770385742,
+ "learning_rate": 6.212534059945504e-06,
+ "loss": 2.9209,
+ "step": 342
+ },
+ {
+ "epoch": 0.9346049046321526,
+ "grad_norm": 10.972758293151855,
+ "learning_rate": 6.230699364214351e-06,
+ "loss": 2.9863,
+ "step": 343
+ },
+ {
+ "epoch": 0.9373297002724795,
+ "grad_norm": 9.462160110473633,
+ "learning_rate": 6.248864668483197e-06,
+ "loss": 2.9688,
+ "step": 344
+ },
+ {
+ "epoch": 0.9400544959128065,
+ "grad_norm": 8.696920394897461,
+ "learning_rate": 6.267029972752044e-06,
+ "loss": 2.96,
+ "step": 345
+ },
+ {
+ "epoch": 0.9427792915531336,
+ "grad_norm": 12.647309303283691,
+ "learning_rate": 6.2851952770208905e-06,
+ "loss": 3.0645,
+ "step": 346
+ },
+ {
+ "epoch": 0.9455040871934605,
+ "grad_norm": 10.608399391174316,
+ "learning_rate": 6.303360581289737e-06,
+ "loss": 2.8242,
+ "step": 347
+ },
+ {
+ "epoch": 0.9482288828337875,
+ "grad_norm": 11.65522289276123,
+ "learning_rate": 6.321525885558584e-06,
+ "loss": 3.1382,
+ "step": 348
+ },
+ {
+ "epoch": 0.9509536784741145,
+ "grad_norm": 8.824722290039062,
+ "learning_rate": 6.339691189827431e-06,
+ "loss": 2.917,
+ "step": 349
+ },
+ {
+ "epoch": 0.9536784741144414,
+ "grad_norm": 11.027289390563965,
+ "learning_rate": 6.357856494096276e-06,
+ "loss": 3.0371,
+ "step": 350
+ },
+ {
+ "epoch": 0.9564032697547684,
+ "grad_norm": 12.124699592590332,
+ "learning_rate": 6.376021798365123e-06,
+ "loss": 3.1348,
+ "step": 351
+ },
+ {
+ "epoch": 0.9591280653950953,
+ "grad_norm": 11.385178565979004,
+ "learning_rate": 6.39418710263397e-06,
+ "loss": 2.9229,
+ "step": 352
+ },
+ {
+ "epoch": 0.9618528610354223,
+ "grad_norm": 11.994840621948242,
+ "learning_rate": 6.412352406902816e-06,
+ "loss": 3.1709,
+ "step": 353
+ },
+ {
+ "epoch": 0.9645776566757494,
+ "grad_norm": 8.85571002960205,
+ "learning_rate": 6.430517711171662e-06,
+ "loss": 2.7881,
+ "step": 354
+ },
+ {
+ "epoch": 0.9673024523160763,
+ "grad_norm": 11.468720436096191,
+ "learning_rate": 6.448683015440509e-06,
+ "loss": 2.7666,
+ "step": 355
+ },
+ {
+ "epoch": 0.9700272479564033,
+ "grad_norm": 9.187004089355469,
+ "learning_rate": 6.4668483197093555e-06,
+ "loss": 3.0547,
+ "step": 356
+ },
+ {
+ "epoch": 0.9727520435967303,
+ "grad_norm": 11.031088829040527,
+ "learning_rate": 6.4850136239782025e-06,
+ "loss": 3.1611,
+ "step": 357
+ },
+ {
+ "epoch": 0.9754768392370572,
+ "grad_norm": 10.66789436340332,
+ "learning_rate": 6.5031789282470495e-06,
+ "loss": 2.8545,
+ "step": 358
+ },
+ {
+ "epoch": 0.9782016348773842,
+ "grad_norm": 12.648036003112793,
+ "learning_rate": 6.521344232515895e-06,
+ "loss": 2.9009,
+ "step": 359
+ },
+ {
+ "epoch": 0.9809264305177112,
+ "grad_norm": 9.666924476623535,
+ "learning_rate": 6.539509536784742e-06,
+ "loss": 2.9673,
+ "step": 360
+ },
+ {
+ "epoch": 0.9836512261580381,
+ "grad_norm": 11.903847694396973,
+ "learning_rate": 6.557674841053589e-06,
+ "loss": 2.6465,
+ "step": 361
+ },
+ {
+ "epoch": 0.9863760217983651,
+ "grad_norm": 14.617626190185547,
+ "learning_rate": 6.575840145322435e-06,
+ "loss": 3.0,
+ "step": 362
+ },
+ {
+ "epoch": 0.989100817438692,
+ "grad_norm": 17.167770385742188,
+ "learning_rate": 6.594005449591281e-06,
+ "loss": 3.041,
+ "step": 363
+ },
+ {
+ "epoch": 0.9918256130790191,
+ "grad_norm": 12.77061653137207,
+ "learning_rate": 6.612170753860127e-06,
+ "loss": 2.9688,
+ "step": 364
+ },
+ {
+ "epoch": 0.9945504087193461,
+ "grad_norm": 10.30443286895752,
+ "learning_rate": 6.630336058128974e-06,
+ "loss": 2.7344,
+ "step": 365
+ },
+ {
+ "epoch": 0.997275204359673,
+ "grad_norm": 14.379679679870605,
+ "learning_rate": 6.648501362397821e-06,
+ "loss": 2.8291,
+ "step": 366
+ },
+ {
+ "epoch": 1.0,
+ "grad_norm": 10.28809928894043,
+ "learning_rate": 6.666666666666667e-06,
+ "loss": 2.9424,
+ "step": 367
+ },
+ {
+ "epoch": 1.002724795640327,
+ "grad_norm": 10.779088973999023,
+ "learning_rate": 6.684831970935514e-06,
+ "loss": 2.9834,
+ "step": 368
+ },
+ {
+ "epoch": 1.005449591280654,
+ "grad_norm": 11.226832389831543,
+ "learning_rate": 6.702997275204361e-06,
+ "loss": 2.9473,
+ "step": 369
+ },
+ {
+ "epoch": 1.008174386920981,
+ "grad_norm": 9.997020721435547,
+ "learning_rate": 6.721162579473207e-06,
+ "loss": 2.7344,
+ "step": 370
+ },
+ {
+ "epoch": 1.0108991825613078,
+ "grad_norm": 11.764245986938477,
+ "learning_rate": 6.739327883742053e-06,
+ "loss": 2.8877,
+ "step": 371
+ },
+ {
+ "epoch": 1.013623978201635,
+ "grad_norm": 11.373870849609375,
+ "learning_rate": 6.7574931880109e-06,
+ "loss": 3.1035,
+ "step": 372
+ },
+ {
+ "epoch": 1.0163487738419619,
+ "grad_norm": 12.055533409118652,
+ "learning_rate": 6.775658492279746e-06,
+ "loss": 2.8447,
+ "step": 373
+ },
+ {
+ "epoch": 1.0190735694822888,
+ "grad_norm": 31.768789291381836,
+ "learning_rate": 6.793823796548593e-06,
+ "loss": 2.8325,
+ "step": 374
+ },
+ {
+ "epoch": 1.021798365122616,
+ "grad_norm": 10.671889305114746,
+ "learning_rate": 6.8119891008174385e-06,
+ "loss": 2.96,
+ "step": 375
+ },
+ {
+ "epoch": 1.0245231607629428,
+ "grad_norm": 11.033255577087402,
+ "learning_rate": 6.8301544050862855e-06,
+ "loss": 2.8223,
+ "step": 376
+ },
+ {
+ "epoch": 1.0272479564032697,
+ "grad_norm": 11.364258766174316,
+ "learning_rate": 6.8483197093551325e-06,
+ "loss": 2.9634,
+ "step": 377
+ },
+ {
+ "epoch": 1.0299727520435966,
+ "grad_norm": 8.979849815368652,
+ "learning_rate": 6.8664850136239795e-06,
+ "loss": 2.9229,
+ "step": 378
+ },
+ {
+ "epoch": 1.0326975476839237,
+ "grad_norm": 10.40015697479248,
+ "learning_rate": 6.884650317892825e-06,
+ "loss": 2.8232,
+ "step": 379
+ },
+ {
+ "epoch": 1.0354223433242506,
+ "grad_norm": 8.893531799316406,
+ "learning_rate": 6.902815622161672e-06,
+ "loss": 2.8813,
+ "step": 380
+ },
+ {
+ "epoch": 1.0381471389645776,
+ "grad_norm": 11.417078018188477,
+ "learning_rate": 6.920980926430518e-06,
+ "loss": 2.7207,
+ "step": 381
+ },
+ {
+ "epoch": 1.0408719346049047,
+ "grad_norm": 10.525177955627441,
+ "learning_rate": 6.939146230699365e-06,
+ "loss": 2.9854,
+ "step": 382
+ },
+ {
+ "epoch": 1.0435967302452316,
+ "grad_norm": 9.927412033081055,
+ "learning_rate": 6.957311534968211e-06,
+ "loss": 2.8262,
+ "step": 383
+ },
+ {
+ "epoch": 1.0463215258855585,
+ "grad_norm": 12.706193923950195,
+ "learning_rate": 6.975476839237057e-06,
+ "loss": 3.0049,
+ "step": 384
+ },
+ {
+ "epoch": 1.0490463215258856,
+ "grad_norm": 10.498812675476074,
+ "learning_rate": 6.993642143505904e-06,
+ "loss": 2.7578,
+ "step": 385
+ },
+ {
+ "epoch": 1.0517711171662125,
+ "grad_norm": 10.719517707824707,
+ "learning_rate": 7.011807447774751e-06,
+ "loss": 2.8618,
+ "step": 386
+ },
+ {
+ "epoch": 1.0544959128065394,
+ "grad_norm": 12.072530746459961,
+ "learning_rate": 7.0299727520435975e-06,
+ "loss": 2.7798,
+ "step": 387
+ },
+ {
+ "epoch": 1.0572207084468666,
+ "grad_norm": 9.507881164550781,
+ "learning_rate": 7.048138056312444e-06,
+ "loss": 2.6548,
+ "step": 388
+ },
+ {
+ "epoch": 1.0599455040871935,
+ "grad_norm": 12.026369094848633,
+ "learning_rate": 7.066303360581291e-06,
+ "loss": 2.7642,
+ "step": 389
+ },
+ {
+ "epoch": 1.0626702997275204,
+ "grad_norm": 11.388680458068848,
+ "learning_rate": 7.084468664850137e-06,
+ "loss": 2.749,
+ "step": 390
+ },
+ {
+ "epoch": 1.0653950953678475,
+ "grad_norm": 12.096214294433594,
+ "learning_rate": 7.102633969118984e-06,
+ "loss": 2.6499,
+ "step": 391
+ },
+ {
+ "epoch": 1.0681198910081744,
+ "grad_norm": 12.473118782043457,
+ "learning_rate": 7.120799273387829e-06,
+ "loss": 2.9619,
+ "step": 392
+ },
+ {
+ "epoch": 1.0708446866485013,
+ "grad_norm": 10.778851509094238,
+ "learning_rate": 7.138964577656676e-06,
+ "loss": 2.7432,
+ "step": 393
+ },
+ {
+ "epoch": 1.0735694822888284,
+ "grad_norm": 12.79310417175293,
+ "learning_rate": 7.157129881925523e-06,
+ "loss": 2.8647,
+ "step": 394
+ },
+ {
+ "epoch": 1.0762942779291553,
+ "grad_norm": 12.59657096862793,
+ "learning_rate": 7.17529518619437e-06,
+ "loss": 2.689,
+ "step": 395
+ },
+ {
+ "epoch": 1.0790190735694822,
+ "grad_norm": 11.395380973815918,
+ "learning_rate": 7.1934604904632155e-06,
+ "loss": 2.9043,
+ "step": 396
+ },
+ {
+ "epoch": 1.0817438692098094,
+ "grad_norm": 12.513686180114746,
+ "learning_rate": 7.2116257947320625e-06,
+ "loss": 2.8154,
+ "step": 397
+ },
+ {
+ "epoch": 1.0844686648501363,
+ "grad_norm": 10.173294067382812,
+ "learning_rate": 7.229791099000909e-06,
+ "loss": 2.6123,
+ "step": 398
+ },
+ {
+ "epoch": 1.0871934604904632,
+ "grad_norm": 9.681666374206543,
+ "learning_rate": 7.247956403269756e-06,
+ "loss": 2.4634,
+ "step": 399
+ },
+ {
+ "epoch": 1.0899182561307903,
+ "grad_norm": 11.721431732177734,
+ "learning_rate": 7.266121707538602e-06,
+ "loss": 2.8311,
+ "step": 400
+ },
+ {
+ "epoch": 1.0926430517711172,
+ "grad_norm": 9.718865394592285,
+ "learning_rate": 7.284287011807448e-06,
+ "loss": 2.7515,
+ "step": 401
+ },
+ {
+ "epoch": 1.095367847411444,
+ "grad_norm": 13.524134635925293,
+ "learning_rate": 7.302452316076295e-06,
+ "loss": 2.6484,
+ "step": 402
+ },
+ {
+ "epoch": 1.0980926430517712,
+ "grad_norm": 8.978958129882812,
+ "learning_rate": 7.320617620345142e-06,
+ "loss": 2.8022,
+ "step": 403
+ },
+ {
+ "epoch": 1.1008174386920981,
+ "grad_norm": 10.181389808654785,
+ "learning_rate": 7.338782924613987e-06,
+ "loss": 2.8721,
+ "step": 404
+ },
+ {
+ "epoch": 1.103542234332425,
+ "grad_norm": 9.95703125,
+ "learning_rate": 7.356948228882834e-06,
+ "loss": 2.9873,
+ "step": 405
+ },
+ {
+ "epoch": 1.106267029972752,
+ "grad_norm": 9.80728530883789,
+ "learning_rate": 7.375113533151681e-06,
+ "loss": 2.5879,
+ "step": 406
+ },
+ {
+ "epoch": 1.108991825613079,
+ "grad_norm": 11.94822883605957,
+ "learning_rate": 7.3932788374205275e-06,
+ "loss": 2.6226,
+ "step": 407
+ },
+ {
+ "epoch": 1.111716621253406,
+ "grad_norm": 10.268418312072754,
+ "learning_rate": 7.411444141689374e-06,
+ "loss": 2.6157,
+ "step": 408
+ },
+ {
+ "epoch": 1.1144414168937329,
+ "grad_norm": 13.16259765625,
+ "learning_rate": 7.42960944595822e-06,
+ "loss": 2.6309,
+ "step": 409
+ },
+ {
+ "epoch": 1.11716621253406,
+ "grad_norm": 9.806975364685059,
+ "learning_rate": 7.447774750227067e-06,
+ "loss": 2.5195,
+ "step": 410
+ },
+ {
+ "epoch": 1.119891008174387,
+ "grad_norm": 11.498656272888184,
+ "learning_rate": 7.465940054495914e-06,
+ "loss": 2.9082,
+ "step": 411
+ },
+ {
+ "epoch": 1.1226158038147138,
+ "grad_norm": 10.164894104003906,
+ "learning_rate": 7.484105358764759e-06,
+ "loss": 2.7812,
+ "step": 412
+ },
+ {
+ "epoch": 1.125340599455041,
+ "grad_norm": 16.40764808654785,
+ "learning_rate": 7.502270663033606e-06,
+ "loss": 2.5967,
+ "step": 413
+ },
+ {
+ "epoch": 1.1280653950953679,
+ "grad_norm": 13.020524024963379,
+ "learning_rate": 7.520435967302453e-06,
+ "loss": 2.793,
+ "step": 414
+ },
+ {
+ "epoch": 1.1307901907356948,
+ "grad_norm": 9.52269458770752,
+ "learning_rate": 7.538601271571299e-06,
+ "loss": 2.4224,
+ "step": 415
+ },
+ {
+ "epoch": 1.1335149863760219,
+ "grad_norm": 13.420445442199707,
+ "learning_rate": 7.5567665758401455e-06,
+ "loss": 2.6089,
+ "step": 416
+ },
+ {
+ "epoch": 1.1362397820163488,
+ "grad_norm": 10.215398788452148,
+ "learning_rate": 7.5749318801089925e-06,
+ "loss": 2.9336,
+ "step": 417
+ },
+ {
+ "epoch": 1.1389645776566757,
+ "grad_norm": 11.343588829040527,
+ "learning_rate": 7.593097184377839e-06,
+ "loss": 2.8281,
+ "step": 418
+ },
+ {
+ "epoch": 1.1416893732970028,
+ "grad_norm": 11.341489791870117,
+ "learning_rate": 7.611262488646686e-06,
+ "loss": 2.8442,
+ "step": 419
+ },
+ {
+ "epoch": 1.1444141689373297,
+ "grad_norm": 13.097975730895996,
+ "learning_rate": 7.629427792915532e-06,
+ "loss": 2.897,
+ "step": 420
+ },
+ {
+ "epoch": 1.1471389645776566,
+ "grad_norm": 15.45946216583252,
+ "learning_rate": 7.647593097184378e-06,
+ "loss": 2.4253,
+ "step": 421
+ },
+ {
+ "epoch": 1.1498637602179835,
+ "grad_norm": 9.48956298828125,
+ "learning_rate": 7.665758401453224e-06,
+ "loss": 2.501,
+ "step": 422
+ },
+ {
+ "epoch": 1.1525885558583107,
+ "grad_norm": 14.140972137451172,
+ "learning_rate": 7.683923705722072e-06,
+ "loss": 2.6108,
+ "step": 423
+ },
+ {
+ "epoch": 1.1553133514986376,
+ "grad_norm": 12.59040641784668,
+ "learning_rate": 7.702089009990918e-06,
+ "loss": 2.7061,
+ "step": 424
+ },
+ {
+ "epoch": 1.1580381471389645,
+ "grad_norm": 11.303720474243164,
+ "learning_rate": 7.720254314259764e-06,
+ "loss": 2.6416,
+ "step": 425
+ },
+ {
+ "epoch": 1.1607629427792916,
+ "grad_norm": 9.568498611450195,
+ "learning_rate": 7.73841961852861e-06,
+ "loss": 2.6787,
+ "step": 426
+ },
+ {
+ "epoch": 1.1634877384196185,
+ "grad_norm": 9.496077537536621,
+ "learning_rate": 7.756584922797458e-06,
+ "loss": 2.918,
+ "step": 427
+ },
+ {
+ "epoch": 1.1662125340599454,
+ "grad_norm": 11.773557662963867,
+ "learning_rate": 7.774750227066305e-06,
+ "loss": 2.9116,
+ "step": 428
+ },
+ {
+ "epoch": 1.1689373297002725,
+ "grad_norm": 10.357346534729004,
+ "learning_rate": 7.79291553133515e-06,
+ "loss": 2.627,
+ "step": 429
+ },
+ {
+ "epoch": 1.1716621253405994,
+ "grad_norm": 12.790385246276855,
+ "learning_rate": 7.811080835603997e-06,
+ "loss": 2.6235,
+ "step": 430
+ },
+ {
+ "epoch": 1.1743869209809263,
+ "grad_norm": 13.647273063659668,
+ "learning_rate": 7.829246139872843e-06,
+ "loss": 3.248,
+ "step": 431
+ },
+ {
+ "epoch": 1.1771117166212535,
+ "grad_norm": 12.220288276672363,
+ "learning_rate": 7.847411444141691e-06,
+ "loss": 2.769,
+ "step": 432
+ },
+ {
+ "epoch": 1.1798365122615804,
+ "grad_norm": 11.686890602111816,
+ "learning_rate": 7.865576748410535e-06,
+ "loss": 2.3706,
+ "step": 433
+ },
+ {
+ "epoch": 1.1825613079019073,
+ "grad_norm": 12.022626876831055,
+ "learning_rate": 7.883742052679383e-06,
+ "loss": 2.5293,
+ "step": 434
+ },
+ {
+ "epoch": 1.1852861035422344,
+ "grad_norm": 9.241992950439453,
+ "learning_rate": 7.90190735694823e-06,
+ "loss": 2.5386,
+ "step": 435
+ },
+ {
+ "epoch": 1.1880108991825613,
+ "grad_norm": 9.880123138427734,
+ "learning_rate": 7.920072661217077e-06,
+ "loss": 2.687,
+ "step": 436
+ },
+ {
+ "epoch": 1.1907356948228882,
+ "grad_norm": 11.03382396697998,
+ "learning_rate": 7.938237965485922e-06,
+ "loss": 2.7334,
+ "step": 437
+ },
+ {
+ "epoch": 1.1934604904632153,
+ "grad_norm": 11.051270484924316,
+ "learning_rate": 7.95640326975477e-06,
+ "loss": 2.7217,
+ "step": 438
+ },
+ {
+ "epoch": 1.1961852861035422,
+ "grad_norm": 13.074309349060059,
+ "learning_rate": 7.974568574023616e-06,
+ "loss": 2.7139,
+ "step": 439
+ },
+ {
+ "epoch": 1.1989100817438691,
+ "grad_norm": 11.242266654968262,
+ "learning_rate": 7.992733878292462e-06,
+ "loss": 2.6152,
+ "step": 440
+ },
+ {
+ "epoch": 1.2016348773841963,
+ "grad_norm": 11.25084400177002,
+ "learning_rate": 8.010899182561308e-06,
+ "loss": 2.6558,
+ "step": 441
+ },
+ {
+ "epoch": 1.2043596730245232,
+ "grad_norm": 10.377076148986816,
+ "learning_rate": 8.029064486830154e-06,
+ "loss": 2.6245,
+ "step": 442
+ },
+ {
+ "epoch": 1.20708446866485,
+ "grad_norm": 10.222033500671387,
+ "learning_rate": 8.047229791099002e-06,
+ "loss": 3.0137,
+ "step": 443
+ },
+ {
+ "epoch": 1.2098092643051772,
+ "grad_norm": 9.710803031921387,
+ "learning_rate": 8.065395095367848e-06,
+ "loss": 2.8018,
+ "step": 444
+ },
+ {
+ "epoch": 1.2125340599455041,
+ "grad_norm": 12.02476692199707,
+ "learning_rate": 8.083560399636694e-06,
+ "loss": 2.7852,
+ "step": 445
+ },
+ {
+ "epoch": 1.215258855585831,
+ "grad_norm": 11.377335548400879,
+ "learning_rate": 8.10172570390554e-06,
+ "loss": 2.6895,
+ "step": 446
+ },
+ {
+ "epoch": 1.2179836512261581,
+ "grad_norm": 9.653413772583008,
+ "learning_rate": 8.119891008174388e-06,
+ "loss": 2.5435,
+ "step": 447
+ },
+ {
+ "epoch": 1.220708446866485,
+ "grad_norm": 10.20368480682373,
+ "learning_rate": 8.138056312443235e-06,
+ "loss": 2.71,
+ "step": 448
+ },
+ {
+ "epoch": 1.223433242506812,
+ "grad_norm": 10.484225273132324,
+ "learning_rate": 8.15622161671208e-06,
+ "loss": 2.5337,
+ "step": 449
+ },
+ {
+ "epoch": 1.226158038147139,
+ "grad_norm": 13.753677368164062,
+ "learning_rate": 8.174386920980927e-06,
+ "loss": 2.7847,
+ "step": 450
+ },
+ {
+ "epoch": 1.228882833787466,
+ "grad_norm": 11.210610389709473,
+ "learning_rate": 8.192552225249773e-06,
+ "loss": 2.6738,
+ "step": 451
+ },
+ {
+ "epoch": 1.231607629427793,
+ "grad_norm": 10.580645561218262,
+ "learning_rate": 8.210717529518621e-06,
+ "loss": 2.6934,
+ "step": 452
+ },
+ {
+ "epoch": 1.2343324250681198,
+ "grad_norm": 10.421024322509766,
+ "learning_rate": 8.228882833787467e-06,
+ "loss": 2.7798,
+ "step": 453
+ },
+ {
+ "epoch": 1.237057220708447,
+ "grad_norm": 11.129182815551758,
+ "learning_rate": 8.247048138056313e-06,
+ "loss": 2.6597,
+ "step": 454
+ },
+ {
+ "epoch": 1.2397820163487738,
+ "grad_norm": 11.662261009216309,
+ "learning_rate": 8.26521344232516e-06,
+ "loss": 2.6504,
+ "step": 455
+ },
+ {
+ "epoch": 1.2425068119891007,
+ "grad_norm": 29.719701766967773,
+ "learning_rate": 8.283378746594006e-06,
+ "loss": 2.9678,
+ "step": 456
+ },
+ {
+ "epoch": 1.2452316076294279,
+ "grad_norm": 10.148482322692871,
+ "learning_rate": 8.301544050862853e-06,
+ "loss": 2.5928,
+ "step": 457
+ },
+ {
+ "epoch": 1.2479564032697548,
+ "grad_norm": 10.919842720031738,
+ "learning_rate": 8.3197093551317e-06,
+ "loss": 2.6074,
+ "step": 458
+ },
+ {
+ "epoch": 1.2506811989100817,
+ "grad_norm": 11.2857027053833,
+ "learning_rate": 8.337874659400546e-06,
+ "loss": 2.7573,
+ "step": 459
+ },
+ {
+ "epoch": 1.2534059945504088,
+ "grad_norm": 10.820455551147461,
+ "learning_rate": 8.356039963669392e-06,
+ "loss": 2.4141,
+ "step": 460
+ },
+ {
+ "epoch": 1.2561307901907357,
+ "grad_norm": 14.457060813903809,
+ "learning_rate": 8.37420526793824e-06,
+ "loss": 2.8892,
+ "step": 461
+ },
+ {
+ "epoch": 1.2588555858310626,
+ "grad_norm": 8.9891939163208,
+ "learning_rate": 8.392370572207084e-06,
+ "loss": 2.8398,
+ "step": 462
+ },
+ {
+ "epoch": 1.2615803814713895,
+ "grad_norm": 11.050307273864746,
+ "learning_rate": 8.410535876475932e-06,
+ "loss": 2.6924,
+ "step": 463
+ },
+ {
+ "epoch": 1.2643051771117166,
+ "grad_norm": 10.814742088317871,
+ "learning_rate": 8.428701180744778e-06,
+ "loss": 2.6929,
+ "step": 464
+ },
+ {
+ "epoch": 1.2670299727520435,
+ "grad_norm": 11.274110794067383,
+ "learning_rate": 8.446866485013624e-06,
+ "loss": 2.5933,
+ "step": 465
+ },
+ {
+ "epoch": 1.2697547683923704,
+ "grad_norm": 13.799680709838867,
+ "learning_rate": 8.46503178928247e-06,
+ "loss": 2.6382,
+ "step": 466
+ },
+ {
+ "epoch": 1.2724795640326976,
+ "grad_norm": 11.533510208129883,
+ "learning_rate": 8.483197093551317e-06,
+ "loss": 2.7002,
+ "step": 467
+ },
+ {
+ "epoch": 1.2752043596730245,
+ "grad_norm": 11.78360366821289,
+ "learning_rate": 8.501362397820165e-06,
+ "loss": 2.5723,
+ "step": 468
+ },
+ {
+ "epoch": 1.2779291553133514,
+ "grad_norm": 14.222066879272461,
+ "learning_rate": 8.51952770208901e-06,
+ "loss": 2.7705,
+ "step": 469
+ },
+ {
+ "epoch": 1.2806539509536785,
+ "grad_norm": 12.54738712310791,
+ "learning_rate": 8.537693006357857e-06,
+ "loss": 2.4131,
+ "step": 470
+ },
+ {
+ "epoch": 1.2833787465940054,
+ "grad_norm": 11.072205543518066,
+ "learning_rate": 8.555858310626703e-06,
+ "loss": 2.7427,
+ "step": 471
+ },
+ {
+ "epoch": 1.2861035422343323,
+ "grad_norm": 11.79690170288086,
+ "learning_rate": 8.574023614895551e-06,
+ "loss": 2.7095,
+ "step": 472
+ },
+ {
+ "epoch": 1.2888283378746594,
+ "grad_norm": 11.124776840209961,
+ "learning_rate": 8.592188919164397e-06,
+ "loss": 2.624,
+ "step": 473
+ },
+ {
+ "epoch": 1.2915531335149864,
+ "grad_norm": 10.043506622314453,
+ "learning_rate": 8.610354223433243e-06,
+ "loss": 2.4404,
+ "step": 474
+ },
+ {
+ "epoch": 1.2942779291553133,
+ "grad_norm": 15.051888465881348,
+ "learning_rate": 8.62851952770209e-06,
+ "loss": 2.833,
+ "step": 475
+ },
+ {
+ "epoch": 1.2970027247956404,
+ "grad_norm": 9.278153419494629,
+ "learning_rate": 8.646684831970936e-06,
+ "loss": 2.5469,
+ "step": 476
+ },
+ {
+ "epoch": 1.2997275204359673,
+ "grad_norm": 12.055374145507812,
+ "learning_rate": 8.664850136239783e-06,
+ "loss": 2.5098,
+ "step": 477
+ },
+ {
+ "epoch": 1.3024523160762942,
+ "grad_norm": 9.819018363952637,
+ "learning_rate": 8.68301544050863e-06,
+ "loss": 2.522,
+ "step": 478
+ },
+ {
+ "epoch": 1.3051771117166213,
+ "grad_norm": 10.395660400390625,
+ "learning_rate": 8.701180744777476e-06,
+ "loss": 2.6792,
+ "step": 479
+ },
+ {
+ "epoch": 1.3079019073569482,
+ "grad_norm": 12.166010856628418,
+ "learning_rate": 8.719346049046322e-06,
+ "loss": 2.5669,
+ "step": 480
+ },
+ {
+ "epoch": 1.3106267029972751,
+ "grad_norm": 23.176393508911133,
+ "learning_rate": 8.73751135331517e-06,
+ "loss": 2.7007,
+ "step": 481
+ },
+ {
+ "epoch": 1.3133514986376023,
+ "grad_norm": 11.619187355041504,
+ "learning_rate": 8.755676657584016e-06,
+ "loss": 2.6953,
+ "step": 482
+ },
+ {
+ "epoch": 1.3160762942779292,
+ "grad_norm": 10.351978302001953,
+ "learning_rate": 8.773841961852862e-06,
+ "loss": 2.6812,
+ "step": 483
+ },
+ {
+ "epoch": 1.318801089918256,
+ "grad_norm": 10.137228012084961,
+ "learning_rate": 8.792007266121708e-06,
+ "loss": 2.4609,
+ "step": 484
+ },
+ {
+ "epoch": 1.3215258855585832,
+ "grad_norm": 11.376115798950195,
+ "learning_rate": 8.810172570390554e-06,
+ "loss": 2.5933,
+ "step": 485
+ },
+ {
+ "epoch": 1.32425068119891,
+ "grad_norm": 10.707823753356934,
+ "learning_rate": 8.828337874659402e-06,
+ "loss": 2.7358,
+ "step": 486
+ },
+ {
+ "epoch": 1.326975476839237,
+ "grad_norm": 11.9663724899292,
+ "learning_rate": 8.846503178928247e-06,
+ "loss": 2.5566,
+ "step": 487
+ },
+ {
+ "epoch": 1.3297002724795641,
+ "grad_norm": 10.451996803283691,
+ "learning_rate": 8.864668483197095e-06,
+ "loss": 2.6133,
+ "step": 488
+ },
+ {
+ "epoch": 1.332425068119891,
+ "grad_norm": 10.462884902954102,
+ "learning_rate": 8.88283378746594e-06,
+ "loss": 2.373,
+ "step": 489
+ },
+ {
+ "epoch": 1.335149863760218,
+ "grad_norm": 11.319975852966309,
+ "learning_rate": 8.900999091734787e-06,
+ "loss": 2.4707,
+ "step": 490
+ },
+ {
+ "epoch": 1.337874659400545,
+ "grad_norm": 11.024785995483398,
+ "learning_rate": 8.919164396003633e-06,
+ "loss": 2.7427,
+ "step": 491
+ },
+ {
+ "epoch": 1.340599455040872,
+ "grad_norm": 12.764436721801758,
+ "learning_rate": 8.937329700272481e-06,
+ "loss": 2.8945,
+ "step": 492
+ },
+ {
+ "epoch": 1.3433242506811989,
+ "grad_norm": 12.335233688354492,
+ "learning_rate": 8.955495004541327e-06,
+ "loss": 2.7842,
+ "step": 493
+ },
+ {
+ "epoch": 1.346049046321526,
+ "grad_norm": 10.881226539611816,
+ "learning_rate": 8.973660308810173e-06,
+ "loss": 2.6929,
+ "step": 494
+ },
+ {
+ "epoch": 1.348773841961853,
+ "grad_norm": 13.029730796813965,
+ "learning_rate": 8.99182561307902e-06,
+ "loss": 2.416,
+ "step": 495
+ },
+ {
+ "epoch": 1.3514986376021798,
+ "grad_norm": 9.454353332519531,
+ "learning_rate": 9.009990917347866e-06,
+ "loss": 2.395,
+ "step": 496
+ },
+ {
+ "epoch": 1.354223433242507,
+ "grad_norm": 10.588221549987793,
+ "learning_rate": 9.028156221616713e-06,
+ "loss": 2.3359,
+ "step": 497
+ },
+ {
+ "epoch": 1.3569482288828338,
+ "grad_norm": 10.198881149291992,
+ "learning_rate": 9.04632152588556e-06,
+ "loss": 2.7339,
+ "step": 498
+ },
+ {
+ "epoch": 1.3596730245231607,
+ "grad_norm": 10.493569374084473,
+ "learning_rate": 9.064486830154406e-06,
+ "loss": 2.769,
+ "step": 499
+ },
+ {
+ "epoch": 1.3623978201634879,
+ "grad_norm": 13.529339790344238,
+ "learning_rate": 9.082652134423252e-06,
+ "loss": 2.6699,
+ "step": 500
+ },
+ {
+ "epoch": 1.3651226158038148,
+ "grad_norm": 12.325822830200195,
+ "learning_rate": 9.1008174386921e-06,
+ "loss": 2.5801,
+ "step": 501
+ },
+ {
+ "epoch": 1.3678474114441417,
+ "grad_norm": 10.57773494720459,
+ "learning_rate": 9.118982742960946e-06,
+ "loss": 2.8398,
+ "step": 502
+ },
+ {
+ "epoch": 1.3705722070844686,
+ "grad_norm": 10.800013542175293,
+ "learning_rate": 9.137148047229792e-06,
+ "loss": 2.7549,
+ "step": 503
+ },
+ {
+ "epoch": 1.3732970027247957,
+ "grad_norm": 12.23603343963623,
+ "learning_rate": 9.155313351498638e-06,
+ "loss": 2.625,
+ "step": 504
+ },
+ {
+ "epoch": 1.3760217983651226,
+ "grad_norm": 10.985679626464844,
+ "learning_rate": 9.173478655767484e-06,
+ "loss": 2.5469,
+ "step": 505
+ },
+ {
+ "epoch": 1.3787465940054495,
+ "grad_norm": 10.75507926940918,
+ "learning_rate": 9.191643960036332e-06,
+ "loss": 2.4526,
+ "step": 506
+ },
+ {
+ "epoch": 1.3814713896457766,
+ "grad_norm": 11.696499824523926,
+ "learning_rate": 9.209809264305178e-06,
+ "loss": 2.5278,
+ "step": 507
+ },
+ {
+ "epoch": 1.3841961852861036,
+ "grad_norm": 12.926390647888184,
+ "learning_rate": 9.227974568574025e-06,
+ "loss": 2.752,
+ "step": 508
+ },
+ {
+ "epoch": 1.3869209809264305,
+ "grad_norm": 9.957062721252441,
+ "learning_rate": 9.24613987284287e-06,
+ "loss": 2.6543,
+ "step": 509
+ },
+ {
+ "epoch": 1.3896457765667574,
+ "grad_norm": 11.469195365905762,
+ "learning_rate": 9.264305177111717e-06,
+ "loss": 2.5161,
+ "step": 510
+ },
+ {
+ "epoch": 1.3923705722070845,
+ "grad_norm": 13.082963943481445,
+ "learning_rate": 9.282470481380565e-06,
+ "loss": 2.6533,
+ "step": 511
+ },
+ {
+ "epoch": 1.3950953678474114,
+ "grad_norm": 8.906614303588867,
+ "learning_rate": 9.300635785649411e-06,
+ "loss": 2.4404,
+ "step": 512
+ },
+ {
+ "epoch": 1.3978201634877383,
+ "grad_norm": 11.93236255645752,
+ "learning_rate": 9.318801089918257e-06,
+ "loss": 2.8286,
+ "step": 513
+ },
+ {
+ "epoch": 1.4005449591280654,
+ "grad_norm": 11.915575981140137,
+ "learning_rate": 9.336966394187103e-06,
+ "loss": 2.6279,
+ "step": 514
+ },
+ {
+ "epoch": 1.4032697547683923,
+ "grad_norm": 10.185914039611816,
+ "learning_rate": 9.355131698455951e-06,
+ "loss": 2.6211,
+ "step": 515
+ },
+ {
+ "epoch": 1.4059945504087192,
+ "grad_norm": 8.432724952697754,
+ "learning_rate": 9.373297002724796e-06,
+ "loss": 2.4209,
+ "step": 516
+ },
+ {
+ "epoch": 1.4087193460490464,
+ "grad_norm": 11.576340675354004,
+ "learning_rate": 9.391462306993643e-06,
+ "loss": 2.8804,
+ "step": 517
+ },
+ {
+ "epoch": 1.4114441416893733,
+ "grad_norm": 14.05243968963623,
+ "learning_rate": 9.40962761126249e-06,
+ "loss": 2.749,
+ "step": 518
+ },
+ {
+ "epoch": 1.4141689373297002,
+ "grad_norm": 13.364104270935059,
+ "learning_rate": 9.427792915531336e-06,
+ "loss": 2.5923,
+ "step": 519
+ },
+ {
+ "epoch": 1.4168937329700273,
+ "grad_norm": 11.277190208435059,
+ "learning_rate": 9.445958219800182e-06,
+ "loss": 2.5156,
+ "step": 520
+ },
+ {
+ "epoch": 1.4196185286103542,
+ "grad_norm": 10.909285545349121,
+ "learning_rate": 9.464123524069028e-06,
+ "loss": 2.4678,
+ "step": 521
+ },
+ {
+ "epoch": 1.422343324250681,
+ "grad_norm": 11.696632385253906,
+ "learning_rate": 9.482288828337876e-06,
+ "loss": 2.8662,
+ "step": 522
+ },
+ {
+ "epoch": 1.4250681198910082,
+ "grad_norm": 11.566356658935547,
+ "learning_rate": 9.500454132606722e-06,
+ "loss": 2.5601,
+ "step": 523
+ },
+ {
+ "epoch": 1.4277929155313351,
+ "grad_norm": 10.315143585205078,
+ "learning_rate": 9.518619436875568e-06,
+ "loss": 2.5898,
+ "step": 524
+ },
+ {
+ "epoch": 1.430517711171662,
+ "grad_norm": 10.548094749450684,
+ "learning_rate": 9.536784741144414e-06,
+ "loss": 2.7236,
+ "step": 525
+ },
+ {
+ "epoch": 1.4332425068119892,
+ "grad_norm": 11.040914535522461,
+ "learning_rate": 9.554950045413262e-06,
+ "loss": 2.4258,
+ "step": 526
+ },
+ {
+ "epoch": 1.435967302452316,
+ "grad_norm": 9.996368408203125,
+ "learning_rate": 9.573115349682108e-06,
+ "loss": 2.3677,
+ "step": 527
+ },
+ {
+ "epoch": 1.438692098092643,
+ "grad_norm": 10.326546669006348,
+ "learning_rate": 9.591280653950955e-06,
+ "loss": 2.5425,
+ "step": 528
+ },
+ {
+ "epoch": 1.44141689373297,
+ "grad_norm": 13.101269721984863,
+ "learning_rate": 9.6094459582198e-06,
+ "loss": 2.8428,
+ "step": 529
+ },
+ {
+ "epoch": 1.444141689373297,
+ "grad_norm": 12.325589179992676,
+ "learning_rate": 9.627611262488647e-06,
+ "loss": 2.6436,
+ "step": 530
+ },
+ {
+ "epoch": 1.446866485013624,
+ "grad_norm": 10.933701515197754,
+ "learning_rate": 9.645776566757495e-06,
+ "loss": 2.3931,
+ "step": 531
+ },
+ {
+ "epoch": 1.449591280653951,
+ "grad_norm": 9.500052452087402,
+ "learning_rate": 9.66394187102634e-06,
+ "loss": 2.3345,
+ "step": 532
+ },
+ {
+ "epoch": 1.452316076294278,
+ "grad_norm": 13.047250747680664,
+ "learning_rate": 9.682107175295187e-06,
+ "loss": 2.7686,
+ "step": 533
+ },
+ {
+ "epoch": 1.4550408719346049,
+ "grad_norm": 12.109979629516602,
+ "learning_rate": 9.700272479564033e-06,
+ "loss": 2.501,
+ "step": 534
+ },
+ {
+ "epoch": 1.457765667574932,
+ "grad_norm": 12.179343223571777,
+ "learning_rate": 9.718437783832881e-06,
+ "loss": 2.5972,
+ "step": 535
+ },
+ {
+ "epoch": 1.4604904632152589,
+ "grad_norm": 9.693185806274414,
+ "learning_rate": 9.736603088101727e-06,
+ "loss": 2.437,
+ "step": 536
+ },
+ {
+ "epoch": 1.4632152588555858,
+ "grad_norm": 12.021675109863281,
+ "learning_rate": 9.754768392370573e-06,
+ "loss": 2.7832,
+ "step": 537
+ },
+ {
+ "epoch": 1.465940054495913,
+ "grad_norm": 13.525501251220703,
+ "learning_rate": 9.77293369663942e-06,
+ "loss": 2.7178,
+ "step": 538
+ },
+ {
+ "epoch": 1.4686648501362398,
+ "grad_norm": 10.672472953796387,
+ "learning_rate": 9.791099000908266e-06,
+ "loss": 2.7441,
+ "step": 539
+ },
+ {
+ "epoch": 1.4713896457765667,
+ "grad_norm": 11.792448043823242,
+ "learning_rate": 9.809264305177114e-06,
+ "loss": 2.4883,
+ "step": 540
+ },
+ {
+ "epoch": 1.4741144414168939,
+ "grad_norm": 11.761456489562988,
+ "learning_rate": 9.827429609445958e-06,
+ "loss": 2.3374,
+ "step": 541
+ },
+ {
+ "epoch": 1.4768392370572208,
+ "grad_norm": 9.928813934326172,
+ "learning_rate": 9.845594913714806e-06,
+ "loss": 2.3564,
+ "step": 542
+ },
+ {
+ "epoch": 1.4795640326975477,
+ "grad_norm": 9.164095878601074,
+ "learning_rate": 9.863760217983652e-06,
+ "loss": 2.2881,
+ "step": 543
+ },
+ {
+ "epoch": 1.4822888283378748,
+ "grad_norm": 8.395923614501953,
+ "learning_rate": 9.881925522252498e-06,
+ "loss": 2.5308,
+ "step": 544
+ },
+ {
+ "epoch": 1.4850136239782017,
+ "grad_norm": 11.917168617248535,
+ "learning_rate": 9.900090826521344e-06,
+ "loss": 2.4995,
+ "step": 545
+ },
+ {
+ "epoch": 1.4877384196185286,
+ "grad_norm": 10.364140510559082,
+ "learning_rate": 9.918256130790192e-06,
+ "loss": 2.5234,
+ "step": 546
+ },
+ {
+ "epoch": 1.4904632152588557,
+ "grad_norm": 9.905284881591797,
+ "learning_rate": 9.936421435059038e-06,
+ "loss": 2.6123,
+ "step": 547
+ },
+ {
+ "epoch": 1.4931880108991826,
+ "grad_norm": 10.341503143310547,
+ "learning_rate": 9.954586739327885e-06,
+ "loss": 2.6328,
+ "step": 548
+ },
+ {
+ "epoch": 1.4959128065395095,
+ "grad_norm": 9.595457077026367,
+ "learning_rate": 9.97275204359673e-06,
+ "loss": 2.4976,
+ "step": 549
+ },
+ {
+ "epoch": 1.4986376021798364,
+ "grad_norm": 8.586732864379883,
+ "learning_rate": 9.990917347865577e-06,
+ "loss": 2.3501,
+ "step": 550
+ },
+ {
+ "epoch": 1.5013623978201633,
+ "grad_norm": 10.91036605834961,
+ "learning_rate": 1.0009082652134423e-05,
+ "loss": 2.5,
+ "step": 551
+ },
+ {
+ "epoch": 1.5040871934604905,
+ "grad_norm": 10.423352241516113,
+ "learning_rate": 1.002724795640327e-05,
+ "loss": 2.6089,
+ "step": 552
+ },
+ {
+ "epoch": 1.5068119891008176,
+ "grad_norm": 9.540590286254883,
+ "learning_rate": 1.0045413260672117e-05,
+ "loss": 2.4922,
+ "step": 553
+ },
+ {
+ "epoch": 1.5095367847411443,
+ "grad_norm": 11.419909477233887,
+ "learning_rate": 1.0063578564940963e-05,
+ "loss": 2.6396,
+ "step": 554
+ },
+ {
+ "epoch": 1.5122615803814714,
+ "grad_norm": 14.756720542907715,
+ "learning_rate": 1.008174386920981e-05,
+ "loss": 2.7812,
+ "step": 555
+ },
+ {
+ "epoch": 1.5149863760217985,
+ "grad_norm": 10.618692398071289,
+ "learning_rate": 1.0099909173478657e-05,
+ "loss": 2.5645,
+ "step": 556
+ },
+ {
+ "epoch": 1.5177111716621252,
+ "grad_norm": 9.123624801635742,
+ "learning_rate": 1.0118074477747503e-05,
+ "loss": 2.6064,
+ "step": 557
+ },
+ {
+ "epoch": 1.5204359673024523,
+ "grad_norm": 10.515607833862305,
+ "learning_rate": 1.0136239782016351e-05,
+ "loss": 2.5498,
+ "step": 558
+ },
+ {
+ "epoch": 1.5231607629427792,
+ "grad_norm": 15.523499488830566,
+ "learning_rate": 1.0154405086285196e-05,
+ "loss": 2.4937,
+ "step": 559
+ },
+ {
+ "epoch": 1.5258855585831061,
+ "grad_norm": 13.398969650268555,
+ "learning_rate": 1.0172570390554042e-05,
+ "loss": 2.667,
+ "step": 560
+ },
+ {
+ "epoch": 1.5286103542234333,
+ "grad_norm": 9.918622970581055,
+ "learning_rate": 1.0190735694822888e-05,
+ "loss": 2.4619,
+ "step": 561
+ },
+ {
+ "epoch": 1.5313351498637602,
+ "grad_norm": 11.595111846923828,
+ "learning_rate": 1.0208900999091736e-05,
+ "loss": 2.4878,
+ "step": 562
+ },
+ {
+ "epoch": 1.534059945504087,
+ "grad_norm": 9.246755599975586,
+ "learning_rate": 1.0227066303360582e-05,
+ "loss": 2.5894,
+ "step": 563
+ },
+ {
+ "epoch": 1.5367847411444142,
+ "grad_norm": 13.432228088378906,
+ "learning_rate": 1.0245231607629428e-05,
+ "loss": 2.7573,
+ "step": 564
+ },
+ {
+ "epoch": 1.5395095367847411,
+ "grad_norm": 10.047687530517578,
+ "learning_rate": 1.0263396911898276e-05,
+ "loss": 2.25,
+ "step": 565
+ },
+ {
+ "epoch": 1.542234332425068,
+ "grad_norm": 13.986072540283203,
+ "learning_rate": 1.0281562216167122e-05,
+ "loss": 2.6641,
+ "step": 566
+ },
+ {
+ "epoch": 1.5449591280653951,
+ "grad_norm": 11.353102684020996,
+ "learning_rate": 1.0299727520435968e-05,
+ "loss": 2.6831,
+ "step": 567
+ },
+ {
+ "epoch": 1.547683923705722,
+ "grad_norm": 11.442963600158691,
+ "learning_rate": 1.0317892824704815e-05,
+ "loss": 2.3428,
+ "step": 568
+ },
+ {
+ "epoch": 1.550408719346049,
+ "grad_norm": 10.155078887939453,
+ "learning_rate": 1.033605812897366e-05,
+ "loss": 2.4673,
+ "step": 569
+ },
+ {
+ "epoch": 1.553133514986376,
+ "grad_norm": 9.572172164916992,
+ "learning_rate": 1.0354223433242507e-05,
+ "loss": 2.606,
+ "step": 570
+ },
+ {
+ "epoch": 1.555858310626703,
+ "grad_norm": 11.651671409606934,
+ "learning_rate": 1.0372388737511355e-05,
+ "loss": 2.5181,
+ "step": 571
+ },
+ {
+ "epoch": 1.55858310626703,
+ "grad_norm": 10.545559883117676,
+ "learning_rate": 1.0390554041780201e-05,
+ "loss": 2.3989,
+ "step": 572
+ },
+ {
+ "epoch": 1.561307901907357,
+ "grad_norm": 11.466548919677734,
+ "learning_rate": 1.0408719346049047e-05,
+ "loss": 2.5503,
+ "step": 573
+ },
+ {
+ "epoch": 1.564032697547684,
+ "grad_norm": 11.771925926208496,
+ "learning_rate": 1.0426884650317895e-05,
+ "loss": 2.6226,
+ "step": 574
+ },
+ {
+ "epoch": 1.5667574931880108,
+ "grad_norm": 9.880620956420898,
+ "learning_rate": 1.0445049954586741e-05,
+ "loss": 2.4404,
+ "step": 575
+ },
+ {
+ "epoch": 1.569482288828338,
+ "grad_norm": 11.97048568725586,
+ "learning_rate": 1.0463215258855586e-05,
+ "loss": 2.6875,
+ "step": 576
+ },
+ {
+ "epoch": 1.5722070844686649,
+ "grad_norm": 13.414999008178711,
+ "learning_rate": 1.0481380563124432e-05,
+ "loss": 2.6855,
+ "step": 577
+ },
+ {
+ "epoch": 1.5749318801089918,
+ "grad_norm": 11.781789779663086,
+ "learning_rate": 1.049954586739328e-05,
+ "loss": 2.4966,
+ "step": 578
+ },
+ {
+ "epoch": 1.577656675749319,
+ "grad_norm": 18.100326538085938,
+ "learning_rate": 1.0517711171662126e-05,
+ "loss": 2.6426,
+ "step": 579
+ },
+ {
+ "epoch": 1.5803814713896458,
+ "grad_norm": 11.263434410095215,
+ "learning_rate": 1.0535876475930974e-05,
+ "loss": 2.5903,
+ "step": 580
+ },
+ {
+ "epoch": 1.5831062670299727,
+ "grad_norm": 11.495070457458496,
+ "learning_rate": 1.055404178019982e-05,
+ "loss": 2.4575,
+ "step": 581
+ },
+ {
+ "epoch": 1.5858310626702998,
+ "grad_norm": 9.964534759521484,
+ "learning_rate": 1.0572207084468666e-05,
+ "loss": 2.5522,
+ "step": 582
+ },
+ {
+ "epoch": 1.5885558583106267,
+ "grad_norm": 11.702447891235352,
+ "learning_rate": 1.0590372388737514e-05,
+ "loss": 2.3389,
+ "step": 583
+ },
+ {
+ "epoch": 1.5912806539509536,
+ "grad_norm": 9.268019676208496,
+ "learning_rate": 1.0608537693006358e-05,
+ "loss": 2.269,
+ "step": 584
+ },
+ {
+ "epoch": 1.5940054495912808,
+ "grad_norm": 15.74026870727539,
+ "learning_rate": 1.0626702997275204e-05,
+ "loss": 2.3662,
+ "step": 585
+ },
+ {
+ "epoch": 1.5967302452316077,
+ "grad_norm": 10.973413467407227,
+ "learning_rate": 1.064486830154405e-05,
+ "loss": 2.6699,
+ "step": 586
+ },
+ {
+ "epoch": 1.5994550408719346,
+ "grad_norm": 13.940545082092285,
+ "learning_rate": 1.0663033605812898e-05,
+ "loss": 2.668,
+ "step": 587
+ },
+ {
+ "epoch": 1.6021798365122617,
+ "grad_norm": 9.798370361328125,
+ "learning_rate": 1.0681198910081745e-05,
+ "loss": 2.5801,
+ "step": 588
+ },
+ {
+ "epoch": 1.6049046321525886,
+ "grad_norm": 10.114641189575195,
+ "learning_rate": 1.069936421435059e-05,
+ "loss": 2.3628,
+ "step": 589
+ },
+ {
+ "epoch": 1.6076294277929155,
+ "grad_norm": 13.61198616027832,
+ "learning_rate": 1.0717529518619439e-05,
+ "loss": 2.3149,
+ "step": 590
+ },
+ {
+ "epoch": 1.6103542234332426,
+ "grad_norm": 11.84930419921875,
+ "learning_rate": 1.0735694822888285e-05,
+ "loss": 2.1602,
+ "step": 591
+ },
+ {
+ "epoch": 1.6130790190735693,
+ "grad_norm": 11.23861026763916,
+ "learning_rate": 1.075386012715713e-05,
+ "loss": 2.5112,
+ "step": 592
+ },
+ {
+ "epoch": 1.6158038147138964,
+ "grad_norm": 12.049510955810547,
+ "learning_rate": 1.0772025431425977e-05,
+ "loss": 2.499,
+ "step": 593
+ },
+ {
+ "epoch": 1.6185286103542236,
+ "grad_norm": 11.305673599243164,
+ "learning_rate": 1.0790190735694823e-05,
+ "loss": 2.4512,
+ "step": 594
+ },
+ {
+ "epoch": 1.6212534059945503,
+ "grad_norm": 8.980688095092773,
+ "learning_rate": 1.080835603996367e-05,
+ "loss": 2.2471,
+ "step": 595
+ },
+ {
+ "epoch": 1.6239782016348774,
+ "grad_norm": 13.167588233947754,
+ "learning_rate": 1.0826521344232517e-05,
+ "loss": 2.4492,
+ "step": 596
+ },
+ {
+ "epoch": 1.6267029972752045,
+ "grad_norm": 13.362232208251953,
+ "learning_rate": 1.0844686648501363e-05,
+ "loss": 2.3589,
+ "step": 597
+ },
+ {
+ "epoch": 1.6294277929155312,
+ "grad_norm": 13.432881355285645,
+ "learning_rate": 1.086285195277021e-05,
+ "loss": 2.3999,
+ "step": 598
+ },
+ {
+ "epoch": 1.6321525885558583,
+ "grad_norm": 10.197798728942871,
+ "learning_rate": 1.0881017257039057e-05,
+ "loss": 2.4595,
+ "step": 599
+ },
+ {
+ "epoch": 1.6348773841961854,
+ "grad_norm": 12.196104049682617,
+ "learning_rate": 1.0899182561307904e-05,
+ "loss": 2.5488,
+ "step": 600
+ },
+ {
+ "epoch": 1.6376021798365121,
+ "grad_norm": 10.602243423461914,
+ "learning_rate": 1.0917347865576748e-05,
+ "loss": 2.6128,
+ "step": 601
+ },
+ {
+ "epoch": 1.6403269754768393,
+ "grad_norm": 11.960326194763184,
+ "learning_rate": 1.0935513169845596e-05,
+ "loss": 2.6465,
+ "step": 602
+ },
+ {
+ "epoch": 1.6430517711171662,
+ "grad_norm": 12.77395248413086,
+ "learning_rate": 1.0953678474114442e-05,
+ "loss": 2.7295,
+ "step": 603
+ },
+ {
+ "epoch": 1.645776566757493,
+ "grad_norm": 14.705750465393066,
+ "learning_rate": 1.0971843778383288e-05,
+ "loss": 2.5347,
+ "step": 604
+ },
+ {
+ "epoch": 1.6485013623978202,
+ "grad_norm": 9.935203552246094,
+ "learning_rate": 1.0990009082652136e-05,
+ "loss": 2.1514,
+ "step": 605
+ },
+ {
+ "epoch": 1.651226158038147,
+ "grad_norm": 11.95473575592041,
+ "learning_rate": 1.1008174386920982e-05,
+ "loss": 2.5923,
+ "step": 606
+ },
+ {
+ "epoch": 1.653950953678474,
+ "grad_norm": 14.375449180603027,
+ "learning_rate": 1.1026339691189828e-05,
+ "loss": 2.6475,
+ "step": 607
+ },
+ {
+ "epoch": 1.6566757493188011,
+ "grad_norm": 10.64272689819336,
+ "learning_rate": 1.1044504995458676e-05,
+ "loss": 2.4312,
+ "step": 608
+ },
+ {
+ "epoch": 1.659400544959128,
+ "grad_norm": 12.748344421386719,
+ "learning_rate": 1.106267029972752e-05,
+ "loss": 2.4067,
+ "step": 609
+ },
+ {
+ "epoch": 1.662125340599455,
+ "grad_norm": 10.088484764099121,
+ "learning_rate": 1.1080835603996367e-05,
+ "loss": 2.4624,
+ "step": 610
+ },
+ {
+ "epoch": 1.664850136239782,
+ "grad_norm": 11.537372589111328,
+ "learning_rate": 1.1099000908265215e-05,
+ "loss": 2.3145,
+ "step": 611
+ },
+ {
+ "epoch": 1.667574931880109,
+ "grad_norm": 10.860895156860352,
+ "learning_rate": 1.1117166212534061e-05,
+ "loss": 2.4912,
+ "step": 612
+ },
+ {
+ "epoch": 1.6702997275204359,
+ "grad_norm": 11.544546127319336,
+ "learning_rate": 1.1135331516802907e-05,
+ "loss": 2.6802,
+ "step": 613
+ },
+ {
+ "epoch": 1.673024523160763,
+ "grad_norm": 12.035743713378906,
+ "learning_rate": 1.1153496821071755e-05,
+ "loss": 2.3105,
+ "step": 614
+ },
+ {
+ "epoch": 1.67574931880109,
+ "grad_norm": 11.289690971374512,
+ "learning_rate": 1.1171662125340601e-05,
+ "loss": 2.3843,
+ "step": 615
+ },
+ {
+ "epoch": 1.6784741144414168,
+ "grad_norm": 10.212812423706055,
+ "learning_rate": 1.1189827429609447e-05,
+ "loss": 2.7515,
+ "step": 616
+ },
+ {
+ "epoch": 1.681198910081744,
+ "grad_norm": 11.834221839904785,
+ "learning_rate": 1.1207992733878292e-05,
+ "loss": 2.6309,
+ "step": 617
+ },
+ {
+ "epoch": 1.6839237057220708,
+ "grad_norm": 10.995518684387207,
+ "learning_rate": 1.122615803814714e-05,
+ "loss": 2.4917,
+ "step": 618
+ },
+ {
+ "epoch": 1.6866485013623977,
+ "grad_norm": 11.77338695526123,
+ "learning_rate": 1.1244323342415986e-05,
+ "loss": 2.6064,
+ "step": 619
+ },
+ {
+ "epoch": 1.6893732970027249,
+ "grad_norm": 11.592185020446777,
+ "learning_rate": 1.1262488646684832e-05,
+ "loss": 2.4995,
+ "step": 620
+ },
+ {
+ "epoch": 1.6920980926430518,
+ "grad_norm": 10.184931755065918,
+ "learning_rate": 1.128065395095368e-05,
+ "loss": 2.3975,
+ "step": 621
+ },
+ {
+ "epoch": 1.6948228882833787,
+ "grad_norm": 9.818941116333008,
+ "learning_rate": 1.1298819255222526e-05,
+ "loss": 2.5396,
+ "step": 622
+ },
+ {
+ "epoch": 1.6975476839237058,
+ "grad_norm": 12.17223834991455,
+ "learning_rate": 1.1316984559491374e-05,
+ "loss": 2.4321,
+ "step": 623
+ },
+ {
+ "epoch": 1.7002724795640327,
+ "grad_norm": 10.2310152053833,
+ "learning_rate": 1.133514986376022e-05,
+ "loss": 2.3984,
+ "step": 624
+ },
+ {
+ "epoch": 1.7029972752043596,
+ "grad_norm": 11.413909912109375,
+ "learning_rate": 1.1353315168029066e-05,
+ "loss": 2.5557,
+ "step": 625
+ },
+ {
+ "epoch": 1.7057220708446867,
+ "grad_norm": 10.546042442321777,
+ "learning_rate": 1.137148047229791e-05,
+ "loss": 2.6455,
+ "step": 626
+ },
+ {
+ "epoch": 1.7084468664850136,
+ "grad_norm": 13.648941040039062,
+ "learning_rate": 1.1389645776566758e-05,
+ "loss": 2.5625,
+ "step": 627
+ },
+ {
+ "epoch": 1.7111716621253406,
+ "grad_norm": 14.775775909423828,
+ "learning_rate": 1.1407811080835605e-05,
+ "loss": 2.4966,
+ "step": 628
+ },
+ {
+ "epoch": 1.7138964577656677,
+ "grad_norm": 20.476844787597656,
+ "learning_rate": 1.142597638510445e-05,
+ "loss": 2.479,
+ "step": 629
+ },
+ {
+ "epoch": 1.7166212534059946,
+ "grad_norm": 10.364046096801758,
+ "learning_rate": 1.1444141689373299e-05,
+ "loss": 2.6875,
+ "step": 630
+ },
+ {
+ "epoch": 1.7193460490463215,
+ "grad_norm": 8.582182884216309,
+ "learning_rate": 1.1462306993642145e-05,
+ "loss": 2.144,
+ "step": 631
+ },
+ {
+ "epoch": 1.7220708446866486,
+ "grad_norm": 10.024995803833008,
+ "learning_rate": 1.1480472297910991e-05,
+ "loss": 2.4619,
+ "step": 632
+ },
+ {
+ "epoch": 1.7247956403269755,
+ "grad_norm": 8.943358421325684,
+ "learning_rate": 1.1498637602179839e-05,
+ "loss": 2.4033,
+ "step": 633
+ },
+ {
+ "epoch": 1.7275204359673024,
+ "grad_norm": 12.314430236816406,
+ "learning_rate": 1.1516802906448683e-05,
+ "loss": 2.3384,
+ "step": 634
+ },
+ {
+ "epoch": 1.7302452316076296,
+ "grad_norm": 11.263984680175781,
+ "learning_rate": 1.153496821071753e-05,
+ "loss": 2.6621,
+ "step": 635
+ },
+ {
+ "epoch": 1.7329700272479565,
+ "grad_norm": 11.925774574279785,
+ "learning_rate": 1.1553133514986377e-05,
+ "loss": 2.1382,
+ "step": 636
+ },
+ {
+ "epoch": 1.7356948228882834,
+ "grad_norm": 10.014432907104492,
+ "learning_rate": 1.1571298819255223e-05,
+ "loss": 2.1636,
+ "step": 637
+ },
+ {
+ "epoch": 1.7384196185286105,
+ "grad_norm": 11.657225608825684,
+ "learning_rate": 1.158946412352407e-05,
+ "loss": 2.458,
+ "step": 638
+ },
+ {
+ "epoch": 1.7411444141689372,
+ "grad_norm": 20.94296646118164,
+ "learning_rate": 1.1607629427792917e-05,
+ "loss": 2.6333,
+ "step": 639
+ },
+ {
+ "epoch": 1.7438692098092643,
+ "grad_norm": 12.757229804992676,
+ "learning_rate": 1.1625794732061764e-05,
+ "loss": 2.3477,
+ "step": 640
+ },
+ {
+ "epoch": 1.7465940054495914,
+ "grad_norm": 12.054852485656738,
+ "learning_rate": 1.164396003633061e-05,
+ "loss": 2.4404,
+ "step": 641
+ },
+ {
+ "epoch": 1.749318801089918,
+ "grad_norm": 14.641657829284668,
+ "learning_rate": 1.1662125340599454e-05,
+ "loss": 2.3457,
+ "step": 642
+ },
+ {
+ "epoch": 1.7520435967302452,
+ "grad_norm": 10.225979804992676,
+ "learning_rate": 1.1680290644868302e-05,
+ "loss": 2.481,
+ "step": 643
+ },
+ {
+ "epoch": 1.7547683923705724,
+ "grad_norm": 13.0012788772583,
+ "learning_rate": 1.1698455949137148e-05,
+ "loss": 2.375,
+ "step": 644
+ },
+ {
+ "epoch": 1.757493188010899,
+ "grad_norm": 12.893733978271484,
+ "learning_rate": 1.1716621253405996e-05,
+ "loss": 2.7119,
+ "step": 645
+ },
+ {
+ "epoch": 1.7602179836512262,
+ "grad_norm": 10.805425643920898,
+ "learning_rate": 1.1734786557674842e-05,
+ "loss": 2.4614,
+ "step": 646
+ },
+ {
+ "epoch": 1.7629427792915533,
+ "grad_norm": 11.27730941772461,
+ "learning_rate": 1.1752951861943688e-05,
+ "loss": 2.4028,
+ "step": 647
+ },
+ {
+ "epoch": 1.76566757493188,
+ "grad_norm": 10.970818519592285,
+ "learning_rate": 1.1771117166212536e-05,
+ "loss": 2.4282,
+ "step": 648
+ },
+ {
+ "epoch": 1.768392370572207,
+ "grad_norm": 10.74846076965332,
+ "learning_rate": 1.1789282470481382e-05,
+ "loss": 2.2319,
+ "step": 649
+ },
+ {
+ "epoch": 1.771117166212534,
+ "grad_norm": 11.724044799804688,
+ "learning_rate": 1.1807447774750227e-05,
+ "loss": 2.583,
+ "step": 650
+ },
+ {
+ "epoch": 1.773841961852861,
+ "grad_norm": 11.138653755187988,
+ "learning_rate": 1.1825613079019073e-05,
+ "loss": 2.3076,
+ "step": 651
+ },
+ {
+ "epoch": 1.776566757493188,
+ "grad_norm": 14.40742015838623,
+ "learning_rate": 1.1843778383287921e-05,
+ "loss": 2.4297,
+ "step": 652
+ },
+ {
+ "epoch": 1.779291553133515,
+ "grad_norm": 10.167417526245117,
+ "learning_rate": 1.1861943687556767e-05,
+ "loss": 2.4209,
+ "step": 653
+ },
+ {
+ "epoch": 1.7820163487738419,
+ "grad_norm": 11.244752883911133,
+ "learning_rate": 1.1880108991825613e-05,
+ "loss": 2.3984,
+ "step": 654
+ },
+ {
+ "epoch": 1.784741144414169,
+ "grad_norm": 7.9195685386657715,
+ "learning_rate": 1.1898274296094461e-05,
+ "loss": 2.1392,
+ "step": 655
+ },
+ {
+ "epoch": 1.7874659400544959,
+ "grad_norm": 12.2032470703125,
+ "learning_rate": 1.1916439600363307e-05,
+ "loss": 2.3579,
+ "step": 656
+ },
+ {
+ "epoch": 1.7901907356948228,
+ "grad_norm": 9.648261070251465,
+ "learning_rate": 1.1934604904632155e-05,
+ "loss": 2.2925,
+ "step": 657
+ },
+ {
+ "epoch": 1.79291553133515,
+ "grad_norm": 12.435829162597656,
+ "learning_rate": 1.1952770208901001e-05,
+ "loss": 2.5117,
+ "step": 658
+ },
+ {
+ "epoch": 1.7956403269754768,
+ "grad_norm": 13.42502498626709,
+ "learning_rate": 1.1970935513169846e-05,
+ "loss": 2.6919,
+ "step": 659
+ },
+ {
+ "epoch": 1.7983651226158037,
+ "grad_norm": 13.266587257385254,
+ "learning_rate": 1.1989100817438692e-05,
+ "loss": 2.3936,
+ "step": 660
+ },
+ {
+ "epoch": 1.8010899182561309,
+ "grad_norm": 11.673394203186035,
+ "learning_rate": 1.200726612170754e-05,
+ "loss": 2.2725,
+ "step": 661
+ },
+ {
+ "epoch": 1.8038147138964578,
+ "grad_norm": 10.024274826049805,
+ "learning_rate": 1.2025431425976386e-05,
+ "loss": 2.4785,
+ "step": 662
+ },
+ {
+ "epoch": 1.8065395095367847,
+ "grad_norm": 8.943089485168457,
+ "learning_rate": 1.2043596730245232e-05,
+ "loss": 2.3887,
+ "step": 663
+ },
+ {
+ "epoch": 1.8092643051771118,
+ "grad_norm": 12.43687629699707,
+ "learning_rate": 1.206176203451408e-05,
+ "loss": 2.355,
+ "step": 664
+ },
+ {
+ "epoch": 1.8119891008174387,
+ "grad_norm": 8.887104988098145,
+ "learning_rate": 1.2079927338782926e-05,
+ "loss": 2.3379,
+ "step": 665
+ },
+ {
+ "epoch": 1.8147138964577656,
+ "grad_norm": 16.104576110839844,
+ "learning_rate": 1.2098092643051772e-05,
+ "loss": 2.4424,
+ "step": 666
+ },
+ {
+ "epoch": 1.8174386920980927,
+ "grad_norm": 15.355511665344238,
+ "learning_rate": 1.2116257947320618e-05,
+ "loss": 2.4673,
+ "step": 667
+ },
+ {
+ "epoch": 1.8201634877384196,
+ "grad_norm": 18.361045837402344,
+ "learning_rate": 1.2134423251589465e-05,
+ "loss": 2.6831,
+ "step": 668
+ },
+ {
+ "epoch": 1.8228882833787465,
+ "grad_norm": 9.65218448638916,
+ "learning_rate": 1.215258855585831e-05,
+ "loss": 2.4902,
+ "step": 669
+ },
+ {
+ "epoch": 1.8256130790190737,
+ "grad_norm": 10.684483528137207,
+ "learning_rate": 1.2170753860127159e-05,
+ "loss": 2.3867,
+ "step": 670
+ },
+ {
+ "epoch": 1.8283378746594006,
+ "grad_norm": 9.706910133361816,
+ "learning_rate": 1.2188919164396005e-05,
+ "loss": 2.2607,
+ "step": 671
+ },
+ {
+ "epoch": 1.8310626702997275,
+ "grad_norm": 11.646918296813965,
+ "learning_rate": 1.2207084468664851e-05,
+ "loss": 2.2642,
+ "step": 672
+ },
+ {
+ "epoch": 1.8337874659400546,
+ "grad_norm": 11.801918029785156,
+ "learning_rate": 1.2225249772933699e-05,
+ "loss": 2.3691,
+ "step": 673
+ },
+ {
+ "epoch": 1.8365122615803815,
+ "grad_norm": 11.345173835754395,
+ "learning_rate": 1.2243415077202545e-05,
+ "loss": 2.4072,
+ "step": 674
+ },
+ {
+ "epoch": 1.8392370572207084,
+ "grad_norm": 11.49028205871582,
+ "learning_rate": 1.226158038147139e-05,
+ "loss": 2.4395,
+ "step": 675
+ },
+ {
+ "epoch": 1.8419618528610355,
+ "grad_norm": 11.581648826599121,
+ "learning_rate": 1.2279745685740236e-05,
+ "loss": 2.1338,
+ "step": 676
+ },
+ {
+ "epoch": 1.8446866485013624,
+ "grad_norm": 9.466208457946777,
+ "learning_rate": 1.2297910990009083e-05,
+ "loss": 2.29,
+ "step": 677
+ },
+ {
+ "epoch": 1.8474114441416893,
+ "grad_norm": 10.945378303527832,
+ "learning_rate": 1.231607629427793e-05,
+ "loss": 2.4863,
+ "step": 678
+ },
+ {
+ "epoch": 1.8501362397820165,
+ "grad_norm": 11.229761123657227,
+ "learning_rate": 1.2334241598546777e-05,
+ "loss": 2.4067,
+ "step": 679
+ },
+ {
+ "epoch": 1.8528610354223434,
+ "grad_norm": 13.484183311462402,
+ "learning_rate": 1.2352406902815624e-05,
+ "loss": 2.4678,
+ "step": 680
+ },
+ {
+ "epoch": 1.8555858310626703,
+ "grad_norm": 12.50755500793457,
+ "learning_rate": 1.237057220708447e-05,
+ "loss": 2.7646,
+ "step": 681
+ },
+ {
+ "epoch": 1.8583106267029974,
+ "grad_norm": 12.71037769317627,
+ "learning_rate": 1.2388737511353318e-05,
+ "loss": 2.2935,
+ "step": 682
+ },
+ {
+ "epoch": 1.861035422343324,
+ "grad_norm": 9.98797607421875,
+ "learning_rate": 1.2406902815622162e-05,
+ "loss": 2.1328,
+ "step": 683
+ },
+ {
+ "epoch": 1.8637602179836512,
+ "grad_norm": 10.682023048400879,
+ "learning_rate": 1.2425068119891008e-05,
+ "loss": 2.1211,
+ "step": 684
+ },
+ {
+ "epoch": 1.8664850136239783,
+ "grad_norm": 10.15453815460205,
+ "learning_rate": 1.2443233424159854e-05,
+ "loss": 2.3521,
+ "step": 685
+ },
+ {
+ "epoch": 1.869209809264305,
+ "grad_norm": 10.65381908416748,
+ "learning_rate": 1.2461398728428702e-05,
+ "loss": 2.3804,
+ "step": 686
+ },
+ {
+ "epoch": 1.8719346049046321,
+ "grad_norm": 12.174696922302246,
+ "learning_rate": 1.2479564032697548e-05,
+ "loss": 2.4795,
+ "step": 687
+ },
+ {
+ "epoch": 1.8746594005449593,
+ "grad_norm": 10.093709945678711,
+ "learning_rate": 1.2497729336966395e-05,
+ "loss": 2.3071,
+ "step": 688
+ },
+ {
+ "epoch": 1.877384196185286,
+ "grad_norm": 9.991334915161133,
+ "learning_rate": 1.2515894641235242e-05,
+ "loss": 2.2856,
+ "step": 689
+ },
+ {
+ "epoch": 1.880108991825613,
+ "grad_norm": 10.812753677368164,
+ "learning_rate": 1.2534059945504089e-05,
+ "loss": 2.314,
+ "step": 690
+ },
+ {
+ "epoch": 1.8828337874659402,
+ "grad_norm": 10.286032676696777,
+ "learning_rate": 1.2552225249772936e-05,
+ "loss": 2.3818,
+ "step": 691
+ },
+ {
+ "epoch": 1.885558583106267,
+ "grad_norm": 9.558748245239258,
+ "learning_rate": 1.2570390554041781e-05,
+ "loss": 2.2256,
+ "step": 692
+ },
+ {
+ "epoch": 1.888283378746594,
+ "grad_norm": 12.837057113647461,
+ "learning_rate": 1.2588555858310627e-05,
+ "loss": 2.5161,
+ "step": 693
+ },
+ {
+ "epoch": 1.891008174386921,
+ "grad_norm": 12.383069038391113,
+ "learning_rate": 1.2606721162579473e-05,
+ "loss": 2.6084,
+ "step": 694
+ },
+ {
+ "epoch": 1.8937329700272478,
+ "grad_norm": 12.400851249694824,
+ "learning_rate": 1.2624886466848321e-05,
+ "loss": 2.2778,
+ "step": 695
+ },
+ {
+ "epoch": 1.896457765667575,
+ "grad_norm": 9.855324745178223,
+ "learning_rate": 1.2643051771117167e-05,
+ "loss": 2.3657,
+ "step": 696
+ },
+ {
+ "epoch": 1.8991825613079019,
+ "grad_norm": 12.803309440612793,
+ "learning_rate": 1.2661217075386013e-05,
+ "loss": 2.3423,
+ "step": 697
+ },
+ {
+ "epoch": 1.9019073569482288,
+ "grad_norm": 11.03612232208252,
+ "learning_rate": 1.2679382379654861e-05,
+ "loss": 2.583,
+ "step": 698
+ },
+ {
+ "epoch": 1.904632152588556,
+ "grad_norm": 10.573287010192871,
+ "learning_rate": 1.2697547683923707e-05,
+ "loss": 2.5322,
+ "step": 699
+ },
+ {
+ "epoch": 1.9073569482288828,
+ "grad_norm": 11.009425163269043,
+ "learning_rate": 1.2715712988192552e-05,
+ "loss": 2.4336,
+ "step": 700
+ },
+ {
+ "epoch": 1.9100817438692097,
+ "grad_norm": 10.598993301391602,
+ "learning_rate": 1.27338782924614e-05,
+ "loss": 2.2759,
+ "step": 701
+ },
+ {
+ "epoch": 1.9128065395095368,
+ "grad_norm": 10.426955223083496,
+ "learning_rate": 1.2752043596730246e-05,
+ "loss": 2.1611,
+ "step": 702
+ },
+ {
+ "epoch": 1.9155313351498637,
+ "grad_norm": 10.571686744689941,
+ "learning_rate": 1.2770208900999092e-05,
+ "loss": 2.3501,
+ "step": 703
+ },
+ {
+ "epoch": 1.9182561307901906,
+ "grad_norm": 13.263895988464355,
+ "learning_rate": 1.278837420526794e-05,
+ "loss": 2.2925,
+ "step": 704
+ },
+ {
+ "epoch": 1.9209809264305178,
+ "grad_norm": 9.810479164123535,
+ "learning_rate": 1.2806539509536786e-05,
+ "loss": 2.5063,
+ "step": 705
+ },
+ {
+ "epoch": 1.9237057220708447,
+ "grad_norm": 11.980880737304688,
+ "learning_rate": 1.2824704813805632e-05,
+ "loss": 2.4922,
+ "step": 706
+ },
+ {
+ "epoch": 1.9264305177111716,
+ "grad_norm": 11.019759178161621,
+ "learning_rate": 1.284287011807448e-05,
+ "loss": 2.3877,
+ "step": 707
+ },
+ {
+ "epoch": 1.9291553133514987,
+ "grad_norm": 9.92830753326416,
+ "learning_rate": 1.2861035422343325e-05,
+ "loss": 2.0889,
+ "step": 708
+ },
+ {
+ "epoch": 1.9318801089918256,
+ "grad_norm": 12.595752716064453,
+ "learning_rate": 1.287920072661217e-05,
+ "loss": 2.249,
+ "step": 709
+ },
+ {
+ "epoch": 1.9346049046321525,
+ "grad_norm": 12.465704917907715,
+ "learning_rate": 1.2897366030881019e-05,
+ "loss": 2.2461,
+ "step": 710
+ },
+ {
+ "epoch": 1.9373297002724796,
+ "grad_norm": 9.215608596801758,
+ "learning_rate": 1.2915531335149865e-05,
+ "loss": 2.208,
+ "step": 711
+ },
+ {
+ "epoch": 1.9400544959128065,
+ "grad_norm": 9.664246559143066,
+ "learning_rate": 1.2933696639418711e-05,
+ "loss": 2.1519,
+ "step": 712
+ },
+ {
+ "epoch": 1.9427792915531334,
+ "grad_norm": 10.005195617675781,
+ "learning_rate": 1.2951861943687559e-05,
+ "loss": 2.5396,
+ "step": 713
+ },
+ {
+ "epoch": 1.9455040871934606,
+ "grad_norm": 12.706524848937988,
+ "learning_rate": 1.2970027247956405e-05,
+ "loss": 2.3086,
+ "step": 714
+ },
+ {
+ "epoch": 1.9482288828337875,
+ "grad_norm": 10.416522979736328,
+ "learning_rate": 1.2988192552225251e-05,
+ "loss": 2.3281,
+ "step": 715
+ },
+ {
+ "epoch": 1.9509536784741144,
+ "grad_norm": 8.217157363891602,
+ "learning_rate": 1.3006357856494099e-05,
+ "loss": 2.3672,
+ "step": 716
+ },
+ {
+ "epoch": 1.9536784741144415,
+ "grad_norm": 11.214954376220703,
+ "learning_rate": 1.3024523160762943e-05,
+ "loss": 2.2183,
+ "step": 717
+ },
+ {
+ "epoch": 1.9564032697547684,
+ "grad_norm": 11.53817081451416,
+ "learning_rate": 1.304268846503179e-05,
+ "loss": 2.2422,
+ "step": 718
+ },
+ {
+ "epoch": 1.9591280653950953,
+ "grad_norm": 8.654513359069824,
+ "learning_rate": 1.3060853769300636e-05,
+ "loss": 2.4492,
+ "step": 719
+ },
+ {
+ "epoch": 1.9618528610354224,
+ "grad_norm": 12.240690231323242,
+ "learning_rate": 1.3079019073569484e-05,
+ "loss": 2.3838,
+ "step": 720
+ },
+ {
+ "epoch": 1.9645776566757494,
+ "grad_norm": 10.855642318725586,
+ "learning_rate": 1.309718437783833e-05,
+ "loss": 2.4893,
+ "step": 721
+ },
+ {
+ "epoch": 1.9673024523160763,
+ "grad_norm": 10.994941711425781,
+ "learning_rate": 1.3115349682107178e-05,
+ "loss": 2.3906,
+ "step": 722
+ },
+ {
+ "epoch": 1.9700272479564034,
+ "grad_norm": 10.279187202453613,
+ "learning_rate": 1.3133514986376024e-05,
+ "loss": 2.1851,
+ "step": 723
+ },
+ {
+ "epoch": 1.9727520435967303,
+ "grad_norm": 10.290560722351074,
+ "learning_rate": 1.315168029064487e-05,
+ "loss": 2.2305,
+ "step": 724
+ },
+ {
+ "epoch": 1.9754768392370572,
+ "grad_norm": 8.804238319396973,
+ "learning_rate": 1.3169845594913714e-05,
+ "loss": 2.3457,
+ "step": 725
+ },
+ {
+ "epoch": 1.9782016348773843,
+ "grad_norm": 20.067276000976562,
+ "learning_rate": 1.3188010899182562e-05,
+ "loss": 2.3394,
+ "step": 726
+ },
+ {
+ "epoch": 1.9809264305177112,
+ "grad_norm": 8.709736824035645,
+ "learning_rate": 1.3206176203451408e-05,
+ "loss": 2.147,
+ "step": 727
+ },
+ {
+ "epoch": 1.9836512261580381,
+ "grad_norm": 9.862410545349121,
+ "learning_rate": 1.3224341507720255e-05,
+ "loss": 2.3857,
+ "step": 728
+ },
+ {
+ "epoch": 1.9863760217983653,
+ "grad_norm": 13.235732078552246,
+ "learning_rate": 1.3242506811989102e-05,
+ "loss": 2.2124,
+ "step": 729
+ },
+ {
+ "epoch": 1.989100817438692,
+ "grad_norm": 10.813942909240723,
+ "learning_rate": 1.3260672116257949e-05,
+ "loss": 2.5288,
+ "step": 730
+ },
+ {
+ "epoch": 1.991825613079019,
+ "grad_norm": 10.577856063842773,
+ "learning_rate": 1.3278837420526795e-05,
+ "loss": 2.1875,
+ "step": 731
+ },
+ {
+ "epoch": 1.9945504087193462,
+ "grad_norm": 11.54691219329834,
+ "learning_rate": 1.3297002724795643e-05,
+ "loss": 2.4673,
+ "step": 732
+ },
+ {
+ "epoch": 1.9972752043596729,
+ "grad_norm": 11.1182279586792,
+ "learning_rate": 1.3315168029064487e-05,
+ "loss": 2.2476,
+ "step": 733
+ },
+ {
+ "epoch": 2.0,
+ "grad_norm": 10.508315086364746,
+ "learning_rate": 1.3333333333333333e-05,
+ "loss": 2.2329,
+ "step": 734
+ },
+ {
+ "epoch": 2.002724795640327,
+ "grad_norm": 9.416644096374512,
+ "learning_rate": 1.3351498637602181e-05,
+ "loss": 2.3159,
+ "step": 735
+ },
+ {
+ "epoch": 2.005449591280654,
+ "grad_norm": 11.600786209106445,
+ "learning_rate": 1.3369663941871027e-05,
+ "loss": 2.3403,
+ "step": 736
+ },
+ {
+ "epoch": 2.008174386920981,
+ "grad_norm": 10.866864204406738,
+ "learning_rate": 1.3387829246139873e-05,
+ "loss": 2.3638,
+ "step": 737
+ },
+ {
+ "epoch": 2.010899182561308,
+ "grad_norm": 9.856853485107422,
+ "learning_rate": 1.3405994550408721e-05,
+ "loss": 2.1553,
+ "step": 738
+ },
+ {
+ "epoch": 2.0136239782016347,
+ "grad_norm": 12.677173614501953,
+ "learning_rate": 1.3424159854677567e-05,
+ "loss": 2.3608,
+ "step": 739
+ },
+ {
+ "epoch": 2.016348773841962,
+ "grad_norm": 13.566946983337402,
+ "learning_rate": 1.3442325158946414e-05,
+ "loss": 2.2056,
+ "step": 740
+ },
+ {
+ "epoch": 2.019073569482289,
+ "grad_norm": 11.25836181640625,
+ "learning_rate": 1.3460490463215258e-05,
+ "loss": 2.2539,
+ "step": 741
+ },
+ {
+ "epoch": 2.0217983651226157,
+ "grad_norm": 9.697957992553711,
+ "learning_rate": 1.3478655767484106e-05,
+ "loss": 2.1094,
+ "step": 742
+ },
+ {
+ "epoch": 2.024523160762943,
+ "grad_norm": 11.091008186340332,
+ "learning_rate": 1.3496821071752952e-05,
+ "loss": 2.3203,
+ "step": 743
+ },
+ {
+ "epoch": 2.02724795640327,
+ "grad_norm": 8.965106010437012,
+ "learning_rate": 1.35149863760218e-05,
+ "loss": 2.1367,
+ "step": 744
+ },
+ {
+ "epoch": 2.0299727520435966,
+ "grad_norm": 9.569092750549316,
+ "learning_rate": 1.3533151680290646e-05,
+ "loss": 2.2056,
+ "step": 745
+ },
+ {
+ "epoch": 2.0326975476839237,
+ "grad_norm": 11.248583793640137,
+ "learning_rate": 1.3551316984559492e-05,
+ "loss": 2.2119,
+ "step": 746
+ },
+ {
+ "epoch": 2.035422343324251,
+ "grad_norm": 10.267621994018555,
+ "learning_rate": 1.356948228882834e-05,
+ "loss": 2.0845,
+ "step": 747
+ },
+ {
+ "epoch": 2.0381471389645776,
+ "grad_norm": 13.887840270996094,
+ "learning_rate": 1.3587647593097186e-05,
+ "loss": 2.1733,
+ "step": 748
+ },
+ {
+ "epoch": 2.0408719346049047,
+ "grad_norm": 17.721181869506836,
+ "learning_rate": 1.3605812897366032e-05,
+ "loss": 2.3569,
+ "step": 749
+ },
+ {
+ "epoch": 2.043596730245232,
+ "grad_norm": 15.872747421264648,
+ "learning_rate": 1.3623978201634877e-05,
+ "loss": 2.3384,
+ "step": 750
+ },
+ {
+ "epoch": 2.0463215258855585,
+ "grad_norm": 12.283638000488281,
+ "learning_rate": 1.3642143505903725e-05,
+ "loss": 2.1323,
+ "step": 751
+ },
+ {
+ "epoch": 2.0490463215258856,
+ "grad_norm": 11.33743667602539,
+ "learning_rate": 1.3660308810172571e-05,
+ "loss": 2.3105,
+ "step": 752
+ },
+ {
+ "epoch": 2.0517711171662127,
+ "grad_norm": 9.7986421585083,
+ "learning_rate": 1.3678474114441417e-05,
+ "loss": 2.1245,
+ "step": 753
+ },
+ {
+ "epoch": 2.0544959128065394,
+ "grad_norm": 14.31638240814209,
+ "learning_rate": 1.3696639418710265e-05,
+ "loss": 2.5381,
+ "step": 754
+ },
+ {
+ "epoch": 2.0572207084468666,
+ "grad_norm": 10.74636459350586,
+ "learning_rate": 1.3714804722979111e-05,
+ "loss": 2.2754,
+ "step": 755
+ },
+ {
+ "epoch": 2.0599455040871932,
+ "grad_norm": 11.772139549255371,
+ "learning_rate": 1.3732970027247959e-05,
+ "loss": 2.3711,
+ "step": 756
+ },
+ {
+ "epoch": 2.0626702997275204,
+ "grad_norm": 10.804475784301758,
+ "learning_rate": 1.3751135331516805e-05,
+ "loss": 2.3838,
+ "step": 757
+ },
+ {
+ "epoch": 2.0653950953678475,
+ "grad_norm": 11.526287078857422,
+ "learning_rate": 1.376930063578565e-05,
+ "loss": 2.1738,
+ "step": 758
+ },
+ {
+ "epoch": 2.068119891008174,
+ "grad_norm": 11.430591583251953,
+ "learning_rate": 1.3787465940054496e-05,
+ "loss": 2.27,
+ "step": 759
+ },
+ {
+ "epoch": 2.0708446866485013,
+ "grad_norm": 90.60478210449219,
+ "learning_rate": 1.3805631244323344e-05,
+ "loss": 2.106,
+ "step": 760
+ },
+ {
+ "epoch": 2.0735694822888284,
+ "grad_norm": 12.474735260009766,
+ "learning_rate": 1.382379654859219e-05,
+ "loss": 2.2876,
+ "step": 761
+ },
+ {
+ "epoch": 2.076294277929155,
+ "grad_norm": 13.374337196350098,
+ "learning_rate": 1.3841961852861036e-05,
+ "loss": 2.4697,
+ "step": 762
+ },
+ {
+ "epoch": 2.0790190735694822,
+ "grad_norm": 13.265146255493164,
+ "learning_rate": 1.3860127157129884e-05,
+ "loss": 2.2998,
+ "step": 763
+ },
+ {
+ "epoch": 2.0817438692098094,
+ "grad_norm": 11.40599536895752,
+ "learning_rate": 1.387829246139873e-05,
+ "loss": 2.2158,
+ "step": 764
+ },
+ {
+ "epoch": 2.084468664850136,
+ "grad_norm": 12.681764602661133,
+ "learning_rate": 1.3896457765667576e-05,
+ "loss": 2.1958,
+ "step": 765
+ },
+ {
+ "epoch": 2.087193460490463,
+ "grad_norm": 15.120609283447266,
+ "learning_rate": 1.3914623069936422e-05,
+ "loss": 2.582,
+ "step": 766
+ },
+ {
+ "epoch": 2.0899182561307903,
+ "grad_norm": 20.23128318786621,
+ "learning_rate": 1.3932788374205268e-05,
+ "loss": 2.5552,
+ "step": 767
+ },
+ {
+ "epoch": 2.092643051771117,
+ "grad_norm": 20.257232666015625,
+ "learning_rate": 1.3950953678474115e-05,
+ "loss": 2.4346,
+ "step": 768
+ },
+ {
+ "epoch": 2.095367847411444,
+ "grad_norm": 12.688992500305176,
+ "learning_rate": 1.3969118982742963e-05,
+ "loss": 2.1992,
+ "step": 769
+ },
+ {
+ "epoch": 2.0980926430517712,
+ "grad_norm": 14.45832633972168,
+ "learning_rate": 1.3987284287011809e-05,
+ "loss": 2.3193,
+ "step": 770
+ },
+ {
+ "epoch": 2.100817438692098,
+ "grad_norm": 13.274530410766602,
+ "learning_rate": 1.4005449591280655e-05,
+ "loss": 2.2349,
+ "step": 771
+ },
+ {
+ "epoch": 2.103542234332425,
+ "grad_norm": 15.1006441116333,
+ "learning_rate": 1.4023614895549503e-05,
+ "loss": 2.3721,
+ "step": 772
+ },
+ {
+ "epoch": 2.106267029972752,
+ "grad_norm": 12.727002143859863,
+ "learning_rate": 1.4041780199818349e-05,
+ "loss": 2.2393,
+ "step": 773
+ },
+ {
+ "epoch": 2.108991825613079,
+ "grad_norm": 15.004621505737305,
+ "learning_rate": 1.4059945504087195e-05,
+ "loss": 2.2686,
+ "step": 774
+ },
+ {
+ "epoch": 2.111716621253406,
+ "grad_norm": 13.299857139587402,
+ "learning_rate": 1.407811080835604e-05,
+ "loss": 2.334,
+ "step": 775
+ },
+ {
+ "epoch": 2.114441416893733,
+ "grad_norm": 14.570548057556152,
+ "learning_rate": 1.4096276112624887e-05,
+ "loss": 2.208,
+ "step": 776
+ },
+ {
+ "epoch": 2.11716621253406,
+ "grad_norm": 10.870620727539062,
+ "learning_rate": 1.4114441416893733e-05,
+ "loss": 2.2275,
+ "step": 777
+ },
+ {
+ "epoch": 2.119891008174387,
+ "grad_norm": 11.548524856567383,
+ "learning_rate": 1.4132606721162581e-05,
+ "loss": 2.1538,
+ "step": 778
+ },
+ {
+ "epoch": 2.122615803814714,
+ "grad_norm": 10.89322280883789,
+ "learning_rate": 1.4150772025431428e-05,
+ "loss": 2.3955,
+ "step": 779
+ },
+ {
+ "epoch": 2.1253405994550407,
+ "grad_norm": 13.28118896484375,
+ "learning_rate": 1.4168937329700274e-05,
+ "loss": 2.3999,
+ "step": 780
+ },
+ {
+ "epoch": 2.128065395095368,
+ "grad_norm": 13.44669246673584,
+ "learning_rate": 1.4187102633969122e-05,
+ "loss": 2.2476,
+ "step": 781
+ },
+ {
+ "epoch": 2.130790190735695,
+ "grad_norm": 13.213591575622559,
+ "learning_rate": 1.4205267938237968e-05,
+ "loss": 2.0225,
+ "step": 782
+ },
+ {
+ "epoch": 2.1335149863760217,
+ "grad_norm": 11.242518424987793,
+ "learning_rate": 1.4223433242506812e-05,
+ "loss": 2.3213,
+ "step": 783
+ },
+ {
+ "epoch": 2.136239782016349,
+ "grad_norm": 11.51584243774414,
+ "learning_rate": 1.4241598546775658e-05,
+ "loss": 2.2988,
+ "step": 784
+ },
+ {
+ "epoch": 2.138964577656676,
+ "grad_norm": 13.992745399475098,
+ "learning_rate": 1.4259763851044506e-05,
+ "loss": 2.3643,
+ "step": 785
+ },
+ {
+ "epoch": 2.1416893732970026,
+ "grad_norm": 12.655274391174316,
+ "learning_rate": 1.4277929155313352e-05,
+ "loss": 2.5439,
+ "step": 786
+ },
+ {
+ "epoch": 2.1444141689373297,
+ "grad_norm": 12.481905937194824,
+ "learning_rate": 1.4296094459582198e-05,
+ "loss": 2.2559,
+ "step": 787
+ },
+ {
+ "epoch": 2.147138964577657,
+ "grad_norm": 15.663750648498535,
+ "learning_rate": 1.4314259763851046e-05,
+ "loss": 2.311,
+ "step": 788
+ },
+ {
+ "epoch": 2.1498637602179835,
+ "grad_norm": 12.196157455444336,
+ "learning_rate": 1.4332425068119893e-05,
+ "loss": 2.1567,
+ "step": 789
+ },
+ {
+ "epoch": 2.1525885558583107,
+ "grad_norm": 11.681686401367188,
+ "learning_rate": 1.435059037238874e-05,
+ "loss": 2.4229,
+ "step": 790
+ },
+ {
+ "epoch": 2.155313351498638,
+ "grad_norm": 9.554698944091797,
+ "learning_rate": 1.4368755676657585e-05,
+ "loss": 2.0493,
+ "step": 791
+ },
+ {
+ "epoch": 2.1580381471389645,
+ "grad_norm": 11.352317810058594,
+ "learning_rate": 1.4386920980926431e-05,
+ "loss": 2.4033,
+ "step": 792
+ },
+ {
+ "epoch": 2.1607629427792916,
+ "grad_norm": 9.571414947509766,
+ "learning_rate": 1.4405086285195277e-05,
+ "loss": 2.2031,
+ "step": 793
+ },
+ {
+ "epoch": 2.1634877384196187,
+ "grad_norm": 14.849584579467773,
+ "learning_rate": 1.4423251589464125e-05,
+ "loss": 2.0972,
+ "step": 794
+ },
+ {
+ "epoch": 2.1662125340599454,
+ "grad_norm": 11.889425277709961,
+ "learning_rate": 1.4441416893732971e-05,
+ "loss": 2.1924,
+ "step": 795
+ },
+ {
+ "epoch": 2.1689373297002725,
+ "grad_norm": 10.594819068908691,
+ "learning_rate": 1.4459582198001817e-05,
+ "loss": 2.1279,
+ "step": 796
+ },
+ {
+ "epoch": 2.1716621253405997,
+ "grad_norm": 14.0387544631958,
+ "learning_rate": 1.4477747502270665e-05,
+ "loss": 2.4731,
+ "step": 797
+ },
+ {
+ "epoch": 2.1743869209809263,
+ "grad_norm": 12.90074348449707,
+ "learning_rate": 1.4495912806539511e-05,
+ "loss": 2.4609,
+ "step": 798
+ },
+ {
+ "epoch": 2.1771117166212535,
+ "grad_norm": 11.694089889526367,
+ "learning_rate": 1.4514078110808356e-05,
+ "loss": 2.1475,
+ "step": 799
+ },
+ {
+ "epoch": 2.1798365122615806,
+ "grad_norm": 12.369209289550781,
+ "learning_rate": 1.4532243415077204e-05,
+ "loss": 2.2612,
+ "step": 800
+ },
+ {
+ "epoch": 2.1825613079019073,
+ "grad_norm": 16.08076286315918,
+ "learning_rate": 1.455040871934605e-05,
+ "loss": 2.3594,
+ "step": 801
+ },
+ {
+ "epoch": 2.1852861035422344,
+ "grad_norm": 12.111376762390137,
+ "learning_rate": 1.4568574023614896e-05,
+ "loss": 2.2886,
+ "step": 802
+ },
+ {
+ "epoch": 2.1880108991825615,
+ "grad_norm": 9.426592826843262,
+ "learning_rate": 1.4586739327883744e-05,
+ "loss": 1.9961,
+ "step": 803
+ },
+ {
+ "epoch": 2.190735694822888,
+ "grad_norm": 19.973569869995117,
+ "learning_rate": 1.460490463215259e-05,
+ "loss": 2.3408,
+ "step": 804
+ },
+ {
+ "epoch": 2.1934604904632153,
+ "grad_norm": 8.401344299316406,
+ "learning_rate": 1.4623069936421436e-05,
+ "loss": 2.0479,
+ "step": 805
+ },
+ {
+ "epoch": 2.1961852861035425,
+ "grad_norm": 9.423659324645996,
+ "learning_rate": 1.4641235240690284e-05,
+ "loss": 2.0825,
+ "step": 806
+ },
+ {
+ "epoch": 2.198910081743869,
+ "grad_norm": 11.838205337524414,
+ "learning_rate": 1.465940054495913e-05,
+ "loss": 2.3599,
+ "step": 807
+ },
+ {
+ "epoch": 2.2016348773841963,
+ "grad_norm": 12.468666076660156,
+ "learning_rate": 1.4677565849227975e-05,
+ "loss": 2.2124,
+ "step": 808
+ },
+ {
+ "epoch": 2.204359673024523,
+ "grad_norm": 15.283005714416504,
+ "learning_rate": 1.469573115349682e-05,
+ "loss": 2.1201,
+ "step": 809
+ },
+ {
+ "epoch": 2.20708446866485,
+ "grad_norm": 12.136519432067871,
+ "learning_rate": 1.4713896457765669e-05,
+ "loss": 2.3779,
+ "step": 810
+ },
+ {
+ "epoch": 2.209809264305177,
+ "grad_norm": 9.63491439819336,
+ "learning_rate": 1.4732061762034515e-05,
+ "loss": 2.0181,
+ "step": 811
+ },
+ {
+ "epoch": 2.212534059945504,
+ "grad_norm": 11.01519775390625,
+ "learning_rate": 1.4750227066303363e-05,
+ "loss": 1.9985,
+ "step": 812
+ },
+ {
+ "epoch": 2.215258855585831,
+ "grad_norm": 10.398948669433594,
+ "learning_rate": 1.4768392370572209e-05,
+ "loss": 2.2524,
+ "step": 813
+ },
+ {
+ "epoch": 2.217983651226158,
+ "grad_norm": 10.20798110961914,
+ "learning_rate": 1.4786557674841055e-05,
+ "loss": 2.0015,
+ "step": 814
+ },
+ {
+ "epoch": 2.220708446866485,
+ "grad_norm": 12.424089431762695,
+ "learning_rate": 1.4804722979109903e-05,
+ "loss": 2.355,
+ "step": 815
+ },
+ {
+ "epoch": 2.223433242506812,
+ "grad_norm": 12.882838249206543,
+ "learning_rate": 1.4822888283378747e-05,
+ "loss": 2.2236,
+ "step": 816
+ },
+ {
+ "epoch": 2.226158038147139,
+ "grad_norm": 13.038334846496582,
+ "learning_rate": 1.4841053587647594e-05,
+ "loss": 2.5132,
+ "step": 817
+ },
+ {
+ "epoch": 2.2288828337874658,
+ "grad_norm": 10.221287727355957,
+ "learning_rate": 1.485921889191644e-05,
+ "loss": 2.1704,
+ "step": 818
+ },
+ {
+ "epoch": 2.231607629427793,
+ "grad_norm": 13.483091354370117,
+ "learning_rate": 1.4877384196185288e-05,
+ "loss": 2.519,
+ "step": 819
+ },
+ {
+ "epoch": 2.23433242506812,
+ "grad_norm": 12.316015243530273,
+ "learning_rate": 1.4895549500454134e-05,
+ "loss": 2.144,
+ "step": 820
+ },
+ {
+ "epoch": 2.2370572207084467,
+ "grad_norm": 10.261295318603516,
+ "learning_rate": 1.4913714804722982e-05,
+ "loss": 2.186,
+ "step": 821
+ },
+ {
+ "epoch": 2.239782016348774,
+ "grad_norm": 11.669163703918457,
+ "learning_rate": 1.4931880108991828e-05,
+ "loss": 2.166,
+ "step": 822
+ },
+ {
+ "epoch": 2.242506811989101,
+ "grad_norm": 12.902145385742188,
+ "learning_rate": 1.4950045413260674e-05,
+ "loss": 2.2456,
+ "step": 823
+ },
+ {
+ "epoch": 2.2452316076294276,
+ "grad_norm": 11.576069831848145,
+ "learning_rate": 1.4968210717529518e-05,
+ "loss": 2.2324,
+ "step": 824
+ },
+ {
+ "epoch": 2.2479564032697548,
+ "grad_norm": 11.665193557739258,
+ "learning_rate": 1.4986376021798366e-05,
+ "loss": 2.0337,
+ "step": 825
+ },
+ {
+ "epoch": 2.250681198910082,
+ "grad_norm": 11.684881210327148,
+ "learning_rate": 1.5004541326067212e-05,
+ "loss": 2.3325,
+ "step": 826
+ },
+ {
+ "epoch": 2.2534059945504086,
+ "grad_norm": 10.821648597717285,
+ "learning_rate": 1.5022706630336059e-05,
+ "loss": 2.1533,
+ "step": 827
+ },
+ {
+ "epoch": 2.2561307901907357,
+ "grad_norm": 12.104910850524902,
+ "learning_rate": 1.5040871934604906e-05,
+ "loss": 2.104,
+ "step": 828
+ },
+ {
+ "epoch": 2.258855585831063,
+ "grad_norm": 15.326925277709961,
+ "learning_rate": 1.5059037238873753e-05,
+ "loss": 2.1938,
+ "step": 829
+ },
+ {
+ "epoch": 2.2615803814713895,
+ "grad_norm": 15.872440338134766,
+ "learning_rate": 1.5077202543142599e-05,
+ "loss": 2.0366,
+ "step": 830
+ },
+ {
+ "epoch": 2.2643051771117166,
+ "grad_norm": 19.063030242919922,
+ "learning_rate": 1.5095367847411447e-05,
+ "loss": 2.4019,
+ "step": 831
+ },
+ {
+ "epoch": 2.2670299727520438,
+ "grad_norm": 14.302577018737793,
+ "learning_rate": 1.5113533151680291e-05,
+ "loss": 2.2896,
+ "step": 832
+ },
+ {
+ "epoch": 2.2697547683923704,
+ "grad_norm": 9.565779685974121,
+ "learning_rate": 1.5131698455949137e-05,
+ "loss": 2.2368,
+ "step": 833
+ },
+ {
+ "epoch": 2.2724795640326976,
+ "grad_norm": 10.099272727966309,
+ "learning_rate": 1.5149863760217985e-05,
+ "loss": 2.2588,
+ "step": 834
+ },
+ {
+ "epoch": 2.2752043596730247,
+ "grad_norm": 10.54786491394043,
+ "learning_rate": 1.5168029064486831e-05,
+ "loss": 1.916,
+ "step": 835
+ },
+ {
+ "epoch": 2.2779291553133514,
+ "grad_norm": 8.687639236450195,
+ "learning_rate": 1.5186194368755677e-05,
+ "loss": 2.1084,
+ "step": 836
+ },
+ {
+ "epoch": 2.2806539509536785,
+ "grad_norm": 10.300875663757324,
+ "learning_rate": 1.5204359673024525e-05,
+ "loss": 2.4204,
+ "step": 837
+ },
+ {
+ "epoch": 2.2833787465940056,
+ "grad_norm": 10.761526107788086,
+ "learning_rate": 1.5222524977293371e-05,
+ "loss": 2.1538,
+ "step": 838
+ },
+ {
+ "epoch": 2.2861035422343323,
+ "grad_norm": 10.05339527130127,
+ "learning_rate": 1.5240690281562218e-05,
+ "loss": 2.1846,
+ "step": 839
+ },
+ {
+ "epoch": 2.2888283378746594,
+ "grad_norm": 10.227608680725098,
+ "learning_rate": 1.5258855585831064e-05,
+ "loss": 2.2031,
+ "step": 840
+ },
+ {
+ "epoch": 2.291553133514986,
+ "grad_norm": 9.570499420166016,
+ "learning_rate": 1.5277020890099908e-05,
+ "loss": 1.9465,
+ "step": 841
+ },
+ {
+ "epoch": 2.2942779291553133,
+ "grad_norm": 11.354101181030273,
+ "learning_rate": 1.5295186194368756e-05,
+ "loss": 2.1499,
+ "step": 842
+ },
+ {
+ "epoch": 2.2970027247956404,
+ "grad_norm": 11.209668159484863,
+ "learning_rate": 1.5313351498637604e-05,
+ "loss": 2.1768,
+ "step": 843
+ },
+ {
+ "epoch": 2.299727520435967,
+ "grad_norm": 14.012726783752441,
+ "learning_rate": 1.533151680290645e-05,
+ "loss": 2.4834,
+ "step": 844
+ },
+ {
+ "epoch": 2.302452316076294,
+ "grad_norm": 13.252918243408203,
+ "learning_rate": 1.5349682107175296e-05,
+ "loss": 2.4282,
+ "step": 845
+ },
+ {
+ "epoch": 2.3051771117166213,
+ "grad_norm": 13.012864112854004,
+ "learning_rate": 1.5367847411444144e-05,
+ "loss": 2.0635,
+ "step": 846
+ },
+ {
+ "epoch": 2.307901907356948,
+ "grad_norm": 10.489202499389648,
+ "learning_rate": 1.538601271571299e-05,
+ "loss": 2.0771,
+ "step": 847
+ },
+ {
+ "epoch": 2.310626702997275,
+ "grad_norm": 9.56246280670166,
+ "learning_rate": 1.5404178019981836e-05,
+ "loss": 2.0532,
+ "step": 848
+ },
+ {
+ "epoch": 2.3133514986376023,
+ "grad_norm": 11.222508430480957,
+ "learning_rate": 1.542234332425068e-05,
+ "loss": 2.3257,
+ "step": 849
+ },
+ {
+ "epoch": 2.316076294277929,
+ "grad_norm": 14.687914848327637,
+ "learning_rate": 1.544050862851953e-05,
+ "loss": 2.3257,
+ "step": 850
+ },
+ {
+ "epoch": 2.318801089918256,
+ "grad_norm": 12.809759140014648,
+ "learning_rate": 1.5458673932788377e-05,
+ "loss": 2.2896,
+ "step": 851
+ },
+ {
+ "epoch": 2.321525885558583,
+ "grad_norm": 10.033246994018555,
+ "learning_rate": 1.547683923705722e-05,
+ "loss": 2.1733,
+ "step": 852
+ },
+ {
+ "epoch": 2.32425068119891,
+ "grad_norm": 10.335433959960938,
+ "learning_rate": 1.549500454132607e-05,
+ "loss": 2.0479,
+ "step": 853
+ },
+ {
+ "epoch": 2.326975476839237,
+ "grad_norm": 14.753990173339844,
+ "learning_rate": 1.5513169845594917e-05,
+ "loss": 2.082,
+ "step": 854
+ },
+ {
+ "epoch": 2.329700272479564,
+ "grad_norm": 10.427779197692871,
+ "learning_rate": 1.553133514986376e-05,
+ "loss": 2.1675,
+ "step": 855
+ },
+ {
+ "epoch": 2.332425068119891,
+ "grad_norm": 11.808363914489746,
+ "learning_rate": 1.554950045413261e-05,
+ "loss": 2.1299,
+ "step": 856
+ },
+ {
+ "epoch": 2.335149863760218,
+ "grad_norm": 12.636821746826172,
+ "learning_rate": 1.5567665758401454e-05,
+ "loss": 2.3027,
+ "step": 857
+ },
+ {
+ "epoch": 2.337874659400545,
+ "grad_norm": 10.85216999053955,
+ "learning_rate": 1.55858310626703e-05,
+ "loss": 2.1714,
+ "step": 858
+ },
+ {
+ "epoch": 2.3405994550408717,
+ "grad_norm": 14.7868070602417,
+ "learning_rate": 1.5603996366939146e-05,
+ "loss": 2.2993,
+ "step": 859
+ },
+ {
+ "epoch": 2.343324250681199,
+ "grad_norm": 13.12626838684082,
+ "learning_rate": 1.5622161671207994e-05,
+ "loss": 2.3159,
+ "step": 860
+ },
+ {
+ "epoch": 2.346049046321526,
+ "grad_norm": 27.119937896728516,
+ "learning_rate": 1.564032697547684e-05,
+ "loss": 2.1138,
+ "step": 861
+ },
+ {
+ "epoch": 2.3487738419618527,
+ "grad_norm": 11.369824409484863,
+ "learning_rate": 1.5658492279745686e-05,
+ "loss": 2.1289,
+ "step": 862
+ },
+ {
+ "epoch": 2.35149863760218,
+ "grad_norm": 11.388385772705078,
+ "learning_rate": 1.5676657584014534e-05,
+ "loss": 2.125,
+ "step": 863
+ },
+ {
+ "epoch": 2.354223433242507,
+ "grad_norm": 9.750898361206055,
+ "learning_rate": 1.5694822888283382e-05,
+ "loss": 1.9927,
+ "step": 864
+ },
+ {
+ "epoch": 2.3569482288828336,
+ "grad_norm": 13.13124942779541,
+ "learning_rate": 1.5712988192552226e-05,
+ "loss": 2.062,
+ "step": 865
+ },
+ {
+ "epoch": 2.3596730245231607,
+ "grad_norm": 11.438236236572266,
+ "learning_rate": 1.573115349682107e-05,
+ "loss": 2.0923,
+ "step": 866
+ },
+ {
+ "epoch": 2.362397820163488,
+ "grad_norm": 12.381810188293457,
+ "learning_rate": 1.574931880108992e-05,
+ "loss": 2.1172,
+ "step": 867
+ },
+ {
+ "epoch": 2.3651226158038146,
+ "grad_norm": 12.36788558959961,
+ "learning_rate": 1.5767484105358766e-05,
+ "loss": 2.3823,
+ "step": 868
+ },
+ {
+ "epoch": 2.3678474114441417,
+ "grad_norm": 11.918746948242188,
+ "learning_rate": 1.578564940962761e-05,
+ "loss": 2.3428,
+ "step": 869
+ },
+ {
+ "epoch": 2.370572207084469,
+ "grad_norm": 11.873290061950684,
+ "learning_rate": 1.580381471389646e-05,
+ "loss": 1.9648,
+ "step": 870
+ },
+ {
+ "epoch": 2.3732970027247955,
+ "grad_norm": 9.237068176269531,
+ "learning_rate": 1.5821980018165307e-05,
+ "loss": 2.1528,
+ "step": 871
+ },
+ {
+ "epoch": 2.3760217983651226,
+ "grad_norm": 11.43176555633545,
+ "learning_rate": 1.5840145322434154e-05,
+ "loss": 2.3501,
+ "step": 872
+ },
+ {
+ "epoch": 2.3787465940054497,
+ "grad_norm": 11.239076614379883,
+ "learning_rate": 1.5858310626703e-05,
+ "loss": 2.1973,
+ "step": 873
+ },
+ {
+ "epoch": 2.3814713896457764,
+ "grad_norm": 9.229157447814941,
+ "learning_rate": 1.5876475930971843e-05,
+ "loss": 2.1504,
+ "step": 874
+ },
+ {
+ "epoch": 2.3841961852861036,
+ "grad_norm": 10.20166301727295,
+ "learning_rate": 1.589464123524069e-05,
+ "loss": 1.9539,
+ "step": 875
+ },
+ {
+ "epoch": 2.3869209809264307,
+ "grad_norm": 13.474658012390137,
+ "learning_rate": 1.591280653950954e-05,
+ "loss": 2.1465,
+ "step": 876
+ },
+ {
+ "epoch": 2.3896457765667574,
+ "grad_norm": 9.529938697814941,
+ "learning_rate": 1.5930971843778384e-05,
+ "loss": 2.1045,
+ "step": 877
+ },
+ {
+ "epoch": 2.3923705722070845,
+ "grad_norm": 9.707219123840332,
+ "learning_rate": 1.594913714804723e-05,
+ "loss": 2.0859,
+ "step": 878
+ },
+ {
+ "epoch": 2.3950953678474116,
+ "grad_norm": 10.575519561767578,
+ "learning_rate": 1.596730245231608e-05,
+ "loss": 2.3926,
+ "step": 879
+ },
+ {
+ "epoch": 2.3978201634877383,
+ "grad_norm": 9.208884239196777,
+ "learning_rate": 1.5985467756584924e-05,
+ "loss": 2.2114,
+ "step": 880
+ },
+ {
+ "epoch": 2.4005449591280654,
+ "grad_norm": 11.017399787902832,
+ "learning_rate": 1.600363306085377e-05,
+ "loss": 2.4048,
+ "step": 881
+ },
+ {
+ "epoch": 2.4032697547683926,
+ "grad_norm": 11.70709228515625,
+ "learning_rate": 1.6021798365122616e-05,
+ "loss": 2.1816,
+ "step": 882
+ },
+ {
+ "epoch": 2.4059945504087192,
+ "grad_norm": 13.651061058044434,
+ "learning_rate": 1.6039963669391464e-05,
+ "loss": 2.0396,
+ "step": 883
+ },
+ {
+ "epoch": 2.4087193460490464,
+ "grad_norm": 12.736273765563965,
+ "learning_rate": 1.605812897366031e-05,
+ "loss": 2.397,
+ "step": 884
+ },
+ {
+ "epoch": 2.4114441416893735,
+ "grad_norm": 10.983773231506348,
+ "learning_rate": 1.6076294277929156e-05,
+ "loss": 2.0938,
+ "step": 885
+ },
+ {
+ "epoch": 2.4141689373297,
+ "grad_norm": 10.832428932189941,
+ "learning_rate": 1.6094459582198004e-05,
+ "loss": 2.0327,
+ "step": 886
+ },
+ {
+ "epoch": 2.4168937329700273,
+ "grad_norm": 11.225357055664062,
+ "learning_rate": 1.611262488646685e-05,
+ "loss": 1.9614,
+ "step": 887
+ },
+ {
+ "epoch": 2.4196185286103544,
+ "grad_norm": 12.462913513183594,
+ "learning_rate": 1.6130790190735696e-05,
+ "loss": 2.0,
+ "step": 888
+ },
+ {
+ "epoch": 2.422343324250681,
+ "grad_norm": 10.41214370727539,
+ "learning_rate": 1.6148955495004544e-05,
+ "loss": 2.1411,
+ "step": 889
+ },
+ {
+ "epoch": 2.4250681198910082,
+ "grad_norm": 11.749297142028809,
+ "learning_rate": 1.616712079927339e-05,
+ "loss": 2.25,
+ "step": 890
+ },
+ {
+ "epoch": 2.4277929155313354,
+ "grad_norm": 11.546613693237305,
+ "learning_rate": 1.6185286103542233e-05,
+ "loss": 2.0762,
+ "step": 891
+ },
+ {
+ "epoch": 2.430517711171662,
+ "grad_norm": 11.366194725036621,
+ "learning_rate": 1.620345140781108e-05,
+ "loss": 2.2031,
+ "step": 892
+ },
+ {
+ "epoch": 2.433242506811989,
+ "grad_norm": 13.148904800415039,
+ "learning_rate": 1.622161671207993e-05,
+ "loss": 2.1274,
+ "step": 893
+ },
+ {
+ "epoch": 2.4359673024523163,
+ "grad_norm": 21.143726348876953,
+ "learning_rate": 1.6239782016348777e-05,
+ "loss": 2.1182,
+ "step": 894
+ },
+ {
+ "epoch": 2.438692098092643,
+ "grad_norm": 11.426177978515625,
+ "learning_rate": 1.625794732061762e-05,
+ "loss": 2.2329,
+ "step": 895
+ },
+ {
+ "epoch": 2.44141689373297,
+ "grad_norm": 11.629473686218262,
+ "learning_rate": 1.627611262488647e-05,
+ "loss": 2.1201,
+ "step": 896
+ },
+ {
+ "epoch": 2.4441416893732972,
+ "grad_norm": 12.553741455078125,
+ "learning_rate": 1.6294277929155317e-05,
+ "loss": 2.1685,
+ "step": 897
+ },
+ {
+ "epoch": 2.446866485013624,
+ "grad_norm": 10.176178932189941,
+ "learning_rate": 1.631244323342416e-05,
+ "loss": 2.0972,
+ "step": 898
+ },
+ {
+ "epoch": 2.449591280653951,
+ "grad_norm": 12.827268600463867,
+ "learning_rate": 1.6330608537693006e-05,
+ "loss": 2.3735,
+ "step": 899
+ },
+ {
+ "epoch": 2.452316076294278,
+ "grad_norm": 17.78833770751953,
+ "learning_rate": 1.6348773841961854e-05,
+ "loss": 1.9966,
+ "step": 900
+ },
+ {
+ "epoch": 2.455040871934605,
+ "grad_norm": 10.53470516204834,
+ "learning_rate": 1.63669391462307e-05,
+ "loss": 2.2173,
+ "step": 901
+ },
+ {
+ "epoch": 2.457765667574932,
+ "grad_norm": 12.696940422058105,
+ "learning_rate": 1.6385104450499546e-05,
+ "loss": 2.1294,
+ "step": 902
+ },
+ {
+ "epoch": 2.460490463215259,
+ "grad_norm": 10.315053939819336,
+ "learning_rate": 1.6403269754768394e-05,
+ "loss": 2.0537,
+ "step": 903
+ },
+ {
+ "epoch": 2.463215258855586,
+ "grad_norm": 10.008761405944824,
+ "learning_rate": 1.6421435059037242e-05,
+ "loss": 2.2856,
+ "step": 904
+ },
+ {
+ "epoch": 2.465940054495913,
+ "grad_norm": 11.975059509277344,
+ "learning_rate": 1.6439600363306086e-05,
+ "loss": 2.105,
+ "step": 905
+ },
+ {
+ "epoch": 2.4686648501362396,
+ "grad_norm": 12.422130584716797,
+ "learning_rate": 1.6457765667574934e-05,
+ "loss": 2.2124,
+ "step": 906
+ },
+ {
+ "epoch": 2.4713896457765667,
+ "grad_norm": 11.444618225097656,
+ "learning_rate": 1.647593097184378e-05,
+ "loss": 2.1665,
+ "step": 907
+ },
+ {
+ "epoch": 2.474114441416894,
+ "grad_norm": 13.179655075073242,
+ "learning_rate": 1.6494096276112626e-05,
+ "loss": 2.6147,
+ "step": 908
+ },
+ {
+ "epoch": 2.4768392370572205,
+ "grad_norm": 10.262988090515137,
+ "learning_rate": 1.651226158038147e-05,
+ "loss": 2.4829,
+ "step": 909
+ },
+ {
+ "epoch": 2.4795640326975477,
+ "grad_norm": 9.67646598815918,
+ "learning_rate": 1.653042688465032e-05,
+ "loss": 2.0737,
+ "step": 910
+ },
+ {
+ "epoch": 2.482288828337875,
+ "grad_norm": 8.827295303344727,
+ "learning_rate": 1.6548592188919167e-05,
+ "loss": 1.8481,
+ "step": 911
+ },
+ {
+ "epoch": 2.4850136239782015,
+ "grad_norm": 9.027557373046875,
+ "learning_rate": 1.656675749318801e-05,
+ "loss": 2.3447,
+ "step": 912
+ },
+ {
+ "epoch": 2.4877384196185286,
+ "grad_norm": 13.08642292022705,
+ "learning_rate": 1.658492279745686e-05,
+ "loss": 2.3794,
+ "step": 913
+ },
+ {
+ "epoch": 2.4904632152588557,
+ "grad_norm": 14.326387405395508,
+ "learning_rate": 1.6603088101725707e-05,
+ "loss": 2.0713,
+ "step": 914
+ },
+ {
+ "epoch": 2.4931880108991824,
+ "grad_norm": 10.7723970413208,
+ "learning_rate": 1.662125340599455e-05,
+ "loss": 2.2383,
+ "step": 915
+ },
+ {
+ "epoch": 2.4959128065395095,
+ "grad_norm": 11.671551704406738,
+ "learning_rate": 1.66394187102634e-05,
+ "loss": 2.3242,
+ "step": 916
+ },
+ {
+ "epoch": 2.4986376021798367,
+ "grad_norm": 9.647505760192871,
+ "learning_rate": 1.6657584014532244e-05,
+ "loss": 2.1035,
+ "step": 917
+ },
+ {
+ "epoch": 2.5013623978201633,
+ "grad_norm": 10.872794151306152,
+ "learning_rate": 1.667574931880109e-05,
+ "loss": 2.1948,
+ "step": 918
+ },
+ {
+ "epoch": 2.5040871934604905,
+ "grad_norm": 11.074483871459961,
+ "learning_rate": 1.669391462306994e-05,
+ "loss": 2.0283,
+ "step": 919
+ },
+ {
+ "epoch": 2.5068119891008176,
+ "grad_norm": 10.048798561096191,
+ "learning_rate": 1.6712079927338784e-05,
+ "loss": 2.1079,
+ "step": 920
+ },
+ {
+ "epoch": 2.5095367847411443,
+ "grad_norm": 16.10767936706543,
+ "learning_rate": 1.673024523160763e-05,
+ "loss": 2.3203,
+ "step": 921
+ },
+ {
+ "epoch": 2.5122615803814714,
+ "grad_norm": 10.057881355285645,
+ "learning_rate": 1.674841053587648e-05,
+ "loss": 1.9272,
+ "step": 922
+ },
+ {
+ "epoch": 2.5149863760217985,
+ "grad_norm": 10.424790382385254,
+ "learning_rate": 1.6766575840145324e-05,
+ "loss": 1.8945,
+ "step": 923
+ },
+ {
+ "epoch": 2.517711171662125,
+ "grad_norm": 8.450881958007812,
+ "learning_rate": 1.678474114441417e-05,
+ "loss": 2.0601,
+ "step": 924
+ },
+ {
+ "epoch": 2.5204359673024523,
+ "grad_norm": 8.487282752990723,
+ "learning_rate": 1.6802906448683016e-05,
+ "loss": 1.9404,
+ "step": 925
+ },
+ {
+ "epoch": 2.523160762942779,
+ "grad_norm": 12.343279838562012,
+ "learning_rate": 1.6821071752951864e-05,
+ "loss": 2.1753,
+ "step": 926
+ },
+ {
+ "epoch": 2.525885558583106,
+ "grad_norm": 10.701006889343262,
+ "learning_rate": 1.683923705722071e-05,
+ "loss": 2.0884,
+ "step": 927
+ },
+ {
+ "epoch": 2.5286103542234333,
+ "grad_norm": 12.124945640563965,
+ "learning_rate": 1.6857402361489556e-05,
+ "loss": 2.2012,
+ "step": 928
+ },
+ {
+ "epoch": 2.53133514986376,
+ "grad_norm": 12.241605758666992,
+ "learning_rate": 1.6875567665758404e-05,
+ "loss": 2.0977,
+ "step": 929
+ },
+ {
+ "epoch": 2.534059945504087,
+ "grad_norm": 12.198929786682129,
+ "learning_rate": 1.689373297002725e-05,
+ "loss": 2.1514,
+ "step": 930
+ },
+ {
+ "epoch": 2.536784741144414,
+ "grad_norm": 10.598546028137207,
+ "learning_rate": 1.6911898274296097e-05,
+ "loss": 2.1274,
+ "step": 931
+ },
+ {
+ "epoch": 2.539509536784741,
+ "grad_norm": 10.838115692138672,
+ "learning_rate": 1.693006357856494e-05,
+ "loss": 2.1362,
+ "step": 932
+ },
+ {
+ "epoch": 2.542234332425068,
+ "grad_norm": 12.07777214050293,
+ "learning_rate": 1.694822888283379e-05,
+ "loss": 2.1733,
+ "step": 933
+ },
+ {
+ "epoch": 2.544959128065395,
+ "grad_norm": 12.838855743408203,
+ "learning_rate": 1.6966394187102633e-05,
+ "loss": 2.3003,
+ "step": 934
+ },
+ {
+ "epoch": 2.547683923705722,
+ "grad_norm": 15.405717849731445,
+ "learning_rate": 1.698455949137148e-05,
+ "loss": 2.0708,
+ "step": 935
+ },
+ {
+ "epoch": 2.550408719346049,
+ "grad_norm": 12.793071746826172,
+ "learning_rate": 1.700272479564033e-05,
+ "loss": 2.1646,
+ "step": 936
+ },
+ {
+ "epoch": 2.553133514986376,
+ "grad_norm": 13.155274391174316,
+ "learning_rate": 1.7020890099909177e-05,
+ "loss": 1.9976,
+ "step": 937
+ },
+ {
+ "epoch": 2.5558583106267028,
+ "grad_norm": 11.268887519836426,
+ "learning_rate": 1.703905540417802e-05,
+ "loss": 2.2085,
+ "step": 938
+ },
+ {
+ "epoch": 2.55858310626703,
+ "grad_norm": 10.742142677307129,
+ "learning_rate": 1.705722070844687e-05,
+ "loss": 2.3872,
+ "step": 939
+ },
+ {
+ "epoch": 2.561307901907357,
+ "grad_norm": 9.933159828186035,
+ "learning_rate": 1.7075386012715714e-05,
+ "loss": 2.1978,
+ "step": 940
+ },
+ {
+ "epoch": 2.5640326975476837,
+ "grad_norm": 13.011128425598145,
+ "learning_rate": 1.709355131698456e-05,
+ "loss": 2.3154,
+ "step": 941
+ },
+ {
+ "epoch": 2.566757493188011,
+ "grad_norm": 11.067089080810547,
+ "learning_rate": 1.7111716621253406e-05,
+ "loss": 2.207,
+ "step": 942
+ },
+ {
+ "epoch": 2.569482288828338,
+ "grad_norm": 9.70608139038086,
+ "learning_rate": 1.7129881925522254e-05,
+ "loss": 2.1768,
+ "step": 943
+ },
+ {
+ "epoch": 2.5722070844686646,
+ "grad_norm": 11.981213569641113,
+ "learning_rate": 1.7148047229791102e-05,
+ "loss": 2.0952,
+ "step": 944
+ },
+ {
+ "epoch": 2.5749318801089918,
+ "grad_norm": 12.573433876037598,
+ "learning_rate": 1.7166212534059946e-05,
+ "loss": 2.2168,
+ "step": 945
+ },
+ {
+ "epoch": 2.577656675749319,
+ "grad_norm": 12.08493423461914,
+ "learning_rate": 1.7184377838328794e-05,
+ "loss": 1.9185,
+ "step": 946
+ },
+ {
+ "epoch": 2.5803814713896456,
+ "grad_norm": 13.089865684509277,
+ "learning_rate": 1.7202543142597642e-05,
+ "loss": 2.186,
+ "step": 947
+ },
+ {
+ "epoch": 2.5831062670299727,
+ "grad_norm": 13.027048110961914,
+ "learning_rate": 1.7220708446866486e-05,
+ "loss": 1.9521,
+ "step": 948
+ },
+ {
+ "epoch": 2.5858310626703,
+ "grad_norm": 11.275967597961426,
+ "learning_rate": 1.723887375113533e-05,
+ "loss": 2.0278,
+ "step": 949
+ },
+ {
+ "epoch": 2.5885558583106265,
+ "grad_norm": 11.945215225219727,
+ "learning_rate": 1.725703905540418e-05,
+ "loss": 2.0869,
+ "step": 950
+ },
+ {
+ "epoch": 2.5912806539509536,
+ "grad_norm": 13.042049407958984,
+ "learning_rate": 1.7275204359673027e-05,
+ "loss": 2.1851,
+ "step": 951
+ },
+ {
+ "epoch": 2.5940054495912808,
+ "grad_norm": 12.437920570373535,
+ "learning_rate": 1.729336966394187e-05,
+ "loss": 2.189,
+ "step": 952
+ },
+ {
+ "epoch": 2.5967302452316074,
+ "grad_norm": 10.772150039672852,
+ "learning_rate": 1.731153496821072e-05,
+ "loss": 2.0439,
+ "step": 953
+ },
+ {
+ "epoch": 2.5994550408719346,
+ "grad_norm": 9.490487098693848,
+ "learning_rate": 1.7329700272479567e-05,
+ "loss": 2.2412,
+ "step": 954
+ },
+ {
+ "epoch": 2.6021798365122617,
+ "grad_norm": 11.776585578918457,
+ "learning_rate": 1.734786557674841e-05,
+ "loss": 2.2949,
+ "step": 955
+ },
+ {
+ "epoch": 2.6049046321525884,
+ "grad_norm": 11.594934463500977,
+ "learning_rate": 1.736603088101726e-05,
+ "loss": 2.4121,
+ "step": 956
+ },
+ {
+ "epoch": 2.6076294277929155,
+ "grad_norm": 10.30360221862793,
+ "learning_rate": 1.7384196185286104e-05,
+ "loss": 2.2046,
+ "step": 957
+ },
+ {
+ "epoch": 2.6103542234332426,
+ "grad_norm": 10.74131965637207,
+ "learning_rate": 1.740236148955495e-05,
+ "loss": 2.0342,
+ "step": 958
+ },
+ {
+ "epoch": 2.6130790190735693,
+ "grad_norm": 14.043535232543945,
+ "learning_rate": 1.74205267938238e-05,
+ "loss": 2.0068,
+ "step": 959
+ },
+ {
+ "epoch": 2.6158038147138964,
+ "grad_norm": 15.56317138671875,
+ "learning_rate": 1.7438692098092644e-05,
+ "loss": 2.3081,
+ "step": 960
+ },
+ {
+ "epoch": 2.6185286103542236,
+ "grad_norm": 11.279816627502441,
+ "learning_rate": 1.745685740236149e-05,
+ "loss": 2.1792,
+ "step": 961
+ },
+ {
+ "epoch": 2.6212534059945503,
+ "grad_norm": 10.112878799438477,
+ "learning_rate": 1.747502270663034e-05,
+ "loss": 2.0562,
+ "step": 962
+ },
+ {
+ "epoch": 2.6239782016348774,
+ "grad_norm": 9.889863967895508,
+ "learning_rate": 1.7493188010899184e-05,
+ "loss": 2.0547,
+ "step": 963
+ },
+ {
+ "epoch": 2.6267029972752045,
+ "grad_norm": 11.233699798583984,
+ "learning_rate": 1.7511353315168032e-05,
+ "loss": 2.0146,
+ "step": 964
+ },
+ {
+ "epoch": 2.629427792915531,
+ "grad_norm": 11.08191204071045,
+ "learning_rate": 1.7529518619436876e-05,
+ "loss": 2.1846,
+ "step": 965
+ },
+ {
+ "epoch": 2.6321525885558583,
+ "grad_norm": 10.609518051147461,
+ "learning_rate": 1.7547683923705724e-05,
+ "loss": 2.0576,
+ "step": 966
+ },
+ {
+ "epoch": 2.6348773841961854,
+ "grad_norm": 10.003273010253906,
+ "learning_rate": 1.756584922797457e-05,
+ "loss": 2.064,
+ "step": 967
+ },
+ {
+ "epoch": 2.637602179836512,
+ "grad_norm": 11.615416526794434,
+ "learning_rate": 1.7584014532243416e-05,
+ "loss": 2.1299,
+ "step": 968
+ },
+ {
+ "epoch": 2.6403269754768393,
+ "grad_norm": 9.684825897216797,
+ "learning_rate": 1.7602179836512264e-05,
+ "loss": 2.0669,
+ "step": 969
+ },
+ {
+ "epoch": 2.6430517711171664,
+ "grad_norm": 9.547039985656738,
+ "learning_rate": 1.762034514078111e-05,
+ "loss": 2.3301,
+ "step": 970
+ },
+ {
+ "epoch": 2.645776566757493,
+ "grad_norm": 16.897127151489258,
+ "learning_rate": 1.7638510445049957e-05,
+ "loss": 2.1841,
+ "step": 971
+ },
+ {
+ "epoch": 2.64850136239782,
+ "grad_norm": 10.307887077331543,
+ "learning_rate": 1.7656675749318804e-05,
+ "loss": 2.0186,
+ "step": 972
+ },
+ {
+ "epoch": 2.6512261580381473,
+ "grad_norm": 10.339676856994629,
+ "learning_rate": 1.767484105358765e-05,
+ "loss": 1.9565,
+ "step": 973
+ },
+ {
+ "epoch": 2.653950953678474,
+ "grad_norm": 11.42247200012207,
+ "learning_rate": 1.7693006357856493e-05,
+ "loss": 2.1255,
+ "step": 974
+ },
+ {
+ "epoch": 2.656675749318801,
+ "grad_norm": 14.291765213012695,
+ "learning_rate": 1.771117166212534e-05,
+ "loss": 2.1147,
+ "step": 975
+ },
+ {
+ "epoch": 2.6594005449591283,
+ "grad_norm": 11.153193473815918,
+ "learning_rate": 1.772933696639419e-05,
+ "loss": 2.2563,
+ "step": 976
+ },
+ {
+ "epoch": 2.662125340599455,
+ "grad_norm": 21.198802947998047,
+ "learning_rate": 1.7747502270663034e-05,
+ "loss": 2.0952,
+ "step": 977
+ },
+ {
+ "epoch": 2.664850136239782,
+ "grad_norm": 8.79081916809082,
+ "learning_rate": 1.776566757493188e-05,
+ "loss": 1.9707,
+ "step": 978
+ },
+ {
+ "epoch": 2.667574931880109,
+ "grad_norm": 10.3134126663208,
+ "learning_rate": 1.778383287920073e-05,
+ "loss": 2.3716,
+ "step": 979
+ },
+ {
+ "epoch": 2.670299727520436,
+ "grad_norm": 11.59449577331543,
+ "learning_rate": 1.7801998183469574e-05,
+ "loss": 2.1514,
+ "step": 980
+ },
+ {
+ "epoch": 2.673024523160763,
+ "grad_norm": 11.302346229553223,
+ "learning_rate": 1.782016348773842e-05,
+ "loss": 2.1157,
+ "step": 981
+ },
+ {
+ "epoch": 2.67574931880109,
+ "grad_norm": 9.75825309753418,
+ "learning_rate": 1.7838328792007266e-05,
+ "loss": 2.0571,
+ "step": 982
+ },
+ {
+ "epoch": 2.678474114441417,
+ "grad_norm": 10.609179496765137,
+ "learning_rate": 1.7856494096276114e-05,
+ "loss": 2.1133,
+ "step": 983
+ },
+ {
+ "epoch": 2.681198910081744,
+ "grad_norm": 11.286617279052734,
+ "learning_rate": 1.7874659400544962e-05,
+ "loss": 2.3467,
+ "step": 984
+ },
+ {
+ "epoch": 2.683923705722071,
+ "grad_norm": 9.509994506835938,
+ "learning_rate": 1.7892824704813806e-05,
+ "loss": 1.9917,
+ "step": 985
+ },
+ {
+ "epoch": 2.6866485013623977,
+ "grad_norm": 14.678549766540527,
+ "learning_rate": 1.7910990009082654e-05,
+ "loss": 2.0366,
+ "step": 986
+ },
+ {
+ "epoch": 2.689373297002725,
+ "grad_norm": 11.929479598999023,
+ "learning_rate": 1.7929155313351502e-05,
+ "loss": 2.2295,
+ "step": 987
+ },
+ {
+ "epoch": 2.692098092643052,
+ "grad_norm": 17.15774917602539,
+ "learning_rate": 1.7947320617620346e-05,
+ "loss": 2.1348,
+ "step": 988
+ },
+ {
+ "epoch": 2.6948228882833787,
+ "grad_norm": 10.941985130310059,
+ "learning_rate": 1.7965485921889194e-05,
+ "loss": 2.0767,
+ "step": 989
+ },
+ {
+ "epoch": 2.697547683923706,
+ "grad_norm": 12.462225914001465,
+ "learning_rate": 1.798365122615804e-05,
+ "loss": 2.1367,
+ "step": 990
+ },
+ {
+ "epoch": 2.700272479564033,
+ "grad_norm": 11.844996452331543,
+ "learning_rate": 1.8001816530426887e-05,
+ "loss": 2.1934,
+ "step": 991
+ },
+ {
+ "epoch": 2.7029972752043596,
+ "grad_norm": 14.804704666137695,
+ "learning_rate": 1.801998183469573e-05,
+ "loss": 2.395,
+ "step": 992
+ },
+ {
+ "epoch": 2.7057220708446867,
+ "grad_norm": 11.517407417297363,
+ "learning_rate": 1.803814713896458e-05,
+ "loss": 2.3286,
+ "step": 993
+ },
+ {
+ "epoch": 2.708446866485014,
+ "grad_norm": 14.478534698486328,
+ "learning_rate": 1.8056312443233427e-05,
+ "loss": 2.1533,
+ "step": 994
+ },
+ {
+ "epoch": 2.7111716621253406,
+ "grad_norm": 9.946856498718262,
+ "learning_rate": 1.807447774750227e-05,
+ "loss": 1.96,
+ "step": 995
+ },
+ {
+ "epoch": 2.7138964577656677,
+ "grad_norm": 13.665610313415527,
+ "learning_rate": 1.809264305177112e-05,
+ "loss": 2.2798,
+ "step": 996
+ },
+ {
+ "epoch": 2.716621253405995,
+ "grad_norm": 10.038129806518555,
+ "learning_rate": 1.8110808356039967e-05,
+ "loss": 2.1304,
+ "step": 997
+ },
+ {
+ "epoch": 2.7193460490463215,
+ "grad_norm": 11.260223388671875,
+ "learning_rate": 1.812897366030881e-05,
+ "loss": 1.9653,
+ "step": 998
+ },
+ {
+ "epoch": 2.7220708446866486,
+ "grad_norm": 15.872689247131348,
+ "learning_rate": 1.8147138964577656e-05,
+ "loss": 2.145,
+ "step": 999
+ },
+ {
+ "epoch": 2.7247956403269757,
+ "grad_norm": 11.008293151855469,
+ "learning_rate": 1.8165304268846504e-05,
+ "loss": 1.9932,
+ "step": 1000
+ },
+ {
+ "epoch": 2.7275204359673024,
+ "grad_norm": 21.713911056518555,
+ "learning_rate": 1.818346957311535e-05,
+ "loss": 2.1406,
+ "step": 1001
+ },
+ {
+ "epoch": 2.7302452316076296,
+ "grad_norm": 10.877911567687988,
+ "learning_rate": 1.82016348773842e-05,
+ "loss": 1.8789,
+ "step": 1002
+ },
+ {
+ "epoch": 2.7329700272479567,
+ "grad_norm": 9.547883033752441,
+ "learning_rate": 1.8219800181653044e-05,
+ "loss": 1.9058,
+ "step": 1003
+ },
+ {
+ "epoch": 2.7356948228882834,
+ "grad_norm": 10.755492210388184,
+ "learning_rate": 1.8237965485921892e-05,
+ "loss": 2.2559,
+ "step": 1004
+ },
+ {
+ "epoch": 2.7384196185286105,
+ "grad_norm": 14.680377006530762,
+ "learning_rate": 1.825613079019074e-05,
+ "loss": 2.1792,
+ "step": 1005
+ },
+ {
+ "epoch": 2.741144414168937,
+ "grad_norm": 11.496443748474121,
+ "learning_rate": 1.8274296094459584e-05,
+ "loss": 1.8442,
+ "step": 1006
+ },
+ {
+ "epoch": 2.7438692098092643,
+ "grad_norm": 10.433564186096191,
+ "learning_rate": 1.829246139872843e-05,
+ "loss": 2.0632,
+ "step": 1007
+ },
+ {
+ "epoch": 2.7465940054495914,
+ "grad_norm": 13.286279678344727,
+ "learning_rate": 1.8310626702997276e-05,
+ "loss": 2.0337,
+ "step": 1008
+ },
+ {
+ "epoch": 2.749318801089918,
+ "grad_norm": 12.263654708862305,
+ "learning_rate": 1.8328792007266124e-05,
+ "loss": 2.2349,
+ "step": 1009
+ },
+ {
+ "epoch": 2.7520435967302452,
+ "grad_norm": 12.426753997802734,
+ "learning_rate": 1.834695731153497e-05,
+ "loss": 2.1875,
+ "step": 1010
+ },
+ {
+ "epoch": 2.7547683923705724,
+ "grad_norm": 11.248434066772461,
+ "learning_rate": 1.8365122615803817e-05,
+ "loss": 2.3296,
+ "step": 1011
+ },
+ {
+ "epoch": 2.757493188010899,
+ "grad_norm": 9.859634399414062,
+ "learning_rate": 1.8383287920072664e-05,
+ "loss": 2.0513,
+ "step": 1012
+ },
+ {
+ "epoch": 2.760217983651226,
+ "grad_norm": 14.553107261657715,
+ "learning_rate": 1.840145322434151e-05,
+ "loss": 1.9404,
+ "step": 1013
+ },
+ {
+ "epoch": 2.7629427792915533,
+ "grad_norm": 12.255064010620117,
+ "learning_rate": 1.8419618528610357e-05,
+ "loss": 2.0938,
+ "step": 1014
+ },
+ {
+ "epoch": 2.76566757493188,
+ "grad_norm": 9.135375022888184,
+ "learning_rate": 1.84377838328792e-05,
+ "loss": 1.9819,
+ "step": 1015
+ },
+ {
+ "epoch": 2.768392370572207,
+ "grad_norm": 9.41851806640625,
+ "learning_rate": 1.845594913714805e-05,
+ "loss": 2.1963,
+ "step": 1016
+ },
+ {
+ "epoch": 2.771117166212534,
+ "grad_norm": 10.326286315917969,
+ "learning_rate": 1.8474114441416894e-05,
+ "loss": 2.0601,
+ "step": 1017
+ },
+ {
+ "epoch": 2.773841961852861,
+ "grad_norm": 10.37588119506836,
+ "learning_rate": 1.849227974568574e-05,
+ "loss": 2.0913,
+ "step": 1018
+ },
+ {
+ "epoch": 2.776566757493188,
+ "grad_norm": 11.31806755065918,
+ "learning_rate": 1.851044504995459e-05,
+ "loss": 1.9868,
+ "step": 1019
+ },
+ {
+ "epoch": 2.7792915531335147,
+ "grad_norm": 11.349784851074219,
+ "learning_rate": 1.8528610354223434e-05,
+ "loss": 2.0552,
+ "step": 1020
+ },
+ {
+ "epoch": 2.782016348773842,
+ "grad_norm": 14.040486335754395,
+ "learning_rate": 1.854677565849228e-05,
+ "loss": 2.0845,
+ "step": 1021
+ },
+ {
+ "epoch": 2.784741144414169,
+ "grad_norm": 13.191317558288574,
+ "learning_rate": 1.856494096276113e-05,
+ "loss": 2.1899,
+ "step": 1022
+ },
+ {
+ "epoch": 2.7874659400544957,
+ "grad_norm": 9.923206329345703,
+ "learning_rate": 1.8583106267029974e-05,
+ "loss": 1.9409,
+ "step": 1023
+ },
+ {
+ "epoch": 2.790190735694823,
+ "grad_norm": 10.722381591796875,
+ "learning_rate": 1.8601271571298822e-05,
+ "loss": 2.0586,
+ "step": 1024
+ },
+ {
+ "epoch": 2.79291553133515,
+ "grad_norm": 17.646202087402344,
+ "learning_rate": 1.8619436875567666e-05,
+ "loss": 2.1035,
+ "step": 1025
+ },
+ {
+ "epoch": 2.7956403269754766,
+ "grad_norm": 9.694844245910645,
+ "learning_rate": 1.8637602179836514e-05,
+ "loss": 2.0835,
+ "step": 1026
+ },
+ {
+ "epoch": 2.7983651226158037,
+ "grad_norm": 12.24616813659668,
+ "learning_rate": 1.8655767484105362e-05,
+ "loss": 2.1138,
+ "step": 1027
+ },
+ {
+ "epoch": 2.801089918256131,
+ "grad_norm": 9.930631637573242,
+ "learning_rate": 1.8673932788374206e-05,
+ "loss": 2.0835,
+ "step": 1028
+ },
+ {
+ "epoch": 2.8038147138964575,
+ "grad_norm": 10.830024719238281,
+ "learning_rate": 1.8692098092643054e-05,
+ "loss": 2.0444,
+ "step": 1029
+ },
+ {
+ "epoch": 2.8065395095367847,
+ "grad_norm": 10.865161895751953,
+ "learning_rate": 1.8710263396911902e-05,
+ "loss": 2.0405,
+ "step": 1030
+ },
+ {
+ "epoch": 2.809264305177112,
+ "grad_norm": 14.24614429473877,
+ "learning_rate": 1.8728428701180747e-05,
+ "loss": 2.0142,
+ "step": 1031
+ },
+ {
+ "epoch": 2.8119891008174385,
+ "grad_norm": 11.228114128112793,
+ "learning_rate": 1.874659400544959e-05,
+ "loss": 2.0884,
+ "step": 1032
+ },
+ {
+ "epoch": 2.8147138964577656,
+ "grad_norm": 10.059917449951172,
+ "learning_rate": 1.876475930971844e-05,
+ "loss": 2.1763,
+ "step": 1033
+ },
+ {
+ "epoch": 2.8174386920980927,
+ "grad_norm": 11.651665687561035,
+ "learning_rate": 1.8782924613987287e-05,
+ "loss": 2.0122,
+ "step": 1034
+ },
+ {
+ "epoch": 2.8201634877384194,
+ "grad_norm": 11.106765747070312,
+ "learning_rate": 1.880108991825613e-05,
+ "loss": 2.2271,
+ "step": 1035
+ },
+ {
+ "epoch": 2.8228882833787465,
+ "grad_norm": 15.006171226501465,
+ "learning_rate": 1.881925522252498e-05,
+ "loss": 2.1875,
+ "step": 1036
+ },
+ {
+ "epoch": 2.8256130790190737,
+ "grad_norm": 15.874217987060547,
+ "learning_rate": 1.8837420526793827e-05,
+ "loss": 2.2461,
+ "step": 1037
+ },
+ {
+ "epoch": 2.8283378746594003,
+ "grad_norm": 10.447962760925293,
+ "learning_rate": 1.885558583106267e-05,
+ "loss": 2.252,
+ "step": 1038
+ },
+ {
+ "epoch": 2.8310626702997275,
+ "grad_norm": 10.36314868927002,
+ "learning_rate": 1.8873751135331516e-05,
+ "loss": 1.9971,
+ "step": 1039
+ },
+ {
+ "epoch": 2.8337874659400546,
+ "grad_norm": 10.244414329528809,
+ "learning_rate": 1.8891916439600364e-05,
+ "loss": 2.1052,
+ "step": 1040
+ },
+ {
+ "epoch": 2.8365122615803813,
+ "grad_norm": 10.732833862304688,
+ "learning_rate": 1.891008174386921e-05,
+ "loss": 2.0864,
+ "step": 1041
+ },
+ {
+ "epoch": 2.8392370572207084,
+ "grad_norm": 8.79423999786377,
+ "learning_rate": 1.8928247048138056e-05,
+ "loss": 1.834,
+ "step": 1042
+ },
+ {
+ "epoch": 2.8419618528610355,
+ "grad_norm": 10.455263137817383,
+ "learning_rate": 1.8946412352406904e-05,
+ "loss": 2.1279,
+ "step": 1043
+ },
+ {
+ "epoch": 2.844686648501362,
+ "grad_norm": 10.553400039672852,
+ "learning_rate": 1.8964577656675752e-05,
+ "loss": 2.1826,
+ "step": 1044
+ },
+ {
+ "epoch": 2.8474114441416893,
+ "grad_norm": 14.043966293334961,
+ "learning_rate": 1.8982742960944596e-05,
+ "loss": 2.1504,
+ "step": 1045
+ },
+ {
+ "epoch": 2.8501362397820165,
+ "grad_norm": 9.35976505279541,
+ "learning_rate": 1.9000908265213444e-05,
+ "loss": 1.9067,
+ "step": 1046
+ },
+ {
+ "epoch": 2.852861035422343,
+ "grad_norm": 10.658482551574707,
+ "learning_rate": 1.9019073569482292e-05,
+ "loss": 1.834,
+ "step": 1047
+ },
+ {
+ "epoch": 2.8555858310626703,
+ "grad_norm": 13.526549339294434,
+ "learning_rate": 1.9037238873751136e-05,
+ "loss": 2.0977,
+ "step": 1048
+ },
+ {
+ "epoch": 2.8583106267029974,
+ "grad_norm": 12.88541316986084,
+ "learning_rate": 1.9055404178019984e-05,
+ "loss": 2.0054,
+ "step": 1049
+ },
+ {
+ "epoch": 2.861035422343324,
+ "grad_norm": 10.029620170593262,
+ "learning_rate": 1.907356948228883e-05,
+ "loss": 2.1782,
+ "step": 1050
+ },
+ {
+ "epoch": 2.863760217983651,
+ "grad_norm": 9.453518867492676,
+ "learning_rate": 1.9091734786557677e-05,
+ "loss": 1.9761,
+ "step": 1051
+ },
+ {
+ "epoch": 2.8664850136239783,
+ "grad_norm": 11.48316764831543,
+ "learning_rate": 1.9109900090826524e-05,
+ "loss": 2.0508,
+ "step": 1052
+ },
+ {
+ "epoch": 2.869209809264305,
+ "grad_norm": 11.313542366027832,
+ "learning_rate": 1.912806539509537e-05,
+ "loss": 2.2388,
+ "step": 1053
+ },
+ {
+ "epoch": 2.871934604904632,
+ "grad_norm": 9.777838706970215,
+ "learning_rate": 1.9146230699364217e-05,
+ "loss": 2.0586,
+ "step": 1054
+ },
+ {
+ "epoch": 2.8746594005449593,
+ "grad_norm": 10.812276840209961,
+ "learning_rate": 1.9164396003633065e-05,
+ "loss": 2.29,
+ "step": 1055
+ },
+ {
+ "epoch": 2.877384196185286,
+ "grad_norm": 12.773347854614258,
+ "learning_rate": 1.918256130790191e-05,
+ "loss": 1.9983,
+ "step": 1056
+ },
+ {
+ "epoch": 2.880108991825613,
+ "grad_norm": 11.323981285095215,
+ "learning_rate": 1.9200726612170754e-05,
+ "loss": 2.0874,
+ "step": 1057
+ },
+ {
+ "epoch": 2.88283378746594,
+ "grad_norm": 11.521679878234863,
+ "learning_rate": 1.92188919164396e-05,
+ "loss": 2.1499,
+ "step": 1058
+ },
+ {
+ "epoch": 2.885558583106267,
+ "grad_norm": 9.209939956665039,
+ "learning_rate": 1.923705722070845e-05,
+ "loss": 1.978,
+ "step": 1059
+ },
+ {
+ "epoch": 2.888283378746594,
+ "grad_norm": 10.25390625,
+ "learning_rate": 1.9255222524977294e-05,
+ "loss": 2.0332,
+ "step": 1060
+ },
+ {
+ "epoch": 2.891008174386921,
+ "grad_norm": 10.265666961669922,
+ "learning_rate": 1.927338782924614e-05,
+ "loss": 2.1875,
+ "step": 1061
+ },
+ {
+ "epoch": 2.893732970027248,
+ "grad_norm": 9.984662055969238,
+ "learning_rate": 1.929155313351499e-05,
+ "loss": 2.1362,
+ "step": 1062
+ },
+ {
+ "epoch": 2.896457765667575,
+ "grad_norm": 9.017266273498535,
+ "learning_rate": 1.9309718437783834e-05,
+ "loss": 2.0161,
+ "step": 1063
+ },
+ {
+ "epoch": 2.899182561307902,
+ "grad_norm": 9.564297676086426,
+ "learning_rate": 1.932788374205268e-05,
+ "loss": 2.0894,
+ "step": 1064
+ },
+ {
+ "epoch": 2.9019073569482288,
+ "grad_norm": 10.540470123291016,
+ "learning_rate": 1.9346049046321526e-05,
+ "loss": 1.9082,
+ "step": 1065
+ },
+ {
+ "epoch": 2.904632152588556,
+ "grad_norm": 11.878788948059082,
+ "learning_rate": 1.9364214350590374e-05,
+ "loss": 2.2153,
+ "step": 1066
+ },
+ {
+ "epoch": 2.907356948228883,
+ "grad_norm": 9.226091384887695,
+ "learning_rate": 1.938237965485922e-05,
+ "loss": 2.0347,
+ "step": 1067
+ },
+ {
+ "epoch": 2.9100817438692097,
+ "grad_norm": 11.214638710021973,
+ "learning_rate": 1.9400544959128066e-05,
+ "loss": 1.9736,
+ "step": 1068
+ },
+ {
+ "epoch": 2.912806539509537,
+ "grad_norm": 10.410806655883789,
+ "learning_rate": 1.9418710263396914e-05,
+ "loss": 1.8379,
+ "step": 1069
+ },
+ {
+ "epoch": 2.915531335149864,
+ "grad_norm": 9.997007369995117,
+ "learning_rate": 1.9436875567665762e-05,
+ "loss": 1.9756,
+ "step": 1070
+ },
+ {
+ "epoch": 2.9182561307901906,
+ "grad_norm": 8.648539543151855,
+ "learning_rate": 1.9455040871934607e-05,
+ "loss": 2.0698,
+ "step": 1071
+ },
+ {
+ "epoch": 2.9209809264305178,
+ "grad_norm": 9.715324401855469,
+ "learning_rate": 1.9473206176203454e-05,
+ "loss": 2.1509,
+ "step": 1072
+ },
+ {
+ "epoch": 2.923705722070845,
+ "grad_norm": 11.68460464477539,
+ "learning_rate": 1.94913714804723e-05,
+ "loss": 2.1602,
+ "step": 1073
+ },
+ {
+ "epoch": 2.9264305177111716,
+ "grad_norm": 8.657852172851562,
+ "learning_rate": 1.9509536784741147e-05,
+ "loss": 1.9038,
+ "step": 1074
+ },
+ {
+ "epoch": 2.9291553133514987,
+ "grad_norm": 12.567237854003906,
+ "learning_rate": 1.952770208900999e-05,
+ "loss": 2.1553,
+ "step": 1075
+ },
+ {
+ "epoch": 2.931880108991826,
+ "grad_norm": 10.17682933807373,
+ "learning_rate": 1.954586739327884e-05,
+ "loss": 1.9727,
+ "step": 1076
+ },
+ {
+ "epoch": 2.9346049046321525,
+ "grad_norm": 25.757490158081055,
+ "learning_rate": 1.9564032697547687e-05,
+ "loss": 2.1606,
+ "step": 1077
+ },
+ {
+ "epoch": 2.9373297002724796,
+ "grad_norm": 11.21967887878418,
+ "learning_rate": 1.958219800181653e-05,
+ "loss": 2.0835,
+ "step": 1078
+ },
+ {
+ "epoch": 2.9400544959128068,
+ "grad_norm": 11.750326156616211,
+ "learning_rate": 1.960036330608538e-05,
+ "loss": 1.7771,
+ "step": 1079
+ },
+ {
+ "epoch": 2.9427792915531334,
+ "grad_norm": 10.967148780822754,
+ "learning_rate": 1.9618528610354227e-05,
+ "loss": 2.0957,
+ "step": 1080
+ },
+ {
+ "epoch": 2.9455040871934606,
+ "grad_norm": 14.189801216125488,
+ "learning_rate": 1.963669391462307e-05,
+ "loss": 2.0962,
+ "step": 1081
+ },
+ {
+ "epoch": 2.9482288828337877,
+ "grad_norm": 10.641090393066406,
+ "learning_rate": 1.9654859218891916e-05,
+ "loss": 2.1592,
+ "step": 1082
+ },
+ {
+ "epoch": 2.9509536784741144,
+ "grad_norm": 12.17349910736084,
+ "learning_rate": 1.9673024523160764e-05,
+ "loss": 2.1245,
+ "step": 1083
+ },
+ {
+ "epoch": 2.9536784741144415,
+ "grad_norm": 10.572559356689453,
+ "learning_rate": 1.9691189827429612e-05,
+ "loss": 2.0898,
+ "step": 1084
+ },
+ {
+ "epoch": 2.9564032697547686,
+ "grad_norm": 9.885048866271973,
+ "learning_rate": 1.9709355131698456e-05,
+ "loss": 2.1226,
+ "step": 1085
+ },
+ {
+ "epoch": 2.9591280653950953,
+ "grad_norm": 9.901043891906738,
+ "learning_rate": 1.9727520435967304e-05,
+ "loss": 1.8735,
+ "step": 1086
+ },
+ {
+ "epoch": 2.9618528610354224,
+ "grad_norm": 15.233263969421387,
+ "learning_rate": 1.9745685740236152e-05,
+ "loss": 1.9155,
+ "step": 1087
+ },
+ {
+ "epoch": 2.9645776566757496,
+ "grad_norm": 16.466659545898438,
+ "learning_rate": 1.9763851044504996e-05,
+ "loss": 2.1514,
+ "step": 1088
+ },
+ {
+ "epoch": 2.9673024523160763,
+ "grad_norm": 12.63900089263916,
+ "learning_rate": 1.978201634877384e-05,
+ "loss": 2.1035,
+ "step": 1089
+ },
+ {
+ "epoch": 2.9700272479564034,
+ "grad_norm": 9.711353302001953,
+ "learning_rate": 1.980018165304269e-05,
+ "loss": 2.2021,
+ "step": 1090
+ },
+ {
+ "epoch": 2.9727520435967305,
+ "grad_norm": 10.527975082397461,
+ "learning_rate": 1.9818346957311537e-05,
+ "loss": 1.9062,
+ "step": 1091
+ },
+ {
+ "epoch": 2.975476839237057,
+ "grad_norm": 10.087246894836426,
+ "learning_rate": 1.9836512261580384e-05,
+ "loss": 1.9131,
+ "step": 1092
+ },
+ {
+ "epoch": 2.9782016348773843,
+ "grad_norm": 9.904088973999023,
+ "learning_rate": 1.985467756584923e-05,
+ "loss": 2.3457,
+ "step": 1093
+ },
+ {
+ "epoch": 2.9809264305177114,
+ "grad_norm": 10.21497631072998,
+ "learning_rate": 1.9872842870118077e-05,
+ "loss": 1.9922,
+ "step": 1094
+ },
+ {
+ "epoch": 2.983651226158038,
+ "grad_norm": 10.031513214111328,
+ "learning_rate": 1.9891008174386925e-05,
+ "loss": 1.8799,
+ "step": 1095
+ },
+ {
+ "epoch": 2.9863760217983653,
+ "grad_norm": 18.525638580322266,
+ "learning_rate": 1.990917347865577e-05,
+ "loss": 2.0332,
+ "step": 1096
+ },
+ {
+ "epoch": 2.989100817438692,
+ "grad_norm": 9.667322158813477,
+ "learning_rate": 1.9927338782924614e-05,
+ "loss": 1.969,
+ "step": 1097
+ },
+ {
+ "epoch": 2.991825613079019,
+ "grad_norm": 10.101297378540039,
+ "learning_rate": 1.994550408719346e-05,
+ "loss": 2.1143,
+ "step": 1098
+ },
+ {
+ "epoch": 2.994550408719346,
+ "grad_norm": 9.766504287719727,
+ "learning_rate": 1.996366939146231e-05,
+ "loss": 1.9966,
+ "step": 1099
+ },
+ {
+ "epoch": 2.997275204359673,
+ "grad_norm": 10.17359733581543,
+ "learning_rate": 1.9981834695731154e-05,
+ "loss": 2.2192,
+ "step": 1100
+ },
+ {
+ "epoch": 3.0,
+ "grad_norm": 11.143439292907715,
+ "learning_rate": 2e-05,
+ "loss": 2.041,
+ "step": 1101
+ },
+ {
+ "epoch": 3.002724795640327,
+ "grad_norm": 10.33942699432373,
+ "learning_rate": 1.9999999961060162e-05,
+ "loss": 1.875,
+ "step": 1102
+ },
+ {
+ "epoch": 3.005449591280654,
+ "grad_norm": 11.492137908935547,
+ "learning_rate": 1.9999999844240644e-05,
+ "loss": 2.2,
+ "step": 1103
+ },
+ {
+ "epoch": 3.008174386920981,
+ "grad_norm": 10.473490715026855,
+ "learning_rate": 1.999999964954145e-05,
+ "loss": 1.8848,
+ "step": 1104
+ },
+ {
+ "epoch": 3.010899182561308,
+ "grad_norm": 12.820694923400879,
+ "learning_rate": 1.9999999376962583e-05,
+ "loss": 2.1724,
+ "step": 1105
+ },
+ {
+ "epoch": 3.0136239782016347,
+ "grad_norm": 14.527670860290527,
+ "learning_rate": 1.999999902650404e-05,
+ "loss": 2.0332,
+ "step": 1106
+ },
+ {
+ "epoch": 3.016348773841962,
+ "grad_norm": 9.247108459472656,
+ "learning_rate": 1.9999998598165827e-05,
+ "loss": 1.8853,
+ "step": 1107
+ },
+ {
+ "epoch": 3.019073569482289,
+ "grad_norm": 12.707825660705566,
+ "learning_rate": 1.9999998091947947e-05,
+ "loss": 2.231,
+ "step": 1108
+ },
+ {
+ "epoch": 3.0217983651226157,
+ "grad_norm": 11.171661376953125,
+ "learning_rate": 1.9999997507850404e-05,
+ "loss": 1.8789,
+ "step": 1109
+ },
+ {
+ "epoch": 3.024523160762943,
+ "grad_norm": 11.998929023742676,
+ "learning_rate": 1.99999968458732e-05,
+ "loss": 1.9287,
+ "step": 1110
+ },
+ {
+ "epoch": 3.02724795640327,
+ "grad_norm": 10.787744522094727,
+ "learning_rate": 1.9999996106016345e-05,
+ "loss": 2.0576,
+ "step": 1111
+ },
+ {
+ "epoch": 3.0299727520435966,
+ "grad_norm": 14.347358703613281,
+ "learning_rate": 1.999999528827984e-05,
+ "loss": 1.9194,
+ "step": 1112
+ },
+ {
+ "epoch": 3.0326975476839237,
+ "grad_norm": 10.398091316223145,
+ "learning_rate": 1.9999994392663697e-05,
+ "loss": 1.9146,
+ "step": 1113
+ },
+ {
+ "epoch": 3.035422343324251,
+ "grad_norm": 10.237173080444336,
+ "learning_rate": 1.9999993419167914e-05,
+ "loss": 1.9946,
+ "step": 1114
+ },
+ {
+ "epoch": 3.0381471389645776,
+ "grad_norm": 10.289793968200684,
+ "learning_rate": 1.999999236779251e-05,
+ "loss": 1.9805,
+ "step": 1115
+ },
+ {
+ "epoch": 3.0408719346049047,
+ "grad_norm": 10.29628849029541,
+ "learning_rate": 1.9999991238537482e-05,
+ "loss": 2.0688,
+ "step": 1116
+ },
+ {
+ "epoch": 3.043596730245232,
+ "grad_norm": 10.019878387451172,
+ "learning_rate": 1.999999003140285e-05,
+ "loss": 1.8232,
+ "step": 1117
+ },
+ {
+ "epoch": 3.0463215258855585,
+ "grad_norm": 9.181999206542969,
+ "learning_rate": 1.9999988746388613e-05,
+ "loss": 1.8823,
+ "step": 1118
+ },
+ {
+ "epoch": 3.0490463215258856,
+ "grad_norm": 10.890800476074219,
+ "learning_rate": 1.9999987383494786e-05,
+ "loss": 1.8945,
+ "step": 1119
+ },
+ {
+ "epoch": 3.0517711171662127,
+ "grad_norm": 11.722890853881836,
+ "learning_rate": 1.999998594272138e-05,
+ "loss": 1.9785,
+ "step": 1120
+ },
+ {
+ "epoch": 3.0544959128065394,
+ "grad_norm": 11.116331100463867,
+ "learning_rate": 1.9999984424068405e-05,
+ "loss": 1.8101,
+ "step": 1121
+ },
+ {
+ "epoch": 3.0572207084468666,
+ "grad_norm": 12.051642417907715,
+ "learning_rate": 1.9999982827535874e-05,
+ "loss": 2.0015,
+ "step": 1122
+ },
+ {
+ "epoch": 3.0599455040871932,
+ "grad_norm": 10.866436004638672,
+ "learning_rate": 1.9999981153123797e-05,
+ "loss": 1.8687,
+ "step": 1123
+ },
+ {
+ "epoch": 3.0626702997275204,
+ "grad_norm": 10.616351127624512,
+ "learning_rate": 1.999997940083219e-05,
+ "loss": 1.9897,
+ "step": 1124
+ },
+ {
+ "epoch": 3.0653950953678475,
+ "grad_norm": 11.926887512207031,
+ "learning_rate": 1.9999977570661064e-05,
+ "loss": 1.8184,
+ "step": 1125
+ },
+ {
+ "epoch": 3.068119891008174,
+ "grad_norm": 9.511907577514648,
+ "learning_rate": 1.9999975662610435e-05,
+ "loss": 2.0708,
+ "step": 1126
+ },
+ {
+ "epoch": 3.0708446866485013,
+ "grad_norm": 11.440744400024414,
+ "learning_rate": 1.9999973676680318e-05,
+ "loss": 1.9248,
+ "step": 1127
+ },
+ {
+ "epoch": 3.0735694822888284,
+ "grad_norm": 10.463530540466309,
+ "learning_rate": 1.999997161287073e-05,
+ "loss": 2.0166,
+ "step": 1128
+ },
+ {
+ "epoch": 3.076294277929155,
+ "grad_norm": 13.820565223693848,
+ "learning_rate": 1.999996947118168e-05,
+ "loss": 1.9067,
+ "step": 1129
+ },
+ {
+ "epoch": 3.0790190735694822,
+ "grad_norm": 8.525996208190918,
+ "learning_rate": 1.999996725161319e-05,
+ "loss": 1.9385,
+ "step": 1130
+ },
+ {
+ "epoch": 3.0817438692098094,
+ "grad_norm": 13.830317497253418,
+ "learning_rate": 1.999996495416528e-05,
+ "loss": 2.0405,
+ "step": 1131
+ },
+ {
+ "epoch": 3.084468664850136,
+ "grad_norm": 11.075336456298828,
+ "learning_rate": 1.9999962578837967e-05,
+ "loss": 1.9897,
+ "step": 1132
+ },
+ {
+ "epoch": 3.087193460490463,
+ "grad_norm": 16.12899398803711,
+ "learning_rate": 1.999996012563126e-05,
+ "loss": 1.8789,
+ "step": 1133
+ },
+ {
+ "epoch": 3.0899182561307903,
+ "grad_norm": 10.055564880371094,
+ "learning_rate": 1.9999957594545193e-05,
+ "loss": 2.0825,
+ "step": 1134
+ },
+ {
+ "epoch": 3.092643051771117,
+ "grad_norm": 14.070582389831543,
+ "learning_rate": 1.9999954985579774e-05,
+ "loss": 1.8477,
+ "step": 1135
+ },
+ {
+ "epoch": 3.095367847411444,
+ "grad_norm": 10.774489402770996,
+ "learning_rate": 1.999995229873503e-05,
+ "loss": 1.9692,
+ "step": 1136
+ },
+ {
+ "epoch": 3.0980926430517712,
+ "grad_norm": 11.93801498413086,
+ "learning_rate": 1.9999949534010975e-05,
+ "loss": 2.0947,
+ "step": 1137
+ },
+ {
+ "epoch": 3.100817438692098,
+ "grad_norm": 9.086506843566895,
+ "learning_rate": 1.9999946691407635e-05,
+ "loss": 1.7251,
+ "step": 1138
+ },
+ {
+ "epoch": 3.103542234332425,
+ "grad_norm": 11.340764999389648,
+ "learning_rate": 1.9999943770925037e-05,
+ "loss": 1.9004,
+ "step": 1139
+ },
+ {
+ "epoch": 3.106267029972752,
+ "grad_norm": 11.077136039733887,
+ "learning_rate": 1.9999940772563194e-05,
+ "loss": 1.9233,
+ "step": 1140
+ },
+ {
+ "epoch": 3.108991825613079,
+ "grad_norm": 10.375553131103516,
+ "learning_rate": 1.9999937696322136e-05,
+ "loss": 1.8062,
+ "step": 1141
+ },
+ {
+ "epoch": 3.111716621253406,
+ "grad_norm": 10.730899810791016,
+ "learning_rate": 1.9999934542201888e-05,
+ "loss": 2.04,
+ "step": 1142
+ },
+ {
+ "epoch": 3.114441416893733,
+ "grad_norm": 12.8143310546875,
+ "learning_rate": 1.999993131020247e-05,
+ "loss": 2.1177,
+ "step": 1143
+ },
+ {
+ "epoch": 3.11716621253406,
+ "grad_norm": 12.750884056091309,
+ "learning_rate": 1.9999928000323903e-05,
+ "loss": 1.9541,
+ "step": 1144
+ },
+ {
+ "epoch": 3.119891008174387,
+ "grad_norm": 11.579204559326172,
+ "learning_rate": 1.9999924612566225e-05,
+ "loss": 2.0874,
+ "step": 1145
+ },
+ {
+ "epoch": 3.122615803814714,
+ "grad_norm": 11.029909133911133,
+ "learning_rate": 1.9999921146929454e-05,
+ "loss": 1.7896,
+ "step": 1146
+ },
+ {
+ "epoch": 3.1253405994550407,
+ "grad_norm": 11.410332679748535,
+ "learning_rate": 1.9999917603413618e-05,
+ "loss": 2.0469,
+ "step": 1147
+ },
+ {
+ "epoch": 3.128065395095368,
+ "grad_norm": 11.27589225769043,
+ "learning_rate": 1.9999913982018747e-05,
+ "loss": 1.9707,
+ "step": 1148
+ },
+ {
+ "epoch": 3.130790190735695,
+ "grad_norm": 10.249436378479004,
+ "learning_rate": 1.9999910282744865e-05,
+ "loss": 1.9133,
+ "step": 1149
+ },
+ {
+ "epoch": 3.1335149863760217,
+ "grad_norm": 12.009215354919434,
+ "learning_rate": 1.999990650559201e-05,
+ "loss": 1.978,
+ "step": 1150
+ },
+ {
+ "epoch": 3.136239782016349,
+ "grad_norm": 12.450786590576172,
+ "learning_rate": 1.99999026505602e-05,
+ "loss": 1.9531,
+ "step": 1151
+ },
+ {
+ "epoch": 3.138964577656676,
+ "grad_norm": 10.915098190307617,
+ "learning_rate": 1.999989871764947e-05,
+ "loss": 1.7954,
+ "step": 1152
+ },
+ {
+ "epoch": 3.1416893732970026,
+ "grad_norm": 10.478048324584961,
+ "learning_rate": 1.9999894706859852e-05,
+ "loss": 1.9912,
+ "step": 1153
+ },
+ {
+ "epoch": 3.1444141689373297,
+ "grad_norm": 22.394235610961914,
+ "learning_rate": 1.9999890618191375e-05,
+ "loss": 1.8711,
+ "step": 1154
+ },
+ {
+ "epoch": 3.147138964577657,
+ "grad_norm": 24.724218368530273,
+ "learning_rate": 1.999988645164407e-05,
+ "loss": 2.0547,
+ "step": 1155
+ },
+ {
+ "epoch": 3.1498637602179835,
+ "grad_norm": 9.987106323242188,
+ "learning_rate": 1.9999882207217976e-05,
+ "loss": 2.0884,
+ "step": 1156
+ },
+ {
+ "epoch": 3.1525885558583107,
+ "grad_norm": 10.89595890045166,
+ "learning_rate": 1.9999877884913116e-05,
+ "loss": 1.9312,
+ "step": 1157
+ },
+ {
+ "epoch": 3.155313351498638,
+ "grad_norm": 11.442464828491211,
+ "learning_rate": 1.9999873484729533e-05,
+ "loss": 2.0894,
+ "step": 1158
+ },
+ {
+ "epoch": 3.1580381471389645,
+ "grad_norm": 13.294852256774902,
+ "learning_rate": 1.9999869006667254e-05,
+ "loss": 1.8687,
+ "step": 1159
+ },
+ {
+ "epoch": 3.1607629427792916,
+ "grad_norm": 10.252835273742676,
+ "learning_rate": 1.999986445072632e-05,
+ "loss": 1.8933,
+ "step": 1160
+ },
+ {
+ "epoch": 3.1634877384196187,
+ "grad_norm": 12.676876068115234,
+ "learning_rate": 1.9999859816906763e-05,
+ "loss": 1.8652,
+ "step": 1161
+ },
+ {
+ "epoch": 3.1662125340599454,
+ "grad_norm": 18.203889846801758,
+ "learning_rate": 1.9999855105208616e-05,
+ "loss": 1.9907,
+ "step": 1162
+ },
+ {
+ "epoch": 3.1689373297002725,
+ "grad_norm": 11.438253402709961,
+ "learning_rate": 1.9999850315631925e-05,
+ "loss": 2.1001,
+ "step": 1163
+ },
+ {
+ "epoch": 3.1716621253405997,
+ "grad_norm": 11.49427318572998,
+ "learning_rate": 1.9999845448176717e-05,
+ "loss": 1.9683,
+ "step": 1164
+ },
+ {
+ "epoch": 3.1743869209809263,
+ "grad_norm": 24.44009780883789,
+ "learning_rate": 1.9999840502843034e-05,
+ "loss": 1.8289,
+ "step": 1165
+ },
+ {
+ "epoch": 3.1771117166212535,
+ "grad_norm": 11.613852500915527,
+ "learning_rate": 1.999983547963092e-05,
+ "loss": 1.9341,
+ "step": 1166
+ },
+ {
+ "epoch": 3.1798365122615806,
+ "grad_norm": 11.840388298034668,
+ "learning_rate": 1.9999830378540403e-05,
+ "loss": 1.9385,
+ "step": 1167
+ },
+ {
+ "epoch": 3.1825613079019073,
+ "grad_norm": 15.055170059204102,
+ "learning_rate": 1.9999825199571533e-05,
+ "loss": 1.9922,
+ "step": 1168
+ },
+ {
+ "epoch": 3.1852861035422344,
+ "grad_norm": 9.82111644744873,
+ "learning_rate": 1.9999819942724343e-05,
+ "loss": 2.0317,
+ "step": 1169
+ },
+ {
+ "epoch": 3.1880108991825615,
+ "grad_norm": 11.261125564575195,
+ "learning_rate": 1.9999814607998884e-05,
+ "loss": 2.0488,
+ "step": 1170
+ },
+ {
+ "epoch": 3.190735694822888,
+ "grad_norm": 14.382711410522461,
+ "learning_rate": 1.9999809195395182e-05,
+ "loss": 2.064,
+ "step": 1171
+ },
+ {
+ "epoch": 3.1934604904632153,
+ "grad_norm": 11.627882957458496,
+ "learning_rate": 1.9999803704913293e-05,
+ "loss": 2.0542,
+ "step": 1172
+ },
+ {
+ "epoch": 3.1961852861035425,
+ "grad_norm": 11.54857349395752,
+ "learning_rate": 1.9999798136553253e-05,
+ "loss": 2.0269,
+ "step": 1173
+ },
+ {
+ "epoch": 3.198910081743869,
+ "grad_norm": 11.140435218811035,
+ "learning_rate": 1.9999792490315107e-05,
+ "loss": 2.2227,
+ "step": 1174
+ },
+ {
+ "epoch": 3.2016348773841963,
+ "grad_norm": 14.964839935302734,
+ "learning_rate": 1.9999786766198902e-05,
+ "loss": 1.8779,
+ "step": 1175
+ },
+ {
+ "epoch": 3.204359673024523,
+ "grad_norm": 10.240537643432617,
+ "learning_rate": 1.9999780964204675e-05,
+ "loss": 1.9644,
+ "step": 1176
+ },
+ {
+ "epoch": 3.20708446866485,
+ "grad_norm": 14.842936515808105,
+ "learning_rate": 1.9999775084332477e-05,
+ "loss": 2.063,
+ "step": 1177
+ },
+ {
+ "epoch": 3.209809264305177,
+ "grad_norm": 8.813994407653809,
+ "learning_rate": 1.999976912658235e-05,
+ "loss": 2.0947,
+ "step": 1178
+ },
+ {
+ "epoch": 3.212534059945504,
+ "grad_norm": 9.20219612121582,
+ "learning_rate": 1.999976309095435e-05,
+ "loss": 2.0005,
+ "step": 1179
+ },
+ {
+ "epoch": 3.215258855585831,
+ "grad_norm": 12.575230598449707,
+ "learning_rate": 1.999975697744851e-05,
+ "loss": 2.0859,
+ "step": 1180
+ },
+ {
+ "epoch": 3.217983651226158,
+ "grad_norm": 10.840344429016113,
+ "learning_rate": 1.999975078606489e-05,
+ "loss": 1.7068,
+ "step": 1181
+ },
+ {
+ "epoch": 3.220708446866485,
+ "grad_norm": 10.119123458862305,
+ "learning_rate": 1.9999744516803527e-05,
+ "loss": 2.1094,
+ "step": 1182
+ },
+ {
+ "epoch": 3.223433242506812,
+ "grad_norm": 11.109670639038086,
+ "learning_rate": 1.999973816966448e-05,
+ "loss": 2.104,
+ "step": 1183
+ },
+ {
+ "epoch": 3.226158038147139,
+ "grad_norm": 15.738182067871094,
+ "learning_rate": 1.999973174464779e-05,
+ "loss": 1.9448,
+ "step": 1184
+ },
+ {
+ "epoch": 3.2288828337874658,
+ "grad_norm": 9.035996437072754,
+ "learning_rate": 1.9999725241753516e-05,
+ "loss": 1.8745,
+ "step": 1185
+ },
+ {
+ "epoch": 3.231607629427793,
+ "grad_norm": 12.854116439819336,
+ "learning_rate": 1.9999718660981703e-05,
+ "loss": 2.1528,
+ "step": 1186
+ },
+ {
+ "epoch": 3.23433242506812,
+ "grad_norm": 14.7183837890625,
+ "learning_rate": 1.9999712002332397e-05,
+ "loss": 1.9351,
+ "step": 1187
+ },
+ {
+ "epoch": 3.2370572207084467,
+ "grad_norm": 11.334243774414062,
+ "learning_rate": 1.9999705265805662e-05,
+ "loss": 2.042,
+ "step": 1188
+ },
+ {
+ "epoch": 3.239782016348774,
+ "grad_norm": 9.695436477661133,
+ "learning_rate": 1.9999698451401542e-05,
+ "loss": 1.855,
+ "step": 1189
+ },
+ {
+ "epoch": 3.242506811989101,
+ "grad_norm": 12.386056900024414,
+ "learning_rate": 1.9999691559120092e-05,
+ "loss": 2.0366,
+ "step": 1190
+ },
+ {
+ "epoch": 3.2452316076294276,
+ "grad_norm": 11.660694122314453,
+ "learning_rate": 1.999968458896137e-05,
+ "loss": 1.9668,
+ "step": 1191
+ },
+ {
+ "epoch": 3.2479564032697548,
+ "grad_norm": 10.674187660217285,
+ "learning_rate": 1.9999677540925416e-05,
+ "loss": 1.6982,
+ "step": 1192
+ },
+ {
+ "epoch": 3.250681198910082,
+ "grad_norm": 13.024900436401367,
+ "learning_rate": 1.9999670415012306e-05,
+ "loss": 1.8032,
+ "step": 1193
+ },
+ {
+ "epoch": 3.2534059945504086,
+ "grad_norm": 10.894378662109375,
+ "learning_rate": 1.9999663211222078e-05,
+ "loss": 2.0825,
+ "step": 1194
+ },
+ {
+ "epoch": 3.2561307901907357,
+ "grad_norm": 10.457403182983398,
+ "learning_rate": 1.9999655929554798e-05,
+ "loss": 1.9355,
+ "step": 1195
+ },
+ {
+ "epoch": 3.258855585831063,
+ "grad_norm": 10.54038143157959,
+ "learning_rate": 1.999964857001052e-05,
+ "loss": 2.0415,
+ "step": 1196
+ },
+ {
+ "epoch": 3.2615803814713895,
+ "grad_norm": 9.038063049316406,
+ "learning_rate": 1.99996411325893e-05,
+ "loss": 1.9448,
+ "step": 1197
+ },
+ {
+ "epoch": 3.2643051771117166,
+ "grad_norm": 9.49393081665039,
+ "learning_rate": 1.9999633617291196e-05,
+ "loss": 1.7476,
+ "step": 1198
+ },
+ {
+ "epoch": 3.2670299727520438,
+ "grad_norm": 10.450029373168945,
+ "learning_rate": 1.9999626024116267e-05,
+ "loss": 1.9834,
+ "step": 1199
+ },
+ {
+ "epoch": 3.2697547683923704,
+ "grad_norm": 9.543033599853516,
+ "learning_rate": 1.999961835306457e-05,
+ "loss": 1.9922,
+ "step": 1200
+ },
+ {
+ "epoch": 3.2724795640326976,
+ "grad_norm": 9.017727851867676,
+ "learning_rate": 1.999961060413617e-05,
+ "loss": 1.8706,
+ "step": 1201
+ },
+ {
+ "epoch": 3.2752043596730247,
+ "grad_norm": 11.66344928741455,
+ "learning_rate": 1.9999602777331124e-05,
+ "loss": 2.1118,
+ "step": 1202
+ },
+ {
+ "epoch": 3.2779291553133514,
+ "grad_norm": 9.141104698181152,
+ "learning_rate": 1.9999594872649495e-05,
+ "loss": 1.8687,
+ "step": 1203
+ },
+ {
+ "epoch": 3.2806539509536785,
+ "grad_norm": 9.666121482849121,
+ "learning_rate": 1.999958689009134e-05,
+ "loss": 2.0581,
+ "step": 1204
+ },
+ {
+ "epoch": 3.2833787465940056,
+ "grad_norm": 11.769775390625,
+ "learning_rate": 1.9999578829656724e-05,
+ "loss": 1.9629,
+ "step": 1205
+ },
+ {
+ "epoch": 3.2861035422343323,
+ "grad_norm": 9.261898040771484,
+ "learning_rate": 1.9999570691345712e-05,
+ "loss": 2.0469,
+ "step": 1206
+ },
+ {
+ "epoch": 3.2888283378746594,
+ "grad_norm": 12.135587692260742,
+ "learning_rate": 1.9999562475158365e-05,
+ "loss": 1.9556,
+ "step": 1207
+ },
+ {
+ "epoch": 3.291553133514986,
+ "grad_norm": 9.376842498779297,
+ "learning_rate": 1.9999554181094748e-05,
+ "loss": 1.728,
+ "step": 1208
+ },
+ {
+ "epoch": 3.2942779291553133,
+ "grad_norm": 13.119425773620605,
+ "learning_rate": 1.9999545809154925e-05,
+ "loss": 2.1191,
+ "step": 1209
+ },
+ {
+ "epoch": 3.2970027247956404,
+ "grad_norm": 10.199698448181152,
+ "learning_rate": 1.9999537359338957e-05,
+ "loss": 2.0723,
+ "step": 1210
+ },
+ {
+ "epoch": 3.299727520435967,
+ "grad_norm": 9.926660537719727,
+ "learning_rate": 1.999952883164692e-05,
+ "loss": 1.9331,
+ "step": 1211
+ },
+ {
+ "epoch": 3.302452316076294,
+ "grad_norm": 9.661992073059082,
+ "learning_rate": 1.9999520226078872e-05,
+ "loss": 2.2212,
+ "step": 1212
+ },
+ {
+ "epoch": 3.3051771117166213,
+ "grad_norm": 8.763089179992676,
+ "learning_rate": 1.999951154263488e-05,
+ "loss": 1.6157,
+ "step": 1213
+ },
+ {
+ "epoch": 3.307901907356948,
+ "grad_norm": 10.265016555786133,
+ "learning_rate": 1.9999502781315018e-05,
+ "loss": 1.9888,
+ "step": 1214
+ },
+ {
+ "epoch": 3.310626702997275,
+ "grad_norm": 8.20125961303711,
+ "learning_rate": 1.9999493942119346e-05,
+ "loss": 1.8853,
+ "step": 1215
+ },
+ {
+ "epoch": 3.3133514986376023,
+ "grad_norm": 9.446121215820312,
+ "learning_rate": 1.999948502504794e-05,
+ "loss": 1.8525,
+ "step": 1216
+ },
+ {
+ "epoch": 3.316076294277929,
+ "grad_norm": 10.643209457397461,
+ "learning_rate": 1.9999476030100862e-05,
+ "loss": 1.9517,
+ "step": 1217
+ },
+ {
+ "epoch": 3.318801089918256,
+ "grad_norm": 11.535621643066406,
+ "learning_rate": 1.999946695727819e-05,
+ "loss": 1.9863,
+ "step": 1218
+ },
+ {
+ "epoch": 3.321525885558583,
+ "grad_norm": 11.043972969055176,
+ "learning_rate": 1.999945780657999e-05,
+ "loss": 1.979,
+ "step": 1219
+ },
+ {
+ "epoch": 3.32425068119891,
+ "grad_norm": 11.173770904541016,
+ "learning_rate": 1.9999448578006337e-05,
+ "loss": 1.8547,
+ "step": 1220
+ },
+ {
+ "epoch": 3.326975476839237,
+ "grad_norm": 9.972723960876465,
+ "learning_rate": 1.9999439271557296e-05,
+ "loss": 2.0645,
+ "step": 1221
+ },
+ {
+ "epoch": 3.329700272479564,
+ "grad_norm": 12.643669128417969,
+ "learning_rate": 1.9999429887232948e-05,
+ "loss": 1.9204,
+ "step": 1222
+ },
+ {
+ "epoch": 3.332425068119891,
+ "grad_norm": 10.223214149475098,
+ "learning_rate": 1.999942042503336e-05,
+ "loss": 1.8872,
+ "step": 1223
+ },
+ {
+ "epoch": 3.335149863760218,
+ "grad_norm": 12.952620506286621,
+ "learning_rate": 1.9999410884958608e-05,
+ "loss": 1.7798,
+ "step": 1224
+ },
+ {
+ "epoch": 3.337874659400545,
+ "grad_norm": 11.56080150604248,
+ "learning_rate": 1.9999401267008766e-05,
+ "loss": 1.9966,
+ "step": 1225
+ },
+ {
+ "epoch": 3.3405994550408717,
+ "grad_norm": 8.708621978759766,
+ "learning_rate": 1.9999391571183907e-05,
+ "loss": 1.9858,
+ "step": 1226
+ },
+ {
+ "epoch": 3.343324250681199,
+ "grad_norm": 16.07501792907715,
+ "learning_rate": 1.9999381797484113e-05,
+ "loss": 1.937,
+ "step": 1227
+ },
+ {
+ "epoch": 3.346049046321526,
+ "grad_norm": 19.36942481994629,
+ "learning_rate": 1.999937194590945e-05,
+ "loss": 2.2212,
+ "step": 1228
+ },
+ {
+ "epoch": 3.3487738419618527,
+ "grad_norm": 9.319982528686523,
+ "learning_rate": 1.9999362016460005e-05,
+ "loss": 1.8535,
+ "step": 1229
+ },
+ {
+ "epoch": 3.35149863760218,
+ "grad_norm": 12.806680679321289,
+ "learning_rate": 1.9999352009135846e-05,
+ "loss": 2.0532,
+ "step": 1230
+ },
+ {
+ "epoch": 3.354223433242507,
+ "grad_norm": 8.694989204406738,
+ "learning_rate": 1.9999341923937056e-05,
+ "loss": 1.7805,
+ "step": 1231
+ },
+ {
+ "epoch": 3.3569482288828336,
+ "grad_norm": 11.847393989562988,
+ "learning_rate": 1.9999331760863715e-05,
+ "loss": 1.9702,
+ "step": 1232
+ },
+ {
+ "epoch": 3.3596730245231607,
+ "grad_norm": 17.723541259765625,
+ "learning_rate": 1.99993215199159e-05,
+ "loss": 1.8906,
+ "step": 1233
+ },
+ {
+ "epoch": 3.362397820163488,
+ "grad_norm": 10.759478569030762,
+ "learning_rate": 1.999931120109369e-05,
+ "loss": 2.1333,
+ "step": 1234
+ },
+ {
+ "epoch": 3.3651226158038146,
+ "grad_norm": 10.469283103942871,
+ "learning_rate": 1.9999300804397164e-05,
+ "loss": 2.0376,
+ "step": 1235
+ },
+ {
+ "epoch": 3.3678474114441417,
+ "grad_norm": 9.429465293884277,
+ "learning_rate": 1.9999290329826406e-05,
+ "loss": 1.7695,
+ "step": 1236
+ },
+ {
+ "epoch": 3.370572207084469,
+ "grad_norm": 10.218581199645996,
+ "learning_rate": 1.99992797773815e-05,
+ "loss": 1.8613,
+ "step": 1237
+ },
+ {
+ "epoch": 3.3732970027247955,
+ "grad_norm": 11.13946533203125,
+ "learning_rate": 1.999926914706252e-05,
+ "loss": 1.9194,
+ "step": 1238
+ },
+ {
+ "epoch": 3.3760217983651226,
+ "grad_norm": 10.5692138671875,
+ "learning_rate": 1.9999258438869558e-05,
+ "loss": 2.1162,
+ "step": 1239
+ },
+ {
+ "epoch": 3.3787465940054497,
+ "grad_norm": 10.036789894104004,
+ "learning_rate": 1.999924765280269e-05,
+ "loss": 1.9028,
+ "step": 1240
+ },
+ {
+ "epoch": 3.3814713896457764,
+ "grad_norm": 14.0789794921875,
+ "learning_rate": 1.9999236788862006e-05,
+ "loss": 1.7881,
+ "step": 1241
+ },
+ {
+ "epoch": 3.3841961852861036,
+ "grad_norm": 14.197346687316895,
+ "learning_rate": 1.999922584704759e-05,
+ "loss": 1.9946,
+ "step": 1242
+ },
+ {
+ "epoch": 3.3869209809264307,
+ "grad_norm": 8.973702430725098,
+ "learning_rate": 1.9999214827359518e-05,
+ "loss": 2.2031,
+ "step": 1243
+ },
+ {
+ "epoch": 3.3896457765667574,
+ "grad_norm": 10.881900787353516,
+ "learning_rate": 1.9999203729797887e-05,
+ "loss": 2.0522,
+ "step": 1244
+ },
+ {
+ "epoch": 3.3923705722070845,
+ "grad_norm": 10.742246627807617,
+ "learning_rate": 1.9999192554362777e-05,
+ "loss": 2.0303,
+ "step": 1245
+ },
+ {
+ "epoch": 3.3950953678474116,
+ "grad_norm": 9.714658737182617,
+ "learning_rate": 1.999918130105428e-05,
+ "loss": 1.7964,
+ "step": 1246
+ },
+ {
+ "epoch": 3.3978201634877383,
+ "grad_norm": 12.210956573486328,
+ "learning_rate": 1.999916996987248e-05,
+ "loss": 1.9883,
+ "step": 1247
+ },
+ {
+ "epoch": 3.4005449591280654,
+ "grad_norm": 9.146660804748535,
+ "learning_rate": 1.9999158560817463e-05,
+ "loss": 1.7617,
+ "step": 1248
+ },
+ {
+ "epoch": 3.4032697547683926,
+ "grad_norm": 10.378352165222168,
+ "learning_rate": 1.9999147073889325e-05,
+ "loss": 2.0044,
+ "step": 1249
+ },
+ {
+ "epoch": 3.4059945504087192,
+ "grad_norm": 10.546966552734375,
+ "learning_rate": 1.999913550908815e-05,
+ "loss": 2.3315,
+ "step": 1250
+ },
+ {
+ "epoch": 3.4087193460490464,
+ "grad_norm": 10.025370597839355,
+ "learning_rate": 1.9999123866414026e-05,
+ "loss": 1.8623,
+ "step": 1251
+ },
+ {
+ "epoch": 3.4114441416893735,
+ "grad_norm": 11.024093627929688,
+ "learning_rate": 1.9999112145867055e-05,
+ "loss": 2.0156,
+ "step": 1252
+ },
+ {
+ "epoch": 3.4141689373297,
+ "grad_norm": 8.24333667755127,
+ "learning_rate": 1.9999100347447314e-05,
+ "loss": 1.8171,
+ "step": 1253
+ },
+ {
+ "epoch": 3.4168937329700273,
+ "grad_norm": 10.128952980041504,
+ "learning_rate": 1.9999088471154904e-05,
+ "loss": 2.0664,
+ "step": 1254
+ },
+ {
+ "epoch": 3.4196185286103544,
+ "grad_norm": 9.902071952819824,
+ "learning_rate": 1.999907651698991e-05,
+ "loss": 2.292,
+ "step": 1255
+ },
+ {
+ "epoch": 3.422343324250681,
+ "grad_norm": 10.431514739990234,
+ "learning_rate": 1.999906448495244e-05,
+ "loss": 1.9111,
+ "step": 1256
+ },
+ {
+ "epoch": 3.4250681198910082,
+ "grad_norm": 11.33655071258545,
+ "learning_rate": 1.999905237504257e-05,
+ "loss": 1.8418,
+ "step": 1257
+ },
+ {
+ "epoch": 3.4277929155313354,
+ "grad_norm": 12.280555725097656,
+ "learning_rate": 1.9999040187260403e-05,
+ "loss": 1.9412,
+ "step": 1258
+ },
+ {
+ "epoch": 3.430517711171662,
+ "grad_norm": 9.858194351196289,
+ "learning_rate": 1.9999027921606033e-05,
+ "loss": 1.9077,
+ "step": 1259
+ },
+ {
+ "epoch": 3.433242506811989,
+ "grad_norm": 13.029343605041504,
+ "learning_rate": 1.9999015578079553e-05,
+ "loss": 1.9226,
+ "step": 1260
+ },
+ {
+ "epoch": 3.4359673024523163,
+ "grad_norm": 10.973852157592773,
+ "learning_rate": 1.9999003156681066e-05,
+ "loss": 2.0513,
+ "step": 1261
+ },
+ {
+ "epoch": 3.438692098092643,
+ "grad_norm": 9.369585037231445,
+ "learning_rate": 1.999899065741066e-05,
+ "loss": 1.9302,
+ "step": 1262
+ },
+ {
+ "epoch": 3.44141689373297,
+ "grad_norm": 10.328851699829102,
+ "learning_rate": 1.999897808026844e-05,
+ "loss": 2.0688,
+ "step": 1263
+ },
+ {
+ "epoch": 3.4441416893732972,
+ "grad_norm": 11.273093223571777,
+ "learning_rate": 1.99989654252545e-05,
+ "loss": 1.9956,
+ "step": 1264
+ },
+ {
+ "epoch": 3.446866485013624,
+ "grad_norm": 9.876923561096191,
+ "learning_rate": 1.9998952692368937e-05,
+ "loss": 2.0557,
+ "step": 1265
+ },
+ {
+ "epoch": 3.449591280653951,
+ "grad_norm": 10.082348823547363,
+ "learning_rate": 1.9998939881611857e-05,
+ "loss": 1.8853,
+ "step": 1266
+ },
+ {
+ "epoch": 3.452316076294278,
+ "grad_norm": 11.63476848602295,
+ "learning_rate": 1.9998926992983348e-05,
+ "loss": 2.0076,
+ "step": 1267
+ },
+ {
+ "epoch": 3.455040871934605,
+ "grad_norm": 12.106552124023438,
+ "learning_rate": 1.9998914026483526e-05,
+ "loss": 1.8557,
+ "step": 1268
+ },
+ {
+ "epoch": 3.457765667574932,
+ "grad_norm": 12.849235534667969,
+ "learning_rate": 1.9998900982112475e-05,
+ "loss": 1.9768,
+ "step": 1269
+ },
+ {
+ "epoch": 3.460490463215259,
+ "grad_norm": 12.221293449401855,
+ "learning_rate": 1.999888785987031e-05,
+ "loss": 2.2651,
+ "step": 1270
+ },
+ {
+ "epoch": 3.463215258855586,
+ "grad_norm": 12.192943572998047,
+ "learning_rate": 1.9998874659757125e-05,
+ "loss": 2.1226,
+ "step": 1271
+ },
+ {
+ "epoch": 3.465940054495913,
+ "grad_norm": 12.493210792541504,
+ "learning_rate": 1.999886138177303e-05,
+ "loss": 1.8794,
+ "step": 1272
+ },
+ {
+ "epoch": 3.4686648501362396,
+ "grad_norm": 14.664477348327637,
+ "learning_rate": 1.999884802591812e-05,
+ "loss": 1.6948,
+ "step": 1273
+ },
+ {
+ "epoch": 3.4713896457765667,
+ "grad_norm": 12.013493537902832,
+ "learning_rate": 1.999883459219251e-05,
+ "loss": 2.0154,
+ "step": 1274
+ },
+ {
+ "epoch": 3.474114441416894,
+ "grad_norm": 10.768638610839844,
+ "learning_rate": 1.999882108059629e-05,
+ "loss": 1.9712,
+ "step": 1275
+ },
+ {
+ "epoch": 3.4768392370572205,
+ "grad_norm": 13.831929206848145,
+ "learning_rate": 1.9998807491129576e-05,
+ "loss": 1.8254,
+ "step": 1276
+ },
+ {
+ "epoch": 3.4795640326975477,
+ "grad_norm": 11.40987777709961,
+ "learning_rate": 1.9998793823792474e-05,
+ "loss": 2.1958,
+ "step": 1277
+ },
+ {
+ "epoch": 3.482288828337875,
+ "grad_norm": 9.788375854492188,
+ "learning_rate": 1.9998780078585085e-05,
+ "loss": 1.9473,
+ "step": 1278
+ },
+ {
+ "epoch": 3.4850136239782015,
+ "grad_norm": 11.829399108886719,
+ "learning_rate": 1.999876625550752e-05,
+ "loss": 1.9839,
+ "step": 1279
+ },
+ {
+ "epoch": 3.4877384196185286,
+ "grad_norm": 10.215336799621582,
+ "learning_rate": 1.999875235455988e-05,
+ "loss": 1.7559,
+ "step": 1280
+ },
+ {
+ "epoch": 3.4904632152588557,
+ "grad_norm": 13.019379615783691,
+ "learning_rate": 1.9998738375742283e-05,
+ "loss": 2.0889,
+ "step": 1281
+ },
+ {
+ "epoch": 3.4931880108991824,
+ "grad_norm": 10.324209213256836,
+ "learning_rate": 1.9998724319054836e-05,
+ "loss": 2.1416,
+ "step": 1282
+ },
+ {
+ "epoch": 3.4959128065395095,
+ "grad_norm": 10.5282621383667,
+ "learning_rate": 1.999871018449764e-05,
+ "loss": 1.7649,
+ "step": 1283
+ },
+ {
+ "epoch": 3.4986376021798367,
+ "grad_norm": 9.629287719726562,
+ "learning_rate": 1.9998695972070814e-05,
+ "loss": 1.7354,
+ "step": 1284
+ },
+ {
+ "epoch": 3.5013623978201633,
+ "grad_norm": 18.714492797851562,
+ "learning_rate": 1.9998681681774465e-05,
+ "loss": 1.7544,
+ "step": 1285
+ },
+ {
+ "epoch": 3.5040871934604905,
+ "grad_norm": 11.829867362976074,
+ "learning_rate": 1.9998667313608706e-05,
+ "loss": 1.8809,
+ "step": 1286
+ },
+ {
+ "epoch": 3.5068119891008176,
+ "grad_norm": 18.325145721435547,
+ "learning_rate": 1.9998652867573646e-05,
+ "loss": 1.856,
+ "step": 1287
+ },
+ {
+ "epoch": 3.5095367847411443,
+ "grad_norm": 16.493732452392578,
+ "learning_rate": 1.99986383436694e-05,
+ "loss": 2.0933,
+ "step": 1288
+ },
+ {
+ "epoch": 3.5122615803814714,
+ "grad_norm": 9.553417205810547,
+ "learning_rate": 1.9998623741896082e-05,
+ "loss": 2.0122,
+ "step": 1289
+ },
+ {
+ "epoch": 3.5149863760217985,
+ "grad_norm": 15.020279884338379,
+ "learning_rate": 1.99986090622538e-05,
+ "loss": 2.272,
+ "step": 1290
+ },
+ {
+ "epoch": 3.517711171662125,
+ "grad_norm": 8.37663459777832,
+ "learning_rate": 1.9998594304742677e-05,
+ "loss": 1.8589,
+ "step": 1291
+ },
+ {
+ "epoch": 3.5204359673024523,
+ "grad_norm": 12.794005393981934,
+ "learning_rate": 1.999857946936282e-05,
+ "loss": 1.917,
+ "step": 1292
+ },
+ {
+ "epoch": 3.523160762942779,
+ "grad_norm": 9.891209602355957,
+ "learning_rate": 1.999856455611435e-05,
+ "loss": 1.8281,
+ "step": 1293
+ },
+ {
+ "epoch": 3.525885558583106,
+ "grad_norm": 10.598015785217285,
+ "learning_rate": 1.999854956499738e-05,
+ "loss": 1.8079,
+ "step": 1294
+ },
+ {
+ "epoch": 3.5286103542234333,
+ "grad_norm": 9.42640209197998,
+ "learning_rate": 1.9998534496012026e-05,
+ "loss": 2.0293,
+ "step": 1295
+ },
+ {
+ "epoch": 3.53133514986376,
+ "grad_norm": 10.417404174804688,
+ "learning_rate": 1.999851934915841e-05,
+ "loss": 2.031,
+ "step": 1296
+ },
+ {
+ "epoch": 3.534059945504087,
+ "grad_norm": 11.727996826171875,
+ "learning_rate": 1.9998504124436647e-05,
+ "loss": 2.1621,
+ "step": 1297
+ },
+ {
+ "epoch": 3.536784741144414,
+ "grad_norm": 9.807804107666016,
+ "learning_rate": 1.9998488821846855e-05,
+ "loss": 1.7075,
+ "step": 1298
+ },
+ {
+ "epoch": 3.539509536784741,
+ "grad_norm": 9.008427619934082,
+ "learning_rate": 1.999847344138915e-05,
+ "loss": 1.9229,
+ "step": 1299
+ },
+ {
+ "epoch": 3.542234332425068,
+ "grad_norm": 11.610631942749023,
+ "learning_rate": 1.999845798306366e-05,
+ "loss": 1.7598,
+ "step": 1300
+ },
+ {
+ "epoch": 3.544959128065395,
+ "grad_norm": 13.851554870605469,
+ "learning_rate": 1.9998442446870503e-05,
+ "loss": 1.9463,
+ "step": 1301
+ },
+ {
+ "epoch": 3.547683923705722,
+ "grad_norm": 10.183866500854492,
+ "learning_rate": 1.9998426832809796e-05,
+ "loss": 1.9863,
+ "step": 1302
+ },
+ {
+ "epoch": 3.550408719346049,
+ "grad_norm": 10.200240135192871,
+ "learning_rate": 1.9998411140881662e-05,
+ "loss": 2.0298,
+ "step": 1303
+ },
+ {
+ "epoch": 3.553133514986376,
+ "grad_norm": 14.371204376220703,
+ "learning_rate": 1.9998395371086223e-05,
+ "loss": 2.1377,
+ "step": 1304
+ },
+ {
+ "epoch": 3.5558583106267028,
+ "grad_norm": 9.169516563415527,
+ "learning_rate": 1.9998379523423604e-05,
+ "loss": 1.8818,
+ "step": 1305
+ },
+ {
+ "epoch": 3.55858310626703,
+ "grad_norm": 10.059884071350098,
+ "learning_rate": 1.9998363597893927e-05,
+ "loss": 1.875,
+ "step": 1306
+ },
+ {
+ "epoch": 3.561307901907357,
+ "grad_norm": 13.294024467468262,
+ "learning_rate": 1.9998347594497314e-05,
+ "loss": 2.2129,
+ "step": 1307
+ },
+ {
+ "epoch": 3.5640326975476837,
+ "grad_norm": 10.252388000488281,
+ "learning_rate": 1.9998331513233894e-05,
+ "loss": 1.9248,
+ "step": 1308
+ },
+ {
+ "epoch": 3.566757493188011,
+ "grad_norm": 11.85957145690918,
+ "learning_rate": 1.9998315354103793e-05,
+ "loss": 1.9844,
+ "step": 1309
+ },
+ {
+ "epoch": 3.569482288828338,
+ "grad_norm": 12.752264022827148,
+ "learning_rate": 1.9998299117107128e-05,
+ "loss": 2.0601,
+ "step": 1310
+ },
+ {
+ "epoch": 3.5722070844686646,
+ "grad_norm": 10.488571166992188,
+ "learning_rate": 1.9998282802244032e-05,
+ "loss": 1.9507,
+ "step": 1311
+ },
+ {
+ "epoch": 3.5749318801089918,
+ "grad_norm": 9.606192588806152,
+ "learning_rate": 1.9998266409514634e-05,
+ "loss": 1.8174,
+ "step": 1312
+ },
+ {
+ "epoch": 3.577656675749319,
+ "grad_norm": 10.860569953918457,
+ "learning_rate": 1.9998249938919056e-05,
+ "loss": 1.8677,
+ "step": 1313
+ },
+ {
+ "epoch": 3.5803814713896456,
+ "grad_norm": 10.547423362731934,
+ "learning_rate": 1.9998233390457433e-05,
+ "loss": 1.9253,
+ "step": 1314
+ },
+ {
+ "epoch": 3.5831062670299727,
+ "grad_norm": 10.076347351074219,
+ "learning_rate": 1.9998216764129887e-05,
+ "loss": 2.1001,
+ "step": 1315
+ },
+ {
+ "epoch": 3.5858310626703,
+ "grad_norm": 10.426956176757812,
+ "learning_rate": 1.9998200059936554e-05,
+ "loss": 1.9341,
+ "step": 1316
+ },
+ {
+ "epoch": 3.5885558583106265,
+ "grad_norm": 9.54003620147705,
+ "learning_rate": 1.9998183277877555e-05,
+ "loss": 2.0928,
+ "step": 1317
+ },
+ {
+ "epoch": 3.5912806539509536,
+ "grad_norm": 10.653057098388672,
+ "learning_rate": 1.9998166417953034e-05,
+ "loss": 1.8672,
+ "step": 1318
+ },
+ {
+ "epoch": 3.5940054495912808,
+ "grad_norm": 9.184635162353516,
+ "learning_rate": 1.9998149480163108e-05,
+ "loss": 1.9121,
+ "step": 1319
+ },
+ {
+ "epoch": 3.5967302452316074,
+ "grad_norm": 12.25539779663086,
+ "learning_rate": 1.999813246450792e-05,
+ "loss": 1.9648,
+ "step": 1320
+ },
+ {
+ "epoch": 3.5994550408719346,
+ "grad_norm": 12.260258674621582,
+ "learning_rate": 1.9998115370987595e-05,
+ "loss": 2.0103,
+ "step": 1321
+ },
+ {
+ "epoch": 3.6021798365122617,
+ "grad_norm": 9.864540100097656,
+ "learning_rate": 1.9998098199602273e-05,
+ "loss": 1.7336,
+ "step": 1322
+ },
+ {
+ "epoch": 3.6049046321525884,
+ "grad_norm": 10.197954177856445,
+ "learning_rate": 1.999808095035208e-05,
+ "loss": 1.8735,
+ "step": 1323
+ },
+ {
+ "epoch": 3.6076294277929155,
+ "grad_norm": 12.28921127319336,
+ "learning_rate": 1.9998063623237156e-05,
+ "loss": 2.1064,
+ "step": 1324
+ },
+ {
+ "epoch": 3.6103542234332426,
+ "grad_norm": 11.340349197387695,
+ "learning_rate": 1.9998046218257636e-05,
+ "loss": 1.8403,
+ "step": 1325
+ },
+ {
+ "epoch": 3.6130790190735693,
+ "grad_norm": 11.287467002868652,
+ "learning_rate": 1.9998028735413653e-05,
+ "loss": 1.978,
+ "step": 1326
+ },
+ {
+ "epoch": 3.6158038147138964,
+ "grad_norm": 9.40659236907959,
+ "learning_rate": 1.9998011174705344e-05,
+ "loss": 1.6609,
+ "step": 1327
+ },
+ {
+ "epoch": 3.6185286103542236,
+ "grad_norm": 10.861719131469727,
+ "learning_rate": 1.9997993536132846e-05,
+ "loss": 1.9077,
+ "step": 1328
+ },
+ {
+ "epoch": 3.6212534059945503,
+ "grad_norm": 9.687219619750977,
+ "learning_rate": 1.9997975819696293e-05,
+ "loss": 1.9351,
+ "step": 1329
+ },
+ {
+ "epoch": 3.6239782016348774,
+ "grad_norm": 9.664878845214844,
+ "learning_rate": 1.9997958025395826e-05,
+ "loss": 1.7739,
+ "step": 1330
+ },
+ {
+ "epoch": 3.6267029972752045,
+ "grad_norm": 14.998048782348633,
+ "learning_rate": 1.999794015323159e-05,
+ "loss": 1.9653,
+ "step": 1331
+ },
+ {
+ "epoch": 3.629427792915531,
+ "grad_norm": 15.942357063293457,
+ "learning_rate": 1.9997922203203713e-05,
+ "loss": 1.9585,
+ "step": 1332
+ },
+ {
+ "epoch": 3.6321525885558583,
+ "grad_norm": 11.56669807434082,
+ "learning_rate": 1.999790417531234e-05,
+ "loss": 1.927,
+ "step": 1333
+ },
+ {
+ "epoch": 3.6348773841961854,
+ "grad_norm": 9.04844856262207,
+ "learning_rate": 1.999788606955761e-05,
+ "loss": 1.8101,
+ "step": 1334
+ },
+ {
+ "epoch": 3.637602179836512,
+ "grad_norm": 11.053104400634766,
+ "learning_rate": 1.9997867885939668e-05,
+ "loss": 1.7412,
+ "step": 1335
+ },
+ {
+ "epoch": 3.6403269754768393,
+ "grad_norm": 13.446556091308594,
+ "learning_rate": 1.999784962445865e-05,
+ "loss": 2.2373,
+ "step": 1336
+ },
+ {
+ "epoch": 3.6430517711171664,
+ "grad_norm": 9.99754810333252,
+ "learning_rate": 1.9997831285114704e-05,
+ "loss": 1.8184,
+ "step": 1337
+ },
+ {
+ "epoch": 3.645776566757493,
+ "grad_norm": 10.847136497497559,
+ "learning_rate": 1.9997812867907966e-05,
+ "loss": 1.812,
+ "step": 1338
+ },
+ {
+ "epoch": 3.64850136239782,
+ "grad_norm": 10.042104721069336,
+ "learning_rate": 1.9997794372838584e-05,
+ "loss": 1.9033,
+ "step": 1339
+ },
+ {
+ "epoch": 3.6512261580381473,
+ "grad_norm": 10.487390518188477,
+ "learning_rate": 1.9997775799906706e-05,
+ "loss": 1.875,
+ "step": 1340
+ },
+ {
+ "epoch": 3.653950953678474,
+ "grad_norm": 9.03159236907959,
+ "learning_rate": 1.9997757149112465e-05,
+ "loss": 1.8364,
+ "step": 1341
+ },
+ {
+ "epoch": 3.656675749318801,
+ "grad_norm": 9.386551856994629,
+ "learning_rate": 1.9997738420456015e-05,
+ "loss": 1.8049,
+ "step": 1342
+ },
+ {
+ "epoch": 3.6594005449591283,
+ "grad_norm": 13.503704071044922,
+ "learning_rate": 1.9997719613937505e-05,
+ "loss": 2.0244,
+ "step": 1343
+ },
+ {
+ "epoch": 3.662125340599455,
+ "grad_norm": 8.827006340026855,
+ "learning_rate": 1.9997700729557074e-05,
+ "loss": 1.8726,
+ "step": 1344
+ },
+ {
+ "epoch": 3.664850136239782,
+ "grad_norm": 7.889685153961182,
+ "learning_rate": 1.999768176731487e-05,
+ "loss": 1.8403,
+ "step": 1345
+ },
+ {
+ "epoch": 3.667574931880109,
+ "grad_norm": 11.514538764953613,
+ "learning_rate": 1.999766272721104e-05,
+ "loss": 1.9133,
+ "step": 1346
+ },
+ {
+ "epoch": 3.670299727520436,
+ "grad_norm": 9.46600341796875,
+ "learning_rate": 1.9997643609245738e-05,
+ "loss": 1.7549,
+ "step": 1347
+ },
+ {
+ "epoch": 3.673024523160763,
+ "grad_norm": 10.599994659423828,
+ "learning_rate": 1.9997624413419108e-05,
+ "loss": 1.8149,
+ "step": 1348
+ },
+ {
+ "epoch": 3.67574931880109,
+ "grad_norm": 14.27822208404541,
+ "learning_rate": 1.99976051397313e-05,
+ "loss": 1.9634,
+ "step": 1349
+ },
+ {
+ "epoch": 3.678474114441417,
+ "grad_norm": 10.638948440551758,
+ "learning_rate": 1.999758578818247e-05,
+ "loss": 1.8379,
+ "step": 1350
+ },
+ {
+ "epoch": 3.681198910081744,
+ "grad_norm": 11.049464225769043,
+ "learning_rate": 1.9997566358772755e-05,
+ "loss": 1.9204,
+ "step": 1351
+ },
+ {
+ "epoch": 3.683923705722071,
+ "grad_norm": 21.863615036010742,
+ "learning_rate": 1.9997546851502322e-05,
+ "loss": 1.8022,
+ "step": 1352
+ },
+ {
+ "epoch": 3.6866485013623977,
+ "grad_norm": 12.01803970336914,
+ "learning_rate": 1.999752726637131e-05,
+ "loss": 1.9214,
+ "step": 1353
+ },
+ {
+ "epoch": 3.689373297002725,
+ "grad_norm": 11.750845909118652,
+ "learning_rate": 1.9997507603379883e-05,
+ "loss": 1.9639,
+ "step": 1354
+ },
+ {
+ "epoch": 3.692098092643052,
+ "grad_norm": 11.37834358215332,
+ "learning_rate": 1.9997487862528186e-05,
+ "loss": 2.0659,
+ "step": 1355
+ },
+ {
+ "epoch": 3.6948228882833787,
+ "grad_norm": 11.896803855895996,
+ "learning_rate": 1.9997468043816376e-05,
+ "loss": 1.7285,
+ "step": 1356
+ },
+ {
+ "epoch": 3.697547683923706,
+ "grad_norm": 10.095005989074707,
+ "learning_rate": 1.9997448147244607e-05,
+ "loss": 2.0884,
+ "step": 1357
+ },
+ {
+ "epoch": 3.700272479564033,
+ "grad_norm": 9.361732482910156,
+ "learning_rate": 1.999742817281303e-05,
+ "loss": 1.9331,
+ "step": 1358
+ },
+ {
+ "epoch": 3.7029972752043596,
+ "grad_norm": 10.310089111328125,
+ "learning_rate": 1.999740812052181e-05,
+ "loss": 1.8679,
+ "step": 1359
+ },
+ {
+ "epoch": 3.7057220708446867,
+ "grad_norm": 9.957247734069824,
+ "learning_rate": 1.9997387990371092e-05,
+ "loss": 1.8501,
+ "step": 1360
+ },
+ {
+ "epoch": 3.708446866485014,
+ "grad_norm": 9.856657028198242,
+ "learning_rate": 1.9997367782361042e-05,
+ "loss": 2.0308,
+ "step": 1361
+ },
+ {
+ "epoch": 3.7111716621253406,
+ "grad_norm": 8.72819709777832,
+ "learning_rate": 1.9997347496491812e-05,
+ "loss": 1.9629,
+ "step": 1362
+ },
+ {
+ "epoch": 3.7138964577656677,
+ "grad_norm": 9.658805847167969,
+ "learning_rate": 1.999732713276356e-05,
+ "loss": 1.9346,
+ "step": 1363
+ },
+ {
+ "epoch": 3.716621253405995,
+ "grad_norm": 12.807863235473633,
+ "learning_rate": 1.9997306691176448e-05,
+ "loss": 1.8555,
+ "step": 1364
+ },
+ {
+ "epoch": 3.7193460490463215,
+ "grad_norm": 8.534314155578613,
+ "learning_rate": 1.9997286171730632e-05,
+ "loss": 1.8364,
+ "step": 1365
+ },
+ {
+ "epoch": 3.7220708446866486,
+ "grad_norm": 8.962367057800293,
+ "learning_rate": 1.9997265574426276e-05,
+ "loss": 1.5764,
+ "step": 1366
+ },
+ {
+ "epoch": 3.7247956403269757,
+ "grad_norm": 12.41026782989502,
+ "learning_rate": 1.9997244899263536e-05,
+ "loss": 2.0601,
+ "step": 1367
+ },
+ {
+ "epoch": 3.7275204359673024,
+ "grad_norm": 11.09547233581543,
+ "learning_rate": 1.999722414624257e-05,
+ "loss": 1.9697,
+ "step": 1368
+ },
+ {
+ "epoch": 3.7302452316076296,
+ "grad_norm": 10.84226131439209,
+ "learning_rate": 1.999720331536355e-05,
+ "loss": 2.1177,
+ "step": 1369
+ },
+ {
+ "epoch": 3.7329700272479567,
+ "grad_norm": 10.707548141479492,
+ "learning_rate": 1.999718240662663e-05,
+ "loss": 1.9673,
+ "step": 1370
+ },
+ {
+ "epoch": 3.7356948228882834,
+ "grad_norm": 8.57364273071289,
+ "learning_rate": 1.9997161420031975e-05,
+ "loss": 1.9062,
+ "step": 1371
+ },
+ {
+ "epoch": 3.7384196185286105,
+ "grad_norm": 10.687947273254395,
+ "learning_rate": 1.999714035557975e-05,
+ "loss": 1.9863,
+ "step": 1372
+ },
+ {
+ "epoch": 3.741144414168937,
+ "grad_norm": 18.90679931640625,
+ "learning_rate": 1.9997119213270117e-05,
+ "loss": 1.9587,
+ "step": 1373
+ },
+ {
+ "epoch": 3.7438692098092643,
+ "grad_norm": 11.410531997680664,
+ "learning_rate": 1.999709799310324e-05,
+ "loss": 1.8726,
+ "step": 1374
+ },
+ {
+ "epoch": 3.7465940054495914,
+ "grad_norm": 10.942984580993652,
+ "learning_rate": 1.999707669507929e-05,
+ "loss": 1.9067,
+ "step": 1375
+ },
+ {
+ "epoch": 3.749318801089918,
+ "grad_norm": 9.907876968383789,
+ "learning_rate": 1.9997055319198422e-05,
+ "loss": 1.9297,
+ "step": 1376
+ },
+ {
+ "epoch": 3.7520435967302452,
+ "grad_norm": 13.171777725219727,
+ "learning_rate": 1.9997033865460812e-05,
+ "loss": 1.7925,
+ "step": 1377
+ },
+ {
+ "epoch": 3.7547683923705724,
+ "grad_norm": 10.019922256469727,
+ "learning_rate": 1.9997012333866623e-05,
+ "loss": 1.8657,
+ "step": 1378
+ },
+ {
+ "epoch": 3.757493188010899,
+ "grad_norm": 9.188364028930664,
+ "learning_rate": 1.9996990724416022e-05,
+ "loss": 1.8369,
+ "step": 1379
+ },
+ {
+ "epoch": 3.760217983651226,
+ "grad_norm": 12.900765419006348,
+ "learning_rate": 1.9996969037109185e-05,
+ "loss": 1.8818,
+ "step": 1380
+ },
+ {
+ "epoch": 3.7629427792915533,
+ "grad_norm": 9.810148239135742,
+ "learning_rate": 1.999694727194627e-05,
+ "loss": 1.6636,
+ "step": 1381
+ },
+ {
+ "epoch": 3.76566757493188,
+ "grad_norm": 12.080660820007324,
+ "learning_rate": 1.9996925428927456e-05,
+ "loss": 1.9839,
+ "step": 1382
+ },
+ {
+ "epoch": 3.768392370572207,
+ "grad_norm": 10.132020950317383,
+ "learning_rate": 1.9996903508052903e-05,
+ "loss": 1.8198,
+ "step": 1383
+ },
+ {
+ "epoch": 3.771117166212534,
+ "grad_norm": 10.986047744750977,
+ "learning_rate": 1.999688150932279e-05,
+ "loss": 1.873,
+ "step": 1384
+ },
+ {
+ "epoch": 3.773841961852861,
+ "grad_norm": 11.753776550292969,
+ "learning_rate": 1.9996859432737287e-05,
+ "loss": 1.9746,
+ "step": 1385
+ },
+ {
+ "epoch": 3.776566757493188,
+ "grad_norm": 9.40007209777832,
+ "learning_rate": 1.999683727829656e-05,
+ "loss": 1.7588,
+ "step": 1386
+ },
+ {
+ "epoch": 3.7792915531335147,
+ "grad_norm": 10.014466285705566,
+ "learning_rate": 1.999681504600079e-05,
+ "loss": 1.8784,
+ "step": 1387
+ },
+ {
+ "epoch": 3.782016348773842,
+ "grad_norm": 12.4912109375,
+ "learning_rate": 1.9996792735850145e-05,
+ "loss": 1.9907,
+ "step": 1388
+ },
+ {
+ "epoch": 3.784741144414169,
+ "grad_norm": 19.946182250976562,
+ "learning_rate": 1.99967703478448e-05,
+ "loss": 1.7798,
+ "step": 1389
+ },
+ {
+ "epoch": 3.7874659400544957,
+ "grad_norm": 14.574756622314453,
+ "learning_rate": 1.9996747881984928e-05,
+ "loss": 1.9358,
+ "step": 1390
+ },
+ {
+ "epoch": 3.790190735694823,
+ "grad_norm": 9.037312507629395,
+ "learning_rate": 1.9996725338270705e-05,
+ "loss": 2.0122,
+ "step": 1391
+ },
+ {
+ "epoch": 3.79291553133515,
+ "grad_norm": 11.350050926208496,
+ "learning_rate": 1.999670271670231e-05,
+ "loss": 1.834,
+ "step": 1392
+ },
+ {
+ "epoch": 3.7956403269754766,
+ "grad_norm": 9.058762550354004,
+ "learning_rate": 1.9996680017279916e-05,
+ "loss": 1.7659,
+ "step": 1393
+ },
+ {
+ "epoch": 3.7983651226158037,
+ "grad_norm": 9.022266387939453,
+ "learning_rate": 1.9996657240003692e-05,
+ "loss": 1.6792,
+ "step": 1394
+ },
+ {
+ "epoch": 3.801089918256131,
+ "grad_norm": 12.156946182250977,
+ "learning_rate": 1.9996634384873832e-05,
+ "loss": 1.7554,
+ "step": 1395
+ },
+ {
+ "epoch": 3.8038147138964575,
+ "grad_norm": 10.579151153564453,
+ "learning_rate": 1.9996611451890503e-05,
+ "loss": 1.8132,
+ "step": 1396
+ },
+ {
+ "epoch": 3.8065395095367847,
+ "grad_norm": 14.65162181854248,
+ "learning_rate": 1.9996588441053886e-05,
+ "loss": 2.0186,
+ "step": 1397
+ },
+ {
+ "epoch": 3.809264305177112,
+ "grad_norm": 9.863320350646973,
+ "learning_rate": 1.9996565352364156e-05,
+ "loss": 1.9731,
+ "step": 1398
+ },
+ {
+ "epoch": 3.8119891008174385,
+ "grad_norm": 13.058857917785645,
+ "learning_rate": 1.99965421858215e-05,
+ "loss": 1.9751,
+ "step": 1399
+ },
+ {
+ "epoch": 3.8147138964577656,
+ "grad_norm": 9.648780822753906,
+ "learning_rate": 1.9996518941426096e-05,
+ "loss": 1.9312,
+ "step": 1400
+ },
+ {
+ "epoch": 3.8174386920980927,
+ "grad_norm": 10.973150253295898,
+ "learning_rate": 1.9996495619178124e-05,
+ "loss": 1.9189,
+ "step": 1401
+ },
+ {
+ "epoch": 3.8201634877384194,
+ "grad_norm": 8.606739044189453,
+ "learning_rate": 1.999647221907776e-05,
+ "loss": 1.9082,
+ "step": 1402
+ },
+ {
+ "epoch": 3.8228882833787465,
+ "grad_norm": 11.51412582397461,
+ "learning_rate": 1.99964487411252e-05,
+ "loss": 1.9651,
+ "step": 1403
+ },
+ {
+ "epoch": 3.8256130790190737,
+ "grad_norm": 10.558756828308105,
+ "learning_rate": 1.9996425185320616e-05,
+ "loss": 1.9688,
+ "step": 1404
+ },
+ {
+ "epoch": 3.8283378746594003,
+ "grad_norm": 9.094059944152832,
+ "learning_rate": 1.9996401551664197e-05,
+ "loss": 1.7271,
+ "step": 1405
+ },
+ {
+ "epoch": 3.8310626702997275,
+ "grad_norm": 11.738804817199707,
+ "learning_rate": 1.999637784015612e-05,
+ "loss": 1.8857,
+ "step": 1406
+ },
+ {
+ "epoch": 3.8337874659400546,
+ "grad_norm": 11.302565574645996,
+ "learning_rate": 1.9996354050796577e-05,
+ "loss": 1.7378,
+ "step": 1407
+ },
+ {
+ "epoch": 3.8365122615803813,
+ "grad_norm": 11.154184341430664,
+ "learning_rate": 1.9996330183585747e-05,
+ "loss": 1.9048,
+ "step": 1408
+ },
+ {
+ "epoch": 3.8392370572207084,
+ "grad_norm": 12.222970008850098,
+ "learning_rate": 1.999630623852382e-05,
+ "loss": 1.9839,
+ "step": 1409
+ },
+ {
+ "epoch": 3.8419618528610355,
+ "grad_norm": 7.918453216552734,
+ "learning_rate": 1.9996282215610984e-05,
+ "loss": 1.6953,
+ "step": 1410
+ },
+ {
+ "epoch": 3.844686648501362,
+ "grad_norm": 10.142660140991211,
+ "learning_rate": 1.9996258114847427e-05,
+ "loss": 1.7627,
+ "step": 1411
+ },
+ {
+ "epoch": 3.8474114441416893,
+ "grad_norm": 10.53038501739502,
+ "learning_rate": 1.999623393623333e-05,
+ "loss": 2.0444,
+ "step": 1412
+ },
+ {
+ "epoch": 3.8501362397820165,
+ "grad_norm": 15.396425247192383,
+ "learning_rate": 1.999620967976888e-05,
+ "loss": 1.8823,
+ "step": 1413
+ },
+ {
+ "epoch": 3.852861035422343,
+ "grad_norm": 11.912347793579102,
+ "learning_rate": 1.999618534545428e-05,
+ "loss": 1.7593,
+ "step": 1414
+ },
+ {
+ "epoch": 3.8555858310626703,
+ "grad_norm": 9.395650863647461,
+ "learning_rate": 1.9996160933289704e-05,
+ "loss": 1.9619,
+ "step": 1415
+ },
+ {
+ "epoch": 3.8583106267029974,
+ "grad_norm": 14.379075050354004,
+ "learning_rate": 1.999613644327535e-05,
+ "loss": 1.729,
+ "step": 1416
+ },
+ {
+ "epoch": 3.861035422343324,
+ "grad_norm": 10.086915969848633,
+ "learning_rate": 1.9996111875411407e-05,
+ "loss": 1.9634,
+ "step": 1417
+ },
+ {
+ "epoch": 3.863760217983651,
+ "grad_norm": 10.041367530822754,
+ "learning_rate": 1.9996087229698064e-05,
+ "loss": 1.8315,
+ "step": 1418
+ },
+ {
+ "epoch": 3.8664850136239783,
+ "grad_norm": 9.252388954162598,
+ "learning_rate": 1.9996062506135518e-05,
+ "loss": 1.6943,
+ "step": 1419
+ },
+ {
+ "epoch": 3.869209809264305,
+ "grad_norm": 14.204264640808105,
+ "learning_rate": 1.999603770472396e-05,
+ "loss": 1.6887,
+ "step": 1420
+ },
+ {
+ "epoch": 3.871934604904632,
+ "grad_norm": 9.889179229736328,
+ "learning_rate": 1.999601282546358e-05,
+ "loss": 1.9517,
+ "step": 1421
+ },
+ {
+ "epoch": 3.8746594005449593,
+ "grad_norm": 12.913715362548828,
+ "learning_rate": 1.9995987868354577e-05,
+ "loss": 1.998,
+ "step": 1422
+ },
+ {
+ "epoch": 3.877384196185286,
+ "grad_norm": 11.989314079284668,
+ "learning_rate": 1.999596283339714e-05,
+ "loss": 1.9199,
+ "step": 1423
+ },
+ {
+ "epoch": 3.880108991825613,
+ "grad_norm": 11.67672061920166,
+ "learning_rate": 1.9995937720591464e-05,
+ "loss": 1.9343,
+ "step": 1424
+ },
+ {
+ "epoch": 3.88283378746594,
+ "grad_norm": 14.26172924041748,
+ "learning_rate": 1.999591252993775e-05,
+ "loss": 1.8789,
+ "step": 1425
+ },
+ {
+ "epoch": 3.885558583106267,
+ "grad_norm": 13.25046157836914,
+ "learning_rate": 1.9995887261436188e-05,
+ "loss": 1.9683,
+ "step": 1426
+ },
+ {
+ "epoch": 3.888283378746594,
+ "grad_norm": 15.621968269348145,
+ "learning_rate": 1.999586191508698e-05,
+ "loss": 1.7803,
+ "step": 1427
+ },
+ {
+ "epoch": 3.891008174386921,
+ "grad_norm": 12.299283027648926,
+ "learning_rate": 1.999583649089032e-05,
+ "loss": 1.9829,
+ "step": 1428
+ },
+ {
+ "epoch": 3.893732970027248,
+ "grad_norm": 14.862947463989258,
+ "learning_rate": 1.999581098884641e-05,
+ "loss": 1.7683,
+ "step": 1429
+ },
+ {
+ "epoch": 3.896457765667575,
+ "grad_norm": 8.998908042907715,
+ "learning_rate": 1.999578540895544e-05,
+ "loss": 1.8333,
+ "step": 1430
+ },
+ {
+ "epoch": 3.899182561307902,
+ "grad_norm": 10.61571979522705,
+ "learning_rate": 1.9995759751217617e-05,
+ "loss": 1.9771,
+ "step": 1431
+ },
+ {
+ "epoch": 3.9019073569482288,
+ "grad_norm": 14.07432746887207,
+ "learning_rate": 1.999573401563314e-05,
+ "loss": 1.8696,
+ "step": 1432
+ },
+ {
+ "epoch": 3.904632152588556,
+ "grad_norm": 13.334297180175781,
+ "learning_rate": 1.9995708202202212e-05,
+ "loss": 1.7495,
+ "step": 1433
+ },
+ {
+ "epoch": 3.907356948228883,
+ "grad_norm": 14.014077186584473,
+ "learning_rate": 1.9995682310925025e-05,
+ "loss": 2.0635,
+ "step": 1434
+ },
+ {
+ "epoch": 3.9100817438692097,
+ "grad_norm": 14.566712379455566,
+ "learning_rate": 1.9995656341801788e-05,
+ "loss": 1.832,
+ "step": 1435
+ },
+ {
+ "epoch": 3.912806539509537,
+ "grad_norm": 15.380060195922852,
+ "learning_rate": 1.9995630294832698e-05,
+ "loss": 1.9287,
+ "step": 1436
+ },
+ {
+ "epoch": 3.915531335149864,
+ "grad_norm": 13.439238548278809,
+ "learning_rate": 1.9995604170017967e-05,
+ "loss": 1.7549,
+ "step": 1437
+ },
+ {
+ "epoch": 3.9182561307901906,
+ "grad_norm": 14.134620666503906,
+ "learning_rate": 1.9995577967357788e-05,
+ "loss": 2.042,
+ "step": 1438
+ },
+ {
+ "epoch": 3.9209809264305178,
+ "grad_norm": 10.96253490447998,
+ "learning_rate": 1.999555168685237e-05,
+ "loss": 1.7932,
+ "step": 1439
+ },
+ {
+ "epoch": 3.923705722070845,
+ "grad_norm": 12.898005485534668,
+ "learning_rate": 1.999552532850192e-05,
+ "loss": 2.0718,
+ "step": 1440
+ },
+ {
+ "epoch": 3.9264305177111716,
+ "grad_norm": 13.486254692077637,
+ "learning_rate": 1.9995498892306634e-05,
+ "loss": 1.7651,
+ "step": 1441
+ },
+ {
+ "epoch": 3.9291553133514987,
+ "grad_norm": 17.048885345458984,
+ "learning_rate": 1.999547237826673e-05,
+ "loss": 1.605,
+ "step": 1442
+ },
+ {
+ "epoch": 3.931880108991826,
+ "grad_norm": 11.592516899108887,
+ "learning_rate": 1.9995445786382408e-05,
+ "loss": 1.853,
+ "step": 1443
+ },
+ {
+ "epoch": 3.9346049046321525,
+ "grad_norm": 11.45778751373291,
+ "learning_rate": 1.9995419116653876e-05,
+ "loss": 1.8711,
+ "step": 1444
+ },
+ {
+ "epoch": 3.9373297002724796,
+ "grad_norm": 13.221013069152832,
+ "learning_rate": 1.999539236908134e-05,
+ "loss": 2.1187,
+ "step": 1445
+ },
+ {
+ "epoch": 3.9400544959128068,
+ "grad_norm": 11.306771278381348,
+ "learning_rate": 1.999536554366501e-05,
+ "loss": 1.9995,
+ "step": 1446
+ },
+ {
+ "epoch": 3.9427792915531334,
+ "grad_norm": 13.746538162231445,
+ "learning_rate": 1.9995338640405096e-05,
+ "loss": 1.9072,
+ "step": 1447
+ },
+ {
+ "epoch": 3.9455040871934606,
+ "grad_norm": 9.49048900604248,
+ "learning_rate": 1.9995311659301804e-05,
+ "loss": 1.7983,
+ "step": 1448
+ },
+ {
+ "epoch": 3.9482288828337877,
+ "grad_norm": 9.7013578414917,
+ "learning_rate": 1.9995284600355348e-05,
+ "loss": 1.8359,
+ "step": 1449
+ },
+ {
+ "epoch": 3.9509536784741144,
+ "grad_norm": 11.810276985168457,
+ "learning_rate": 1.9995257463565937e-05,
+ "loss": 1.5774,
+ "step": 1450
+ },
+ {
+ "epoch": 3.9536784741144415,
+ "grad_norm": 12.751311302185059,
+ "learning_rate": 1.9995230248933784e-05,
+ "loss": 1.7988,
+ "step": 1451
+ },
+ {
+ "epoch": 3.9564032697547686,
+ "grad_norm": 11.19675064086914,
+ "learning_rate": 1.99952029564591e-05,
+ "loss": 1.8022,
+ "step": 1452
+ },
+ {
+ "epoch": 3.9591280653950953,
+ "grad_norm": 12.150336265563965,
+ "learning_rate": 1.9995175586142096e-05,
+ "loss": 2.0386,
+ "step": 1453
+ },
+ {
+ "epoch": 3.9618528610354224,
+ "grad_norm": 12.408337593078613,
+ "learning_rate": 1.9995148137982984e-05,
+ "loss": 1.8091,
+ "step": 1454
+ },
+ {
+ "epoch": 3.9645776566757496,
+ "grad_norm": 13.837706565856934,
+ "learning_rate": 1.9995120611981984e-05,
+ "loss": 1.98,
+ "step": 1455
+ },
+ {
+ "epoch": 3.9673024523160763,
+ "grad_norm": 10.49660587310791,
+ "learning_rate": 1.9995093008139304e-05,
+ "loss": 1.6807,
+ "step": 1456
+ },
+ {
+ "epoch": 3.9700272479564034,
+ "grad_norm": 11.55453872680664,
+ "learning_rate": 1.999506532645516e-05,
+ "loss": 1.9268,
+ "step": 1457
+ },
+ {
+ "epoch": 3.9727520435967305,
+ "grad_norm": 9.677781105041504,
+ "learning_rate": 1.9995037566929772e-05,
+ "loss": 1.9014,
+ "step": 1458
+ },
+ {
+ "epoch": 3.975476839237057,
+ "grad_norm": 10.551101684570312,
+ "learning_rate": 1.999500972956335e-05,
+ "loss": 1.6968,
+ "step": 1459
+ },
+ {
+ "epoch": 3.9782016348773843,
+ "grad_norm": 16.66094398498535,
+ "learning_rate": 1.9994981814356116e-05,
+ "loss": 1.7231,
+ "step": 1460
+ },
+ {
+ "epoch": 3.9809264305177114,
+ "grad_norm": 11.6234712600708,
+ "learning_rate": 1.9994953821308284e-05,
+ "loss": 1.7451,
+ "step": 1461
+ },
+ {
+ "epoch": 3.983651226158038,
+ "grad_norm": 13.92747688293457,
+ "learning_rate": 1.9994925750420077e-05,
+ "loss": 1.8594,
+ "step": 1462
+ },
+ {
+ "epoch": 3.9863760217983653,
+ "grad_norm": 9.083030700683594,
+ "learning_rate": 1.9994897601691706e-05,
+ "loss": 1.7178,
+ "step": 1463
+ },
+ {
+ "epoch": 3.989100817438692,
+ "grad_norm": 11.762439727783203,
+ "learning_rate": 1.9994869375123397e-05,
+ "loss": 1.7671,
+ "step": 1464
+ },
+ {
+ "epoch": 3.991825613079019,
+ "grad_norm": 37.79829025268555,
+ "learning_rate": 1.9994841070715365e-05,
+ "loss": 1.9292,
+ "step": 1465
+ },
+ {
+ "epoch": 3.994550408719346,
+ "grad_norm": 9.897245407104492,
+ "learning_rate": 1.999481268846783e-05,
+ "loss": 1.7383,
+ "step": 1466
+ },
+ {
+ "epoch": 3.997275204359673,
+ "grad_norm": 13.566228866577148,
+ "learning_rate": 1.9994784228381018e-05,
+ "loss": 1.9771,
+ "step": 1467
+ },
+ {
+ "epoch": 4.0,
+ "grad_norm": 16.183984756469727,
+ "learning_rate": 1.9994755690455154e-05,
+ "loss": 1.8462,
+ "step": 1468
+ },
+ {
+ "epoch": 4.002724795640327,
+ "grad_norm": 12.495182991027832,
+ "learning_rate": 1.9994727074690444e-05,
+ "loss": 1.8105,
+ "step": 1469
+ },
+ {
+ "epoch": 4.005449591280654,
+ "grad_norm": 11.816779136657715,
+ "learning_rate": 1.9994698381087128e-05,
+ "loss": 1.8804,
+ "step": 1470
+ },
+ {
+ "epoch": 4.008174386920981,
+ "grad_norm": 17.457576751708984,
+ "learning_rate": 1.999466960964542e-05,
+ "loss": 1.8481,
+ "step": 1471
+ },
+ {
+ "epoch": 4.010899182561308,
+ "grad_norm": 12.753191947937012,
+ "learning_rate": 1.9994640760365545e-05,
+ "loss": 1.9683,
+ "step": 1472
+ },
+ {
+ "epoch": 4.013623978201635,
+ "grad_norm": 10.090810775756836,
+ "learning_rate": 1.9994611833247733e-05,
+ "loss": 1.5667,
+ "step": 1473
+ },
+ {
+ "epoch": 4.016348773841962,
+ "grad_norm": 14.633957862854004,
+ "learning_rate": 1.9994582828292205e-05,
+ "loss": 1.6045,
+ "step": 1474
+ },
+ {
+ "epoch": 4.0190735694822886,
+ "grad_norm": 8.889056205749512,
+ "learning_rate": 1.9994553745499187e-05,
+ "loss": 1.8618,
+ "step": 1475
+ },
+ {
+ "epoch": 4.021798365122616,
+ "grad_norm": 13.44864559173584,
+ "learning_rate": 1.9994524584868907e-05,
+ "loss": 1.8105,
+ "step": 1476
+ },
+ {
+ "epoch": 4.024523160762943,
+ "grad_norm": 10.613789558410645,
+ "learning_rate": 1.999449534640159e-05,
+ "loss": 1.8403,
+ "step": 1477
+ },
+ {
+ "epoch": 4.0272479564032695,
+ "grad_norm": 12.439909934997559,
+ "learning_rate": 1.9994466030097466e-05,
+ "loss": 1.7319,
+ "step": 1478
+ },
+ {
+ "epoch": 4.029972752043597,
+ "grad_norm": 9.766961097717285,
+ "learning_rate": 1.9994436635956763e-05,
+ "loss": 1.8823,
+ "step": 1479
+ },
+ {
+ "epoch": 4.032697547683924,
+ "grad_norm": 11.173598289489746,
+ "learning_rate": 1.999440716397971e-05,
+ "loss": 1.895,
+ "step": 1480
+ },
+ {
+ "epoch": 4.03542234332425,
+ "grad_norm": 9.04456615447998,
+ "learning_rate": 1.999437761416653e-05,
+ "loss": 1.8838,
+ "step": 1481
+ },
+ {
+ "epoch": 4.038147138964578,
+ "grad_norm": 11.515022277832031,
+ "learning_rate": 1.9994347986517462e-05,
+ "loss": 1.9326,
+ "step": 1482
+ },
+ {
+ "epoch": 4.040871934604905,
+ "grad_norm": 13.177966117858887,
+ "learning_rate": 1.9994318281032733e-05,
+ "loss": 1.8623,
+ "step": 1483
+ },
+ {
+ "epoch": 4.043596730245231,
+ "grad_norm": 10.89008617401123,
+ "learning_rate": 1.9994288497712575e-05,
+ "loss": 2.1519,
+ "step": 1484
+ },
+ {
+ "epoch": 4.046321525885559,
+ "grad_norm": 11.134393692016602,
+ "learning_rate": 1.999425863655722e-05,
+ "loss": 1.8154,
+ "step": 1485
+ },
+ {
+ "epoch": 4.049046321525886,
+ "grad_norm": 13.724608421325684,
+ "learning_rate": 1.9994228697566905e-05,
+ "loss": 1.7354,
+ "step": 1486
+ },
+ {
+ "epoch": 4.051771117166212,
+ "grad_norm": 9.587696075439453,
+ "learning_rate": 1.999419868074185e-05,
+ "loss": 1.9072,
+ "step": 1487
+ },
+ {
+ "epoch": 4.05449591280654,
+ "grad_norm": 15.846437454223633,
+ "learning_rate": 1.9994168586082305e-05,
+ "loss": 1.658,
+ "step": 1488
+ },
+ {
+ "epoch": 4.0572207084468666,
+ "grad_norm": 9.667086601257324,
+ "learning_rate": 1.999413841358849e-05,
+ "loss": 1.7827,
+ "step": 1489
+ },
+ {
+ "epoch": 4.059945504087193,
+ "grad_norm": 19.252283096313477,
+ "learning_rate": 1.999410816326065e-05,
+ "loss": 1.5791,
+ "step": 1490
+ },
+ {
+ "epoch": 4.062670299727521,
+ "grad_norm": 9.600749015808105,
+ "learning_rate": 1.999407783509902e-05,
+ "loss": 1.8931,
+ "step": 1491
+ },
+ {
+ "epoch": 4.0653950953678475,
+ "grad_norm": 8.026127815246582,
+ "learning_rate": 1.9994047429103832e-05,
+ "loss": 1.6411,
+ "step": 1492
+ },
+ {
+ "epoch": 4.068119891008174,
+ "grad_norm": 11.90536117553711,
+ "learning_rate": 1.9994016945275324e-05,
+ "loss": 1.9187,
+ "step": 1493
+ },
+ {
+ "epoch": 4.070844686648502,
+ "grad_norm": 10.286707878112793,
+ "learning_rate": 1.999398638361373e-05,
+ "loss": 1.7402,
+ "step": 1494
+ },
+ {
+ "epoch": 4.073569482288828,
+ "grad_norm": 11.354410171508789,
+ "learning_rate": 1.9993955744119297e-05,
+ "loss": 1.7849,
+ "step": 1495
+ },
+ {
+ "epoch": 4.076294277929155,
+ "grad_norm": 11.293846130371094,
+ "learning_rate": 1.9993925026792252e-05,
+ "loss": 1.8325,
+ "step": 1496
+ },
+ {
+ "epoch": 4.079019073569483,
+ "grad_norm": 9.793984413146973,
+ "learning_rate": 1.9993894231632847e-05,
+ "loss": 1.9243,
+ "step": 1497
+ },
+ {
+ "epoch": 4.081743869209809,
+ "grad_norm": 11.538467407226562,
+ "learning_rate": 1.9993863358641313e-05,
+ "loss": 1.7949,
+ "step": 1498
+ },
+ {
+ "epoch": 4.084468664850136,
+ "grad_norm": 9.210892677307129,
+ "learning_rate": 1.9993832407817893e-05,
+ "loss": 1.6348,
+ "step": 1499
+ },
+ {
+ "epoch": 4.087193460490464,
+ "grad_norm": 9.606528282165527,
+ "learning_rate": 1.999380137916283e-05,
+ "loss": 1.8218,
+ "step": 1500
+ },
+ {
+ "epoch": 4.08991825613079,
+ "grad_norm": 12.650059700012207,
+ "learning_rate": 1.9993770272676358e-05,
+ "loss": 1.8882,
+ "step": 1501
+ },
+ {
+ "epoch": 4.092643051771117,
+ "grad_norm": 11.155830383300781,
+ "learning_rate": 1.9993739088358728e-05,
+ "loss": 1.7227,
+ "step": 1502
+ },
+ {
+ "epoch": 4.0953678474114446,
+ "grad_norm": 11.9778413772583,
+ "learning_rate": 1.999370782621018e-05,
+ "loss": 1.9614,
+ "step": 1503
+ },
+ {
+ "epoch": 4.098092643051771,
+ "grad_norm": 16.51782989501953,
+ "learning_rate": 1.9993676486230958e-05,
+ "loss": 1.8359,
+ "step": 1504
+ },
+ {
+ "epoch": 4.100817438692098,
+ "grad_norm": 11.23696231842041,
+ "learning_rate": 1.99936450684213e-05,
+ "loss": 1.7964,
+ "step": 1505
+ },
+ {
+ "epoch": 4.1035422343324255,
+ "grad_norm": 12.84441089630127,
+ "learning_rate": 1.9993613572781463e-05,
+ "loss": 1.6553,
+ "step": 1506
+ },
+ {
+ "epoch": 4.106267029972752,
+ "grad_norm": 9.473592758178711,
+ "learning_rate": 1.9993581999311683e-05,
+ "loss": 1.7896,
+ "step": 1507
+ },
+ {
+ "epoch": 4.108991825613079,
+ "grad_norm": 16.464216232299805,
+ "learning_rate": 1.9993550348012202e-05,
+ "loss": 1.8044,
+ "step": 1508
+ },
+ {
+ "epoch": 4.111716621253406,
+ "grad_norm": 19.52264976501465,
+ "learning_rate": 1.9993518618883278e-05,
+ "loss": 1.6797,
+ "step": 1509
+ },
+ {
+ "epoch": 4.114441416893733,
+ "grad_norm": 15.042317390441895,
+ "learning_rate": 1.9993486811925152e-05,
+ "loss": 1.9888,
+ "step": 1510
+ },
+ {
+ "epoch": 4.11716621253406,
+ "grad_norm": 11.100996971130371,
+ "learning_rate": 1.9993454927138075e-05,
+ "loss": 1.7837,
+ "step": 1511
+ },
+ {
+ "epoch": 4.1198910081743865,
+ "grad_norm": 13.300409317016602,
+ "learning_rate": 1.999342296452229e-05,
+ "loss": 1.9468,
+ "step": 1512
+ },
+ {
+ "epoch": 4.122615803814714,
+ "grad_norm": 13.411114692687988,
+ "learning_rate": 1.9993390924078048e-05,
+ "loss": 1.7124,
+ "step": 1513
+ },
+ {
+ "epoch": 4.125340599455041,
+ "grad_norm": 14.598684310913086,
+ "learning_rate": 1.99933588058056e-05,
+ "loss": 1.644,
+ "step": 1514
+ },
+ {
+ "epoch": 4.128065395095367,
+ "grad_norm": 14.471258163452148,
+ "learning_rate": 1.9993326609705193e-05,
+ "loss": 1.8794,
+ "step": 1515
+ },
+ {
+ "epoch": 4.130790190735695,
+ "grad_norm": 12.10798168182373,
+ "learning_rate": 1.999329433577708e-05,
+ "loss": 1.6577,
+ "step": 1516
+ },
+ {
+ "epoch": 4.133514986376022,
+ "grad_norm": 16.480541229248047,
+ "learning_rate": 1.9993261984021516e-05,
+ "loss": 1.9307,
+ "step": 1517
+ },
+ {
+ "epoch": 4.136239782016348,
+ "grad_norm": 18.721946716308594,
+ "learning_rate": 1.9993229554438748e-05,
+ "loss": 1.7847,
+ "step": 1518
+ },
+ {
+ "epoch": 4.138964577656676,
+ "grad_norm": 16.204620361328125,
+ "learning_rate": 1.999319704702903e-05,
+ "loss": 2.0347,
+ "step": 1519
+ },
+ {
+ "epoch": 4.141689373297003,
+ "grad_norm": 13.440073013305664,
+ "learning_rate": 1.9993164461792617e-05,
+ "loss": 1.5464,
+ "step": 1520
+ },
+ {
+ "epoch": 4.144414168937329,
+ "grad_norm": 12.055974960327148,
+ "learning_rate": 1.9993131798729757e-05,
+ "loss": 1.8345,
+ "step": 1521
+ },
+ {
+ "epoch": 4.147138964577657,
+ "grad_norm": 27.193063735961914,
+ "learning_rate": 1.999309905784071e-05,
+ "loss": 1.6394,
+ "step": 1522
+ },
+ {
+ "epoch": 4.1498637602179835,
+ "grad_norm": 36.53542709350586,
+ "learning_rate": 1.9993066239125726e-05,
+ "loss": 1.7129,
+ "step": 1523
+ },
+ {
+ "epoch": 4.15258855585831,
+ "grad_norm": 11.463371276855469,
+ "learning_rate": 1.9993033342585068e-05,
+ "loss": 1.5171,
+ "step": 1524
+ },
+ {
+ "epoch": 4.155313351498638,
+ "grad_norm": 13.343096733093262,
+ "learning_rate": 1.9993000368218985e-05,
+ "loss": 1.8806,
+ "step": 1525
+ },
+ {
+ "epoch": 4.1580381471389645,
+ "grad_norm": 14.698657035827637,
+ "learning_rate": 1.9992967316027738e-05,
+ "loss": 1.7224,
+ "step": 1526
+ },
+ {
+ "epoch": 4.160762942779291,
+ "grad_norm": 15.240327835083008,
+ "learning_rate": 1.9992934186011582e-05,
+ "loss": 1.792,
+ "step": 1527
+ },
+ {
+ "epoch": 4.163487738419619,
+ "grad_norm": 19.695175170898438,
+ "learning_rate": 1.999290097817078e-05,
+ "loss": 1.9006,
+ "step": 1528
+ },
+ {
+ "epoch": 4.166212534059945,
+ "grad_norm": 14.388656616210938,
+ "learning_rate": 1.9992867692505582e-05,
+ "loss": 1.7368,
+ "step": 1529
+ },
+ {
+ "epoch": 4.168937329700272,
+ "grad_norm": 18.168359756469727,
+ "learning_rate": 1.9992834329016256e-05,
+ "loss": 1.8735,
+ "step": 1530
+ },
+ {
+ "epoch": 4.1716621253406,
+ "grad_norm": 158.9042510986328,
+ "learning_rate": 1.9992800887703057e-05,
+ "loss": 1.8633,
+ "step": 1531
+ },
+ {
+ "epoch": 4.174386920980926,
+ "grad_norm": 20.479694366455078,
+ "learning_rate": 1.9992767368566244e-05,
+ "loss": 1.8296,
+ "step": 1532
+ },
+ {
+ "epoch": 4.177111716621253,
+ "grad_norm": 26.53901481628418,
+ "learning_rate": 1.9992733771606082e-05,
+ "loss": 1.7979,
+ "step": 1533
+ },
+ {
+ "epoch": 4.179836512261581,
+ "grad_norm": 16.466264724731445,
+ "learning_rate": 1.999270009682283e-05,
+ "loss": 1.7959,
+ "step": 1534
+ },
+ {
+ "epoch": 4.182561307901907,
+ "grad_norm": 13.911393165588379,
+ "learning_rate": 1.9992666344216754e-05,
+ "loss": 1.96,
+ "step": 1535
+ },
+ {
+ "epoch": 4.185286103542234,
+ "grad_norm": 24.931947708129883,
+ "learning_rate": 1.999263251378811e-05,
+ "loss": 1.8481,
+ "step": 1536
+ },
+ {
+ "epoch": 4.1880108991825615,
+ "grad_norm": 17.262683868408203,
+ "learning_rate": 1.999259860553717e-05,
+ "loss": 1.7502,
+ "step": 1537
+ },
+ {
+ "epoch": 4.190735694822888,
+ "grad_norm": 28.27671241760254,
+ "learning_rate": 1.999256461946419e-05,
+ "loss": 1.7588,
+ "step": 1538
+ },
+ {
+ "epoch": 4.193460490463215,
+ "grad_norm": 21.149972915649414,
+ "learning_rate": 1.999253055556944e-05,
+ "loss": 1.9121,
+ "step": 1539
+ },
+ {
+ "epoch": 4.1961852861035425,
+ "grad_norm": 15.513473510742188,
+ "learning_rate": 1.999249641385318e-05,
+ "loss": 1.7434,
+ "step": 1540
+ },
+ {
+ "epoch": 4.198910081743869,
+ "grad_norm": 14.91957950592041,
+ "learning_rate": 1.9992462194315685e-05,
+ "loss": 1.8267,
+ "step": 1541
+ },
+ {
+ "epoch": 4.201634877384196,
+ "grad_norm": 18.212005615234375,
+ "learning_rate": 1.9992427896957214e-05,
+ "loss": 1.6914,
+ "step": 1542
+ },
+ {
+ "epoch": 4.204359673024523,
+ "grad_norm": 14.364083290100098,
+ "learning_rate": 1.9992393521778038e-05,
+ "loss": 1.8149,
+ "step": 1543
+ },
+ {
+ "epoch": 4.20708446866485,
+ "grad_norm": 23.741731643676758,
+ "learning_rate": 1.999235906877842e-05,
+ "loss": 1.8225,
+ "step": 1544
+ },
+ {
+ "epoch": 4.209809264305177,
+ "grad_norm": 20.84150505065918,
+ "learning_rate": 1.9992324537958628e-05,
+ "loss": 1.7402,
+ "step": 1545
+ },
+ {
+ "epoch": 4.212534059945504,
+ "grad_norm": 43.37743377685547,
+ "learning_rate": 1.9992289929318944e-05,
+ "loss": 1.7632,
+ "step": 1546
+ },
+ {
+ "epoch": 4.215258855585831,
+ "grad_norm": 14.563302993774414,
+ "learning_rate": 1.9992255242859618e-05,
+ "loss": 1.7861,
+ "step": 1547
+ },
+ {
+ "epoch": 4.217983651226158,
+ "grad_norm": 18.320777893066406,
+ "learning_rate": 1.9992220478580936e-05,
+ "loss": 2.0103,
+ "step": 1548
+ },
+ {
+ "epoch": 4.220708446866485,
+ "grad_norm": 17.307558059692383,
+ "learning_rate": 1.999218563648316e-05,
+ "loss": 1.8047,
+ "step": 1549
+ },
+ {
+ "epoch": 4.223433242506812,
+ "grad_norm": 14.111106872558594,
+ "learning_rate": 1.9992150716566564e-05,
+ "loss": 1.9575,
+ "step": 1550
+ },
+ {
+ "epoch": 4.226158038147139,
+ "grad_norm": 27.04886245727539,
+ "learning_rate": 1.9992115718831416e-05,
+ "loss": 1.6965,
+ "step": 1551
+ },
+ {
+ "epoch": 4.228882833787466,
+ "grad_norm": 20.34300994873047,
+ "learning_rate": 1.9992080643278e-05,
+ "loss": 1.7808,
+ "step": 1552
+ },
+ {
+ "epoch": 4.231607629427793,
+ "grad_norm": 12.827519416809082,
+ "learning_rate": 1.9992045489906578e-05,
+ "loss": 1.8965,
+ "step": 1553
+ },
+ {
+ "epoch": 4.23433242506812,
+ "grad_norm": 10.950469970703125,
+ "learning_rate": 1.9992010258717423e-05,
+ "loss": 1.6541,
+ "step": 1554
+ },
+ {
+ "epoch": 4.237057220708447,
+ "grad_norm": 15.466451644897461,
+ "learning_rate": 1.9991974949710823e-05,
+ "loss": 2.0952,
+ "step": 1555
+ },
+ {
+ "epoch": 4.239782016348774,
+ "grad_norm": 15.410811424255371,
+ "learning_rate": 1.9991939562887035e-05,
+ "loss": 1.999,
+ "step": 1556
+ },
+ {
+ "epoch": 4.2425068119891005,
+ "grad_norm": 15.858236312866211,
+ "learning_rate": 1.9991904098246347e-05,
+ "loss": 1.7847,
+ "step": 1557
+ },
+ {
+ "epoch": 4.245231607629428,
+ "grad_norm": 18.37849235534668,
+ "learning_rate": 1.999186855578903e-05,
+ "loss": 1.9233,
+ "step": 1558
+ },
+ {
+ "epoch": 4.247956403269755,
+ "grad_norm": 21.132099151611328,
+ "learning_rate": 1.9991832935515366e-05,
+ "loss": 1.7544,
+ "step": 1559
+ },
+ {
+ "epoch": 4.2506811989100814,
+ "grad_norm": 11.251901626586914,
+ "learning_rate": 1.9991797237425625e-05,
+ "loss": 1.9648,
+ "step": 1560
+ },
+ {
+ "epoch": 4.253405994550409,
+ "grad_norm": 10.464017868041992,
+ "learning_rate": 1.9991761461520088e-05,
+ "loss": 1.7173,
+ "step": 1561
+ },
+ {
+ "epoch": 4.256130790190736,
+ "grad_norm": 15.851114273071289,
+ "learning_rate": 1.9991725607799037e-05,
+ "loss": 1.8613,
+ "step": 1562
+ },
+ {
+ "epoch": 4.258855585831062,
+ "grad_norm": 12.207009315490723,
+ "learning_rate": 1.999168967626275e-05,
+ "loss": 1.7659,
+ "step": 1563
+ },
+ {
+ "epoch": 4.26158038147139,
+ "grad_norm": 16.404396057128906,
+ "learning_rate": 1.99916536669115e-05,
+ "loss": 1.9849,
+ "step": 1564
+ },
+ {
+ "epoch": 4.264305177111717,
+ "grad_norm": 19.986793518066406,
+ "learning_rate": 1.999161757974558e-05,
+ "loss": 2.0391,
+ "step": 1565
+ },
+ {
+ "epoch": 4.267029972752043,
+ "grad_norm": 12.699073791503906,
+ "learning_rate": 1.9991581414765256e-05,
+ "loss": 1.7935,
+ "step": 1566
+ },
+ {
+ "epoch": 4.269754768392371,
+ "grad_norm": 10.729422569274902,
+ "learning_rate": 1.9991545171970822e-05,
+ "loss": 1.7974,
+ "step": 1567
+ },
+ {
+ "epoch": 4.272479564032698,
+ "grad_norm": 11.770853996276855,
+ "learning_rate": 1.9991508851362555e-05,
+ "loss": 1.77,
+ "step": 1568
+ },
+ {
+ "epoch": 4.275204359673024,
+ "grad_norm": 17.789634704589844,
+ "learning_rate": 1.9991472452940738e-05,
+ "loss": 1.9048,
+ "step": 1569
+ },
+ {
+ "epoch": 4.277929155313352,
+ "grad_norm": 16.31340217590332,
+ "learning_rate": 1.9991435976705657e-05,
+ "loss": 1.8638,
+ "step": 1570
+ },
+ {
+ "epoch": 4.2806539509536785,
+ "grad_norm": 16.50969123840332,
+ "learning_rate": 1.9991399422657593e-05,
+ "loss": 2.0146,
+ "step": 1571
+ },
+ {
+ "epoch": 4.283378746594005,
+ "grad_norm": 14.991809844970703,
+ "learning_rate": 1.999136279079683e-05,
+ "loss": 1.9717,
+ "step": 1572
+ },
+ {
+ "epoch": 4.286103542234333,
+ "grad_norm": 20.145408630371094,
+ "learning_rate": 1.999132608112366e-05,
+ "loss": 1.8589,
+ "step": 1573
+ },
+ {
+ "epoch": 4.2888283378746594,
+ "grad_norm": 16.198291778564453,
+ "learning_rate": 1.999128929363836e-05,
+ "loss": 1.8687,
+ "step": 1574
+ },
+ {
+ "epoch": 4.291553133514986,
+ "grad_norm": 11.562917709350586,
+ "learning_rate": 1.9991252428341222e-05,
+ "loss": 1.7009,
+ "step": 1575
+ },
+ {
+ "epoch": 4.294277929155314,
+ "grad_norm": 8.705707550048828,
+ "learning_rate": 1.999121548523253e-05,
+ "loss": 1.7183,
+ "step": 1576
+ },
+ {
+ "epoch": 4.29700272479564,
+ "grad_norm": 10.386330604553223,
+ "learning_rate": 1.9991178464312575e-05,
+ "loss": 1.801,
+ "step": 1577
+ },
+ {
+ "epoch": 4.299727520435967,
+ "grad_norm": 13.204593658447266,
+ "learning_rate": 1.9991141365581644e-05,
+ "loss": 1.7529,
+ "step": 1578
+ },
+ {
+ "epoch": 4.302452316076295,
+ "grad_norm": 11.083606719970703,
+ "learning_rate": 1.9991104189040024e-05,
+ "loss": 1.7524,
+ "step": 1579
+ },
+ {
+ "epoch": 4.305177111716621,
+ "grad_norm": 12.340747833251953,
+ "learning_rate": 1.999106693468801e-05,
+ "loss": 1.8311,
+ "step": 1580
+ },
+ {
+ "epoch": 4.307901907356948,
+ "grad_norm": 11.777390480041504,
+ "learning_rate": 1.9991029602525884e-05,
+ "loss": 2.0127,
+ "step": 1581
+ },
+ {
+ "epoch": 4.310626702997276,
+ "grad_norm": 12.502350807189941,
+ "learning_rate": 1.999099219255394e-05,
+ "loss": 2.0781,
+ "step": 1582
+ },
+ {
+ "epoch": 4.313351498637602,
+ "grad_norm": 12.655232429504395,
+ "learning_rate": 1.9990954704772473e-05,
+ "loss": 1.7717,
+ "step": 1583
+ },
+ {
+ "epoch": 4.316076294277929,
+ "grad_norm": 12.700472831726074,
+ "learning_rate": 1.9990917139181772e-05,
+ "loss": 2.0933,
+ "step": 1584
+ },
+ {
+ "epoch": 4.3188010899182565,
+ "grad_norm": 11.673563003540039,
+ "learning_rate": 1.999087949578213e-05,
+ "loss": 1.6792,
+ "step": 1585
+ },
+ {
+ "epoch": 4.321525885558583,
+ "grad_norm": 13.173969268798828,
+ "learning_rate": 1.9990841774573843e-05,
+ "loss": 1.9663,
+ "step": 1586
+ },
+ {
+ "epoch": 4.32425068119891,
+ "grad_norm": 13.962111473083496,
+ "learning_rate": 1.9990803975557197e-05,
+ "loss": 1.9666,
+ "step": 1587
+ },
+ {
+ "epoch": 4.3269754768392374,
+ "grad_norm": 15.190113067626953,
+ "learning_rate": 1.9990766098732493e-05,
+ "loss": 1.7192,
+ "step": 1588
+ },
+ {
+ "epoch": 4.329700272479564,
+ "grad_norm": 14.03504467010498,
+ "learning_rate": 1.9990728144100025e-05,
+ "loss": 1.8108,
+ "step": 1589
+ },
+ {
+ "epoch": 4.332425068119891,
+ "grad_norm": 10.579913139343262,
+ "learning_rate": 1.999069011166009e-05,
+ "loss": 1.8877,
+ "step": 1590
+ },
+ {
+ "epoch": 4.335149863760218,
+ "grad_norm": 12.852388381958008,
+ "learning_rate": 1.9990652001412973e-05,
+ "loss": 1.9597,
+ "step": 1591
+ },
+ {
+ "epoch": 4.337874659400545,
+ "grad_norm": 11.49439525604248,
+ "learning_rate": 1.9990613813358987e-05,
+ "loss": 1.894,
+ "step": 1592
+ },
+ {
+ "epoch": 4.340599455040872,
+ "grad_norm": 10.72061538696289,
+ "learning_rate": 1.999057554749842e-05,
+ "loss": 1.8101,
+ "step": 1593
+ },
+ {
+ "epoch": 4.343324250681199,
+ "grad_norm": 11.686420440673828,
+ "learning_rate": 1.9990537203831573e-05,
+ "loss": 2.0156,
+ "step": 1594
+ },
+ {
+ "epoch": 4.346049046321526,
+ "grad_norm": 13.056648254394531,
+ "learning_rate": 1.9990498782358745e-05,
+ "loss": 1.9202,
+ "step": 1595
+ },
+ {
+ "epoch": 4.348773841961853,
+ "grad_norm": 12.927536964416504,
+ "learning_rate": 1.9990460283080232e-05,
+ "loss": 1.9849,
+ "step": 1596
+ },
+ {
+ "epoch": 4.35149863760218,
+ "grad_norm": 10.1175537109375,
+ "learning_rate": 1.9990421705996336e-05,
+ "loss": 1.8677,
+ "step": 1597
+ },
+ {
+ "epoch": 4.354223433242507,
+ "grad_norm": 10.478602409362793,
+ "learning_rate": 1.999038305110736e-05,
+ "loss": 1.9634,
+ "step": 1598
+ },
+ {
+ "epoch": 4.356948228882834,
+ "grad_norm": 13.643245697021484,
+ "learning_rate": 1.9990344318413598e-05,
+ "loss": 1.7224,
+ "step": 1599
+ },
+ {
+ "epoch": 4.359673024523161,
+ "grad_norm": 10.597620010375977,
+ "learning_rate": 1.999030550791536e-05,
+ "loss": 1.8633,
+ "step": 1600
+ },
+ {
+ "epoch": 4.362397820163488,
+ "grad_norm": 18.982633590698242,
+ "learning_rate": 1.999026661961294e-05,
+ "loss": 1.7788,
+ "step": 1601
+ },
+ {
+ "epoch": 4.3651226158038146,
+ "grad_norm": 14.29390811920166,
+ "learning_rate": 1.999022765350665e-05,
+ "loss": 1.8198,
+ "step": 1602
+ },
+ {
+ "epoch": 4.367847411444142,
+ "grad_norm": 14.045916557312012,
+ "learning_rate": 1.9990188609596786e-05,
+ "loss": 1.6416,
+ "step": 1603
+ },
+ {
+ "epoch": 4.370572207084469,
+ "grad_norm": 9.716156005859375,
+ "learning_rate": 1.9990149487883653e-05,
+ "loss": 2.0276,
+ "step": 1604
+ },
+ {
+ "epoch": 4.3732970027247955,
+ "grad_norm": 12.709885597229004,
+ "learning_rate": 1.999011028836756e-05,
+ "loss": 1.804,
+ "step": 1605
+ },
+ {
+ "epoch": 4.376021798365123,
+ "grad_norm": 13.103960037231445,
+ "learning_rate": 1.9990071011048807e-05,
+ "loss": 1.8384,
+ "step": 1606
+ },
+ {
+ "epoch": 4.37874659400545,
+ "grad_norm": 11.972681999206543,
+ "learning_rate": 1.999003165592771e-05,
+ "loss": 1.9453,
+ "step": 1607
+ },
+ {
+ "epoch": 4.381471389645776,
+ "grad_norm": 23.582698822021484,
+ "learning_rate": 1.998999222300456e-05,
+ "loss": 1.6707,
+ "step": 1608
+ },
+ {
+ "epoch": 4.384196185286104,
+ "grad_norm": 11.656493186950684,
+ "learning_rate": 1.9989952712279674e-05,
+ "loss": 1.8208,
+ "step": 1609
+ },
+ {
+ "epoch": 4.386920980926431,
+ "grad_norm": 10.497620582580566,
+ "learning_rate": 1.998991312375336e-05,
+ "loss": 1.8674,
+ "step": 1610
+ },
+ {
+ "epoch": 4.389645776566757,
+ "grad_norm": 12.55628776550293,
+ "learning_rate": 1.9989873457425922e-05,
+ "loss": 1.7979,
+ "step": 1611
+ },
+ {
+ "epoch": 4.392370572207085,
+ "grad_norm": 12.809096336364746,
+ "learning_rate": 1.998983371329767e-05,
+ "loss": 1.9019,
+ "step": 1612
+ },
+ {
+ "epoch": 4.395095367847412,
+ "grad_norm": 15.382226943969727,
+ "learning_rate": 1.9989793891368915e-05,
+ "loss": 1.7056,
+ "step": 1613
+ },
+ {
+ "epoch": 4.397820163487738,
+ "grad_norm": 11.492066383361816,
+ "learning_rate": 1.9989753991639968e-05,
+ "loss": 1.814,
+ "step": 1614
+ },
+ {
+ "epoch": 4.400544959128065,
+ "grad_norm": 14.366987228393555,
+ "learning_rate": 1.998971401411114e-05,
+ "loss": 1.7908,
+ "step": 1615
+ },
+ {
+ "epoch": 4.4032697547683926,
+ "grad_norm": 13.31606388092041,
+ "learning_rate": 1.9989673958782735e-05,
+ "loss": 1.802,
+ "step": 1616
+ },
+ {
+ "epoch": 4.405994550408719,
+ "grad_norm": 26.214847564697266,
+ "learning_rate": 1.998963382565508e-05,
+ "loss": 1.8096,
+ "step": 1617
+ },
+ {
+ "epoch": 4.408719346049046,
+ "grad_norm": 12.695902824401855,
+ "learning_rate": 1.998959361472847e-05,
+ "loss": 1.7192,
+ "step": 1618
+ },
+ {
+ "epoch": 4.4114441416893735,
+ "grad_norm": 14.11608600616455,
+ "learning_rate": 1.9989553326003226e-05,
+ "loss": 1.8149,
+ "step": 1619
+ },
+ {
+ "epoch": 4.4141689373297,
+ "grad_norm": 14.843645095825195,
+ "learning_rate": 1.9989512959479666e-05,
+ "loss": 1.8113,
+ "step": 1620
+ },
+ {
+ "epoch": 4.416893732970027,
+ "grad_norm": 12.413495063781738,
+ "learning_rate": 1.9989472515158102e-05,
+ "loss": 2.0884,
+ "step": 1621
+ },
+ {
+ "epoch": 4.419618528610354,
+ "grad_norm": 14.569469451904297,
+ "learning_rate": 1.9989431993038842e-05,
+ "loss": 1.9043,
+ "step": 1622
+ },
+ {
+ "epoch": 4.422343324250681,
+ "grad_norm": 13.531723976135254,
+ "learning_rate": 1.998939139312221e-05,
+ "loss": 1.7754,
+ "step": 1623
+ },
+ {
+ "epoch": 4.425068119891008,
+ "grad_norm": 15.61850643157959,
+ "learning_rate": 1.9989350715408525e-05,
+ "loss": 1.7192,
+ "step": 1624
+ },
+ {
+ "epoch": 4.427792915531335,
+ "grad_norm": 12.612687110900879,
+ "learning_rate": 1.998930995989809e-05,
+ "loss": 1.8931,
+ "step": 1625
+ },
+ {
+ "epoch": 4.430517711171662,
+ "grad_norm": 13.903953552246094,
+ "learning_rate": 1.9989269126591236e-05,
+ "loss": 2.0015,
+ "step": 1626
+ },
+ {
+ "epoch": 4.433242506811989,
+ "grad_norm": 11.026742935180664,
+ "learning_rate": 1.9989228215488273e-05,
+ "loss": 1.5745,
+ "step": 1627
+ },
+ {
+ "epoch": 4.435967302452316,
+ "grad_norm": 22.10861587524414,
+ "learning_rate": 1.9989187226589522e-05,
+ "loss": 1.916,
+ "step": 1628
+ },
+ {
+ "epoch": 4.438692098092643,
+ "grad_norm": 21.367530822753906,
+ "learning_rate": 1.9989146159895305e-05,
+ "loss": 1.9092,
+ "step": 1629
+ },
+ {
+ "epoch": 4.44141689373297,
+ "grad_norm": 12.559633255004883,
+ "learning_rate": 1.9989105015405935e-05,
+ "loss": 1.8308,
+ "step": 1630
+ },
+ {
+ "epoch": 4.444141689373297,
+ "grad_norm": 15.54616928100586,
+ "learning_rate": 1.9989063793121736e-05,
+ "loss": 2.0679,
+ "step": 1631
+ },
+ {
+ "epoch": 4.446866485013624,
+ "grad_norm": 12.716418266296387,
+ "learning_rate": 1.9989022493043033e-05,
+ "loss": 1.7646,
+ "step": 1632
+ },
+ {
+ "epoch": 4.449591280653951,
+ "grad_norm": 16.063173294067383,
+ "learning_rate": 1.9988981115170144e-05,
+ "loss": 1.9248,
+ "step": 1633
+ },
+ {
+ "epoch": 4.452316076294278,
+ "grad_norm": 22.75617027282715,
+ "learning_rate": 1.998893965950339e-05,
+ "loss": 2.1328,
+ "step": 1634
+ },
+ {
+ "epoch": 4.455040871934605,
+ "grad_norm": 14.810853004455566,
+ "learning_rate": 1.99888981260431e-05,
+ "loss": 1.6895,
+ "step": 1635
+ },
+ {
+ "epoch": 4.4577656675749315,
+ "grad_norm": 23.45295524597168,
+ "learning_rate": 1.998885651478959e-05,
+ "loss": 1.8169,
+ "step": 1636
+ },
+ {
+ "epoch": 4.460490463215259,
+ "grad_norm": 23.975677490234375,
+ "learning_rate": 1.9988814825743183e-05,
+ "loss": 1.7471,
+ "step": 1637
+ },
+ {
+ "epoch": 4.463215258855586,
+ "grad_norm": 18.05084800720215,
+ "learning_rate": 1.9988773058904213e-05,
+ "loss": 1.6943,
+ "step": 1638
+ },
+ {
+ "epoch": 4.4659400544959125,
+ "grad_norm": 17.506332397460938,
+ "learning_rate": 1.9988731214272995e-05,
+ "loss": 1.9805,
+ "step": 1639
+ },
+ {
+ "epoch": 4.46866485013624,
+ "grad_norm": 45.82698059082031,
+ "learning_rate": 1.9988689291849865e-05,
+ "loss": 1.8711,
+ "step": 1640
+ },
+ {
+ "epoch": 4.471389645776567,
+ "grad_norm": 20.599950790405273,
+ "learning_rate": 1.9988647291635143e-05,
+ "loss": 2.0127,
+ "step": 1641
+ },
+ {
+ "epoch": 4.474114441416893,
+ "grad_norm": 27.706125259399414,
+ "learning_rate": 1.9988605213629157e-05,
+ "loss": 1.7874,
+ "step": 1642
+ },
+ {
+ "epoch": 4.476839237057221,
+ "grad_norm": 26.521753311157227,
+ "learning_rate": 1.9988563057832234e-05,
+ "loss": 1.834,
+ "step": 1643
+ },
+ {
+ "epoch": 4.479564032697548,
+ "grad_norm": 28.991363525390625,
+ "learning_rate": 1.9988520824244703e-05,
+ "loss": 1.8335,
+ "step": 1644
+ },
+ {
+ "epoch": 4.482288828337874,
+ "grad_norm": 13.267407417297363,
+ "learning_rate": 1.9988478512866893e-05,
+ "loss": 1.8252,
+ "step": 1645
+ },
+ {
+ "epoch": 4.485013623978202,
+ "grad_norm": 15.971419334411621,
+ "learning_rate": 1.9988436123699135e-05,
+ "loss": 1.6104,
+ "step": 1646
+ },
+ {
+ "epoch": 4.487738419618529,
+ "grad_norm": 12.338957786560059,
+ "learning_rate": 1.998839365674176e-05,
+ "loss": 1.9094,
+ "step": 1647
+ },
+ {
+ "epoch": 4.490463215258855,
+ "grad_norm": 12.820110321044922,
+ "learning_rate": 1.9988351111995095e-05,
+ "loss": 1.7393,
+ "step": 1648
+ },
+ {
+ "epoch": 4.493188010899183,
+ "grad_norm": 20.78042221069336,
+ "learning_rate": 1.998830848945947e-05,
+ "loss": 1.9839,
+ "step": 1649
+ },
+ {
+ "epoch": 4.4959128065395095,
+ "grad_norm": 15.028311729431152,
+ "learning_rate": 1.9988265789135224e-05,
+ "loss": 1.853,
+ "step": 1650
+ },
+ {
+ "epoch": 4.498637602179836,
+ "grad_norm": 16.6220645904541,
+ "learning_rate": 1.9988223011022686e-05,
+ "loss": 1.7827,
+ "step": 1651
+ },
+ {
+ "epoch": 4.501362397820164,
+ "grad_norm": 17.394527435302734,
+ "learning_rate": 1.9988180155122187e-05,
+ "loss": 1.8818,
+ "step": 1652
+ },
+ {
+ "epoch": 4.5040871934604905,
+ "grad_norm": 19.727069854736328,
+ "learning_rate": 1.998813722143406e-05,
+ "loss": 1.9028,
+ "step": 1653
+ },
+ {
+ "epoch": 4.506811989100817,
+ "grad_norm": 18.605106353759766,
+ "learning_rate": 1.9988094209958644e-05,
+ "loss": 1.8357,
+ "step": 1654
+ },
+ {
+ "epoch": 4.509536784741145,
+ "grad_norm": 14.147246360778809,
+ "learning_rate": 1.998805112069627e-05,
+ "loss": 1.7061,
+ "step": 1655
+ },
+ {
+ "epoch": 4.512261580381471,
+ "grad_norm": 14.222494125366211,
+ "learning_rate": 1.9988007953647278e-05,
+ "loss": 1.6477,
+ "step": 1656
+ },
+ {
+ "epoch": 4.514986376021798,
+ "grad_norm": 16.673221588134766,
+ "learning_rate": 1.9987964708812e-05,
+ "loss": 1.802,
+ "step": 1657
+ },
+ {
+ "epoch": 4.517711171662126,
+ "grad_norm": 13.81769847869873,
+ "learning_rate": 1.9987921386190777e-05,
+ "loss": 1.8066,
+ "step": 1658
+ },
+ {
+ "epoch": 4.520435967302452,
+ "grad_norm": 11.60045337677002,
+ "learning_rate": 1.998787798578394e-05,
+ "loss": 1.8171,
+ "step": 1659
+ },
+ {
+ "epoch": 4.523160762942779,
+ "grad_norm": 14.101318359375,
+ "learning_rate": 1.9987834507591834e-05,
+ "loss": 1.8599,
+ "step": 1660
+ },
+ {
+ "epoch": 4.525885558583107,
+ "grad_norm": 32.92286682128906,
+ "learning_rate": 1.9987790951614792e-05,
+ "loss": 2.0098,
+ "step": 1661
+ },
+ {
+ "epoch": 4.528610354223433,
+ "grad_norm": 14.645931243896484,
+ "learning_rate": 1.9987747317853156e-05,
+ "loss": 1.7949,
+ "step": 1662
+ },
+ {
+ "epoch": 4.53133514986376,
+ "grad_norm": 13.726556777954102,
+ "learning_rate": 1.9987703606307268e-05,
+ "loss": 1.8081,
+ "step": 1663
+ },
+ {
+ "epoch": 4.5340599455040875,
+ "grad_norm": 14.259086608886719,
+ "learning_rate": 1.998765981697746e-05,
+ "loss": 1.9502,
+ "step": 1664
+ },
+ {
+ "epoch": 4.536784741144414,
+ "grad_norm": 13.587321281433105,
+ "learning_rate": 1.9987615949864085e-05,
+ "loss": 2.0098,
+ "step": 1665
+ },
+ {
+ "epoch": 4.539509536784741,
+ "grad_norm": 17.23871612548828,
+ "learning_rate": 1.9987572004967474e-05,
+ "loss": 1.9043,
+ "step": 1666
+ },
+ {
+ "epoch": 4.5422343324250685,
+ "grad_norm": 11.833878517150879,
+ "learning_rate": 1.9987527982287977e-05,
+ "loss": 1.8086,
+ "step": 1667
+ },
+ {
+ "epoch": 4.544959128065395,
+ "grad_norm": 14.381035804748535,
+ "learning_rate": 1.9987483881825928e-05,
+ "loss": 1.8198,
+ "step": 1668
+ },
+ {
+ "epoch": 4.547683923705722,
+ "grad_norm": 13.35680103302002,
+ "learning_rate": 1.998743970358168e-05,
+ "loss": 1.7485,
+ "step": 1669
+ },
+ {
+ "epoch": 4.550408719346049,
+ "grad_norm": 9.395089149475098,
+ "learning_rate": 1.9987395447555574e-05,
+ "loss": 1.551,
+ "step": 1670
+ },
+ {
+ "epoch": 4.553133514986376,
+ "grad_norm": 11.275160789489746,
+ "learning_rate": 1.9987351113747953e-05,
+ "loss": 1.7605,
+ "step": 1671
+ },
+ {
+ "epoch": 4.555858310626703,
+ "grad_norm": 37.18361282348633,
+ "learning_rate": 1.998730670215916e-05,
+ "loss": 1.7385,
+ "step": 1672
+ },
+ {
+ "epoch": 4.55858310626703,
+ "grad_norm": 15.461226463317871,
+ "learning_rate": 1.9987262212789547e-05,
+ "loss": 1.7046,
+ "step": 1673
+ },
+ {
+ "epoch": 4.561307901907357,
+ "grad_norm": 11.419524192810059,
+ "learning_rate": 1.998721764563946e-05,
+ "loss": 1.6311,
+ "step": 1674
+ },
+ {
+ "epoch": 4.564032697547684,
+ "grad_norm": 11.717555046081543,
+ "learning_rate": 1.9987173000709238e-05,
+ "loss": 1.9062,
+ "step": 1675
+ },
+ {
+ "epoch": 4.566757493188011,
+ "grad_norm": 11.768439292907715,
+ "learning_rate": 1.9987128277999236e-05,
+ "loss": 1.8047,
+ "step": 1676
+ },
+ {
+ "epoch": 4.569482288828338,
+ "grad_norm": 11.077784538269043,
+ "learning_rate": 1.99870834775098e-05,
+ "loss": 1.8286,
+ "step": 1677
+ },
+ {
+ "epoch": 4.572207084468665,
+ "grad_norm": 9.806815147399902,
+ "learning_rate": 1.998703859924128e-05,
+ "loss": 1.8022,
+ "step": 1678
+ },
+ {
+ "epoch": 4.574931880108992,
+ "grad_norm": 21.835113525390625,
+ "learning_rate": 1.9986993643194022e-05,
+ "loss": 1.8,
+ "step": 1679
+ },
+ {
+ "epoch": 4.577656675749319,
+ "grad_norm": 11.922440528869629,
+ "learning_rate": 1.9986948609368385e-05,
+ "loss": 1.959,
+ "step": 1680
+ },
+ {
+ "epoch": 4.580381471389646,
+ "grad_norm": 12.709155082702637,
+ "learning_rate": 1.998690349776471e-05,
+ "loss": 1.7598,
+ "step": 1681
+ },
+ {
+ "epoch": 4.583106267029972,
+ "grad_norm": 12.793139457702637,
+ "learning_rate": 1.998685830838335e-05,
+ "loss": 1.7505,
+ "step": 1682
+ },
+ {
+ "epoch": 4.5858310626703,
+ "grad_norm": 12.681434631347656,
+ "learning_rate": 1.9986813041224662e-05,
+ "loss": 1.75,
+ "step": 1683
+ },
+ {
+ "epoch": 4.5885558583106265,
+ "grad_norm": 10.861709594726562,
+ "learning_rate": 1.9986767696288997e-05,
+ "loss": 1.9194,
+ "step": 1684
+ },
+ {
+ "epoch": 4.591280653950953,
+ "grad_norm": 10.562196731567383,
+ "learning_rate": 1.9986722273576703e-05,
+ "loss": 1.8896,
+ "step": 1685
+ },
+ {
+ "epoch": 4.594005449591281,
+ "grad_norm": 10.61209487915039,
+ "learning_rate": 1.9986676773088137e-05,
+ "loss": 1.6443,
+ "step": 1686
+ },
+ {
+ "epoch": 4.5967302452316074,
+ "grad_norm": 11.602971076965332,
+ "learning_rate": 1.9986631194823657e-05,
+ "loss": 1.7312,
+ "step": 1687
+ },
+ {
+ "epoch": 4.599455040871934,
+ "grad_norm": 11.791472434997559,
+ "learning_rate": 1.998658553878361e-05,
+ "loss": 1.6738,
+ "step": 1688
+ },
+ {
+ "epoch": 4.602179836512262,
+ "grad_norm": 10.37132740020752,
+ "learning_rate": 1.998653980496836e-05,
+ "loss": 1.6467,
+ "step": 1689
+ },
+ {
+ "epoch": 4.604904632152588,
+ "grad_norm": 11.563543319702148,
+ "learning_rate": 1.998649399337826e-05,
+ "loss": 2.0576,
+ "step": 1690
+ },
+ {
+ "epoch": 4.607629427792915,
+ "grad_norm": 11.379239082336426,
+ "learning_rate": 1.9986448104013664e-05,
+ "loss": 1.6252,
+ "step": 1691
+ },
+ {
+ "epoch": 4.610354223433243,
+ "grad_norm": 16.69204330444336,
+ "learning_rate": 1.998640213687493e-05,
+ "loss": 1.8271,
+ "step": 1692
+ },
+ {
+ "epoch": 4.613079019073569,
+ "grad_norm": 11.283498764038086,
+ "learning_rate": 1.9986356091962423e-05,
+ "loss": 1.7749,
+ "step": 1693
+ },
+ {
+ "epoch": 4.615803814713896,
+ "grad_norm": 11.236751556396484,
+ "learning_rate": 1.998630996927649e-05,
+ "loss": 1.9575,
+ "step": 1694
+ },
+ {
+ "epoch": 4.618528610354224,
+ "grad_norm": 9.967838287353516,
+ "learning_rate": 1.9986263768817502e-05,
+ "loss": 1.8423,
+ "step": 1695
+ },
+ {
+ "epoch": 4.62125340599455,
+ "grad_norm": 10.786258697509766,
+ "learning_rate": 1.998621749058581e-05,
+ "loss": 1.7085,
+ "step": 1696
+ },
+ {
+ "epoch": 4.623978201634877,
+ "grad_norm": 10.914759635925293,
+ "learning_rate": 1.9986171134581778e-05,
+ "loss": 1.7256,
+ "step": 1697
+ },
+ {
+ "epoch": 4.6267029972752045,
+ "grad_norm": 10.664731979370117,
+ "learning_rate": 1.9986124700805764e-05,
+ "loss": 1.644,
+ "step": 1698
+ },
+ {
+ "epoch": 4.629427792915531,
+ "grad_norm": 11.085412979125977,
+ "learning_rate": 1.998607818925814e-05,
+ "loss": 1.7568,
+ "step": 1699
+ },
+ {
+ "epoch": 4.632152588555858,
+ "grad_norm": 9.910640716552734,
+ "learning_rate": 1.9986031599939253e-05,
+ "loss": 1.7383,
+ "step": 1700
+ },
+ {
+ "epoch": 4.6348773841961854,
+ "grad_norm": 11.176325798034668,
+ "learning_rate": 1.9985984932849475e-05,
+ "loss": 1.5896,
+ "step": 1701
+ },
+ {
+ "epoch": 4.637602179836512,
+ "grad_norm": 11.895498275756836,
+ "learning_rate": 1.998593818798917e-05,
+ "loss": 1.9604,
+ "step": 1702
+ },
+ {
+ "epoch": 4.640326975476839,
+ "grad_norm": 10.814287185668945,
+ "learning_rate": 1.9985891365358697e-05,
+ "loss": 1.5288,
+ "step": 1703
+ },
+ {
+ "epoch": 4.643051771117166,
+ "grad_norm": 13.177926063537598,
+ "learning_rate": 1.9985844464958423e-05,
+ "loss": 2.0076,
+ "step": 1704
+ },
+ {
+ "epoch": 4.645776566757493,
+ "grad_norm": 12.39803695678711,
+ "learning_rate": 1.998579748678872e-05,
+ "loss": 2.041,
+ "step": 1705
+ },
+ {
+ "epoch": 4.64850136239782,
+ "grad_norm": 12.203011512756348,
+ "learning_rate": 1.998575043084994e-05,
+ "loss": 1.865,
+ "step": 1706
+ },
+ {
+ "epoch": 4.651226158038147,
+ "grad_norm": 14.263901710510254,
+ "learning_rate": 1.998570329714246e-05,
+ "loss": 1.8115,
+ "step": 1707
+ },
+ {
+ "epoch": 4.653950953678474,
+ "grad_norm": 11.454439163208008,
+ "learning_rate": 1.9985656085666646e-05,
+ "loss": 1.8589,
+ "step": 1708
+ },
+ {
+ "epoch": 4.656675749318801,
+ "grad_norm": 10.870101928710938,
+ "learning_rate": 1.9985608796422863e-05,
+ "loss": 1.5823,
+ "step": 1709
+ },
+ {
+ "epoch": 4.659400544959128,
+ "grad_norm": 10.731388092041016,
+ "learning_rate": 1.9985561429411478e-05,
+ "loss": 1.603,
+ "step": 1710
+ },
+ {
+ "epoch": 4.662125340599455,
+ "grad_norm": 11.784908294677734,
+ "learning_rate": 1.998551398463286e-05,
+ "loss": 1.7156,
+ "step": 1711
+ },
+ {
+ "epoch": 4.664850136239782,
+ "grad_norm": 11.44052505493164,
+ "learning_rate": 1.9985466462087383e-05,
+ "loss": 1.7234,
+ "step": 1712
+ },
+ {
+ "epoch": 4.667574931880109,
+ "grad_norm": 9.635643005371094,
+ "learning_rate": 1.9985418861775416e-05,
+ "loss": 1.7871,
+ "step": 1713
+ },
+ {
+ "epoch": 4.670299727520436,
+ "grad_norm": 10.105297088623047,
+ "learning_rate": 1.9985371183697327e-05,
+ "loss": 1.7383,
+ "step": 1714
+ },
+ {
+ "epoch": 4.6730245231607626,
+ "grad_norm": 11.22205638885498,
+ "learning_rate": 1.9985323427853492e-05,
+ "loss": 1.8931,
+ "step": 1715
+ },
+ {
+ "epoch": 4.67574931880109,
+ "grad_norm": 9.009623527526855,
+ "learning_rate": 1.9985275594244277e-05,
+ "loss": 1.6968,
+ "step": 1716
+ },
+ {
+ "epoch": 4.678474114441417,
+ "grad_norm": 9.375571250915527,
+ "learning_rate": 1.9985227682870054e-05,
+ "loss": 1.5361,
+ "step": 1717
+ },
+ {
+ "epoch": 4.6811989100817435,
+ "grad_norm": 19.648733139038086,
+ "learning_rate": 1.9985179693731204e-05,
+ "loss": 1.8423,
+ "step": 1718
+ },
+ {
+ "epoch": 4.683923705722071,
+ "grad_norm": 10.109658241271973,
+ "learning_rate": 1.9985131626828092e-05,
+ "loss": 1.6052,
+ "step": 1719
+ },
+ {
+ "epoch": 4.686648501362398,
+ "grad_norm": 12.355353355407715,
+ "learning_rate": 1.9985083482161098e-05,
+ "loss": 1.6052,
+ "step": 1720
+ },
+ {
+ "epoch": 4.689373297002724,
+ "grad_norm": 10.802824020385742,
+ "learning_rate": 1.9985035259730593e-05,
+ "loss": 1.8369,
+ "step": 1721
+ },
+ {
+ "epoch": 4.692098092643052,
+ "grad_norm": 11.200514793395996,
+ "learning_rate": 1.998498695953696e-05,
+ "loss": 1.8716,
+ "step": 1722
+ },
+ {
+ "epoch": 4.694822888283379,
+ "grad_norm": 11.038694381713867,
+ "learning_rate": 1.9984938581580566e-05,
+ "loss": 1.7036,
+ "step": 1723
+ },
+ {
+ "epoch": 4.697547683923705,
+ "grad_norm": 12.441304206848145,
+ "learning_rate": 1.998489012586179e-05,
+ "loss": 2.0435,
+ "step": 1724
+ },
+ {
+ "epoch": 4.700272479564033,
+ "grad_norm": 13.135621070861816,
+ "learning_rate": 1.9984841592381014e-05,
+ "loss": 1.6655,
+ "step": 1725
+ },
+ {
+ "epoch": 4.70299727520436,
+ "grad_norm": 11.036510467529297,
+ "learning_rate": 1.9984792981138616e-05,
+ "loss": 1.7988,
+ "step": 1726
+ },
+ {
+ "epoch": 4.705722070844686,
+ "grad_norm": 15.357640266418457,
+ "learning_rate": 1.9984744292134964e-05,
+ "loss": 1.8721,
+ "step": 1727
+ },
+ {
+ "epoch": 4.708446866485014,
+ "grad_norm": 11.371448516845703,
+ "learning_rate": 1.998469552537045e-05,
+ "loss": 1.8281,
+ "step": 1728
+ },
+ {
+ "epoch": 4.7111716621253406,
+ "grad_norm": 9.8068208694458,
+ "learning_rate": 1.9984646680845446e-05,
+ "loss": 1.5767,
+ "step": 1729
+ },
+ {
+ "epoch": 4.713896457765667,
+ "grad_norm": 13.548954010009766,
+ "learning_rate": 1.998459775856034e-05,
+ "loss": 2.1074,
+ "step": 1730
+ },
+ {
+ "epoch": 4.716621253405995,
+ "grad_norm": 10.1837158203125,
+ "learning_rate": 1.9984548758515503e-05,
+ "loss": 1.5684,
+ "step": 1731
+ },
+ {
+ "epoch": 4.7193460490463215,
+ "grad_norm": 8.237529754638672,
+ "learning_rate": 1.9984499680711322e-05,
+ "loss": 1.6902,
+ "step": 1732
+ },
+ {
+ "epoch": 4.722070844686648,
+ "grad_norm": 14.443774223327637,
+ "learning_rate": 1.9984450525148184e-05,
+ "loss": 1.7354,
+ "step": 1733
+ },
+ {
+ "epoch": 4.724795640326976,
+ "grad_norm": 13.338621139526367,
+ "learning_rate": 1.998440129182646e-05,
+ "loss": 1.791,
+ "step": 1734
+ },
+ {
+ "epoch": 4.727520435967302,
+ "grad_norm": 11.367993354797363,
+ "learning_rate": 1.9984351980746545e-05,
+ "loss": 1.7681,
+ "step": 1735
+ },
+ {
+ "epoch": 4.730245231607629,
+ "grad_norm": 8.49145221710205,
+ "learning_rate": 1.9984302591908812e-05,
+ "loss": 1.9062,
+ "step": 1736
+ },
+ {
+ "epoch": 4.732970027247957,
+ "grad_norm": 13.06961441040039,
+ "learning_rate": 1.998425312531366e-05,
+ "loss": 1.7966,
+ "step": 1737
+ },
+ {
+ "epoch": 4.735694822888283,
+ "grad_norm": 10.855565071105957,
+ "learning_rate": 1.998420358096146e-05,
+ "loss": 1.9082,
+ "step": 1738
+ },
+ {
+ "epoch": 4.73841961852861,
+ "grad_norm": 11.271066665649414,
+ "learning_rate": 1.9984153958852605e-05,
+ "loss": 1.8032,
+ "step": 1739
+ },
+ {
+ "epoch": 4.741144414168938,
+ "grad_norm": 10.016924858093262,
+ "learning_rate": 1.998410425898748e-05,
+ "loss": 1.6357,
+ "step": 1740
+ },
+ {
+ "epoch": 4.743869209809264,
+ "grad_norm": 13.83434772491455,
+ "learning_rate": 1.9984054481366474e-05,
+ "loss": 1.8184,
+ "step": 1741
+ },
+ {
+ "epoch": 4.746594005449591,
+ "grad_norm": 11.466126441955566,
+ "learning_rate": 1.9984004625989974e-05,
+ "loss": 1.7693,
+ "step": 1742
+ },
+ {
+ "epoch": 4.7493188010899186,
+ "grad_norm": 10.852738380432129,
+ "learning_rate": 1.9983954692858363e-05,
+ "loss": 1.5586,
+ "step": 1743
+ },
+ {
+ "epoch": 4.752043596730245,
+ "grad_norm": 11.944601058959961,
+ "learning_rate": 1.9983904681972034e-05,
+ "loss": 1.7754,
+ "step": 1744
+ },
+ {
+ "epoch": 4.754768392370572,
+ "grad_norm": 12.560547828674316,
+ "learning_rate": 1.998385459333138e-05,
+ "loss": 1.6797,
+ "step": 1745
+ },
+ {
+ "epoch": 4.7574931880108995,
+ "grad_norm": 12.880969047546387,
+ "learning_rate": 1.9983804426936787e-05,
+ "loss": 2.043,
+ "step": 1746
+ },
+ {
+ "epoch": 4.760217983651226,
+ "grad_norm": 10.755345344543457,
+ "learning_rate": 1.9983754182788647e-05,
+ "loss": 1.8086,
+ "step": 1747
+ },
+ {
+ "epoch": 4.762942779291553,
+ "grad_norm": 11.871491432189941,
+ "learning_rate": 1.9983703860887355e-05,
+ "loss": 1.7256,
+ "step": 1748
+ },
+ {
+ "epoch": 4.76566757493188,
+ "grad_norm": 10.811038970947266,
+ "learning_rate": 1.998365346123329e-05,
+ "loss": 1.6748,
+ "step": 1749
+ },
+ {
+ "epoch": 4.768392370572207,
+ "grad_norm": 12.117204666137695,
+ "learning_rate": 1.998360298382686e-05,
+ "loss": 1.9011,
+ "step": 1750
+ },
+ {
+ "epoch": 4.771117166212534,
+ "grad_norm": 12.1402587890625,
+ "learning_rate": 1.9983552428668448e-05,
+ "loss": 1.9209,
+ "step": 1751
+ },
+ {
+ "epoch": 4.773841961852861,
+ "grad_norm": 14.859792709350586,
+ "learning_rate": 1.998350179575845e-05,
+ "loss": 1.9126,
+ "step": 1752
+ },
+ {
+ "epoch": 4.776566757493188,
+ "grad_norm": 11.106743812561035,
+ "learning_rate": 1.9983451085097262e-05,
+ "loss": 1.8184,
+ "step": 1753
+ },
+ {
+ "epoch": 4.779291553133515,
+ "grad_norm": 16.94355583190918,
+ "learning_rate": 1.998340029668528e-05,
+ "loss": 1.6704,
+ "step": 1754
+ },
+ {
+ "epoch": 4.782016348773842,
+ "grad_norm": 9.108786582946777,
+ "learning_rate": 1.9983349430522896e-05,
+ "loss": 1.5703,
+ "step": 1755
+ },
+ {
+ "epoch": 4.784741144414169,
+ "grad_norm": 14.48527717590332,
+ "learning_rate": 1.9983298486610508e-05,
+ "loss": 1.6475,
+ "step": 1756
+ },
+ {
+ "epoch": 4.787465940054496,
+ "grad_norm": 10.127340316772461,
+ "learning_rate": 1.9983247464948515e-05,
+ "loss": 1.6936,
+ "step": 1757
+ },
+ {
+ "epoch": 4.790190735694823,
+ "grad_norm": 9.771352767944336,
+ "learning_rate": 1.9983196365537313e-05,
+ "loss": 1.6338,
+ "step": 1758
+ },
+ {
+ "epoch": 4.79291553133515,
+ "grad_norm": 11.561280250549316,
+ "learning_rate": 1.9983145188377297e-05,
+ "loss": 1.8057,
+ "step": 1759
+ },
+ {
+ "epoch": 4.795640326975477,
+ "grad_norm": 10.189553260803223,
+ "learning_rate": 1.9983093933468864e-05,
+ "loss": 1.5601,
+ "step": 1760
+ },
+ {
+ "epoch": 4.798365122615804,
+ "grad_norm": 10.330784797668457,
+ "learning_rate": 1.9983042600812423e-05,
+ "loss": 1.7271,
+ "step": 1761
+ },
+ {
+ "epoch": 4.801089918256131,
+ "grad_norm": 9.032349586486816,
+ "learning_rate": 1.9982991190408362e-05,
+ "loss": 1.5364,
+ "step": 1762
+ },
+ {
+ "epoch": 4.8038147138964575,
+ "grad_norm": 9.430227279663086,
+ "learning_rate": 1.9982939702257088e-05,
+ "loss": 1.7295,
+ "step": 1763
+ },
+ {
+ "epoch": 4.806539509536785,
+ "grad_norm": 13.426956176757812,
+ "learning_rate": 1.9982888136359e-05,
+ "loss": 2.0376,
+ "step": 1764
+ },
+ {
+ "epoch": 4.809264305177112,
+ "grad_norm": 9.60643196105957,
+ "learning_rate": 1.9982836492714505e-05,
+ "loss": 1.439,
+ "step": 1765
+ },
+ {
+ "epoch": 4.8119891008174385,
+ "grad_norm": 11.653831481933594,
+ "learning_rate": 1.9982784771324e-05,
+ "loss": 1.6733,
+ "step": 1766
+ },
+ {
+ "epoch": 4.814713896457766,
+ "grad_norm": 9.333499908447266,
+ "learning_rate": 1.9982732972187884e-05,
+ "loss": 1.7495,
+ "step": 1767
+ },
+ {
+ "epoch": 4.817438692098093,
+ "grad_norm": 10.512800216674805,
+ "learning_rate": 1.998268109530657e-05,
+ "loss": 1.6362,
+ "step": 1768
+ },
+ {
+ "epoch": 4.820163487738419,
+ "grad_norm": 11.654182434082031,
+ "learning_rate": 1.9982629140680453e-05,
+ "loss": 1.8032,
+ "step": 1769
+ },
+ {
+ "epoch": 4.822888283378747,
+ "grad_norm": 9.613519668579102,
+ "learning_rate": 1.9982577108309945e-05,
+ "loss": 1.7002,
+ "step": 1770
+ },
+ {
+ "epoch": 4.825613079019074,
+ "grad_norm": 10.996225357055664,
+ "learning_rate": 1.9982524998195446e-05,
+ "loss": 1.8635,
+ "step": 1771
+ },
+ {
+ "epoch": 4.8283378746594,
+ "grad_norm": 10.677639961242676,
+ "learning_rate": 1.9982472810337363e-05,
+ "loss": 1.6965,
+ "step": 1772
+ },
+ {
+ "epoch": 4.831062670299728,
+ "grad_norm": 11.29150104522705,
+ "learning_rate": 1.9982420544736106e-05,
+ "loss": 1.9971,
+ "step": 1773
+ },
+ {
+ "epoch": 4.833787465940055,
+ "grad_norm": 12.019180297851562,
+ "learning_rate": 1.9982368201392074e-05,
+ "loss": 1.5317,
+ "step": 1774
+ },
+ {
+ "epoch": 4.836512261580381,
+ "grad_norm": 11.11221981048584,
+ "learning_rate": 1.998231578030568e-05,
+ "loss": 1.6997,
+ "step": 1775
+ },
+ {
+ "epoch": 4.839237057220709,
+ "grad_norm": 13.890466690063477,
+ "learning_rate": 1.9982263281477338e-05,
+ "loss": 1.7688,
+ "step": 1776
+ },
+ {
+ "epoch": 4.8419618528610355,
+ "grad_norm": 10.007216453552246,
+ "learning_rate": 1.9982210704907446e-05,
+ "loss": 1.7949,
+ "step": 1777
+ },
+ {
+ "epoch": 4.844686648501362,
+ "grad_norm": 11.3532133102417,
+ "learning_rate": 1.998215805059642e-05,
+ "loss": 1.624,
+ "step": 1778
+ },
+ {
+ "epoch": 4.84741144414169,
+ "grad_norm": 12.174700736999512,
+ "learning_rate": 1.998210531854467e-05,
+ "loss": 1.8188,
+ "step": 1779
+ },
+ {
+ "epoch": 4.8501362397820165,
+ "grad_norm": 9.562557220458984,
+ "learning_rate": 1.9982052508752605e-05,
+ "loss": 1.7285,
+ "step": 1780
+ },
+ {
+ "epoch": 4.852861035422343,
+ "grad_norm": 11.95835018157959,
+ "learning_rate": 1.998199962122063e-05,
+ "loss": 1.5879,
+ "step": 1781
+ },
+ {
+ "epoch": 4.855585831062671,
+ "grad_norm": 8.104500770568848,
+ "learning_rate": 1.998194665594917e-05,
+ "loss": 1.7051,
+ "step": 1782
+ },
+ {
+ "epoch": 4.858310626702997,
+ "grad_norm": 10.136801719665527,
+ "learning_rate": 1.9981893612938624e-05,
+ "loss": 1.9111,
+ "step": 1783
+ },
+ {
+ "epoch": 4.861035422343324,
+ "grad_norm": 10.49084186553955,
+ "learning_rate": 1.998184049218942e-05,
+ "loss": 1.8105,
+ "step": 1784
+ },
+ {
+ "epoch": 4.863760217983652,
+ "grad_norm": 8.479459762573242,
+ "learning_rate": 1.9981787293701956e-05,
+ "loss": 1.6277,
+ "step": 1785
+ },
+ {
+ "epoch": 4.866485013623978,
+ "grad_norm": 20.927406311035156,
+ "learning_rate": 1.998173401747666e-05,
+ "loss": 1.7363,
+ "step": 1786
+ },
+ {
+ "epoch": 4.869209809264305,
+ "grad_norm": 10.920572280883789,
+ "learning_rate": 1.998168066351394e-05,
+ "loss": 1.8013,
+ "step": 1787
+ },
+ {
+ "epoch": 4.871934604904633,
+ "grad_norm": 9.645325660705566,
+ "learning_rate": 1.9981627231814207e-05,
+ "loss": 1.9629,
+ "step": 1788
+ },
+ {
+ "epoch": 4.874659400544959,
+ "grad_norm": 10.725105285644531,
+ "learning_rate": 1.9981573722377888e-05,
+ "loss": 1.7422,
+ "step": 1789
+ },
+ {
+ "epoch": 4.877384196185286,
+ "grad_norm": 19.972970962524414,
+ "learning_rate": 1.998152013520539e-05,
+ "loss": 1.7646,
+ "step": 1790
+ },
+ {
+ "epoch": 4.8801089918256135,
+ "grad_norm": 10.030486106872559,
+ "learning_rate": 1.9981466470297136e-05,
+ "loss": 1.9072,
+ "step": 1791
+ },
+ {
+ "epoch": 4.88283378746594,
+ "grad_norm": 11.005029678344727,
+ "learning_rate": 1.9981412727653544e-05,
+ "loss": 1.4939,
+ "step": 1792
+ },
+ {
+ "epoch": 4.885558583106267,
+ "grad_norm": 14.201371192932129,
+ "learning_rate": 1.998135890727503e-05,
+ "loss": 1.897,
+ "step": 1793
+ },
+ {
+ "epoch": 4.8882833787465945,
+ "grad_norm": 15.717061042785645,
+ "learning_rate": 1.998130500916201e-05,
+ "loss": 1.7451,
+ "step": 1794
+ },
+ {
+ "epoch": 4.891008174386921,
+ "grad_norm": 11.440669059753418,
+ "learning_rate": 1.9981251033314914e-05,
+ "loss": 1.5527,
+ "step": 1795
+ },
+ {
+ "epoch": 4.893732970027248,
+ "grad_norm": 10.5989990234375,
+ "learning_rate": 1.9981196979734157e-05,
+ "loss": 1.876,
+ "step": 1796
+ },
+ {
+ "epoch": 4.896457765667575,
+ "grad_norm": 13.592907905578613,
+ "learning_rate": 1.9981142848420152e-05,
+ "loss": 1.6316,
+ "step": 1797
+ },
+ {
+ "epoch": 4.899182561307902,
+ "grad_norm": 20.18497085571289,
+ "learning_rate": 1.9981088639373335e-05,
+ "loss": 1.9888,
+ "step": 1798
+ },
+ {
+ "epoch": 4.901907356948229,
+ "grad_norm": 9.938689231872559,
+ "learning_rate": 1.9981034352594117e-05,
+ "loss": 1.6448,
+ "step": 1799
+ },
+ {
+ "epoch": 4.904632152588556,
+ "grad_norm": 7.556951999664307,
+ "learning_rate": 1.9980979988082923e-05,
+ "loss": 1.7573,
+ "step": 1800
+ },
+ {
+ "epoch": 4.907356948228883,
+ "grad_norm": 9.85840129852295,
+ "learning_rate": 1.9980925545840183e-05,
+ "loss": 1.752,
+ "step": 1801
+ },
+ {
+ "epoch": 4.91008174386921,
+ "grad_norm": 8.957093238830566,
+ "learning_rate": 1.9980871025866314e-05,
+ "loss": 1.7471,
+ "step": 1802
+ },
+ {
+ "epoch": 4.912806539509537,
+ "grad_norm": 12.380105972290039,
+ "learning_rate": 1.998081642816174e-05,
+ "loss": 1.6592,
+ "step": 1803
+ },
+ {
+ "epoch": 4.915531335149864,
+ "grad_norm": 7.244705677032471,
+ "learning_rate": 1.998076175272689e-05,
+ "loss": 1.6409,
+ "step": 1804
+ },
+ {
+ "epoch": 4.918256130790191,
+ "grad_norm": 10.387642860412598,
+ "learning_rate": 1.998070699956219e-05,
+ "loss": 1.7148,
+ "step": 1805
+ },
+ {
+ "epoch": 4.920980926430518,
+ "grad_norm": 9.52930736541748,
+ "learning_rate": 1.9980652168668063e-05,
+ "loss": 1.8584,
+ "step": 1806
+ },
+ {
+ "epoch": 4.923705722070845,
+ "grad_norm": 10.156198501586914,
+ "learning_rate": 1.9980597260044944e-05,
+ "loss": 1.7664,
+ "step": 1807
+ },
+ {
+ "epoch": 4.926430517711172,
+ "grad_norm": 10.294306755065918,
+ "learning_rate": 1.998054227369325e-05,
+ "loss": 1.9492,
+ "step": 1808
+ },
+ {
+ "epoch": 4.929155313351498,
+ "grad_norm": 8.773594856262207,
+ "learning_rate": 1.998048720961341e-05,
+ "loss": 1.7065,
+ "step": 1809
+ },
+ {
+ "epoch": 4.931880108991826,
+ "grad_norm": 10.288111686706543,
+ "learning_rate": 1.9980432067805865e-05,
+ "loss": 1.7935,
+ "step": 1810
+ },
+ {
+ "epoch": 4.9346049046321525,
+ "grad_norm": 9.438074111938477,
+ "learning_rate": 1.9980376848271032e-05,
+ "loss": 1.7935,
+ "step": 1811
+ },
+ {
+ "epoch": 4.937329700272479,
+ "grad_norm": 9.358190536499023,
+ "learning_rate": 1.998032155100935e-05,
+ "loss": 1.6648,
+ "step": 1812
+ },
+ {
+ "epoch": 4.940054495912807,
+ "grad_norm": 14.03318977355957,
+ "learning_rate": 1.998026617602124e-05,
+ "loss": 1.8315,
+ "step": 1813
+ },
+ {
+ "epoch": 4.9427792915531334,
+ "grad_norm": 12.71858024597168,
+ "learning_rate": 1.998021072330714e-05,
+ "loss": 1.6411,
+ "step": 1814
+ },
+ {
+ "epoch": 4.94550408719346,
+ "grad_norm": 9.145251274108887,
+ "learning_rate": 1.9980155192867477e-05,
+ "loss": 1.8184,
+ "step": 1815
+ },
+ {
+ "epoch": 4.948228882833788,
+ "grad_norm": 11.447920799255371,
+ "learning_rate": 1.998009958470269e-05,
+ "loss": 1.8403,
+ "step": 1816
+ },
+ {
+ "epoch": 4.950953678474114,
+ "grad_norm": 12.897775650024414,
+ "learning_rate": 1.9980043898813206e-05,
+ "loss": 1.8479,
+ "step": 1817
+ },
+ {
+ "epoch": 4.953678474114441,
+ "grad_norm": 9.578463554382324,
+ "learning_rate": 1.9979988135199464e-05,
+ "loss": 1.7861,
+ "step": 1818
+ },
+ {
+ "epoch": 4.956403269754769,
+ "grad_norm": 9.109416007995605,
+ "learning_rate": 1.9979932293861895e-05,
+ "loss": 1.7188,
+ "step": 1819
+ },
+ {
+ "epoch": 4.959128065395095,
+ "grad_norm": 10.429159164428711,
+ "learning_rate": 1.9979876374800935e-05,
+ "loss": 1.4775,
+ "step": 1820
+ },
+ {
+ "epoch": 4.961852861035422,
+ "grad_norm": 9.446931838989258,
+ "learning_rate": 1.9979820378017017e-05,
+ "loss": 1.5884,
+ "step": 1821
+ },
+ {
+ "epoch": 4.96457765667575,
+ "grad_norm": 13.700077056884766,
+ "learning_rate": 1.997976430351058e-05,
+ "loss": 1.8855,
+ "step": 1822
+ },
+ {
+ "epoch": 4.967302452316076,
+ "grad_norm": 10.119503021240234,
+ "learning_rate": 1.997970815128206e-05,
+ "loss": 1.6887,
+ "step": 1823
+ },
+ {
+ "epoch": 4.970027247956403,
+ "grad_norm": 12.266241073608398,
+ "learning_rate": 1.9979651921331893e-05,
+ "loss": 1.8296,
+ "step": 1824
+ },
+ {
+ "epoch": 4.9727520435967305,
+ "grad_norm": 10.371781349182129,
+ "learning_rate": 1.997959561366052e-05,
+ "loss": 1.8691,
+ "step": 1825
+ },
+ {
+ "epoch": 4.975476839237057,
+ "grad_norm": 9.75312328338623,
+ "learning_rate": 1.9979539228268377e-05,
+ "loss": 1.9424,
+ "step": 1826
+ },
+ {
+ "epoch": 4.978201634877384,
+ "grad_norm": 9.707611083984375,
+ "learning_rate": 1.9979482765155905e-05,
+ "loss": 1.6619,
+ "step": 1827
+ },
+ {
+ "epoch": 4.9809264305177114,
+ "grad_norm": 12.377727508544922,
+ "learning_rate": 1.997942622432354e-05,
+ "loss": 1.6523,
+ "step": 1828
+ },
+ {
+ "epoch": 4.983651226158038,
+ "grad_norm": 9.129666328430176,
+ "learning_rate": 1.9979369605771722e-05,
+ "loss": 1.7437,
+ "step": 1829
+ },
+ {
+ "epoch": 4.986376021798365,
+ "grad_norm": 10.96391487121582,
+ "learning_rate": 1.9979312909500902e-05,
+ "loss": 1.5151,
+ "step": 1830
+ },
+ {
+ "epoch": 4.989100817438692,
+ "grad_norm": 8.620485305786133,
+ "learning_rate": 1.997925613551151e-05,
+ "loss": 1.7695,
+ "step": 1831
+ },
+ {
+ "epoch": 4.991825613079019,
+ "grad_norm": 9.796248435974121,
+ "learning_rate": 1.9979199283803994e-05,
+ "loss": 1.7188,
+ "step": 1832
+ },
+ {
+ "epoch": 4.994550408719346,
+ "grad_norm": 11.4308443069458,
+ "learning_rate": 1.9979142354378793e-05,
+ "loss": 1.7048,
+ "step": 1833
+ },
+ {
+ "epoch": 4.997275204359673,
+ "grad_norm": 11.859092712402344,
+ "learning_rate": 1.9979085347236355e-05,
+ "loss": 1.7302,
+ "step": 1834
+ },
+ {
+ "epoch": 5.0,
+ "grad_norm": 9.439201354980469,
+ "learning_rate": 1.997902826237712e-05,
+ "loss": 1.7229,
+ "step": 1835
+ },
+ {
+ "epoch": 5.002724795640327,
+ "grad_norm": 9.204095840454102,
+ "learning_rate": 1.9978971099801532e-05,
+ "loss": 1.4448,
+ "step": 1836
+ },
+ {
+ "epoch": 5.005449591280654,
+ "grad_norm": 7.906982421875,
+ "learning_rate": 1.997891385951004e-05,
+ "loss": 1.6667,
+ "step": 1837
+ },
+ {
+ "epoch": 5.008174386920981,
+ "grad_norm": 10.754129409790039,
+ "learning_rate": 1.997885654150309e-05,
+ "loss": 1.6953,
+ "step": 1838
+ },
+ {
+ "epoch": 5.010899182561308,
+ "grad_norm": 10.338284492492676,
+ "learning_rate": 1.9978799145781123e-05,
+ "loss": 1.9326,
+ "step": 1839
+ },
+ {
+ "epoch": 5.013623978201635,
+ "grad_norm": 8.468027114868164,
+ "learning_rate": 1.9978741672344594e-05,
+ "loss": 1.4824,
+ "step": 1840
+ },
+ {
+ "epoch": 5.016348773841962,
+ "grad_norm": 12.986717224121094,
+ "learning_rate": 1.9978684121193944e-05,
+ "loss": 1.6636,
+ "step": 1841
+ },
+ {
+ "epoch": 5.0190735694822886,
+ "grad_norm": 8.562746047973633,
+ "learning_rate": 1.997862649232962e-05,
+ "loss": 1.6724,
+ "step": 1842
+ },
+ {
+ "epoch": 5.021798365122616,
+ "grad_norm": 10.53598690032959,
+ "learning_rate": 1.9978568785752077e-05,
+ "loss": 1.6729,
+ "step": 1843
+ },
+ {
+ "epoch": 5.024523160762943,
+ "grad_norm": 11.25537109375,
+ "learning_rate": 1.997851100146176e-05,
+ "loss": 1.6594,
+ "step": 1844
+ },
+ {
+ "epoch": 5.0272479564032695,
+ "grad_norm": 9.552088737487793,
+ "learning_rate": 1.9978453139459123e-05,
+ "loss": 1.5952,
+ "step": 1845
+ },
+ {
+ "epoch": 5.029972752043597,
+ "grad_norm": 8.246376991271973,
+ "learning_rate": 1.997839519974461e-05,
+ "loss": 1.4541,
+ "step": 1846
+ },
+ {
+ "epoch": 5.032697547683924,
+ "grad_norm": 11.155094146728516,
+ "learning_rate": 1.9978337182318678e-05,
+ "loss": 1.5488,
+ "step": 1847
+ },
+ {
+ "epoch": 5.03542234332425,
+ "grad_norm": 9.724387168884277,
+ "learning_rate": 1.997827908718178e-05,
+ "loss": 1.7109,
+ "step": 1848
+ },
+ {
+ "epoch": 5.038147138964578,
+ "grad_norm": 11.168493270874023,
+ "learning_rate": 1.9978220914334363e-05,
+ "loss": 1.7383,
+ "step": 1849
+ },
+ {
+ "epoch": 5.040871934604905,
+ "grad_norm": 10.093647003173828,
+ "learning_rate": 1.9978162663776882e-05,
+ "loss": 1.7061,
+ "step": 1850
+ },
+ {
+ "epoch": 5.043596730245231,
+ "grad_norm": 9.386709213256836,
+ "learning_rate": 1.9978104335509796e-05,
+ "loss": 1.5657,
+ "step": 1851
+ },
+ {
+ "epoch": 5.046321525885559,
+ "grad_norm": 9.914746284484863,
+ "learning_rate": 1.997804592953355e-05,
+ "loss": 1.6787,
+ "step": 1852
+ },
+ {
+ "epoch": 5.049046321525886,
+ "grad_norm": 9.252211570739746,
+ "learning_rate": 1.9977987445848604e-05,
+ "loss": 1.6392,
+ "step": 1853
+ },
+ {
+ "epoch": 5.051771117166212,
+ "grad_norm": 8.123111724853516,
+ "learning_rate": 1.9977928884455412e-05,
+ "loss": 1.3396,
+ "step": 1854
+ },
+ {
+ "epoch": 5.05449591280654,
+ "grad_norm": 28.510730743408203,
+ "learning_rate": 1.9977870245354435e-05,
+ "loss": 1.8601,
+ "step": 1855
+ },
+ {
+ "epoch": 5.0572207084468666,
+ "grad_norm": 11.948402404785156,
+ "learning_rate": 1.9977811528546124e-05,
+ "loss": 1.7791,
+ "step": 1856
+ },
+ {
+ "epoch": 5.059945504087193,
+ "grad_norm": 8.497076988220215,
+ "learning_rate": 1.9977752734030935e-05,
+ "loss": 1.7415,
+ "step": 1857
+ },
+ {
+ "epoch": 5.062670299727521,
+ "grad_norm": 8.519002914428711,
+ "learning_rate": 1.9977693861809333e-05,
+ "loss": 1.5273,
+ "step": 1858
+ },
+ {
+ "epoch": 5.0653950953678475,
+ "grad_norm": 10.040315628051758,
+ "learning_rate": 1.997763491188177e-05,
+ "loss": 1.5908,
+ "step": 1859
+ },
+ {
+ "epoch": 5.068119891008174,
+ "grad_norm": 8.36683177947998,
+ "learning_rate": 1.9977575884248707e-05,
+ "loss": 1.4683,
+ "step": 1860
+ },
+ {
+ "epoch": 5.070844686648502,
+ "grad_norm": 13.225173950195312,
+ "learning_rate": 1.9977516778910607e-05,
+ "loss": 1.7437,
+ "step": 1861
+ },
+ {
+ "epoch": 5.073569482288828,
+ "grad_norm": 12.044672012329102,
+ "learning_rate": 1.9977457595867924e-05,
+ "loss": 1.7295,
+ "step": 1862
+ },
+ {
+ "epoch": 5.076294277929155,
+ "grad_norm": 11.419569969177246,
+ "learning_rate": 1.9977398335121126e-05,
+ "loss": 1.833,
+ "step": 1863
+ },
+ {
+ "epoch": 5.079019073569483,
+ "grad_norm": 9.895974159240723,
+ "learning_rate": 1.9977338996670665e-05,
+ "loss": 1.5835,
+ "step": 1864
+ },
+ {
+ "epoch": 5.081743869209809,
+ "grad_norm": 9.599562644958496,
+ "learning_rate": 1.9977279580517014e-05,
+ "loss": 1.6733,
+ "step": 1865
+ },
+ {
+ "epoch": 5.084468664850136,
+ "grad_norm": 8.531063079833984,
+ "learning_rate": 1.997722008666063e-05,
+ "loss": 1.708,
+ "step": 1866
+ },
+ {
+ "epoch": 5.087193460490464,
+ "grad_norm": 9.288894653320312,
+ "learning_rate": 1.9977160515101975e-05,
+ "loss": 1.5151,
+ "step": 1867
+ },
+ {
+ "epoch": 5.08991825613079,
+ "grad_norm": 10.671904563903809,
+ "learning_rate": 1.9977100865841516e-05,
+ "loss": 1.7759,
+ "step": 1868
+ },
+ {
+ "epoch": 5.092643051771117,
+ "grad_norm": 12.006613731384277,
+ "learning_rate": 1.997704113887972e-05,
+ "loss": 1.8088,
+ "step": 1869
+ },
+ {
+ "epoch": 5.0953678474114446,
+ "grad_norm": 10.795671463012695,
+ "learning_rate": 1.9976981334217046e-05,
+ "loss": 1.7363,
+ "step": 1870
+ },
+ {
+ "epoch": 5.098092643051771,
+ "grad_norm": 8.825675010681152,
+ "learning_rate": 1.997692145185396e-05,
+ "loss": 1.7041,
+ "step": 1871
+ },
+ {
+ "epoch": 5.100817438692098,
+ "grad_norm": 13.146547317504883,
+ "learning_rate": 1.9976861491790936e-05,
+ "loss": 1.7576,
+ "step": 1872
+ },
+ {
+ "epoch": 5.1035422343324255,
+ "grad_norm": 9.561686515808105,
+ "learning_rate": 1.997680145402843e-05,
+ "loss": 1.7068,
+ "step": 1873
+ },
+ {
+ "epoch": 5.106267029972752,
+ "grad_norm": 10.36915111541748,
+ "learning_rate": 1.997674133856692e-05,
+ "loss": 1.7524,
+ "step": 1874
+ },
+ {
+ "epoch": 5.108991825613079,
+ "grad_norm": 8.635497093200684,
+ "learning_rate": 1.997668114540687e-05,
+ "loss": 1.7163,
+ "step": 1875
+ },
+ {
+ "epoch": 5.111716621253406,
+ "grad_norm": 13.613897323608398,
+ "learning_rate": 1.997662087454874e-05,
+ "loss": 1.811,
+ "step": 1876
+ },
+ {
+ "epoch": 5.114441416893733,
+ "grad_norm": 10.332918167114258,
+ "learning_rate": 1.9976560525993015e-05,
+ "loss": 1.4631,
+ "step": 1877
+ },
+ {
+ "epoch": 5.11716621253406,
+ "grad_norm": 9.466386795043945,
+ "learning_rate": 1.997650009974016e-05,
+ "loss": 1.4214,
+ "step": 1878
+ },
+ {
+ "epoch": 5.1198910081743865,
+ "grad_norm": 9.696146011352539,
+ "learning_rate": 1.997643959579064e-05,
+ "loss": 1.4692,
+ "step": 1879
+ },
+ {
+ "epoch": 5.122615803814714,
+ "grad_norm": 11.486430168151855,
+ "learning_rate": 1.997637901414493e-05,
+ "loss": 1.6816,
+ "step": 1880
+ },
+ {
+ "epoch": 5.125340599455041,
+ "grad_norm": 14.753457069396973,
+ "learning_rate": 1.99763183548035e-05,
+ "loss": 1.5132,
+ "step": 1881
+ },
+ {
+ "epoch": 5.128065395095367,
+ "grad_norm": 11.152593612670898,
+ "learning_rate": 1.9976257617766824e-05,
+ "loss": 1.6729,
+ "step": 1882
+ },
+ {
+ "epoch": 5.130790190735695,
+ "grad_norm": 10.37635612487793,
+ "learning_rate": 1.9976196803035375e-05,
+ "loss": 1.575,
+ "step": 1883
+ },
+ {
+ "epoch": 5.133514986376022,
+ "grad_norm": 10.139860153198242,
+ "learning_rate": 1.9976135910609627e-05,
+ "loss": 1.7305,
+ "step": 1884
+ },
+ {
+ "epoch": 5.136239782016348,
+ "grad_norm": 12.509878158569336,
+ "learning_rate": 1.9976074940490052e-05,
+ "loss": 1.6179,
+ "step": 1885
+ },
+ {
+ "epoch": 5.138964577656676,
+ "grad_norm": 12.507528305053711,
+ "learning_rate": 1.997601389267713e-05,
+ "loss": 1.6895,
+ "step": 1886
+ },
+ {
+ "epoch": 5.141689373297003,
+ "grad_norm": 16.414642333984375,
+ "learning_rate": 1.997595276717133e-05,
+ "loss": 1.71,
+ "step": 1887
+ },
+ {
+ "epoch": 5.144414168937329,
+ "grad_norm": 12.145785331726074,
+ "learning_rate": 1.9975891563973132e-05,
+ "loss": 1.6699,
+ "step": 1888
+ },
+ {
+ "epoch": 5.147138964577657,
+ "grad_norm": 14.2864990234375,
+ "learning_rate": 1.997583028308301e-05,
+ "loss": 1.7114,
+ "step": 1889
+ },
+ {
+ "epoch": 5.1498637602179835,
+ "grad_norm": 16.97840690612793,
+ "learning_rate": 1.9975768924501444e-05,
+ "loss": 1.5745,
+ "step": 1890
+ },
+ {
+ "epoch": 5.15258855585831,
+ "grad_norm": 12.979388236999512,
+ "learning_rate": 1.997570748822891e-05,
+ "loss": 1.7158,
+ "step": 1891
+ },
+ {
+ "epoch": 5.155313351498638,
+ "grad_norm": 15.826199531555176,
+ "learning_rate": 1.997564597426589e-05,
+ "loss": 1.7612,
+ "step": 1892
+ },
+ {
+ "epoch": 5.1580381471389645,
+ "grad_norm": 15.385902404785156,
+ "learning_rate": 1.9975584382612855e-05,
+ "loss": 1.6587,
+ "step": 1893
+ },
+ {
+ "epoch": 5.160762942779291,
+ "grad_norm": 18.13292121887207,
+ "learning_rate": 1.9975522713270296e-05,
+ "loss": 1.5845,
+ "step": 1894
+ },
+ {
+ "epoch": 5.163487738419619,
+ "grad_norm": 11.18834114074707,
+ "learning_rate": 1.997546096623868e-05,
+ "loss": 1.6758,
+ "step": 1895
+ },
+ {
+ "epoch": 5.166212534059945,
+ "grad_norm": 10.812143325805664,
+ "learning_rate": 1.99753991415185e-05,
+ "loss": 1.7686,
+ "step": 1896
+ },
+ {
+ "epoch": 5.168937329700272,
+ "grad_norm": 16.42559814453125,
+ "learning_rate": 1.997533723911023e-05,
+ "loss": 1.6782,
+ "step": 1897
+ },
+ {
+ "epoch": 5.1716621253406,
+ "grad_norm": 13.681118965148926,
+ "learning_rate": 1.997527525901436e-05,
+ "loss": 1.8354,
+ "step": 1898
+ },
+ {
+ "epoch": 5.174386920980926,
+ "grad_norm": 47.688968658447266,
+ "learning_rate": 1.9975213201231363e-05,
+ "loss": 1.645,
+ "step": 1899
+ },
+ {
+ "epoch": 5.177111716621253,
+ "grad_norm": 14.734868049621582,
+ "learning_rate": 1.9975151065761728e-05,
+ "loss": 1.7627,
+ "step": 1900
+ },
+ {
+ "epoch": 5.179836512261581,
+ "grad_norm": 14.048941612243652,
+ "learning_rate": 1.9975088852605938e-05,
+ "loss": 1.7166,
+ "step": 1901
+ },
+ {
+ "epoch": 5.182561307901907,
+ "grad_norm": 10.565567970275879,
+ "learning_rate": 1.9975026561764474e-05,
+ "loss": 1.5193,
+ "step": 1902
+ },
+ {
+ "epoch": 5.185286103542234,
+ "grad_norm": 24.844717025756836,
+ "learning_rate": 1.9974964193237823e-05,
+ "loss": 1.8198,
+ "step": 1903
+ },
+ {
+ "epoch": 5.1880108991825615,
+ "grad_norm": 11.01167106628418,
+ "learning_rate": 1.9974901747026474e-05,
+ "loss": 1.5588,
+ "step": 1904
+ },
+ {
+ "epoch": 5.190735694822888,
+ "grad_norm": 12.473700523376465,
+ "learning_rate": 1.997483922313092e-05,
+ "loss": 1.6191,
+ "step": 1905
+ },
+ {
+ "epoch": 5.193460490463215,
+ "grad_norm": 19.939329147338867,
+ "learning_rate": 1.997477662155163e-05,
+ "loss": 1.6272,
+ "step": 1906
+ },
+ {
+ "epoch": 5.1961852861035425,
+ "grad_norm": 10.474801063537598,
+ "learning_rate": 1.99747139422891e-05,
+ "loss": 1.658,
+ "step": 1907
+ },
+ {
+ "epoch": 5.198910081743869,
+ "grad_norm": 9.368407249450684,
+ "learning_rate": 1.9974651185343822e-05,
+ "loss": 1.6333,
+ "step": 1908
+ },
+ {
+ "epoch": 5.201634877384196,
+ "grad_norm": 11.387381553649902,
+ "learning_rate": 1.997458835071628e-05,
+ "loss": 1.6475,
+ "step": 1909
+ },
+ {
+ "epoch": 5.204359673024523,
+ "grad_norm": 10.220231056213379,
+ "learning_rate": 1.9974525438406966e-05,
+ "loss": 1.8,
+ "step": 1910
+ },
+ {
+ "epoch": 5.20708446866485,
+ "grad_norm": 12.36602783203125,
+ "learning_rate": 1.9974462448416365e-05,
+ "loss": 1.686,
+ "step": 1911
+ },
+ {
+ "epoch": 5.209809264305177,
+ "grad_norm": 8.590251922607422,
+ "learning_rate": 1.9974399380744976e-05,
+ "loss": 1.647,
+ "step": 1912
+ },
+ {
+ "epoch": 5.212534059945504,
+ "grad_norm": 9.52476692199707,
+ "learning_rate": 1.9974336235393283e-05,
+ "loss": 1.6436,
+ "step": 1913
+ },
+ {
+ "epoch": 5.215258855585831,
+ "grad_norm": 13.15280532836914,
+ "learning_rate": 1.9974273012361784e-05,
+ "loss": 1.7412,
+ "step": 1914
+ },
+ {
+ "epoch": 5.217983651226158,
+ "grad_norm": 12.537514686584473,
+ "learning_rate": 1.9974209711650964e-05,
+ "loss": 1.7622,
+ "step": 1915
+ },
+ {
+ "epoch": 5.220708446866485,
+ "grad_norm": 14.053447723388672,
+ "learning_rate": 1.9974146333261323e-05,
+ "loss": 1.7861,
+ "step": 1916
+ },
+ {
+ "epoch": 5.223433242506812,
+ "grad_norm": 8.49190616607666,
+ "learning_rate": 1.997408287719335e-05,
+ "loss": 1.7324,
+ "step": 1917
+ },
+ {
+ "epoch": 5.226158038147139,
+ "grad_norm": 10.375123023986816,
+ "learning_rate": 1.997401934344754e-05,
+ "loss": 1.6785,
+ "step": 1918
+ },
+ {
+ "epoch": 5.228882833787466,
+ "grad_norm": 11.195998191833496,
+ "learning_rate": 1.997395573202439e-05,
+ "loss": 1.6948,
+ "step": 1919
+ },
+ {
+ "epoch": 5.231607629427793,
+ "grad_norm": 13.794561386108398,
+ "learning_rate": 1.997389204292439e-05,
+ "loss": 1.6665,
+ "step": 1920
+ },
+ {
+ "epoch": 5.23433242506812,
+ "grad_norm": 8.96519947052002,
+ "learning_rate": 1.9973828276148043e-05,
+ "loss": 1.4685,
+ "step": 1921
+ },
+ {
+ "epoch": 5.237057220708447,
+ "grad_norm": 9.925034523010254,
+ "learning_rate": 1.9973764431695844e-05,
+ "loss": 1.7209,
+ "step": 1922
+ },
+ {
+ "epoch": 5.239782016348774,
+ "grad_norm": 10.551443099975586,
+ "learning_rate": 1.9973700509568287e-05,
+ "loss": 1.8154,
+ "step": 1923
+ },
+ {
+ "epoch": 5.2425068119891005,
+ "grad_norm": 8.865917205810547,
+ "learning_rate": 1.997363650976587e-05,
+ "loss": 1.6018,
+ "step": 1924
+ },
+ {
+ "epoch": 5.245231607629428,
+ "grad_norm": 10.166401863098145,
+ "learning_rate": 1.9973572432289094e-05,
+ "loss": 1.7842,
+ "step": 1925
+ },
+ {
+ "epoch": 5.247956403269755,
+ "grad_norm": 9.873787879943848,
+ "learning_rate": 1.9973508277138457e-05,
+ "loss": 1.6418,
+ "step": 1926
+ },
+ {
+ "epoch": 5.2506811989100814,
+ "grad_norm": 30.08473777770996,
+ "learning_rate": 1.9973444044314458e-05,
+ "loss": 1.6238,
+ "step": 1927
+ },
+ {
+ "epoch": 5.253405994550409,
+ "grad_norm": 11.543693542480469,
+ "learning_rate": 1.99733797338176e-05,
+ "loss": 1.6841,
+ "step": 1928
+ },
+ {
+ "epoch": 5.256130790190736,
+ "grad_norm": 15.977535247802734,
+ "learning_rate": 1.9973315345648374e-05,
+ "loss": 1.8975,
+ "step": 1929
+ },
+ {
+ "epoch": 5.258855585831062,
+ "grad_norm": 11.794048309326172,
+ "learning_rate": 1.9973250879807295e-05,
+ "loss": 1.708,
+ "step": 1930
+ },
+ {
+ "epoch": 5.26158038147139,
+ "grad_norm": 11.914398193359375,
+ "learning_rate": 1.9973186336294857e-05,
+ "loss": 1.9424,
+ "step": 1931
+ },
+ {
+ "epoch": 5.264305177111717,
+ "grad_norm": 12.993264198303223,
+ "learning_rate": 1.9973121715111568e-05,
+ "loss": 1.7119,
+ "step": 1932
+ },
+ {
+ "epoch": 5.267029972752043,
+ "grad_norm": 8.076578140258789,
+ "learning_rate": 1.997305701625793e-05,
+ "loss": 1.5771,
+ "step": 1933
+ },
+ {
+ "epoch": 5.269754768392371,
+ "grad_norm": 22.118816375732422,
+ "learning_rate": 1.997299223973444e-05,
+ "loss": 1.5959,
+ "step": 1934
+ },
+ {
+ "epoch": 5.272479564032698,
+ "grad_norm": 13.975380897521973,
+ "learning_rate": 1.997292738554161e-05,
+ "loss": 1.7395,
+ "step": 1935
+ },
+ {
+ "epoch": 5.275204359673024,
+ "grad_norm": 28.772640228271484,
+ "learning_rate": 1.997286245367994e-05,
+ "loss": 1.792,
+ "step": 1936
+ },
+ {
+ "epoch": 5.277929155313352,
+ "grad_norm": 12.679280281066895,
+ "learning_rate": 1.997279744414994e-05,
+ "loss": 1.6987,
+ "step": 1937
+ },
+ {
+ "epoch": 5.2806539509536785,
+ "grad_norm": 10.289875984191895,
+ "learning_rate": 1.9972732356952115e-05,
+ "loss": 1.8115,
+ "step": 1938
+ },
+ {
+ "epoch": 5.283378746594005,
+ "grad_norm": 9.017131805419922,
+ "learning_rate": 1.997266719208697e-05,
+ "loss": 1.4751,
+ "step": 1939
+ },
+ {
+ "epoch": 5.286103542234333,
+ "grad_norm": 11.865049362182617,
+ "learning_rate": 1.9972601949555015e-05,
+ "loss": 2.021,
+ "step": 1940
+ },
+ {
+ "epoch": 5.2888283378746594,
+ "grad_norm": 15.10794734954834,
+ "learning_rate": 1.9972536629356756e-05,
+ "loss": 1.8965,
+ "step": 1941
+ },
+ {
+ "epoch": 5.291553133514986,
+ "grad_norm": 11.373397827148438,
+ "learning_rate": 1.99724712314927e-05,
+ "loss": 1.8027,
+ "step": 1942
+ },
+ {
+ "epoch": 5.294277929155314,
+ "grad_norm": 12.007485389709473,
+ "learning_rate": 1.9972405755963362e-05,
+ "loss": 1.7007,
+ "step": 1943
+ },
+ {
+ "epoch": 5.29700272479564,
+ "grad_norm": 11.727828025817871,
+ "learning_rate": 1.997234020276925e-05,
+ "loss": 1.6819,
+ "step": 1944
+ },
+ {
+ "epoch": 5.299727520435967,
+ "grad_norm": 23.94923973083496,
+ "learning_rate": 1.9972274571910873e-05,
+ "loss": 1.5952,
+ "step": 1945
+ },
+ {
+ "epoch": 5.302452316076295,
+ "grad_norm": 15.61506175994873,
+ "learning_rate": 1.9972208863388744e-05,
+ "loss": 1.5334,
+ "step": 1946
+ },
+ {
+ "epoch": 5.305177111716621,
+ "grad_norm": 10.43548583984375,
+ "learning_rate": 1.997214307720337e-05,
+ "loss": 1.7183,
+ "step": 1947
+ },
+ {
+ "epoch": 5.307901907356948,
+ "grad_norm": 15.498167991638184,
+ "learning_rate": 1.997207721335527e-05,
+ "loss": 1.7815,
+ "step": 1948
+ },
+ {
+ "epoch": 5.310626702997276,
+ "grad_norm": 10.394688606262207,
+ "learning_rate": 1.997201127184495e-05,
+ "loss": 1.8184,
+ "step": 1949
+ },
+ {
+ "epoch": 5.313351498637602,
+ "grad_norm": 10.260842323303223,
+ "learning_rate": 1.9971945252672927e-05,
+ "loss": 1.7708,
+ "step": 1950
+ },
+ {
+ "epoch": 5.316076294277929,
+ "grad_norm": 10.0009765625,
+ "learning_rate": 1.9971879155839717e-05,
+ "loss": 1.6846,
+ "step": 1951
+ },
+ {
+ "epoch": 5.3188010899182565,
+ "grad_norm": 11.772761344909668,
+ "learning_rate": 1.9971812981345834e-05,
+ "loss": 1.5054,
+ "step": 1952
+ },
+ {
+ "epoch": 5.321525885558583,
+ "grad_norm": 14.363198280334473,
+ "learning_rate": 1.9971746729191792e-05,
+ "loss": 1.8584,
+ "step": 1953
+ },
+ {
+ "epoch": 5.32425068119891,
+ "grad_norm": 11.569507598876953,
+ "learning_rate": 1.9971680399378107e-05,
+ "loss": 1.5986,
+ "step": 1954
+ },
+ {
+ "epoch": 5.3269754768392374,
+ "grad_norm": 10.486541748046875,
+ "learning_rate": 1.9971613991905298e-05,
+ "loss": 1.4114,
+ "step": 1955
+ },
+ {
+ "epoch": 5.329700272479564,
+ "grad_norm": 9.989212989807129,
+ "learning_rate": 1.9971547506773875e-05,
+ "loss": 1.6077,
+ "step": 1956
+ },
+ {
+ "epoch": 5.332425068119891,
+ "grad_norm": 10.298331260681152,
+ "learning_rate": 1.9971480943984364e-05,
+ "loss": 1.7222,
+ "step": 1957
+ },
+ {
+ "epoch": 5.335149863760218,
+ "grad_norm": 13.963698387145996,
+ "learning_rate": 1.997141430353728e-05,
+ "loss": 1.5579,
+ "step": 1958
+ },
+ {
+ "epoch": 5.337874659400545,
+ "grad_norm": 9.665743827819824,
+ "learning_rate": 1.9971347585433145e-05,
+ "loss": 1.6621,
+ "step": 1959
+ },
+ {
+ "epoch": 5.340599455040872,
+ "grad_norm": 20.565250396728516,
+ "learning_rate": 1.9971280789672474e-05,
+ "loss": 1.4971,
+ "step": 1960
+ },
+ {
+ "epoch": 5.343324250681199,
+ "grad_norm": 9.76312255859375,
+ "learning_rate": 1.9971213916255788e-05,
+ "loss": 1.689,
+ "step": 1961
+ },
+ {
+ "epoch": 5.346049046321526,
+ "grad_norm": 13.125452041625977,
+ "learning_rate": 1.997114696518361e-05,
+ "loss": 1.6313,
+ "step": 1962
+ },
+ {
+ "epoch": 5.348773841961853,
+ "grad_norm": 10.671045303344727,
+ "learning_rate": 1.997107993645646e-05,
+ "loss": 1.5195,
+ "step": 1963
+ },
+ {
+ "epoch": 5.35149863760218,
+ "grad_norm": 12.833518028259277,
+ "learning_rate": 1.997101283007486e-05,
+ "loss": 1.8257,
+ "step": 1964
+ },
+ {
+ "epoch": 5.354223433242507,
+ "grad_norm": 13.581474304199219,
+ "learning_rate": 1.9970945646039336e-05,
+ "loss": 1.8911,
+ "step": 1965
+ },
+ {
+ "epoch": 5.356948228882834,
+ "grad_norm": 8.949580192565918,
+ "learning_rate": 1.9970878384350404e-05,
+ "loss": 1.5591,
+ "step": 1966
+ },
+ {
+ "epoch": 5.359673024523161,
+ "grad_norm": 8.894742965698242,
+ "learning_rate": 1.9970811045008592e-05,
+ "loss": 1.5896,
+ "step": 1967
+ },
+ {
+ "epoch": 5.362397820163488,
+ "grad_norm": 11.158965110778809,
+ "learning_rate": 1.9970743628014428e-05,
+ "loss": 1.7842,
+ "step": 1968
+ },
+ {
+ "epoch": 5.3651226158038146,
+ "grad_norm": 10.686578750610352,
+ "learning_rate": 1.997067613336843e-05,
+ "loss": 1.6257,
+ "step": 1969
+ },
+ {
+ "epoch": 5.367847411444142,
+ "grad_norm": 10.511839866638184,
+ "learning_rate": 1.997060856107113e-05,
+ "loss": 1.8301,
+ "step": 1970
+ },
+ {
+ "epoch": 5.370572207084469,
+ "grad_norm": 8.157552719116211,
+ "learning_rate": 1.9970540911123052e-05,
+ "loss": 1.6621,
+ "step": 1971
+ },
+ {
+ "epoch": 5.3732970027247955,
+ "grad_norm": 14.843273162841797,
+ "learning_rate": 1.997047318352472e-05,
+ "loss": 1.5149,
+ "step": 1972
+ },
+ {
+ "epoch": 5.376021798365123,
+ "grad_norm": 12.004420280456543,
+ "learning_rate": 1.9970405378276666e-05,
+ "loss": 1.6685,
+ "step": 1973
+ },
+ {
+ "epoch": 5.37874659400545,
+ "grad_norm": 11.34261417388916,
+ "learning_rate": 1.997033749537941e-05,
+ "loss": 1.8472,
+ "step": 1974
+ },
+ {
+ "epoch": 5.381471389645776,
+ "grad_norm": 11.158589363098145,
+ "learning_rate": 1.9970269534833492e-05,
+ "loss": 1.4712,
+ "step": 1975
+ },
+ {
+ "epoch": 5.384196185286104,
+ "grad_norm": 8.92293643951416,
+ "learning_rate": 1.9970201496639436e-05,
+ "loss": 1.6367,
+ "step": 1976
+ },
+ {
+ "epoch": 5.386920980926431,
+ "grad_norm": 8.600255966186523,
+ "learning_rate": 1.997013338079777e-05,
+ "loss": 1.5042,
+ "step": 1977
+ },
+ {
+ "epoch": 5.389645776566757,
+ "grad_norm": 9.92839527130127,
+ "learning_rate": 1.9970065187309025e-05,
+ "loss": 1.6592,
+ "step": 1978
+ },
+ {
+ "epoch": 5.392370572207085,
+ "grad_norm": 21.944948196411133,
+ "learning_rate": 1.9969996916173735e-05,
+ "loss": 1.9316,
+ "step": 1979
+ },
+ {
+ "epoch": 5.395095367847412,
+ "grad_norm": 12.78380012512207,
+ "learning_rate": 1.996992856739243e-05,
+ "loss": 1.8149,
+ "step": 1980
+ },
+ {
+ "epoch": 5.397820163487738,
+ "grad_norm": 11.880173683166504,
+ "learning_rate": 1.9969860140965643e-05,
+ "loss": 1.6606,
+ "step": 1981
+ },
+ {
+ "epoch": 5.400544959128065,
+ "grad_norm": 9.758583068847656,
+ "learning_rate": 1.9969791636893904e-05,
+ "loss": 1.6963,
+ "step": 1982
+ },
+ {
+ "epoch": 5.4032697547683926,
+ "grad_norm": 12.348323822021484,
+ "learning_rate": 1.9969723055177748e-05,
+ "loss": 1.7661,
+ "step": 1983
+ },
+ {
+ "epoch": 5.405994550408719,
+ "grad_norm": 18.636323928833008,
+ "learning_rate": 1.9969654395817714e-05,
+ "loss": 1.6973,
+ "step": 1984
+ },
+ {
+ "epoch": 5.408719346049046,
+ "grad_norm": 10.546487808227539,
+ "learning_rate": 1.9969585658814327e-05,
+ "loss": 1.8486,
+ "step": 1985
+ },
+ {
+ "epoch": 5.4114441416893735,
+ "grad_norm": 9.425722122192383,
+ "learning_rate": 1.9969516844168132e-05,
+ "loss": 1.5786,
+ "step": 1986
+ },
+ {
+ "epoch": 5.4141689373297,
+ "grad_norm": 10.106487274169922,
+ "learning_rate": 1.9969447951879655e-05,
+ "loss": 1.8281,
+ "step": 1987
+ },
+ {
+ "epoch": 5.416893732970027,
+ "grad_norm": 9.693245887756348,
+ "learning_rate": 1.9969378981949445e-05,
+ "loss": 1.6099,
+ "step": 1988
+ },
+ {
+ "epoch": 5.419618528610354,
+ "grad_norm": 9.235607147216797,
+ "learning_rate": 1.996930993437803e-05,
+ "loss": 1.6379,
+ "step": 1989
+ },
+ {
+ "epoch": 5.422343324250681,
+ "grad_norm": 11.294902801513672,
+ "learning_rate": 1.9969240809165948e-05,
+ "loss": 1.614,
+ "step": 1990
+ },
+ {
+ "epoch": 5.425068119891008,
+ "grad_norm": 12.546422958374023,
+ "learning_rate": 1.9969171606313742e-05,
+ "loss": 1.6875,
+ "step": 1991
+ },
+ {
+ "epoch": 5.427792915531335,
+ "grad_norm": 10.250531196594238,
+ "learning_rate": 1.9969102325821947e-05,
+ "loss": 1.7649,
+ "step": 1992
+ },
+ {
+ "epoch": 5.430517711171662,
+ "grad_norm": 9.09671688079834,
+ "learning_rate": 1.9969032967691106e-05,
+ "loss": 1.7554,
+ "step": 1993
+ },
+ {
+ "epoch": 5.433242506811989,
+ "grad_norm": 9.852420806884766,
+ "learning_rate": 1.9968963531921753e-05,
+ "loss": 1.6787,
+ "step": 1994
+ },
+ {
+ "epoch": 5.435967302452316,
+ "grad_norm": 9.900439262390137,
+ "learning_rate": 1.9968894018514434e-05,
+ "loss": 1.5818,
+ "step": 1995
+ },
+ {
+ "epoch": 5.438692098092643,
+ "grad_norm": 9.226574897766113,
+ "learning_rate": 1.996882442746969e-05,
+ "loss": 1.4751,
+ "step": 1996
+ },
+ {
+ "epoch": 5.44141689373297,
+ "grad_norm": 9.87454605102539,
+ "learning_rate": 1.9968754758788064e-05,
+ "loss": 1.7722,
+ "step": 1997
+ },
+ {
+ "epoch": 5.444141689373297,
+ "grad_norm": 10.80100154876709,
+ "learning_rate": 1.9968685012470097e-05,
+ "loss": 1.6931,
+ "step": 1998
+ },
+ {
+ "epoch": 5.446866485013624,
+ "grad_norm": 9.997541427612305,
+ "learning_rate": 1.996861518851633e-05,
+ "loss": 1.7524,
+ "step": 1999
+ },
+ {
+ "epoch": 5.449591280653951,
+ "grad_norm": 10.228842735290527,
+ "learning_rate": 1.996854528692731e-05,
+ "loss": 1.6123,
+ "step": 2000
+ },
+ {
+ "epoch": 5.452316076294278,
+ "grad_norm": 10.22179889678955,
+ "learning_rate": 1.996847530770358e-05,
+ "loss": 1.4919,
+ "step": 2001
+ },
+ {
+ "epoch": 5.455040871934605,
+ "grad_norm": 22.50702667236328,
+ "learning_rate": 1.996840525084568e-05,
+ "loss": 1.8882,
+ "step": 2002
+ },
+ {
+ "epoch": 5.4577656675749315,
+ "grad_norm": 9.13119125366211,
+ "learning_rate": 1.996833511635417e-05,
+ "loss": 1.4927,
+ "step": 2003
+ },
+ {
+ "epoch": 5.460490463215259,
+ "grad_norm": 10.396625518798828,
+ "learning_rate": 1.996826490422958e-05,
+ "loss": 1.769,
+ "step": 2004
+ },
+ {
+ "epoch": 5.463215258855586,
+ "grad_norm": 10.584822654724121,
+ "learning_rate": 1.9968194614472465e-05,
+ "loss": 1.4788,
+ "step": 2005
+ },
+ {
+ "epoch": 5.4659400544959125,
+ "grad_norm": 14.889788627624512,
+ "learning_rate": 1.9968124247083375e-05,
+ "loss": 1.4604,
+ "step": 2006
+ },
+ {
+ "epoch": 5.46866485013624,
+ "grad_norm": 8.787952423095703,
+ "learning_rate": 1.996805380206285e-05,
+ "loss": 1.6577,
+ "step": 2007
+ },
+ {
+ "epoch": 5.471389645776567,
+ "grad_norm": 36.39643096923828,
+ "learning_rate": 1.9967983279411442e-05,
+ "loss": 1.5061,
+ "step": 2008
+ },
+ {
+ "epoch": 5.474114441416893,
+ "grad_norm": 10.348734855651855,
+ "learning_rate": 1.9967912679129708e-05,
+ "loss": 1.7217,
+ "step": 2009
+ },
+ {
+ "epoch": 5.476839237057221,
+ "grad_norm": 12.849311828613281,
+ "learning_rate": 1.9967842001218183e-05,
+ "loss": 1.6465,
+ "step": 2010
+ },
+ {
+ "epoch": 5.479564032697548,
+ "grad_norm": 16.13958740234375,
+ "learning_rate": 1.9967771245677427e-05,
+ "loss": 1.7622,
+ "step": 2011
+ },
+ {
+ "epoch": 5.482288828337874,
+ "grad_norm": 14.944127082824707,
+ "learning_rate": 1.996770041250799e-05,
+ "loss": 1.854,
+ "step": 2012
+ },
+ {
+ "epoch": 5.485013623978202,
+ "grad_norm": 9.569435119628906,
+ "learning_rate": 1.9967629501710423e-05,
+ "loss": 1.605,
+ "step": 2013
+ },
+ {
+ "epoch": 5.487738419618529,
+ "grad_norm": 10.095573425292969,
+ "learning_rate": 1.996755851328528e-05,
+ "loss": 1.7275,
+ "step": 2014
+ },
+ {
+ "epoch": 5.490463215258855,
+ "grad_norm": 10.504908561706543,
+ "learning_rate": 1.9967487447233114e-05,
+ "loss": 1.7283,
+ "step": 2015
+ },
+ {
+ "epoch": 5.493188010899183,
+ "grad_norm": 8.080174446105957,
+ "learning_rate": 1.9967416303554472e-05,
+ "loss": 1.458,
+ "step": 2016
+ },
+ {
+ "epoch": 5.4959128065395095,
+ "grad_norm": 11.463164329528809,
+ "learning_rate": 1.9967345082249912e-05,
+ "loss": 1.7104,
+ "step": 2017
+ },
+ {
+ "epoch": 5.498637602179836,
+ "grad_norm": 13.109505653381348,
+ "learning_rate": 1.9967273783319993e-05,
+ "loss": 1.5955,
+ "step": 2018
+ },
+ {
+ "epoch": 5.501362397820164,
+ "grad_norm": 10.553297996520996,
+ "learning_rate": 1.996720240676527e-05,
+ "loss": 1.7117,
+ "step": 2019
+ },
+ {
+ "epoch": 5.5040871934604905,
+ "grad_norm": 9.326204299926758,
+ "learning_rate": 1.9967130952586286e-05,
+ "loss": 1.6833,
+ "step": 2020
+ },
+ {
+ "epoch": 5.506811989100817,
+ "grad_norm": 11.271936416625977,
+ "learning_rate": 1.9967059420783612e-05,
+ "loss": 1.7017,
+ "step": 2021
+ },
+ {
+ "epoch": 5.509536784741145,
+ "grad_norm": 9.598100662231445,
+ "learning_rate": 1.9966987811357798e-05,
+ "loss": 1.6323,
+ "step": 2022
+ },
+ {
+ "epoch": 5.512261580381471,
+ "grad_norm": 8.798504829406738,
+ "learning_rate": 1.9966916124309404e-05,
+ "loss": 1.543,
+ "step": 2023
+ },
+ {
+ "epoch": 5.514986376021798,
+ "grad_norm": 10.221184730529785,
+ "learning_rate": 1.9966844359638992e-05,
+ "loss": 1.7039,
+ "step": 2024
+ },
+ {
+ "epoch": 5.517711171662126,
+ "grad_norm": 9.18807601928711,
+ "learning_rate": 1.9966772517347114e-05,
+ "loss": 1.6016,
+ "step": 2025
+ },
+ {
+ "epoch": 5.520435967302452,
+ "grad_norm": 10.857856750488281,
+ "learning_rate": 1.9966700597434333e-05,
+ "loss": 1.6917,
+ "step": 2026
+ },
+ {
+ "epoch": 5.523160762942779,
+ "grad_norm": 9.961305618286133,
+ "learning_rate": 1.9966628599901208e-05,
+ "loss": 1.5222,
+ "step": 2027
+ },
+ {
+ "epoch": 5.525885558583107,
+ "grad_norm": 12.995038032531738,
+ "learning_rate": 1.99665565247483e-05,
+ "loss": 1.72,
+ "step": 2028
+ },
+ {
+ "epoch": 5.528610354223433,
+ "grad_norm": 11.066896438598633,
+ "learning_rate": 1.9966484371976168e-05,
+ "loss": 1.9131,
+ "step": 2029
+ },
+ {
+ "epoch": 5.53133514986376,
+ "grad_norm": 9.92104721069336,
+ "learning_rate": 1.996641214158538e-05,
+ "loss": 1.8105,
+ "step": 2030
+ },
+ {
+ "epoch": 5.5340599455040875,
+ "grad_norm": 11.066975593566895,
+ "learning_rate": 1.9966339833576496e-05,
+ "loss": 1.6252,
+ "step": 2031
+ },
+ {
+ "epoch": 5.536784741144414,
+ "grad_norm": 10.61975383758545,
+ "learning_rate": 1.9966267447950076e-05,
+ "loss": 1.8926,
+ "step": 2032
+ },
+ {
+ "epoch": 5.539509536784741,
+ "grad_norm": 11.257098197937012,
+ "learning_rate": 1.9966194984706686e-05,
+ "loss": 1.707,
+ "step": 2033
+ },
+ {
+ "epoch": 5.5422343324250685,
+ "grad_norm": 9.231466293334961,
+ "learning_rate": 1.996612244384689e-05,
+ "loss": 1.7954,
+ "step": 2034
+ },
+ {
+ "epoch": 5.544959128065395,
+ "grad_norm": 12.137299537658691,
+ "learning_rate": 1.9966049825371254e-05,
+ "loss": 1.8252,
+ "step": 2035
+ },
+ {
+ "epoch": 5.547683923705722,
+ "grad_norm": 9.002218246459961,
+ "learning_rate": 1.9965977129280344e-05,
+ "loss": 1.6177,
+ "step": 2036
+ },
+ {
+ "epoch": 5.550408719346049,
+ "grad_norm": 11.364861488342285,
+ "learning_rate": 1.9965904355574723e-05,
+ "loss": 1.7212,
+ "step": 2037
+ },
+ {
+ "epoch": 5.553133514986376,
+ "grad_norm": 13.221735000610352,
+ "learning_rate": 1.996583150425496e-05,
+ "loss": 1.9946,
+ "step": 2038
+ },
+ {
+ "epoch": 5.555858310626703,
+ "grad_norm": 10.66685962677002,
+ "learning_rate": 1.996575857532162e-05,
+ "loss": 1.6626,
+ "step": 2039
+ },
+ {
+ "epoch": 5.55858310626703,
+ "grad_norm": 8.7399320602417,
+ "learning_rate": 1.996568556877528e-05,
+ "loss": 1.6018,
+ "step": 2040
+ },
+ {
+ "epoch": 5.561307901907357,
+ "grad_norm": 10.089179039001465,
+ "learning_rate": 1.996561248461649e-05,
+ "loss": 1.6326,
+ "step": 2041
+ },
+ {
+ "epoch": 5.564032697547684,
+ "grad_norm": 9.229874610900879,
+ "learning_rate": 1.996553932284584e-05,
+ "loss": 1.6128,
+ "step": 2042
+ },
+ {
+ "epoch": 5.566757493188011,
+ "grad_norm": 10.963753700256348,
+ "learning_rate": 1.9965466083463886e-05,
+ "loss": 1.4976,
+ "step": 2043
+ },
+ {
+ "epoch": 5.569482288828338,
+ "grad_norm": 11.130434036254883,
+ "learning_rate": 1.9965392766471205e-05,
+ "loss": 1.915,
+ "step": 2044
+ },
+ {
+ "epoch": 5.572207084468665,
+ "grad_norm": 8.809657096862793,
+ "learning_rate": 1.9965319371868367e-05,
+ "loss": 1.4905,
+ "step": 2045
+ },
+ {
+ "epoch": 5.574931880108992,
+ "grad_norm": 10.36462116241455,
+ "learning_rate": 1.996524589965594e-05,
+ "loss": 1.7361,
+ "step": 2046
+ },
+ {
+ "epoch": 5.577656675749319,
+ "grad_norm": 41.264801025390625,
+ "learning_rate": 1.99651723498345e-05,
+ "loss": 1.623,
+ "step": 2047
+ },
+ {
+ "epoch": 5.580381471389646,
+ "grad_norm": 8.902155876159668,
+ "learning_rate": 1.9965098722404617e-05,
+ "loss": 1.551,
+ "step": 2048
+ },
+ {
+ "epoch": 5.583106267029972,
+ "grad_norm": 11.729252815246582,
+ "learning_rate": 1.9965025017366867e-05,
+ "loss": 1.8154,
+ "step": 2049
+ },
+ {
+ "epoch": 5.5858310626703,
+ "grad_norm": 9.16838264465332,
+ "learning_rate": 1.9964951234721824e-05,
+ "loss": 1.7109,
+ "step": 2050
+ },
+ {
+ "epoch": 5.5885558583106265,
+ "grad_norm": 9.499626159667969,
+ "learning_rate": 1.996487737447006e-05,
+ "loss": 1.5315,
+ "step": 2051
+ },
+ {
+ "epoch": 5.591280653950953,
+ "grad_norm": 11.185776710510254,
+ "learning_rate": 1.9964803436612152e-05,
+ "loss": 1.7524,
+ "step": 2052
+ },
+ {
+ "epoch": 5.594005449591281,
+ "grad_norm": 14.046220779418945,
+ "learning_rate": 1.9964729421148676e-05,
+ "loss": 1.6965,
+ "step": 2053
+ },
+ {
+ "epoch": 5.5967302452316074,
+ "grad_norm": 10.339086532592773,
+ "learning_rate": 1.9964655328080207e-05,
+ "loss": 1.5032,
+ "step": 2054
+ },
+ {
+ "epoch": 5.599455040871934,
+ "grad_norm": 9.257699012756348,
+ "learning_rate": 1.9964581157407324e-05,
+ "loss": 1.4612,
+ "step": 2055
+ },
+ {
+ "epoch": 5.602179836512262,
+ "grad_norm": 8.680740356445312,
+ "learning_rate": 1.99645069091306e-05,
+ "loss": 1.4697,
+ "step": 2056
+ },
+ {
+ "epoch": 5.604904632152588,
+ "grad_norm": 15.50500202178955,
+ "learning_rate": 1.996443258325062e-05,
+ "loss": 1.7192,
+ "step": 2057
+ },
+ {
+ "epoch": 5.607629427792915,
+ "grad_norm": 10.124307632446289,
+ "learning_rate": 1.996435817976796e-05,
+ "loss": 1.6511,
+ "step": 2058
+ },
+ {
+ "epoch": 5.610354223433243,
+ "grad_norm": 18.231836318969727,
+ "learning_rate": 1.99642836986832e-05,
+ "loss": 1.7922,
+ "step": 2059
+ },
+ {
+ "epoch": 5.613079019073569,
+ "grad_norm": 10.452853202819824,
+ "learning_rate": 1.9964209139996917e-05,
+ "loss": 1.5552,
+ "step": 2060
+ },
+ {
+ "epoch": 5.615803814713896,
+ "grad_norm": 10.715081214904785,
+ "learning_rate": 1.9964134503709695e-05,
+ "loss": 1.5347,
+ "step": 2061
+ },
+ {
+ "epoch": 5.618528610354224,
+ "grad_norm": 9.665472030639648,
+ "learning_rate": 1.9964059789822118e-05,
+ "loss": 1.9624,
+ "step": 2062
+ },
+ {
+ "epoch": 5.62125340599455,
+ "grad_norm": 10.516495704650879,
+ "learning_rate": 1.9963984998334757e-05,
+ "loss": 1.6941,
+ "step": 2063
+ },
+ {
+ "epoch": 5.623978201634877,
+ "grad_norm": 10.411148071289062,
+ "learning_rate": 1.9963910129248206e-05,
+ "loss": 1.6367,
+ "step": 2064
+ },
+ {
+ "epoch": 5.6267029972752045,
+ "grad_norm": 10.789862632751465,
+ "learning_rate": 1.9963835182563043e-05,
+ "loss": 1.8081,
+ "step": 2065
+ },
+ {
+ "epoch": 5.629427792915531,
+ "grad_norm": 10.961912155151367,
+ "learning_rate": 1.996376015827985e-05,
+ "loss": 1.4958,
+ "step": 2066
+ },
+ {
+ "epoch": 5.632152588555858,
+ "grad_norm": 9.865840911865234,
+ "learning_rate": 1.9963685056399217e-05,
+ "loss": 1.5815,
+ "step": 2067
+ },
+ {
+ "epoch": 5.6348773841961854,
+ "grad_norm": 12.462875366210938,
+ "learning_rate": 1.9963609876921722e-05,
+ "loss": 1.7671,
+ "step": 2068
+ },
+ {
+ "epoch": 5.637602179836512,
+ "grad_norm": 11.314741134643555,
+ "learning_rate": 1.9963534619847956e-05,
+ "loss": 1.8618,
+ "step": 2069
+ },
+ {
+ "epoch": 5.640326975476839,
+ "grad_norm": 86.43844604492188,
+ "learning_rate": 1.9963459285178505e-05,
+ "loss": 1.699,
+ "step": 2070
+ },
+ {
+ "epoch": 5.643051771117166,
+ "grad_norm": 10.88832950592041,
+ "learning_rate": 1.996338387291395e-05,
+ "loss": 1.5166,
+ "step": 2071
+ },
+ {
+ "epoch": 5.645776566757493,
+ "grad_norm": 13.507354736328125,
+ "learning_rate": 1.9963308383054883e-05,
+ "loss": 1.5952,
+ "step": 2072
+ },
+ {
+ "epoch": 5.64850136239782,
+ "grad_norm": 9.790104866027832,
+ "learning_rate": 1.9963232815601896e-05,
+ "loss": 1.696,
+ "step": 2073
+ },
+ {
+ "epoch": 5.651226158038147,
+ "grad_norm": 10.6688814163208,
+ "learning_rate": 1.9963157170555564e-05,
+ "loss": 1.6699,
+ "step": 2074
+ },
+ {
+ "epoch": 5.653950953678474,
+ "grad_norm": 10.911157608032227,
+ "learning_rate": 1.996308144791649e-05,
+ "loss": 1.7339,
+ "step": 2075
+ },
+ {
+ "epoch": 5.656675749318801,
+ "grad_norm": 16.183406829833984,
+ "learning_rate": 1.9963005647685256e-05,
+ "loss": 1.4517,
+ "step": 2076
+ },
+ {
+ "epoch": 5.659400544959128,
+ "grad_norm": 11.098819732666016,
+ "learning_rate": 1.9962929769862456e-05,
+ "loss": 1.73,
+ "step": 2077
+ },
+ {
+ "epoch": 5.662125340599455,
+ "grad_norm": 13.996894836425781,
+ "learning_rate": 1.996285381444868e-05,
+ "loss": 1.6396,
+ "step": 2078
+ },
+ {
+ "epoch": 5.664850136239782,
+ "grad_norm": 15.200331687927246,
+ "learning_rate": 1.9962777781444518e-05,
+ "loss": 1.7942,
+ "step": 2079
+ },
+ {
+ "epoch": 5.667574931880109,
+ "grad_norm": 26.82591438293457,
+ "learning_rate": 1.9962701670850566e-05,
+ "loss": 1.8101,
+ "step": 2080
+ },
+ {
+ "epoch": 5.670299727520436,
+ "grad_norm": 9.281715393066406,
+ "learning_rate": 1.996262548266741e-05,
+ "loss": 1.55,
+ "step": 2081
+ },
+ {
+ "epoch": 5.6730245231607626,
+ "grad_norm": 14.311118125915527,
+ "learning_rate": 1.996254921689565e-05,
+ "loss": 1.7439,
+ "step": 2082
+ },
+ {
+ "epoch": 5.67574931880109,
+ "grad_norm": 15.628812789916992,
+ "learning_rate": 1.9962472873535877e-05,
+ "loss": 1.8042,
+ "step": 2083
+ },
+ {
+ "epoch": 5.678474114441417,
+ "grad_norm": 12.210664749145508,
+ "learning_rate": 1.9962396452588684e-05,
+ "loss": 1.7661,
+ "step": 2084
+ },
+ {
+ "epoch": 5.6811989100817435,
+ "grad_norm": 12.074110984802246,
+ "learning_rate": 1.996231995405467e-05,
+ "loss": 1.551,
+ "step": 2085
+ },
+ {
+ "epoch": 5.683923705722071,
+ "grad_norm": 8.891280174255371,
+ "learning_rate": 1.996224337793443e-05,
+ "loss": 1.3794,
+ "step": 2086
+ },
+ {
+ "epoch": 5.686648501362398,
+ "grad_norm": 12.006574630737305,
+ "learning_rate": 1.996216672422856e-05,
+ "loss": 1.7454,
+ "step": 2087
+ },
+ {
+ "epoch": 5.689373297002724,
+ "grad_norm": 12.251750946044922,
+ "learning_rate": 1.996208999293765e-05,
+ "loss": 1.6145,
+ "step": 2088
+ },
+ {
+ "epoch": 5.692098092643052,
+ "grad_norm": 12.137250900268555,
+ "learning_rate": 1.9962013184062308e-05,
+ "loss": 1.595,
+ "step": 2089
+ },
+ {
+ "epoch": 5.694822888283379,
+ "grad_norm": 16.92084312438965,
+ "learning_rate": 1.996193629760313e-05,
+ "loss": 1.4574,
+ "step": 2090
+ },
+ {
+ "epoch": 5.697547683923705,
+ "grad_norm": 15.800286293029785,
+ "learning_rate": 1.9961859333560708e-05,
+ "loss": 1.8149,
+ "step": 2091
+ },
+ {
+ "epoch": 5.700272479564033,
+ "grad_norm": 17.070358276367188,
+ "learning_rate": 1.9961782291935648e-05,
+ "loss": 1.7407,
+ "step": 2092
+ },
+ {
+ "epoch": 5.70299727520436,
+ "grad_norm": 11.122482299804688,
+ "learning_rate": 1.9961705172728547e-05,
+ "loss": 1.7949,
+ "step": 2093
+ },
+ {
+ "epoch": 5.705722070844686,
+ "grad_norm": 13.73668384552002,
+ "learning_rate": 1.996162797594001e-05,
+ "loss": 1.7913,
+ "step": 2094
+ },
+ {
+ "epoch": 5.708446866485014,
+ "grad_norm": 10.459869384765625,
+ "learning_rate": 1.9961550701570633e-05,
+ "loss": 1.3384,
+ "step": 2095
+ },
+ {
+ "epoch": 5.7111716621253406,
+ "grad_norm": 10.803874015808105,
+ "learning_rate": 1.996147334962102e-05,
+ "loss": 1.8022,
+ "step": 2096
+ },
+ {
+ "epoch": 5.713896457765667,
+ "grad_norm": 10.83578872680664,
+ "learning_rate": 1.9961395920091773e-05,
+ "loss": 1.6157,
+ "step": 2097
+ },
+ {
+ "epoch": 5.716621253405995,
+ "grad_norm": 15.397379875183105,
+ "learning_rate": 1.9961318412983494e-05,
+ "loss": 1.7383,
+ "step": 2098
+ },
+ {
+ "epoch": 5.7193460490463215,
+ "grad_norm": 15.053755760192871,
+ "learning_rate": 1.996124082829679e-05,
+ "loss": 1.7429,
+ "step": 2099
+ },
+ {
+ "epoch": 5.722070844686648,
+ "grad_norm": 14.341357231140137,
+ "learning_rate": 1.996116316603226e-05,
+ "loss": 2.02,
+ "step": 2100
+ },
+ {
+ "epoch": 5.724795640326976,
+ "grad_norm": 20.855138778686523,
+ "learning_rate": 1.9961085426190516e-05,
+ "loss": 1.9399,
+ "step": 2101
+ },
+ {
+ "epoch": 5.727520435967302,
+ "grad_norm": 11.542928695678711,
+ "learning_rate": 1.9961007608772157e-05,
+ "loss": 1.7102,
+ "step": 2102
+ },
+ {
+ "epoch": 5.730245231607629,
+ "grad_norm": 11.331934928894043,
+ "learning_rate": 1.996092971377779e-05,
+ "loss": 1.8606,
+ "step": 2103
+ },
+ {
+ "epoch": 5.732970027247957,
+ "grad_norm": 10.98530387878418,
+ "learning_rate": 1.996085174120803e-05,
+ "loss": 1.7747,
+ "step": 2104
+ },
+ {
+ "epoch": 5.735694822888283,
+ "grad_norm": 11.881148338317871,
+ "learning_rate": 1.9960773691063468e-05,
+ "loss": 1.7354,
+ "step": 2105
+ },
+ {
+ "epoch": 5.73841961852861,
+ "grad_norm": 13.253885269165039,
+ "learning_rate": 1.9960695563344727e-05,
+ "loss": 1.8047,
+ "step": 2106
+ },
+ {
+ "epoch": 5.741144414168938,
+ "grad_norm": 14.778120040893555,
+ "learning_rate": 1.9960617358052404e-05,
+ "loss": 1.7551,
+ "step": 2107
+ },
+ {
+ "epoch": 5.743869209809264,
+ "grad_norm": 10.513572692871094,
+ "learning_rate": 1.9960539075187116e-05,
+ "loss": 1.5071,
+ "step": 2108
+ },
+ {
+ "epoch": 5.746594005449591,
+ "grad_norm": 13.157445907592773,
+ "learning_rate": 1.996046071474947e-05,
+ "loss": 1.8066,
+ "step": 2109
+ },
+ {
+ "epoch": 5.7493188010899186,
+ "grad_norm": 9.51871395111084,
+ "learning_rate": 1.996038227674008e-05,
+ "loss": 1.5996,
+ "step": 2110
+ },
+ {
+ "epoch": 5.752043596730245,
+ "grad_norm": 16.539831161499023,
+ "learning_rate": 1.9960303761159552e-05,
+ "loss": 1.6382,
+ "step": 2111
+ },
+ {
+ "epoch": 5.754768392370572,
+ "grad_norm": 11.248241424560547,
+ "learning_rate": 1.9960225168008498e-05,
+ "loss": 1.4172,
+ "step": 2112
+ },
+ {
+ "epoch": 5.7574931880108995,
+ "grad_norm": 11.98831558227539,
+ "learning_rate": 1.9960146497287532e-05,
+ "loss": 1.7786,
+ "step": 2113
+ },
+ {
+ "epoch": 5.760217983651226,
+ "grad_norm": 12.180619239807129,
+ "learning_rate": 1.9960067748997264e-05,
+ "loss": 1.8003,
+ "step": 2114
+ },
+ {
+ "epoch": 5.762942779291553,
+ "grad_norm": 10.6093168258667,
+ "learning_rate": 1.995998892313831e-05,
+ "loss": 1.5938,
+ "step": 2115
+ },
+ {
+ "epoch": 5.76566757493188,
+ "grad_norm": 9.59289836883545,
+ "learning_rate": 1.9959910019711282e-05,
+ "loss": 1.646,
+ "step": 2116
+ },
+ {
+ "epoch": 5.768392370572207,
+ "grad_norm": 24.2403564453125,
+ "learning_rate": 1.9959831038716798e-05,
+ "loss": 1.6519,
+ "step": 2117
+ },
+ {
+ "epoch": 5.771117166212534,
+ "grad_norm": 21.29315185546875,
+ "learning_rate": 1.9959751980155465e-05,
+ "loss": 1.7158,
+ "step": 2118
+ },
+ {
+ "epoch": 5.773841961852861,
+ "grad_norm": 11.449963569641113,
+ "learning_rate": 1.995967284402791e-05,
+ "loss": 1.7832,
+ "step": 2119
+ },
+ {
+ "epoch": 5.776566757493188,
+ "grad_norm": 11.538114547729492,
+ "learning_rate": 1.995959363033474e-05,
+ "loss": 1.5942,
+ "step": 2120
+ },
+ {
+ "epoch": 5.779291553133515,
+ "grad_norm": 13.878122329711914,
+ "learning_rate": 1.9959514339076575e-05,
+ "loss": 1.7637,
+ "step": 2121
+ },
+ {
+ "epoch": 5.782016348773842,
+ "grad_norm": 19.71577262878418,
+ "learning_rate": 1.9959434970254036e-05,
+ "loss": 1.7839,
+ "step": 2122
+ },
+ {
+ "epoch": 5.784741144414169,
+ "grad_norm": 14.786399841308594,
+ "learning_rate": 1.9959355523867734e-05,
+ "loss": 1.7043,
+ "step": 2123
+ },
+ {
+ "epoch": 5.787465940054496,
+ "grad_norm": 11.029261589050293,
+ "learning_rate": 1.9959275999918293e-05,
+ "loss": 1.7603,
+ "step": 2124
+ },
+ {
+ "epoch": 5.790190735694823,
+ "grad_norm": 9.883845329284668,
+ "learning_rate": 1.9959196398406334e-05,
+ "loss": 1.5271,
+ "step": 2125
+ },
+ {
+ "epoch": 5.79291553133515,
+ "grad_norm": 14.708576202392578,
+ "learning_rate": 1.9959116719332468e-05,
+ "loss": 1.5571,
+ "step": 2126
+ },
+ {
+ "epoch": 5.795640326975477,
+ "grad_norm": 11.166234970092773,
+ "learning_rate": 1.9959036962697327e-05,
+ "loss": 1.7852,
+ "step": 2127
+ },
+ {
+ "epoch": 5.798365122615804,
+ "grad_norm": 11.428666114807129,
+ "learning_rate": 1.9958957128501528e-05,
+ "loss": 1.5862,
+ "step": 2128
+ },
+ {
+ "epoch": 5.801089918256131,
+ "grad_norm": 21.812938690185547,
+ "learning_rate": 1.9958877216745685e-05,
+ "loss": 1.6514,
+ "step": 2129
+ },
+ {
+ "epoch": 5.8038147138964575,
+ "grad_norm": 10.75883674621582,
+ "learning_rate": 1.995879722743043e-05,
+ "loss": 1.7747,
+ "step": 2130
+ },
+ {
+ "epoch": 5.806539509536785,
+ "grad_norm": 9.681130409240723,
+ "learning_rate": 1.9958717160556385e-05,
+ "loss": 1.5186,
+ "step": 2131
+ },
+ {
+ "epoch": 5.809264305177112,
+ "grad_norm": 12.587305068969727,
+ "learning_rate": 1.9958637016124167e-05,
+ "loss": 1.5547,
+ "step": 2132
+ },
+ {
+ "epoch": 5.8119891008174385,
+ "grad_norm": 9.57124137878418,
+ "learning_rate": 1.9958556794134407e-05,
+ "loss": 1.8291,
+ "step": 2133
+ },
+ {
+ "epoch": 5.814713896457766,
+ "grad_norm": 9.282252311706543,
+ "learning_rate": 1.9958476494587725e-05,
+ "loss": 1.9062,
+ "step": 2134
+ },
+ {
+ "epoch": 5.817438692098093,
+ "grad_norm": 19.19476890563965,
+ "learning_rate": 1.995839611748475e-05,
+ "loss": 1.6582,
+ "step": 2135
+ },
+ {
+ "epoch": 5.820163487738419,
+ "grad_norm": 10.15176010131836,
+ "learning_rate": 1.995831566282611e-05,
+ "loss": 1.6479,
+ "step": 2136
+ },
+ {
+ "epoch": 5.822888283378747,
+ "grad_norm": 11.221248626708984,
+ "learning_rate": 1.9958235130612423e-05,
+ "loss": 1.7581,
+ "step": 2137
+ },
+ {
+ "epoch": 5.825613079019074,
+ "grad_norm": 14.83688735961914,
+ "learning_rate": 1.9958154520844326e-05,
+ "loss": 1.8569,
+ "step": 2138
+ },
+ {
+ "epoch": 5.8283378746594,
+ "grad_norm": 10.33976936340332,
+ "learning_rate": 1.9958073833522437e-05,
+ "loss": 1.7148,
+ "step": 2139
+ },
+ {
+ "epoch": 5.831062670299728,
+ "grad_norm": 12.592178344726562,
+ "learning_rate": 1.9957993068647394e-05,
+ "loss": 1.5762,
+ "step": 2140
+ },
+ {
+ "epoch": 5.833787465940055,
+ "grad_norm": 12.909204483032227,
+ "learning_rate": 1.9957912226219817e-05,
+ "loss": 1.7793,
+ "step": 2141
+ },
+ {
+ "epoch": 5.836512261580381,
+ "grad_norm": 10.267101287841797,
+ "learning_rate": 1.9957831306240343e-05,
+ "loss": 1.8643,
+ "step": 2142
+ },
+ {
+ "epoch": 5.839237057220709,
+ "grad_norm": 8.997322082519531,
+ "learning_rate": 1.9957750308709598e-05,
+ "loss": 1.728,
+ "step": 2143
+ },
+ {
+ "epoch": 5.8419618528610355,
+ "grad_norm": 10.750346183776855,
+ "learning_rate": 1.9957669233628216e-05,
+ "loss": 1.7119,
+ "step": 2144
+ },
+ {
+ "epoch": 5.844686648501362,
+ "grad_norm": 10.793237686157227,
+ "learning_rate": 1.9957588080996825e-05,
+ "loss": 1.7256,
+ "step": 2145
+ },
+ {
+ "epoch": 5.84741144414169,
+ "grad_norm": 7.666360855102539,
+ "learning_rate": 1.995750685081606e-05,
+ "loss": 1.5859,
+ "step": 2146
+ },
+ {
+ "epoch": 5.8501362397820165,
+ "grad_norm": 8.329882621765137,
+ "learning_rate": 1.995742554308655e-05,
+ "loss": 1.7261,
+ "step": 2147
+ },
+ {
+ "epoch": 5.852861035422343,
+ "grad_norm": 11.187580108642578,
+ "learning_rate": 1.995734415780893e-05,
+ "loss": 1.9126,
+ "step": 2148
+ },
+ {
+ "epoch": 5.855585831062671,
+ "grad_norm": 9.039776802062988,
+ "learning_rate": 1.9957262694983837e-05,
+ "loss": 1.7249,
+ "step": 2149
+ },
+ {
+ "epoch": 5.858310626702997,
+ "grad_norm": 11.114256858825684,
+ "learning_rate": 1.9957181154611903e-05,
+ "loss": 1.6907,
+ "step": 2150
+ },
+ {
+ "epoch": 5.861035422343324,
+ "grad_norm": 11.95982551574707,
+ "learning_rate": 1.995709953669376e-05,
+ "loss": 1.5112,
+ "step": 2151
+ },
+ {
+ "epoch": 5.863760217983652,
+ "grad_norm": 11.137290000915527,
+ "learning_rate": 1.9957017841230045e-05,
+ "loss": 1.7397,
+ "step": 2152
+ },
+ {
+ "epoch": 5.866485013623978,
+ "grad_norm": 11.245691299438477,
+ "learning_rate": 1.9956936068221396e-05,
+ "loss": 1.4753,
+ "step": 2153
+ },
+ {
+ "epoch": 5.869209809264305,
+ "grad_norm": 10.877267837524414,
+ "learning_rate": 1.995685421766845e-05,
+ "loss": 1.8682,
+ "step": 2154
+ },
+ {
+ "epoch": 5.871934604904633,
+ "grad_norm": 16.539710998535156,
+ "learning_rate": 1.9956772289571845e-05,
+ "loss": 1.5327,
+ "step": 2155
+ },
+ {
+ "epoch": 5.874659400544959,
+ "grad_norm": 10.097494125366211,
+ "learning_rate": 1.995669028393222e-05,
+ "loss": 1.6814,
+ "step": 2156
+ },
+ {
+ "epoch": 5.877384196185286,
+ "grad_norm": 8.638931274414062,
+ "learning_rate": 1.995660820075021e-05,
+ "loss": 1.8547,
+ "step": 2157
+ },
+ {
+ "epoch": 5.8801089918256135,
+ "grad_norm": 18.214252471923828,
+ "learning_rate": 1.9956526040026453e-05,
+ "loss": 1.5378,
+ "step": 2158
+ },
+ {
+ "epoch": 5.88283378746594,
+ "grad_norm": 8.704755783081055,
+ "learning_rate": 1.9956443801761593e-05,
+ "loss": 1.4504,
+ "step": 2159
+ },
+ {
+ "epoch": 5.885558583106267,
+ "grad_norm": 7.709156513214111,
+ "learning_rate": 1.995636148595627e-05,
+ "loss": 1.6738,
+ "step": 2160
+ },
+ {
+ "epoch": 5.8882833787465945,
+ "grad_norm": 10.272282600402832,
+ "learning_rate": 1.9956279092611123e-05,
+ "loss": 1.8521,
+ "step": 2161
+ },
+ {
+ "epoch": 5.891008174386921,
+ "grad_norm": 8.876688957214355,
+ "learning_rate": 1.9956196621726794e-05,
+ "loss": 1.665,
+ "step": 2162
+ },
+ {
+ "epoch": 5.893732970027248,
+ "grad_norm": 12.127043724060059,
+ "learning_rate": 1.995611407330393e-05,
+ "loss": 1.5745,
+ "step": 2163
+ },
+ {
+ "epoch": 5.896457765667575,
+ "grad_norm": 9.917612075805664,
+ "learning_rate": 1.9956031447343166e-05,
+ "loss": 1.7146,
+ "step": 2164
+ },
+ {
+ "epoch": 5.899182561307902,
+ "grad_norm": 8.613646507263184,
+ "learning_rate": 1.9955948743845152e-05,
+ "loss": 1.418,
+ "step": 2165
+ },
+ {
+ "epoch": 5.901907356948229,
+ "grad_norm": 14.007044792175293,
+ "learning_rate": 1.995586596281053e-05,
+ "loss": 1.6123,
+ "step": 2166
+ },
+ {
+ "epoch": 5.904632152588556,
+ "grad_norm": 10.300485610961914,
+ "learning_rate": 1.9955783104239943e-05,
+ "loss": 1.708,
+ "step": 2167
+ },
+ {
+ "epoch": 5.907356948228883,
+ "grad_norm": 9.43236255645752,
+ "learning_rate": 1.995570016813404e-05,
+ "loss": 1.6816,
+ "step": 2168
+ },
+ {
+ "epoch": 5.91008174386921,
+ "grad_norm": 8.837135314941406,
+ "learning_rate": 1.9955617154493462e-05,
+ "loss": 1.6973,
+ "step": 2169
+ },
+ {
+ "epoch": 5.912806539509537,
+ "grad_norm": 8.825847625732422,
+ "learning_rate": 1.995553406331886e-05,
+ "loss": 1.5781,
+ "step": 2170
+ },
+ {
+ "epoch": 5.915531335149864,
+ "grad_norm": 13.152094841003418,
+ "learning_rate": 1.9955450894610875e-05,
+ "loss": 1.6084,
+ "step": 2171
+ },
+ {
+ "epoch": 5.918256130790191,
+ "grad_norm": 9.993326187133789,
+ "learning_rate": 1.995536764837016e-05,
+ "loss": 1.5632,
+ "step": 2172
+ },
+ {
+ "epoch": 5.920980926430518,
+ "grad_norm": 10.549430847167969,
+ "learning_rate": 1.9955284324597365e-05,
+ "loss": 1.8931,
+ "step": 2173
+ },
+ {
+ "epoch": 5.923705722070845,
+ "grad_norm": 11.248650550842285,
+ "learning_rate": 1.9955200923293134e-05,
+ "loss": 1.52,
+ "step": 2174
+ },
+ {
+ "epoch": 5.926430517711172,
+ "grad_norm": 10.428131103515625,
+ "learning_rate": 1.9955117444458118e-05,
+ "loss": 1.8013,
+ "step": 2175
+ },
+ {
+ "epoch": 5.929155313351498,
+ "grad_norm": 10.206390380859375,
+ "learning_rate": 1.9955033888092973e-05,
+ "loss": 1.623,
+ "step": 2176
+ },
+ {
+ "epoch": 5.931880108991826,
+ "grad_norm": 12.52747917175293,
+ "learning_rate": 1.995495025419834e-05,
+ "loss": 1.6709,
+ "step": 2177
+ },
+ {
+ "epoch": 5.9346049046321525,
+ "grad_norm": 12.243200302124023,
+ "learning_rate": 1.9954866542774872e-05,
+ "loss": 1.7246,
+ "step": 2178
+ },
+ {
+ "epoch": 5.937329700272479,
+ "grad_norm": 8.610759735107422,
+ "learning_rate": 1.9954782753823227e-05,
+ "loss": 1.5435,
+ "step": 2179
+ },
+ {
+ "epoch": 5.940054495912807,
+ "grad_norm": 8.388009071350098,
+ "learning_rate": 1.9954698887344057e-05,
+ "loss": 1.6885,
+ "step": 2180
+ },
+ {
+ "epoch": 5.9427792915531334,
+ "grad_norm": 8.853168487548828,
+ "learning_rate": 1.995461494333801e-05,
+ "loss": 1.8015,
+ "step": 2181
+ },
+ {
+ "epoch": 5.94550408719346,
+ "grad_norm": 8.397902488708496,
+ "learning_rate": 1.995453092180574e-05,
+ "loss": 1.6548,
+ "step": 2182
+ },
+ {
+ "epoch": 5.948228882833788,
+ "grad_norm": 10.568078994750977,
+ "learning_rate": 1.9954446822747905e-05,
+ "loss": 1.7788,
+ "step": 2183
+ },
+ {
+ "epoch": 5.950953678474114,
+ "grad_norm": 12.230669021606445,
+ "learning_rate": 1.995436264616516e-05,
+ "loss": 1.6689,
+ "step": 2184
+ },
+ {
+ "epoch": 5.953678474114441,
+ "grad_norm": 9.328551292419434,
+ "learning_rate": 1.995427839205816e-05,
+ "loss": 1.71,
+ "step": 2185
+ },
+ {
+ "epoch": 5.956403269754769,
+ "grad_norm": 10.6898193359375,
+ "learning_rate": 1.9954194060427557e-05,
+ "loss": 1.8257,
+ "step": 2186
+ },
+ {
+ "epoch": 5.959128065395095,
+ "grad_norm": 11.12633991241455,
+ "learning_rate": 1.9954109651274015e-05,
+ "loss": 1.6909,
+ "step": 2187
+ },
+ {
+ "epoch": 5.961852861035422,
+ "grad_norm": 8.994038581848145,
+ "learning_rate": 1.9954025164598184e-05,
+ "loss": 1.5422,
+ "step": 2188
+ },
+ {
+ "epoch": 5.96457765667575,
+ "grad_norm": 14.928201675415039,
+ "learning_rate": 1.9953940600400726e-05,
+ "loss": 1.6475,
+ "step": 2189
+ },
+ {
+ "epoch": 5.967302452316076,
+ "grad_norm": 13.77098274230957,
+ "learning_rate": 1.9953855958682297e-05,
+ "loss": 1.6206,
+ "step": 2190
+ },
+ {
+ "epoch": 5.970027247956403,
+ "grad_norm": 8.098898887634277,
+ "learning_rate": 1.9953771239443562e-05,
+ "loss": 1.5703,
+ "step": 2191
+ },
+ {
+ "epoch": 5.9727520435967305,
+ "grad_norm": 7.796526908874512,
+ "learning_rate": 1.9953686442685175e-05,
+ "loss": 1.5212,
+ "step": 2192
+ },
+ {
+ "epoch": 5.975476839237057,
+ "grad_norm": 9.103816986083984,
+ "learning_rate": 1.99536015684078e-05,
+ "loss": 1.6255,
+ "step": 2193
+ },
+ {
+ "epoch": 5.978201634877384,
+ "grad_norm": 8.29758071899414,
+ "learning_rate": 1.9953516616612093e-05,
+ "loss": 1.4558,
+ "step": 2194
+ },
+ {
+ "epoch": 5.9809264305177114,
+ "grad_norm": 11.29628849029541,
+ "learning_rate": 1.9953431587298723e-05,
+ "loss": 1.8486,
+ "step": 2195
+ },
+ {
+ "epoch": 5.983651226158038,
+ "grad_norm": 9.009011268615723,
+ "learning_rate": 1.9953346480468347e-05,
+ "loss": 1.6904,
+ "step": 2196
+ },
+ {
+ "epoch": 5.986376021798365,
+ "grad_norm": 12.899435997009277,
+ "learning_rate": 1.9953261296121625e-05,
+ "loss": 1.8438,
+ "step": 2197
+ },
+ {
+ "epoch": 5.989100817438692,
+ "grad_norm": 9.92809009552002,
+ "learning_rate": 1.995317603425923e-05,
+ "loss": 1.8542,
+ "step": 2198
+ },
+ {
+ "epoch": 5.991825613079019,
+ "grad_norm": 9.189982414245605,
+ "learning_rate": 1.9953090694881815e-05,
+ "loss": 1.73,
+ "step": 2199
+ },
+ {
+ "epoch": 5.994550408719346,
+ "grad_norm": 12.12692642211914,
+ "learning_rate": 1.9953005277990054e-05,
+ "loss": 1.7061,
+ "step": 2200
+ },
+ {
+ "epoch": 5.997275204359673,
+ "grad_norm": 10.086868286132812,
+ "learning_rate": 1.9952919783584608e-05,
+ "loss": 1.7578,
+ "step": 2201
+ },
+ {
+ "epoch": 6.0,
+ "grad_norm": 11.160868644714355,
+ "learning_rate": 1.995283421166614e-05,
+ "loss": 1.5291,
+ "step": 2202
+ },
+ {
+ "epoch": 6.002724795640327,
+ "grad_norm": 10.200235366821289,
+ "learning_rate": 1.9952748562235325e-05,
+ "loss": 1.4353,
+ "step": 2203
+ },
+ {
+ "epoch": 6.005449591280654,
+ "grad_norm": 13.496068954467773,
+ "learning_rate": 1.995266283529282e-05,
+ "loss": 1.5662,
+ "step": 2204
+ },
+ {
+ "epoch": 6.008174386920981,
+ "grad_norm": 7.2131242752075195,
+ "learning_rate": 1.9952577030839297e-05,
+ "loss": 1.3428,
+ "step": 2205
+ },
+ {
+ "epoch": 6.010899182561308,
+ "grad_norm": 9.206995964050293,
+ "learning_rate": 1.9952491148875427e-05,
+ "loss": 1.3918,
+ "step": 2206
+ },
+ {
+ "epoch": 6.013623978201635,
+ "grad_norm": 8.290966033935547,
+ "learning_rate": 1.9952405189401872e-05,
+ "loss": 1.5034,
+ "step": 2207
+ },
+ {
+ "epoch": 6.016348773841962,
+ "grad_norm": 10.639963150024414,
+ "learning_rate": 1.9952319152419314e-05,
+ "loss": 1.5547,
+ "step": 2208
+ },
+ {
+ "epoch": 6.0190735694822886,
+ "grad_norm": 11.235346794128418,
+ "learning_rate": 1.9952233037928406e-05,
+ "loss": 1.5151,
+ "step": 2209
+ },
+ {
+ "epoch": 6.021798365122616,
+ "grad_norm": 7.436095714569092,
+ "learning_rate": 1.9952146845929833e-05,
+ "loss": 1.4702,
+ "step": 2210
+ },
+ {
+ "epoch": 6.024523160762943,
+ "grad_norm": 10.257650375366211,
+ "learning_rate": 1.9952060576424256e-05,
+ "loss": 1.501,
+ "step": 2211
+ },
+ {
+ "epoch": 6.0272479564032695,
+ "grad_norm": 10.27843952178955,
+ "learning_rate": 1.9951974229412355e-05,
+ "loss": 1.5029,
+ "step": 2212
+ },
+ {
+ "epoch": 6.029972752043597,
+ "grad_norm": 11.819791793823242,
+ "learning_rate": 1.99518878048948e-05,
+ "loss": 1.4094,
+ "step": 2213
+ },
+ {
+ "epoch": 6.032697547683924,
+ "grad_norm": 11.006246566772461,
+ "learning_rate": 1.995180130287226e-05,
+ "loss": 1.6929,
+ "step": 2214
+ },
+ {
+ "epoch": 6.03542234332425,
+ "grad_norm": 9.352935791015625,
+ "learning_rate": 1.995171472334541e-05,
+ "loss": 1.7075,
+ "step": 2215
+ },
+ {
+ "epoch": 6.038147138964578,
+ "grad_norm": 9.678173065185547,
+ "learning_rate": 1.9951628066314928e-05,
+ "loss": 1.4509,
+ "step": 2216
+ },
+ {
+ "epoch": 6.040871934604905,
+ "grad_norm": 11.307157516479492,
+ "learning_rate": 1.995154133178149e-05,
+ "loss": 1.6777,
+ "step": 2217
+ },
+ {
+ "epoch": 6.043596730245231,
+ "grad_norm": 8.42729377746582,
+ "learning_rate": 1.9951454519745767e-05,
+ "loss": 1.4922,
+ "step": 2218
+ },
+ {
+ "epoch": 6.046321525885559,
+ "grad_norm": 8.440991401672363,
+ "learning_rate": 1.9951367630208437e-05,
+ "loss": 1.5571,
+ "step": 2219
+ },
+ {
+ "epoch": 6.049046321525886,
+ "grad_norm": 8.879366874694824,
+ "learning_rate": 1.9951280663170174e-05,
+ "loss": 1.5613,
+ "step": 2220
+ },
+ {
+ "epoch": 6.051771117166212,
+ "grad_norm": 8.939628601074219,
+ "learning_rate": 1.9951193618631655e-05,
+ "loss": 1.563,
+ "step": 2221
+ },
+ {
+ "epoch": 6.05449591280654,
+ "grad_norm": 10.681466102600098,
+ "learning_rate": 1.9951106496593566e-05,
+ "loss": 1.7241,
+ "step": 2222
+ },
+ {
+ "epoch": 6.0572207084468666,
+ "grad_norm": 8.742968559265137,
+ "learning_rate": 1.995101929705658e-05,
+ "loss": 1.5901,
+ "step": 2223
+ },
+ {
+ "epoch": 6.059945504087193,
+ "grad_norm": 9.580309867858887,
+ "learning_rate": 1.9950932020021372e-05,
+ "loss": 1.6521,
+ "step": 2224
+ },
+ {
+ "epoch": 6.062670299727521,
+ "grad_norm": 10.331524848937988,
+ "learning_rate": 1.9950844665488626e-05,
+ "loss": 1.8003,
+ "step": 2225
+ },
+ {
+ "epoch": 6.0653950953678475,
+ "grad_norm": 10.002351760864258,
+ "learning_rate": 1.9950757233459022e-05,
+ "loss": 1.6375,
+ "step": 2226
+ },
+ {
+ "epoch": 6.068119891008174,
+ "grad_norm": 8.716421127319336,
+ "learning_rate": 1.9950669723933246e-05,
+ "loss": 1.5286,
+ "step": 2227
+ },
+ {
+ "epoch": 6.070844686648502,
+ "grad_norm": 10.600811958312988,
+ "learning_rate": 1.9950582136911972e-05,
+ "loss": 1.7808,
+ "step": 2228
+ },
+ {
+ "epoch": 6.073569482288828,
+ "grad_norm": 8.420156478881836,
+ "learning_rate": 1.995049447239588e-05,
+ "loss": 1.3865,
+ "step": 2229
+ },
+ {
+ "epoch": 6.076294277929155,
+ "grad_norm": 11.201637268066406,
+ "learning_rate": 1.9950406730385663e-05,
+ "loss": 1.5684,
+ "step": 2230
+ },
+ {
+ "epoch": 6.079019073569483,
+ "grad_norm": 8.961545944213867,
+ "learning_rate": 1.9950318910881993e-05,
+ "loss": 1.4878,
+ "step": 2231
+ },
+ {
+ "epoch": 6.081743869209809,
+ "grad_norm": 7.664729118347168,
+ "learning_rate": 1.9950231013885566e-05,
+ "loss": 1.5403,
+ "step": 2232
+ },
+ {
+ "epoch": 6.084468664850136,
+ "grad_norm": 8.747848510742188,
+ "learning_rate": 1.9950143039397056e-05,
+ "loss": 1.5457,
+ "step": 2233
+ },
+ {
+ "epoch": 6.087193460490464,
+ "grad_norm": 10.3059663772583,
+ "learning_rate": 1.995005498741715e-05,
+ "loss": 1.4146,
+ "step": 2234
+ },
+ {
+ "epoch": 6.08991825613079,
+ "grad_norm": 10.38664722442627,
+ "learning_rate": 1.994996685794654e-05,
+ "loss": 1.6313,
+ "step": 2235
+ },
+ {
+ "epoch": 6.092643051771117,
+ "grad_norm": 9.838129997253418,
+ "learning_rate": 1.994987865098591e-05,
+ "loss": 1.5403,
+ "step": 2236
+ },
+ {
+ "epoch": 6.0953678474114446,
+ "grad_norm": 10.536702156066895,
+ "learning_rate": 1.9949790366535943e-05,
+ "loss": 1.5447,
+ "step": 2237
+ },
+ {
+ "epoch": 6.098092643051771,
+ "grad_norm": 11.688711166381836,
+ "learning_rate": 1.9949702004597327e-05,
+ "loss": 1.5115,
+ "step": 2238
+ },
+ {
+ "epoch": 6.100817438692098,
+ "grad_norm": 9.537701606750488,
+ "learning_rate": 1.9949613565170755e-05,
+ "loss": 1.584,
+ "step": 2239
+ },
+ {
+ "epoch": 6.1035422343324255,
+ "grad_norm": 10.0718355178833,
+ "learning_rate": 1.994952504825691e-05,
+ "loss": 1.478,
+ "step": 2240
+ },
+ {
+ "epoch": 6.106267029972752,
+ "grad_norm": 12.579290390014648,
+ "learning_rate": 1.9949436453856487e-05,
+ "loss": 1.5327,
+ "step": 2241
+ },
+ {
+ "epoch": 6.108991825613079,
+ "grad_norm": 14.01674747467041,
+ "learning_rate": 1.9949347781970172e-05,
+ "loss": 1.7759,
+ "step": 2242
+ },
+ {
+ "epoch": 6.111716621253406,
+ "grad_norm": 15.666253089904785,
+ "learning_rate": 1.9949259032598656e-05,
+ "loss": 1.3484,
+ "step": 2243
+ },
+ {
+ "epoch": 6.114441416893733,
+ "grad_norm": 10.228379249572754,
+ "learning_rate": 1.994917020574263e-05,
+ "loss": 1.6025,
+ "step": 2244
+ },
+ {
+ "epoch": 6.11716621253406,
+ "grad_norm": 9.948064804077148,
+ "learning_rate": 1.994908130140279e-05,
+ "loss": 1.4221,
+ "step": 2245
+ },
+ {
+ "epoch": 6.1198910081743865,
+ "grad_norm": 14.202163696289062,
+ "learning_rate": 1.9948992319579822e-05,
+ "loss": 1.4207,
+ "step": 2246
+ },
+ {
+ "epoch": 6.122615803814714,
+ "grad_norm": 8.870183944702148,
+ "learning_rate": 1.9948903260274424e-05,
+ "loss": 1.4668,
+ "step": 2247
+ },
+ {
+ "epoch": 6.125340599455041,
+ "grad_norm": 12.374833106994629,
+ "learning_rate": 1.9948814123487286e-05,
+ "loss": 1.6436,
+ "step": 2248
+ },
+ {
+ "epoch": 6.128065395095367,
+ "grad_norm": 11.639524459838867,
+ "learning_rate": 1.9948724909219104e-05,
+ "loss": 1.7617,
+ "step": 2249
+ },
+ {
+ "epoch": 6.130790190735695,
+ "grad_norm": 10.247749328613281,
+ "learning_rate": 1.9948635617470572e-05,
+ "loss": 1.3259,
+ "step": 2250
+ },
+ {
+ "epoch": 6.133514986376022,
+ "grad_norm": 10.985930442810059,
+ "learning_rate": 1.994854624824239e-05,
+ "loss": 1.5647,
+ "step": 2251
+ },
+ {
+ "epoch": 6.136239782016348,
+ "grad_norm": 12.321182250976562,
+ "learning_rate": 1.9948456801535247e-05,
+ "loss": 1.5081,
+ "step": 2252
+ },
+ {
+ "epoch": 6.138964577656676,
+ "grad_norm": 22.540081024169922,
+ "learning_rate": 1.994836727734984e-05,
+ "loss": 1.6118,
+ "step": 2253
+ },
+ {
+ "epoch": 6.141689373297003,
+ "grad_norm": 14.029481887817383,
+ "learning_rate": 1.9948277675686873e-05,
+ "loss": 1.5061,
+ "step": 2254
+ },
+ {
+ "epoch": 6.144414168937329,
+ "grad_norm": 11.365158081054688,
+ "learning_rate": 1.9948187996547037e-05,
+ "loss": 1.6843,
+ "step": 2255
+ },
+ {
+ "epoch": 6.147138964577657,
+ "grad_norm": 12.896124839782715,
+ "learning_rate": 1.9948098239931035e-05,
+ "loss": 1.7524,
+ "step": 2256
+ },
+ {
+ "epoch": 6.1498637602179835,
+ "grad_norm": 11.004476547241211,
+ "learning_rate": 1.994800840583956e-05,
+ "loss": 1.6116,
+ "step": 2257
+ },
+ {
+ "epoch": 6.15258855585831,
+ "grad_norm": 14.635592460632324,
+ "learning_rate": 1.9947918494273322e-05,
+ "loss": 1.5481,
+ "step": 2258
+ },
+ {
+ "epoch": 6.155313351498638,
+ "grad_norm": 10.547788619995117,
+ "learning_rate": 1.994782850523301e-05,
+ "loss": 1.6958,
+ "step": 2259
+ },
+ {
+ "epoch": 6.1580381471389645,
+ "grad_norm": 12.902785301208496,
+ "learning_rate": 1.9947738438719332e-05,
+ "loss": 1.7449,
+ "step": 2260
+ },
+ {
+ "epoch": 6.160762942779291,
+ "grad_norm": 11.040125846862793,
+ "learning_rate": 1.9947648294732988e-05,
+ "loss": 1.74,
+ "step": 2261
+ },
+ {
+ "epoch": 6.163487738419619,
+ "grad_norm": 39.967002868652344,
+ "learning_rate": 1.994755807327468e-05,
+ "loss": 1.5569,
+ "step": 2262
+ },
+ {
+ "epoch": 6.166212534059945,
+ "grad_norm": 8.66330623626709,
+ "learning_rate": 1.9947467774345108e-05,
+ "loss": 1.564,
+ "step": 2263
+ },
+ {
+ "epoch": 6.168937329700272,
+ "grad_norm": 9.942988395690918,
+ "learning_rate": 1.9947377397944974e-05,
+ "loss": 1.5427,
+ "step": 2264
+ },
+ {
+ "epoch": 6.1716621253406,
+ "grad_norm": 11.946412086486816,
+ "learning_rate": 1.994728694407499e-05,
+ "loss": 1.4629,
+ "step": 2265
+ },
+ {
+ "epoch": 6.174386920980926,
+ "grad_norm": 14.022274017333984,
+ "learning_rate": 1.9947196412735855e-05,
+ "loss": 1.9458,
+ "step": 2266
+ },
+ {
+ "epoch": 6.177111716621253,
+ "grad_norm": 11.036538124084473,
+ "learning_rate": 1.9947105803928272e-05,
+ "loss": 1.5564,
+ "step": 2267
+ },
+ {
+ "epoch": 6.179836512261581,
+ "grad_norm": 12.539093971252441,
+ "learning_rate": 1.994701511765295e-05,
+ "loss": 1.4727,
+ "step": 2268
+ },
+ {
+ "epoch": 6.182561307901907,
+ "grad_norm": 15.075506210327148,
+ "learning_rate": 1.9946924353910595e-05,
+ "loss": 1.5957,
+ "step": 2269
+ },
+ {
+ "epoch": 6.185286103542234,
+ "grad_norm": 11.200881958007812,
+ "learning_rate": 1.994683351270191e-05,
+ "loss": 1.6321,
+ "step": 2270
+ },
+ {
+ "epoch": 6.1880108991825615,
+ "grad_norm": 9.643436431884766,
+ "learning_rate": 1.994674259402761e-05,
+ "loss": 1.7334,
+ "step": 2271
+ },
+ {
+ "epoch": 6.190735694822888,
+ "grad_norm": 10.168499946594238,
+ "learning_rate": 1.99466515978884e-05,
+ "loss": 1.5505,
+ "step": 2272
+ },
+ {
+ "epoch": 6.193460490463215,
+ "grad_norm": 13.098001480102539,
+ "learning_rate": 1.9946560524284985e-05,
+ "loss": 1.6384,
+ "step": 2273
+ },
+ {
+ "epoch": 6.1961852861035425,
+ "grad_norm": 13.747922897338867,
+ "learning_rate": 1.9946469373218076e-05,
+ "loss": 1.4556,
+ "step": 2274
+ },
+ {
+ "epoch": 6.198910081743869,
+ "grad_norm": 12.153290748596191,
+ "learning_rate": 1.994637814468838e-05,
+ "loss": 1.6526,
+ "step": 2275
+ },
+ {
+ "epoch": 6.201634877384196,
+ "grad_norm": 10.517086029052734,
+ "learning_rate": 1.994628683869662e-05,
+ "loss": 1.4062,
+ "step": 2276
+ },
+ {
+ "epoch": 6.204359673024523,
+ "grad_norm": 19.21754264831543,
+ "learning_rate": 1.9946195455243494e-05,
+ "loss": 1.5022,
+ "step": 2277
+ },
+ {
+ "epoch": 6.20708446866485,
+ "grad_norm": 12.603913307189941,
+ "learning_rate": 1.9946103994329714e-05,
+ "loss": 1.6313,
+ "step": 2278
+ },
+ {
+ "epoch": 6.209809264305177,
+ "grad_norm": 17.378110885620117,
+ "learning_rate": 1.9946012455956004e-05,
+ "loss": 1.7715,
+ "step": 2279
+ },
+ {
+ "epoch": 6.212534059945504,
+ "grad_norm": 11.949447631835938,
+ "learning_rate": 1.9945920840123062e-05,
+ "loss": 1.583,
+ "step": 2280
+ },
+ {
+ "epoch": 6.215258855585831,
+ "grad_norm": 8.07461929321289,
+ "learning_rate": 1.9945829146831614e-05,
+ "loss": 1.4766,
+ "step": 2281
+ },
+ {
+ "epoch": 6.217983651226158,
+ "grad_norm": 9.490711212158203,
+ "learning_rate": 1.9945737376082363e-05,
+ "loss": 1.7275,
+ "step": 2282
+ },
+ {
+ "epoch": 6.220708446866485,
+ "grad_norm": 9.92374324798584,
+ "learning_rate": 1.9945645527876033e-05,
+ "loss": 1.6096,
+ "step": 2283
+ },
+ {
+ "epoch": 6.223433242506812,
+ "grad_norm": 15.487894058227539,
+ "learning_rate": 1.9945553602213336e-05,
+ "loss": 1.6487,
+ "step": 2284
+ },
+ {
+ "epoch": 6.226158038147139,
+ "grad_norm": 9.092809677124023,
+ "learning_rate": 1.994546159909499e-05,
+ "loss": 1.3423,
+ "step": 2285
+ },
+ {
+ "epoch": 6.228882833787466,
+ "grad_norm": 11.397137641906738,
+ "learning_rate": 1.9945369518521704e-05,
+ "loss": 1.7844,
+ "step": 2286
+ },
+ {
+ "epoch": 6.231607629427793,
+ "grad_norm": 10.459543228149414,
+ "learning_rate": 1.9945277360494204e-05,
+ "loss": 1.4954,
+ "step": 2287
+ },
+ {
+ "epoch": 6.23433242506812,
+ "grad_norm": 10.375653266906738,
+ "learning_rate": 1.99451851250132e-05,
+ "loss": 1.7891,
+ "step": 2288
+ },
+ {
+ "epoch": 6.237057220708447,
+ "grad_norm": 11.958422660827637,
+ "learning_rate": 1.994509281207942e-05,
+ "loss": 1.6511,
+ "step": 2289
+ },
+ {
+ "epoch": 6.239782016348774,
+ "grad_norm": 10.102315902709961,
+ "learning_rate": 1.9945000421693574e-05,
+ "loss": 1.6758,
+ "step": 2290
+ },
+ {
+ "epoch": 6.2425068119891005,
+ "grad_norm": 9.557490348815918,
+ "learning_rate": 1.9944907953856384e-05,
+ "loss": 1.5181,
+ "step": 2291
+ },
+ {
+ "epoch": 6.245231607629428,
+ "grad_norm": 11.85209846496582,
+ "learning_rate": 1.9944815408568572e-05,
+ "loss": 1.5681,
+ "step": 2292
+ },
+ {
+ "epoch": 6.247956403269755,
+ "grad_norm": 11.734000205993652,
+ "learning_rate": 1.9944722785830855e-05,
+ "loss": 1.7017,
+ "step": 2293
+ },
+ {
+ "epoch": 6.2506811989100814,
+ "grad_norm": 9.606616973876953,
+ "learning_rate": 1.994463008564396e-05,
+ "loss": 1.6003,
+ "step": 2294
+ },
+ {
+ "epoch": 6.253405994550409,
+ "grad_norm": 9.383480072021484,
+ "learning_rate": 1.9944537308008606e-05,
+ "loss": 1.4241,
+ "step": 2295
+ },
+ {
+ "epoch": 6.256130790190736,
+ "grad_norm": 9.445914268493652,
+ "learning_rate": 1.9944444452925514e-05,
+ "loss": 1.3701,
+ "step": 2296
+ },
+ {
+ "epoch": 6.258855585831062,
+ "grad_norm": 10.938509941101074,
+ "learning_rate": 1.994435152039541e-05,
+ "loss": 1.6641,
+ "step": 2297
+ },
+ {
+ "epoch": 6.26158038147139,
+ "grad_norm": 9.327269554138184,
+ "learning_rate": 1.9944258510419018e-05,
+ "loss": 1.6255,
+ "step": 2298
+ },
+ {
+ "epoch": 6.264305177111717,
+ "grad_norm": 21.856826782226562,
+ "learning_rate": 1.9944165422997058e-05,
+ "loss": 1.6892,
+ "step": 2299
+ },
+ {
+ "epoch": 6.267029972752043,
+ "grad_norm": 10.677403450012207,
+ "learning_rate": 1.994407225813026e-05,
+ "loss": 1.6177,
+ "step": 2300
+ },
+ {
+ "epoch": 6.269754768392371,
+ "grad_norm": 9.786881446838379,
+ "learning_rate": 1.9943979015819343e-05,
+ "loss": 1.6742,
+ "step": 2301
+ },
+ {
+ "epoch": 6.272479564032698,
+ "grad_norm": 10.130830764770508,
+ "learning_rate": 1.994388569606504e-05,
+ "loss": 1.6331,
+ "step": 2302
+ },
+ {
+ "epoch": 6.275204359673024,
+ "grad_norm": 10.384533882141113,
+ "learning_rate": 1.9943792298868076e-05,
+ "loss": 1.7134,
+ "step": 2303
+ },
+ {
+ "epoch": 6.277929155313352,
+ "grad_norm": 11.189226150512695,
+ "learning_rate": 1.994369882422918e-05,
+ "loss": 1.696,
+ "step": 2304
+ },
+ {
+ "epoch": 6.2806539509536785,
+ "grad_norm": 8.195403099060059,
+ "learning_rate": 1.9943605272149074e-05,
+ "loss": 1.4683,
+ "step": 2305
+ },
+ {
+ "epoch": 6.283378746594005,
+ "grad_norm": 10.447251319885254,
+ "learning_rate": 1.9943511642628488e-05,
+ "loss": 1.3259,
+ "step": 2306
+ },
+ {
+ "epoch": 6.286103542234333,
+ "grad_norm": 28.25797462463379,
+ "learning_rate": 1.9943417935668158e-05,
+ "loss": 1.6973,
+ "step": 2307
+ },
+ {
+ "epoch": 6.2888283378746594,
+ "grad_norm": 9.958805084228516,
+ "learning_rate": 1.9943324151268807e-05,
+ "loss": 1.7207,
+ "step": 2308
+ },
+ {
+ "epoch": 6.291553133514986,
+ "grad_norm": 10.296317100524902,
+ "learning_rate": 1.994323028943117e-05,
+ "loss": 1.5947,
+ "step": 2309
+ },
+ {
+ "epoch": 6.294277929155314,
+ "grad_norm": 13.088888168334961,
+ "learning_rate": 1.994313635015597e-05,
+ "loss": 1.6792,
+ "step": 2310
+ },
+ {
+ "epoch": 6.29700272479564,
+ "grad_norm": 10.405101776123047,
+ "learning_rate": 1.994304233344395e-05,
+ "loss": 1.6931,
+ "step": 2311
+ },
+ {
+ "epoch": 6.299727520435967,
+ "grad_norm": 10.78155517578125,
+ "learning_rate": 1.9942948239295833e-05,
+ "loss": 1.6045,
+ "step": 2312
+ },
+ {
+ "epoch": 6.302452316076295,
+ "grad_norm": 14.911649703979492,
+ "learning_rate": 1.9942854067712355e-05,
+ "loss": 1.4097,
+ "step": 2313
+ },
+ {
+ "epoch": 6.305177111716621,
+ "grad_norm": 11.39924430847168,
+ "learning_rate": 1.994275981869425e-05,
+ "loss": 1.6233,
+ "step": 2314
+ },
+ {
+ "epoch": 6.307901907356948,
+ "grad_norm": 13.633781433105469,
+ "learning_rate": 1.9942665492242256e-05,
+ "loss": 1.6016,
+ "step": 2315
+ },
+ {
+ "epoch": 6.310626702997276,
+ "grad_norm": 13.581009864807129,
+ "learning_rate": 1.9942571088357095e-05,
+ "loss": 1.4766,
+ "step": 2316
+ },
+ {
+ "epoch": 6.313351498637602,
+ "grad_norm": 11.985243797302246,
+ "learning_rate": 1.994247660703952e-05,
+ "loss": 1.5881,
+ "step": 2317
+ },
+ {
+ "epoch": 6.316076294277929,
+ "grad_norm": 14.857428550720215,
+ "learning_rate": 1.9942382048290248e-05,
+ "loss": 1.603,
+ "step": 2318
+ },
+ {
+ "epoch": 6.3188010899182565,
+ "grad_norm": 13.543075561523438,
+ "learning_rate": 1.994228741211003e-05,
+ "loss": 1.4346,
+ "step": 2319
+ },
+ {
+ "epoch": 6.321525885558583,
+ "grad_norm": 11.29600715637207,
+ "learning_rate": 1.9942192698499596e-05,
+ "loss": 1.6895,
+ "step": 2320
+ },
+ {
+ "epoch": 6.32425068119891,
+ "grad_norm": 10.868379592895508,
+ "learning_rate": 1.9942097907459687e-05,
+ "loss": 1.6465,
+ "step": 2321
+ },
+ {
+ "epoch": 6.3269754768392374,
+ "grad_norm": 25.268985748291016,
+ "learning_rate": 1.9942003038991035e-05,
+ "loss": 1.5962,
+ "step": 2322
+ },
+ {
+ "epoch": 6.329700272479564,
+ "grad_norm": 26.629039764404297,
+ "learning_rate": 1.9941908093094387e-05,
+ "loss": 1.4805,
+ "step": 2323
+ },
+ {
+ "epoch": 6.332425068119891,
+ "grad_norm": 12.916640281677246,
+ "learning_rate": 1.9941813069770478e-05,
+ "loss": 1.3672,
+ "step": 2324
+ },
+ {
+ "epoch": 6.335149863760218,
+ "grad_norm": 11.686497688293457,
+ "learning_rate": 1.9941717969020046e-05,
+ "loss": 1.6721,
+ "step": 2325
+ },
+ {
+ "epoch": 6.337874659400545,
+ "grad_norm": 10.163697242736816,
+ "learning_rate": 1.994162279084384e-05,
+ "loss": 1.4741,
+ "step": 2326
+ },
+ {
+ "epoch": 6.340599455040872,
+ "grad_norm": 10.932123184204102,
+ "learning_rate": 1.9941527535242592e-05,
+ "loss": 1.7891,
+ "step": 2327
+ },
+ {
+ "epoch": 6.343324250681199,
+ "grad_norm": 9.418354988098145,
+ "learning_rate": 1.9941432202217047e-05,
+ "loss": 1.5466,
+ "step": 2328
+ },
+ {
+ "epoch": 6.346049046321526,
+ "grad_norm": 11.555414199829102,
+ "learning_rate": 1.994133679176795e-05,
+ "loss": 1.6089,
+ "step": 2329
+ },
+ {
+ "epoch": 6.348773841961853,
+ "grad_norm": 12.213624000549316,
+ "learning_rate": 1.994124130389604e-05,
+ "loss": 1.5686,
+ "step": 2330
+ },
+ {
+ "epoch": 6.35149863760218,
+ "grad_norm": 13.881996154785156,
+ "learning_rate": 1.9941145738602065e-05,
+ "loss": 1.4187,
+ "step": 2331
+ },
+ {
+ "epoch": 6.354223433242507,
+ "grad_norm": 10.478837966918945,
+ "learning_rate": 1.9941050095886763e-05,
+ "loss": 1.7446,
+ "step": 2332
+ },
+ {
+ "epoch": 6.356948228882834,
+ "grad_norm": 12.292433738708496,
+ "learning_rate": 1.9940954375750888e-05,
+ "loss": 1.6624,
+ "step": 2333
+ },
+ {
+ "epoch": 6.359673024523161,
+ "grad_norm": 21.07522201538086,
+ "learning_rate": 1.994085857819518e-05,
+ "loss": 1.8042,
+ "step": 2334
+ },
+ {
+ "epoch": 6.362397820163488,
+ "grad_norm": 9.90341567993164,
+ "learning_rate": 1.9940762703220383e-05,
+ "loss": 1.4639,
+ "step": 2335
+ },
+ {
+ "epoch": 6.3651226158038146,
+ "grad_norm": 10.5038423538208,
+ "learning_rate": 1.9940666750827247e-05,
+ "loss": 1.7549,
+ "step": 2336
+ },
+ {
+ "epoch": 6.367847411444142,
+ "grad_norm": 13.10082721710205,
+ "learning_rate": 1.9940570721016516e-05,
+ "loss": 1.4827,
+ "step": 2337
+ },
+ {
+ "epoch": 6.370572207084469,
+ "grad_norm": 9.728696823120117,
+ "learning_rate": 1.994047461378894e-05,
+ "loss": 1.4875,
+ "step": 2338
+ },
+ {
+ "epoch": 6.3732970027247955,
+ "grad_norm": 10.2384614944458,
+ "learning_rate": 1.994037842914527e-05,
+ "loss": 1.7046,
+ "step": 2339
+ },
+ {
+ "epoch": 6.376021798365123,
+ "grad_norm": 23.558156967163086,
+ "learning_rate": 1.9940282167086255e-05,
+ "loss": 1.5261,
+ "step": 2340
+ },
+ {
+ "epoch": 6.37874659400545,
+ "grad_norm": 12.822075843811035,
+ "learning_rate": 1.9940185827612638e-05,
+ "loss": 1.5405,
+ "step": 2341
+ },
+ {
+ "epoch": 6.381471389645776,
+ "grad_norm": 12.047752380371094,
+ "learning_rate": 1.9940089410725174e-05,
+ "loss": 1.5564,
+ "step": 2342
+ },
+ {
+ "epoch": 6.384196185286104,
+ "grad_norm": 33.5240364074707,
+ "learning_rate": 1.9939992916424614e-05,
+ "loss": 1.4438,
+ "step": 2343
+ },
+ {
+ "epoch": 6.386920980926431,
+ "grad_norm": 10.042675018310547,
+ "learning_rate": 1.9939896344711714e-05,
+ "loss": 1.6416,
+ "step": 2344
+ },
+ {
+ "epoch": 6.389645776566757,
+ "grad_norm": 11.133225440979004,
+ "learning_rate": 1.9939799695587213e-05,
+ "loss": 1.6123,
+ "step": 2345
+ },
+ {
+ "epoch": 6.392370572207085,
+ "grad_norm": 19.349576950073242,
+ "learning_rate": 1.9939702969051876e-05,
+ "loss": 1.5417,
+ "step": 2346
+ },
+ {
+ "epoch": 6.395095367847412,
+ "grad_norm": 15.16633415222168,
+ "learning_rate": 1.993960616510645e-05,
+ "loss": 1.5361,
+ "step": 2347
+ },
+ {
+ "epoch": 6.397820163487738,
+ "grad_norm": 10.151996612548828,
+ "learning_rate": 1.9939509283751696e-05,
+ "loss": 1.4199,
+ "step": 2348
+ },
+ {
+ "epoch": 6.400544959128065,
+ "grad_norm": 12.841211318969727,
+ "learning_rate": 1.993941232498836e-05,
+ "loss": 1.4395,
+ "step": 2349
+ },
+ {
+ "epoch": 6.4032697547683926,
+ "grad_norm": 14.988808631896973,
+ "learning_rate": 1.9939315288817203e-05,
+ "loss": 1.6819,
+ "step": 2350
+ },
+ {
+ "epoch": 6.405994550408719,
+ "grad_norm": 10.59081745147705,
+ "learning_rate": 1.993921817523898e-05,
+ "loss": 1.5515,
+ "step": 2351
+ },
+ {
+ "epoch": 6.408719346049046,
+ "grad_norm": 10.21403694152832,
+ "learning_rate": 1.993912098425444e-05,
+ "loss": 1.3684,
+ "step": 2352
+ },
+ {
+ "epoch": 6.4114441416893735,
+ "grad_norm": 16.891313552856445,
+ "learning_rate": 1.993902371586435e-05,
+ "loss": 1.6753,
+ "step": 2353
+ },
+ {
+ "epoch": 6.4141689373297,
+ "grad_norm": 12.440431594848633,
+ "learning_rate": 1.993892637006946e-05,
+ "loss": 1.7651,
+ "step": 2354
+ },
+ {
+ "epoch": 6.416893732970027,
+ "grad_norm": 11.252609252929688,
+ "learning_rate": 1.993882894687053e-05,
+ "loss": 1.739,
+ "step": 2355
+ },
+ {
+ "epoch": 6.419618528610354,
+ "grad_norm": 8.985031127929688,
+ "learning_rate": 1.993873144626833e-05,
+ "loss": 1.5359,
+ "step": 2356
+ },
+ {
+ "epoch": 6.422343324250681,
+ "grad_norm": 10.893987655639648,
+ "learning_rate": 1.9938633868263597e-05,
+ "loss": 1.7124,
+ "step": 2357
+ },
+ {
+ "epoch": 6.425068119891008,
+ "grad_norm": 9.890556335449219,
+ "learning_rate": 1.993853621285711e-05,
+ "loss": 1.3611,
+ "step": 2358
+ },
+ {
+ "epoch": 6.427792915531335,
+ "grad_norm": 9.026385307312012,
+ "learning_rate": 1.993843848004962e-05,
+ "loss": 1.677,
+ "step": 2359
+ },
+ {
+ "epoch": 6.430517711171662,
+ "grad_norm": 9.886550903320312,
+ "learning_rate": 1.9938340669841893e-05,
+ "loss": 1.4731,
+ "step": 2360
+ },
+ {
+ "epoch": 6.433242506811989,
+ "grad_norm": 9.005744934082031,
+ "learning_rate": 1.993824278223469e-05,
+ "loss": 1.6106,
+ "step": 2361
+ },
+ {
+ "epoch": 6.435967302452316,
+ "grad_norm": 13.120516777038574,
+ "learning_rate": 1.993814481722877e-05,
+ "loss": 1.626,
+ "step": 2362
+ },
+ {
+ "epoch": 6.438692098092643,
+ "grad_norm": 12.961750984191895,
+ "learning_rate": 1.9938046774824897e-05,
+ "loss": 1.6194,
+ "step": 2363
+ },
+ {
+ "epoch": 6.44141689373297,
+ "grad_norm": 11.148823738098145,
+ "learning_rate": 1.9937948655023838e-05,
+ "loss": 1.6655,
+ "step": 2364
+ },
+ {
+ "epoch": 6.444141689373297,
+ "grad_norm": 8.781012535095215,
+ "learning_rate": 1.9937850457826354e-05,
+ "loss": 1.5259,
+ "step": 2365
+ },
+ {
+ "epoch": 6.446866485013624,
+ "grad_norm": 11.232917785644531,
+ "learning_rate": 1.993775218323321e-05,
+ "loss": 1.6318,
+ "step": 2366
+ },
+ {
+ "epoch": 6.449591280653951,
+ "grad_norm": 13.188098907470703,
+ "learning_rate": 1.993765383124517e-05,
+ "loss": 1.7705,
+ "step": 2367
+ },
+ {
+ "epoch": 6.452316076294278,
+ "grad_norm": 17.013540267944336,
+ "learning_rate": 1.9937555401863005e-05,
+ "loss": 1.583,
+ "step": 2368
+ },
+ {
+ "epoch": 6.455040871934605,
+ "grad_norm": 10.890372276306152,
+ "learning_rate": 1.9937456895087477e-05,
+ "loss": 1.616,
+ "step": 2369
+ },
+ {
+ "epoch": 6.4577656675749315,
+ "grad_norm": 10.225186347961426,
+ "learning_rate": 1.9937358310919356e-05,
+ "loss": 1.6235,
+ "step": 2370
+ },
+ {
+ "epoch": 6.460490463215259,
+ "grad_norm": 12.753676414489746,
+ "learning_rate": 1.9937259649359406e-05,
+ "loss": 1.6106,
+ "step": 2371
+ },
+ {
+ "epoch": 6.463215258855586,
+ "grad_norm": 10.8523530960083,
+ "learning_rate": 1.9937160910408396e-05,
+ "loss": 1.7925,
+ "step": 2372
+ },
+ {
+ "epoch": 6.4659400544959125,
+ "grad_norm": 10.743764877319336,
+ "learning_rate": 1.99370620940671e-05,
+ "loss": 1.5129,
+ "step": 2373
+ },
+ {
+ "epoch": 6.46866485013624,
+ "grad_norm": 8.791482925415039,
+ "learning_rate": 1.9936963200336287e-05,
+ "loss": 1.4031,
+ "step": 2374
+ },
+ {
+ "epoch": 6.471389645776567,
+ "grad_norm": 8.918050765991211,
+ "learning_rate": 1.9936864229216718e-05,
+ "loss": 1.3892,
+ "step": 2375
+ },
+ {
+ "epoch": 6.474114441416893,
+ "grad_norm": 9.868968963623047,
+ "learning_rate": 1.9936765180709173e-05,
+ "loss": 1.4968,
+ "step": 2376
+ },
+ {
+ "epoch": 6.476839237057221,
+ "grad_norm": 12.836007118225098,
+ "learning_rate": 1.993666605481442e-05,
+ "loss": 1.4861,
+ "step": 2377
+ },
+ {
+ "epoch": 6.479564032697548,
+ "grad_norm": 10.597851753234863,
+ "learning_rate": 1.9936566851533232e-05,
+ "loss": 1.4966,
+ "step": 2378
+ },
+ {
+ "epoch": 6.482288828337874,
+ "grad_norm": 8.851969718933105,
+ "learning_rate": 1.9936467570866384e-05,
+ "loss": 1.2188,
+ "step": 2379
+ },
+ {
+ "epoch": 6.485013623978202,
+ "grad_norm": 11.105555534362793,
+ "learning_rate": 1.9936368212814643e-05,
+ "loss": 1.7676,
+ "step": 2380
+ },
+ {
+ "epoch": 6.487738419618529,
+ "grad_norm": 10.325815200805664,
+ "learning_rate": 1.9936268777378785e-05,
+ "loss": 1.4563,
+ "step": 2381
+ },
+ {
+ "epoch": 6.490463215258855,
+ "grad_norm": 9.311816215515137,
+ "learning_rate": 1.993616926455959e-05,
+ "loss": 1.4685,
+ "step": 2382
+ },
+ {
+ "epoch": 6.493188010899183,
+ "grad_norm": 9.058845520019531,
+ "learning_rate": 1.9936069674357826e-05,
+ "loss": 1.5105,
+ "step": 2383
+ },
+ {
+ "epoch": 6.4959128065395095,
+ "grad_norm": 24.743215560913086,
+ "learning_rate": 1.993597000677427e-05,
+ "loss": 1.5391,
+ "step": 2384
+ },
+ {
+ "epoch": 6.498637602179836,
+ "grad_norm": 10.185152053833008,
+ "learning_rate": 1.9935870261809703e-05,
+ "loss": 1.6858,
+ "step": 2385
+ },
+ {
+ "epoch": 6.501362397820164,
+ "grad_norm": 9.319504737854004,
+ "learning_rate": 1.9935770439464896e-05,
+ "loss": 1.5894,
+ "step": 2386
+ },
+ {
+ "epoch": 6.5040871934604905,
+ "grad_norm": 9.412171363830566,
+ "learning_rate": 1.9935670539740626e-05,
+ "loss": 1.5222,
+ "step": 2387
+ },
+ {
+ "epoch": 6.506811989100817,
+ "grad_norm": 16.216398239135742,
+ "learning_rate": 1.9935570562637675e-05,
+ "loss": 1.5078,
+ "step": 2388
+ },
+ {
+ "epoch": 6.509536784741145,
+ "grad_norm": 11.490829467773438,
+ "learning_rate": 1.993547050815682e-05,
+ "loss": 1.6562,
+ "step": 2389
+ },
+ {
+ "epoch": 6.512261580381471,
+ "grad_norm": 10.294737815856934,
+ "learning_rate": 1.9935370376298842e-05,
+ "loss": 1.4717,
+ "step": 2390
+ },
+ {
+ "epoch": 6.514986376021798,
+ "grad_norm": 31.39698028564453,
+ "learning_rate": 1.9935270167064523e-05,
+ "loss": 1.4307,
+ "step": 2391
+ },
+ {
+ "epoch": 6.517711171662126,
+ "grad_norm": 11.936128616333008,
+ "learning_rate": 1.9935169880454635e-05,
+ "loss": 1.5737,
+ "step": 2392
+ },
+ {
+ "epoch": 6.520435967302452,
+ "grad_norm": 15.877132415771484,
+ "learning_rate": 1.9935069516469964e-05,
+ "loss": 1.562,
+ "step": 2393
+ },
+ {
+ "epoch": 6.523160762942779,
+ "grad_norm": 10.936116218566895,
+ "learning_rate": 1.993496907511129e-05,
+ "loss": 1.6309,
+ "step": 2394
+ },
+ {
+ "epoch": 6.525885558583107,
+ "grad_norm": 8.006392478942871,
+ "learning_rate": 1.99348685563794e-05,
+ "loss": 1.4521,
+ "step": 2395
+ },
+ {
+ "epoch": 6.528610354223433,
+ "grad_norm": 11.510782241821289,
+ "learning_rate": 1.993476796027507e-05,
+ "loss": 1.6775,
+ "step": 2396
+ },
+ {
+ "epoch": 6.53133514986376,
+ "grad_norm": 15.735798835754395,
+ "learning_rate": 1.993466728679909e-05,
+ "loss": 1.6934,
+ "step": 2397
+ },
+ {
+ "epoch": 6.5340599455040875,
+ "grad_norm": 13.140318870544434,
+ "learning_rate": 1.993456653595224e-05,
+ "loss": 1.3596,
+ "step": 2398
+ },
+ {
+ "epoch": 6.536784741144414,
+ "grad_norm": 11.08877944946289,
+ "learning_rate": 1.9934465707735304e-05,
+ "loss": 1.6812,
+ "step": 2399
+ },
+ {
+ "epoch": 6.539509536784741,
+ "grad_norm": 12.190179824829102,
+ "learning_rate": 1.993436480214907e-05,
+ "loss": 1.4988,
+ "step": 2400
+ },
+ {
+ "epoch": 6.5422343324250685,
+ "grad_norm": 20.818950653076172,
+ "learning_rate": 1.993426381919432e-05,
+ "loss": 1.4949,
+ "step": 2401
+ },
+ {
+ "epoch": 6.544959128065395,
+ "grad_norm": 13.064900398254395,
+ "learning_rate": 1.993416275887185e-05,
+ "loss": 1.7405,
+ "step": 2402
+ },
+ {
+ "epoch": 6.547683923705722,
+ "grad_norm": 12.698445320129395,
+ "learning_rate": 1.9934061621182433e-05,
+ "loss": 1.5542,
+ "step": 2403
+ },
+ {
+ "epoch": 6.550408719346049,
+ "grad_norm": 11.332972526550293,
+ "learning_rate": 1.993396040612687e-05,
+ "loss": 1.4771,
+ "step": 2404
+ },
+ {
+ "epoch": 6.553133514986376,
+ "grad_norm": 14.005719184875488,
+ "learning_rate": 1.9933859113705937e-05,
+ "loss": 1.5176,
+ "step": 2405
+ },
+ {
+ "epoch": 6.555858310626703,
+ "grad_norm": 11.294587135314941,
+ "learning_rate": 1.9933757743920433e-05,
+ "loss": 1.6316,
+ "step": 2406
+ },
+ {
+ "epoch": 6.55858310626703,
+ "grad_norm": 10.821269035339355,
+ "learning_rate": 1.993365629677114e-05,
+ "loss": 1.6152,
+ "step": 2407
+ },
+ {
+ "epoch": 6.561307901907357,
+ "grad_norm": 10.606854438781738,
+ "learning_rate": 1.9933554772258853e-05,
+ "loss": 1.6602,
+ "step": 2408
+ },
+ {
+ "epoch": 6.564032697547684,
+ "grad_norm": 13.516182899475098,
+ "learning_rate": 1.9933453170384363e-05,
+ "loss": 1.5715,
+ "step": 2409
+ },
+ {
+ "epoch": 6.566757493188011,
+ "grad_norm": 10.468656539916992,
+ "learning_rate": 1.993335149114846e-05,
+ "loss": 1.4802,
+ "step": 2410
+ },
+ {
+ "epoch": 6.569482288828338,
+ "grad_norm": 11.097125053405762,
+ "learning_rate": 1.9933249734551934e-05,
+ "loss": 1.5691,
+ "step": 2411
+ },
+ {
+ "epoch": 6.572207084468665,
+ "grad_norm": 10.488286972045898,
+ "learning_rate": 1.9933147900595576e-05,
+ "loss": 1.6445,
+ "step": 2412
+ },
+ {
+ "epoch": 6.574931880108992,
+ "grad_norm": 14.706908226013184,
+ "learning_rate": 1.9933045989280188e-05,
+ "loss": 1.4363,
+ "step": 2413
+ },
+ {
+ "epoch": 6.577656675749319,
+ "grad_norm": 10.991456985473633,
+ "learning_rate": 1.993294400060655e-05,
+ "loss": 1.6826,
+ "step": 2414
+ },
+ {
+ "epoch": 6.580381471389646,
+ "grad_norm": 14.5840425491333,
+ "learning_rate": 1.9932841934575468e-05,
+ "loss": 1.8613,
+ "step": 2415
+ },
+ {
+ "epoch": 6.583106267029972,
+ "grad_norm": 13.031789779663086,
+ "learning_rate": 1.9932739791187733e-05,
+ "loss": 1.7136,
+ "step": 2416
+ },
+ {
+ "epoch": 6.5858310626703,
+ "grad_norm": 10.509198188781738,
+ "learning_rate": 1.9932637570444138e-05,
+ "loss": 1.4597,
+ "step": 2417
+ },
+ {
+ "epoch": 6.5885558583106265,
+ "grad_norm": 10.194021224975586,
+ "learning_rate": 1.9932535272345482e-05,
+ "loss": 1.6216,
+ "step": 2418
+ },
+ {
+ "epoch": 6.591280653950953,
+ "grad_norm": 7.701805114746094,
+ "learning_rate": 1.9932432896892563e-05,
+ "loss": 1.4561,
+ "step": 2419
+ },
+ {
+ "epoch": 6.594005449591281,
+ "grad_norm": 10.746231079101562,
+ "learning_rate": 1.9932330444086175e-05,
+ "loss": 1.6001,
+ "step": 2420
+ },
+ {
+ "epoch": 6.5967302452316074,
+ "grad_norm": 15.582562446594238,
+ "learning_rate": 1.993222791392712e-05,
+ "loss": 1.3887,
+ "step": 2421
+ },
+ {
+ "epoch": 6.599455040871934,
+ "grad_norm": 9.70804500579834,
+ "learning_rate": 1.9932125306416185e-05,
+ "loss": 1.5044,
+ "step": 2422
+ },
+ {
+ "epoch": 6.602179836512262,
+ "grad_norm": 10.683446884155273,
+ "learning_rate": 1.9932022621554185e-05,
+ "loss": 1.6841,
+ "step": 2423
+ },
+ {
+ "epoch": 6.604904632152588,
+ "grad_norm": 11.003694534301758,
+ "learning_rate": 1.993191985934191e-05,
+ "loss": 1.5566,
+ "step": 2424
+ },
+ {
+ "epoch": 6.607629427792915,
+ "grad_norm": 20.193443298339844,
+ "learning_rate": 1.9931817019780165e-05,
+ "loss": 1.7471,
+ "step": 2425
+ },
+ {
+ "epoch": 6.610354223433243,
+ "grad_norm": 10.888099670410156,
+ "learning_rate": 1.993171410286975e-05,
+ "loss": 1.5444,
+ "step": 2426
+ },
+ {
+ "epoch": 6.613079019073569,
+ "grad_norm": 9.50598430633545,
+ "learning_rate": 1.9931611108611458e-05,
+ "loss": 1.6055,
+ "step": 2427
+ },
+ {
+ "epoch": 6.615803814713896,
+ "grad_norm": 9.374114990234375,
+ "learning_rate": 1.9931508037006106e-05,
+ "loss": 1.6694,
+ "step": 2428
+ },
+ {
+ "epoch": 6.618528610354224,
+ "grad_norm": 10.345595359802246,
+ "learning_rate": 1.9931404888054486e-05,
+ "loss": 1.6248,
+ "step": 2429
+ },
+ {
+ "epoch": 6.62125340599455,
+ "grad_norm": 12.015646934509277,
+ "learning_rate": 1.99313016617574e-05,
+ "loss": 1.3783,
+ "step": 2430
+ },
+ {
+ "epoch": 6.623978201634877,
+ "grad_norm": 10.096620559692383,
+ "learning_rate": 1.9931198358115665e-05,
+ "loss": 1.2698,
+ "step": 2431
+ },
+ {
+ "epoch": 6.6267029972752045,
+ "grad_norm": 13.323445320129395,
+ "learning_rate": 1.9931094977130072e-05,
+ "loss": 1.5256,
+ "step": 2432
+ },
+ {
+ "epoch": 6.629427792915531,
+ "grad_norm": 10.597187995910645,
+ "learning_rate": 1.9930991518801434e-05,
+ "loss": 1.6113,
+ "step": 2433
+ },
+ {
+ "epoch": 6.632152588555858,
+ "grad_norm": 11.72788143157959,
+ "learning_rate": 1.993088798313055e-05,
+ "loss": 1.6721,
+ "step": 2434
+ },
+ {
+ "epoch": 6.6348773841961854,
+ "grad_norm": 12.03602123260498,
+ "learning_rate": 1.993078437011823e-05,
+ "loss": 1.6377,
+ "step": 2435
+ },
+ {
+ "epoch": 6.637602179836512,
+ "grad_norm": 10.530377388000488,
+ "learning_rate": 1.9930680679765283e-05,
+ "loss": 1.6748,
+ "step": 2436
+ },
+ {
+ "epoch": 6.640326975476839,
+ "grad_norm": 9.889983177185059,
+ "learning_rate": 1.9930576912072514e-05,
+ "loss": 1.6863,
+ "step": 2437
+ },
+ {
+ "epoch": 6.643051771117166,
+ "grad_norm": 16.77570152282715,
+ "learning_rate": 1.993047306704073e-05,
+ "loss": 1.4214,
+ "step": 2438
+ },
+ {
+ "epoch": 6.645776566757493,
+ "grad_norm": 9.434869766235352,
+ "learning_rate": 1.9930369144670744e-05,
+ "loss": 1.585,
+ "step": 2439
+ },
+ {
+ "epoch": 6.64850136239782,
+ "grad_norm": 10.706549644470215,
+ "learning_rate": 1.993026514496336e-05,
+ "loss": 1.6279,
+ "step": 2440
+ },
+ {
+ "epoch": 6.651226158038147,
+ "grad_norm": 10.672386169433594,
+ "learning_rate": 1.9930161067919392e-05,
+ "loss": 1.5964,
+ "step": 2441
+ },
+ {
+ "epoch": 6.653950953678474,
+ "grad_norm": 14.484672546386719,
+ "learning_rate": 1.9930056913539647e-05,
+ "loss": 1.6155,
+ "step": 2442
+ },
+ {
+ "epoch": 6.656675749318801,
+ "grad_norm": 9.874717712402344,
+ "learning_rate": 1.9929952681824944e-05,
+ "loss": 1.6836,
+ "step": 2443
+ },
+ {
+ "epoch": 6.659400544959128,
+ "grad_norm": 10.416218757629395,
+ "learning_rate": 1.9929848372776085e-05,
+ "loss": 1.6025,
+ "step": 2444
+ },
+ {
+ "epoch": 6.662125340599455,
+ "grad_norm": 12.917311668395996,
+ "learning_rate": 1.9929743986393886e-05,
+ "loss": 1.6995,
+ "step": 2445
+ },
+ {
+ "epoch": 6.664850136239782,
+ "grad_norm": 10.260004043579102,
+ "learning_rate": 1.9929639522679163e-05,
+ "loss": 1.4712,
+ "step": 2446
+ },
+ {
+ "epoch": 6.667574931880109,
+ "grad_norm": 8.553717613220215,
+ "learning_rate": 1.9929534981632726e-05,
+ "loss": 1.572,
+ "step": 2447
+ },
+ {
+ "epoch": 6.670299727520436,
+ "grad_norm": 8.03495979309082,
+ "learning_rate": 1.9929430363255387e-05,
+ "loss": 1.3491,
+ "step": 2448
+ },
+ {
+ "epoch": 6.6730245231607626,
+ "grad_norm": 8.828189849853516,
+ "learning_rate": 1.9929325667547968e-05,
+ "loss": 1.6265,
+ "step": 2449
+ },
+ {
+ "epoch": 6.67574931880109,
+ "grad_norm": 10.107748031616211,
+ "learning_rate": 1.9929220894511275e-05,
+ "loss": 1.5894,
+ "step": 2450
+ },
+ {
+ "epoch": 6.678474114441417,
+ "grad_norm": 10.143497467041016,
+ "learning_rate": 1.9929116044146137e-05,
+ "loss": 1.6353,
+ "step": 2451
+ },
+ {
+ "epoch": 6.6811989100817435,
+ "grad_norm": 11.173709869384766,
+ "learning_rate": 1.9929011116453358e-05,
+ "loss": 1.6279,
+ "step": 2452
+ },
+ {
+ "epoch": 6.683923705722071,
+ "grad_norm": 10.3662109375,
+ "learning_rate": 1.9928906111433762e-05,
+ "loss": 1.4197,
+ "step": 2453
+ },
+ {
+ "epoch": 6.686648501362398,
+ "grad_norm": 9.1519775390625,
+ "learning_rate": 1.9928801029088162e-05,
+ "loss": 1.4307,
+ "step": 2454
+ },
+ {
+ "epoch": 6.689373297002724,
+ "grad_norm": 11.98711109161377,
+ "learning_rate": 1.9928695869417383e-05,
+ "loss": 1.7588,
+ "step": 2455
+ },
+ {
+ "epoch": 6.692098092643052,
+ "grad_norm": 12.33102798461914,
+ "learning_rate": 1.9928590632422236e-05,
+ "loss": 1.5356,
+ "step": 2456
+ },
+ {
+ "epoch": 6.694822888283379,
+ "grad_norm": 13.80027961730957,
+ "learning_rate": 1.9928485318103545e-05,
+ "loss": 1.5417,
+ "step": 2457
+ },
+ {
+ "epoch": 6.697547683923705,
+ "grad_norm": 11.349905967712402,
+ "learning_rate": 1.992837992646213e-05,
+ "loss": 1.8628,
+ "step": 2458
+ },
+ {
+ "epoch": 6.700272479564033,
+ "grad_norm": 12.577153205871582,
+ "learning_rate": 1.9928274457498818e-05,
+ "loss": 1.5457,
+ "step": 2459
+ },
+ {
+ "epoch": 6.70299727520436,
+ "grad_norm": 12.215507507324219,
+ "learning_rate": 1.9928168911214415e-05,
+ "loss": 1.5699,
+ "step": 2460
+ },
+ {
+ "epoch": 6.705722070844686,
+ "grad_norm": 11.409568786621094,
+ "learning_rate": 1.9928063287609758e-05,
+ "loss": 1.6504,
+ "step": 2461
+ },
+ {
+ "epoch": 6.708446866485014,
+ "grad_norm": 11.919694900512695,
+ "learning_rate": 1.9927957586685664e-05,
+ "loss": 1.5984,
+ "step": 2462
+ },
+ {
+ "epoch": 6.7111716621253406,
+ "grad_norm": 11.449212074279785,
+ "learning_rate": 1.992785180844295e-05,
+ "loss": 1.5847,
+ "step": 2463
+ },
+ {
+ "epoch": 6.713896457765667,
+ "grad_norm": 9.151398658752441,
+ "learning_rate": 1.9927745952882452e-05,
+ "loss": 1.5081,
+ "step": 2464
+ },
+ {
+ "epoch": 6.716621253405995,
+ "grad_norm": 10.904823303222656,
+ "learning_rate": 1.9927640020004985e-05,
+ "loss": 1.5444,
+ "step": 2465
+ },
+ {
+ "epoch": 6.7193460490463215,
+ "grad_norm": 9.86526870727539,
+ "learning_rate": 1.9927534009811377e-05,
+ "loss": 1.6147,
+ "step": 2466
+ },
+ {
+ "epoch": 6.722070844686648,
+ "grad_norm": 10.476258277893066,
+ "learning_rate": 1.9927427922302452e-05,
+ "loss": 1.6111,
+ "step": 2467
+ },
+ {
+ "epoch": 6.724795640326976,
+ "grad_norm": 9.763236045837402,
+ "learning_rate": 1.9927321757479043e-05,
+ "loss": 1.4932,
+ "step": 2468
+ },
+ {
+ "epoch": 6.727520435967302,
+ "grad_norm": 12.400291442871094,
+ "learning_rate": 1.992721551534197e-05,
+ "loss": 1.491,
+ "step": 2469
+ },
+ {
+ "epoch": 6.730245231607629,
+ "grad_norm": 11.978157043457031,
+ "learning_rate": 1.9927109195892062e-05,
+ "loss": 1.4448,
+ "step": 2470
+ },
+ {
+ "epoch": 6.732970027247957,
+ "grad_norm": 9.739986419677734,
+ "learning_rate": 1.9927002799130144e-05,
+ "loss": 1.7478,
+ "step": 2471
+ },
+ {
+ "epoch": 6.735694822888283,
+ "grad_norm": 10.663016319274902,
+ "learning_rate": 1.992689632505705e-05,
+ "loss": 1.5623,
+ "step": 2472
+ },
+ {
+ "epoch": 6.73841961852861,
+ "grad_norm": 12.673657417297363,
+ "learning_rate": 1.9926789773673606e-05,
+ "loss": 1.771,
+ "step": 2473
+ },
+ {
+ "epoch": 6.741144414168938,
+ "grad_norm": 13.936773300170898,
+ "learning_rate": 1.9926683144980643e-05,
+ "loss": 1.7021,
+ "step": 2474
+ },
+ {
+ "epoch": 6.743869209809264,
+ "grad_norm": 11.60373592376709,
+ "learning_rate": 1.992657643897899e-05,
+ "loss": 1.7454,
+ "step": 2475
+ },
+ {
+ "epoch": 6.746594005449591,
+ "grad_norm": 10.127052307128906,
+ "learning_rate": 1.992646965566948e-05,
+ "loss": 1.5261,
+ "step": 2476
+ },
+ {
+ "epoch": 6.7493188010899186,
+ "grad_norm": 11.759267807006836,
+ "learning_rate": 1.9926362795052947e-05,
+ "loss": 1.5005,
+ "step": 2477
+ },
+ {
+ "epoch": 6.752043596730245,
+ "grad_norm": 13.64344596862793,
+ "learning_rate": 1.9926255857130216e-05,
+ "loss": 1.645,
+ "step": 2478
+ },
+ {
+ "epoch": 6.754768392370572,
+ "grad_norm": 11.076778411865234,
+ "learning_rate": 1.9926148841902123e-05,
+ "loss": 1.4646,
+ "step": 2479
+ },
+ {
+ "epoch": 6.7574931880108995,
+ "grad_norm": 15.128584861755371,
+ "learning_rate": 1.9926041749369507e-05,
+ "loss": 1.6904,
+ "step": 2480
+ },
+ {
+ "epoch": 6.760217983651226,
+ "grad_norm": 11.720351219177246,
+ "learning_rate": 1.9925934579533195e-05,
+ "loss": 1.728,
+ "step": 2481
+ },
+ {
+ "epoch": 6.762942779291553,
+ "grad_norm": 8.59024429321289,
+ "learning_rate": 1.9925827332394023e-05,
+ "loss": 1.4097,
+ "step": 2482
+ },
+ {
+ "epoch": 6.76566757493188,
+ "grad_norm": 13.756746292114258,
+ "learning_rate": 1.9925720007952826e-05,
+ "loss": 1.6008,
+ "step": 2483
+ },
+ {
+ "epoch": 6.768392370572207,
+ "grad_norm": 11.337132453918457,
+ "learning_rate": 1.9925612606210446e-05,
+ "loss": 1.4539,
+ "step": 2484
+ },
+ {
+ "epoch": 6.771117166212534,
+ "grad_norm": 11.355990409851074,
+ "learning_rate": 1.992550512716771e-05,
+ "loss": 1.738,
+ "step": 2485
+ },
+ {
+ "epoch": 6.773841961852861,
+ "grad_norm": 12.595316886901855,
+ "learning_rate": 1.9925397570825463e-05,
+ "loss": 1.6526,
+ "step": 2486
+ },
+ {
+ "epoch": 6.776566757493188,
+ "grad_norm": 10.657020568847656,
+ "learning_rate": 1.9925289937184534e-05,
+ "loss": 1.6196,
+ "step": 2487
+ },
+ {
+ "epoch": 6.779291553133515,
+ "grad_norm": 12.440933227539062,
+ "learning_rate": 1.992518222624577e-05,
+ "loss": 1.6235,
+ "step": 2488
+ },
+ {
+ "epoch": 6.782016348773842,
+ "grad_norm": 9.319437026977539,
+ "learning_rate": 1.992507443801001e-05,
+ "loss": 1.6362,
+ "step": 2489
+ },
+ {
+ "epoch": 6.784741144414169,
+ "grad_norm": 41.49929428100586,
+ "learning_rate": 1.9924966572478083e-05,
+ "loss": 1.5034,
+ "step": 2490
+ },
+ {
+ "epoch": 6.787465940054496,
+ "grad_norm": 15.431757926940918,
+ "learning_rate": 1.992485862965084e-05,
+ "loss": 1.4822,
+ "step": 2491
+ },
+ {
+ "epoch": 6.790190735694823,
+ "grad_norm": 13.493185043334961,
+ "learning_rate": 1.9924750609529116e-05,
+ "loss": 1.4744,
+ "step": 2492
+ },
+ {
+ "epoch": 6.79291553133515,
+ "grad_norm": 18.08843421936035,
+ "learning_rate": 1.992464251211375e-05,
+ "loss": 1.6089,
+ "step": 2493
+ },
+ {
+ "epoch": 6.795640326975477,
+ "grad_norm": 12.009065628051758,
+ "learning_rate": 1.992453433740559e-05,
+ "loss": 1.6089,
+ "step": 2494
+ },
+ {
+ "epoch": 6.798365122615804,
+ "grad_norm": 11.761157989501953,
+ "learning_rate": 1.9924426085405478e-05,
+ "loss": 1.5273,
+ "step": 2495
+ },
+ {
+ "epoch": 6.801089918256131,
+ "grad_norm": 10.267550468444824,
+ "learning_rate": 1.9924317756114255e-05,
+ "loss": 1.5486,
+ "step": 2496
+ },
+ {
+ "epoch": 6.8038147138964575,
+ "grad_norm": 11.865041732788086,
+ "learning_rate": 1.9924209349532763e-05,
+ "loss": 1.5554,
+ "step": 2497
+ },
+ {
+ "epoch": 6.806539509536785,
+ "grad_norm": 9.561129570007324,
+ "learning_rate": 1.992410086566185e-05,
+ "loss": 1.4812,
+ "step": 2498
+ },
+ {
+ "epoch": 6.809264305177112,
+ "grad_norm": 9.084714889526367,
+ "learning_rate": 1.9923992304502357e-05,
+ "loss": 1.3855,
+ "step": 2499
+ },
+ {
+ "epoch": 6.8119891008174385,
+ "grad_norm": 12.381909370422363,
+ "learning_rate": 1.9923883666055133e-05,
+ "loss": 1.5867,
+ "step": 2500
+ },
+ {
+ "epoch": 6.814713896457766,
+ "grad_norm": 15.723135948181152,
+ "learning_rate": 1.992377495032102e-05,
+ "loss": 1.6187,
+ "step": 2501
+ },
+ {
+ "epoch": 6.817438692098093,
+ "grad_norm": 16.490381240844727,
+ "learning_rate": 1.992366615730087e-05,
+ "loss": 1.6401,
+ "step": 2502
+ },
+ {
+ "epoch": 6.820163487738419,
+ "grad_norm": 13.186235427856445,
+ "learning_rate": 1.9923557286995524e-05,
+ "loss": 1.4634,
+ "step": 2503
+ },
+ {
+ "epoch": 6.822888283378747,
+ "grad_norm": 12.261408805847168,
+ "learning_rate": 1.9923448339405835e-05,
+ "loss": 1.4092,
+ "step": 2504
+ },
+ {
+ "epoch": 6.825613079019074,
+ "grad_norm": 21.39244842529297,
+ "learning_rate": 1.992333931453265e-05,
+ "loss": 1.6294,
+ "step": 2505
+ },
+ {
+ "epoch": 6.8283378746594,
+ "grad_norm": 12.436821937561035,
+ "learning_rate": 1.992323021237682e-05,
+ "loss": 1.5833,
+ "step": 2506
+ },
+ {
+ "epoch": 6.831062670299728,
+ "grad_norm": 13.260921478271484,
+ "learning_rate": 1.992312103293919e-05,
+ "loss": 1.5767,
+ "step": 2507
+ },
+ {
+ "epoch": 6.833787465940055,
+ "grad_norm": 15.177225112915039,
+ "learning_rate": 1.9923011776220612e-05,
+ "loss": 1.5896,
+ "step": 2508
+ },
+ {
+ "epoch": 6.836512261580381,
+ "grad_norm": 15.003098487854004,
+ "learning_rate": 1.992290244222194e-05,
+ "loss": 1.8267,
+ "step": 2509
+ },
+ {
+ "epoch": 6.839237057220709,
+ "grad_norm": 11.336455345153809,
+ "learning_rate": 1.992279303094402e-05,
+ "loss": 1.5039,
+ "step": 2510
+ },
+ {
+ "epoch": 6.8419618528610355,
+ "grad_norm": 11.886491775512695,
+ "learning_rate": 1.9922683542387707e-05,
+ "loss": 1.6057,
+ "step": 2511
+ },
+ {
+ "epoch": 6.844686648501362,
+ "grad_norm": 14.85074234008789,
+ "learning_rate": 1.9922573976553857e-05,
+ "loss": 1.7595,
+ "step": 2512
+ },
+ {
+ "epoch": 6.84741144414169,
+ "grad_norm": 11.935297966003418,
+ "learning_rate": 1.9922464333443318e-05,
+ "loss": 1.4692,
+ "step": 2513
+ },
+ {
+ "epoch": 6.8501362397820165,
+ "grad_norm": 12.974621772766113,
+ "learning_rate": 1.9922354613056946e-05,
+ "loss": 1.5085,
+ "step": 2514
+ },
+ {
+ "epoch": 6.852861035422343,
+ "grad_norm": 10.358409881591797,
+ "learning_rate": 1.9922244815395597e-05,
+ "loss": 1.4092,
+ "step": 2515
+ },
+ {
+ "epoch": 6.855585831062671,
+ "grad_norm": 29.964595794677734,
+ "learning_rate": 1.9922134940460126e-05,
+ "loss": 1.5103,
+ "step": 2516
+ },
+ {
+ "epoch": 6.858310626702997,
+ "grad_norm": 12.04236125946045,
+ "learning_rate": 1.9922024988251384e-05,
+ "loss": 1.4392,
+ "step": 2517
+ },
+ {
+ "epoch": 6.861035422343324,
+ "grad_norm": 10.837052345275879,
+ "learning_rate": 1.9921914958770235e-05,
+ "loss": 1.5547,
+ "step": 2518
+ },
+ {
+ "epoch": 6.863760217983652,
+ "grad_norm": 12.022932052612305,
+ "learning_rate": 1.992180485201753e-05,
+ "loss": 1.5935,
+ "step": 2519
+ },
+ {
+ "epoch": 6.866485013623978,
+ "grad_norm": 13.637711524963379,
+ "learning_rate": 1.9921694667994126e-05,
+ "loss": 1.749,
+ "step": 2520
+ },
+ {
+ "epoch": 6.869209809264305,
+ "grad_norm": 10.001995086669922,
+ "learning_rate": 1.9921584406700883e-05,
+ "loss": 1.918,
+ "step": 2521
+ },
+ {
+ "epoch": 6.871934604904633,
+ "grad_norm": 29.265378952026367,
+ "learning_rate": 1.9921474068138665e-05,
+ "loss": 1.5459,
+ "step": 2522
+ },
+ {
+ "epoch": 6.874659400544959,
+ "grad_norm": 12.276293754577637,
+ "learning_rate": 1.9921363652308324e-05,
+ "loss": 1.4941,
+ "step": 2523
+ },
+ {
+ "epoch": 6.877384196185286,
+ "grad_norm": 11.9083251953125,
+ "learning_rate": 1.9921253159210718e-05,
+ "loss": 1.6221,
+ "step": 2524
+ },
+ {
+ "epoch": 6.8801089918256135,
+ "grad_norm": 11.969018936157227,
+ "learning_rate": 1.9921142588846717e-05,
+ "loss": 1.5964,
+ "step": 2525
+ },
+ {
+ "epoch": 6.88283378746594,
+ "grad_norm": 9.593964576721191,
+ "learning_rate": 1.9921031941217173e-05,
+ "loss": 1.458,
+ "step": 2526
+ },
+ {
+ "epoch": 6.885558583106267,
+ "grad_norm": 9.690338134765625,
+ "learning_rate": 1.9920921216322953e-05,
+ "loss": 1.3936,
+ "step": 2527
+ },
+ {
+ "epoch": 6.8882833787465945,
+ "grad_norm": 10.085105895996094,
+ "learning_rate": 1.992081041416492e-05,
+ "loss": 1.5444,
+ "step": 2528
+ },
+ {
+ "epoch": 6.891008174386921,
+ "grad_norm": 14.536722183227539,
+ "learning_rate": 1.9920699534743932e-05,
+ "loss": 1.7988,
+ "step": 2529
+ },
+ {
+ "epoch": 6.893732970027248,
+ "grad_norm": 10.853922843933105,
+ "learning_rate": 1.9920588578060854e-05,
+ "loss": 1.6394,
+ "step": 2530
+ },
+ {
+ "epoch": 6.896457765667575,
+ "grad_norm": 12.865930557250977,
+ "learning_rate": 1.9920477544116554e-05,
+ "loss": 1.481,
+ "step": 2531
+ },
+ {
+ "epoch": 6.899182561307902,
+ "grad_norm": 9.311355590820312,
+ "learning_rate": 1.9920366432911895e-05,
+ "loss": 1.7463,
+ "step": 2532
+ },
+ {
+ "epoch": 6.901907356948229,
+ "grad_norm": 13.008605003356934,
+ "learning_rate": 1.992025524444774e-05,
+ "loss": 1.6851,
+ "step": 2533
+ },
+ {
+ "epoch": 6.904632152588556,
+ "grad_norm": 17.339941024780273,
+ "learning_rate": 1.9920143978724958e-05,
+ "loss": 1.6743,
+ "step": 2534
+ },
+ {
+ "epoch": 6.907356948228883,
+ "grad_norm": 11.650899887084961,
+ "learning_rate": 1.992003263574441e-05,
+ "loss": 1.675,
+ "step": 2535
+ },
+ {
+ "epoch": 6.91008174386921,
+ "grad_norm": 9.174309730529785,
+ "learning_rate": 1.991992121550697e-05,
+ "loss": 1.5598,
+ "step": 2536
+ },
+ {
+ "epoch": 6.912806539509537,
+ "grad_norm": 9.838683128356934,
+ "learning_rate": 1.9919809718013505e-05,
+ "loss": 1.48,
+ "step": 2537
+ },
+ {
+ "epoch": 6.915531335149864,
+ "grad_norm": 8.482483863830566,
+ "learning_rate": 1.991969814326488e-05,
+ "loss": 1.5427,
+ "step": 2538
+ },
+ {
+ "epoch": 6.918256130790191,
+ "grad_norm": 11.64597225189209,
+ "learning_rate": 1.9919586491261962e-05,
+ "loss": 1.6533,
+ "step": 2539
+ },
+ {
+ "epoch": 6.920980926430518,
+ "grad_norm": 11.544082641601562,
+ "learning_rate": 1.9919474762005625e-05,
+ "loss": 1.8208,
+ "step": 2540
+ },
+ {
+ "epoch": 6.923705722070845,
+ "grad_norm": 12.081391334533691,
+ "learning_rate": 1.991936295549674e-05,
+ "loss": 1.7241,
+ "step": 2541
+ },
+ {
+ "epoch": 6.926430517711172,
+ "grad_norm": 12.315491676330566,
+ "learning_rate": 1.9919251071736176e-05,
+ "loss": 1.6943,
+ "step": 2542
+ },
+ {
+ "epoch": 6.929155313351498,
+ "grad_norm": 8.521120071411133,
+ "learning_rate": 1.9919139110724798e-05,
+ "loss": 1.6357,
+ "step": 2543
+ },
+ {
+ "epoch": 6.931880108991826,
+ "grad_norm": 9.169511795043945,
+ "learning_rate": 1.991902707246349e-05,
+ "loss": 1.5173,
+ "step": 2544
+ },
+ {
+ "epoch": 6.9346049046321525,
+ "grad_norm": 9.596213340759277,
+ "learning_rate": 1.9918914956953116e-05,
+ "loss": 1.5217,
+ "step": 2545
+ },
+ {
+ "epoch": 6.937329700272479,
+ "grad_norm": 8.34455394744873,
+ "learning_rate": 1.991880276419455e-05,
+ "loss": 1.5686,
+ "step": 2546
+ },
+ {
+ "epoch": 6.940054495912807,
+ "grad_norm": 9.147504806518555,
+ "learning_rate": 1.991869049418867e-05,
+ "loss": 1.4917,
+ "step": 2547
+ },
+ {
+ "epoch": 6.9427792915531334,
+ "grad_norm": 11.00312614440918,
+ "learning_rate": 1.9918578146936346e-05,
+ "loss": 1.8115,
+ "step": 2548
+ },
+ {
+ "epoch": 6.94550408719346,
+ "grad_norm": 11.378459930419922,
+ "learning_rate": 1.9918465722438456e-05,
+ "loss": 1.6875,
+ "step": 2549
+ },
+ {
+ "epoch": 6.948228882833788,
+ "grad_norm": 9.615368843078613,
+ "learning_rate": 1.9918353220695875e-05,
+ "loss": 1.6191,
+ "step": 2550
+ },
+ {
+ "epoch": 6.950953678474114,
+ "grad_norm": 8.775830268859863,
+ "learning_rate": 1.9918240641709475e-05,
+ "loss": 1.5447,
+ "step": 2551
+ },
+ {
+ "epoch": 6.953678474114441,
+ "grad_norm": 9.215841293334961,
+ "learning_rate": 1.991812798548014e-05,
+ "loss": 1.7075,
+ "step": 2552
+ },
+ {
+ "epoch": 6.956403269754769,
+ "grad_norm": 11.271383285522461,
+ "learning_rate": 1.991801525200874e-05,
+ "loss": 1.5977,
+ "step": 2553
+ },
+ {
+ "epoch": 6.959128065395095,
+ "grad_norm": 9.250890731811523,
+ "learning_rate": 1.9917902441296156e-05,
+ "loss": 1.6226,
+ "step": 2554
+ },
+ {
+ "epoch": 6.961852861035422,
+ "grad_norm": 8.830961227416992,
+ "learning_rate": 1.991778955334327e-05,
+ "loss": 1.5269,
+ "step": 2555
+ },
+ {
+ "epoch": 6.96457765667575,
+ "grad_norm": 11.751460075378418,
+ "learning_rate": 1.991767658815096e-05,
+ "loss": 1.7437,
+ "step": 2556
+ },
+ {
+ "epoch": 6.967302452316076,
+ "grad_norm": 12.019865036010742,
+ "learning_rate": 1.9917563545720098e-05,
+ "loss": 1.7788,
+ "step": 2557
+ },
+ {
+ "epoch": 6.970027247956403,
+ "grad_norm": 9.664366722106934,
+ "learning_rate": 1.9917450426051572e-05,
+ "loss": 1.595,
+ "step": 2558
+ },
+ {
+ "epoch": 6.9727520435967305,
+ "grad_norm": 10.568838119506836,
+ "learning_rate": 1.9917337229146266e-05,
+ "loss": 1.5591,
+ "step": 2559
+ },
+ {
+ "epoch": 6.975476839237057,
+ "grad_norm": 7.393206596374512,
+ "learning_rate": 1.9917223955005053e-05,
+ "loss": 1.4487,
+ "step": 2560
+ },
+ {
+ "epoch": 6.978201634877384,
+ "grad_norm": 9.041869163513184,
+ "learning_rate": 1.9917110603628818e-05,
+ "loss": 1.5823,
+ "step": 2561
+ },
+ {
+ "epoch": 6.9809264305177114,
+ "grad_norm": 8.957469940185547,
+ "learning_rate": 1.9916997175018445e-05,
+ "loss": 1.4365,
+ "step": 2562
+ },
+ {
+ "epoch": 6.983651226158038,
+ "grad_norm": 8.627134323120117,
+ "learning_rate": 1.9916883669174818e-05,
+ "loss": 1.5144,
+ "step": 2563
+ },
+ {
+ "epoch": 6.986376021798365,
+ "grad_norm": 9.489056587219238,
+ "learning_rate": 1.991677008609882e-05,
+ "loss": 1.6389,
+ "step": 2564
+ },
+ {
+ "epoch": 6.989100817438692,
+ "grad_norm": 10.777949333190918,
+ "learning_rate": 1.9916656425791338e-05,
+ "loss": 1.3235,
+ "step": 2565
+ },
+ {
+ "epoch": 6.991825613079019,
+ "grad_norm": 11.10266399383545,
+ "learning_rate": 1.9916542688253253e-05,
+ "loss": 1.6667,
+ "step": 2566
+ },
+ {
+ "epoch": 6.994550408719346,
+ "grad_norm": 16.274316787719727,
+ "learning_rate": 1.9916428873485452e-05,
+ "loss": 1.7275,
+ "step": 2567
+ },
+ {
+ "epoch": 6.997275204359673,
+ "grad_norm": 10.998518943786621,
+ "learning_rate": 1.9916314981488822e-05,
+ "loss": 1.5061,
+ "step": 2568
+ },
+ {
+ "epoch": 7.0,
+ "grad_norm": 13.744210243225098,
+ "learning_rate": 1.9916201012264255e-05,
+ "loss": 1.4661,
+ "step": 2569
+ },
+ {
+ "epoch": 7.002724795640327,
+ "grad_norm": 12.455055236816406,
+ "learning_rate": 1.9916086965812627e-05,
+ "loss": 1.5776,
+ "step": 2570
+ },
+ {
+ "epoch": 7.005449591280654,
+ "grad_norm": 8.5689115524292,
+ "learning_rate": 1.9915972842134837e-05,
+ "loss": 1.5989,
+ "step": 2571
+ },
+ {
+ "epoch": 7.008174386920981,
+ "grad_norm": 9.611258506774902,
+ "learning_rate": 1.991585864123177e-05,
+ "loss": 1.5684,
+ "step": 2572
+ },
+ {
+ "epoch": 7.010899182561308,
+ "grad_norm": 10.000003814697266,
+ "learning_rate": 1.991574436310431e-05,
+ "loss": 1.6243,
+ "step": 2573
+ },
+ {
+ "epoch": 7.013623978201635,
+ "grad_norm": 9.323932647705078,
+ "learning_rate": 1.991563000775336e-05,
+ "loss": 1.6792,
+ "step": 2574
+ },
+ {
+ "epoch": 7.016348773841962,
+ "grad_norm": 13.849161148071289,
+ "learning_rate": 1.9915515575179793e-05,
+ "loss": 1.4006,
+ "step": 2575
+ },
+ {
+ "epoch": 7.0190735694822886,
+ "grad_norm": 12.729543685913086,
+ "learning_rate": 1.9915401065384518e-05,
+ "loss": 1.6182,
+ "step": 2576
+ },
+ {
+ "epoch": 7.021798365122616,
+ "grad_norm": 9.167952537536621,
+ "learning_rate": 1.9915286478368414e-05,
+ "loss": 1.5718,
+ "step": 2577
+ },
+ {
+ "epoch": 7.024523160762943,
+ "grad_norm": 10.326859474182129,
+ "learning_rate": 1.9915171814132378e-05,
+ "loss": 1.3718,
+ "step": 2578
+ },
+ {
+ "epoch": 7.0272479564032695,
+ "grad_norm": 9.17179012298584,
+ "learning_rate": 1.9915057072677305e-05,
+ "loss": 1.4885,
+ "step": 2579
+ },
+ {
+ "epoch": 7.029972752043597,
+ "grad_norm": 10.229643821716309,
+ "learning_rate": 1.9914942254004086e-05,
+ "loss": 1.668,
+ "step": 2580
+ },
+ {
+ "epoch": 7.032697547683924,
+ "grad_norm": 12.10188102722168,
+ "learning_rate": 1.9914827358113616e-05,
+ "loss": 1.3757,
+ "step": 2581
+ },
+ {
+ "epoch": 7.03542234332425,
+ "grad_norm": 8.516680717468262,
+ "learning_rate": 1.991471238500679e-05,
+ "loss": 1.5469,
+ "step": 2582
+ },
+ {
+ "epoch": 7.038147138964578,
+ "grad_norm": 16.977920532226562,
+ "learning_rate": 1.9914597334684502e-05,
+ "loss": 1.5964,
+ "step": 2583
+ },
+ {
+ "epoch": 7.040871934604905,
+ "grad_norm": 10.091428756713867,
+ "learning_rate": 1.9914482207147648e-05,
+ "loss": 1.5515,
+ "step": 2584
+ },
+ {
+ "epoch": 7.043596730245231,
+ "grad_norm": 11.44006061553955,
+ "learning_rate": 1.9914367002397127e-05,
+ "loss": 1.5601,
+ "step": 2585
+ },
+ {
+ "epoch": 7.046321525885559,
+ "grad_norm": 10.585381507873535,
+ "learning_rate": 1.9914251720433837e-05,
+ "loss": 1.3669,
+ "step": 2586
+ },
+ {
+ "epoch": 7.049046321525886,
+ "grad_norm": 12.6299467086792,
+ "learning_rate": 1.9914136361258673e-05,
+ "loss": 1.7812,
+ "step": 2587
+ },
+ {
+ "epoch": 7.051771117166212,
+ "grad_norm": 23.789104461669922,
+ "learning_rate": 1.991402092487253e-05,
+ "loss": 1.6086,
+ "step": 2588
+ },
+ {
+ "epoch": 7.05449591280654,
+ "grad_norm": 10.832141876220703,
+ "learning_rate": 1.991390541127632e-05,
+ "loss": 1.5283,
+ "step": 2589
+ },
+ {
+ "epoch": 7.0572207084468666,
+ "grad_norm": 9.405333518981934,
+ "learning_rate": 1.9913789820470925e-05,
+ "loss": 1.6958,
+ "step": 2590
+ },
+ {
+ "epoch": 7.059945504087193,
+ "grad_norm": 10.257238388061523,
+ "learning_rate": 1.9913674152457254e-05,
+ "loss": 1.4604,
+ "step": 2591
+ },
+ {
+ "epoch": 7.062670299727521,
+ "grad_norm": 9.994807243347168,
+ "learning_rate": 1.991355840723621e-05,
+ "loss": 1.5125,
+ "step": 2592
+ },
+ {
+ "epoch": 7.0653950953678475,
+ "grad_norm": 10.089841842651367,
+ "learning_rate": 1.9913442584808694e-05,
+ "loss": 1.4565,
+ "step": 2593
+ },
+ {
+ "epoch": 7.068119891008174,
+ "grad_norm": 9.78079605102539,
+ "learning_rate": 1.9913326685175606e-05,
+ "loss": 1.4182,
+ "step": 2594
+ },
+ {
+ "epoch": 7.070844686648502,
+ "grad_norm": 15.902073860168457,
+ "learning_rate": 1.991321070833785e-05,
+ "loss": 1.3955,
+ "step": 2595
+ },
+ {
+ "epoch": 7.073569482288828,
+ "grad_norm": 17.8822078704834,
+ "learning_rate": 1.9913094654296324e-05,
+ "loss": 1.4043,
+ "step": 2596
+ },
+ {
+ "epoch": 7.076294277929155,
+ "grad_norm": 13.469987869262695,
+ "learning_rate": 1.9912978523051936e-05,
+ "loss": 1.3516,
+ "step": 2597
+ },
+ {
+ "epoch": 7.079019073569483,
+ "grad_norm": 18.184144973754883,
+ "learning_rate": 1.9912862314605594e-05,
+ "loss": 1.4761,
+ "step": 2598
+ },
+ {
+ "epoch": 7.081743869209809,
+ "grad_norm": 10.457294464111328,
+ "learning_rate": 1.9912746028958195e-05,
+ "loss": 1.5325,
+ "step": 2599
+ },
+ {
+ "epoch": 7.084468664850136,
+ "grad_norm": 13.190240859985352,
+ "learning_rate": 1.9912629666110656e-05,
+ "loss": 1.5283,
+ "step": 2600
+ },
+ {
+ "epoch": 7.087193460490464,
+ "grad_norm": 12.5562105178833,
+ "learning_rate": 1.9912513226063866e-05,
+ "loss": 1.3442,
+ "step": 2601
+ },
+ {
+ "epoch": 7.08991825613079,
+ "grad_norm": 11.620115280151367,
+ "learning_rate": 1.9912396708818748e-05,
+ "loss": 1.5303,
+ "step": 2602
+ },
+ {
+ "epoch": 7.092643051771117,
+ "grad_norm": 16.161975860595703,
+ "learning_rate": 1.9912280114376205e-05,
+ "loss": 1.7246,
+ "step": 2603
+ },
+ {
+ "epoch": 7.0953678474114446,
+ "grad_norm": 12.94520378112793,
+ "learning_rate": 1.9912163442737143e-05,
+ "loss": 1.4026,
+ "step": 2604
+ },
+ {
+ "epoch": 7.098092643051771,
+ "grad_norm": 32.33180236816406,
+ "learning_rate": 1.9912046693902466e-05,
+ "loss": 1.6226,
+ "step": 2605
+ },
+ {
+ "epoch": 7.100817438692098,
+ "grad_norm": 14.084209442138672,
+ "learning_rate": 1.9911929867873093e-05,
+ "loss": 1.6404,
+ "step": 2606
+ },
+ {
+ "epoch": 7.1035422343324255,
+ "grad_norm": 12.616997718811035,
+ "learning_rate": 1.991181296464993e-05,
+ "loss": 1.3081,
+ "step": 2607
+ },
+ {
+ "epoch": 7.106267029972752,
+ "grad_norm": 11.319100379943848,
+ "learning_rate": 1.9911695984233885e-05,
+ "loss": 1.3953,
+ "step": 2608
+ },
+ {
+ "epoch": 7.108991825613079,
+ "grad_norm": 19.24335289001465,
+ "learning_rate": 1.991157892662587e-05,
+ "loss": 1.5649,
+ "step": 2609
+ },
+ {
+ "epoch": 7.111716621253406,
+ "grad_norm": 19.046993255615234,
+ "learning_rate": 1.99114617918268e-05,
+ "loss": 1.4734,
+ "step": 2610
+ },
+ {
+ "epoch": 7.114441416893733,
+ "grad_norm": 35.106143951416016,
+ "learning_rate": 1.991134457983758e-05,
+ "loss": 1.6211,
+ "step": 2611
+ },
+ {
+ "epoch": 7.11716621253406,
+ "grad_norm": 12.001912117004395,
+ "learning_rate": 1.991122729065913e-05,
+ "loss": 1.5916,
+ "step": 2612
+ },
+ {
+ "epoch": 7.1198910081743865,
+ "grad_norm": 14.034006118774414,
+ "learning_rate": 1.9911109924292362e-05,
+ "loss": 1.3315,
+ "step": 2613
+ },
+ {
+ "epoch": 7.122615803814714,
+ "grad_norm": 24.54100799560547,
+ "learning_rate": 1.991099248073819e-05,
+ "loss": 1.3369,
+ "step": 2614
+ },
+ {
+ "epoch": 7.125340599455041,
+ "grad_norm": 18.295448303222656,
+ "learning_rate": 1.991087495999752e-05,
+ "loss": 1.4895,
+ "step": 2615
+ },
+ {
+ "epoch": 7.128065395095367,
+ "grad_norm": 10.534333229064941,
+ "learning_rate": 1.9910757362071282e-05,
+ "loss": 1.282,
+ "step": 2616
+ },
+ {
+ "epoch": 7.130790190735695,
+ "grad_norm": 16.28651237487793,
+ "learning_rate": 1.9910639686960382e-05,
+ "loss": 1.387,
+ "step": 2617
+ },
+ {
+ "epoch": 7.133514986376022,
+ "grad_norm": 17.221111297607422,
+ "learning_rate": 1.991052193466574e-05,
+ "loss": 1.5898,
+ "step": 2618
+ },
+ {
+ "epoch": 7.136239782016348,
+ "grad_norm": 12.247292518615723,
+ "learning_rate": 1.991040410518827e-05,
+ "loss": 1.3435,
+ "step": 2619
+ },
+ {
+ "epoch": 7.138964577656676,
+ "grad_norm": 14.799015998840332,
+ "learning_rate": 1.9910286198528897e-05,
+ "loss": 1.5859,
+ "step": 2620
+ },
+ {
+ "epoch": 7.141689373297003,
+ "grad_norm": 13.674405097961426,
+ "learning_rate": 1.9910168214688527e-05,
+ "loss": 1.4153,
+ "step": 2621
+ },
+ {
+ "epoch": 7.144414168937329,
+ "grad_norm": 54.96337890625,
+ "learning_rate": 1.991005015366809e-05,
+ "loss": 1.3645,
+ "step": 2622
+ },
+ {
+ "epoch": 7.147138964577657,
+ "grad_norm": 19.959274291992188,
+ "learning_rate": 1.9909932015468504e-05,
+ "loss": 1.5613,
+ "step": 2623
+ },
+ {
+ "epoch": 7.1498637602179835,
+ "grad_norm": 15.985265731811523,
+ "learning_rate": 1.9909813800090682e-05,
+ "loss": 1.4902,
+ "step": 2624
+ },
+ {
+ "epoch": 7.15258855585831,
+ "grad_norm": 19.88857650756836,
+ "learning_rate": 1.9909695507535552e-05,
+ "loss": 1.5559,
+ "step": 2625
+ },
+ {
+ "epoch": 7.155313351498638,
+ "grad_norm": 18.16654396057129,
+ "learning_rate": 1.9909577137804028e-05,
+ "loss": 1.4475,
+ "step": 2626
+ },
+ {
+ "epoch": 7.1580381471389645,
+ "grad_norm": 18.870697021484375,
+ "learning_rate": 1.9909458690897038e-05,
+ "loss": 1.2856,
+ "step": 2627
+ },
+ {
+ "epoch": 7.160762942779291,
+ "grad_norm": 35.931060791015625,
+ "learning_rate": 1.9909340166815504e-05,
+ "loss": 1.5642,
+ "step": 2628
+ },
+ {
+ "epoch": 7.163487738419619,
+ "grad_norm": 23.01498794555664,
+ "learning_rate": 1.9909221565560348e-05,
+ "loss": 1.4214,
+ "step": 2629
+ },
+ {
+ "epoch": 7.166212534059945,
+ "grad_norm": 16.723155975341797,
+ "learning_rate": 1.9909102887132494e-05,
+ "loss": 1.541,
+ "step": 2630
+ },
+ {
+ "epoch": 7.168937329700272,
+ "grad_norm": 14.408949851989746,
+ "learning_rate": 1.9908984131532865e-05,
+ "loss": 1.4429,
+ "step": 2631
+ },
+ {
+ "epoch": 7.1716621253406,
+ "grad_norm": 54.55207824707031,
+ "learning_rate": 1.9908865298762384e-05,
+ "loss": 1.697,
+ "step": 2632
+ },
+ {
+ "epoch": 7.174386920980926,
+ "grad_norm": 37.38616943359375,
+ "learning_rate": 1.990874638882198e-05,
+ "loss": 1.374,
+ "step": 2633
+ },
+ {
+ "epoch": 7.177111716621253,
+ "grad_norm": 15.120404243469238,
+ "learning_rate": 1.990862740171258e-05,
+ "loss": 1.4287,
+ "step": 2634
+ },
+ {
+ "epoch": 7.179836512261581,
+ "grad_norm": 16.63327407836914,
+ "learning_rate": 1.990850833743511e-05,
+ "loss": 1.5898,
+ "step": 2635
+ },
+ {
+ "epoch": 7.182561307901907,
+ "grad_norm": 16.18759536743164,
+ "learning_rate": 1.9908389195990492e-05,
+ "loss": 1.5266,
+ "step": 2636
+ },
+ {
+ "epoch": 7.185286103542234,
+ "grad_norm": 19.903820037841797,
+ "learning_rate": 1.9908269977379658e-05,
+ "loss": 1.4631,
+ "step": 2637
+ },
+ {
+ "epoch": 7.1880108991825615,
+ "grad_norm": 20.78038787841797,
+ "learning_rate": 1.990815068160354e-05,
+ "loss": 1.4155,
+ "step": 2638
+ },
+ {
+ "epoch": 7.190735694822888,
+ "grad_norm": 65.83699798583984,
+ "learning_rate": 1.990803130866306e-05,
+ "loss": 1.468,
+ "step": 2639
+ },
+ {
+ "epoch": 7.193460490463215,
+ "grad_norm": 12.93549633026123,
+ "learning_rate": 1.990791185855915e-05,
+ "loss": 1.561,
+ "step": 2640
+ },
+ {
+ "epoch": 7.1961852861035425,
+ "grad_norm": 13.24904727935791,
+ "learning_rate": 1.9907792331292747e-05,
+ "loss": 1.4609,
+ "step": 2641
+ },
+ {
+ "epoch": 7.198910081743869,
+ "grad_norm": 14.132883071899414,
+ "learning_rate": 1.9907672726864772e-05,
+ "loss": 1.5366,
+ "step": 2642
+ },
+ {
+ "epoch": 7.201634877384196,
+ "grad_norm": 21.078025817871094,
+ "learning_rate": 1.9907553045276158e-05,
+ "loss": 1.6311,
+ "step": 2643
+ },
+ {
+ "epoch": 7.204359673024523,
+ "grad_norm": 17.943523406982422,
+ "learning_rate": 1.9907433286527843e-05,
+ "loss": 1.5339,
+ "step": 2644
+ },
+ {
+ "epoch": 7.20708446866485,
+ "grad_norm": 11.418760299682617,
+ "learning_rate": 1.990731345062076e-05,
+ "loss": 1.7036,
+ "step": 2645
+ },
+ {
+ "epoch": 7.209809264305177,
+ "grad_norm": 28.595006942749023,
+ "learning_rate": 1.9907193537555832e-05,
+ "loss": 1.5769,
+ "step": 2646
+ },
+ {
+ "epoch": 7.212534059945504,
+ "grad_norm": 17.612186431884766,
+ "learning_rate": 1.9907073547334002e-05,
+ "loss": 1.3901,
+ "step": 2647
+ },
+ {
+ "epoch": 7.215258855585831,
+ "grad_norm": 13.393107414245605,
+ "learning_rate": 1.9906953479956206e-05,
+ "loss": 1.4292,
+ "step": 2648
+ },
+ {
+ "epoch": 7.217983651226158,
+ "grad_norm": 15.393351554870605,
+ "learning_rate": 1.990683333542337e-05,
+ "loss": 1.5747,
+ "step": 2649
+ },
+ {
+ "epoch": 7.220708446866485,
+ "grad_norm": 11.29178237915039,
+ "learning_rate": 1.990671311373644e-05,
+ "loss": 1.5178,
+ "step": 2650
+ },
+ {
+ "epoch": 7.223433242506812,
+ "grad_norm": 10.266595840454102,
+ "learning_rate": 1.9906592814896343e-05,
+ "loss": 1.6135,
+ "step": 2651
+ },
+ {
+ "epoch": 7.226158038147139,
+ "grad_norm": 13.928282737731934,
+ "learning_rate": 1.990647243890402e-05,
+ "loss": 1.5029,
+ "step": 2652
+ },
+ {
+ "epoch": 7.228882833787466,
+ "grad_norm": 11.35490894317627,
+ "learning_rate": 1.990635198576041e-05,
+ "loss": 1.5884,
+ "step": 2653
+ },
+ {
+ "epoch": 7.231607629427793,
+ "grad_norm": 11.80521011352539,
+ "learning_rate": 1.990623145546645e-05,
+ "loss": 1.5706,
+ "step": 2654
+ },
+ {
+ "epoch": 7.23433242506812,
+ "grad_norm": 16.76881217956543,
+ "learning_rate": 1.9906110848023074e-05,
+ "loss": 1.5825,
+ "step": 2655
+ },
+ {
+ "epoch": 7.237057220708447,
+ "grad_norm": 29.365928649902344,
+ "learning_rate": 1.990599016343123e-05,
+ "loss": 1.5627,
+ "step": 2656
+ },
+ {
+ "epoch": 7.239782016348774,
+ "grad_norm": 16.728803634643555,
+ "learning_rate": 1.9905869401691854e-05,
+ "loss": 1.467,
+ "step": 2657
+ },
+ {
+ "epoch": 7.2425068119891005,
+ "grad_norm": 8.949308395385742,
+ "learning_rate": 1.990574856280588e-05,
+ "loss": 1.4473,
+ "step": 2658
+ },
+ {
+ "epoch": 7.245231607629428,
+ "grad_norm": 14.383991241455078,
+ "learning_rate": 1.9905627646774262e-05,
+ "loss": 1.5891,
+ "step": 2659
+ },
+ {
+ "epoch": 7.247956403269755,
+ "grad_norm": 14.508793830871582,
+ "learning_rate": 1.990550665359793e-05,
+ "loss": 1.6321,
+ "step": 2660
+ },
+ {
+ "epoch": 7.2506811989100814,
+ "grad_norm": 13.771912574768066,
+ "learning_rate": 1.9905385583277834e-05,
+ "loss": 1.624,
+ "step": 2661
+ },
+ {
+ "epoch": 7.253405994550409,
+ "grad_norm": 18.602794647216797,
+ "learning_rate": 1.9905264435814913e-05,
+ "loss": 1.4531,
+ "step": 2662
+ },
+ {
+ "epoch": 7.256130790190736,
+ "grad_norm": 12.330023765563965,
+ "learning_rate": 1.990514321121011e-05,
+ "loss": 1.4819,
+ "step": 2663
+ },
+ {
+ "epoch": 7.258855585831062,
+ "grad_norm": 16.42203712463379,
+ "learning_rate": 1.9905021909464372e-05,
+ "loss": 1.5513,
+ "step": 2664
+ },
+ {
+ "epoch": 7.26158038147139,
+ "grad_norm": 13.549471855163574,
+ "learning_rate": 1.9904900530578643e-05,
+ "loss": 1.5002,
+ "step": 2665
+ },
+ {
+ "epoch": 7.264305177111717,
+ "grad_norm": 10.781227111816406,
+ "learning_rate": 1.9904779074553864e-05,
+ "loss": 1.5864,
+ "step": 2666
+ },
+ {
+ "epoch": 7.267029972752043,
+ "grad_norm": 18.10679054260254,
+ "learning_rate": 1.990465754139099e-05,
+ "loss": 1.647,
+ "step": 2667
+ },
+ {
+ "epoch": 7.269754768392371,
+ "grad_norm": 12.661219596862793,
+ "learning_rate": 1.9904535931090957e-05,
+ "loss": 1.6035,
+ "step": 2668
+ },
+ {
+ "epoch": 7.272479564032698,
+ "grad_norm": 12.699142456054688,
+ "learning_rate": 1.9904414243654716e-05,
+ "loss": 1.4862,
+ "step": 2669
+ },
+ {
+ "epoch": 7.275204359673024,
+ "grad_norm": 12.930998802185059,
+ "learning_rate": 1.9904292479083217e-05,
+ "loss": 1.4475,
+ "step": 2670
+ },
+ {
+ "epoch": 7.277929155313352,
+ "grad_norm": 12.240517616271973,
+ "learning_rate": 1.9904170637377408e-05,
+ "loss": 1.6685,
+ "step": 2671
+ },
+ {
+ "epoch": 7.2806539509536785,
+ "grad_norm": 18.07870864868164,
+ "learning_rate": 1.9904048718538238e-05,
+ "loss": 1.4385,
+ "step": 2672
+ },
+ {
+ "epoch": 7.283378746594005,
+ "grad_norm": 15.409016609191895,
+ "learning_rate": 1.9903926722566655e-05,
+ "loss": 1.4524,
+ "step": 2673
+ },
+ {
+ "epoch": 7.286103542234333,
+ "grad_norm": 10.995656967163086,
+ "learning_rate": 1.990380464946361e-05,
+ "loss": 1.4021,
+ "step": 2674
+ },
+ {
+ "epoch": 7.2888283378746594,
+ "grad_norm": 16.83498764038086,
+ "learning_rate": 1.990368249923005e-05,
+ "loss": 1.7432,
+ "step": 2675
+ },
+ {
+ "epoch": 7.291553133514986,
+ "grad_norm": 11.144207954406738,
+ "learning_rate": 1.990356027186693e-05,
+ "loss": 1.4312,
+ "step": 2676
+ },
+ {
+ "epoch": 7.294277929155314,
+ "grad_norm": 10.032282829284668,
+ "learning_rate": 1.9903437967375202e-05,
+ "loss": 1.4509,
+ "step": 2677
+ },
+ {
+ "epoch": 7.29700272479564,
+ "grad_norm": 11.693425178527832,
+ "learning_rate": 1.990331558575582e-05,
+ "loss": 1.5181,
+ "step": 2678
+ },
+ {
+ "epoch": 7.299727520435967,
+ "grad_norm": 16.339767456054688,
+ "learning_rate": 1.990319312700973e-05,
+ "loss": 1.4441,
+ "step": 2679
+ },
+ {
+ "epoch": 7.302452316076295,
+ "grad_norm": 13.989665985107422,
+ "learning_rate": 1.9903070591137898e-05,
+ "loss": 1.2375,
+ "step": 2680
+ },
+ {
+ "epoch": 7.305177111716621,
+ "grad_norm": 14.806517601013184,
+ "learning_rate": 1.9902947978141265e-05,
+ "loss": 1.4504,
+ "step": 2681
+ },
+ {
+ "epoch": 7.307901907356948,
+ "grad_norm": 15.431193351745605,
+ "learning_rate": 1.9902825288020794e-05,
+ "loss": 1.5498,
+ "step": 2682
+ },
+ {
+ "epoch": 7.310626702997276,
+ "grad_norm": 14.844110488891602,
+ "learning_rate": 1.990270252077744e-05,
+ "loss": 1.8154,
+ "step": 2683
+ },
+ {
+ "epoch": 7.313351498637602,
+ "grad_norm": 12.310922622680664,
+ "learning_rate": 1.9902579676412154e-05,
+ "loss": 1.5247,
+ "step": 2684
+ },
+ {
+ "epoch": 7.316076294277929,
+ "grad_norm": 11.25191593170166,
+ "learning_rate": 1.9902456754925898e-05,
+ "loss": 1.4375,
+ "step": 2685
+ },
+ {
+ "epoch": 7.3188010899182565,
+ "grad_norm": 12.803166389465332,
+ "learning_rate": 1.990233375631963e-05,
+ "loss": 1.5872,
+ "step": 2686
+ },
+ {
+ "epoch": 7.321525885558583,
+ "grad_norm": 11.506999969482422,
+ "learning_rate": 1.99022106805943e-05,
+ "loss": 1.469,
+ "step": 2687
+ },
+ {
+ "epoch": 7.32425068119891,
+ "grad_norm": 11.528977394104004,
+ "learning_rate": 1.9902087527750876e-05,
+ "loss": 1.6492,
+ "step": 2688
+ },
+ {
+ "epoch": 7.3269754768392374,
+ "grad_norm": 15.200810432434082,
+ "learning_rate": 1.990196429779031e-05,
+ "loss": 1.6326,
+ "step": 2689
+ },
+ {
+ "epoch": 7.329700272479564,
+ "grad_norm": 8.964735984802246,
+ "learning_rate": 1.9901840990713566e-05,
+ "loss": 1.4773,
+ "step": 2690
+ },
+ {
+ "epoch": 7.332425068119891,
+ "grad_norm": 13.632256507873535,
+ "learning_rate": 1.9901717606521607e-05,
+ "loss": 1.6499,
+ "step": 2691
+ },
+ {
+ "epoch": 7.335149863760218,
+ "grad_norm": 10.2181396484375,
+ "learning_rate": 1.9901594145215382e-05,
+ "loss": 1.6406,
+ "step": 2692
+ },
+ {
+ "epoch": 7.337874659400545,
+ "grad_norm": 15.948305130004883,
+ "learning_rate": 1.9901470606795867e-05,
+ "loss": 1.4795,
+ "step": 2693
+ },
+ {
+ "epoch": 7.340599455040872,
+ "grad_norm": 10.267861366271973,
+ "learning_rate": 1.9901346991264018e-05,
+ "loss": 1.4495,
+ "step": 2694
+ },
+ {
+ "epoch": 7.343324250681199,
+ "grad_norm": 10.505049705505371,
+ "learning_rate": 1.9901223298620793e-05,
+ "loss": 1.4509,
+ "step": 2695
+ },
+ {
+ "epoch": 7.346049046321526,
+ "grad_norm": 10.342820167541504,
+ "learning_rate": 1.9901099528867164e-05,
+ "loss": 1.6152,
+ "step": 2696
+ },
+ {
+ "epoch": 7.348773841961853,
+ "grad_norm": 12.281599998474121,
+ "learning_rate": 1.9900975682004088e-05,
+ "loss": 1.4797,
+ "step": 2697
+ },
+ {
+ "epoch": 7.35149863760218,
+ "grad_norm": 11.366495132446289,
+ "learning_rate": 1.990085175803253e-05,
+ "loss": 1.5854,
+ "step": 2698
+ },
+ {
+ "epoch": 7.354223433242507,
+ "grad_norm": 10.912250518798828,
+ "learning_rate": 1.990072775695346e-05,
+ "loss": 1.5161,
+ "step": 2699
+ },
+ {
+ "epoch": 7.356948228882834,
+ "grad_norm": 12.146465301513672,
+ "learning_rate": 1.990060367876784e-05,
+ "loss": 1.5774,
+ "step": 2700
+ },
+ {
+ "epoch": 7.359673024523161,
+ "grad_norm": 13.08321762084961,
+ "learning_rate": 1.9900479523476637e-05,
+ "loss": 1.5476,
+ "step": 2701
+ },
+ {
+ "epoch": 7.362397820163488,
+ "grad_norm": 11.220298767089844,
+ "learning_rate": 1.9900355291080816e-05,
+ "loss": 1.5044,
+ "step": 2702
+ },
+ {
+ "epoch": 7.3651226158038146,
+ "grad_norm": 13.201688766479492,
+ "learning_rate": 1.990023098158135e-05,
+ "loss": 1.6455,
+ "step": 2703
+ },
+ {
+ "epoch": 7.367847411444142,
+ "grad_norm": 10.523879051208496,
+ "learning_rate": 1.9900106594979204e-05,
+ "loss": 1.5427,
+ "step": 2704
+ },
+ {
+ "epoch": 7.370572207084469,
+ "grad_norm": 11.078397750854492,
+ "learning_rate": 1.9899982131275345e-05,
+ "loss": 1.4673,
+ "step": 2705
+ },
+ {
+ "epoch": 7.3732970027247955,
+ "grad_norm": 12.766281127929688,
+ "learning_rate": 1.9899857590470745e-05,
+ "loss": 1.51,
+ "step": 2706
+ },
+ {
+ "epoch": 7.376021798365123,
+ "grad_norm": 15.339536666870117,
+ "learning_rate": 1.989973297256637e-05,
+ "loss": 1.4934,
+ "step": 2707
+ },
+ {
+ "epoch": 7.37874659400545,
+ "grad_norm": 10.396599769592285,
+ "learning_rate": 1.9899608277563197e-05,
+ "loss": 1.4001,
+ "step": 2708
+ },
+ {
+ "epoch": 7.381471389645776,
+ "grad_norm": 8.053894996643066,
+ "learning_rate": 1.989948350546219e-05,
+ "loss": 1.3518,
+ "step": 2709
+ },
+ {
+ "epoch": 7.384196185286104,
+ "grad_norm": 10.564316749572754,
+ "learning_rate": 1.9899358656264325e-05,
+ "loss": 1.4333,
+ "step": 2710
+ },
+ {
+ "epoch": 7.386920980926431,
+ "grad_norm": 9.205158233642578,
+ "learning_rate": 1.9899233729970576e-05,
+ "loss": 1.2275,
+ "step": 2711
+ },
+ {
+ "epoch": 7.389645776566757,
+ "grad_norm": 10.553511619567871,
+ "learning_rate": 1.9899108726581907e-05,
+ "loss": 1.3894,
+ "step": 2712
+ },
+ {
+ "epoch": 7.392370572207085,
+ "grad_norm": 8.432306289672852,
+ "learning_rate": 1.9898983646099304e-05,
+ "loss": 1.3279,
+ "step": 2713
+ },
+ {
+ "epoch": 7.395095367847412,
+ "grad_norm": 13.820378303527832,
+ "learning_rate": 1.989885848852373e-05,
+ "loss": 1.5513,
+ "step": 2714
+ },
+ {
+ "epoch": 7.397820163487738,
+ "grad_norm": 13.580961227416992,
+ "learning_rate": 1.989873325385617e-05,
+ "loss": 1.4382,
+ "step": 2715
+ },
+ {
+ "epoch": 7.400544959128065,
+ "grad_norm": 10.945294380187988,
+ "learning_rate": 1.989860794209759e-05,
+ "loss": 1.5232,
+ "step": 2716
+ },
+ {
+ "epoch": 7.4032697547683926,
+ "grad_norm": 10.951699256896973,
+ "learning_rate": 1.989848255324897e-05,
+ "loss": 1.564,
+ "step": 2717
+ },
+ {
+ "epoch": 7.405994550408719,
+ "grad_norm": 10.355441093444824,
+ "learning_rate": 1.989835708731129e-05,
+ "loss": 1.3796,
+ "step": 2718
+ },
+ {
+ "epoch": 7.408719346049046,
+ "grad_norm": 9.621257781982422,
+ "learning_rate": 1.9898231544285523e-05,
+ "loss": 1.5391,
+ "step": 2719
+ },
+ {
+ "epoch": 7.4114441416893735,
+ "grad_norm": 11.549651145935059,
+ "learning_rate": 1.9898105924172647e-05,
+ "loss": 1.4773,
+ "step": 2720
+ },
+ {
+ "epoch": 7.4141689373297,
+ "grad_norm": 10.521002769470215,
+ "learning_rate": 1.989798022697364e-05,
+ "loss": 1.2507,
+ "step": 2721
+ },
+ {
+ "epoch": 7.416893732970027,
+ "grad_norm": 12.156377792358398,
+ "learning_rate": 1.989785445268948e-05,
+ "loss": 1.5168,
+ "step": 2722
+ },
+ {
+ "epoch": 7.419618528610354,
+ "grad_norm": 12.271047592163086,
+ "learning_rate": 1.9897728601321148e-05,
+ "loss": 1.6658,
+ "step": 2723
+ },
+ {
+ "epoch": 7.422343324250681,
+ "grad_norm": 9.159317016601562,
+ "learning_rate": 1.9897602672869624e-05,
+ "loss": 1.406,
+ "step": 2724
+ },
+ {
+ "epoch": 7.425068119891008,
+ "grad_norm": 11.248191833496094,
+ "learning_rate": 1.989747666733589e-05,
+ "loss": 1.4246,
+ "step": 2725
+ },
+ {
+ "epoch": 7.427792915531335,
+ "grad_norm": 11.331597328186035,
+ "learning_rate": 1.9897350584720928e-05,
+ "loss": 1.5464,
+ "step": 2726
+ },
+ {
+ "epoch": 7.430517711171662,
+ "grad_norm": 18.228622436523438,
+ "learning_rate": 1.9897224425025716e-05,
+ "loss": 1.4749,
+ "step": 2727
+ },
+ {
+ "epoch": 7.433242506811989,
+ "grad_norm": 10.95228385925293,
+ "learning_rate": 1.9897098188251244e-05,
+ "loss": 1.3252,
+ "step": 2728
+ },
+ {
+ "epoch": 7.435967302452316,
+ "grad_norm": 11.155035018920898,
+ "learning_rate": 1.9896971874398485e-05,
+ "loss": 1.6357,
+ "step": 2729
+ },
+ {
+ "epoch": 7.438692098092643,
+ "grad_norm": 19.57489776611328,
+ "learning_rate": 1.9896845483468424e-05,
+ "loss": 1.5891,
+ "step": 2730
+ },
+ {
+ "epoch": 7.44141689373297,
+ "grad_norm": 11.665769577026367,
+ "learning_rate": 1.9896719015462055e-05,
+ "loss": 1.3945,
+ "step": 2731
+ },
+ {
+ "epoch": 7.444141689373297,
+ "grad_norm": 11.477259635925293,
+ "learning_rate": 1.9896592470380354e-05,
+ "loss": 1.5493,
+ "step": 2732
+ },
+ {
+ "epoch": 7.446866485013624,
+ "grad_norm": 9.968441009521484,
+ "learning_rate": 1.9896465848224312e-05,
+ "loss": 1.5725,
+ "step": 2733
+ },
+ {
+ "epoch": 7.449591280653951,
+ "grad_norm": 11.057966232299805,
+ "learning_rate": 1.9896339148994906e-05,
+ "loss": 1.3958,
+ "step": 2734
+ },
+ {
+ "epoch": 7.452316076294278,
+ "grad_norm": 23.53868865966797,
+ "learning_rate": 1.9896212372693135e-05,
+ "loss": 1.54,
+ "step": 2735
+ },
+ {
+ "epoch": 7.455040871934605,
+ "grad_norm": 12.037323951721191,
+ "learning_rate": 1.9896085519319982e-05,
+ "loss": 1.6038,
+ "step": 2736
+ },
+ {
+ "epoch": 7.4577656675749315,
+ "grad_norm": 10.729537010192871,
+ "learning_rate": 1.989595858887643e-05,
+ "loss": 1.4729,
+ "step": 2737
+ },
+ {
+ "epoch": 7.460490463215259,
+ "grad_norm": 10.37804126739502,
+ "learning_rate": 1.989583158136347e-05,
+ "loss": 1.4558,
+ "step": 2738
+ },
+ {
+ "epoch": 7.463215258855586,
+ "grad_norm": 11.308197975158691,
+ "learning_rate": 1.9895704496782097e-05,
+ "loss": 1.7019,
+ "step": 2739
+ },
+ {
+ "epoch": 7.4659400544959125,
+ "grad_norm": 12.422118186950684,
+ "learning_rate": 1.989557733513329e-05,
+ "loss": 1.4006,
+ "step": 2740
+ },
+ {
+ "epoch": 7.46866485013624,
+ "grad_norm": 14.516019821166992,
+ "learning_rate": 1.989545009641805e-05,
+ "loss": 1.325,
+ "step": 2741
+ },
+ {
+ "epoch": 7.471389645776567,
+ "grad_norm": 20.607149124145508,
+ "learning_rate": 1.9895322780637358e-05,
+ "loss": 1.4851,
+ "step": 2742
+ },
+ {
+ "epoch": 7.474114441416893,
+ "grad_norm": 10.987537384033203,
+ "learning_rate": 1.9895195387792214e-05,
+ "loss": 1.3845,
+ "step": 2743
+ },
+ {
+ "epoch": 7.476839237057221,
+ "grad_norm": 19.764270782470703,
+ "learning_rate": 1.989506791788361e-05,
+ "loss": 1.5945,
+ "step": 2744
+ },
+ {
+ "epoch": 7.479564032697548,
+ "grad_norm": 11.385480880737305,
+ "learning_rate": 1.989494037091253e-05,
+ "loss": 1.5222,
+ "step": 2745
+ },
+ {
+ "epoch": 7.482288828337874,
+ "grad_norm": 14.623588562011719,
+ "learning_rate": 1.9894812746879976e-05,
+ "loss": 1.4697,
+ "step": 2746
+ },
+ {
+ "epoch": 7.485013623978202,
+ "grad_norm": 13.755199432373047,
+ "learning_rate": 1.9894685045786935e-05,
+ "loss": 1.5461,
+ "step": 2747
+ },
+ {
+ "epoch": 7.487738419618529,
+ "grad_norm": 18.120471954345703,
+ "learning_rate": 1.989455726763441e-05,
+ "loss": 1.5591,
+ "step": 2748
+ },
+ {
+ "epoch": 7.490463215258855,
+ "grad_norm": 11.236099243164062,
+ "learning_rate": 1.9894429412423388e-05,
+ "loss": 1.3884,
+ "step": 2749
+ },
+ {
+ "epoch": 7.493188010899183,
+ "grad_norm": 12.378520011901855,
+ "learning_rate": 1.9894301480154873e-05,
+ "loss": 1.522,
+ "step": 2750
+ },
+ {
+ "epoch": 7.4959128065395095,
+ "grad_norm": 11.089034080505371,
+ "learning_rate": 1.9894173470829853e-05,
+ "loss": 1.4741,
+ "step": 2751
+ },
+ {
+ "epoch": 7.498637602179836,
+ "grad_norm": 8.702698707580566,
+ "learning_rate": 1.9894045384449328e-05,
+ "loss": 1.333,
+ "step": 2752
+ },
+ {
+ "epoch": 7.501362397820164,
+ "grad_norm": 9.997475624084473,
+ "learning_rate": 1.9893917221014294e-05,
+ "loss": 1.5024,
+ "step": 2753
+ },
+ {
+ "epoch": 7.5040871934604905,
+ "grad_norm": 10.9384765625,
+ "learning_rate": 1.9893788980525756e-05,
+ "loss": 1.4797,
+ "step": 2754
+ },
+ {
+ "epoch": 7.506811989100817,
+ "grad_norm": 13.521172523498535,
+ "learning_rate": 1.9893660662984705e-05,
+ "loss": 1.4785,
+ "step": 2755
+ },
+ {
+ "epoch": 7.509536784741145,
+ "grad_norm": 10.863540649414062,
+ "learning_rate": 1.9893532268392143e-05,
+ "loss": 1.3005,
+ "step": 2756
+ },
+ {
+ "epoch": 7.512261580381471,
+ "grad_norm": 24.522600173950195,
+ "learning_rate": 1.989340379674907e-05,
+ "loss": 1.6479,
+ "step": 2757
+ },
+ {
+ "epoch": 7.514986376021798,
+ "grad_norm": 11.219182014465332,
+ "learning_rate": 1.989327524805649e-05,
+ "loss": 1.5334,
+ "step": 2758
+ },
+ {
+ "epoch": 7.517711171662126,
+ "grad_norm": 15.490386009216309,
+ "learning_rate": 1.9893146622315398e-05,
+ "loss": 1.6729,
+ "step": 2759
+ },
+ {
+ "epoch": 7.520435967302452,
+ "grad_norm": 15.81369400024414,
+ "learning_rate": 1.9893017919526798e-05,
+ "loss": 1.6035,
+ "step": 2760
+ },
+ {
+ "epoch": 7.523160762942779,
+ "grad_norm": 10.370918273925781,
+ "learning_rate": 1.9892889139691695e-05,
+ "loss": 1.5022,
+ "step": 2761
+ },
+ {
+ "epoch": 7.525885558583107,
+ "grad_norm": 8.687206268310547,
+ "learning_rate": 1.9892760282811085e-05,
+ "loss": 1.7324,
+ "step": 2762
+ },
+ {
+ "epoch": 7.528610354223433,
+ "grad_norm": 19.682769775390625,
+ "learning_rate": 1.989263134888598e-05,
+ "loss": 1.3579,
+ "step": 2763
+ },
+ {
+ "epoch": 7.53133514986376,
+ "grad_norm": 10.744647026062012,
+ "learning_rate": 1.9892502337917382e-05,
+ "loss": 1.5437,
+ "step": 2764
+ },
+ {
+ "epoch": 7.5340599455040875,
+ "grad_norm": 12.050798416137695,
+ "learning_rate": 1.9892373249906292e-05,
+ "loss": 1.418,
+ "step": 2765
+ },
+ {
+ "epoch": 7.536784741144414,
+ "grad_norm": 20.06696319580078,
+ "learning_rate": 1.989224408485372e-05,
+ "loss": 1.7356,
+ "step": 2766
+ },
+ {
+ "epoch": 7.539509536784741,
+ "grad_norm": 10.467229843139648,
+ "learning_rate": 1.9892114842760666e-05,
+ "loss": 1.4651,
+ "step": 2767
+ },
+ {
+ "epoch": 7.5422343324250685,
+ "grad_norm": 10.829195976257324,
+ "learning_rate": 1.9891985523628142e-05,
+ "loss": 1.7073,
+ "step": 2768
+ },
+ {
+ "epoch": 7.544959128065395,
+ "grad_norm": 16.316389083862305,
+ "learning_rate": 1.9891856127457152e-05,
+ "loss": 1.4178,
+ "step": 2769
+ },
+ {
+ "epoch": 7.547683923705722,
+ "grad_norm": 9.75391674041748,
+ "learning_rate": 1.9891726654248705e-05,
+ "loss": 1.4985,
+ "step": 2770
+ },
+ {
+ "epoch": 7.550408719346049,
+ "grad_norm": 11.315629959106445,
+ "learning_rate": 1.9891597104003807e-05,
+ "loss": 1.5781,
+ "step": 2771
+ },
+ {
+ "epoch": 7.553133514986376,
+ "grad_norm": 12.688879013061523,
+ "learning_rate": 1.9891467476723472e-05,
+ "loss": 1.5378,
+ "step": 2772
+ },
+ {
+ "epoch": 7.555858310626703,
+ "grad_norm": 10.304753303527832,
+ "learning_rate": 1.9891337772408706e-05,
+ "loss": 1.4124,
+ "step": 2773
+ },
+ {
+ "epoch": 7.55858310626703,
+ "grad_norm": 20.072845458984375,
+ "learning_rate": 1.9891207991060525e-05,
+ "loss": 1.489,
+ "step": 2774
+ },
+ {
+ "epoch": 7.561307901907357,
+ "grad_norm": 10.624418258666992,
+ "learning_rate": 1.989107813267993e-05,
+ "loss": 1.5132,
+ "step": 2775
+ },
+ {
+ "epoch": 7.564032697547684,
+ "grad_norm": 11.695839881896973,
+ "learning_rate": 1.9890948197267933e-05,
+ "loss": 1.4905,
+ "step": 2776
+ },
+ {
+ "epoch": 7.566757493188011,
+ "grad_norm": 9.317418098449707,
+ "learning_rate": 1.9890818184825552e-05,
+ "loss": 1.3589,
+ "step": 2777
+ },
+ {
+ "epoch": 7.569482288828338,
+ "grad_norm": 11.279376029968262,
+ "learning_rate": 1.9890688095353802e-05,
+ "loss": 1.4741,
+ "step": 2778
+ },
+ {
+ "epoch": 7.572207084468665,
+ "grad_norm": 12.635177612304688,
+ "learning_rate": 1.9890557928853685e-05,
+ "loss": 1.4634,
+ "step": 2779
+ },
+ {
+ "epoch": 7.574931880108992,
+ "grad_norm": 12.164665222167969,
+ "learning_rate": 1.9890427685326225e-05,
+ "loss": 1.7129,
+ "step": 2780
+ },
+ {
+ "epoch": 7.577656675749319,
+ "grad_norm": 11.033668518066406,
+ "learning_rate": 1.989029736477243e-05,
+ "loss": 1.5864,
+ "step": 2781
+ },
+ {
+ "epoch": 7.580381471389646,
+ "grad_norm": 13.097576141357422,
+ "learning_rate": 1.989016696719332e-05,
+ "loss": 1.3496,
+ "step": 2782
+ },
+ {
+ "epoch": 7.583106267029972,
+ "grad_norm": 12.860251426696777,
+ "learning_rate": 1.989003649258991e-05,
+ "loss": 1.5066,
+ "step": 2783
+ },
+ {
+ "epoch": 7.5858310626703,
+ "grad_norm": 22.703773498535156,
+ "learning_rate": 1.988990594096321e-05,
+ "loss": 1.5422,
+ "step": 2784
+ },
+ {
+ "epoch": 7.5885558583106265,
+ "grad_norm": 10.591668128967285,
+ "learning_rate": 1.988977531231424e-05,
+ "loss": 1.3936,
+ "step": 2785
+ },
+ {
+ "epoch": 7.591280653950953,
+ "grad_norm": 11.378451347351074,
+ "learning_rate": 1.988964460664402e-05,
+ "loss": 1.4924,
+ "step": 2786
+ },
+ {
+ "epoch": 7.594005449591281,
+ "grad_norm": 18.895544052124023,
+ "learning_rate": 1.9889513823953568e-05,
+ "loss": 1.5862,
+ "step": 2787
+ },
+ {
+ "epoch": 7.5967302452316074,
+ "grad_norm": 12.089540481567383,
+ "learning_rate": 1.9889382964243896e-05,
+ "loss": 1.5552,
+ "step": 2788
+ },
+ {
+ "epoch": 7.599455040871934,
+ "grad_norm": 10.115679740905762,
+ "learning_rate": 1.9889252027516033e-05,
+ "loss": 1.4866,
+ "step": 2789
+ },
+ {
+ "epoch": 7.602179836512262,
+ "grad_norm": 10.996835708618164,
+ "learning_rate": 1.988912101377099e-05,
+ "loss": 1.4475,
+ "step": 2790
+ },
+ {
+ "epoch": 7.604904632152588,
+ "grad_norm": 10.201013565063477,
+ "learning_rate": 1.9888989923009792e-05,
+ "loss": 1.5649,
+ "step": 2791
+ },
+ {
+ "epoch": 7.607629427792915,
+ "grad_norm": 12.061447143554688,
+ "learning_rate": 1.988885875523346e-05,
+ "loss": 1.6538,
+ "step": 2792
+ },
+ {
+ "epoch": 7.610354223433243,
+ "grad_norm": 13.327852249145508,
+ "learning_rate": 1.988872751044301e-05,
+ "loss": 1.3782,
+ "step": 2793
+ },
+ {
+ "epoch": 7.613079019073569,
+ "grad_norm": 11.921119689941406,
+ "learning_rate": 1.9888596188639476e-05,
+ "loss": 1.5273,
+ "step": 2794
+ },
+ {
+ "epoch": 7.615803814713896,
+ "grad_norm": 9.655643463134766,
+ "learning_rate": 1.9888464789823867e-05,
+ "loss": 1.4753,
+ "step": 2795
+ },
+ {
+ "epoch": 7.618528610354224,
+ "grad_norm": 13.065455436706543,
+ "learning_rate": 1.9888333313997212e-05,
+ "loss": 1.4873,
+ "step": 2796
+ },
+ {
+ "epoch": 7.62125340599455,
+ "grad_norm": 18.854360580444336,
+ "learning_rate": 1.988820176116054e-05,
+ "loss": 1.4998,
+ "step": 2797
+ },
+ {
+ "epoch": 7.623978201634877,
+ "grad_norm": 12.455496788024902,
+ "learning_rate": 1.988807013131487e-05,
+ "loss": 1.5913,
+ "step": 2798
+ },
+ {
+ "epoch": 7.6267029972752045,
+ "grad_norm": 10.86870288848877,
+ "learning_rate": 1.9887938424461224e-05,
+ "loss": 1.2312,
+ "step": 2799
+ },
+ {
+ "epoch": 7.629427792915531,
+ "grad_norm": 13.03520393371582,
+ "learning_rate": 1.9887806640600633e-05,
+ "loss": 1.5659,
+ "step": 2800
+ },
+ {
+ "epoch": 7.632152588555858,
+ "grad_norm": 13.637677192687988,
+ "learning_rate": 1.9887674779734125e-05,
+ "loss": 1.3696,
+ "step": 2801
+ },
+ {
+ "epoch": 7.6348773841961854,
+ "grad_norm": 18.14453125,
+ "learning_rate": 1.9887542841862723e-05,
+ "loss": 1.7529,
+ "step": 2802
+ },
+ {
+ "epoch": 7.637602179836512,
+ "grad_norm": 11.575101852416992,
+ "learning_rate": 1.9887410826987455e-05,
+ "loss": 1.4529,
+ "step": 2803
+ },
+ {
+ "epoch": 7.640326975476839,
+ "grad_norm": 11.00442123413086,
+ "learning_rate": 1.988727873510935e-05,
+ "loss": 1.3838,
+ "step": 2804
+ },
+ {
+ "epoch": 7.643051771117166,
+ "grad_norm": 12.96632194519043,
+ "learning_rate": 1.9887146566229437e-05,
+ "loss": 1.6182,
+ "step": 2805
+ },
+ {
+ "epoch": 7.645776566757493,
+ "grad_norm": 10.884385108947754,
+ "learning_rate": 1.988701432034874e-05,
+ "loss": 1.2805,
+ "step": 2806
+ },
+ {
+ "epoch": 7.64850136239782,
+ "grad_norm": 10.20749282836914,
+ "learning_rate": 1.9886881997468298e-05,
+ "loss": 1.5005,
+ "step": 2807
+ },
+ {
+ "epoch": 7.651226158038147,
+ "grad_norm": 10.603687286376953,
+ "learning_rate": 1.988674959758914e-05,
+ "loss": 1.4885,
+ "step": 2808
+ },
+ {
+ "epoch": 7.653950953678474,
+ "grad_norm": 13.288247108459473,
+ "learning_rate": 1.988661712071229e-05,
+ "loss": 1.5601,
+ "step": 2809
+ },
+ {
+ "epoch": 7.656675749318801,
+ "grad_norm": 13.069999694824219,
+ "learning_rate": 1.9886484566838785e-05,
+ "loss": 1.5508,
+ "step": 2810
+ },
+ {
+ "epoch": 7.659400544959128,
+ "grad_norm": 10.288311004638672,
+ "learning_rate": 1.9886351935969658e-05,
+ "loss": 1.5603,
+ "step": 2811
+ },
+ {
+ "epoch": 7.662125340599455,
+ "grad_norm": 11.068655014038086,
+ "learning_rate": 1.9886219228105937e-05,
+ "loss": 1.6333,
+ "step": 2812
+ },
+ {
+ "epoch": 7.664850136239782,
+ "grad_norm": 11.532331466674805,
+ "learning_rate": 1.9886086443248663e-05,
+ "loss": 1.479,
+ "step": 2813
+ },
+ {
+ "epoch": 7.667574931880109,
+ "grad_norm": 10.423901557922363,
+ "learning_rate": 1.9885953581398862e-05,
+ "loss": 1.511,
+ "step": 2814
+ },
+ {
+ "epoch": 7.670299727520436,
+ "grad_norm": 15.353683471679688,
+ "learning_rate": 1.9885820642557574e-05,
+ "loss": 1.5251,
+ "step": 2815
+ },
+ {
+ "epoch": 7.6730245231607626,
+ "grad_norm": 24.267702102661133,
+ "learning_rate": 1.9885687626725833e-05,
+ "loss": 1.5012,
+ "step": 2816
+ },
+ {
+ "epoch": 7.67574931880109,
+ "grad_norm": 11.486735343933105,
+ "learning_rate": 1.9885554533904673e-05,
+ "loss": 1.5339,
+ "step": 2817
+ },
+ {
+ "epoch": 7.678474114441417,
+ "grad_norm": 21.975114822387695,
+ "learning_rate": 1.988542136409514e-05,
+ "loss": 1.4797,
+ "step": 2818
+ },
+ {
+ "epoch": 7.6811989100817435,
+ "grad_norm": 17.301342010498047,
+ "learning_rate": 1.9885288117298256e-05,
+ "loss": 1.2908,
+ "step": 2819
+ },
+ {
+ "epoch": 7.683923705722071,
+ "grad_norm": 16.25150489807129,
+ "learning_rate": 1.9885154793515066e-05,
+ "loss": 1.5159,
+ "step": 2820
+ },
+ {
+ "epoch": 7.686648501362398,
+ "grad_norm": 10.66357421875,
+ "learning_rate": 1.9885021392746614e-05,
+ "loss": 1.2976,
+ "step": 2821
+ },
+ {
+ "epoch": 7.689373297002724,
+ "grad_norm": 11.739712715148926,
+ "learning_rate": 1.9884887914993932e-05,
+ "loss": 1.5776,
+ "step": 2822
+ },
+ {
+ "epoch": 7.692098092643052,
+ "grad_norm": 13.113489151000977,
+ "learning_rate": 1.9884754360258058e-05,
+ "loss": 1.6941,
+ "step": 2823
+ },
+ {
+ "epoch": 7.694822888283379,
+ "grad_norm": 12.707517623901367,
+ "learning_rate": 1.9884620728540035e-05,
+ "loss": 1.4915,
+ "step": 2824
+ },
+ {
+ "epoch": 7.697547683923705,
+ "grad_norm": 11.471800804138184,
+ "learning_rate": 1.9884487019840907e-05,
+ "loss": 1.5256,
+ "step": 2825
+ },
+ {
+ "epoch": 7.700272479564033,
+ "grad_norm": 11.221733093261719,
+ "learning_rate": 1.9884353234161713e-05,
+ "loss": 1.4993,
+ "step": 2826
+ },
+ {
+ "epoch": 7.70299727520436,
+ "grad_norm": 11.2644681930542,
+ "learning_rate": 1.988421937150349e-05,
+ "loss": 1.3865,
+ "step": 2827
+ },
+ {
+ "epoch": 7.705722070844686,
+ "grad_norm": 11.004400253295898,
+ "learning_rate": 1.9884085431867287e-05,
+ "loss": 1.4805,
+ "step": 2828
+ },
+ {
+ "epoch": 7.708446866485014,
+ "grad_norm": 11.438688278198242,
+ "learning_rate": 1.9883951415254146e-05,
+ "loss": 1.5256,
+ "step": 2829
+ },
+ {
+ "epoch": 7.7111716621253406,
+ "grad_norm": 10.083905220031738,
+ "learning_rate": 1.988381732166511e-05,
+ "loss": 1.3486,
+ "step": 2830
+ },
+ {
+ "epoch": 7.713896457765667,
+ "grad_norm": 9.939655303955078,
+ "learning_rate": 1.988368315110122e-05,
+ "loss": 1.3533,
+ "step": 2831
+ },
+ {
+ "epoch": 7.716621253405995,
+ "grad_norm": 14.37730884552002,
+ "learning_rate": 1.9883548903563525e-05,
+ "loss": 1.5068,
+ "step": 2832
+ },
+ {
+ "epoch": 7.7193460490463215,
+ "grad_norm": 12.536720275878906,
+ "learning_rate": 1.988341457905307e-05,
+ "loss": 1.4836,
+ "step": 2833
+ },
+ {
+ "epoch": 7.722070844686648,
+ "grad_norm": 13.156996726989746,
+ "learning_rate": 1.9883280177570898e-05,
+ "loss": 1.7607,
+ "step": 2834
+ },
+ {
+ "epoch": 7.724795640326976,
+ "grad_norm": 11.064411163330078,
+ "learning_rate": 1.988314569911806e-05,
+ "loss": 1.3481,
+ "step": 2835
+ },
+ {
+ "epoch": 7.727520435967302,
+ "grad_norm": 15.014034271240234,
+ "learning_rate": 1.98830111436956e-05,
+ "loss": 1.4448,
+ "step": 2836
+ },
+ {
+ "epoch": 7.730245231607629,
+ "grad_norm": 13.946884155273438,
+ "learning_rate": 1.988287651130457e-05,
+ "loss": 1.7812,
+ "step": 2837
+ },
+ {
+ "epoch": 7.732970027247957,
+ "grad_norm": 10.989984512329102,
+ "learning_rate": 1.9882741801946014e-05,
+ "loss": 1.4023,
+ "step": 2838
+ },
+ {
+ "epoch": 7.735694822888283,
+ "grad_norm": 12.584571838378906,
+ "learning_rate": 1.988260701562098e-05,
+ "loss": 1.645,
+ "step": 2839
+ },
+ {
+ "epoch": 7.73841961852861,
+ "grad_norm": 11.218289375305176,
+ "learning_rate": 1.9882472152330522e-05,
+ "loss": 1.5212,
+ "step": 2840
+ },
+ {
+ "epoch": 7.741144414168938,
+ "grad_norm": 10.804743766784668,
+ "learning_rate": 1.9882337212075693e-05,
+ "loss": 1.3257,
+ "step": 2841
+ },
+ {
+ "epoch": 7.743869209809264,
+ "grad_norm": 31.348562240600586,
+ "learning_rate": 1.9882202194857537e-05,
+ "loss": 1.5823,
+ "step": 2842
+ },
+ {
+ "epoch": 7.746594005449591,
+ "grad_norm": 10.572625160217285,
+ "learning_rate": 1.988206710067711e-05,
+ "loss": 1.3733,
+ "step": 2843
+ },
+ {
+ "epoch": 7.7493188010899186,
+ "grad_norm": 10.134716987609863,
+ "learning_rate": 1.9881931929535462e-05,
+ "loss": 1.4509,
+ "step": 2844
+ },
+ {
+ "epoch": 7.752043596730245,
+ "grad_norm": 16.209062576293945,
+ "learning_rate": 1.988179668143364e-05,
+ "loss": 1.5938,
+ "step": 2845
+ },
+ {
+ "epoch": 7.754768392370572,
+ "grad_norm": 9.616616249084473,
+ "learning_rate": 1.988166135637271e-05,
+ "loss": 1.5181,
+ "step": 2846
+ },
+ {
+ "epoch": 7.7574931880108995,
+ "grad_norm": 16.432865142822266,
+ "learning_rate": 1.988152595435372e-05,
+ "loss": 1.8037,
+ "step": 2847
+ },
+ {
+ "epoch": 7.760217983651226,
+ "grad_norm": 11.593768119812012,
+ "learning_rate": 1.988139047537772e-05,
+ "loss": 1.4939,
+ "step": 2848
+ },
+ {
+ "epoch": 7.762942779291553,
+ "grad_norm": 11.875847816467285,
+ "learning_rate": 1.9881254919445773e-05,
+ "loss": 1.5664,
+ "step": 2849
+ },
+ {
+ "epoch": 7.76566757493188,
+ "grad_norm": 12.916208267211914,
+ "learning_rate": 1.9881119286558927e-05,
+ "loss": 1.4985,
+ "step": 2850
+ },
+ {
+ "epoch": 7.768392370572207,
+ "grad_norm": 10.447370529174805,
+ "learning_rate": 1.9880983576718247e-05,
+ "loss": 1.5913,
+ "step": 2851
+ },
+ {
+ "epoch": 7.771117166212534,
+ "grad_norm": 25.152677536010742,
+ "learning_rate": 1.988084778992478e-05,
+ "loss": 1.3577,
+ "step": 2852
+ },
+ {
+ "epoch": 7.773841961852861,
+ "grad_norm": 20.927114486694336,
+ "learning_rate": 1.988071192617959e-05,
+ "loss": 1.679,
+ "step": 2853
+ },
+ {
+ "epoch": 7.776566757493188,
+ "grad_norm": 14.398178100585938,
+ "learning_rate": 1.9880575985483734e-05,
+ "loss": 1.73,
+ "step": 2854
+ },
+ {
+ "epoch": 7.779291553133515,
+ "grad_norm": 12.64029312133789,
+ "learning_rate": 1.988043996783827e-05,
+ "loss": 1.3472,
+ "step": 2855
+ },
+ {
+ "epoch": 7.782016348773842,
+ "grad_norm": 16.54973793029785,
+ "learning_rate": 1.9880303873244258e-05,
+ "loss": 1.6577,
+ "step": 2856
+ },
+ {
+ "epoch": 7.784741144414169,
+ "grad_norm": 13.682854652404785,
+ "learning_rate": 1.9880167701702757e-05,
+ "loss": 1.5327,
+ "step": 2857
+ },
+ {
+ "epoch": 7.787465940054496,
+ "grad_norm": 45.27207946777344,
+ "learning_rate": 1.988003145321483e-05,
+ "loss": 1.6543,
+ "step": 2858
+ },
+ {
+ "epoch": 7.790190735694823,
+ "grad_norm": 11.389158248901367,
+ "learning_rate": 1.9879895127781533e-05,
+ "loss": 1.2905,
+ "step": 2859
+ },
+ {
+ "epoch": 7.79291553133515,
+ "grad_norm": 10.155439376831055,
+ "learning_rate": 1.987975872540393e-05,
+ "loss": 1.5613,
+ "step": 2860
+ },
+ {
+ "epoch": 7.795640326975477,
+ "grad_norm": 19.872411727905273,
+ "learning_rate": 1.9879622246083087e-05,
+ "loss": 1.3677,
+ "step": 2861
+ },
+ {
+ "epoch": 7.798365122615804,
+ "grad_norm": 15.025500297546387,
+ "learning_rate": 1.987948568982006e-05,
+ "loss": 1.5881,
+ "step": 2862
+ },
+ {
+ "epoch": 7.801089918256131,
+ "grad_norm": 11.375299453735352,
+ "learning_rate": 1.987934905661592e-05,
+ "loss": 1.4883,
+ "step": 2863
+ },
+ {
+ "epoch": 7.8038147138964575,
+ "grad_norm": 21.228652954101562,
+ "learning_rate": 1.9879212346471726e-05,
+ "loss": 1.6218,
+ "step": 2864
+ },
+ {
+ "epoch": 7.806539509536785,
+ "grad_norm": 12.07156753540039,
+ "learning_rate": 1.9879075559388547e-05,
+ "loss": 1.4431,
+ "step": 2865
+ },
+ {
+ "epoch": 7.809264305177112,
+ "grad_norm": 11.72398853302002,
+ "learning_rate": 1.9878938695367444e-05,
+ "loss": 1.373,
+ "step": 2866
+ },
+ {
+ "epoch": 7.8119891008174385,
+ "grad_norm": 13.358327865600586,
+ "learning_rate": 1.987880175440948e-05,
+ "loss": 1.3994,
+ "step": 2867
+ },
+ {
+ "epoch": 7.814713896457766,
+ "grad_norm": 13.322922706604004,
+ "learning_rate": 1.9878664736515732e-05,
+ "loss": 1.5703,
+ "step": 2868
+ },
+ {
+ "epoch": 7.817438692098093,
+ "grad_norm": 17.724384307861328,
+ "learning_rate": 1.9878527641687255e-05,
+ "loss": 1.376,
+ "step": 2869
+ },
+ {
+ "epoch": 7.820163487738419,
+ "grad_norm": 10.315452575683594,
+ "learning_rate": 1.987839046992513e-05,
+ "loss": 1.4697,
+ "step": 2870
+ },
+ {
+ "epoch": 7.822888283378747,
+ "grad_norm": 18.188642501831055,
+ "learning_rate": 1.9878253221230414e-05,
+ "loss": 1.835,
+ "step": 2871
+ },
+ {
+ "epoch": 7.825613079019074,
+ "grad_norm": 11.028203964233398,
+ "learning_rate": 1.9878115895604178e-05,
+ "loss": 1.4543,
+ "step": 2872
+ },
+ {
+ "epoch": 7.8283378746594,
+ "grad_norm": 10.556264877319336,
+ "learning_rate": 1.9877978493047496e-05,
+ "loss": 1.3467,
+ "step": 2873
+ },
+ {
+ "epoch": 7.831062670299728,
+ "grad_norm": 11.126514434814453,
+ "learning_rate": 1.987784101356143e-05,
+ "loss": 1.4661,
+ "step": 2874
+ },
+ {
+ "epoch": 7.833787465940055,
+ "grad_norm": 12.39341926574707,
+ "learning_rate": 1.9877703457147062e-05,
+ "loss": 1.4817,
+ "step": 2875
+ },
+ {
+ "epoch": 7.836512261580381,
+ "grad_norm": 15.889671325683594,
+ "learning_rate": 1.987756582380546e-05,
+ "loss": 1.5522,
+ "step": 2876
+ },
+ {
+ "epoch": 7.839237057220709,
+ "grad_norm": 39.488895416259766,
+ "learning_rate": 1.9877428113537686e-05,
+ "loss": 1.582,
+ "step": 2877
+ },
+ {
+ "epoch": 7.8419618528610355,
+ "grad_norm": 24.53476333618164,
+ "learning_rate": 1.9877290326344826e-05,
+ "loss": 1.5332,
+ "step": 2878
+ },
+ {
+ "epoch": 7.844686648501362,
+ "grad_norm": 15.040446281433105,
+ "learning_rate": 1.987715246222794e-05,
+ "loss": 1.6968,
+ "step": 2879
+ },
+ {
+ "epoch": 7.84741144414169,
+ "grad_norm": 18.096458435058594,
+ "learning_rate": 1.9877014521188115e-05,
+ "loss": 1.6333,
+ "step": 2880
+ },
+ {
+ "epoch": 7.8501362397820165,
+ "grad_norm": 12.122450828552246,
+ "learning_rate": 1.9876876503226418e-05,
+ "loss": 1.502,
+ "step": 2881
+ },
+ {
+ "epoch": 7.852861035422343,
+ "grad_norm": 12.410628318786621,
+ "learning_rate": 1.987673840834392e-05,
+ "loss": 1.3496,
+ "step": 2882
+ },
+ {
+ "epoch": 7.855585831062671,
+ "grad_norm": 11.923356056213379,
+ "learning_rate": 1.9876600236541705e-05,
+ "loss": 1.4607,
+ "step": 2883
+ },
+ {
+ "epoch": 7.858310626702997,
+ "grad_norm": 19.3748779296875,
+ "learning_rate": 1.9876461987820847e-05,
+ "loss": 1.5439,
+ "step": 2884
+ },
+ {
+ "epoch": 7.861035422343324,
+ "grad_norm": 17.764400482177734,
+ "learning_rate": 1.9876323662182417e-05,
+ "loss": 1.4241,
+ "step": 2885
+ },
+ {
+ "epoch": 7.863760217983652,
+ "grad_norm": 18.320411682128906,
+ "learning_rate": 1.9876185259627498e-05,
+ "loss": 1.6548,
+ "step": 2886
+ },
+ {
+ "epoch": 7.866485013623978,
+ "grad_norm": 650.7084350585938,
+ "learning_rate": 1.987604678015716e-05,
+ "loss": 1.6074,
+ "step": 2887
+ },
+ {
+ "epoch": 7.869209809264305,
+ "grad_norm": 19.571046829223633,
+ "learning_rate": 1.9875908223772497e-05,
+ "loss": 1.6182,
+ "step": 2888
+ },
+ {
+ "epoch": 7.871934604904633,
+ "grad_norm": 17.87520980834961,
+ "learning_rate": 1.9875769590474574e-05,
+ "loss": 1.4395,
+ "step": 2889
+ },
+ {
+ "epoch": 7.874659400544959,
+ "grad_norm": 38.276268005371094,
+ "learning_rate": 1.9875630880264474e-05,
+ "loss": 2.0103,
+ "step": 2890
+ },
+ {
+ "epoch": 7.877384196185286,
+ "grad_norm": 36.80160903930664,
+ "learning_rate": 1.987549209314328e-05,
+ "loss": 1.8755,
+ "step": 2891
+ },
+ {
+ "epoch": 7.8801089918256135,
+ "grad_norm": 20.255399703979492,
+ "learning_rate": 1.9875353229112076e-05,
+ "loss": 1.7363,
+ "step": 2892
+ },
+ {
+ "epoch": 7.88283378746594,
+ "grad_norm": 18.29572868347168,
+ "learning_rate": 1.9875214288171932e-05,
+ "loss": 1.6235,
+ "step": 2893
+ },
+ {
+ "epoch": 7.885558583106267,
+ "grad_norm": 26.875980377197266,
+ "learning_rate": 1.9875075270323942e-05,
+ "loss": 1.978,
+ "step": 2894
+ },
+ {
+ "epoch": 7.8882833787465945,
+ "grad_norm": 18.455490112304688,
+ "learning_rate": 1.9874936175569178e-05,
+ "loss": 1.8594,
+ "step": 2895
+ },
+ {
+ "epoch": 7.891008174386921,
+ "grad_norm": 22.575532913208008,
+ "learning_rate": 1.9874797003908735e-05,
+ "loss": 2.0298,
+ "step": 2896
+ },
+ {
+ "epoch": 7.893732970027248,
+ "grad_norm": 19.369121551513672,
+ "learning_rate": 1.9874657755343688e-05,
+ "loss": 1.7678,
+ "step": 2897
+ },
+ {
+ "epoch": 7.896457765667575,
+ "grad_norm": 15.469361305236816,
+ "learning_rate": 1.9874518429875126e-05,
+ "loss": 1.7583,
+ "step": 2898
+ },
+ {
+ "epoch": 7.899182561307902,
+ "grad_norm": 19.114458084106445,
+ "learning_rate": 1.987437902750413e-05,
+ "loss": 1.7402,
+ "step": 2899
+ },
+ {
+ "epoch": 7.901907356948229,
+ "grad_norm": 16.01736068725586,
+ "learning_rate": 1.9874239548231786e-05,
+ "loss": 1.6477,
+ "step": 2900
+ },
+ {
+ "epoch": 7.904632152588556,
+ "grad_norm": 12.80774211883545,
+ "learning_rate": 1.9874099992059185e-05,
+ "loss": 1.9751,
+ "step": 2901
+ },
+ {
+ "epoch": 7.907356948228883,
+ "grad_norm": 13.939897537231445,
+ "learning_rate": 1.9873960358987414e-05,
+ "loss": 1.7957,
+ "step": 2902
+ },
+ {
+ "epoch": 7.91008174386921,
+ "grad_norm": 10.73560905456543,
+ "learning_rate": 1.9873820649017553e-05,
+ "loss": 1.7783,
+ "step": 2903
+ },
+ {
+ "epoch": 7.912806539509537,
+ "grad_norm": 11.912135124206543,
+ "learning_rate": 1.9873680862150694e-05,
+ "loss": 1.6841,
+ "step": 2904
+ },
+ {
+ "epoch": 7.915531335149864,
+ "grad_norm": 14.469831466674805,
+ "learning_rate": 1.9873540998387928e-05,
+ "loss": 1.7317,
+ "step": 2905
+ },
+ {
+ "epoch": 7.918256130790191,
+ "grad_norm": 12.055585861206055,
+ "learning_rate": 1.9873401057730345e-05,
+ "loss": 1.6538,
+ "step": 2906
+ },
+ {
+ "epoch": 7.920980926430518,
+ "grad_norm": 17.054702758789062,
+ "learning_rate": 1.987326104017903e-05,
+ "loss": 1.843,
+ "step": 2907
+ },
+ {
+ "epoch": 7.923705722070845,
+ "grad_norm": 10.581183433532715,
+ "learning_rate": 1.9873120945735073e-05,
+ "loss": 1.9011,
+ "step": 2908
+ },
+ {
+ "epoch": 7.926430517711172,
+ "grad_norm": 11.802868843078613,
+ "learning_rate": 1.9872980774399573e-05,
+ "loss": 1.6802,
+ "step": 2909
+ },
+ {
+ "epoch": 7.929155313351498,
+ "grad_norm": 11.520299911499023,
+ "learning_rate": 1.987284052617361e-05,
+ "loss": 1.4148,
+ "step": 2910
+ },
+ {
+ "epoch": 7.931880108991826,
+ "grad_norm": 11.749201774597168,
+ "learning_rate": 1.9872700201058287e-05,
+ "loss": 1.7168,
+ "step": 2911
+ },
+ {
+ "epoch": 7.9346049046321525,
+ "grad_norm": 12.393478393554688,
+ "learning_rate": 1.9872559799054695e-05,
+ "loss": 1.7373,
+ "step": 2912
+ },
+ {
+ "epoch": 7.937329700272479,
+ "grad_norm": 10.606557846069336,
+ "learning_rate": 1.9872419320163924e-05,
+ "loss": 1.6995,
+ "step": 2913
+ },
+ {
+ "epoch": 7.940054495912807,
+ "grad_norm": 13.502483367919922,
+ "learning_rate": 1.9872278764387064e-05,
+ "loss": 1.5396,
+ "step": 2914
+ },
+ {
+ "epoch": 7.9427792915531334,
+ "grad_norm": 10.935478210449219,
+ "learning_rate": 1.987213813172522e-05,
+ "loss": 1.5857,
+ "step": 2915
+ },
+ {
+ "epoch": 7.94550408719346,
+ "grad_norm": 11.298049926757812,
+ "learning_rate": 1.987199742217948e-05,
+ "loss": 1.5662,
+ "step": 2916
+ },
+ {
+ "epoch": 7.948228882833788,
+ "grad_norm": 9.997447967529297,
+ "learning_rate": 1.987185663575094e-05,
+ "loss": 1.5146,
+ "step": 2917
+ },
+ {
+ "epoch": 7.950953678474114,
+ "grad_norm": 14.285991668701172,
+ "learning_rate": 1.98717157724407e-05,
+ "loss": 1.5615,
+ "step": 2918
+ },
+ {
+ "epoch": 7.953678474114441,
+ "grad_norm": 14.525003433227539,
+ "learning_rate": 1.9871574832249858e-05,
+ "loss": 1.5081,
+ "step": 2919
+ },
+ {
+ "epoch": 7.956403269754769,
+ "grad_norm": 13.308977127075195,
+ "learning_rate": 1.9871433815179505e-05,
+ "loss": 1.4858,
+ "step": 2920
+ },
+ {
+ "epoch": 7.959128065395095,
+ "grad_norm": 11.913995742797852,
+ "learning_rate": 1.9871292721230745e-05,
+ "loss": 1.439,
+ "step": 2921
+ },
+ {
+ "epoch": 7.961852861035422,
+ "grad_norm": 15.985111236572266,
+ "learning_rate": 1.9871151550404675e-05,
+ "loss": 1.6733,
+ "step": 2922
+ },
+ {
+ "epoch": 7.96457765667575,
+ "grad_norm": 11.745784759521484,
+ "learning_rate": 1.9871010302702393e-05,
+ "loss": 1.7202,
+ "step": 2923
+ },
+ {
+ "epoch": 7.967302452316076,
+ "grad_norm": 20.185394287109375,
+ "learning_rate": 1.9870868978125003e-05,
+ "loss": 1.749,
+ "step": 2924
+ },
+ {
+ "epoch": 7.970027247956403,
+ "grad_norm": 10.806917190551758,
+ "learning_rate": 1.98707275766736e-05,
+ "loss": 1.4927,
+ "step": 2925
+ },
+ {
+ "epoch": 7.9727520435967305,
+ "grad_norm": 11.449009895324707,
+ "learning_rate": 1.9870586098349288e-05,
+ "loss": 1.4761,
+ "step": 2926
+ },
+ {
+ "epoch": 7.975476839237057,
+ "grad_norm": 9.038079261779785,
+ "learning_rate": 1.987044454315317e-05,
+ "loss": 1.688,
+ "step": 2927
+ },
+ {
+ "epoch": 7.978201634877384,
+ "grad_norm": 14.575750350952148,
+ "learning_rate": 1.987030291108635e-05,
+ "loss": 1.6382,
+ "step": 2928
+ },
+ {
+ "epoch": 7.9809264305177114,
+ "grad_norm": 10.708087921142578,
+ "learning_rate": 1.987016120214993e-05,
+ "loss": 1.7874,
+ "step": 2929
+ },
+ {
+ "epoch": 7.983651226158038,
+ "grad_norm": 14.858932495117188,
+ "learning_rate": 1.9870019416345008e-05,
+ "loss": 1.7944,
+ "step": 2930
+ },
+ {
+ "epoch": 7.986376021798365,
+ "grad_norm": 13.036943435668945,
+ "learning_rate": 1.9869877553672693e-05,
+ "loss": 1.5779,
+ "step": 2931
+ },
+ {
+ "epoch": 7.989100817438692,
+ "grad_norm": 10.370837211608887,
+ "learning_rate": 1.9869735614134092e-05,
+ "loss": 1.6997,
+ "step": 2932
+ },
+ {
+ "epoch": 7.991825613079019,
+ "grad_norm": 18.72672462463379,
+ "learning_rate": 1.9869593597730305e-05,
+ "loss": 1.4355,
+ "step": 2933
+ },
+ {
+ "epoch": 7.994550408719346,
+ "grad_norm": 12.96975040435791,
+ "learning_rate": 1.986945150446244e-05,
+ "loss": 1.3271,
+ "step": 2934
+ },
+ {
+ "epoch": 7.997275204359673,
+ "grad_norm": 16.942413330078125,
+ "learning_rate": 1.9869309334331606e-05,
+ "loss": 1.7856,
+ "step": 2935
+ },
+ {
+ "epoch": 8.0,
+ "grad_norm": 14.696255683898926,
+ "learning_rate": 1.9869167087338908e-05,
+ "loss": 1.6475,
+ "step": 2936
+ },
+ {
+ "epoch": 8.002724795640328,
+ "grad_norm": 10.834300994873047,
+ "learning_rate": 1.9869024763485454e-05,
+ "loss": 1.623,
+ "step": 2937
+ },
+ {
+ "epoch": 8.005449591280653,
+ "grad_norm": 11.849433898925781,
+ "learning_rate": 1.9868882362772356e-05,
+ "loss": 1.5503,
+ "step": 2938
+ },
+ {
+ "epoch": 8.008174386920981,
+ "grad_norm": 9.379240036010742,
+ "learning_rate": 1.9868739885200718e-05,
+ "loss": 1.7466,
+ "step": 2939
+ },
+ {
+ "epoch": 8.010899182561309,
+ "grad_norm": 18.678430557250977,
+ "learning_rate": 1.9868597330771648e-05,
+ "loss": 1.7124,
+ "step": 2940
+ },
+ {
+ "epoch": 8.013623978201634,
+ "grad_norm": 12.0128755569458,
+ "learning_rate": 1.986845469948626e-05,
+ "loss": 1.5017,
+ "step": 2941
+ },
+ {
+ "epoch": 8.016348773841962,
+ "grad_norm": 10.23306655883789,
+ "learning_rate": 1.986831199134567e-05,
+ "loss": 1.3601,
+ "step": 2942
+ },
+ {
+ "epoch": 8.01907356948229,
+ "grad_norm": 10.015888214111328,
+ "learning_rate": 1.986816920635098e-05,
+ "loss": 1.5457,
+ "step": 2943
+ },
+ {
+ "epoch": 8.021798365122615,
+ "grad_norm": 10.267995834350586,
+ "learning_rate": 1.9868026344503307e-05,
+ "loss": 1.4854,
+ "step": 2944
+ },
+ {
+ "epoch": 8.024523160762943,
+ "grad_norm": 9.181854248046875,
+ "learning_rate": 1.986788340580376e-05,
+ "loss": 1.239,
+ "step": 2945
+ },
+ {
+ "epoch": 8.02724795640327,
+ "grad_norm": 11.752165794372559,
+ "learning_rate": 1.9867740390253458e-05,
+ "loss": 1.4785,
+ "step": 2946
+ },
+ {
+ "epoch": 8.029972752043596,
+ "grad_norm": 13.72391414642334,
+ "learning_rate": 1.986759729785351e-05,
+ "loss": 1.4178,
+ "step": 2947
+ },
+ {
+ "epoch": 8.032697547683924,
+ "grad_norm": 11.265132904052734,
+ "learning_rate": 1.9867454128605033e-05,
+ "loss": 1.689,
+ "step": 2948
+ },
+ {
+ "epoch": 8.035422343324251,
+ "grad_norm": 10.6729154586792,
+ "learning_rate": 1.9867310882509136e-05,
+ "loss": 1.3896,
+ "step": 2949
+ },
+ {
+ "epoch": 8.038147138964577,
+ "grad_norm": 14.195324897766113,
+ "learning_rate": 1.9867167559566944e-05,
+ "loss": 1.363,
+ "step": 2950
+ },
+ {
+ "epoch": 8.040871934604905,
+ "grad_norm": 11.9901762008667,
+ "learning_rate": 1.986702415977957e-05,
+ "loss": 1.4023,
+ "step": 2951
+ },
+ {
+ "epoch": 8.043596730245232,
+ "grad_norm": 11.18156909942627,
+ "learning_rate": 1.9866880683148128e-05,
+ "loss": 1.4705,
+ "step": 2952
+ },
+ {
+ "epoch": 8.046321525885558,
+ "grad_norm": 14.364361763000488,
+ "learning_rate": 1.9866737129673733e-05,
+ "loss": 1.4668,
+ "step": 2953
+ },
+ {
+ "epoch": 8.049046321525886,
+ "grad_norm": 36.69050598144531,
+ "learning_rate": 1.9866593499357508e-05,
+ "loss": 1.7817,
+ "step": 2954
+ },
+ {
+ "epoch": 8.051771117166213,
+ "grad_norm": 10.556742668151855,
+ "learning_rate": 1.9866449792200572e-05,
+ "loss": 1.5327,
+ "step": 2955
+ },
+ {
+ "epoch": 8.054495912806539,
+ "grad_norm": 13.603948593139648,
+ "learning_rate": 1.9866306008204042e-05,
+ "loss": 1.3187,
+ "step": 2956
+ },
+ {
+ "epoch": 8.057220708446867,
+ "grad_norm": 11.465261459350586,
+ "learning_rate": 1.986616214736904e-05,
+ "loss": 1.7153,
+ "step": 2957
+ },
+ {
+ "epoch": 8.059945504087194,
+ "grad_norm": 32.16316604614258,
+ "learning_rate": 1.9866018209696686e-05,
+ "loss": 1.9456,
+ "step": 2958
+ },
+ {
+ "epoch": 8.06267029972752,
+ "grad_norm": 13.840081214904785,
+ "learning_rate": 1.9865874195188095e-05,
+ "loss": 1.585,
+ "step": 2959
+ },
+ {
+ "epoch": 8.065395095367847,
+ "grad_norm": 10.292863845825195,
+ "learning_rate": 1.9865730103844397e-05,
+ "loss": 1.5513,
+ "step": 2960
+ },
+ {
+ "epoch": 8.068119891008175,
+ "grad_norm": 10.423396110534668,
+ "learning_rate": 1.9865585935666706e-05,
+ "loss": 1.5293,
+ "step": 2961
+ },
+ {
+ "epoch": 8.0708446866485,
+ "grad_norm": 18.91510772705078,
+ "learning_rate": 1.9865441690656154e-05,
+ "loss": 1.2377,
+ "step": 2962
+ },
+ {
+ "epoch": 8.073569482288828,
+ "grad_norm": 9.956671714782715,
+ "learning_rate": 1.986529736881386e-05,
+ "loss": 1.4131,
+ "step": 2963
+ },
+ {
+ "epoch": 8.076294277929156,
+ "grad_norm": 20.656063079833984,
+ "learning_rate": 1.9865152970140946e-05,
+ "loss": 1.6997,
+ "step": 2964
+ },
+ {
+ "epoch": 8.079019073569482,
+ "grad_norm": 10.994516372680664,
+ "learning_rate": 1.9865008494638536e-05,
+ "loss": 1.5242,
+ "step": 2965
+ },
+ {
+ "epoch": 8.08174386920981,
+ "grad_norm": 12.00313949584961,
+ "learning_rate": 1.986486394230776e-05,
+ "loss": 1.4519,
+ "step": 2966
+ },
+ {
+ "epoch": 8.084468664850137,
+ "grad_norm": 10.38339900970459,
+ "learning_rate": 1.986471931314974e-05,
+ "loss": 1.4712,
+ "step": 2967
+ },
+ {
+ "epoch": 8.087193460490463,
+ "grad_norm": 11.970154762268066,
+ "learning_rate": 1.9864574607165602e-05,
+ "loss": 1.5349,
+ "step": 2968
+ },
+ {
+ "epoch": 8.08991825613079,
+ "grad_norm": 14.663086891174316,
+ "learning_rate": 1.9864429824356478e-05,
+ "loss": 1.4507,
+ "step": 2969
+ },
+ {
+ "epoch": 8.092643051771118,
+ "grad_norm": 11.080653190612793,
+ "learning_rate": 1.9864284964723488e-05,
+ "loss": 1.5071,
+ "step": 2970
+ },
+ {
+ "epoch": 8.095367847411444,
+ "grad_norm": 13.981965065002441,
+ "learning_rate": 1.9864140028267767e-05,
+ "loss": 1.7878,
+ "step": 2971
+ },
+ {
+ "epoch": 8.098092643051771,
+ "grad_norm": 11.915581703186035,
+ "learning_rate": 1.986399501499044e-05,
+ "loss": 1.5005,
+ "step": 2972
+ },
+ {
+ "epoch": 8.100817438692099,
+ "grad_norm": 11.16733455657959,
+ "learning_rate": 1.986384992489264e-05,
+ "loss": 1.4048,
+ "step": 2973
+ },
+ {
+ "epoch": 8.103542234332425,
+ "grad_norm": 11.649931907653809,
+ "learning_rate": 1.9863704757975492e-05,
+ "loss": 1.3342,
+ "step": 2974
+ },
+ {
+ "epoch": 8.106267029972752,
+ "grad_norm": 10.512341499328613,
+ "learning_rate": 1.9863559514240128e-05,
+ "loss": 1.4778,
+ "step": 2975
+ },
+ {
+ "epoch": 8.10899182561308,
+ "grad_norm": 12.347107887268066,
+ "learning_rate": 1.986341419368768e-05,
+ "loss": 1.4309,
+ "step": 2976
+ },
+ {
+ "epoch": 8.111716621253406,
+ "grad_norm": 10.135472297668457,
+ "learning_rate": 1.9863268796319278e-05,
+ "loss": 1.4036,
+ "step": 2977
+ },
+ {
+ "epoch": 8.114441416893733,
+ "grad_norm": 37.992225646972656,
+ "learning_rate": 1.9863123322136058e-05,
+ "loss": 1.4419,
+ "step": 2978
+ },
+ {
+ "epoch": 8.11716621253406,
+ "grad_norm": 9.647393226623535,
+ "learning_rate": 1.9862977771139154e-05,
+ "loss": 1.5249,
+ "step": 2979
+ },
+ {
+ "epoch": 8.119891008174386,
+ "grad_norm": 11.539268493652344,
+ "learning_rate": 1.9862832143329694e-05,
+ "loss": 1.4644,
+ "step": 2980
+ },
+ {
+ "epoch": 8.122615803814714,
+ "grad_norm": 9.759735107421875,
+ "learning_rate": 1.9862686438708813e-05,
+ "loss": 1.2756,
+ "step": 2981
+ },
+ {
+ "epoch": 8.125340599455042,
+ "grad_norm": 11.171850204467773,
+ "learning_rate": 1.986254065727765e-05,
+ "loss": 1.3867,
+ "step": 2982
+ },
+ {
+ "epoch": 8.128065395095367,
+ "grad_norm": 11.682690620422363,
+ "learning_rate": 1.9862394799037338e-05,
+ "loss": 1.5037,
+ "step": 2983
+ },
+ {
+ "epoch": 8.130790190735695,
+ "grad_norm": 10.766770362854004,
+ "learning_rate": 1.986224886398901e-05,
+ "loss": 1.5959,
+ "step": 2984
+ },
+ {
+ "epoch": 8.133514986376023,
+ "grad_norm": 12.399341583251953,
+ "learning_rate": 1.986210285213381e-05,
+ "loss": 1.4543,
+ "step": 2985
+ },
+ {
+ "epoch": 8.136239782016348,
+ "grad_norm": 9.954695701599121,
+ "learning_rate": 1.9861956763472866e-05,
+ "loss": 1.4868,
+ "step": 2986
+ },
+ {
+ "epoch": 8.138964577656676,
+ "grad_norm": 11.342049598693848,
+ "learning_rate": 1.986181059800732e-05,
+ "loss": 1.6086,
+ "step": 2987
+ },
+ {
+ "epoch": 8.141689373297003,
+ "grad_norm": 10.286776542663574,
+ "learning_rate": 1.986166435573831e-05,
+ "loss": 1.3677,
+ "step": 2988
+ },
+ {
+ "epoch": 8.14441416893733,
+ "grad_norm": 9.159870147705078,
+ "learning_rate": 1.9861518036666978e-05,
+ "loss": 1.5474,
+ "step": 2989
+ },
+ {
+ "epoch": 8.147138964577657,
+ "grad_norm": 10.327608108520508,
+ "learning_rate": 1.986137164079446e-05,
+ "loss": 1.3647,
+ "step": 2990
+ },
+ {
+ "epoch": 8.149863760217984,
+ "grad_norm": 12.476815223693848,
+ "learning_rate": 1.98612251681219e-05,
+ "loss": 1.4353,
+ "step": 2991
+ },
+ {
+ "epoch": 8.15258855585831,
+ "grad_norm": 8.87645435333252,
+ "learning_rate": 1.986107861865043e-05,
+ "loss": 1.4033,
+ "step": 2992
+ },
+ {
+ "epoch": 8.155313351498638,
+ "grad_norm": 13.785514831542969,
+ "learning_rate": 1.9860931992381202e-05,
+ "loss": 1.4614,
+ "step": 2993
+ },
+ {
+ "epoch": 8.158038147138965,
+ "grad_norm": 8.921813011169434,
+ "learning_rate": 1.9860785289315352e-05,
+ "loss": 1.2593,
+ "step": 2994
+ },
+ {
+ "epoch": 8.160762942779291,
+ "grad_norm": 10.972900390625,
+ "learning_rate": 1.986063850945402e-05,
+ "loss": 1.5112,
+ "step": 2995
+ },
+ {
+ "epoch": 8.163487738419619,
+ "grad_norm": 11.340409278869629,
+ "learning_rate": 1.9860491652798358e-05,
+ "loss": 1.5261,
+ "step": 2996
+ },
+ {
+ "epoch": 8.166212534059946,
+ "grad_norm": 11.435660362243652,
+ "learning_rate": 1.98603447193495e-05,
+ "loss": 1.5381,
+ "step": 2997
+ },
+ {
+ "epoch": 8.168937329700272,
+ "grad_norm": 10.339703559875488,
+ "learning_rate": 1.9860197709108596e-05,
+ "loss": 1.3696,
+ "step": 2998
+ },
+ {
+ "epoch": 8.1716621253406,
+ "grad_norm": 10.372658729553223,
+ "learning_rate": 1.986005062207679e-05,
+ "loss": 1.3369,
+ "step": 2999
+ },
+ {
+ "epoch": 8.174386920980927,
+ "grad_norm": 12.192550659179688,
+ "learning_rate": 1.9859903458255227e-05,
+ "loss": 1.5547,
+ "step": 3000
+ },
+ {
+ "epoch": 8.177111716621253,
+ "grad_norm": 9.437643051147461,
+ "learning_rate": 1.9859756217645054e-05,
+ "loss": 1.4419,
+ "step": 3001
+ },
+ {
+ "epoch": 8.17983651226158,
+ "grad_norm": 30.47894287109375,
+ "learning_rate": 1.9859608900247417e-05,
+ "loss": 1.4702,
+ "step": 3002
+ },
+ {
+ "epoch": 8.182561307901908,
+ "grad_norm": 9.573280334472656,
+ "learning_rate": 1.985946150606346e-05,
+ "loss": 1.542,
+ "step": 3003
+ },
+ {
+ "epoch": 8.185286103542234,
+ "grad_norm": 8.637099266052246,
+ "learning_rate": 1.985931403509434e-05,
+ "loss": 1.4841,
+ "step": 3004
+ },
+ {
+ "epoch": 8.188010899182562,
+ "grad_norm": 10.783534049987793,
+ "learning_rate": 1.9859166487341194e-05,
+ "loss": 1.4346,
+ "step": 3005
+ },
+ {
+ "epoch": 8.190735694822889,
+ "grad_norm": 9.640056610107422,
+ "learning_rate": 1.985901886280518e-05,
+ "loss": 1.3105,
+ "step": 3006
+ },
+ {
+ "epoch": 8.193460490463215,
+ "grad_norm": 10.957379341125488,
+ "learning_rate": 1.985887116148744e-05,
+ "loss": 1.4785,
+ "step": 3007
+ },
+ {
+ "epoch": 8.196185286103542,
+ "grad_norm": 8.909079551696777,
+ "learning_rate": 1.9858723383389134e-05,
+ "loss": 1.2114,
+ "step": 3008
+ },
+ {
+ "epoch": 8.19891008174387,
+ "grad_norm": 9.386533737182617,
+ "learning_rate": 1.9858575528511406e-05,
+ "loss": 1.4482,
+ "step": 3009
+ },
+ {
+ "epoch": 8.201634877384196,
+ "grad_norm": 23.52212142944336,
+ "learning_rate": 1.9858427596855407e-05,
+ "loss": 1.5076,
+ "step": 3010
+ },
+ {
+ "epoch": 8.204359673024523,
+ "grad_norm": 11.575129508972168,
+ "learning_rate": 1.9858279588422294e-05,
+ "loss": 1.4038,
+ "step": 3011
+ },
+ {
+ "epoch": 8.207084468664851,
+ "grad_norm": 13.577309608459473,
+ "learning_rate": 1.9858131503213214e-05,
+ "loss": 1.5769,
+ "step": 3012
+ },
+ {
+ "epoch": 8.209809264305177,
+ "grad_norm": 11.172263145446777,
+ "learning_rate": 1.9857983341229326e-05,
+ "loss": 1.6812,
+ "step": 3013
+ },
+ {
+ "epoch": 8.212534059945504,
+ "grad_norm": 10.272761344909668,
+ "learning_rate": 1.985783510247178e-05,
+ "loss": 1.5347,
+ "step": 3014
+ },
+ {
+ "epoch": 8.215258855585832,
+ "grad_norm": 10.700855255126953,
+ "learning_rate": 1.9857686786941733e-05,
+ "loss": 1.4775,
+ "step": 3015
+ },
+ {
+ "epoch": 8.217983651226158,
+ "grad_norm": 9.62952995300293,
+ "learning_rate": 1.9857538394640336e-05,
+ "loss": 1.3901,
+ "step": 3016
+ },
+ {
+ "epoch": 8.220708446866485,
+ "grad_norm": 9.708124160766602,
+ "learning_rate": 1.9857389925568745e-05,
+ "loss": 1.5703,
+ "step": 3017
+ },
+ {
+ "epoch": 8.223433242506813,
+ "grad_norm": 17.98137092590332,
+ "learning_rate": 1.9857241379728122e-05,
+ "loss": 1.5413,
+ "step": 3018
+ },
+ {
+ "epoch": 8.226158038147139,
+ "grad_norm": 11.248151779174805,
+ "learning_rate": 1.9857092757119622e-05,
+ "loss": 1.5107,
+ "step": 3019
+ },
+ {
+ "epoch": 8.228882833787466,
+ "grad_norm": 12.324178695678711,
+ "learning_rate": 1.9856944057744398e-05,
+ "loss": 1.5288,
+ "step": 3020
+ },
+ {
+ "epoch": 8.231607629427794,
+ "grad_norm": 10.10075855255127,
+ "learning_rate": 1.985679528160361e-05,
+ "loss": 1.4973,
+ "step": 3021
+ },
+ {
+ "epoch": 8.23433242506812,
+ "grad_norm": 14.341442108154297,
+ "learning_rate": 1.985664642869842e-05,
+ "loss": 1.2368,
+ "step": 3022
+ },
+ {
+ "epoch": 8.237057220708447,
+ "grad_norm": 11.082841873168945,
+ "learning_rate": 1.9856497499029987e-05,
+ "loss": 1.3391,
+ "step": 3023
+ },
+ {
+ "epoch": 8.239782016348773,
+ "grad_norm": 10.736616134643555,
+ "learning_rate": 1.9856348492599464e-05,
+ "loss": 1.4377,
+ "step": 3024
+ },
+ {
+ "epoch": 8.2425068119891,
+ "grad_norm": 9.020471572875977,
+ "learning_rate": 1.9856199409408017e-05,
+ "loss": 1.2141,
+ "step": 3025
+ },
+ {
+ "epoch": 8.245231607629428,
+ "grad_norm": 11.725255012512207,
+ "learning_rate": 1.9856050249456808e-05,
+ "loss": 1.3958,
+ "step": 3026
+ },
+ {
+ "epoch": 8.247956403269754,
+ "grad_norm": 10.40517807006836,
+ "learning_rate": 1.9855901012746996e-05,
+ "loss": 1.4919,
+ "step": 3027
+ },
+ {
+ "epoch": 8.250681198910081,
+ "grad_norm": 11.07318115234375,
+ "learning_rate": 1.9855751699279745e-05,
+ "loss": 1.5129,
+ "step": 3028
+ },
+ {
+ "epoch": 8.253405994550409,
+ "grad_norm": 9.537273406982422,
+ "learning_rate": 1.9855602309056216e-05,
+ "loss": 1.4246,
+ "step": 3029
+ },
+ {
+ "epoch": 8.256130790190735,
+ "grad_norm": 11.27015495300293,
+ "learning_rate": 1.9855452842077573e-05,
+ "loss": 1.7637,
+ "step": 3030
+ },
+ {
+ "epoch": 8.258855585831062,
+ "grad_norm": 11.040712356567383,
+ "learning_rate": 1.9855303298344985e-05,
+ "loss": 1.3016,
+ "step": 3031
+ },
+ {
+ "epoch": 8.26158038147139,
+ "grad_norm": 12.095251083374023,
+ "learning_rate": 1.9855153677859604e-05,
+ "loss": 1.5215,
+ "step": 3032
+ },
+ {
+ "epoch": 8.264305177111716,
+ "grad_norm": 10.048185348510742,
+ "learning_rate": 1.985500398062261e-05,
+ "loss": 1.345,
+ "step": 3033
+ },
+ {
+ "epoch": 8.267029972752043,
+ "grad_norm": 11.623002052307129,
+ "learning_rate": 1.985485420663516e-05,
+ "loss": 1.4788,
+ "step": 3034
+ },
+ {
+ "epoch": 8.269754768392371,
+ "grad_norm": 10.471136093139648,
+ "learning_rate": 1.985470435589842e-05,
+ "loss": 1.3445,
+ "step": 3035
+ },
+ {
+ "epoch": 8.272479564032697,
+ "grad_norm": 26.749555587768555,
+ "learning_rate": 1.9854554428413563e-05,
+ "loss": 1.4272,
+ "step": 3036
+ },
+ {
+ "epoch": 8.275204359673024,
+ "grad_norm": 10.94150447845459,
+ "learning_rate": 1.9854404424181752e-05,
+ "loss": 1.3726,
+ "step": 3037
+ },
+ {
+ "epoch": 8.277929155313352,
+ "grad_norm": 17.83536148071289,
+ "learning_rate": 1.9854254343204155e-05,
+ "loss": 1.3127,
+ "step": 3038
+ },
+ {
+ "epoch": 8.280653950953678,
+ "grad_norm": 10.491273880004883,
+ "learning_rate": 1.9854104185481944e-05,
+ "loss": 1.396,
+ "step": 3039
+ },
+ {
+ "epoch": 8.283378746594005,
+ "grad_norm": 15.343791961669922,
+ "learning_rate": 1.985395395101629e-05,
+ "loss": 1.4219,
+ "step": 3040
+ },
+ {
+ "epoch": 8.286103542234333,
+ "grad_norm": 11.310440063476562,
+ "learning_rate": 1.9853803639808357e-05,
+ "loss": 1.3748,
+ "step": 3041
+ },
+ {
+ "epoch": 8.288828337874659,
+ "grad_norm": 12.330083847045898,
+ "learning_rate": 1.9853653251859315e-05,
+ "loss": 1.3645,
+ "step": 3042
+ },
+ {
+ "epoch": 8.291553133514986,
+ "grad_norm": 16.09228515625,
+ "learning_rate": 1.9853502787170345e-05,
+ "loss": 1.4675,
+ "step": 3043
+ },
+ {
+ "epoch": 8.294277929155314,
+ "grad_norm": 11.356207847595215,
+ "learning_rate": 1.985335224574261e-05,
+ "loss": 1.5474,
+ "step": 3044
+ },
+ {
+ "epoch": 8.29700272479564,
+ "grad_norm": 14.240828514099121,
+ "learning_rate": 1.9853201627577283e-05,
+ "loss": 1.4148,
+ "step": 3045
+ },
+ {
+ "epoch": 8.299727520435967,
+ "grad_norm": 15.836702346801758,
+ "learning_rate": 1.985305093267554e-05,
+ "loss": 1.4309,
+ "step": 3046
+ },
+ {
+ "epoch": 8.302452316076295,
+ "grad_norm": 8.947978019714355,
+ "learning_rate": 1.9852900161038552e-05,
+ "loss": 1.3464,
+ "step": 3047
+ },
+ {
+ "epoch": 8.30517711171662,
+ "grad_norm": 20.330575942993164,
+ "learning_rate": 1.9852749312667496e-05,
+ "loss": 1.3528,
+ "step": 3048
+ },
+ {
+ "epoch": 8.307901907356948,
+ "grad_norm": 12.280182838439941,
+ "learning_rate": 1.9852598387563545e-05,
+ "loss": 1.4248,
+ "step": 3049
+ },
+ {
+ "epoch": 8.310626702997276,
+ "grad_norm": 12.325653076171875,
+ "learning_rate": 1.9852447385727876e-05,
+ "loss": 1.3672,
+ "step": 3050
+ },
+ {
+ "epoch": 8.313351498637601,
+ "grad_norm": 15.524264335632324,
+ "learning_rate": 1.985229630716166e-05,
+ "loss": 1.614,
+ "step": 3051
+ },
+ {
+ "epoch": 8.316076294277929,
+ "grad_norm": 12.32604694366455,
+ "learning_rate": 1.985214515186608e-05,
+ "loss": 1.6929,
+ "step": 3052
+ },
+ {
+ "epoch": 8.318801089918257,
+ "grad_norm": 18.24497413635254,
+ "learning_rate": 1.9851993919842314e-05,
+ "loss": 1.3445,
+ "step": 3053
+ },
+ {
+ "epoch": 8.321525885558582,
+ "grad_norm": 10.476236343383789,
+ "learning_rate": 1.9851842611091534e-05,
+ "loss": 1.5415,
+ "step": 3054
+ },
+ {
+ "epoch": 8.32425068119891,
+ "grad_norm": 13.16490364074707,
+ "learning_rate": 1.985169122561492e-05,
+ "loss": 1.4502,
+ "step": 3055
+ },
+ {
+ "epoch": 8.326975476839237,
+ "grad_norm": 8.830989837646484,
+ "learning_rate": 1.9851539763413653e-05,
+ "loss": 1.3802,
+ "step": 3056
+ },
+ {
+ "epoch": 8.329700272479563,
+ "grad_norm": 14.608965873718262,
+ "learning_rate": 1.985138822448891e-05,
+ "loss": 1.436,
+ "step": 3057
+ },
+ {
+ "epoch": 8.33242506811989,
+ "grad_norm": 9.7664155960083,
+ "learning_rate": 1.9851236608841874e-05,
+ "loss": 1.3562,
+ "step": 3058
+ },
+ {
+ "epoch": 8.335149863760218,
+ "grad_norm": 8.381041526794434,
+ "learning_rate": 1.985108491647372e-05,
+ "loss": 1.374,
+ "step": 3059
+ },
+ {
+ "epoch": 8.337874659400544,
+ "grad_norm": 8.069664001464844,
+ "learning_rate": 1.9850933147385637e-05,
+ "loss": 1.3459,
+ "step": 3060
+ },
+ {
+ "epoch": 8.340599455040872,
+ "grad_norm": 11.313298225402832,
+ "learning_rate": 1.9850781301578808e-05,
+ "loss": 1.4307,
+ "step": 3061
+ },
+ {
+ "epoch": 8.3433242506812,
+ "grad_norm": 16.71454620361328,
+ "learning_rate": 1.985062937905441e-05,
+ "loss": 1.4785,
+ "step": 3062
+ },
+ {
+ "epoch": 8.346049046321525,
+ "grad_norm": 15.24333667755127,
+ "learning_rate": 1.9850477379813622e-05,
+ "loss": 1.5354,
+ "step": 3063
+ },
+ {
+ "epoch": 8.348773841961853,
+ "grad_norm": 8.75456714630127,
+ "learning_rate": 1.9850325303857634e-05,
+ "loss": 1.4526,
+ "step": 3064
+ },
+ {
+ "epoch": 8.35149863760218,
+ "grad_norm": 11.578174591064453,
+ "learning_rate": 1.9850173151187634e-05,
+ "loss": 1.4067,
+ "step": 3065
+ },
+ {
+ "epoch": 8.354223433242506,
+ "grad_norm": 16.258743286132812,
+ "learning_rate": 1.9850020921804797e-05,
+ "loss": 1.5942,
+ "step": 3066
+ },
+ {
+ "epoch": 8.356948228882834,
+ "grad_norm": 9.28243350982666,
+ "learning_rate": 1.9849868615710316e-05,
+ "loss": 1.4578,
+ "step": 3067
+ },
+ {
+ "epoch": 8.359673024523161,
+ "grad_norm": 9.199224472045898,
+ "learning_rate": 1.9849716232905378e-05,
+ "loss": 1.3044,
+ "step": 3068
+ },
+ {
+ "epoch": 8.362397820163487,
+ "grad_norm": 12.875617027282715,
+ "learning_rate": 1.9849563773391163e-05,
+ "loss": 1.4543,
+ "step": 3069
+ },
+ {
+ "epoch": 8.365122615803815,
+ "grad_norm": 10.499556541442871,
+ "learning_rate": 1.9849411237168866e-05,
+ "loss": 1.4924,
+ "step": 3070
+ },
+ {
+ "epoch": 8.367847411444142,
+ "grad_norm": 10.636470794677734,
+ "learning_rate": 1.9849258624239672e-05,
+ "loss": 1.5032,
+ "step": 3071
+ },
+ {
+ "epoch": 8.370572207084468,
+ "grad_norm": 12.64499282836914,
+ "learning_rate": 1.9849105934604766e-05,
+ "loss": 1.5383,
+ "step": 3072
+ },
+ {
+ "epoch": 8.373297002724795,
+ "grad_norm": 11.598895072937012,
+ "learning_rate": 1.9848953168265342e-05,
+ "loss": 1.3938,
+ "step": 3073
+ },
+ {
+ "epoch": 8.376021798365123,
+ "grad_norm": 10.648917198181152,
+ "learning_rate": 1.9848800325222585e-05,
+ "loss": 1.5962,
+ "step": 3074
+ },
+ {
+ "epoch": 8.378746594005449,
+ "grad_norm": 11.883172988891602,
+ "learning_rate": 1.984864740547769e-05,
+ "loss": 1.5996,
+ "step": 3075
+ },
+ {
+ "epoch": 8.381471389645776,
+ "grad_norm": 9.24280834197998,
+ "learning_rate": 1.9848494409031843e-05,
+ "loss": 1.1299,
+ "step": 3076
+ },
+ {
+ "epoch": 8.384196185286104,
+ "grad_norm": 22.34482765197754,
+ "learning_rate": 1.9848341335886243e-05,
+ "loss": 1.5037,
+ "step": 3077
+ },
+ {
+ "epoch": 8.38692098092643,
+ "grad_norm": 9.828432083129883,
+ "learning_rate": 1.9848188186042077e-05,
+ "loss": 1.4204,
+ "step": 3078
+ },
+ {
+ "epoch": 8.389645776566757,
+ "grad_norm": 9.711224555969238,
+ "learning_rate": 1.9848034959500535e-05,
+ "loss": 1.3201,
+ "step": 3079
+ },
+ {
+ "epoch": 8.392370572207085,
+ "grad_norm": 14.278112411499023,
+ "learning_rate": 1.9847881656262816e-05,
+ "loss": 1.6392,
+ "step": 3080
+ },
+ {
+ "epoch": 8.39509536784741,
+ "grad_norm": 10.200750350952148,
+ "learning_rate": 1.9847728276330113e-05,
+ "loss": 1.3245,
+ "step": 3081
+ },
+ {
+ "epoch": 8.397820163487738,
+ "grad_norm": 12.277810096740723,
+ "learning_rate": 1.9847574819703617e-05,
+ "loss": 1.4807,
+ "step": 3082
+ },
+ {
+ "epoch": 8.400544959128066,
+ "grad_norm": 9.278221130371094,
+ "learning_rate": 1.9847421286384526e-05,
+ "loss": 1.3394,
+ "step": 3083
+ },
+ {
+ "epoch": 8.403269754768392,
+ "grad_norm": 13.014542579650879,
+ "learning_rate": 1.9847267676374035e-05,
+ "loss": 1.3337,
+ "step": 3084
+ },
+ {
+ "epoch": 8.40599455040872,
+ "grad_norm": 25.616065979003906,
+ "learning_rate": 1.984711398967334e-05,
+ "loss": 1.342,
+ "step": 3085
+ },
+ {
+ "epoch": 8.408719346049047,
+ "grad_norm": 10.43862533569336,
+ "learning_rate": 1.9846960226283638e-05,
+ "loss": 1.5442,
+ "step": 3086
+ },
+ {
+ "epoch": 8.411444141689373,
+ "grad_norm": 10.15013313293457,
+ "learning_rate": 1.9846806386206127e-05,
+ "loss": 1.605,
+ "step": 3087
+ },
+ {
+ "epoch": 8.4141689373297,
+ "grad_norm": 18.991050720214844,
+ "learning_rate": 1.9846652469442003e-05,
+ "loss": 1.6562,
+ "step": 3088
+ },
+ {
+ "epoch": 8.416893732970028,
+ "grad_norm": 13.327840805053711,
+ "learning_rate": 1.9846498475992467e-05,
+ "loss": 1.4358,
+ "step": 3089
+ },
+ {
+ "epoch": 8.419618528610354,
+ "grad_norm": 13.403010368347168,
+ "learning_rate": 1.984634440585872e-05,
+ "loss": 1.4423,
+ "step": 3090
+ },
+ {
+ "epoch": 8.422343324250681,
+ "grad_norm": 12.706461906433105,
+ "learning_rate": 1.9846190259041956e-05,
+ "loss": 1.5865,
+ "step": 3091
+ },
+ {
+ "epoch": 8.425068119891009,
+ "grad_norm": 10.648401260375977,
+ "learning_rate": 1.9846036035543384e-05,
+ "loss": 1.468,
+ "step": 3092
+ },
+ {
+ "epoch": 8.427792915531334,
+ "grad_norm": 10.862265586853027,
+ "learning_rate": 1.98458817353642e-05,
+ "loss": 1.4192,
+ "step": 3093
+ },
+ {
+ "epoch": 8.430517711171662,
+ "grad_norm": 9.958219528198242,
+ "learning_rate": 1.9845727358505603e-05,
+ "loss": 1.3962,
+ "step": 3094
+ },
+ {
+ "epoch": 8.43324250681199,
+ "grad_norm": 18.21630859375,
+ "learning_rate": 1.9845572904968797e-05,
+ "loss": 1.5098,
+ "step": 3095
+ },
+ {
+ "epoch": 8.435967302452315,
+ "grad_norm": 10.30978775024414,
+ "learning_rate": 1.984541837475499e-05,
+ "loss": 1.4932,
+ "step": 3096
+ },
+ {
+ "epoch": 8.438692098092643,
+ "grad_norm": 10.251604080200195,
+ "learning_rate": 1.984526376786538e-05,
+ "loss": 1.5325,
+ "step": 3097
+ },
+ {
+ "epoch": 8.44141689373297,
+ "grad_norm": 11.313343048095703,
+ "learning_rate": 1.9845109084301173e-05,
+ "loss": 1.4907,
+ "step": 3098
+ },
+ {
+ "epoch": 8.444141689373296,
+ "grad_norm": 11.00373649597168,
+ "learning_rate": 1.984495432406357e-05,
+ "loss": 1.4763,
+ "step": 3099
+ },
+ {
+ "epoch": 8.446866485013624,
+ "grad_norm": 10.753448486328125,
+ "learning_rate": 1.9844799487153782e-05,
+ "loss": 1.4187,
+ "step": 3100
+ },
+ {
+ "epoch": 8.449591280653951,
+ "grad_norm": 9.696673393249512,
+ "learning_rate": 1.9844644573573016e-05,
+ "loss": 1.4119,
+ "step": 3101
+ },
+ {
+ "epoch": 8.452316076294277,
+ "grad_norm": 11.8190336227417,
+ "learning_rate": 1.984448958332247e-05,
+ "loss": 1.4204,
+ "step": 3102
+ },
+ {
+ "epoch": 8.455040871934605,
+ "grad_norm": 10.040216445922852,
+ "learning_rate": 1.9844334516403356e-05,
+ "loss": 1.311,
+ "step": 3103
+ },
+ {
+ "epoch": 8.457765667574932,
+ "grad_norm": 10.194698333740234,
+ "learning_rate": 1.9844179372816884e-05,
+ "loss": 1.4722,
+ "step": 3104
+ },
+ {
+ "epoch": 8.460490463215258,
+ "grad_norm": 12.599777221679688,
+ "learning_rate": 1.984402415256426e-05,
+ "loss": 1.708,
+ "step": 3105
+ },
+ {
+ "epoch": 8.463215258855586,
+ "grad_norm": 10.403139114379883,
+ "learning_rate": 1.984386885564669e-05,
+ "loss": 1.3508,
+ "step": 3106
+ },
+ {
+ "epoch": 8.465940054495913,
+ "grad_norm": 16.842971801757812,
+ "learning_rate": 1.984371348206539e-05,
+ "loss": 1.4905,
+ "step": 3107
+ },
+ {
+ "epoch": 8.46866485013624,
+ "grad_norm": 13.428004264831543,
+ "learning_rate": 1.9843558031821563e-05,
+ "loss": 1.6121,
+ "step": 3108
+ },
+ {
+ "epoch": 8.471389645776567,
+ "grad_norm": 12.502063751220703,
+ "learning_rate": 1.9843402504916424e-05,
+ "loss": 1.7378,
+ "step": 3109
+ },
+ {
+ "epoch": 8.474114441416894,
+ "grad_norm": 8.010069847106934,
+ "learning_rate": 1.9843246901351184e-05,
+ "loss": 1.3679,
+ "step": 3110
+ },
+ {
+ "epoch": 8.47683923705722,
+ "grad_norm": 11.141092300415039,
+ "learning_rate": 1.9843091221127053e-05,
+ "loss": 1.5574,
+ "step": 3111
+ },
+ {
+ "epoch": 8.479564032697548,
+ "grad_norm": 17.215499877929688,
+ "learning_rate": 1.9842935464245245e-05,
+ "loss": 1.5002,
+ "step": 3112
+ },
+ {
+ "epoch": 8.482288828337875,
+ "grad_norm": 10.081450462341309,
+ "learning_rate": 1.9842779630706972e-05,
+ "loss": 1.3403,
+ "step": 3113
+ },
+ {
+ "epoch": 8.485013623978201,
+ "grad_norm": 10.36174488067627,
+ "learning_rate": 1.9842623720513447e-05,
+ "loss": 1.4783,
+ "step": 3114
+ },
+ {
+ "epoch": 8.487738419618529,
+ "grad_norm": 9.917871475219727,
+ "learning_rate": 1.9842467733665886e-05,
+ "loss": 1.3081,
+ "step": 3115
+ },
+ {
+ "epoch": 8.490463215258856,
+ "grad_norm": 13.55300235748291,
+ "learning_rate": 1.9842311670165503e-05,
+ "loss": 1.3501,
+ "step": 3116
+ },
+ {
+ "epoch": 8.493188010899182,
+ "grad_norm": 10.539414405822754,
+ "learning_rate": 1.9842155530013514e-05,
+ "loss": 1.4915,
+ "step": 3117
+ },
+ {
+ "epoch": 8.49591280653951,
+ "grad_norm": 14.190298080444336,
+ "learning_rate": 1.9841999313211135e-05,
+ "loss": 1.5364,
+ "step": 3118
+ },
+ {
+ "epoch": 8.498637602179837,
+ "grad_norm": 11.394745826721191,
+ "learning_rate": 1.9841843019759583e-05,
+ "loss": 1.427,
+ "step": 3119
+ },
+ {
+ "epoch": 8.501362397820163,
+ "grad_norm": 11.221658706665039,
+ "learning_rate": 1.984168664966007e-05,
+ "loss": 1.394,
+ "step": 3120
+ },
+ {
+ "epoch": 8.50408719346049,
+ "grad_norm": 13.456465721130371,
+ "learning_rate": 1.9841530202913822e-05,
+ "loss": 1.386,
+ "step": 3121
+ },
+ {
+ "epoch": 8.506811989100818,
+ "grad_norm": 12.035820960998535,
+ "learning_rate": 1.984137367952205e-05,
+ "loss": 1.4299,
+ "step": 3122
+ },
+ {
+ "epoch": 8.509536784741144,
+ "grad_norm": 12.752290725708008,
+ "learning_rate": 1.984121707948598e-05,
+ "loss": 1.5894,
+ "step": 3123
+ },
+ {
+ "epoch": 8.512261580381471,
+ "grad_norm": 10.289709091186523,
+ "learning_rate": 1.9841060402806826e-05,
+ "loss": 1.4592,
+ "step": 3124
+ },
+ {
+ "epoch": 8.514986376021799,
+ "grad_norm": 12.596096992492676,
+ "learning_rate": 1.9840903649485812e-05,
+ "loss": 1.4778,
+ "step": 3125
+ },
+ {
+ "epoch": 8.517711171662125,
+ "grad_norm": 9.822829246520996,
+ "learning_rate": 1.9840746819524157e-05,
+ "loss": 1.3276,
+ "step": 3126
+ },
+ {
+ "epoch": 8.520435967302452,
+ "grad_norm": 11.025153160095215,
+ "learning_rate": 1.9840589912923082e-05,
+ "loss": 1.3391,
+ "step": 3127
+ },
+ {
+ "epoch": 8.52316076294278,
+ "grad_norm": 14.443016052246094,
+ "learning_rate": 1.984043292968381e-05,
+ "loss": 1.3357,
+ "step": 3128
+ },
+ {
+ "epoch": 8.525885558583106,
+ "grad_norm": 11.228981971740723,
+ "learning_rate": 1.984027586980756e-05,
+ "loss": 1.4622,
+ "step": 3129
+ },
+ {
+ "epoch": 8.528610354223433,
+ "grad_norm": 9.984880447387695,
+ "learning_rate": 1.984011873329556e-05,
+ "loss": 1.196,
+ "step": 3130
+ },
+ {
+ "epoch": 8.53133514986376,
+ "grad_norm": 14.243448257446289,
+ "learning_rate": 1.9839961520149035e-05,
+ "loss": 1.4465,
+ "step": 3131
+ },
+ {
+ "epoch": 8.534059945504087,
+ "grad_norm": 17.242151260375977,
+ "learning_rate": 1.9839804230369204e-05,
+ "loss": 1.3835,
+ "step": 3132
+ },
+ {
+ "epoch": 8.536784741144414,
+ "grad_norm": 10.174351692199707,
+ "learning_rate": 1.9839646863957294e-05,
+ "loss": 1.325,
+ "step": 3133
+ },
+ {
+ "epoch": 8.539509536784742,
+ "grad_norm": 14.6315279006958,
+ "learning_rate": 1.9839489420914533e-05,
+ "loss": 1.3896,
+ "step": 3134
+ },
+ {
+ "epoch": 8.542234332425068,
+ "grad_norm": 10.157470703125,
+ "learning_rate": 1.9839331901242144e-05,
+ "loss": 1.4033,
+ "step": 3135
+ },
+ {
+ "epoch": 8.544959128065395,
+ "grad_norm": 11.893716812133789,
+ "learning_rate": 1.983917430494135e-05,
+ "loss": 1.4417,
+ "step": 3136
+ },
+ {
+ "epoch": 8.547683923705723,
+ "grad_norm": 10.006495475769043,
+ "learning_rate": 1.9839016632013388e-05,
+ "loss": 1.48,
+ "step": 3137
+ },
+ {
+ "epoch": 8.550408719346049,
+ "grad_norm": 9.870905876159668,
+ "learning_rate": 1.9838858882459483e-05,
+ "loss": 1.562,
+ "step": 3138
+ },
+ {
+ "epoch": 8.553133514986376,
+ "grad_norm": 9.79379940032959,
+ "learning_rate": 1.9838701056280857e-05,
+ "loss": 1.2852,
+ "step": 3139
+ },
+ {
+ "epoch": 8.555858310626704,
+ "grad_norm": 14.175224304199219,
+ "learning_rate": 1.9838543153478746e-05,
+ "loss": 1.3904,
+ "step": 3140
+ },
+ {
+ "epoch": 8.55858310626703,
+ "grad_norm": 11.184218406677246,
+ "learning_rate": 1.9838385174054376e-05,
+ "loss": 1.4192,
+ "step": 3141
+ },
+ {
+ "epoch": 8.561307901907357,
+ "grad_norm": 14.325691223144531,
+ "learning_rate": 1.9838227118008982e-05,
+ "loss": 1.5825,
+ "step": 3142
+ },
+ {
+ "epoch": 8.564032697547685,
+ "grad_norm": 10.817137718200684,
+ "learning_rate": 1.983806898534379e-05,
+ "loss": 1.3391,
+ "step": 3143
+ },
+ {
+ "epoch": 8.56675749318801,
+ "grad_norm": 9.145304679870605,
+ "learning_rate": 1.9837910776060036e-05,
+ "loss": 1.4397,
+ "step": 3144
+ },
+ {
+ "epoch": 8.569482288828338,
+ "grad_norm": 8.59023666381836,
+ "learning_rate": 1.9837752490158946e-05,
+ "loss": 1.3081,
+ "step": 3145
+ },
+ {
+ "epoch": 8.572207084468666,
+ "grad_norm": 9.126311302185059,
+ "learning_rate": 1.9837594127641758e-05,
+ "loss": 1.4802,
+ "step": 3146
+ },
+ {
+ "epoch": 8.574931880108991,
+ "grad_norm": 9.468857765197754,
+ "learning_rate": 1.9837435688509704e-05,
+ "loss": 1.3608,
+ "step": 3147
+ },
+ {
+ "epoch": 8.577656675749319,
+ "grad_norm": 10.783597946166992,
+ "learning_rate": 1.9837277172764016e-05,
+ "loss": 1.5986,
+ "step": 3148
+ },
+ {
+ "epoch": 8.580381471389646,
+ "grad_norm": 9.311051368713379,
+ "learning_rate": 1.9837118580405928e-05,
+ "loss": 1.3455,
+ "step": 3149
+ },
+ {
+ "epoch": 8.583106267029972,
+ "grad_norm": 17.301712036132812,
+ "learning_rate": 1.9836959911436682e-05,
+ "loss": 1.5852,
+ "step": 3150
+ },
+ {
+ "epoch": 8.5858310626703,
+ "grad_norm": 9.285280227661133,
+ "learning_rate": 1.9836801165857507e-05,
+ "loss": 1.4199,
+ "step": 3151
+ },
+ {
+ "epoch": 8.588555858310627,
+ "grad_norm": 11.945184707641602,
+ "learning_rate": 1.983664234366964e-05,
+ "loss": 1.4299,
+ "step": 3152
+ },
+ {
+ "epoch": 8.591280653950953,
+ "grad_norm": 10.90672779083252,
+ "learning_rate": 1.9836483444874317e-05,
+ "loss": 1.3088,
+ "step": 3153
+ },
+ {
+ "epoch": 8.59400544959128,
+ "grad_norm": 9.78835678100586,
+ "learning_rate": 1.9836324469472782e-05,
+ "loss": 1.447,
+ "step": 3154
+ },
+ {
+ "epoch": 8.596730245231608,
+ "grad_norm": 11.199138641357422,
+ "learning_rate": 1.9836165417466266e-05,
+ "loss": 1.3364,
+ "step": 3155
+ },
+ {
+ "epoch": 8.599455040871934,
+ "grad_norm": 10.1149320602417,
+ "learning_rate": 1.983600628885601e-05,
+ "loss": 1.4536,
+ "step": 3156
+ },
+ {
+ "epoch": 8.602179836512262,
+ "grad_norm": 15.373045921325684,
+ "learning_rate": 1.9835847083643256e-05,
+ "loss": 1.7036,
+ "step": 3157
+ },
+ {
+ "epoch": 8.60490463215259,
+ "grad_norm": 11.325897216796875,
+ "learning_rate": 1.983568780182924e-05,
+ "loss": 1.3481,
+ "step": 3158
+ },
+ {
+ "epoch": 8.607629427792915,
+ "grad_norm": 10.771793365478516,
+ "learning_rate": 1.9835528443415205e-05,
+ "loss": 1.4155,
+ "step": 3159
+ },
+ {
+ "epoch": 8.610354223433243,
+ "grad_norm": 11.561205863952637,
+ "learning_rate": 1.983536900840239e-05,
+ "loss": 1.4573,
+ "step": 3160
+ },
+ {
+ "epoch": 8.61307901907357,
+ "grad_norm": 15.841632843017578,
+ "learning_rate": 1.9835209496792038e-05,
+ "loss": 1.5005,
+ "step": 3161
+ },
+ {
+ "epoch": 8.615803814713896,
+ "grad_norm": 10.387455940246582,
+ "learning_rate": 1.9835049908585388e-05,
+ "loss": 1.2476,
+ "step": 3162
+ },
+ {
+ "epoch": 8.618528610354224,
+ "grad_norm": 10.735313415527344,
+ "learning_rate": 1.983489024378369e-05,
+ "loss": 1.3098,
+ "step": 3163
+ },
+ {
+ "epoch": 8.621253405994551,
+ "grad_norm": 8.47869873046875,
+ "learning_rate": 1.983473050238818e-05,
+ "loss": 1.1816,
+ "step": 3164
+ },
+ {
+ "epoch": 8.623978201634877,
+ "grad_norm": 12.40446662902832,
+ "learning_rate": 1.983457068440011e-05,
+ "loss": 1.2859,
+ "step": 3165
+ },
+ {
+ "epoch": 8.626702997275205,
+ "grad_norm": 11.339210510253906,
+ "learning_rate": 1.983441078982072e-05,
+ "loss": 1.489,
+ "step": 3166
+ },
+ {
+ "epoch": 8.629427792915532,
+ "grad_norm": 18.086868286132812,
+ "learning_rate": 1.983425081865125e-05,
+ "loss": 1.4016,
+ "step": 3167
+ },
+ {
+ "epoch": 8.632152588555858,
+ "grad_norm": 7.482706069946289,
+ "learning_rate": 1.9834090770892952e-05,
+ "loss": 1.5005,
+ "step": 3168
+ },
+ {
+ "epoch": 8.634877384196185,
+ "grad_norm": 9.909168243408203,
+ "learning_rate": 1.9833930646547074e-05,
+ "loss": 1.3108,
+ "step": 3169
+ },
+ {
+ "epoch": 8.637602179836513,
+ "grad_norm": 14.946528434753418,
+ "learning_rate": 1.983377044561486e-05,
+ "loss": 1.592,
+ "step": 3170
+ },
+ {
+ "epoch": 8.640326975476839,
+ "grad_norm": 11.477744102478027,
+ "learning_rate": 1.9833610168097558e-05,
+ "loss": 1.4348,
+ "step": 3171
+ },
+ {
+ "epoch": 8.643051771117166,
+ "grad_norm": 13.602697372436523,
+ "learning_rate": 1.9833449813996416e-05,
+ "loss": 1.6536,
+ "step": 3172
+ },
+ {
+ "epoch": 8.645776566757494,
+ "grad_norm": 9.349848747253418,
+ "learning_rate": 1.9833289383312687e-05,
+ "loss": 1.3394,
+ "step": 3173
+ },
+ {
+ "epoch": 8.64850136239782,
+ "grad_norm": 11.529946327209473,
+ "learning_rate": 1.9833128876047612e-05,
+ "loss": 1.5176,
+ "step": 3174
+ },
+ {
+ "epoch": 8.651226158038147,
+ "grad_norm": 11.247405052185059,
+ "learning_rate": 1.9832968292202447e-05,
+ "loss": 1.4001,
+ "step": 3175
+ },
+ {
+ "epoch": 8.653950953678475,
+ "grad_norm": 7.817025184631348,
+ "learning_rate": 1.9832807631778443e-05,
+ "loss": 1.3018,
+ "step": 3176
+ },
+ {
+ "epoch": 8.6566757493188,
+ "grad_norm": 11.277419090270996,
+ "learning_rate": 1.9832646894776847e-05,
+ "loss": 1.5171,
+ "step": 3177
+ },
+ {
+ "epoch": 8.659400544959128,
+ "grad_norm": 9.400995254516602,
+ "learning_rate": 1.9832486081198915e-05,
+ "loss": 1.3835,
+ "step": 3178
+ },
+ {
+ "epoch": 8.662125340599456,
+ "grad_norm": 8.203719139099121,
+ "learning_rate": 1.9832325191045898e-05,
+ "loss": 1.2866,
+ "step": 3179
+ },
+ {
+ "epoch": 8.664850136239782,
+ "grad_norm": 10.158937454223633,
+ "learning_rate": 1.983216422431905e-05,
+ "loss": 1.4116,
+ "step": 3180
+ },
+ {
+ "epoch": 8.66757493188011,
+ "grad_norm": 9.965296745300293,
+ "learning_rate": 1.9832003181019622e-05,
+ "loss": 1.3708,
+ "step": 3181
+ },
+ {
+ "epoch": 8.670299727520437,
+ "grad_norm": 11.576178550720215,
+ "learning_rate": 1.983184206114887e-05,
+ "loss": 1.3733,
+ "step": 3182
+ },
+ {
+ "epoch": 8.673024523160763,
+ "grad_norm": 12.1446533203125,
+ "learning_rate": 1.983168086470805e-05,
+ "loss": 1.3831,
+ "step": 3183
+ },
+ {
+ "epoch": 8.67574931880109,
+ "grad_norm": 9.264537811279297,
+ "learning_rate": 1.9831519591698413e-05,
+ "loss": 1.4524,
+ "step": 3184
+ },
+ {
+ "epoch": 8.678474114441418,
+ "grad_norm": 11.140650749206543,
+ "learning_rate": 1.983135824212122e-05,
+ "loss": 1.6309,
+ "step": 3185
+ },
+ {
+ "epoch": 8.681198910081743,
+ "grad_norm": 9.234440803527832,
+ "learning_rate": 1.9831196815977724e-05,
+ "loss": 1.5391,
+ "step": 3186
+ },
+ {
+ "epoch": 8.683923705722071,
+ "grad_norm": 10.074746131896973,
+ "learning_rate": 1.9831035313269185e-05,
+ "loss": 1.582,
+ "step": 3187
+ },
+ {
+ "epoch": 8.686648501362399,
+ "grad_norm": 10.477161407470703,
+ "learning_rate": 1.9830873733996857e-05,
+ "loss": 1.5674,
+ "step": 3188
+ },
+ {
+ "epoch": 8.689373297002724,
+ "grad_norm": 8.84496784210205,
+ "learning_rate": 1.9830712078162e-05,
+ "loss": 1.4683,
+ "step": 3189
+ },
+ {
+ "epoch": 8.692098092643052,
+ "grad_norm": 9.623519897460938,
+ "learning_rate": 1.983055034576588e-05,
+ "loss": 1.5715,
+ "step": 3190
+ },
+ {
+ "epoch": 8.69482288828338,
+ "grad_norm": 27.9208927154541,
+ "learning_rate": 1.9830388536809746e-05,
+ "loss": 1.418,
+ "step": 3191
+ },
+ {
+ "epoch": 8.697547683923705,
+ "grad_norm": 14.704259872436523,
+ "learning_rate": 1.983022665129486e-05,
+ "loss": 1.6104,
+ "step": 3192
+ },
+ {
+ "epoch": 8.700272479564033,
+ "grad_norm": 10.346733093261719,
+ "learning_rate": 1.983006468922249e-05,
+ "loss": 1.5295,
+ "step": 3193
+ },
+ {
+ "epoch": 8.70299727520436,
+ "grad_norm": 7.489201068878174,
+ "learning_rate": 1.982990265059389e-05,
+ "loss": 1.408,
+ "step": 3194
+ },
+ {
+ "epoch": 8.705722070844686,
+ "grad_norm": 9.454360961914062,
+ "learning_rate": 1.9829740535410326e-05,
+ "loss": 1.3833,
+ "step": 3195
+ },
+ {
+ "epoch": 8.708446866485014,
+ "grad_norm": 10.133238792419434,
+ "learning_rate": 1.9829578343673058e-05,
+ "loss": 1.439,
+ "step": 3196
+ },
+ {
+ "epoch": 8.711171662125341,
+ "grad_norm": 10.01593017578125,
+ "learning_rate": 1.982941607538335e-05,
+ "loss": 1.623,
+ "step": 3197
+ },
+ {
+ "epoch": 8.713896457765667,
+ "grad_norm": 9.866012573242188,
+ "learning_rate": 1.9829253730542466e-05,
+ "loss": 1.325,
+ "step": 3198
+ },
+ {
+ "epoch": 8.716621253405995,
+ "grad_norm": 9.05703353881836,
+ "learning_rate": 1.9829091309151672e-05,
+ "loss": 1.3975,
+ "step": 3199
+ },
+ {
+ "epoch": 8.719346049046322,
+ "grad_norm": 8.689501762390137,
+ "learning_rate": 1.9828928811212228e-05,
+ "loss": 1.355,
+ "step": 3200
+ },
+ {
+ "epoch": 8.722070844686648,
+ "grad_norm": 89.05525207519531,
+ "learning_rate": 1.9828766236725406e-05,
+ "loss": 1.4399,
+ "step": 3201
+ },
+ {
+ "epoch": 8.724795640326976,
+ "grad_norm": 8.031493186950684,
+ "learning_rate": 1.9828603585692468e-05,
+ "loss": 1.1775,
+ "step": 3202
+ },
+ {
+ "epoch": 8.727520435967303,
+ "grad_norm": 9.144047737121582,
+ "learning_rate": 1.982844085811468e-05,
+ "loss": 1.5012,
+ "step": 3203
+ },
+ {
+ "epoch": 8.730245231607629,
+ "grad_norm": 8.287677764892578,
+ "learning_rate": 1.9828278053993313e-05,
+ "loss": 1.2903,
+ "step": 3204
+ },
+ {
+ "epoch": 8.732970027247957,
+ "grad_norm": 9.539989471435547,
+ "learning_rate": 1.982811517332963e-05,
+ "loss": 1.3569,
+ "step": 3205
+ },
+ {
+ "epoch": 8.735694822888284,
+ "grad_norm": 10.297660827636719,
+ "learning_rate": 1.9827952216124908e-05,
+ "loss": 1.6138,
+ "step": 3206
+ },
+ {
+ "epoch": 8.73841961852861,
+ "grad_norm": 9.752589225769043,
+ "learning_rate": 1.9827789182380407e-05,
+ "loss": 1.2336,
+ "step": 3207
+ },
+ {
+ "epoch": 8.741144414168938,
+ "grad_norm": 11.144782066345215,
+ "learning_rate": 1.9827626072097395e-05,
+ "loss": 1.3674,
+ "step": 3208
+ },
+ {
+ "epoch": 8.743869209809265,
+ "grad_norm": 11.73814582824707,
+ "learning_rate": 1.9827462885277155e-05,
+ "loss": 1.4758,
+ "step": 3209
+ },
+ {
+ "epoch": 8.746594005449591,
+ "grad_norm": 11.165502548217773,
+ "learning_rate": 1.9827299621920948e-05,
+ "loss": 1.5583,
+ "step": 3210
+ },
+ {
+ "epoch": 8.749318801089919,
+ "grad_norm": 10.431931495666504,
+ "learning_rate": 1.982713628203005e-05,
+ "loss": 1.5918,
+ "step": 3211
+ },
+ {
+ "epoch": 8.752043596730246,
+ "grad_norm": 14.608397483825684,
+ "learning_rate": 1.9826972865605725e-05,
+ "loss": 1.5596,
+ "step": 3212
+ },
+ {
+ "epoch": 8.754768392370572,
+ "grad_norm": 9.00948429107666,
+ "learning_rate": 1.9826809372649258e-05,
+ "loss": 1.5117,
+ "step": 3213
+ },
+ {
+ "epoch": 8.7574931880109,
+ "grad_norm": 11.614974021911621,
+ "learning_rate": 1.982664580316191e-05,
+ "loss": 1.5029,
+ "step": 3214
+ },
+ {
+ "epoch": 8.760217983651227,
+ "grad_norm": 10.131213188171387,
+ "learning_rate": 1.9826482157144962e-05,
+ "loss": 1.4861,
+ "step": 3215
+ },
+ {
+ "epoch": 8.762942779291553,
+ "grad_norm": 12.708951950073242,
+ "learning_rate": 1.9826318434599693e-05,
+ "loss": 1.4624,
+ "step": 3216
+ },
+ {
+ "epoch": 8.76566757493188,
+ "grad_norm": 10.052382469177246,
+ "learning_rate": 1.9826154635527368e-05,
+ "loss": 1.5754,
+ "step": 3217
+ },
+ {
+ "epoch": 8.768392370572208,
+ "grad_norm": 9.058707237243652,
+ "learning_rate": 1.982599075992927e-05,
+ "loss": 1.5889,
+ "step": 3218
+ },
+ {
+ "epoch": 8.771117166212534,
+ "grad_norm": 12.47221851348877,
+ "learning_rate": 1.9825826807806665e-05,
+ "loss": 1.3899,
+ "step": 3219
+ },
+ {
+ "epoch": 8.773841961852861,
+ "grad_norm": 9.93853759765625,
+ "learning_rate": 1.9825662779160843e-05,
+ "loss": 1.4197,
+ "step": 3220
+ },
+ {
+ "epoch": 8.776566757493189,
+ "grad_norm": 12.409202575683594,
+ "learning_rate": 1.9825498673993074e-05,
+ "loss": 1.4915,
+ "step": 3221
+ },
+ {
+ "epoch": 8.779291553133515,
+ "grad_norm": 11.034850120544434,
+ "learning_rate": 1.9825334492304637e-05,
+ "loss": 1.3545,
+ "step": 3222
+ },
+ {
+ "epoch": 8.782016348773842,
+ "grad_norm": 13.478449821472168,
+ "learning_rate": 1.9825170234096812e-05,
+ "loss": 1.4248,
+ "step": 3223
+ },
+ {
+ "epoch": 8.78474114441417,
+ "grad_norm": 9.65610122680664,
+ "learning_rate": 1.9825005899370877e-05,
+ "loss": 1.7104,
+ "step": 3224
+ },
+ {
+ "epoch": 8.787465940054496,
+ "grad_norm": 14.528332710266113,
+ "learning_rate": 1.982484148812811e-05,
+ "loss": 1.4719,
+ "step": 3225
+ },
+ {
+ "epoch": 8.790190735694823,
+ "grad_norm": 21.48270034790039,
+ "learning_rate": 1.9824677000369798e-05,
+ "loss": 1.5227,
+ "step": 3226
+ },
+ {
+ "epoch": 8.79291553133515,
+ "grad_norm": 9.869617462158203,
+ "learning_rate": 1.9824512436097216e-05,
+ "loss": 1.5923,
+ "step": 3227
+ },
+ {
+ "epoch": 8.795640326975477,
+ "grad_norm": 12.607680320739746,
+ "learning_rate": 1.9824347795311646e-05,
+ "loss": 1.3701,
+ "step": 3228
+ },
+ {
+ "epoch": 8.798365122615804,
+ "grad_norm": 9.923628807067871,
+ "learning_rate": 1.9824183078014373e-05,
+ "loss": 1.4026,
+ "step": 3229
+ },
+ {
+ "epoch": 8.80108991825613,
+ "grad_norm": 9.845184326171875,
+ "learning_rate": 1.9824018284206677e-05,
+ "loss": 1.3467,
+ "step": 3230
+ },
+ {
+ "epoch": 8.803814713896458,
+ "grad_norm": 10.393508911132812,
+ "learning_rate": 1.9823853413889846e-05,
+ "loss": 1.429,
+ "step": 3231
+ },
+ {
+ "epoch": 8.806539509536785,
+ "grad_norm": 8.768599510192871,
+ "learning_rate": 1.982368846706516e-05,
+ "loss": 1.3774,
+ "step": 3232
+ },
+ {
+ "epoch": 8.809264305177111,
+ "grad_norm": 10.29957103729248,
+ "learning_rate": 1.98235234437339e-05,
+ "loss": 1.5173,
+ "step": 3233
+ },
+ {
+ "epoch": 8.811989100817438,
+ "grad_norm": 11.418523788452148,
+ "learning_rate": 1.982335834389736e-05,
+ "loss": 1.3774,
+ "step": 3234
+ },
+ {
+ "epoch": 8.814713896457766,
+ "grad_norm": 13.813346862792969,
+ "learning_rate": 1.982319316755682e-05,
+ "loss": 1.5896,
+ "step": 3235
+ },
+ {
+ "epoch": 8.817438692098092,
+ "grad_norm": 13.180110931396484,
+ "learning_rate": 1.9823027914713567e-05,
+ "loss": 1.4475,
+ "step": 3236
+ },
+ {
+ "epoch": 8.82016348773842,
+ "grad_norm": 9.238238334655762,
+ "learning_rate": 1.982286258536889e-05,
+ "loss": 1.3816,
+ "step": 3237
+ },
+ {
+ "epoch": 8.822888283378747,
+ "grad_norm": 15.085087776184082,
+ "learning_rate": 1.9822697179524074e-05,
+ "loss": 1.7009,
+ "step": 3238
+ },
+ {
+ "epoch": 8.825613079019073,
+ "grad_norm": 9.169953346252441,
+ "learning_rate": 1.9822531697180412e-05,
+ "loss": 1.4221,
+ "step": 3239
+ },
+ {
+ "epoch": 8.8283378746594,
+ "grad_norm": 8.766127586364746,
+ "learning_rate": 1.9822366138339185e-05,
+ "loss": 1.5503,
+ "step": 3240
+ },
+ {
+ "epoch": 8.831062670299728,
+ "grad_norm": 8.895727157592773,
+ "learning_rate": 1.982220050300169e-05,
+ "loss": 1.5767,
+ "step": 3241
+ },
+ {
+ "epoch": 8.833787465940054,
+ "grad_norm": 18.501556396484375,
+ "learning_rate": 1.982203479116921e-05,
+ "loss": 1.6104,
+ "step": 3242
+ },
+ {
+ "epoch": 8.836512261580381,
+ "grad_norm": 9.487771987915039,
+ "learning_rate": 1.982186900284304e-05,
+ "loss": 1.5347,
+ "step": 3243
+ },
+ {
+ "epoch": 8.839237057220709,
+ "grad_norm": 8.779281616210938,
+ "learning_rate": 1.982170313802447e-05,
+ "loss": 1.5388,
+ "step": 3244
+ },
+ {
+ "epoch": 8.841961852861035,
+ "grad_norm": 15.55836009979248,
+ "learning_rate": 1.9821537196714797e-05,
+ "loss": 1.3896,
+ "step": 3245
+ },
+ {
+ "epoch": 8.844686648501362,
+ "grad_norm": 22.404815673828125,
+ "learning_rate": 1.9821371178915307e-05,
+ "loss": 1.6101,
+ "step": 3246
+ },
+ {
+ "epoch": 8.84741144414169,
+ "grad_norm": 10.606950759887695,
+ "learning_rate": 1.9821205084627292e-05,
+ "loss": 1.4644,
+ "step": 3247
+ },
+ {
+ "epoch": 8.850136239782016,
+ "grad_norm": 10.240605354309082,
+ "learning_rate": 1.982103891385205e-05,
+ "loss": 1.3381,
+ "step": 3248
+ },
+ {
+ "epoch": 8.852861035422343,
+ "grad_norm": 21.625900268554688,
+ "learning_rate": 1.982087266659087e-05,
+ "loss": 1.3345,
+ "step": 3249
+ },
+ {
+ "epoch": 8.85558583106267,
+ "grad_norm": 9.106072425842285,
+ "learning_rate": 1.982070634284505e-05,
+ "loss": 1.2634,
+ "step": 3250
+ },
+ {
+ "epoch": 8.858310626702997,
+ "grad_norm": 11.157843589782715,
+ "learning_rate": 1.9820539942615883e-05,
+ "loss": 1.4194,
+ "step": 3251
+ },
+ {
+ "epoch": 8.861035422343324,
+ "grad_norm": 11.39349365234375,
+ "learning_rate": 1.9820373465904672e-05,
+ "loss": 1.3013,
+ "step": 3252
+ },
+ {
+ "epoch": 8.863760217983652,
+ "grad_norm": 12.323468208312988,
+ "learning_rate": 1.982020691271271e-05,
+ "loss": 1.4363,
+ "step": 3253
+ },
+ {
+ "epoch": 8.866485013623977,
+ "grad_norm": 9.340956687927246,
+ "learning_rate": 1.9820040283041287e-05,
+ "loss": 1.322,
+ "step": 3254
+ },
+ {
+ "epoch": 8.869209809264305,
+ "grad_norm": 10.117134094238281,
+ "learning_rate": 1.9819873576891707e-05,
+ "loss": 1.4644,
+ "step": 3255
+ },
+ {
+ "epoch": 8.871934604904633,
+ "grad_norm": 11.121735572814941,
+ "learning_rate": 1.981970679426527e-05,
+ "loss": 1.4331,
+ "step": 3256
+ },
+ {
+ "epoch": 8.874659400544958,
+ "grad_norm": 12.51620864868164,
+ "learning_rate": 1.9819539935163272e-05,
+ "loss": 1.7354,
+ "step": 3257
+ },
+ {
+ "epoch": 8.877384196185286,
+ "grad_norm": 14.289231300354004,
+ "learning_rate": 1.9819372999587015e-05,
+ "loss": 1.5076,
+ "step": 3258
+ },
+ {
+ "epoch": 8.880108991825614,
+ "grad_norm": 9.565315246582031,
+ "learning_rate": 1.9819205987537792e-05,
+ "loss": 1.468,
+ "step": 3259
+ },
+ {
+ "epoch": 8.88283378746594,
+ "grad_norm": 34.520606994628906,
+ "learning_rate": 1.9819038899016913e-05,
+ "loss": 1.3535,
+ "step": 3260
+ },
+ {
+ "epoch": 8.885558583106267,
+ "grad_norm": 8.638131141662598,
+ "learning_rate": 1.9818871734025672e-05,
+ "loss": 1.188,
+ "step": 3261
+ },
+ {
+ "epoch": 8.888283378746594,
+ "grad_norm": 9.826519966125488,
+ "learning_rate": 1.9818704492565378e-05,
+ "loss": 1.5161,
+ "step": 3262
+ },
+ {
+ "epoch": 8.89100817438692,
+ "grad_norm": 10.681777954101562,
+ "learning_rate": 1.9818537174637328e-05,
+ "loss": 1.2725,
+ "step": 3263
+ },
+ {
+ "epoch": 8.893732970027248,
+ "grad_norm": 9.70865535736084,
+ "learning_rate": 1.9818369780242822e-05,
+ "loss": 1.4285,
+ "step": 3264
+ },
+ {
+ "epoch": 8.896457765667575,
+ "grad_norm": 9.900568962097168,
+ "learning_rate": 1.9818202309383173e-05,
+ "loss": 1.3413,
+ "step": 3265
+ },
+ {
+ "epoch": 8.899182561307901,
+ "grad_norm": 11.357996940612793,
+ "learning_rate": 1.9818034762059678e-05,
+ "loss": 1.6782,
+ "step": 3266
+ },
+ {
+ "epoch": 8.901907356948229,
+ "grad_norm": 9.975435256958008,
+ "learning_rate": 1.9817867138273645e-05,
+ "loss": 1.5435,
+ "step": 3267
+ },
+ {
+ "epoch": 8.904632152588556,
+ "grad_norm": 7.961818218231201,
+ "learning_rate": 1.981769943802638e-05,
+ "loss": 1.2671,
+ "step": 3268
+ },
+ {
+ "epoch": 8.907356948228882,
+ "grad_norm": 10.005882263183594,
+ "learning_rate": 1.981753166131919e-05,
+ "loss": 1.2932,
+ "step": 3269
+ },
+ {
+ "epoch": 8.91008174386921,
+ "grad_norm": 10.420265197753906,
+ "learning_rate": 1.9817363808153372e-05,
+ "loss": 1.5381,
+ "step": 3270
+ },
+ {
+ "epoch": 8.912806539509537,
+ "grad_norm": 19.911571502685547,
+ "learning_rate": 1.9817195878530247e-05,
+ "loss": 1.521,
+ "step": 3271
+ },
+ {
+ "epoch": 8.915531335149863,
+ "grad_norm": 10.7108736038208,
+ "learning_rate": 1.9817027872451112e-05,
+ "loss": 1.334,
+ "step": 3272
+ },
+ {
+ "epoch": 8.91825613079019,
+ "grad_norm": 10.443603515625,
+ "learning_rate": 1.9816859789917283e-05,
+ "loss": 1.604,
+ "step": 3273
+ },
+ {
+ "epoch": 8.920980926430518,
+ "grad_norm": 14.452402114868164,
+ "learning_rate": 1.9816691630930067e-05,
+ "loss": 1.3765,
+ "step": 3274
+ },
+ {
+ "epoch": 8.923705722070844,
+ "grad_norm": 14.351840019226074,
+ "learning_rate": 1.981652339549077e-05,
+ "loss": 1.5569,
+ "step": 3275
+ },
+ {
+ "epoch": 8.926430517711172,
+ "grad_norm": 11.948895454406738,
+ "learning_rate": 1.9816355083600704e-05,
+ "loss": 1.2886,
+ "step": 3276
+ },
+ {
+ "epoch": 8.9291553133515,
+ "grad_norm": 10.655186653137207,
+ "learning_rate": 1.9816186695261184e-05,
+ "loss": 1.5349,
+ "step": 3277
+ },
+ {
+ "epoch": 8.931880108991825,
+ "grad_norm": 9.585867881774902,
+ "learning_rate": 1.981601823047352e-05,
+ "loss": 1.322,
+ "step": 3278
+ },
+ {
+ "epoch": 8.934604904632153,
+ "grad_norm": 10.423274040222168,
+ "learning_rate": 1.9815849689239015e-05,
+ "loss": 1.3765,
+ "step": 3279
+ },
+ {
+ "epoch": 8.93732970027248,
+ "grad_norm": 8.449317932128906,
+ "learning_rate": 1.9815681071558992e-05,
+ "loss": 1.3672,
+ "step": 3280
+ },
+ {
+ "epoch": 8.940054495912806,
+ "grad_norm": 9.676054954528809,
+ "learning_rate": 1.9815512377434757e-05,
+ "loss": 1.4561,
+ "step": 3281
+ },
+ {
+ "epoch": 8.942779291553133,
+ "grad_norm": 9.170092582702637,
+ "learning_rate": 1.9815343606867632e-05,
+ "loss": 1.4819,
+ "step": 3282
+ },
+ {
+ "epoch": 8.945504087193461,
+ "grad_norm": 10.363265037536621,
+ "learning_rate": 1.9815174759858927e-05,
+ "loss": 1.418,
+ "step": 3283
+ },
+ {
+ "epoch": 8.948228882833787,
+ "grad_norm": 11.943129539489746,
+ "learning_rate": 1.9815005836409954e-05,
+ "loss": 1.2542,
+ "step": 3284
+ },
+ {
+ "epoch": 8.950953678474114,
+ "grad_norm": 14.964985847473145,
+ "learning_rate": 1.9814836836522035e-05,
+ "loss": 1.5339,
+ "step": 3285
+ },
+ {
+ "epoch": 8.953678474114442,
+ "grad_norm": 7.762907981872559,
+ "learning_rate": 1.981466776019648e-05,
+ "loss": 1.2019,
+ "step": 3286
+ },
+ {
+ "epoch": 8.956403269754768,
+ "grad_norm": 9.729695320129395,
+ "learning_rate": 1.9814498607434607e-05,
+ "loss": 1.2307,
+ "step": 3287
+ },
+ {
+ "epoch": 8.959128065395095,
+ "grad_norm": 8.820679664611816,
+ "learning_rate": 1.9814329378237738e-05,
+ "loss": 1.2688,
+ "step": 3288
+ },
+ {
+ "epoch": 8.961852861035423,
+ "grad_norm": 8.336542129516602,
+ "learning_rate": 1.9814160072607188e-05,
+ "loss": 1.4619,
+ "step": 3289
+ },
+ {
+ "epoch": 8.964577656675749,
+ "grad_norm": 8.730629920959473,
+ "learning_rate": 1.981399069054427e-05,
+ "loss": 1.5325,
+ "step": 3290
+ },
+ {
+ "epoch": 8.967302452316076,
+ "grad_norm": 10.467671394348145,
+ "learning_rate": 1.981382123205031e-05,
+ "loss": 1.4546,
+ "step": 3291
+ },
+ {
+ "epoch": 8.970027247956404,
+ "grad_norm": 9.506669998168945,
+ "learning_rate": 1.981365169712663e-05,
+ "loss": 1.5806,
+ "step": 3292
+ },
+ {
+ "epoch": 8.97275204359673,
+ "grad_norm": 9.008421897888184,
+ "learning_rate": 1.9813482085774548e-05,
+ "loss": 1.5046,
+ "step": 3293
+ },
+ {
+ "epoch": 8.975476839237057,
+ "grad_norm": 11.48160171508789,
+ "learning_rate": 1.9813312397995376e-05,
+ "loss": 1.574,
+ "step": 3294
+ },
+ {
+ "epoch": 8.978201634877385,
+ "grad_norm": 8.973231315612793,
+ "learning_rate": 1.9813142633790448e-05,
+ "loss": 1.3826,
+ "step": 3295
+ },
+ {
+ "epoch": 8.98092643051771,
+ "grad_norm": 10.221563339233398,
+ "learning_rate": 1.9812972793161077e-05,
+ "loss": 1.3994,
+ "step": 3296
+ },
+ {
+ "epoch": 8.983651226158038,
+ "grad_norm": 9.588338851928711,
+ "learning_rate": 1.9812802876108593e-05,
+ "loss": 1.376,
+ "step": 3297
+ },
+ {
+ "epoch": 8.986376021798366,
+ "grad_norm": 8.09337329864502,
+ "learning_rate": 1.9812632882634316e-05,
+ "loss": 1.1482,
+ "step": 3298
+ },
+ {
+ "epoch": 8.989100817438691,
+ "grad_norm": 8.78427505493164,
+ "learning_rate": 1.981246281273957e-05,
+ "loss": 1.4067,
+ "step": 3299
+ },
+ {
+ "epoch": 8.991825613079019,
+ "grad_norm": 11.519981384277344,
+ "learning_rate": 1.981229266642568e-05,
+ "loss": 1.4851,
+ "step": 3300
+ },
+ {
+ "epoch": 8.994550408719347,
+ "grad_norm": 9.364227294921875,
+ "learning_rate": 1.9812122443693967e-05,
+ "loss": 1.2976,
+ "step": 3301
+ },
+ {
+ "epoch": 8.997275204359672,
+ "grad_norm": 9.506269454956055,
+ "learning_rate": 1.9811952144545764e-05,
+ "loss": 1.6685,
+ "step": 3302
+ },
+ {
+ "epoch": 9.0,
+ "grad_norm": 10.663548469543457,
+ "learning_rate": 1.9811781768982392e-05,
+ "loss": 1.5557,
+ "step": 3303
+ },
+ {
+ "epoch": 9.002724795640328,
+ "grad_norm": 7.8914361000061035,
+ "learning_rate": 1.981161131700518e-05,
+ "loss": 1.4429,
+ "step": 3304
+ },
+ {
+ "epoch": 9.005449591280653,
+ "grad_norm": 11.845026969909668,
+ "learning_rate": 1.9811440788615454e-05,
+ "loss": 1.3181,
+ "step": 3305
+ },
+ {
+ "epoch": 9.008174386920981,
+ "grad_norm": 8.106034278869629,
+ "learning_rate": 1.981127018381454e-05,
+ "loss": 1.3188,
+ "step": 3306
+ },
+ {
+ "epoch": 9.010899182561309,
+ "grad_norm": 9.699702262878418,
+ "learning_rate": 1.9811099502603775e-05,
+ "loss": 1.1958,
+ "step": 3307
+ },
+ {
+ "epoch": 9.013623978201634,
+ "grad_norm": 9.693281173706055,
+ "learning_rate": 1.981092874498448e-05,
+ "loss": 1.4805,
+ "step": 3308
+ },
+ {
+ "epoch": 9.016348773841962,
+ "grad_norm": 11.448603630065918,
+ "learning_rate": 1.981075791095799e-05,
+ "loss": 1.355,
+ "step": 3309
+ },
+ {
+ "epoch": 9.01907356948229,
+ "grad_norm": 10.993561744689941,
+ "learning_rate": 1.9810587000525632e-05,
+ "loss": 1.4246,
+ "step": 3310
+ },
+ {
+ "epoch": 9.021798365122615,
+ "grad_norm": 12.729100227355957,
+ "learning_rate": 1.9810416013688737e-05,
+ "loss": 1.3533,
+ "step": 3311
+ },
+ {
+ "epoch": 9.024523160762943,
+ "grad_norm": 8.636086463928223,
+ "learning_rate": 1.9810244950448636e-05,
+ "loss": 1.1777,
+ "step": 3312
+ },
+ {
+ "epoch": 9.02724795640327,
+ "grad_norm": 9.697944641113281,
+ "learning_rate": 1.9810073810806668e-05,
+ "loss": 1.1409,
+ "step": 3313
+ },
+ {
+ "epoch": 9.029972752043596,
+ "grad_norm": 9.793436050415039,
+ "learning_rate": 1.9809902594764157e-05,
+ "loss": 1.4097,
+ "step": 3314
+ },
+ {
+ "epoch": 9.032697547683924,
+ "grad_norm": 9.638480186462402,
+ "learning_rate": 1.9809731302322443e-05,
+ "loss": 1.3594,
+ "step": 3315
+ },
+ {
+ "epoch": 9.035422343324251,
+ "grad_norm": 8.224684715270996,
+ "learning_rate": 1.9809559933482853e-05,
+ "loss": 1.2893,
+ "step": 3316
+ },
+ {
+ "epoch": 9.038147138964577,
+ "grad_norm": 8.498680114746094,
+ "learning_rate": 1.980938848824673e-05,
+ "loss": 1.2251,
+ "step": 3317
+ },
+ {
+ "epoch": 9.040871934604905,
+ "grad_norm": 12.3306303024292,
+ "learning_rate": 1.9809216966615406e-05,
+ "loss": 1.1919,
+ "step": 3318
+ },
+ {
+ "epoch": 9.043596730245232,
+ "grad_norm": 10.12957763671875,
+ "learning_rate": 1.9809045368590215e-05,
+ "loss": 1.1763,
+ "step": 3319
+ },
+ {
+ "epoch": 9.046321525885558,
+ "grad_norm": 9.691681861877441,
+ "learning_rate": 1.980887369417249e-05,
+ "loss": 1.4958,
+ "step": 3320
+ },
+ {
+ "epoch": 9.049046321525886,
+ "grad_norm": 9.450521469116211,
+ "learning_rate": 1.9808701943363577e-05,
+ "loss": 1.3125,
+ "step": 3321
+ },
+ {
+ "epoch": 9.051771117166213,
+ "grad_norm": 10.486001968383789,
+ "learning_rate": 1.980853011616481e-05,
+ "loss": 1.3318,
+ "step": 3322
+ },
+ {
+ "epoch": 9.054495912806539,
+ "grad_norm": 9.702750205993652,
+ "learning_rate": 1.9808358212577524e-05,
+ "loss": 1.2874,
+ "step": 3323
+ },
+ {
+ "epoch": 9.057220708446867,
+ "grad_norm": 10.693781852722168,
+ "learning_rate": 1.980818623260306e-05,
+ "loss": 1.2964,
+ "step": 3324
+ },
+ {
+ "epoch": 9.059945504087194,
+ "grad_norm": 9.388365745544434,
+ "learning_rate": 1.9808014176242754e-05,
+ "loss": 1.4871,
+ "step": 3325
+ },
+ {
+ "epoch": 9.06267029972752,
+ "grad_norm": 22.220670700073242,
+ "learning_rate": 1.9807842043497953e-05,
+ "loss": 1.1562,
+ "step": 3326
+ },
+ {
+ "epoch": 9.065395095367847,
+ "grad_norm": 25.023902893066406,
+ "learning_rate": 1.9807669834369996e-05,
+ "loss": 1.4326,
+ "step": 3327
+ },
+ {
+ "epoch": 9.068119891008175,
+ "grad_norm": 8.872845649719238,
+ "learning_rate": 1.9807497548860218e-05,
+ "loss": 1.4065,
+ "step": 3328
+ },
+ {
+ "epoch": 9.0708446866485,
+ "grad_norm": 7.357226848602295,
+ "learning_rate": 1.9807325186969964e-05,
+ "loss": 1.0891,
+ "step": 3329
+ },
+ {
+ "epoch": 9.073569482288828,
+ "grad_norm": 12.355050086975098,
+ "learning_rate": 1.980715274870058e-05,
+ "loss": 1.2792,
+ "step": 3330
+ },
+ {
+ "epoch": 9.076294277929156,
+ "grad_norm": 9.479902267456055,
+ "learning_rate": 1.9806980234053405e-05,
+ "loss": 1.614,
+ "step": 3331
+ },
+ {
+ "epoch": 9.079019073569482,
+ "grad_norm": 12.747612953186035,
+ "learning_rate": 1.9806807643029786e-05,
+ "loss": 1.4459,
+ "step": 3332
+ },
+ {
+ "epoch": 9.08174386920981,
+ "grad_norm": 13.959284782409668,
+ "learning_rate": 1.9806634975631062e-05,
+ "loss": 1.1519,
+ "step": 3333
+ },
+ {
+ "epoch": 9.084468664850137,
+ "grad_norm": 8.461284637451172,
+ "learning_rate": 1.980646223185858e-05,
+ "loss": 1.4524,
+ "step": 3334
+ },
+ {
+ "epoch": 9.087193460490463,
+ "grad_norm": 7.815034866333008,
+ "learning_rate": 1.9806289411713686e-05,
+ "loss": 1.3975,
+ "step": 3335
+ },
+ {
+ "epoch": 9.08991825613079,
+ "grad_norm": 7.936162948608398,
+ "learning_rate": 1.9806116515197728e-05,
+ "loss": 1.4258,
+ "step": 3336
+ },
+ {
+ "epoch": 9.092643051771118,
+ "grad_norm": 10.635171890258789,
+ "learning_rate": 1.980594354231205e-05,
+ "loss": 1.2351,
+ "step": 3337
+ },
+ {
+ "epoch": 9.095367847411444,
+ "grad_norm": 15.045971870422363,
+ "learning_rate": 1.9805770493057994e-05,
+ "loss": 1.6394,
+ "step": 3338
+ },
+ {
+ "epoch": 9.098092643051771,
+ "grad_norm": 9.381028175354004,
+ "learning_rate": 1.980559736743692e-05,
+ "loss": 1.3196,
+ "step": 3339
+ },
+ {
+ "epoch": 9.100817438692099,
+ "grad_norm": 10.05689525604248,
+ "learning_rate": 1.9805424165450164e-05,
+ "loss": 1.3442,
+ "step": 3340
+ },
+ {
+ "epoch": 9.103542234332425,
+ "grad_norm": 8.947305679321289,
+ "learning_rate": 1.980525088709908e-05,
+ "loss": 1.2844,
+ "step": 3341
+ },
+ {
+ "epoch": 9.106267029972752,
+ "grad_norm": 9.874502182006836,
+ "learning_rate": 1.9805077532385024e-05,
+ "loss": 1.5862,
+ "step": 3342
+ },
+ {
+ "epoch": 9.10899182561308,
+ "grad_norm": 13.851561546325684,
+ "learning_rate": 1.9804904101309333e-05,
+ "loss": 1.3845,
+ "step": 3343
+ },
+ {
+ "epoch": 9.111716621253406,
+ "grad_norm": 8.135567665100098,
+ "learning_rate": 1.980473059387337e-05,
+ "loss": 1.4084,
+ "step": 3344
+ },
+ {
+ "epoch": 9.114441416893733,
+ "grad_norm": 9.141457557678223,
+ "learning_rate": 1.9804557010078475e-05,
+ "loss": 1.4294,
+ "step": 3345
+ },
+ {
+ "epoch": 9.11716621253406,
+ "grad_norm": 9.895256042480469,
+ "learning_rate": 1.9804383349926007e-05,
+ "loss": 1.2952,
+ "step": 3346
+ },
+ {
+ "epoch": 9.119891008174386,
+ "grad_norm": 9.32097339630127,
+ "learning_rate": 1.980420961341732e-05,
+ "loss": 1.4065,
+ "step": 3347
+ },
+ {
+ "epoch": 9.122615803814714,
+ "grad_norm": 9.12514591217041,
+ "learning_rate": 1.9804035800553764e-05,
+ "loss": 1.4473,
+ "step": 3348
+ },
+ {
+ "epoch": 9.125340599455042,
+ "grad_norm": 11.255130767822266,
+ "learning_rate": 1.980386191133669e-05,
+ "loss": 1.4034,
+ "step": 3349
+ },
+ {
+ "epoch": 9.128065395095367,
+ "grad_norm": 9.776803016662598,
+ "learning_rate": 1.9803687945767457e-05,
+ "loss": 1.1127,
+ "step": 3350
+ },
+ {
+ "epoch": 9.130790190735695,
+ "grad_norm": 10.613279342651367,
+ "learning_rate": 1.9803513903847418e-05,
+ "loss": 1.3342,
+ "step": 3351
+ },
+ {
+ "epoch": 9.133514986376023,
+ "grad_norm": 9.415681838989258,
+ "learning_rate": 1.9803339785577926e-05,
+ "loss": 1.271,
+ "step": 3352
+ },
+ {
+ "epoch": 9.136239782016348,
+ "grad_norm": 8.960698127746582,
+ "learning_rate": 1.980316559096034e-05,
+ "loss": 1.4492,
+ "step": 3353
+ },
+ {
+ "epoch": 9.138964577656676,
+ "grad_norm": 9.981202125549316,
+ "learning_rate": 1.9802991319996015e-05,
+ "loss": 1.5801,
+ "step": 3354
+ },
+ {
+ "epoch": 9.141689373297003,
+ "grad_norm": 9.422486305236816,
+ "learning_rate": 1.980281697268631e-05,
+ "loss": 1.2809,
+ "step": 3355
+ },
+ {
+ "epoch": 9.14441416893733,
+ "grad_norm": 8.67933464050293,
+ "learning_rate": 1.9802642549032585e-05,
+ "loss": 1.1875,
+ "step": 3356
+ },
+ {
+ "epoch": 9.147138964577657,
+ "grad_norm": 8.95732593536377,
+ "learning_rate": 1.9802468049036192e-05,
+ "loss": 1.396,
+ "step": 3357
+ },
+ {
+ "epoch": 9.149863760217984,
+ "grad_norm": 14.806777000427246,
+ "learning_rate": 1.9802293472698496e-05,
+ "loss": 1.2542,
+ "step": 3358
+ },
+ {
+ "epoch": 9.15258855585831,
+ "grad_norm": 10.63351821899414,
+ "learning_rate": 1.980211882002085e-05,
+ "loss": 1.5439,
+ "step": 3359
+ },
+ {
+ "epoch": 9.155313351498638,
+ "grad_norm": 11.304052352905273,
+ "learning_rate": 1.980194409100462e-05,
+ "loss": 1.333,
+ "step": 3360
+ },
+ {
+ "epoch": 9.158038147138965,
+ "grad_norm": 8.953567504882812,
+ "learning_rate": 1.9801769285651168e-05,
+ "loss": 1.4475,
+ "step": 3361
+ },
+ {
+ "epoch": 9.160762942779291,
+ "grad_norm": 10.894664764404297,
+ "learning_rate": 1.9801594403961844e-05,
+ "loss": 1.4678,
+ "step": 3362
+ },
+ {
+ "epoch": 9.163487738419619,
+ "grad_norm": 8.70775032043457,
+ "learning_rate": 1.9801419445938027e-05,
+ "loss": 1.2996,
+ "step": 3363
+ },
+ {
+ "epoch": 9.166212534059946,
+ "grad_norm": 8.957754135131836,
+ "learning_rate": 1.9801244411581068e-05,
+ "loss": 1.4502,
+ "step": 3364
+ },
+ {
+ "epoch": 9.168937329700272,
+ "grad_norm": 9.401688575744629,
+ "learning_rate": 1.980106930089233e-05,
+ "loss": 1.3315,
+ "step": 3365
+ },
+ {
+ "epoch": 9.1716621253406,
+ "grad_norm": 8.487594604492188,
+ "learning_rate": 1.980089411387318e-05,
+ "loss": 1.4373,
+ "step": 3366
+ },
+ {
+ "epoch": 9.174386920980927,
+ "grad_norm": 9.587615013122559,
+ "learning_rate": 1.9800718850524987e-05,
+ "loss": 1.4124,
+ "step": 3367
+ },
+ {
+ "epoch": 9.177111716621253,
+ "grad_norm": 9.357094764709473,
+ "learning_rate": 1.9800543510849107e-05,
+ "loss": 1.4082,
+ "step": 3368
+ },
+ {
+ "epoch": 9.17983651226158,
+ "grad_norm": 8.491287231445312,
+ "learning_rate": 1.980036809484691e-05,
+ "loss": 1.2317,
+ "step": 3369
+ },
+ {
+ "epoch": 9.182561307901908,
+ "grad_norm": 10.4268159866333,
+ "learning_rate": 1.9800192602519762e-05,
+ "loss": 1.5454,
+ "step": 3370
+ },
+ {
+ "epoch": 9.185286103542234,
+ "grad_norm": 10.99485969543457,
+ "learning_rate": 1.9800017033869033e-05,
+ "loss": 1.3677,
+ "step": 3371
+ },
+ {
+ "epoch": 9.188010899182562,
+ "grad_norm": 7.159212589263916,
+ "learning_rate": 1.979984138889608e-05,
+ "loss": 1.27,
+ "step": 3372
+ },
+ {
+ "epoch": 9.190735694822889,
+ "grad_norm": 10.803590774536133,
+ "learning_rate": 1.9799665667602282e-05,
+ "loss": 1.561,
+ "step": 3373
+ },
+ {
+ "epoch": 9.193460490463215,
+ "grad_norm": 9.76352310180664,
+ "learning_rate": 1.9799489869989003e-05,
+ "loss": 1.3806,
+ "step": 3374
+ },
+ {
+ "epoch": 9.196185286103542,
+ "grad_norm": 15.681282997131348,
+ "learning_rate": 1.979931399605761e-05,
+ "loss": 1.3535,
+ "step": 3375
+ },
+ {
+ "epoch": 9.19891008174387,
+ "grad_norm": 8.559199333190918,
+ "learning_rate": 1.9799138045809482e-05,
+ "loss": 1.4304,
+ "step": 3376
+ },
+ {
+ "epoch": 9.201634877384196,
+ "grad_norm": 8.302059173583984,
+ "learning_rate": 1.979896201924597e-05,
+ "loss": 1.3557,
+ "step": 3377
+ },
+ {
+ "epoch": 9.204359673024523,
+ "grad_norm": 8.677852630615234,
+ "learning_rate": 1.979878591636847e-05,
+ "loss": 1.5125,
+ "step": 3378
+ },
+ {
+ "epoch": 9.207084468664851,
+ "grad_norm": 10.220707893371582,
+ "learning_rate": 1.9798609737178332e-05,
+ "loss": 1.3669,
+ "step": 3379
+ },
+ {
+ "epoch": 9.209809264305177,
+ "grad_norm": 10.292823791503906,
+ "learning_rate": 1.979843348167694e-05,
+ "loss": 1.5803,
+ "step": 3380
+ },
+ {
+ "epoch": 9.212534059945504,
+ "grad_norm": 7.553493499755859,
+ "learning_rate": 1.9798257149865664e-05,
+ "loss": 1.3113,
+ "step": 3381
+ },
+ {
+ "epoch": 9.215258855585832,
+ "grad_norm": 9.349052429199219,
+ "learning_rate": 1.9798080741745876e-05,
+ "loss": 1.3796,
+ "step": 3382
+ },
+ {
+ "epoch": 9.217983651226158,
+ "grad_norm": 11.313785552978516,
+ "learning_rate": 1.979790425731895e-05,
+ "loss": 1.5281,
+ "step": 3383
+ },
+ {
+ "epoch": 9.220708446866485,
+ "grad_norm": 8.335127830505371,
+ "learning_rate": 1.979772769658626e-05,
+ "loss": 1.5474,
+ "step": 3384
+ },
+ {
+ "epoch": 9.223433242506813,
+ "grad_norm": 10.918291091918945,
+ "learning_rate": 1.9797551059549182e-05,
+ "loss": 1.2739,
+ "step": 3385
+ },
+ {
+ "epoch": 9.226158038147139,
+ "grad_norm": 11.712550163269043,
+ "learning_rate": 1.979737434620909e-05,
+ "loss": 1.303,
+ "step": 3386
+ },
+ {
+ "epoch": 9.228882833787466,
+ "grad_norm": 9.832308769226074,
+ "learning_rate": 1.9797197556567368e-05,
+ "loss": 1.3599,
+ "step": 3387
+ },
+ {
+ "epoch": 9.231607629427794,
+ "grad_norm": 14.865618705749512,
+ "learning_rate": 1.9797020690625385e-05,
+ "loss": 1.3406,
+ "step": 3388
+ },
+ {
+ "epoch": 9.23433242506812,
+ "grad_norm": 8.478940963745117,
+ "learning_rate": 1.9796843748384516e-05,
+ "loss": 1.4141,
+ "step": 3389
+ },
+ {
+ "epoch": 9.237057220708447,
+ "grad_norm": 26.075153350830078,
+ "learning_rate": 1.979666672984615e-05,
+ "loss": 1.457,
+ "step": 3390
+ },
+ {
+ "epoch": 9.239782016348773,
+ "grad_norm": 10.764287948608398,
+ "learning_rate": 1.979648963501165e-05,
+ "loss": 1.4678,
+ "step": 3391
+ },
+ {
+ "epoch": 9.2425068119891,
+ "grad_norm": 9.13726806640625,
+ "learning_rate": 1.9796312463882413e-05,
+ "loss": 1.2595,
+ "step": 3392
+ },
+ {
+ "epoch": 9.245231607629428,
+ "grad_norm": 11.239102363586426,
+ "learning_rate": 1.9796135216459806e-05,
+ "loss": 1.3137,
+ "step": 3393
+ },
+ {
+ "epoch": 9.247956403269754,
+ "grad_norm": 10.32160758972168,
+ "learning_rate": 1.9795957892745212e-05,
+ "loss": 1.2859,
+ "step": 3394
+ },
+ {
+ "epoch": 9.250681198910081,
+ "grad_norm": 8.509366035461426,
+ "learning_rate": 1.9795780492740014e-05,
+ "loss": 1.4409,
+ "step": 3395
+ },
+ {
+ "epoch": 9.253405994550409,
+ "grad_norm": 8.588579177856445,
+ "learning_rate": 1.979560301644559e-05,
+ "loss": 1.3656,
+ "step": 3396
+ },
+ {
+ "epoch": 9.256130790190735,
+ "grad_norm": 7.5111308097839355,
+ "learning_rate": 1.9795425463863328e-05,
+ "loss": 1.323,
+ "step": 3397
+ },
+ {
+ "epoch": 9.258855585831062,
+ "grad_norm": 11.245231628417969,
+ "learning_rate": 1.979524783499461e-05,
+ "loss": 1.5593,
+ "step": 3398
+ },
+ {
+ "epoch": 9.26158038147139,
+ "grad_norm": 11.089567184448242,
+ "learning_rate": 1.9795070129840814e-05,
+ "loss": 1.2607,
+ "step": 3399
+ },
+ {
+ "epoch": 9.264305177111716,
+ "grad_norm": 9.891328811645508,
+ "learning_rate": 1.9794892348403327e-05,
+ "loss": 1.2742,
+ "step": 3400
+ },
+ {
+ "epoch": 9.267029972752043,
+ "grad_norm": 9.167067527770996,
+ "learning_rate": 1.9794714490683534e-05,
+ "loss": 1.2944,
+ "step": 3401
+ },
+ {
+ "epoch": 9.269754768392371,
+ "grad_norm": 8.210538864135742,
+ "learning_rate": 1.979453655668282e-05,
+ "loss": 1.0919,
+ "step": 3402
+ },
+ {
+ "epoch": 9.272479564032697,
+ "grad_norm": 10.045794486999512,
+ "learning_rate": 1.979435854640257e-05,
+ "loss": 1.2485,
+ "step": 3403
+ },
+ {
+ "epoch": 9.275204359673024,
+ "grad_norm": 8.798501968383789,
+ "learning_rate": 1.979418045984417e-05,
+ "loss": 1.3103,
+ "step": 3404
+ },
+ {
+ "epoch": 9.277929155313352,
+ "grad_norm": 8.913511276245117,
+ "learning_rate": 1.9794002297009012e-05,
+ "loss": 1.4448,
+ "step": 3405
+ },
+ {
+ "epoch": 9.280653950953678,
+ "grad_norm": 10.16838264465332,
+ "learning_rate": 1.979382405789848e-05,
+ "loss": 1.3906,
+ "step": 3406
+ },
+ {
+ "epoch": 9.283378746594005,
+ "grad_norm": 7.70815896987915,
+ "learning_rate": 1.9793645742513953e-05,
+ "loss": 1.3523,
+ "step": 3407
+ },
+ {
+ "epoch": 9.286103542234333,
+ "grad_norm": 8.3804931640625,
+ "learning_rate": 1.9793467350856838e-05,
+ "loss": 1.3953,
+ "step": 3408
+ },
+ {
+ "epoch": 9.288828337874659,
+ "grad_norm": 10.134687423706055,
+ "learning_rate": 1.979328888292851e-05,
+ "loss": 1.5552,
+ "step": 3409
+ },
+ {
+ "epoch": 9.291553133514986,
+ "grad_norm": 25.563600540161133,
+ "learning_rate": 1.9793110338730362e-05,
+ "loss": 1.2976,
+ "step": 3410
+ },
+ {
+ "epoch": 9.294277929155314,
+ "grad_norm": 7.810992240905762,
+ "learning_rate": 1.9792931718263786e-05,
+ "loss": 1.2024,
+ "step": 3411
+ },
+ {
+ "epoch": 9.29700272479564,
+ "grad_norm": 8.703335762023926,
+ "learning_rate": 1.9792753021530174e-05,
+ "loss": 1.2744,
+ "step": 3412
+ },
+ {
+ "epoch": 9.299727520435967,
+ "grad_norm": 13.916765213012695,
+ "learning_rate": 1.9792574248530915e-05,
+ "loss": 1.5369,
+ "step": 3413
+ },
+ {
+ "epoch": 9.302452316076295,
+ "grad_norm": 14.48161792755127,
+ "learning_rate": 1.9792395399267404e-05,
+ "loss": 1.1318,
+ "step": 3414
+ },
+ {
+ "epoch": 9.30517711171662,
+ "grad_norm": 8.741053581237793,
+ "learning_rate": 1.9792216473741035e-05,
+ "loss": 1.321,
+ "step": 3415
+ },
+ {
+ "epoch": 9.307901907356948,
+ "grad_norm": 9.961328506469727,
+ "learning_rate": 1.9792037471953196e-05,
+ "loss": 1.6104,
+ "step": 3416
+ },
+ {
+ "epoch": 9.310626702997276,
+ "grad_norm": 9.477543830871582,
+ "learning_rate": 1.9791858393905287e-05,
+ "loss": 1.6274,
+ "step": 3417
+ },
+ {
+ "epoch": 9.313351498637601,
+ "grad_norm": 9.631728172302246,
+ "learning_rate": 1.97916792395987e-05,
+ "loss": 1.4702,
+ "step": 3418
+ },
+ {
+ "epoch": 9.316076294277929,
+ "grad_norm": 13.435711860656738,
+ "learning_rate": 1.979150000903483e-05,
+ "loss": 1.4302,
+ "step": 3419
+ },
+ {
+ "epoch": 9.318801089918257,
+ "grad_norm": 16.355337142944336,
+ "learning_rate": 1.979132070221507e-05,
+ "loss": 1.1826,
+ "step": 3420
+ },
+ {
+ "epoch": 9.321525885558582,
+ "grad_norm": 8.597811698913574,
+ "learning_rate": 1.979114131914082e-05,
+ "loss": 1.4956,
+ "step": 3421
+ },
+ {
+ "epoch": 9.32425068119891,
+ "grad_norm": 36.2840690612793,
+ "learning_rate": 1.979096185981348e-05,
+ "loss": 1.3014,
+ "step": 3422
+ },
+ {
+ "epoch": 9.326975476839237,
+ "grad_norm": 7.845273017883301,
+ "learning_rate": 1.9790782324234442e-05,
+ "loss": 1.2791,
+ "step": 3423
+ },
+ {
+ "epoch": 9.329700272479563,
+ "grad_norm": 9.422127723693848,
+ "learning_rate": 1.9790602712405106e-05,
+ "loss": 1.2175,
+ "step": 3424
+ },
+ {
+ "epoch": 9.33242506811989,
+ "grad_norm": 12.685276985168457,
+ "learning_rate": 1.9790423024326873e-05,
+ "loss": 1.2817,
+ "step": 3425
+ },
+ {
+ "epoch": 9.335149863760218,
+ "grad_norm": 8.371520042419434,
+ "learning_rate": 1.979024326000114e-05,
+ "loss": 1.3311,
+ "step": 3426
+ },
+ {
+ "epoch": 9.337874659400544,
+ "grad_norm": 15.884763717651367,
+ "learning_rate": 1.9790063419429307e-05,
+ "loss": 1.3364,
+ "step": 3427
+ },
+ {
+ "epoch": 9.340599455040872,
+ "grad_norm": 9.083556175231934,
+ "learning_rate": 1.9789883502612778e-05,
+ "loss": 1.2952,
+ "step": 3428
+ },
+ {
+ "epoch": 9.3433242506812,
+ "grad_norm": 17.44978141784668,
+ "learning_rate": 1.9789703509552947e-05,
+ "loss": 1.4075,
+ "step": 3429
+ },
+ {
+ "epoch": 9.346049046321525,
+ "grad_norm": 10.517081260681152,
+ "learning_rate": 1.9789523440251223e-05,
+ "loss": 1.449,
+ "step": 3430
+ },
+ {
+ "epoch": 9.348773841961853,
+ "grad_norm": 11.888326644897461,
+ "learning_rate": 1.9789343294709e-05,
+ "loss": 1.2737,
+ "step": 3431
+ },
+ {
+ "epoch": 9.35149863760218,
+ "grad_norm": 9.796870231628418,
+ "learning_rate": 1.9789163072927696e-05,
+ "loss": 1.7625,
+ "step": 3432
+ },
+ {
+ "epoch": 9.354223433242506,
+ "grad_norm": 9.31047248840332,
+ "learning_rate": 1.9788982774908695e-05,
+ "loss": 1.333,
+ "step": 3433
+ },
+ {
+ "epoch": 9.356948228882834,
+ "grad_norm": 10.207380294799805,
+ "learning_rate": 1.9788802400653416e-05,
+ "loss": 1.3022,
+ "step": 3434
+ },
+ {
+ "epoch": 9.359673024523161,
+ "grad_norm": 10.310562133789062,
+ "learning_rate": 1.9788621950163264e-05,
+ "loss": 1.386,
+ "step": 3435
+ },
+ {
+ "epoch": 9.362397820163487,
+ "grad_norm": 10.685137748718262,
+ "learning_rate": 1.978844142343963e-05,
+ "loss": 1.4824,
+ "step": 3436
+ },
+ {
+ "epoch": 9.365122615803815,
+ "grad_norm": 9.386162757873535,
+ "learning_rate": 1.9788260820483935e-05,
+ "loss": 1.2722,
+ "step": 3437
+ },
+ {
+ "epoch": 9.367847411444142,
+ "grad_norm": 11.15714168548584,
+ "learning_rate": 1.9788080141297577e-05,
+ "loss": 1.1504,
+ "step": 3438
+ },
+ {
+ "epoch": 9.370572207084468,
+ "grad_norm": 14.698813438415527,
+ "learning_rate": 1.978789938588197e-05,
+ "loss": 1.6157,
+ "step": 3439
+ },
+ {
+ "epoch": 9.373297002724795,
+ "grad_norm": 12.233861923217773,
+ "learning_rate": 1.9787718554238516e-05,
+ "loss": 1.4355,
+ "step": 3440
+ },
+ {
+ "epoch": 9.376021798365123,
+ "grad_norm": 12.789555549621582,
+ "learning_rate": 1.978753764636862e-05,
+ "loss": 1.3352,
+ "step": 3441
+ },
+ {
+ "epoch": 9.378746594005449,
+ "grad_norm": 11.998162269592285,
+ "learning_rate": 1.9787356662273702e-05,
+ "loss": 1.2285,
+ "step": 3442
+ },
+ {
+ "epoch": 9.381471389645776,
+ "grad_norm": 10.554962158203125,
+ "learning_rate": 1.9787175601955163e-05,
+ "loss": 1.3799,
+ "step": 3443
+ },
+ {
+ "epoch": 9.384196185286104,
+ "grad_norm": 9.63073444366455,
+ "learning_rate": 1.9786994465414415e-05,
+ "loss": 1.5298,
+ "step": 3444
+ },
+ {
+ "epoch": 9.38692098092643,
+ "grad_norm": 7.870802879333496,
+ "learning_rate": 1.9786813252652866e-05,
+ "loss": 1.1112,
+ "step": 3445
+ },
+ {
+ "epoch": 9.389645776566757,
+ "grad_norm": 10.364745140075684,
+ "learning_rate": 1.9786631963671935e-05,
+ "loss": 1.5083,
+ "step": 3446
+ },
+ {
+ "epoch": 9.392370572207085,
+ "grad_norm": 10.149497032165527,
+ "learning_rate": 1.978645059847303e-05,
+ "loss": 1.0826,
+ "step": 3447
+ },
+ {
+ "epoch": 9.39509536784741,
+ "grad_norm": 9.680525779724121,
+ "learning_rate": 1.978626915705756e-05,
+ "loss": 1.302,
+ "step": 3448
+ },
+ {
+ "epoch": 9.397820163487738,
+ "grad_norm": 11.579989433288574,
+ "learning_rate": 1.9786087639426942e-05,
+ "loss": 1.6477,
+ "step": 3449
+ },
+ {
+ "epoch": 9.400544959128066,
+ "grad_norm": 13.586649894714355,
+ "learning_rate": 1.978590604558259e-05,
+ "loss": 1.4324,
+ "step": 3450
+ },
+ {
+ "epoch": 9.403269754768392,
+ "grad_norm": 10.524829864501953,
+ "learning_rate": 1.9785724375525913e-05,
+ "loss": 1.3755,
+ "step": 3451
+ },
+ {
+ "epoch": 9.40599455040872,
+ "grad_norm": 10.216323852539062,
+ "learning_rate": 1.978554262925833e-05,
+ "loss": 1.333,
+ "step": 3452
+ },
+ {
+ "epoch": 9.408719346049047,
+ "grad_norm": 20.44986343383789,
+ "learning_rate": 1.9785360806781256e-05,
+ "loss": 1.533,
+ "step": 3453
+ },
+ {
+ "epoch": 9.411444141689373,
+ "grad_norm": 10.247272491455078,
+ "learning_rate": 1.978517890809611e-05,
+ "loss": 1.4092,
+ "step": 3454
+ },
+ {
+ "epoch": 9.4141689373297,
+ "grad_norm": 10.937572479248047,
+ "learning_rate": 1.9784996933204303e-05,
+ "loss": 1.6558,
+ "step": 3455
+ },
+ {
+ "epoch": 9.416893732970028,
+ "grad_norm": 8.877446174621582,
+ "learning_rate": 1.9784814882107256e-05,
+ "loss": 1.3645,
+ "step": 3456
+ },
+ {
+ "epoch": 9.419618528610354,
+ "grad_norm": 9.013394355773926,
+ "learning_rate": 1.9784632754806385e-05,
+ "loss": 1.3066,
+ "step": 3457
+ },
+ {
+ "epoch": 9.422343324250681,
+ "grad_norm": 10.657892227172852,
+ "learning_rate": 1.978445055130311e-05,
+ "loss": 1.3774,
+ "step": 3458
+ },
+ {
+ "epoch": 9.425068119891009,
+ "grad_norm": 13.270530700683594,
+ "learning_rate": 1.9784268271598847e-05,
+ "loss": 1.1091,
+ "step": 3459
+ },
+ {
+ "epoch": 9.427792915531334,
+ "grad_norm": 10.21103572845459,
+ "learning_rate": 1.978408591569502e-05,
+ "loss": 1.4182,
+ "step": 3460
+ },
+ {
+ "epoch": 9.430517711171662,
+ "grad_norm": 10.06057071685791,
+ "learning_rate": 1.9783903483593045e-05,
+ "loss": 1.2573,
+ "step": 3461
+ },
+ {
+ "epoch": 9.43324250681199,
+ "grad_norm": 9.013784408569336,
+ "learning_rate": 1.9783720975294345e-05,
+ "loss": 1.3347,
+ "step": 3462
+ },
+ {
+ "epoch": 9.435967302452315,
+ "grad_norm": 9.590899467468262,
+ "learning_rate": 1.978353839080034e-05,
+ "loss": 1.3755,
+ "step": 3463
+ },
+ {
+ "epoch": 9.438692098092643,
+ "grad_norm": 10.984482765197754,
+ "learning_rate": 1.9783355730112454e-05,
+ "loss": 1.4729,
+ "step": 3464
+ },
+ {
+ "epoch": 9.44141689373297,
+ "grad_norm": 12.965763092041016,
+ "learning_rate": 1.978317299323211e-05,
+ "loss": 1.4124,
+ "step": 3465
+ },
+ {
+ "epoch": 9.444141689373296,
+ "grad_norm": 10.23265552520752,
+ "learning_rate": 1.9782990180160726e-05,
+ "loss": 1.425,
+ "step": 3466
+ },
+ {
+ "epoch": 9.446866485013624,
+ "grad_norm": 8.932223320007324,
+ "learning_rate": 1.9782807290899732e-05,
+ "loss": 1.2876,
+ "step": 3467
+ },
+ {
+ "epoch": 9.449591280653951,
+ "grad_norm": 9.65361213684082,
+ "learning_rate": 1.978262432545055e-05,
+ "loss": 1.2568,
+ "step": 3468
+ },
+ {
+ "epoch": 9.452316076294277,
+ "grad_norm": 13.760838508605957,
+ "learning_rate": 1.9782441283814606e-05,
+ "loss": 1.4006,
+ "step": 3469
+ },
+ {
+ "epoch": 9.455040871934605,
+ "grad_norm": 10.448901176452637,
+ "learning_rate": 1.978225816599332e-05,
+ "loss": 1.4226,
+ "step": 3470
+ },
+ {
+ "epoch": 9.457765667574932,
+ "grad_norm": 10.120850563049316,
+ "learning_rate": 1.9782074971988122e-05,
+ "loss": 1.2434,
+ "step": 3471
+ },
+ {
+ "epoch": 9.460490463215258,
+ "grad_norm": 11.313949584960938,
+ "learning_rate": 1.978189170180044e-05,
+ "loss": 1.3118,
+ "step": 3472
+ },
+ {
+ "epoch": 9.463215258855586,
+ "grad_norm": 11.893877029418945,
+ "learning_rate": 1.9781708355431704e-05,
+ "loss": 1.3831,
+ "step": 3473
+ },
+ {
+ "epoch": 9.465940054495913,
+ "grad_norm": 11.411081314086914,
+ "learning_rate": 1.9781524932883334e-05,
+ "loss": 1.2185,
+ "step": 3474
+ },
+ {
+ "epoch": 9.46866485013624,
+ "grad_norm": 10.715963363647461,
+ "learning_rate": 1.978134143415676e-05,
+ "loss": 1.238,
+ "step": 3475
+ },
+ {
+ "epoch": 9.471389645776567,
+ "grad_norm": 8.280133247375488,
+ "learning_rate": 1.9781157859253422e-05,
+ "loss": 1.1952,
+ "step": 3476
+ },
+ {
+ "epoch": 9.474114441416894,
+ "grad_norm": 12.157916069030762,
+ "learning_rate": 1.9780974208174737e-05,
+ "loss": 1.3921,
+ "step": 3477
+ },
+ {
+ "epoch": 9.47683923705722,
+ "grad_norm": 11.583842277526855,
+ "learning_rate": 1.978079048092214e-05,
+ "loss": 1.3665,
+ "step": 3478
+ },
+ {
+ "epoch": 9.479564032697548,
+ "grad_norm": 9.636781692504883,
+ "learning_rate": 1.978060667749706e-05,
+ "loss": 1.3503,
+ "step": 3479
+ },
+ {
+ "epoch": 9.482288828337875,
+ "grad_norm": 18.986690521240234,
+ "learning_rate": 1.9780422797900935e-05,
+ "loss": 1.3213,
+ "step": 3480
+ },
+ {
+ "epoch": 9.485013623978201,
+ "grad_norm": 7.71966552734375,
+ "learning_rate": 1.9780238842135184e-05,
+ "loss": 1.2432,
+ "step": 3481
+ },
+ {
+ "epoch": 9.487738419618529,
+ "grad_norm": 16.58133888244629,
+ "learning_rate": 1.9780054810201252e-05,
+ "loss": 1.5393,
+ "step": 3482
+ },
+ {
+ "epoch": 9.490463215258856,
+ "grad_norm": 9.143290519714355,
+ "learning_rate": 1.9779870702100566e-05,
+ "loss": 1.3428,
+ "step": 3483
+ },
+ {
+ "epoch": 9.493188010899182,
+ "grad_norm": 11.136713027954102,
+ "learning_rate": 1.9779686517834566e-05,
+ "loss": 1.2627,
+ "step": 3484
+ },
+ {
+ "epoch": 9.49591280653951,
+ "grad_norm": 8.77470874786377,
+ "learning_rate": 1.977950225740468e-05,
+ "loss": 1.1431,
+ "step": 3485
+ },
+ {
+ "epoch": 9.498637602179837,
+ "grad_norm": 8.194987297058105,
+ "learning_rate": 1.9779317920812345e-05,
+ "loss": 1.3933,
+ "step": 3486
+ },
+ {
+ "epoch": 9.501362397820163,
+ "grad_norm": 7.847334861755371,
+ "learning_rate": 1.9779133508058997e-05,
+ "loss": 1.3062,
+ "step": 3487
+ },
+ {
+ "epoch": 9.50408719346049,
+ "grad_norm": 9.563523292541504,
+ "learning_rate": 1.977894901914607e-05,
+ "loss": 1.2954,
+ "step": 3488
+ },
+ {
+ "epoch": 9.506811989100818,
+ "grad_norm": 11.261819839477539,
+ "learning_rate": 1.9778764454075006e-05,
+ "loss": 1.6628,
+ "step": 3489
+ },
+ {
+ "epoch": 9.509536784741144,
+ "grad_norm": 8.540122985839844,
+ "learning_rate": 1.9778579812847236e-05,
+ "loss": 1.4062,
+ "step": 3490
+ },
+ {
+ "epoch": 9.512261580381471,
+ "grad_norm": 8.151784896850586,
+ "learning_rate": 1.9778395095464204e-05,
+ "loss": 1.2568,
+ "step": 3491
+ },
+ {
+ "epoch": 9.514986376021799,
+ "grad_norm": 15.209368705749512,
+ "learning_rate": 1.9778210301927344e-05,
+ "loss": 1.3538,
+ "step": 3492
+ },
+ {
+ "epoch": 9.517711171662125,
+ "grad_norm": 10.50976848602295,
+ "learning_rate": 1.97780254322381e-05,
+ "loss": 1.261,
+ "step": 3493
+ },
+ {
+ "epoch": 9.520435967302452,
+ "grad_norm": 9.538342475891113,
+ "learning_rate": 1.9777840486397904e-05,
+ "loss": 1.3208,
+ "step": 3494
+ },
+ {
+ "epoch": 9.52316076294278,
+ "grad_norm": 10.738985061645508,
+ "learning_rate": 1.9777655464408204e-05,
+ "loss": 1.4824,
+ "step": 3495
+ },
+ {
+ "epoch": 9.525885558583106,
+ "grad_norm": 10.215317726135254,
+ "learning_rate": 1.9777470366270436e-05,
+ "loss": 1.0896,
+ "step": 3496
+ },
+ {
+ "epoch": 9.528610354223433,
+ "grad_norm": 11.81888198852539,
+ "learning_rate": 1.9777285191986045e-05,
+ "loss": 1.5889,
+ "step": 3497
+ },
+ {
+ "epoch": 9.53133514986376,
+ "grad_norm": 9.270798683166504,
+ "learning_rate": 1.977709994155647e-05,
+ "loss": 1.2747,
+ "step": 3498
+ },
+ {
+ "epoch": 9.534059945504087,
+ "grad_norm": 9.496274948120117,
+ "learning_rate": 1.9776914614983157e-05,
+ "loss": 1.4822,
+ "step": 3499
+ },
+ {
+ "epoch": 9.536784741144414,
+ "grad_norm": 11.32534122467041,
+ "learning_rate": 1.9776729212267547e-05,
+ "loss": 1.4426,
+ "step": 3500
+ },
+ {
+ "epoch": 9.539509536784742,
+ "grad_norm": 11.459961891174316,
+ "learning_rate": 1.9776543733411084e-05,
+ "loss": 1.5642,
+ "step": 3501
+ },
+ {
+ "epoch": 9.542234332425068,
+ "grad_norm": 9.027872085571289,
+ "learning_rate": 1.9776358178415213e-05,
+ "loss": 1.459,
+ "step": 3502
+ },
+ {
+ "epoch": 9.544959128065395,
+ "grad_norm": 11.877817153930664,
+ "learning_rate": 1.977617254728138e-05,
+ "loss": 1.2825,
+ "step": 3503
+ },
+ {
+ "epoch": 9.547683923705723,
+ "grad_norm": 10.362582206726074,
+ "learning_rate": 1.977598684001103e-05,
+ "loss": 1.2644,
+ "step": 3504
+ },
+ {
+ "epoch": 9.550408719346049,
+ "grad_norm": 9.197845458984375,
+ "learning_rate": 1.977580105660561e-05,
+ "loss": 1.333,
+ "step": 3505
+ },
+ {
+ "epoch": 9.553133514986376,
+ "grad_norm": 11.093831062316895,
+ "learning_rate": 1.977561519706656e-05,
+ "loss": 1.2373,
+ "step": 3506
+ },
+ {
+ "epoch": 9.555858310626704,
+ "grad_norm": 9.646479606628418,
+ "learning_rate": 1.9775429261395343e-05,
+ "loss": 1.396,
+ "step": 3507
+ },
+ {
+ "epoch": 9.55858310626703,
+ "grad_norm": 9.306057929992676,
+ "learning_rate": 1.977524324959339e-05,
+ "loss": 1.1592,
+ "step": 3508
+ },
+ {
+ "epoch": 9.561307901907357,
+ "grad_norm": 8.801589012145996,
+ "learning_rate": 1.9775057161662163e-05,
+ "loss": 1.437,
+ "step": 3509
+ },
+ {
+ "epoch": 9.564032697547685,
+ "grad_norm": 10.09241771697998,
+ "learning_rate": 1.97748709976031e-05,
+ "loss": 1.5378,
+ "step": 3510
+ },
+ {
+ "epoch": 9.56675749318801,
+ "grad_norm": 9.766700744628906,
+ "learning_rate": 1.977468475741766e-05,
+ "loss": 1.4834,
+ "step": 3511
+ },
+ {
+ "epoch": 9.569482288828338,
+ "grad_norm": 9.25973892211914,
+ "learning_rate": 1.9774498441107288e-05,
+ "loss": 1.5376,
+ "step": 3512
+ },
+ {
+ "epoch": 9.572207084468666,
+ "grad_norm": 10.928956985473633,
+ "learning_rate": 1.9774312048673438e-05,
+ "loss": 1.1404,
+ "step": 3513
+ },
+ {
+ "epoch": 9.574931880108991,
+ "grad_norm": 8.28603458404541,
+ "learning_rate": 1.9774125580117557e-05,
+ "loss": 1.3813,
+ "step": 3514
+ },
+ {
+ "epoch": 9.577656675749319,
+ "grad_norm": 10.744699478149414,
+ "learning_rate": 1.9773939035441106e-05,
+ "loss": 1.3232,
+ "step": 3515
+ },
+ {
+ "epoch": 9.580381471389646,
+ "grad_norm": 10.062701225280762,
+ "learning_rate": 1.9773752414645527e-05,
+ "loss": 1.3611,
+ "step": 3516
+ },
+ {
+ "epoch": 9.583106267029972,
+ "grad_norm": 8.391669273376465,
+ "learning_rate": 1.977356571773228e-05,
+ "loss": 1.4429,
+ "step": 3517
+ },
+ {
+ "epoch": 9.5858310626703,
+ "grad_norm": 10.7404203414917,
+ "learning_rate": 1.9773378944702818e-05,
+ "loss": 1.2729,
+ "step": 3518
+ },
+ {
+ "epoch": 9.588555858310627,
+ "grad_norm": 9.84868335723877,
+ "learning_rate": 1.97731920955586e-05,
+ "loss": 1.2915,
+ "step": 3519
+ },
+ {
+ "epoch": 9.591280653950953,
+ "grad_norm": 9.618789672851562,
+ "learning_rate": 1.9773005170301072e-05,
+ "loss": 1.3093,
+ "step": 3520
+ },
+ {
+ "epoch": 9.59400544959128,
+ "grad_norm": 8.259662628173828,
+ "learning_rate": 1.9772818168931693e-05,
+ "loss": 1.3381,
+ "step": 3521
+ },
+ {
+ "epoch": 9.596730245231608,
+ "grad_norm": 10.0656156539917,
+ "learning_rate": 1.9772631091451924e-05,
+ "loss": 1.3623,
+ "step": 3522
+ },
+ {
+ "epoch": 9.599455040871934,
+ "grad_norm": 7.326105117797852,
+ "learning_rate": 1.9772443937863216e-05,
+ "loss": 1.3213,
+ "step": 3523
+ },
+ {
+ "epoch": 9.602179836512262,
+ "grad_norm": 11.508100509643555,
+ "learning_rate": 1.977225670816703e-05,
+ "loss": 1.4204,
+ "step": 3524
+ },
+ {
+ "epoch": 9.60490463215259,
+ "grad_norm": 14.950603485107422,
+ "learning_rate": 1.9772069402364823e-05,
+ "loss": 1.2897,
+ "step": 3525
+ },
+ {
+ "epoch": 9.607629427792915,
+ "grad_norm": 11.285598754882812,
+ "learning_rate": 1.9771882020458055e-05,
+ "loss": 1.3894,
+ "step": 3526
+ },
+ {
+ "epoch": 9.610354223433243,
+ "grad_norm": 12.085847854614258,
+ "learning_rate": 1.9771694562448186e-05,
+ "loss": 1.6387,
+ "step": 3527
+ },
+ {
+ "epoch": 9.61307901907357,
+ "grad_norm": 9.760807037353516,
+ "learning_rate": 1.9771507028336672e-05,
+ "loss": 1.1934,
+ "step": 3528
+ },
+ {
+ "epoch": 9.615803814713896,
+ "grad_norm": 9.40585994720459,
+ "learning_rate": 1.9771319418124974e-05,
+ "loss": 1.2397,
+ "step": 3529
+ },
+ {
+ "epoch": 9.618528610354224,
+ "grad_norm": 12.485505104064941,
+ "learning_rate": 1.9771131731814558e-05,
+ "loss": 1.3064,
+ "step": 3530
+ },
+ {
+ "epoch": 9.621253405994551,
+ "grad_norm": 7.9116740226745605,
+ "learning_rate": 1.9770943969406882e-05,
+ "loss": 1.3254,
+ "step": 3531
+ },
+ {
+ "epoch": 9.623978201634877,
+ "grad_norm": 8.666459083557129,
+ "learning_rate": 1.977075613090341e-05,
+ "loss": 1.4194,
+ "step": 3532
+ },
+ {
+ "epoch": 9.626702997275205,
+ "grad_norm": 7.706989288330078,
+ "learning_rate": 1.97705682163056e-05,
+ "loss": 1.2048,
+ "step": 3533
+ },
+ {
+ "epoch": 9.629427792915532,
+ "grad_norm": 9.042607307434082,
+ "learning_rate": 1.977038022561492e-05,
+ "loss": 1.3113,
+ "step": 3534
+ },
+ {
+ "epoch": 9.632152588555858,
+ "grad_norm": 8.763065338134766,
+ "learning_rate": 1.9770192158832837e-05,
+ "loss": 1.3235,
+ "step": 3535
+ },
+ {
+ "epoch": 9.634877384196185,
+ "grad_norm": 7.559271335601807,
+ "learning_rate": 1.9770004015960808e-05,
+ "loss": 1.2393,
+ "step": 3536
+ },
+ {
+ "epoch": 9.637602179836513,
+ "grad_norm": 13.301497459411621,
+ "learning_rate": 1.9769815797000303e-05,
+ "loss": 1.0942,
+ "step": 3537
+ },
+ {
+ "epoch": 9.640326975476839,
+ "grad_norm": 8.295751571655273,
+ "learning_rate": 1.9769627501952787e-05,
+ "loss": 1.2432,
+ "step": 3538
+ },
+ {
+ "epoch": 9.643051771117166,
+ "grad_norm": 12.13232421875,
+ "learning_rate": 1.9769439130819727e-05,
+ "loss": 1.3557,
+ "step": 3539
+ },
+ {
+ "epoch": 9.645776566757494,
+ "grad_norm": 10.783136367797852,
+ "learning_rate": 1.976925068360259e-05,
+ "loss": 1.3884,
+ "step": 3540
+ },
+ {
+ "epoch": 9.64850136239782,
+ "grad_norm": 7.590921878814697,
+ "learning_rate": 1.976906216030284e-05,
+ "loss": 1.2324,
+ "step": 3541
+ },
+ {
+ "epoch": 9.651226158038147,
+ "grad_norm": 12.891176223754883,
+ "learning_rate": 1.9768873560921954e-05,
+ "loss": 1.3088,
+ "step": 3542
+ },
+ {
+ "epoch": 9.653950953678475,
+ "grad_norm": 9.654071807861328,
+ "learning_rate": 1.9768684885461394e-05,
+ "loss": 1.4294,
+ "step": 3543
+ },
+ {
+ "epoch": 9.6566757493188,
+ "grad_norm": 9.73577880859375,
+ "learning_rate": 1.9768496133922626e-05,
+ "loss": 1.3999,
+ "step": 3544
+ },
+ {
+ "epoch": 9.659400544959128,
+ "grad_norm": 12.861915588378906,
+ "learning_rate": 1.9768307306307125e-05,
+ "loss": 1.3772,
+ "step": 3545
+ },
+ {
+ "epoch": 9.662125340599456,
+ "grad_norm": 10.343432426452637,
+ "learning_rate": 1.9768118402616367e-05,
+ "loss": 1.4392,
+ "step": 3546
+ },
+ {
+ "epoch": 9.664850136239782,
+ "grad_norm": 10.485712051391602,
+ "learning_rate": 1.9767929422851814e-05,
+ "loss": 1.3408,
+ "step": 3547
+ },
+ {
+ "epoch": 9.66757493188011,
+ "grad_norm": 13.244621276855469,
+ "learning_rate": 1.9767740367014937e-05,
+ "loss": 1.2383,
+ "step": 3548
+ },
+ {
+ "epoch": 9.670299727520437,
+ "grad_norm": 11.628501892089844,
+ "learning_rate": 1.9767551235107218e-05,
+ "loss": 1.3855,
+ "step": 3549
+ },
+ {
+ "epoch": 9.673024523160763,
+ "grad_norm": 12.488821983337402,
+ "learning_rate": 1.9767362027130122e-05,
+ "loss": 1.217,
+ "step": 3550
+ },
+ {
+ "epoch": 9.67574931880109,
+ "grad_norm": 35.66632080078125,
+ "learning_rate": 1.9767172743085124e-05,
+ "loss": 1.4966,
+ "step": 3551
+ },
+ {
+ "epoch": 9.678474114441418,
+ "grad_norm": 10.492840766906738,
+ "learning_rate": 1.97669833829737e-05,
+ "loss": 1.1748,
+ "step": 3552
+ },
+ {
+ "epoch": 9.681198910081743,
+ "grad_norm": 9.04301643371582,
+ "learning_rate": 1.9766793946797324e-05,
+ "loss": 1.2639,
+ "step": 3553
+ },
+ {
+ "epoch": 9.683923705722071,
+ "grad_norm": 11.102354049682617,
+ "learning_rate": 1.976660443455747e-05,
+ "loss": 1.3433,
+ "step": 3554
+ },
+ {
+ "epoch": 9.686648501362399,
+ "grad_norm": 37.838706970214844,
+ "learning_rate": 1.9766414846255614e-05,
+ "loss": 1.3713,
+ "step": 3555
+ },
+ {
+ "epoch": 9.689373297002724,
+ "grad_norm": 11.290416717529297,
+ "learning_rate": 1.9766225181893236e-05,
+ "loss": 1.3698,
+ "step": 3556
+ },
+ {
+ "epoch": 9.692098092643052,
+ "grad_norm": 29.570707321166992,
+ "learning_rate": 1.9766035441471813e-05,
+ "loss": 1.3085,
+ "step": 3557
+ },
+ {
+ "epoch": 9.69482288828338,
+ "grad_norm": 13.721502304077148,
+ "learning_rate": 1.9765845624992814e-05,
+ "loss": 1.3857,
+ "step": 3558
+ },
+ {
+ "epoch": 9.697547683923705,
+ "grad_norm": 17.07549285888672,
+ "learning_rate": 1.9765655732457728e-05,
+ "loss": 1.4221,
+ "step": 3559
+ },
+ {
+ "epoch": 9.700272479564033,
+ "grad_norm": 10.509212493896484,
+ "learning_rate": 1.9765465763868027e-05,
+ "loss": 1.3245,
+ "step": 3560
+ },
+ {
+ "epoch": 9.70299727520436,
+ "grad_norm": 7.748059272766113,
+ "learning_rate": 1.9765275719225196e-05,
+ "loss": 1.283,
+ "step": 3561
+ },
+ {
+ "epoch": 9.705722070844686,
+ "grad_norm": 13.8661527633667,
+ "learning_rate": 1.976508559853071e-05,
+ "loss": 1.4639,
+ "step": 3562
+ },
+ {
+ "epoch": 9.708446866485014,
+ "grad_norm": 9.865267753601074,
+ "learning_rate": 1.9764895401786054e-05,
+ "loss": 1.4209,
+ "step": 3563
+ },
+ {
+ "epoch": 9.711171662125341,
+ "grad_norm": 12.632296562194824,
+ "learning_rate": 1.9764705128992704e-05,
+ "loss": 1.4805,
+ "step": 3564
+ },
+ {
+ "epoch": 9.713896457765667,
+ "grad_norm": 14.47574234008789,
+ "learning_rate": 1.9764514780152146e-05,
+ "loss": 1.5071,
+ "step": 3565
+ },
+ {
+ "epoch": 9.716621253405995,
+ "grad_norm": 12.230063438415527,
+ "learning_rate": 1.976432435526586e-05,
+ "loss": 1.314,
+ "step": 3566
+ },
+ {
+ "epoch": 9.719346049046322,
+ "grad_norm": 8.775035858154297,
+ "learning_rate": 1.976413385433533e-05,
+ "loss": 1.3423,
+ "step": 3567
+ },
+ {
+ "epoch": 9.722070844686648,
+ "grad_norm": 12.163357734680176,
+ "learning_rate": 1.976394327736204e-05,
+ "loss": 1.3538,
+ "step": 3568
+ },
+ {
+ "epoch": 9.724795640326976,
+ "grad_norm": 10.467511177062988,
+ "learning_rate": 1.9763752624347475e-05,
+ "loss": 1.2112,
+ "step": 3569
+ },
+ {
+ "epoch": 9.727520435967303,
+ "grad_norm": 10.808884620666504,
+ "learning_rate": 1.976356189529312e-05,
+ "loss": 1.2449,
+ "step": 3570
+ },
+ {
+ "epoch": 9.730245231607629,
+ "grad_norm": 9.99303150177002,
+ "learning_rate": 1.9763371090200456e-05,
+ "loss": 1.3994,
+ "step": 3571
+ },
+ {
+ "epoch": 9.732970027247957,
+ "grad_norm": 8.264053344726562,
+ "learning_rate": 1.9763180209070977e-05,
+ "loss": 1.2852,
+ "step": 3572
+ },
+ {
+ "epoch": 9.735694822888284,
+ "grad_norm": 12.849554061889648,
+ "learning_rate": 1.976298925190616e-05,
+ "loss": 1.2565,
+ "step": 3573
+ },
+ {
+ "epoch": 9.73841961852861,
+ "grad_norm": 22.483198165893555,
+ "learning_rate": 1.9762798218707496e-05,
+ "loss": 1.2776,
+ "step": 3574
+ },
+ {
+ "epoch": 9.741144414168938,
+ "grad_norm": 15.177623748779297,
+ "learning_rate": 1.976260710947648e-05,
+ "loss": 1.4773,
+ "step": 3575
+ },
+ {
+ "epoch": 9.743869209809265,
+ "grad_norm": 10.869903564453125,
+ "learning_rate": 1.976241592421459e-05,
+ "loss": 1.4231,
+ "step": 3576
+ },
+ {
+ "epoch": 9.746594005449591,
+ "grad_norm": 10.320539474487305,
+ "learning_rate": 1.976222466292332e-05,
+ "loss": 1.3938,
+ "step": 3577
+ },
+ {
+ "epoch": 9.749318801089919,
+ "grad_norm": 10.482199668884277,
+ "learning_rate": 1.9762033325604156e-05,
+ "loss": 1.3408,
+ "step": 3578
+ },
+ {
+ "epoch": 9.752043596730246,
+ "grad_norm": 9.231746673583984,
+ "learning_rate": 1.9761841912258594e-05,
+ "loss": 1.3203,
+ "step": 3579
+ },
+ {
+ "epoch": 9.754768392370572,
+ "grad_norm": 9.591264724731445,
+ "learning_rate": 1.9761650422888118e-05,
+ "loss": 1.2886,
+ "step": 3580
+ },
+ {
+ "epoch": 9.7574931880109,
+ "grad_norm": 10.6572265625,
+ "learning_rate": 1.9761458857494223e-05,
+ "loss": 1.4587,
+ "step": 3581
+ },
+ {
+ "epoch": 9.760217983651227,
+ "grad_norm": 9.55623722076416,
+ "learning_rate": 1.9761267216078403e-05,
+ "loss": 1.3806,
+ "step": 3582
+ },
+ {
+ "epoch": 9.762942779291553,
+ "grad_norm": 12.238038063049316,
+ "learning_rate": 1.9761075498642144e-05,
+ "loss": 1.4348,
+ "step": 3583
+ },
+ {
+ "epoch": 9.76566757493188,
+ "grad_norm": 9.699817657470703,
+ "learning_rate": 1.976088370518695e-05,
+ "loss": 1.3208,
+ "step": 3584
+ },
+ {
+ "epoch": 9.768392370572208,
+ "grad_norm": 8.047388076782227,
+ "learning_rate": 1.9760691835714304e-05,
+ "loss": 1.366,
+ "step": 3585
+ },
+ {
+ "epoch": 9.771117166212534,
+ "grad_norm": 9.928215980529785,
+ "learning_rate": 1.9760499890225704e-05,
+ "loss": 1.1907,
+ "step": 3586
+ },
+ {
+ "epoch": 9.773841961852861,
+ "grad_norm": 11.434212684631348,
+ "learning_rate": 1.9760307868722646e-05,
+ "loss": 1.3413,
+ "step": 3587
+ },
+ {
+ "epoch": 9.776566757493189,
+ "grad_norm": 9.478497505187988,
+ "learning_rate": 1.9760115771206624e-05,
+ "loss": 1.2214,
+ "step": 3588
+ },
+ {
+ "epoch": 9.779291553133515,
+ "grad_norm": 12.000141143798828,
+ "learning_rate": 1.9759923597679133e-05,
+ "loss": 1.3748,
+ "step": 3589
+ },
+ {
+ "epoch": 9.782016348773842,
+ "grad_norm": 16.21526336669922,
+ "learning_rate": 1.9759731348141673e-05,
+ "loss": 1.4045,
+ "step": 3590
+ },
+ {
+ "epoch": 9.78474114441417,
+ "grad_norm": 12.084442138671875,
+ "learning_rate": 1.975953902259574e-05,
+ "loss": 1.3789,
+ "step": 3591
+ },
+ {
+ "epoch": 9.787465940054496,
+ "grad_norm": 10.21094799041748,
+ "learning_rate": 1.9759346621042827e-05,
+ "loss": 1.4468,
+ "step": 3592
+ },
+ {
+ "epoch": 9.790190735694823,
+ "grad_norm": 14.390522956848145,
+ "learning_rate": 1.9759154143484443e-05,
+ "loss": 1.3589,
+ "step": 3593
+ },
+ {
+ "epoch": 9.79291553133515,
+ "grad_norm": 10.500269889831543,
+ "learning_rate": 1.9758961589922078e-05,
+ "loss": 1.2593,
+ "step": 3594
+ },
+ {
+ "epoch": 9.795640326975477,
+ "grad_norm": 16.458541870117188,
+ "learning_rate": 1.975876896035723e-05,
+ "loss": 1.5293,
+ "step": 3595
+ },
+ {
+ "epoch": 9.798365122615804,
+ "grad_norm": 10.324142456054688,
+ "learning_rate": 1.975857625479141e-05,
+ "loss": 1.3386,
+ "step": 3596
+ },
+ {
+ "epoch": 9.80108991825613,
+ "grad_norm": 17.802846908569336,
+ "learning_rate": 1.9758383473226107e-05,
+ "loss": 1.4626,
+ "step": 3597
+ },
+ {
+ "epoch": 9.803814713896458,
+ "grad_norm": 8.964858055114746,
+ "learning_rate": 1.9758190615662827e-05,
+ "loss": 1.2153,
+ "step": 3598
+ },
+ {
+ "epoch": 9.806539509536785,
+ "grad_norm": 9.028390884399414,
+ "learning_rate": 1.9757997682103077e-05,
+ "loss": 1.2297,
+ "step": 3599
+ },
+ {
+ "epoch": 9.809264305177111,
+ "grad_norm": 9.114471435546875,
+ "learning_rate": 1.975780467254835e-05,
+ "loss": 1.3013,
+ "step": 3600
+ },
+ {
+ "epoch": 9.811989100817438,
+ "grad_norm": 10.367660522460938,
+ "learning_rate": 1.9757611587000164e-05,
+ "loss": 1.3669,
+ "step": 3601
+ },
+ {
+ "epoch": 9.814713896457766,
+ "grad_norm": 9.04752254486084,
+ "learning_rate": 1.9757418425460005e-05,
+ "loss": 1.4395,
+ "step": 3602
+ },
+ {
+ "epoch": 9.817438692098092,
+ "grad_norm": 9.182389259338379,
+ "learning_rate": 1.9757225187929387e-05,
+ "loss": 1.5559,
+ "step": 3603
+ },
+ {
+ "epoch": 9.82016348773842,
+ "grad_norm": 9.73576545715332,
+ "learning_rate": 1.9757031874409813e-05,
+ "loss": 1.5352,
+ "step": 3604
+ },
+ {
+ "epoch": 9.822888283378747,
+ "grad_norm": 9.303825378417969,
+ "learning_rate": 1.975683848490279e-05,
+ "loss": 1.5632,
+ "step": 3605
+ },
+ {
+ "epoch": 9.825613079019073,
+ "grad_norm": 12.194347381591797,
+ "learning_rate": 1.975664501940982e-05,
+ "loss": 1.4282,
+ "step": 3606
+ },
+ {
+ "epoch": 9.8283378746594,
+ "grad_norm": 11.136542320251465,
+ "learning_rate": 1.9756451477932414e-05,
+ "loss": 1.2998,
+ "step": 3607
+ },
+ {
+ "epoch": 9.831062670299728,
+ "grad_norm": 9.804329872131348,
+ "learning_rate": 1.975625786047208e-05,
+ "loss": 1.1824,
+ "step": 3608
+ },
+ {
+ "epoch": 9.833787465940054,
+ "grad_norm": 7.430677890777588,
+ "learning_rate": 1.9756064167030324e-05,
+ "loss": 1.2449,
+ "step": 3609
+ },
+ {
+ "epoch": 9.836512261580381,
+ "grad_norm": 11.333991050720215,
+ "learning_rate": 1.975587039760865e-05,
+ "loss": 1.2239,
+ "step": 3610
+ },
+ {
+ "epoch": 9.839237057220709,
+ "grad_norm": 8.473504066467285,
+ "learning_rate": 1.9755676552208577e-05,
+ "loss": 1.2458,
+ "step": 3611
+ },
+ {
+ "epoch": 9.841961852861035,
+ "grad_norm": 21.26403045654297,
+ "learning_rate": 1.97554826308316e-05,
+ "loss": 1.3889,
+ "step": 3612
+ },
+ {
+ "epoch": 9.844686648501362,
+ "grad_norm": 11.096529006958008,
+ "learning_rate": 1.9755288633479245e-05,
+ "loss": 1.4622,
+ "step": 3613
+ },
+ {
+ "epoch": 9.84741144414169,
+ "grad_norm": 10.732100486755371,
+ "learning_rate": 1.975509456015302e-05,
+ "loss": 1.4268,
+ "step": 3614
+ },
+ {
+ "epoch": 9.850136239782016,
+ "grad_norm": 8.53803539276123,
+ "learning_rate": 1.9754900410854425e-05,
+ "loss": 1.1648,
+ "step": 3615
+ },
+ {
+ "epoch": 9.852861035422343,
+ "grad_norm": 12.325318336486816,
+ "learning_rate": 1.9754706185584982e-05,
+ "loss": 1.2351,
+ "step": 3616
+ },
+ {
+ "epoch": 9.85558583106267,
+ "grad_norm": 10.54158878326416,
+ "learning_rate": 1.97545118843462e-05,
+ "loss": 1.5369,
+ "step": 3617
+ },
+ {
+ "epoch": 9.858310626702997,
+ "grad_norm": 8.079790115356445,
+ "learning_rate": 1.9754317507139596e-05,
+ "loss": 1.4783,
+ "step": 3618
+ },
+ {
+ "epoch": 9.861035422343324,
+ "grad_norm": 10.943889617919922,
+ "learning_rate": 1.9754123053966682e-05,
+ "loss": 1.5005,
+ "step": 3619
+ },
+ {
+ "epoch": 9.863760217983652,
+ "grad_norm": 8.651459693908691,
+ "learning_rate": 1.9753928524828967e-05,
+ "loss": 1.3979,
+ "step": 3620
+ },
+ {
+ "epoch": 9.866485013623977,
+ "grad_norm": 10.205894470214844,
+ "learning_rate": 1.975373391972797e-05,
+ "loss": 1.3853,
+ "step": 3621
+ },
+ {
+ "epoch": 9.869209809264305,
+ "grad_norm": 9.411439895629883,
+ "learning_rate": 1.9753539238665214e-05,
+ "loss": 1.1968,
+ "step": 3622
+ },
+ {
+ "epoch": 9.871934604904633,
+ "grad_norm": 8.494278907775879,
+ "learning_rate": 1.9753344481642205e-05,
+ "loss": 1.2158,
+ "step": 3623
+ },
+ {
+ "epoch": 9.874659400544958,
+ "grad_norm": 9.459856986999512,
+ "learning_rate": 1.9753149648660463e-05,
+ "loss": 1.2537,
+ "step": 3624
+ },
+ {
+ "epoch": 9.877384196185286,
+ "grad_norm": 11.612347602844238,
+ "learning_rate": 1.9752954739721506e-05,
+ "loss": 1.281,
+ "step": 3625
+ },
+ {
+ "epoch": 9.880108991825614,
+ "grad_norm": 11.348382949829102,
+ "learning_rate": 1.9752759754826848e-05,
+ "loss": 1.657,
+ "step": 3626
+ },
+ {
+ "epoch": 9.88283378746594,
+ "grad_norm": 10.99140739440918,
+ "learning_rate": 1.9752564693978017e-05,
+ "loss": 1.5684,
+ "step": 3627
+ },
+ {
+ "epoch": 9.885558583106267,
+ "grad_norm": 8.75643253326416,
+ "learning_rate": 1.975236955717652e-05,
+ "loss": 1.228,
+ "step": 3628
+ },
+ {
+ "epoch": 9.888283378746594,
+ "grad_norm": 8.574169158935547,
+ "learning_rate": 1.9752174344423887e-05,
+ "loss": 1.6069,
+ "step": 3629
+ },
+ {
+ "epoch": 9.89100817438692,
+ "grad_norm": 10.064516067504883,
+ "learning_rate": 1.975197905572163e-05,
+ "loss": 1.5732,
+ "step": 3630
+ },
+ {
+ "epoch": 9.893732970027248,
+ "grad_norm": 10.123259544372559,
+ "learning_rate": 1.9751783691071278e-05,
+ "loss": 1.4634,
+ "step": 3631
+ },
+ {
+ "epoch": 9.896457765667575,
+ "grad_norm": 7.016714572906494,
+ "learning_rate": 1.9751588250474347e-05,
+ "loss": 1.085,
+ "step": 3632
+ },
+ {
+ "epoch": 9.899182561307901,
+ "grad_norm": 7.592134475708008,
+ "learning_rate": 1.975139273393236e-05,
+ "loss": 1.3142,
+ "step": 3633
+ },
+ {
+ "epoch": 9.901907356948229,
+ "grad_norm": 9.733391761779785,
+ "learning_rate": 1.975119714144684e-05,
+ "loss": 1.373,
+ "step": 3634
+ },
+ {
+ "epoch": 9.904632152588556,
+ "grad_norm": 9.23591136932373,
+ "learning_rate": 1.9751001473019312e-05,
+ "loss": 1.4934,
+ "step": 3635
+ },
+ {
+ "epoch": 9.907356948228882,
+ "grad_norm": 12.293094635009766,
+ "learning_rate": 1.97508057286513e-05,
+ "loss": 1.1792,
+ "step": 3636
+ },
+ {
+ "epoch": 9.91008174386921,
+ "grad_norm": 9.169655799865723,
+ "learning_rate": 1.975060990834432e-05,
+ "loss": 1.6282,
+ "step": 3637
+ },
+ {
+ "epoch": 9.912806539509537,
+ "grad_norm": 8.291810035705566,
+ "learning_rate": 1.975041401209991e-05,
+ "loss": 1.4124,
+ "step": 3638
+ },
+ {
+ "epoch": 9.915531335149863,
+ "grad_norm": 9.391378402709961,
+ "learning_rate": 1.9750218039919587e-05,
+ "loss": 1.2786,
+ "step": 3639
+ },
+ {
+ "epoch": 9.91825613079019,
+ "grad_norm": 12.229228019714355,
+ "learning_rate": 1.975002199180488e-05,
+ "loss": 1.4749,
+ "step": 3640
+ },
+ {
+ "epoch": 9.920980926430518,
+ "grad_norm": 9.75719165802002,
+ "learning_rate": 1.9749825867757316e-05,
+ "loss": 1.2493,
+ "step": 3641
+ },
+ {
+ "epoch": 9.923705722070844,
+ "grad_norm": 10.654757499694824,
+ "learning_rate": 1.974962966777842e-05,
+ "loss": 1.5508,
+ "step": 3642
+ },
+ {
+ "epoch": 9.926430517711172,
+ "grad_norm": 9.315423965454102,
+ "learning_rate": 1.9749433391869725e-05,
+ "loss": 1.3826,
+ "step": 3643
+ },
+ {
+ "epoch": 9.9291553133515,
+ "grad_norm": 10.321687698364258,
+ "learning_rate": 1.9749237040032758e-05,
+ "loss": 1.2932,
+ "step": 3644
+ },
+ {
+ "epoch": 9.931880108991825,
+ "grad_norm": 9.969890594482422,
+ "learning_rate": 1.974904061226904e-05,
+ "loss": 1.4094,
+ "step": 3645
+ },
+ {
+ "epoch": 9.934604904632153,
+ "grad_norm": 15.723612785339355,
+ "learning_rate": 1.9748844108580113e-05,
+ "loss": 1.4934,
+ "step": 3646
+ },
+ {
+ "epoch": 9.93732970027248,
+ "grad_norm": 13.158507347106934,
+ "learning_rate": 1.9748647528967503e-05,
+ "loss": 1.5178,
+ "step": 3647
+ },
+ {
+ "epoch": 9.940054495912806,
+ "grad_norm": 8.285064697265625,
+ "learning_rate": 1.9748450873432737e-05,
+ "loss": 1.1406,
+ "step": 3648
+ },
+ {
+ "epoch": 9.942779291553133,
+ "grad_norm": 8.271842002868652,
+ "learning_rate": 1.974825414197735e-05,
+ "loss": 1.4692,
+ "step": 3649
+ },
+ {
+ "epoch": 9.945504087193461,
+ "grad_norm": 7.437000751495361,
+ "learning_rate": 1.9748057334602873e-05,
+ "loss": 1.1069,
+ "step": 3650
+ },
+ {
+ "epoch": 9.948228882833787,
+ "grad_norm": 8.541642189025879,
+ "learning_rate": 1.9747860451310838e-05,
+ "loss": 1.3345,
+ "step": 3651
+ },
+ {
+ "epoch": 9.950953678474114,
+ "grad_norm": 8.020855903625488,
+ "learning_rate": 1.974766349210278e-05,
+ "loss": 1.1671,
+ "step": 3652
+ },
+ {
+ "epoch": 9.953678474114442,
+ "grad_norm": 8.065467834472656,
+ "learning_rate": 1.9747466456980232e-05,
+ "loss": 1.2144,
+ "step": 3653
+ },
+ {
+ "epoch": 9.956403269754768,
+ "grad_norm": 11.647472381591797,
+ "learning_rate": 1.974726934594473e-05,
+ "loss": 1.5593,
+ "step": 3654
+ },
+ {
+ "epoch": 9.959128065395095,
+ "grad_norm": 17.921730041503906,
+ "learning_rate": 1.9747072158997808e-05,
+ "loss": 1.4771,
+ "step": 3655
+ },
+ {
+ "epoch": 9.961852861035423,
+ "grad_norm": 11.619487762451172,
+ "learning_rate": 1.9746874896141005e-05,
+ "loss": 1.3782,
+ "step": 3656
+ },
+ {
+ "epoch": 9.964577656675749,
+ "grad_norm": 21.86222267150879,
+ "learning_rate": 1.9746677557375847e-05,
+ "loss": 1.4021,
+ "step": 3657
+ },
+ {
+ "epoch": 9.967302452316076,
+ "grad_norm": 9.413336753845215,
+ "learning_rate": 1.9746480142703883e-05,
+ "loss": 1.3765,
+ "step": 3658
+ },
+ {
+ "epoch": 9.970027247956404,
+ "grad_norm": 10.448002815246582,
+ "learning_rate": 1.9746282652126646e-05,
+ "loss": 1.2358,
+ "step": 3659
+ },
+ {
+ "epoch": 9.97275204359673,
+ "grad_norm": 7.882084846496582,
+ "learning_rate": 1.974608508564567e-05,
+ "loss": 1.2864,
+ "step": 3660
+ },
+ {
+ "epoch": 9.975476839237057,
+ "grad_norm": 13.244160652160645,
+ "learning_rate": 1.97458874432625e-05,
+ "loss": 1.3535,
+ "step": 3661
+ },
+ {
+ "epoch": 9.978201634877385,
+ "grad_norm": 9.789565086364746,
+ "learning_rate": 1.974568972497867e-05,
+ "loss": 1.5103,
+ "step": 3662
+ },
+ {
+ "epoch": 9.98092643051771,
+ "grad_norm": 10.077621459960938,
+ "learning_rate": 1.9745491930795725e-05,
+ "loss": 1.3215,
+ "step": 3663
+ },
+ {
+ "epoch": 9.983651226158038,
+ "grad_norm": 8.027867317199707,
+ "learning_rate": 1.97452940607152e-05,
+ "loss": 1.4524,
+ "step": 3664
+ },
+ {
+ "epoch": 9.986376021798366,
+ "grad_norm": 12.210448265075684,
+ "learning_rate": 1.9745096114738637e-05,
+ "loss": 1.5635,
+ "step": 3665
+ },
+ {
+ "epoch": 9.989100817438691,
+ "grad_norm": 11.715902328491211,
+ "learning_rate": 1.9744898092867584e-05,
+ "loss": 1.4033,
+ "step": 3666
+ },
+ {
+ "epoch": 9.991825613079019,
+ "grad_norm": 10.559863090515137,
+ "learning_rate": 1.9744699995103574e-05,
+ "loss": 1.2605,
+ "step": 3667
+ },
+ {
+ "epoch": 9.994550408719347,
+ "grad_norm": 11.416446685791016,
+ "learning_rate": 1.9744501821448154e-05,
+ "loss": 1.4619,
+ "step": 3668
+ },
+ {
+ "epoch": 9.997275204359672,
+ "grad_norm": 9.612354278564453,
+ "learning_rate": 1.974430357190287e-05,
+ "loss": 1.281,
+ "step": 3669
+ },
+ {
+ "epoch": 10.0,
+ "grad_norm": 10.122220993041992,
+ "learning_rate": 1.9744105246469264e-05,
+ "loss": 1.4553,
+ "step": 3670
+ },
+ {
+ "epoch": 10.002724795640328,
+ "grad_norm": 8.111466407775879,
+ "learning_rate": 1.9743906845148877e-05,
+ "loss": 1.26,
+ "step": 3671
+ },
+ {
+ "epoch": 10.005449591280653,
+ "grad_norm": 8.482653617858887,
+ "learning_rate": 1.9743708367943256e-05,
+ "loss": 1.2026,
+ "step": 3672
+ },
+ {
+ "epoch": 10.008174386920981,
+ "grad_norm": 8.723862648010254,
+ "learning_rate": 1.974350981485395e-05,
+ "loss": 1.3042,
+ "step": 3673
+ },
+ {
+ "epoch": 10.010899182561309,
+ "grad_norm": 8.500794410705566,
+ "learning_rate": 1.9743311185882503e-05,
+ "loss": 1.3416,
+ "step": 3674
+ },
+ {
+ "epoch": 10.013623978201634,
+ "grad_norm": 7.933543682098389,
+ "learning_rate": 1.9743112481030465e-05,
+ "loss": 1.4116,
+ "step": 3675
+ },
+ {
+ "epoch": 10.016348773841962,
+ "grad_norm": 10.659152030944824,
+ "learning_rate": 1.974291370029938e-05,
+ "loss": 1.3218,
+ "step": 3676
+ },
+ {
+ "epoch": 10.01907356948229,
+ "grad_norm": 8.086297035217285,
+ "learning_rate": 1.974271484369079e-05,
+ "loss": 1.2712,
+ "step": 3677
+ },
+ {
+ "epoch": 10.021798365122615,
+ "grad_norm": 10.596502304077148,
+ "learning_rate": 1.9742515911206258e-05,
+ "loss": 1.2361,
+ "step": 3678
+ },
+ {
+ "epoch": 10.024523160762943,
+ "grad_norm": 8.962627410888672,
+ "learning_rate": 1.9742316902847322e-05,
+ "loss": 1.2885,
+ "step": 3679
+ },
+ {
+ "epoch": 10.02724795640327,
+ "grad_norm": 16.210643768310547,
+ "learning_rate": 1.9742117818615536e-05,
+ "loss": 1.2329,
+ "step": 3680
+ },
+ {
+ "epoch": 10.029972752043596,
+ "grad_norm": 8.1439790725708,
+ "learning_rate": 1.974191865851245e-05,
+ "loss": 1.1716,
+ "step": 3681
+ },
+ {
+ "epoch": 10.032697547683924,
+ "grad_norm": 7.825740337371826,
+ "learning_rate": 1.9741719422539614e-05,
+ "loss": 1.1626,
+ "step": 3682
+ },
+ {
+ "epoch": 10.035422343324251,
+ "grad_norm": 9.390591621398926,
+ "learning_rate": 1.9741520110698582e-05,
+ "loss": 1.2278,
+ "step": 3683
+ },
+ {
+ "epoch": 10.038147138964577,
+ "grad_norm": 10.142020225524902,
+ "learning_rate": 1.9741320722990903e-05,
+ "loss": 1.3694,
+ "step": 3684
+ },
+ {
+ "epoch": 10.040871934604905,
+ "grad_norm": 11.591178894042969,
+ "learning_rate": 1.9741121259418135e-05,
+ "loss": 1.3064,
+ "step": 3685
+ },
+ {
+ "epoch": 10.043596730245232,
+ "grad_norm": 9.16048526763916,
+ "learning_rate": 1.9740921719981827e-05,
+ "loss": 1.3254,
+ "step": 3686
+ },
+ {
+ "epoch": 10.046321525885558,
+ "grad_norm": 10.824785232543945,
+ "learning_rate": 1.9740722104683534e-05,
+ "loss": 1.2532,
+ "step": 3687
+ },
+ {
+ "epoch": 10.049046321525886,
+ "grad_norm": 8.441052436828613,
+ "learning_rate": 1.974052241352481e-05,
+ "loss": 1.2732,
+ "step": 3688
+ },
+ {
+ "epoch": 10.051771117166213,
+ "grad_norm": 7.5722737312316895,
+ "learning_rate": 1.9740322646507213e-05,
+ "loss": 1.2148,
+ "step": 3689
+ },
+ {
+ "epoch": 10.054495912806539,
+ "grad_norm": 9.024096488952637,
+ "learning_rate": 1.9740122803632295e-05,
+ "loss": 1.2815,
+ "step": 3690
+ },
+ {
+ "epoch": 10.057220708446867,
+ "grad_norm": 8.968578338623047,
+ "learning_rate": 1.9739922884901612e-05,
+ "loss": 1.2136,
+ "step": 3691
+ },
+ {
+ "epoch": 10.059945504087194,
+ "grad_norm": 8.43995189666748,
+ "learning_rate": 1.9739722890316728e-05,
+ "loss": 1.1365,
+ "step": 3692
+ },
+ {
+ "epoch": 10.06267029972752,
+ "grad_norm": 8.175556182861328,
+ "learning_rate": 1.9739522819879192e-05,
+ "loss": 1.2385,
+ "step": 3693
+ },
+ {
+ "epoch": 10.065395095367847,
+ "grad_norm": 10.570222854614258,
+ "learning_rate": 1.9739322673590567e-05,
+ "loss": 1.2109,
+ "step": 3694
+ },
+ {
+ "epoch": 10.068119891008175,
+ "grad_norm": 10.841527938842773,
+ "learning_rate": 1.9739122451452412e-05,
+ "loss": 1.2881,
+ "step": 3695
+ },
+ {
+ "epoch": 10.0708446866485,
+ "grad_norm": 10.643328666687012,
+ "learning_rate": 1.9738922153466282e-05,
+ "loss": 1.3911,
+ "step": 3696
+ },
+ {
+ "epoch": 10.073569482288828,
+ "grad_norm": 8.971731185913086,
+ "learning_rate": 1.973872177963374e-05,
+ "loss": 1.1599,
+ "step": 3697
+ },
+ {
+ "epoch": 10.076294277929156,
+ "grad_norm": 11.588750839233398,
+ "learning_rate": 1.9738521329956347e-05,
+ "loss": 1.1902,
+ "step": 3698
+ },
+ {
+ "epoch": 10.079019073569482,
+ "grad_norm": 11.11839485168457,
+ "learning_rate": 1.9738320804435662e-05,
+ "loss": 1.3882,
+ "step": 3699
+ },
+ {
+ "epoch": 10.08174386920981,
+ "grad_norm": 9.18759536743164,
+ "learning_rate": 1.973812020307325e-05,
+ "loss": 1.179,
+ "step": 3700
+ },
+ {
+ "epoch": 10.084468664850137,
+ "grad_norm": 9.8154878616333,
+ "learning_rate": 1.973791952587067e-05,
+ "loss": 1.54,
+ "step": 3701
+ },
+ {
+ "epoch": 10.087193460490463,
+ "grad_norm": 10.527271270751953,
+ "learning_rate": 1.9737718772829485e-05,
+ "loss": 1.2053,
+ "step": 3702
+ },
+ {
+ "epoch": 10.08991825613079,
+ "grad_norm": 13.684199333190918,
+ "learning_rate": 1.9737517943951262e-05,
+ "loss": 1.176,
+ "step": 3703
+ },
+ {
+ "epoch": 10.092643051771118,
+ "grad_norm": 10.439043998718262,
+ "learning_rate": 1.9737317039237563e-05,
+ "loss": 1.2402,
+ "step": 3704
+ },
+ {
+ "epoch": 10.095367847411444,
+ "grad_norm": 17.306127548217773,
+ "learning_rate": 1.973711605868995e-05,
+ "loss": 1.2937,
+ "step": 3705
+ },
+ {
+ "epoch": 10.098092643051771,
+ "grad_norm": 10.449017524719238,
+ "learning_rate": 1.973691500230999e-05,
+ "loss": 1.3955,
+ "step": 3706
+ },
+ {
+ "epoch": 10.100817438692099,
+ "grad_norm": 7.04243803024292,
+ "learning_rate": 1.9736713870099253e-05,
+ "loss": 1.0579,
+ "step": 3707
+ },
+ {
+ "epoch": 10.103542234332425,
+ "grad_norm": 8.271339416503906,
+ "learning_rate": 1.97365126620593e-05,
+ "loss": 1.2466,
+ "step": 3708
+ },
+ {
+ "epoch": 10.106267029972752,
+ "grad_norm": 9.956682205200195,
+ "learning_rate": 1.97363113781917e-05,
+ "loss": 1.2231,
+ "step": 3709
+ },
+ {
+ "epoch": 10.10899182561308,
+ "grad_norm": 11.767767906188965,
+ "learning_rate": 1.9736110018498017e-05,
+ "loss": 1.2996,
+ "step": 3710
+ },
+ {
+ "epoch": 10.111716621253406,
+ "grad_norm": 9.663322448730469,
+ "learning_rate": 1.973590858297983e-05,
+ "loss": 1.313,
+ "step": 3711
+ },
+ {
+ "epoch": 10.114441416893733,
+ "grad_norm": 9.044020652770996,
+ "learning_rate": 1.9735707071638693e-05,
+ "loss": 1.163,
+ "step": 3712
+ },
+ {
+ "epoch": 10.11716621253406,
+ "grad_norm": 11.269691467285156,
+ "learning_rate": 1.9735505484476186e-05,
+ "loss": 1.1702,
+ "step": 3713
+ },
+ {
+ "epoch": 10.119891008174386,
+ "grad_norm": 8.530739784240723,
+ "learning_rate": 1.9735303821493876e-05,
+ "loss": 1.1389,
+ "step": 3714
+ },
+ {
+ "epoch": 10.122615803814714,
+ "grad_norm": 12.510598182678223,
+ "learning_rate": 1.9735102082693332e-05,
+ "loss": 1.3535,
+ "step": 3715
+ },
+ {
+ "epoch": 10.125340599455042,
+ "grad_norm": 8.907414436340332,
+ "learning_rate": 1.9734900268076126e-05,
+ "loss": 1.2559,
+ "step": 3716
+ },
+ {
+ "epoch": 10.128065395095367,
+ "grad_norm": 9.467856407165527,
+ "learning_rate": 1.973469837764383e-05,
+ "loss": 1.3218,
+ "step": 3717
+ },
+ {
+ "epoch": 10.130790190735695,
+ "grad_norm": 9.451179504394531,
+ "learning_rate": 1.9734496411398015e-05,
+ "loss": 1.2432,
+ "step": 3718
+ },
+ {
+ "epoch": 10.133514986376023,
+ "grad_norm": 8.923680305480957,
+ "learning_rate": 1.973429436934026e-05,
+ "loss": 1.2878,
+ "step": 3719
+ },
+ {
+ "epoch": 10.136239782016348,
+ "grad_norm": 9.132368087768555,
+ "learning_rate": 1.973409225147213e-05,
+ "loss": 1.0828,
+ "step": 3720
+ },
+ {
+ "epoch": 10.138964577656676,
+ "grad_norm": 7.689108371734619,
+ "learning_rate": 1.9733890057795203e-05,
+ "loss": 1.1726,
+ "step": 3721
+ },
+ {
+ "epoch": 10.141689373297003,
+ "grad_norm": 8.812626838684082,
+ "learning_rate": 1.9733687788311055e-05,
+ "loss": 1.3396,
+ "step": 3722
+ },
+ {
+ "epoch": 10.14441416893733,
+ "grad_norm": 9.01380729675293,
+ "learning_rate": 1.973348544302126e-05,
+ "loss": 1.4514,
+ "step": 3723
+ },
+ {
+ "epoch": 10.147138964577657,
+ "grad_norm": 9.405804634094238,
+ "learning_rate": 1.973328302192739e-05,
+ "loss": 1.4629,
+ "step": 3724
+ },
+ {
+ "epoch": 10.149863760217984,
+ "grad_norm": 10.039285659790039,
+ "learning_rate": 1.973308052503103e-05,
+ "loss": 1.2334,
+ "step": 3725
+ },
+ {
+ "epoch": 10.15258855585831,
+ "grad_norm": 9.150543212890625,
+ "learning_rate": 1.9732877952333748e-05,
+ "loss": 1.4014,
+ "step": 3726
+ },
+ {
+ "epoch": 10.155313351498638,
+ "grad_norm": 9.5938720703125,
+ "learning_rate": 1.973267530383713e-05,
+ "loss": 1.3809,
+ "step": 3727
+ },
+ {
+ "epoch": 10.158038147138965,
+ "grad_norm": 8.93763542175293,
+ "learning_rate": 1.9732472579542746e-05,
+ "loss": 1.4094,
+ "step": 3728
+ },
+ {
+ "epoch": 10.160762942779291,
+ "grad_norm": 15.509340286254883,
+ "learning_rate": 1.973226977945218e-05,
+ "loss": 1.2356,
+ "step": 3729
+ },
+ {
+ "epoch": 10.163487738419619,
+ "grad_norm": 7.8337321281433105,
+ "learning_rate": 1.973206690356701e-05,
+ "loss": 1.2112,
+ "step": 3730
+ },
+ {
+ "epoch": 10.166212534059946,
+ "grad_norm": 9.732722282409668,
+ "learning_rate": 1.9731863951888818e-05,
+ "loss": 1.5032,
+ "step": 3731
+ },
+ {
+ "epoch": 10.168937329700272,
+ "grad_norm": 10.353492736816406,
+ "learning_rate": 1.9731660924419182e-05,
+ "loss": 1.4467,
+ "step": 3732
+ },
+ {
+ "epoch": 10.1716621253406,
+ "grad_norm": 7.0989556312561035,
+ "learning_rate": 1.9731457821159684e-05,
+ "loss": 1.085,
+ "step": 3733
+ },
+ {
+ "epoch": 10.174386920980927,
+ "grad_norm": 9.056624412536621,
+ "learning_rate": 1.9731254642111902e-05,
+ "loss": 1.1536,
+ "step": 3734
+ },
+ {
+ "epoch": 10.177111716621253,
+ "grad_norm": 8.502835273742676,
+ "learning_rate": 1.9731051387277427e-05,
+ "loss": 1.1707,
+ "step": 3735
+ },
+ {
+ "epoch": 10.17983651226158,
+ "grad_norm": 9.250792503356934,
+ "learning_rate": 1.9730848056657836e-05,
+ "loss": 1.3557,
+ "step": 3736
+ },
+ {
+ "epoch": 10.182561307901908,
+ "grad_norm": 8.868075370788574,
+ "learning_rate": 1.9730644650254713e-05,
+ "loss": 1.2949,
+ "step": 3737
+ },
+ {
+ "epoch": 10.185286103542234,
+ "grad_norm": 8.198171615600586,
+ "learning_rate": 1.973044116806964e-05,
+ "loss": 1.1875,
+ "step": 3738
+ },
+ {
+ "epoch": 10.188010899182562,
+ "grad_norm": 8.920578956604004,
+ "learning_rate": 1.9730237610104206e-05,
+ "loss": 1.0823,
+ "step": 3739
+ },
+ {
+ "epoch": 10.190735694822889,
+ "grad_norm": 7.37108039855957,
+ "learning_rate": 1.9730033976359997e-05,
+ "loss": 1.155,
+ "step": 3740
+ },
+ {
+ "epoch": 10.193460490463215,
+ "grad_norm": 8.776039123535156,
+ "learning_rate": 1.9729830266838595e-05,
+ "loss": 1.3577,
+ "step": 3741
+ },
+ {
+ "epoch": 10.196185286103542,
+ "grad_norm": 7.64220666885376,
+ "learning_rate": 1.9729626481541588e-05,
+ "loss": 1.3101,
+ "step": 3742
+ },
+ {
+ "epoch": 10.19891008174387,
+ "grad_norm": 7.907156467437744,
+ "learning_rate": 1.9729422620470565e-05,
+ "loss": 1.4675,
+ "step": 3743
+ },
+ {
+ "epoch": 10.201634877384196,
+ "grad_norm": 7.8961100578308105,
+ "learning_rate": 1.972921868362711e-05,
+ "loss": 1.261,
+ "step": 3744
+ },
+ {
+ "epoch": 10.204359673024523,
+ "grad_norm": 6.774257183074951,
+ "learning_rate": 1.972901467101281e-05,
+ "loss": 1.1376,
+ "step": 3745
+ },
+ {
+ "epoch": 10.207084468664851,
+ "grad_norm": 9.262910842895508,
+ "learning_rate": 1.972881058262926e-05,
+ "loss": 1.2229,
+ "step": 3746
+ },
+ {
+ "epoch": 10.209809264305177,
+ "grad_norm": 7.917628765106201,
+ "learning_rate": 1.9728606418478046e-05,
+ "loss": 1.4253,
+ "step": 3747
+ },
+ {
+ "epoch": 10.212534059945504,
+ "grad_norm": 7.9029693603515625,
+ "learning_rate": 1.9728402178560757e-05,
+ "loss": 1.0979,
+ "step": 3748
+ },
+ {
+ "epoch": 10.215258855585832,
+ "grad_norm": 10.971442222595215,
+ "learning_rate": 1.972819786287899e-05,
+ "loss": 1.1077,
+ "step": 3749
+ },
+ {
+ "epoch": 10.217983651226158,
+ "grad_norm": 8.34411907196045,
+ "learning_rate": 1.9727993471434326e-05,
+ "loss": 1.334,
+ "step": 3750
+ },
+ {
+ "epoch": 10.220708446866485,
+ "grad_norm": 7.335469722747803,
+ "learning_rate": 1.9727789004228362e-05,
+ "loss": 1.2454,
+ "step": 3751
+ },
+ {
+ "epoch": 10.223433242506813,
+ "grad_norm": 7.210789680480957,
+ "learning_rate": 1.972758446126269e-05,
+ "loss": 1.395,
+ "step": 3752
+ },
+ {
+ "epoch": 10.226158038147139,
+ "grad_norm": 9.126672744750977,
+ "learning_rate": 1.972737984253891e-05,
+ "loss": 1.3259,
+ "step": 3753
+ },
+ {
+ "epoch": 10.228882833787466,
+ "grad_norm": 7.081237316131592,
+ "learning_rate": 1.9727175148058603e-05,
+ "loss": 1.1564,
+ "step": 3754
+ },
+ {
+ "epoch": 10.231607629427794,
+ "grad_norm": 8.507473945617676,
+ "learning_rate": 1.9726970377823367e-05,
+ "loss": 1.1432,
+ "step": 3755
+ },
+ {
+ "epoch": 10.23433242506812,
+ "grad_norm": 14.03199577331543,
+ "learning_rate": 1.9726765531834803e-05,
+ "loss": 1.4624,
+ "step": 3756
+ },
+ {
+ "epoch": 10.237057220708447,
+ "grad_norm": 8.498391151428223,
+ "learning_rate": 1.9726560610094497e-05,
+ "loss": 1.1757,
+ "step": 3757
+ },
+ {
+ "epoch": 10.239782016348773,
+ "grad_norm": 10.178677558898926,
+ "learning_rate": 1.9726355612604058e-05,
+ "loss": 1.2178,
+ "step": 3758
+ },
+ {
+ "epoch": 10.2425068119891,
+ "grad_norm": 8.009960174560547,
+ "learning_rate": 1.972615053936507e-05,
+ "loss": 1.311,
+ "step": 3759
+ },
+ {
+ "epoch": 10.245231607629428,
+ "grad_norm": 8.563240051269531,
+ "learning_rate": 1.9725945390379135e-05,
+ "loss": 1.2861,
+ "step": 3760
+ },
+ {
+ "epoch": 10.247956403269754,
+ "grad_norm": 9.629040718078613,
+ "learning_rate": 1.972574016564785e-05,
+ "loss": 1.4379,
+ "step": 3761
+ },
+ {
+ "epoch": 10.250681198910081,
+ "grad_norm": 9.098408699035645,
+ "learning_rate": 1.9725534865172814e-05,
+ "loss": 1.52,
+ "step": 3762
+ },
+ {
+ "epoch": 10.253405994550409,
+ "grad_norm": 8.469637870788574,
+ "learning_rate": 1.9725329488955625e-05,
+ "loss": 1.3036,
+ "step": 3763
+ },
+ {
+ "epoch": 10.256130790190735,
+ "grad_norm": 8.403144836425781,
+ "learning_rate": 1.972512403699788e-05,
+ "loss": 1.1606,
+ "step": 3764
+ },
+ {
+ "epoch": 10.258855585831062,
+ "grad_norm": 7.526834964752197,
+ "learning_rate": 1.9724918509301186e-05,
+ "loss": 1.3171,
+ "step": 3765
+ },
+ {
+ "epoch": 10.26158038147139,
+ "grad_norm": 9.698179244995117,
+ "learning_rate": 1.972471290586714e-05,
+ "loss": 1.4565,
+ "step": 3766
+ },
+ {
+ "epoch": 10.264305177111716,
+ "grad_norm": 8.261470794677734,
+ "learning_rate": 1.9724507226697343e-05,
+ "loss": 1.1653,
+ "step": 3767
+ },
+ {
+ "epoch": 10.267029972752043,
+ "grad_norm": 7.540979385375977,
+ "learning_rate": 1.9724301471793394e-05,
+ "loss": 1.1472,
+ "step": 3768
+ },
+ {
+ "epoch": 10.269754768392371,
+ "grad_norm": 8.067627906799316,
+ "learning_rate": 1.9724095641156903e-05,
+ "loss": 1.083,
+ "step": 3769
+ },
+ {
+ "epoch": 10.272479564032697,
+ "grad_norm": 9.930658340454102,
+ "learning_rate": 1.972388973478946e-05,
+ "loss": 1.3225,
+ "step": 3770
+ },
+ {
+ "epoch": 10.275204359673024,
+ "grad_norm": 7.763191223144531,
+ "learning_rate": 1.9723683752692683e-05,
+ "loss": 1.449,
+ "step": 3771
+ },
+ {
+ "epoch": 10.277929155313352,
+ "grad_norm": 7.233214855194092,
+ "learning_rate": 1.9723477694868166e-05,
+ "loss": 1.1707,
+ "step": 3772
+ },
+ {
+ "epoch": 10.280653950953678,
+ "grad_norm": 9.923511505126953,
+ "learning_rate": 1.972327156131752e-05,
+ "loss": 1.3611,
+ "step": 3773
+ },
+ {
+ "epoch": 10.283378746594005,
+ "grad_norm": 9.412862777709961,
+ "learning_rate": 1.972306535204235e-05,
+ "loss": 1.616,
+ "step": 3774
+ },
+ {
+ "epoch": 10.286103542234333,
+ "grad_norm": 10.132314682006836,
+ "learning_rate": 1.972285906704426e-05,
+ "loss": 1.2781,
+ "step": 3775
+ },
+ {
+ "epoch": 10.288828337874659,
+ "grad_norm": 10.205955505371094,
+ "learning_rate": 1.9722652706324853e-05,
+ "loss": 1.3584,
+ "step": 3776
+ },
+ {
+ "epoch": 10.291553133514986,
+ "grad_norm": 8.780740737915039,
+ "learning_rate": 1.972244626988574e-05,
+ "loss": 1.2617,
+ "step": 3777
+ },
+ {
+ "epoch": 10.294277929155314,
+ "grad_norm": 8.577252388000488,
+ "learning_rate": 1.972223975772853e-05,
+ "loss": 1.3442,
+ "step": 3778
+ },
+ {
+ "epoch": 10.29700272479564,
+ "grad_norm": 21.673694610595703,
+ "learning_rate": 1.9722033169854828e-05,
+ "loss": 1.2632,
+ "step": 3779
+ },
+ {
+ "epoch": 10.299727520435967,
+ "grad_norm": 10.122228622436523,
+ "learning_rate": 1.972182650626625e-05,
+ "loss": 1.3464,
+ "step": 3780
+ },
+ {
+ "epoch": 10.302452316076295,
+ "grad_norm": 9.061145782470703,
+ "learning_rate": 1.9721619766964393e-05,
+ "loss": 1.2012,
+ "step": 3781
+ },
+ {
+ "epoch": 10.30517711171662,
+ "grad_norm": 10.760348320007324,
+ "learning_rate": 1.9721412951950876e-05,
+ "loss": 1.2756,
+ "step": 3782
+ },
+ {
+ "epoch": 10.307901907356948,
+ "grad_norm": 9.252158164978027,
+ "learning_rate": 1.9721206061227312e-05,
+ "loss": 1.1973,
+ "step": 3783
+ },
+ {
+ "epoch": 10.310626702997276,
+ "grad_norm": 8.771831512451172,
+ "learning_rate": 1.9720999094795303e-05,
+ "loss": 1.3455,
+ "step": 3784
+ },
+ {
+ "epoch": 10.313351498637601,
+ "grad_norm": 42.56612777709961,
+ "learning_rate": 1.9720792052656468e-05,
+ "loss": 1.1782,
+ "step": 3785
+ },
+ {
+ "epoch": 10.316076294277929,
+ "grad_norm": 10.31918716430664,
+ "learning_rate": 1.9720584934812417e-05,
+ "loss": 1.3016,
+ "step": 3786
+ },
+ {
+ "epoch": 10.318801089918257,
+ "grad_norm": 11.992305755615234,
+ "learning_rate": 1.9720377741264762e-05,
+ "loss": 1.3696,
+ "step": 3787
+ },
+ {
+ "epoch": 10.321525885558582,
+ "grad_norm": 9.100144386291504,
+ "learning_rate": 1.972017047201512e-05,
+ "loss": 1.4116,
+ "step": 3788
+ },
+ {
+ "epoch": 10.32425068119891,
+ "grad_norm": 9.619243621826172,
+ "learning_rate": 1.9719963127065106e-05,
+ "loss": 1.2756,
+ "step": 3789
+ },
+ {
+ "epoch": 10.326975476839237,
+ "grad_norm": 9.421488761901855,
+ "learning_rate": 1.9719755706416327e-05,
+ "loss": 1.3113,
+ "step": 3790
+ },
+ {
+ "epoch": 10.329700272479563,
+ "grad_norm": 12.199220657348633,
+ "learning_rate": 1.9719548210070406e-05,
+ "loss": 1.0781,
+ "step": 3791
+ },
+ {
+ "epoch": 10.33242506811989,
+ "grad_norm": 9.928030014038086,
+ "learning_rate": 1.9719340638028952e-05,
+ "loss": 1.2095,
+ "step": 3792
+ },
+ {
+ "epoch": 10.335149863760218,
+ "grad_norm": 9.56116008758545,
+ "learning_rate": 1.971913299029359e-05,
+ "loss": 1.1885,
+ "step": 3793
+ },
+ {
+ "epoch": 10.337874659400544,
+ "grad_norm": 7.255523681640625,
+ "learning_rate": 1.9718925266865933e-05,
+ "loss": 1.1289,
+ "step": 3794
+ },
+ {
+ "epoch": 10.340599455040872,
+ "grad_norm": 9.008003234863281,
+ "learning_rate": 1.97187174677476e-05,
+ "loss": 1.291,
+ "step": 3795
+ },
+ {
+ "epoch": 10.3433242506812,
+ "grad_norm": 9.741546630859375,
+ "learning_rate": 1.9718509592940206e-05,
+ "loss": 1.5688,
+ "step": 3796
+ },
+ {
+ "epoch": 10.346049046321525,
+ "grad_norm": 9.080355644226074,
+ "learning_rate": 1.971830164244537e-05,
+ "loss": 1.5061,
+ "step": 3797
+ },
+ {
+ "epoch": 10.348773841961853,
+ "grad_norm": 10.598738670349121,
+ "learning_rate": 1.9718093616264717e-05,
+ "loss": 1.4241,
+ "step": 3798
+ },
+ {
+ "epoch": 10.35149863760218,
+ "grad_norm": 9.218337059020996,
+ "learning_rate": 1.9717885514399865e-05,
+ "loss": 1.3118,
+ "step": 3799
+ },
+ {
+ "epoch": 10.354223433242506,
+ "grad_norm": 11.137333869934082,
+ "learning_rate": 1.971767733685243e-05,
+ "loss": 1.2661,
+ "step": 3800
+ },
+ {
+ "epoch": 10.356948228882834,
+ "grad_norm": 9.336284637451172,
+ "learning_rate": 1.9717469083624037e-05,
+ "loss": 1.1646,
+ "step": 3801
+ },
+ {
+ "epoch": 10.359673024523161,
+ "grad_norm": 8.485359191894531,
+ "learning_rate": 1.9717260754716306e-05,
+ "loss": 1.2327,
+ "step": 3802
+ },
+ {
+ "epoch": 10.362397820163487,
+ "grad_norm": 10.281926155090332,
+ "learning_rate": 1.9717052350130864e-05,
+ "loss": 1.3621,
+ "step": 3803
+ },
+ {
+ "epoch": 10.365122615803815,
+ "grad_norm": 9.651093482971191,
+ "learning_rate": 1.971684386986933e-05,
+ "loss": 1.2651,
+ "step": 3804
+ },
+ {
+ "epoch": 10.367847411444142,
+ "grad_norm": 7.217008113861084,
+ "learning_rate": 1.9716635313933334e-05,
+ "loss": 1.187,
+ "step": 3805
+ },
+ {
+ "epoch": 10.370572207084468,
+ "grad_norm": 11.755059242248535,
+ "learning_rate": 1.9716426682324488e-05,
+ "loss": 1.1824,
+ "step": 3806
+ },
+ {
+ "epoch": 10.373297002724795,
+ "grad_norm": 9.702676773071289,
+ "learning_rate": 1.9716217975044426e-05,
+ "loss": 1.145,
+ "step": 3807
+ },
+ {
+ "epoch": 10.376021798365123,
+ "grad_norm": 8.324348449707031,
+ "learning_rate": 1.971600919209477e-05,
+ "loss": 1.2952,
+ "step": 3808
+ },
+ {
+ "epoch": 10.378746594005449,
+ "grad_norm": 8.522875785827637,
+ "learning_rate": 1.9715800333477148e-05,
+ "loss": 1.2107,
+ "step": 3809
+ },
+ {
+ "epoch": 10.381471389645776,
+ "grad_norm": 10.177056312561035,
+ "learning_rate": 1.9715591399193184e-05,
+ "loss": 1.2394,
+ "step": 3810
+ },
+ {
+ "epoch": 10.384196185286104,
+ "grad_norm": 8.588276863098145,
+ "learning_rate": 1.971538238924451e-05,
+ "loss": 1.4268,
+ "step": 3811
+ },
+ {
+ "epoch": 10.38692098092643,
+ "grad_norm": 9.623733520507812,
+ "learning_rate": 1.971517330363275e-05,
+ "loss": 1.2933,
+ "step": 3812
+ },
+ {
+ "epoch": 10.389645776566757,
+ "grad_norm": 8.727866172790527,
+ "learning_rate": 1.971496414235953e-05,
+ "loss": 1.2993,
+ "step": 3813
+ },
+ {
+ "epoch": 10.392370572207085,
+ "grad_norm": 7.569778919219971,
+ "learning_rate": 1.9714754905426484e-05,
+ "loss": 1.144,
+ "step": 3814
+ },
+ {
+ "epoch": 10.39509536784741,
+ "grad_norm": 10.021020889282227,
+ "learning_rate": 1.971454559283524e-05,
+ "loss": 1.3115,
+ "step": 3815
+ },
+ {
+ "epoch": 10.397820163487738,
+ "grad_norm": 9.4724702835083,
+ "learning_rate": 1.971433620458743e-05,
+ "loss": 1.1936,
+ "step": 3816
+ },
+ {
+ "epoch": 10.400544959128066,
+ "grad_norm": 8.412431716918945,
+ "learning_rate": 1.9714126740684677e-05,
+ "loss": 1.1482,
+ "step": 3817
+ },
+ {
+ "epoch": 10.403269754768392,
+ "grad_norm": 9.864459991455078,
+ "learning_rate": 1.971391720112862e-05,
+ "loss": 1.2603,
+ "step": 3818
+ },
+ {
+ "epoch": 10.40599455040872,
+ "grad_norm": 10.525559425354004,
+ "learning_rate": 1.971370758592089e-05,
+ "loss": 1.3506,
+ "step": 3819
+ },
+ {
+ "epoch": 10.408719346049047,
+ "grad_norm": 9.138388633728027,
+ "learning_rate": 1.9713497895063116e-05,
+ "loss": 1.3379,
+ "step": 3820
+ },
+ {
+ "epoch": 10.411444141689373,
+ "grad_norm": 25.672163009643555,
+ "learning_rate": 1.9713288128556932e-05,
+ "loss": 1.3042,
+ "step": 3821
+ },
+ {
+ "epoch": 10.4141689373297,
+ "grad_norm": 8.900979995727539,
+ "learning_rate": 1.9713078286403973e-05,
+ "loss": 1.3018,
+ "step": 3822
+ },
+ {
+ "epoch": 10.416893732970028,
+ "grad_norm": 9.162127494812012,
+ "learning_rate": 1.9712868368605877e-05,
+ "loss": 1.2988,
+ "step": 3823
+ },
+ {
+ "epoch": 10.419618528610354,
+ "grad_norm": 9.616890907287598,
+ "learning_rate": 1.9712658375164272e-05,
+ "loss": 1.2065,
+ "step": 3824
+ },
+ {
+ "epoch": 10.422343324250681,
+ "grad_norm": 7.914255142211914,
+ "learning_rate": 1.9712448306080793e-05,
+ "loss": 1.2363,
+ "step": 3825
+ },
+ {
+ "epoch": 10.425068119891009,
+ "grad_norm": 9.041911125183105,
+ "learning_rate": 1.9712238161357084e-05,
+ "loss": 1.2035,
+ "step": 3826
+ },
+ {
+ "epoch": 10.427792915531334,
+ "grad_norm": 9.996464729309082,
+ "learning_rate": 1.9712027940994777e-05,
+ "loss": 1.5454,
+ "step": 3827
+ },
+ {
+ "epoch": 10.430517711171662,
+ "grad_norm": 10.33507251739502,
+ "learning_rate": 1.9711817644995504e-05,
+ "loss": 1.3087,
+ "step": 3828
+ },
+ {
+ "epoch": 10.43324250681199,
+ "grad_norm": 6.783405303955078,
+ "learning_rate": 1.9711607273360912e-05,
+ "loss": 1.0486,
+ "step": 3829
+ },
+ {
+ "epoch": 10.435967302452315,
+ "grad_norm": 9.515064239501953,
+ "learning_rate": 1.9711396826092634e-05,
+ "loss": 1.2166,
+ "step": 3830
+ },
+ {
+ "epoch": 10.438692098092643,
+ "grad_norm": 11.367918014526367,
+ "learning_rate": 1.971118630319231e-05,
+ "loss": 1.2151,
+ "step": 3831
+ },
+ {
+ "epoch": 10.44141689373297,
+ "grad_norm": 11.599645614624023,
+ "learning_rate": 1.971097570466158e-05,
+ "loss": 1.4387,
+ "step": 3832
+ },
+ {
+ "epoch": 10.444141689373296,
+ "grad_norm": 9.678275108337402,
+ "learning_rate": 1.9710765030502085e-05,
+ "loss": 1.2834,
+ "step": 3833
+ },
+ {
+ "epoch": 10.446866485013624,
+ "grad_norm": 9.844661712646484,
+ "learning_rate": 1.971055428071546e-05,
+ "loss": 1.3894,
+ "step": 3834
+ },
+ {
+ "epoch": 10.449591280653951,
+ "grad_norm": 9.34825325012207,
+ "learning_rate": 1.9710343455303354e-05,
+ "loss": 1.4243,
+ "step": 3835
+ },
+ {
+ "epoch": 10.452316076294277,
+ "grad_norm": 9.034146308898926,
+ "learning_rate": 1.9710132554267404e-05,
+ "loss": 1.3154,
+ "step": 3836
+ },
+ {
+ "epoch": 10.455040871934605,
+ "grad_norm": 7.973133087158203,
+ "learning_rate": 1.9709921577609256e-05,
+ "loss": 1.2537,
+ "step": 3837
+ },
+ {
+ "epoch": 10.457765667574932,
+ "grad_norm": 8.211280822753906,
+ "learning_rate": 1.9709710525330548e-05,
+ "loss": 1.2642,
+ "step": 3838
+ },
+ {
+ "epoch": 10.460490463215258,
+ "grad_norm": 7.642856121063232,
+ "learning_rate": 1.9709499397432933e-05,
+ "loss": 1.1416,
+ "step": 3839
+ },
+ {
+ "epoch": 10.463215258855586,
+ "grad_norm": 11.273480415344238,
+ "learning_rate": 1.9709288193918044e-05,
+ "loss": 1.4062,
+ "step": 3840
+ },
+ {
+ "epoch": 10.465940054495913,
+ "grad_norm": 8.373019218444824,
+ "learning_rate": 1.9709076914787535e-05,
+ "loss": 1.3447,
+ "step": 3841
+ },
+ {
+ "epoch": 10.46866485013624,
+ "grad_norm": 6.9242167472839355,
+ "learning_rate": 1.9708865560043044e-05,
+ "loss": 1.2529,
+ "step": 3842
+ },
+ {
+ "epoch": 10.471389645776567,
+ "grad_norm": 10.533818244934082,
+ "learning_rate": 1.9708654129686224e-05,
+ "loss": 1.3271,
+ "step": 3843
+ },
+ {
+ "epoch": 10.474114441416894,
+ "grad_norm": 8.539103507995605,
+ "learning_rate": 1.9708442623718715e-05,
+ "loss": 1.3213,
+ "step": 3844
+ },
+ {
+ "epoch": 10.47683923705722,
+ "grad_norm": 18.204378128051758,
+ "learning_rate": 1.9708231042142166e-05,
+ "loss": 1.1941,
+ "step": 3845
+ },
+ {
+ "epoch": 10.479564032697548,
+ "grad_norm": 7.1978020668029785,
+ "learning_rate": 1.970801938495823e-05,
+ "loss": 1.3103,
+ "step": 3846
+ },
+ {
+ "epoch": 10.482288828337875,
+ "grad_norm": 7.041075706481934,
+ "learning_rate": 1.970780765216855e-05,
+ "loss": 1.178,
+ "step": 3847
+ },
+ {
+ "epoch": 10.485013623978201,
+ "grad_norm": 9.322103500366211,
+ "learning_rate": 1.9707595843774775e-05,
+ "loss": 1.4185,
+ "step": 3848
+ },
+ {
+ "epoch": 10.487738419618529,
+ "grad_norm": 13.164305686950684,
+ "learning_rate": 1.970738395977856e-05,
+ "loss": 1.3958,
+ "step": 3849
+ },
+ {
+ "epoch": 10.490463215258856,
+ "grad_norm": 10.326935768127441,
+ "learning_rate": 1.9707172000181546e-05,
+ "loss": 1.1398,
+ "step": 3850
+ },
+ {
+ "epoch": 10.493188010899182,
+ "grad_norm": 11.156216621398926,
+ "learning_rate": 1.9706959964985393e-05,
+ "loss": 1.3259,
+ "step": 3851
+ },
+ {
+ "epoch": 10.49591280653951,
+ "grad_norm": 8.280145645141602,
+ "learning_rate": 1.9706747854191745e-05,
+ "loss": 1.1892,
+ "step": 3852
+ },
+ {
+ "epoch": 10.498637602179837,
+ "grad_norm": 7.20928430557251,
+ "learning_rate": 1.970653566780226e-05,
+ "loss": 1.2397,
+ "step": 3853
+ },
+ {
+ "epoch": 10.501362397820163,
+ "grad_norm": 8.880866050720215,
+ "learning_rate": 1.9706323405818585e-05,
+ "loss": 1.1702,
+ "step": 3854
+ },
+ {
+ "epoch": 10.50408719346049,
+ "grad_norm": 9.814594268798828,
+ "learning_rate": 1.970611106824238e-05,
+ "loss": 1.2422,
+ "step": 3855
+ },
+ {
+ "epoch": 10.506811989100818,
+ "grad_norm": 9.441638946533203,
+ "learning_rate": 1.970589865507529e-05,
+ "loss": 1.4011,
+ "step": 3856
+ },
+ {
+ "epoch": 10.509536784741144,
+ "grad_norm": 12.693705558776855,
+ "learning_rate": 1.9705686166318973e-05,
+ "loss": 1.1509,
+ "step": 3857
+ },
+ {
+ "epoch": 10.512261580381471,
+ "grad_norm": 8.02194881439209,
+ "learning_rate": 1.9705473601975086e-05,
+ "loss": 1.2563,
+ "step": 3858
+ },
+ {
+ "epoch": 10.514986376021799,
+ "grad_norm": 9.439316749572754,
+ "learning_rate": 1.9705260962045286e-05,
+ "loss": 1.0911,
+ "step": 3859
+ },
+ {
+ "epoch": 10.517711171662125,
+ "grad_norm": 8.744632720947266,
+ "learning_rate": 1.9705048246531223e-05,
+ "loss": 1.2751,
+ "step": 3860
+ },
+ {
+ "epoch": 10.520435967302452,
+ "grad_norm": 9.701316833496094,
+ "learning_rate": 1.9704835455434556e-05,
+ "loss": 1.3284,
+ "step": 3861
+ },
+ {
+ "epoch": 10.52316076294278,
+ "grad_norm": 10.048924446105957,
+ "learning_rate": 1.9704622588756946e-05,
+ "loss": 1.1418,
+ "step": 3862
+ },
+ {
+ "epoch": 10.525885558583106,
+ "grad_norm": 9.116254806518555,
+ "learning_rate": 1.9704409646500044e-05,
+ "loss": 1.2899,
+ "step": 3863
+ },
+ {
+ "epoch": 10.528610354223433,
+ "grad_norm": 8.23773193359375,
+ "learning_rate": 1.970419662866551e-05,
+ "loss": 1.3109,
+ "step": 3864
+ },
+ {
+ "epoch": 10.53133514986376,
+ "grad_norm": 9.133581161499023,
+ "learning_rate": 1.9703983535255013e-05,
+ "loss": 1.4475,
+ "step": 3865
+ },
+ {
+ "epoch": 10.534059945504087,
+ "grad_norm": 8.2056303024292,
+ "learning_rate": 1.97037703662702e-05,
+ "loss": 1.3225,
+ "step": 3866
+ },
+ {
+ "epoch": 10.536784741144414,
+ "grad_norm": 8.202545166015625,
+ "learning_rate": 1.9703557121712737e-05,
+ "loss": 1.1953,
+ "step": 3867
+ },
+ {
+ "epoch": 10.539509536784742,
+ "grad_norm": 11.55584716796875,
+ "learning_rate": 1.9703343801584282e-05,
+ "loss": 1.2284,
+ "step": 3868
+ },
+ {
+ "epoch": 10.542234332425068,
+ "grad_norm": 10.944612503051758,
+ "learning_rate": 1.9703130405886496e-05,
+ "loss": 1.2878,
+ "step": 3869
+ },
+ {
+ "epoch": 10.544959128065395,
+ "grad_norm": 8.7283296585083,
+ "learning_rate": 1.9702916934621044e-05,
+ "loss": 1.3218,
+ "step": 3870
+ },
+ {
+ "epoch": 10.547683923705723,
+ "grad_norm": 9.210609436035156,
+ "learning_rate": 1.970270338778959e-05,
+ "loss": 1.3323,
+ "step": 3871
+ },
+ {
+ "epoch": 10.550408719346049,
+ "grad_norm": 12.175301551818848,
+ "learning_rate": 1.970248976539379e-05,
+ "loss": 1.5093,
+ "step": 3872
+ },
+ {
+ "epoch": 10.553133514986376,
+ "grad_norm": 9.581300735473633,
+ "learning_rate": 1.9702276067435316e-05,
+ "loss": 1.2495,
+ "step": 3873
+ },
+ {
+ "epoch": 10.555858310626704,
+ "grad_norm": 16.556753158569336,
+ "learning_rate": 1.9702062293915827e-05,
+ "loss": 1.4321,
+ "step": 3874
+ },
+ {
+ "epoch": 10.55858310626703,
+ "grad_norm": 10.717095375061035,
+ "learning_rate": 1.9701848444836987e-05,
+ "loss": 1.4023,
+ "step": 3875
+ },
+ {
+ "epoch": 10.561307901907357,
+ "grad_norm": 168.3912353515625,
+ "learning_rate": 1.9701634520200468e-05,
+ "loss": 1.4412,
+ "step": 3876
+ },
+ {
+ "epoch": 10.564032697547685,
+ "grad_norm": 11.4203462600708,
+ "learning_rate": 1.9701420520007928e-05,
+ "loss": 1.4312,
+ "step": 3877
+ },
+ {
+ "epoch": 10.56675749318801,
+ "grad_norm": 13.96320629119873,
+ "learning_rate": 1.970120644426104e-05,
+ "loss": 1.2971,
+ "step": 3878
+ },
+ {
+ "epoch": 10.569482288828338,
+ "grad_norm": 11.062853813171387,
+ "learning_rate": 1.9700992292961464e-05,
+ "loss": 1.5339,
+ "step": 3879
+ },
+ {
+ "epoch": 10.572207084468666,
+ "grad_norm": 21.22389793395996,
+ "learning_rate": 1.9700778066110873e-05,
+ "loss": 1.4445,
+ "step": 3880
+ },
+ {
+ "epoch": 10.574931880108991,
+ "grad_norm": 12.854517936706543,
+ "learning_rate": 1.9700563763710937e-05,
+ "loss": 1.498,
+ "step": 3881
+ },
+ {
+ "epoch": 10.577656675749319,
+ "grad_norm": 12.884160041809082,
+ "learning_rate": 1.9700349385763323e-05,
+ "loss": 1.3398,
+ "step": 3882
+ },
+ {
+ "epoch": 10.580381471389646,
+ "grad_norm": 11.598206520080566,
+ "learning_rate": 1.9700134932269698e-05,
+ "loss": 1.0874,
+ "step": 3883
+ },
+ {
+ "epoch": 10.583106267029972,
+ "grad_norm": 9.25067138671875,
+ "learning_rate": 1.9699920403231734e-05,
+ "loss": 1.1362,
+ "step": 3884
+ },
+ {
+ "epoch": 10.5858310626703,
+ "grad_norm": 14.375128746032715,
+ "learning_rate": 1.9699705798651104e-05,
+ "loss": 1.3901,
+ "step": 3885
+ },
+ {
+ "epoch": 10.588555858310627,
+ "grad_norm": 15.819267272949219,
+ "learning_rate": 1.9699491118529476e-05,
+ "loss": 1.2039,
+ "step": 3886
+ },
+ {
+ "epoch": 10.591280653950953,
+ "grad_norm": 26.65336799621582,
+ "learning_rate": 1.9699276362868526e-05,
+ "loss": 1.3782,
+ "step": 3887
+ },
+ {
+ "epoch": 10.59400544959128,
+ "grad_norm": 9.443343162536621,
+ "learning_rate": 1.9699061531669922e-05,
+ "loss": 1.2375,
+ "step": 3888
+ },
+ {
+ "epoch": 10.596730245231608,
+ "grad_norm": 11.523008346557617,
+ "learning_rate": 1.969884662493534e-05,
+ "loss": 1.2773,
+ "step": 3889
+ },
+ {
+ "epoch": 10.599455040871934,
+ "grad_norm": 13.750526428222656,
+ "learning_rate": 1.969863164266645e-05,
+ "loss": 1.1868,
+ "step": 3890
+ },
+ {
+ "epoch": 10.602179836512262,
+ "grad_norm": 13.709173202514648,
+ "learning_rate": 1.9698416584864932e-05,
+ "loss": 1.4307,
+ "step": 3891
+ },
+ {
+ "epoch": 10.60490463215259,
+ "grad_norm": 16.232471466064453,
+ "learning_rate": 1.9698201451532458e-05,
+ "loss": 1.3699,
+ "step": 3892
+ },
+ {
+ "epoch": 10.607629427792915,
+ "grad_norm": 13.37336254119873,
+ "learning_rate": 1.9697986242670703e-05,
+ "loss": 1.2227,
+ "step": 3893
+ },
+ {
+ "epoch": 10.610354223433243,
+ "grad_norm": 21.085451126098633,
+ "learning_rate": 1.969777095828134e-05,
+ "loss": 1.4746,
+ "step": 3894
+ },
+ {
+ "epoch": 10.61307901907357,
+ "grad_norm": 11.080826759338379,
+ "learning_rate": 1.969755559836605e-05,
+ "loss": 1.1066,
+ "step": 3895
+ },
+ {
+ "epoch": 10.615803814713896,
+ "grad_norm": 21.83421516418457,
+ "learning_rate": 1.969734016292651e-05,
+ "loss": 1.3494,
+ "step": 3896
+ },
+ {
+ "epoch": 10.618528610354224,
+ "grad_norm": 10.210470199584961,
+ "learning_rate": 1.9697124651964397e-05,
+ "loss": 1.2649,
+ "step": 3897
+ },
+ {
+ "epoch": 10.621253405994551,
+ "grad_norm": 11.174847602844238,
+ "learning_rate": 1.969690906548139e-05,
+ "loss": 1.4182,
+ "step": 3898
+ },
+ {
+ "epoch": 10.623978201634877,
+ "grad_norm": 18.439865112304688,
+ "learning_rate": 1.9696693403479165e-05,
+ "loss": 1.4883,
+ "step": 3899
+ },
+ {
+ "epoch": 10.626702997275205,
+ "grad_norm": 13.370489120483398,
+ "learning_rate": 1.9696477665959405e-05,
+ "loss": 1.281,
+ "step": 3900
+ },
+ {
+ "epoch": 10.629427792915532,
+ "grad_norm": 17.80059051513672,
+ "learning_rate": 1.969626185292379e-05,
+ "loss": 1.2476,
+ "step": 3901
+ },
+ {
+ "epoch": 10.632152588555858,
+ "grad_norm": 10.8162841796875,
+ "learning_rate": 1.9696045964374e-05,
+ "loss": 1.276,
+ "step": 3902
+ },
+ {
+ "epoch": 10.634877384196185,
+ "grad_norm": 9.661311149597168,
+ "learning_rate": 1.9695830000311716e-05,
+ "loss": 1.1792,
+ "step": 3903
+ },
+ {
+ "epoch": 10.637602179836513,
+ "grad_norm": 11.938919067382812,
+ "learning_rate": 1.9695613960738617e-05,
+ "loss": 1.3979,
+ "step": 3904
+ },
+ {
+ "epoch": 10.640326975476839,
+ "grad_norm": 11.777043342590332,
+ "learning_rate": 1.9695397845656393e-05,
+ "loss": 1.2119,
+ "step": 3905
+ },
+ {
+ "epoch": 10.643051771117166,
+ "grad_norm": 13.915650367736816,
+ "learning_rate": 1.9695181655066718e-05,
+ "loss": 1.3026,
+ "step": 3906
+ },
+ {
+ "epoch": 10.645776566757494,
+ "grad_norm": 13.268310546875,
+ "learning_rate": 1.9694965388971283e-05,
+ "loss": 1.428,
+ "step": 3907
+ },
+ {
+ "epoch": 10.64850136239782,
+ "grad_norm": 10.28786563873291,
+ "learning_rate": 1.969474904737177e-05,
+ "loss": 1.2898,
+ "step": 3908
+ },
+ {
+ "epoch": 10.651226158038147,
+ "grad_norm": 10.619996070861816,
+ "learning_rate": 1.9694532630269864e-05,
+ "loss": 1.1797,
+ "step": 3909
+ },
+ {
+ "epoch": 10.653950953678475,
+ "grad_norm": 17.510385513305664,
+ "learning_rate": 1.9694316137667248e-05,
+ "loss": 1.3794,
+ "step": 3910
+ },
+ {
+ "epoch": 10.6566757493188,
+ "grad_norm": 12.013043403625488,
+ "learning_rate": 1.969409956956561e-05,
+ "loss": 1.3135,
+ "step": 3911
+ },
+ {
+ "epoch": 10.659400544959128,
+ "grad_norm": 7.912718772888184,
+ "learning_rate": 1.969388292596664e-05,
+ "loss": 1.1248,
+ "step": 3912
+ },
+ {
+ "epoch": 10.662125340599456,
+ "grad_norm": 7.531147003173828,
+ "learning_rate": 1.9693666206872017e-05,
+ "loss": 1.1257,
+ "step": 3913
+ },
+ {
+ "epoch": 10.664850136239782,
+ "grad_norm": 10.835655212402344,
+ "learning_rate": 1.9693449412283435e-05,
+ "loss": 1.2842,
+ "step": 3914
+ },
+ {
+ "epoch": 10.66757493188011,
+ "grad_norm": 13.660799980163574,
+ "learning_rate": 1.9693232542202582e-05,
+ "loss": 1.3916,
+ "step": 3915
+ },
+ {
+ "epoch": 10.670299727520437,
+ "grad_norm": 14.183218955993652,
+ "learning_rate": 1.9693015596631143e-05,
+ "loss": 1.3655,
+ "step": 3916
+ },
+ {
+ "epoch": 10.673024523160763,
+ "grad_norm": 9.423027038574219,
+ "learning_rate": 1.9692798575570814e-05,
+ "loss": 1.4351,
+ "step": 3917
+ },
+ {
+ "epoch": 10.67574931880109,
+ "grad_norm": 9.637275695800781,
+ "learning_rate": 1.969258147902328e-05,
+ "loss": 1.448,
+ "step": 3918
+ },
+ {
+ "epoch": 10.678474114441418,
+ "grad_norm": 19.27906608581543,
+ "learning_rate": 1.9692364306990235e-05,
+ "loss": 1.2805,
+ "step": 3919
+ },
+ {
+ "epoch": 10.681198910081743,
+ "grad_norm": 11.753655433654785,
+ "learning_rate": 1.9692147059473367e-05,
+ "loss": 1.2595,
+ "step": 3920
+ },
+ {
+ "epoch": 10.683923705722071,
+ "grad_norm": 10.566637992858887,
+ "learning_rate": 1.969192973647437e-05,
+ "loss": 1.2373,
+ "step": 3921
+ },
+ {
+ "epoch": 10.686648501362399,
+ "grad_norm": 10.477239608764648,
+ "learning_rate": 1.9691712337994938e-05,
+ "loss": 1.4121,
+ "step": 3922
+ },
+ {
+ "epoch": 10.689373297002724,
+ "grad_norm": 9.499421119689941,
+ "learning_rate": 1.969149486403676e-05,
+ "loss": 1.2876,
+ "step": 3923
+ },
+ {
+ "epoch": 10.692098092643052,
+ "grad_norm": 19.364608764648438,
+ "learning_rate": 1.9691277314601534e-05,
+ "loss": 1.3411,
+ "step": 3924
+ },
+ {
+ "epoch": 10.69482288828338,
+ "grad_norm": 11.257384300231934,
+ "learning_rate": 1.969105968969095e-05,
+ "loss": 1.4094,
+ "step": 3925
+ },
+ {
+ "epoch": 10.697547683923705,
+ "grad_norm": 10.027420043945312,
+ "learning_rate": 1.9690841989306703e-05,
+ "loss": 1.3489,
+ "step": 3926
+ },
+ {
+ "epoch": 10.700272479564033,
+ "grad_norm": 10.581485748291016,
+ "learning_rate": 1.9690624213450493e-05,
+ "loss": 1.3269,
+ "step": 3927
+ },
+ {
+ "epoch": 10.70299727520436,
+ "grad_norm": 8.834001541137695,
+ "learning_rate": 1.9690406362124014e-05,
+ "loss": 1.2834,
+ "step": 3928
+ },
+ {
+ "epoch": 10.705722070844686,
+ "grad_norm": 10.63623332977295,
+ "learning_rate": 1.9690188435328962e-05,
+ "loss": 1.5283,
+ "step": 3929
+ },
+ {
+ "epoch": 10.708446866485014,
+ "grad_norm": 10.122505187988281,
+ "learning_rate": 1.9689970433067035e-05,
+ "loss": 1.312,
+ "step": 3930
+ },
+ {
+ "epoch": 10.711171662125341,
+ "grad_norm": 12.947110176086426,
+ "learning_rate": 1.9689752355339928e-05,
+ "loss": 1.5078,
+ "step": 3931
+ },
+ {
+ "epoch": 10.713896457765667,
+ "grad_norm": 19.704675674438477,
+ "learning_rate": 1.9689534202149344e-05,
+ "loss": 1.3325,
+ "step": 3932
+ },
+ {
+ "epoch": 10.716621253405995,
+ "grad_norm": 8.936685562133789,
+ "learning_rate": 1.9689315973496978e-05,
+ "loss": 1.3584,
+ "step": 3933
+ },
+ {
+ "epoch": 10.719346049046322,
+ "grad_norm": 11.175673484802246,
+ "learning_rate": 1.9689097669384533e-05,
+ "loss": 1.2551,
+ "step": 3934
+ },
+ {
+ "epoch": 10.722070844686648,
+ "grad_norm": 9.431500434875488,
+ "learning_rate": 1.9688879289813705e-05,
+ "loss": 1.1538,
+ "step": 3935
+ },
+ {
+ "epoch": 10.724795640326976,
+ "grad_norm": 10.447210311889648,
+ "learning_rate": 1.96886608347862e-05,
+ "loss": 1.3635,
+ "step": 3936
+ },
+ {
+ "epoch": 10.727520435967303,
+ "grad_norm": 11.345307350158691,
+ "learning_rate": 1.9688442304303713e-05,
+ "loss": 1.3945,
+ "step": 3937
+ },
+ {
+ "epoch": 10.730245231607629,
+ "grad_norm": 11.375175476074219,
+ "learning_rate": 1.968822369836795e-05,
+ "loss": 1.2881,
+ "step": 3938
+ },
+ {
+ "epoch": 10.732970027247957,
+ "grad_norm": 8.946102142333984,
+ "learning_rate": 1.968800501698061e-05,
+ "loss": 1.4264,
+ "step": 3939
+ },
+ {
+ "epoch": 10.735694822888284,
+ "grad_norm": 11.147432327270508,
+ "learning_rate": 1.96877862601434e-05,
+ "loss": 1.2141,
+ "step": 3940
+ },
+ {
+ "epoch": 10.73841961852861,
+ "grad_norm": 10.1541748046875,
+ "learning_rate": 1.9687567427858026e-05,
+ "loss": 1.2441,
+ "step": 3941
+ },
+ {
+ "epoch": 10.741144414168938,
+ "grad_norm": 8.995576858520508,
+ "learning_rate": 1.9687348520126187e-05,
+ "loss": 1.3813,
+ "step": 3942
+ },
+ {
+ "epoch": 10.743869209809265,
+ "grad_norm": 10.57896614074707,
+ "learning_rate": 1.9687129536949587e-05,
+ "loss": 1.4097,
+ "step": 3943
+ },
+ {
+ "epoch": 10.746594005449591,
+ "grad_norm": 9.385448455810547,
+ "learning_rate": 1.9686910478329938e-05,
+ "loss": 1.3086,
+ "step": 3944
+ },
+ {
+ "epoch": 10.749318801089919,
+ "grad_norm": 10.483943939208984,
+ "learning_rate": 1.968669134426894e-05,
+ "loss": 1.2358,
+ "step": 3945
+ },
+ {
+ "epoch": 10.752043596730246,
+ "grad_norm": 20.128450393676758,
+ "learning_rate": 1.96864721347683e-05,
+ "loss": 1.4196,
+ "step": 3946
+ },
+ {
+ "epoch": 10.754768392370572,
+ "grad_norm": 16.337125778198242,
+ "learning_rate": 1.968625284982973e-05,
+ "loss": 1.2693,
+ "step": 3947
+ },
+ {
+ "epoch": 10.7574931880109,
+ "grad_norm": 12.40900707244873,
+ "learning_rate": 1.9686033489454934e-05,
+ "loss": 1.5403,
+ "step": 3948
+ },
+ {
+ "epoch": 10.760217983651227,
+ "grad_norm": 10.881063461303711,
+ "learning_rate": 1.9685814053645618e-05,
+ "loss": 1.4182,
+ "step": 3949
+ },
+ {
+ "epoch": 10.762942779291553,
+ "grad_norm": 11.267525672912598,
+ "learning_rate": 1.9685594542403494e-05,
+ "loss": 1.2871,
+ "step": 3950
+ },
+ {
+ "epoch": 10.76566757493188,
+ "grad_norm": 9.441262245178223,
+ "learning_rate": 1.9685374955730275e-05,
+ "loss": 1.2678,
+ "step": 3951
+ },
+ {
+ "epoch": 10.768392370572208,
+ "grad_norm": 12.279179573059082,
+ "learning_rate": 1.9685155293627664e-05,
+ "loss": 1.4314,
+ "step": 3952
+ },
+ {
+ "epoch": 10.771117166212534,
+ "grad_norm": 9.561209678649902,
+ "learning_rate": 1.9684935556097378e-05,
+ "loss": 1.2091,
+ "step": 3953
+ },
+ {
+ "epoch": 10.773841961852861,
+ "grad_norm": 12.12336540222168,
+ "learning_rate": 1.9684715743141126e-05,
+ "loss": 1.3057,
+ "step": 3954
+ },
+ {
+ "epoch": 10.776566757493189,
+ "grad_norm": 11.090004920959473,
+ "learning_rate": 1.9684495854760616e-05,
+ "loss": 1.3801,
+ "step": 3955
+ },
+ {
+ "epoch": 10.779291553133515,
+ "grad_norm": 10.307674407958984,
+ "learning_rate": 1.9684275890957564e-05,
+ "loss": 1.2096,
+ "step": 3956
+ },
+ {
+ "epoch": 10.782016348773842,
+ "grad_norm": 9.547151565551758,
+ "learning_rate": 1.968405585173369e-05,
+ "loss": 1.4956,
+ "step": 3957
+ },
+ {
+ "epoch": 10.78474114441417,
+ "grad_norm": 11.083027839660645,
+ "learning_rate": 1.968383573709069e-05,
+ "loss": 1.2542,
+ "step": 3958
+ },
+ {
+ "epoch": 10.787465940054496,
+ "grad_norm": 11.283376693725586,
+ "learning_rate": 1.9683615547030296e-05,
+ "loss": 1.2568,
+ "step": 3959
+ },
+ {
+ "epoch": 10.790190735694823,
+ "grad_norm": 17.618133544921875,
+ "learning_rate": 1.9683395281554217e-05,
+ "loss": 1.1948,
+ "step": 3960
+ },
+ {
+ "epoch": 10.79291553133515,
+ "grad_norm": 13.181232452392578,
+ "learning_rate": 1.9683174940664163e-05,
+ "loss": 1.2615,
+ "step": 3961
+ },
+ {
+ "epoch": 10.795640326975477,
+ "grad_norm": 11.228410720825195,
+ "learning_rate": 1.9682954524361853e-05,
+ "loss": 1.3403,
+ "step": 3962
+ },
+ {
+ "epoch": 10.798365122615804,
+ "grad_norm": 14.959089279174805,
+ "learning_rate": 1.968273403264901e-05,
+ "loss": 1.1914,
+ "step": 3963
+ },
+ {
+ "epoch": 10.80108991825613,
+ "grad_norm": 14.117962837219238,
+ "learning_rate": 1.9682513465527345e-05,
+ "loss": 1.3884,
+ "step": 3964
+ },
+ {
+ "epoch": 10.803814713896458,
+ "grad_norm": 10.425492286682129,
+ "learning_rate": 1.9682292822998575e-05,
+ "loss": 1.3193,
+ "step": 3965
+ },
+ {
+ "epoch": 10.806539509536785,
+ "grad_norm": 15.191742897033691,
+ "learning_rate": 1.968207210506442e-05,
+ "loss": 1.4309,
+ "step": 3966
+ },
+ {
+ "epoch": 10.809264305177111,
+ "grad_norm": 12.611985206604004,
+ "learning_rate": 1.96818513117266e-05,
+ "loss": 1.3052,
+ "step": 3967
+ },
+ {
+ "epoch": 10.811989100817438,
+ "grad_norm": 12.097752571105957,
+ "learning_rate": 1.968163044298683e-05,
+ "loss": 1.4307,
+ "step": 3968
+ },
+ {
+ "epoch": 10.814713896457766,
+ "grad_norm": 13.448756217956543,
+ "learning_rate": 1.968140949884684e-05,
+ "loss": 1.3792,
+ "step": 3969
+ },
+ {
+ "epoch": 10.817438692098092,
+ "grad_norm": 10.021312713623047,
+ "learning_rate": 1.9681188479308343e-05,
+ "loss": 1.2178,
+ "step": 3970
+ },
+ {
+ "epoch": 10.82016348773842,
+ "grad_norm": 10.934687614440918,
+ "learning_rate": 1.9680967384373058e-05,
+ "loss": 1.3379,
+ "step": 3971
+ },
+ {
+ "epoch": 10.822888283378747,
+ "grad_norm": 10.070216178894043,
+ "learning_rate": 1.9680746214042714e-05,
+ "loss": 1.3088,
+ "step": 3972
+ },
+ {
+ "epoch": 10.825613079019073,
+ "grad_norm": 11.109722137451172,
+ "learning_rate": 1.9680524968319027e-05,
+ "loss": 1.2734,
+ "step": 3973
+ },
+ {
+ "epoch": 10.8283378746594,
+ "grad_norm": 11.988601684570312,
+ "learning_rate": 1.9680303647203723e-05,
+ "loss": 1.3433,
+ "step": 3974
+ },
+ {
+ "epoch": 10.831062670299728,
+ "grad_norm": 20.463165283203125,
+ "learning_rate": 1.968008225069853e-05,
+ "loss": 1.2795,
+ "step": 3975
+ },
+ {
+ "epoch": 10.833787465940054,
+ "grad_norm": 20.51481819152832,
+ "learning_rate": 1.9679860778805167e-05,
+ "loss": 1.4119,
+ "step": 3976
+ },
+ {
+ "epoch": 10.836512261580381,
+ "grad_norm": 9.952378273010254,
+ "learning_rate": 1.9679639231525357e-05,
+ "loss": 1.2629,
+ "step": 3977
+ },
+ {
+ "epoch": 10.839237057220709,
+ "grad_norm": 10.788759231567383,
+ "learning_rate": 1.9679417608860828e-05,
+ "loss": 1.1267,
+ "step": 3978
+ },
+ {
+ "epoch": 10.841961852861035,
+ "grad_norm": 11.57756233215332,
+ "learning_rate": 1.9679195910813308e-05,
+ "loss": 1.2061,
+ "step": 3979
+ },
+ {
+ "epoch": 10.844686648501362,
+ "grad_norm": 15.758150100708008,
+ "learning_rate": 1.9678974137384524e-05,
+ "loss": 1.1931,
+ "step": 3980
+ },
+ {
+ "epoch": 10.84741144414169,
+ "grad_norm": 13.442411422729492,
+ "learning_rate": 1.9678752288576198e-05,
+ "loss": 1.5183,
+ "step": 3981
+ },
+ {
+ "epoch": 10.850136239782016,
+ "grad_norm": 12.64612865447998,
+ "learning_rate": 1.967853036439006e-05,
+ "loss": 1.2146,
+ "step": 3982
+ },
+ {
+ "epoch": 10.852861035422343,
+ "grad_norm": 11.583940505981445,
+ "learning_rate": 1.967830836482784e-05,
+ "loss": 1.2296,
+ "step": 3983
+ },
+ {
+ "epoch": 10.85558583106267,
+ "grad_norm": 14.167618751525879,
+ "learning_rate": 1.9678086289891265e-05,
+ "loss": 1.2363,
+ "step": 3984
+ },
+ {
+ "epoch": 10.858310626702997,
+ "grad_norm": 11.235509872436523,
+ "learning_rate": 1.9677864139582066e-05,
+ "loss": 1.5708,
+ "step": 3985
+ },
+ {
+ "epoch": 10.861035422343324,
+ "grad_norm": 11.968399047851562,
+ "learning_rate": 1.9677641913901975e-05,
+ "loss": 1.255,
+ "step": 3986
+ },
+ {
+ "epoch": 10.863760217983652,
+ "grad_norm": 11.38996696472168,
+ "learning_rate": 1.9677419612852716e-05,
+ "loss": 1.178,
+ "step": 3987
+ },
+ {
+ "epoch": 10.866485013623977,
+ "grad_norm": 9.439459800720215,
+ "learning_rate": 1.9677197236436027e-05,
+ "loss": 1.3945,
+ "step": 3988
+ },
+ {
+ "epoch": 10.869209809264305,
+ "grad_norm": 51.21841812133789,
+ "learning_rate": 1.967697478465364e-05,
+ "loss": 1.2637,
+ "step": 3989
+ },
+ {
+ "epoch": 10.871934604904633,
+ "grad_norm": 9.610937118530273,
+ "learning_rate": 1.9676752257507282e-05,
+ "loss": 1.2288,
+ "step": 3990
+ },
+ {
+ "epoch": 10.874659400544958,
+ "grad_norm": 13.754937171936035,
+ "learning_rate": 1.967652965499869e-05,
+ "loss": 1.3416,
+ "step": 3991
+ },
+ {
+ "epoch": 10.877384196185286,
+ "grad_norm": 12.980363845825195,
+ "learning_rate": 1.9676306977129595e-05,
+ "loss": 1.3398,
+ "step": 3992
+ },
+ {
+ "epoch": 10.880108991825614,
+ "grad_norm": 13.093537330627441,
+ "learning_rate": 1.967608422390173e-05,
+ "loss": 1.1812,
+ "step": 3993
+ },
+ {
+ "epoch": 10.88283378746594,
+ "grad_norm": 10.763243675231934,
+ "learning_rate": 1.967586139531684e-05,
+ "loss": 1.481,
+ "step": 3994
+ },
+ {
+ "epoch": 10.885558583106267,
+ "grad_norm": 13.629618644714355,
+ "learning_rate": 1.9675638491376646e-05,
+ "loss": 1.5605,
+ "step": 3995
+ },
+ {
+ "epoch": 10.888283378746594,
+ "grad_norm": 14.426143646240234,
+ "learning_rate": 1.9675415512082895e-05,
+ "loss": 1.449,
+ "step": 3996
+ },
+ {
+ "epoch": 10.89100817438692,
+ "grad_norm": 11.355213165283203,
+ "learning_rate": 1.9675192457437316e-05,
+ "loss": 1.4153,
+ "step": 3997
+ },
+ {
+ "epoch": 10.893732970027248,
+ "grad_norm": 16.483633041381836,
+ "learning_rate": 1.9674969327441652e-05,
+ "loss": 1.3821,
+ "step": 3998
+ },
+ {
+ "epoch": 10.896457765667575,
+ "grad_norm": 12.077117919921875,
+ "learning_rate": 1.9674746122097637e-05,
+ "loss": 1.4727,
+ "step": 3999
+ },
+ {
+ "epoch": 10.899182561307901,
+ "grad_norm": 14.361942291259766,
+ "learning_rate": 1.967452284140701e-05,
+ "loss": 1.2417,
+ "step": 4000
+ },
+ {
+ "epoch": 10.901907356948229,
+ "grad_norm": 9.589673042297363,
+ "learning_rate": 1.967429948537151e-05,
+ "loss": 1.248,
+ "step": 4001
+ },
+ {
+ "epoch": 10.904632152588556,
+ "grad_norm": 12.560636520385742,
+ "learning_rate": 1.967407605399288e-05,
+ "loss": 1.3608,
+ "step": 4002
+ },
+ {
+ "epoch": 10.907356948228882,
+ "grad_norm": 13.126648902893066,
+ "learning_rate": 1.967385254727286e-05,
+ "loss": 1.3916,
+ "step": 4003
+ },
+ {
+ "epoch": 10.91008174386921,
+ "grad_norm": 12.25019645690918,
+ "learning_rate": 1.9673628965213177e-05,
+ "loss": 1.2607,
+ "step": 4004
+ },
+ {
+ "epoch": 10.912806539509537,
+ "grad_norm": 14.17881965637207,
+ "learning_rate": 1.9673405307815592e-05,
+ "loss": 1.2688,
+ "step": 4005
+ },
+ {
+ "epoch": 10.915531335149863,
+ "grad_norm": 11.824095726013184,
+ "learning_rate": 1.9673181575081837e-05,
+ "loss": 1.2573,
+ "step": 4006
+ },
+ {
+ "epoch": 10.91825613079019,
+ "grad_norm": 11.577066421508789,
+ "learning_rate": 1.9672957767013652e-05,
+ "loss": 1.5425,
+ "step": 4007
+ },
+ {
+ "epoch": 10.920980926430518,
+ "grad_norm": 10.646503448486328,
+ "learning_rate": 1.9672733883612786e-05,
+ "loss": 1.2871,
+ "step": 4008
+ },
+ {
+ "epoch": 10.923705722070844,
+ "grad_norm": 10.270605087280273,
+ "learning_rate": 1.9672509924880977e-05,
+ "loss": 1.2559,
+ "step": 4009
+ },
+ {
+ "epoch": 10.926430517711172,
+ "grad_norm": 11.509736061096191,
+ "learning_rate": 1.9672285890819974e-05,
+ "loss": 1.3875,
+ "step": 4010
+ },
+ {
+ "epoch": 10.9291553133515,
+ "grad_norm": 12.517537117004395,
+ "learning_rate": 1.967206178143152e-05,
+ "loss": 1.2605,
+ "step": 4011
+ },
+ {
+ "epoch": 10.931880108991825,
+ "grad_norm": 12.90263557434082,
+ "learning_rate": 1.967183759671736e-05,
+ "loss": 1.3694,
+ "step": 4012
+ },
+ {
+ "epoch": 10.934604904632153,
+ "grad_norm": 12.983382225036621,
+ "learning_rate": 1.9671613336679237e-05,
+ "loss": 1.2583,
+ "step": 4013
+ },
+ {
+ "epoch": 10.93732970027248,
+ "grad_norm": 15.22011661529541,
+ "learning_rate": 1.9671389001318904e-05,
+ "loss": 1.3909,
+ "step": 4014
+ },
+ {
+ "epoch": 10.940054495912806,
+ "grad_norm": 12.214634895324707,
+ "learning_rate": 1.96711645906381e-05,
+ "loss": 1.2373,
+ "step": 4015
+ },
+ {
+ "epoch": 10.942779291553133,
+ "grad_norm": 14.635167121887207,
+ "learning_rate": 1.9670940104638582e-05,
+ "loss": 1.5059,
+ "step": 4016
+ },
+ {
+ "epoch": 10.945504087193461,
+ "grad_norm": 8.975303649902344,
+ "learning_rate": 1.9670715543322093e-05,
+ "loss": 1.365,
+ "step": 4017
+ },
+ {
+ "epoch": 10.948228882833787,
+ "grad_norm": 10.037346839904785,
+ "learning_rate": 1.9670490906690386e-05,
+ "loss": 1.0637,
+ "step": 4018
+ },
+ {
+ "epoch": 10.950953678474114,
+ "grad_norm": 10.849924087524414,
+ "learning_rate": 1.96702661947452e-05,
+ "loss": 1.2229,
+ "step": 4019
+ },
+ {
+ "epoch": 10.953678474114442,
+ "grad_norm": 12.21422290802002,
+ "learning_rate": 1.9670041407488298e-05,
+ "loss": 1.5168,
+ "step": 4020
+ },
+ {
+ "epoch": 10.956403269754768,
+ "grad_norm": 10.877645492553711,
+ "learning_rate": 1.966981654492142e-05,
+ "loss": 1.2937,
+ "step": 4021
+ },
+ {
+ "epoch": 10.959128065395095,
+ "grad_norm": 10.834639549255371,
+ "learning_rate": 1.9669591607046325e-05,
+ "loss": 1.6199,
+ "step": 4022
+ },
+ {
+ "epoch": 10.961852861035423,
+ "grad_norm": 7.974213123321533,
+ "learning_rate": 1.9669366593864763e-05,
+ "loss": 1.2144,
+ "step": 4023
+ },
+ {
+ "epoch": 10.964577656675749,
+ "grad_norm": 14.464746475219727,
+ "learning_rate": 1.966914150537848e-05,
+ "loss": 1.3779,
+ "step": 4024
+ },
+ {
+ "epoch": 10.967302452316076,
+ "grad_norm": 8.732192039489746,
+ "learning_rate": 1.9668916341589242e-05,
+ "loss": 1.2466,
+ "step": 4025
+ },
+ {
+ "epoch": 10.970027247956404,
+ "grad_norm": 15.23045539855957,
+ "learning_rate": 1.966869110249879e-05,
+ "loss": 1.3286,
+ "step": 4026
+ },
+ {
+ "epoch": 10.97275204359673,
+ "grad_norm": 10.571854591369629,
+ "learning_rate": 1.966846578810888e-05,
+ "loss": 1.3718,
+ "step": 4027
+ },
+ {
+ "epoch": 10.975476839237057,
+ "grad_norm": 12.137609481811523,
+ "learning_rate": 1.9668240398421275e-05,
+ "loss": 1.4802,
+ "step": 4028
+ },
+ {
+ "epoch": 10.978201634877385,
+ "grad_norm": 9.905146598815918,
+ "learning_rate": 1.966801493343772e-05,
+ "loss": 1.1791,
+ "step": 4029
+ },
+ {
+ "epoch": 10.98092643051771,
+ "grad_norm": 11.161646842956543,
+ "learning_rate": 1.966778939315998e-05,
+ "loss": 1.4644,
+ "step": 4030
+ },
+ {
+ "epoch": 10.983651226158038,
+ "grad_norm": 9.805384635925293,
+ "learning_rate": 1.9667563777589805e-05,
+ "loss": 1.2712,
+ "step": 4031
+ },
+ {
+ "epoch": 10.986376021798366,
+ "grad_norm": 15.272140502929688,
+ "learning_rate": 1.9667338086728955e-05,
+ "loss": 1.4487,
+ "step": 4032
+ },
+ {
+ "epoch": 10.989100817438691,
+ "grad_norm": 9.714131355285645,
+ "learning_rate": 1.966711232057919e-05,
+ "loss": 1.3469,
+ "step": 4033
+ },
+ {
+ "epoch": 10.991825613079019,
+ "grad_norm": 10.3309326171875,
+ "learning_rate": 1.966688647914226e-05,
+ "loss": 1.218,
+ "step": 4034
+ },
+ {
+ "epoch": 10.994550408719347,
+ "grad_norm": 19.648483276367188,
+ "learning_rate": 1.9666660562419936e-05,
+ "loss": 1.519,
+ "step": 4035
+ },
+ {
+ "epoch": 10.997275204359672,
+ "grad_norm": 11.848732948303223,
+ "learning_rate": 1.9666434570413964e-05,
+ "loss": 1.3718,
+ "step": 4036
+ },
+ {
+ "epoch": 11.0,
+ "grad_norm": 10.305585861206055,
+ "learning_rate": 1.9666208503126115e-05,
+ "loss": 1.2573,
+ "step": 4037
+ },
+ {
+ "epoch": 11.002724795640328,
+ "grad_norm": 7.629805088043213,
+ "learning_rate": 1.9665982360558143e-05,
+ "loss": 1.3308,
+ "step": 4038
+ },
+ {
+ "epoch": 11.005449591280653,
+ "grad_norm": 11.943351745605469,
+ "learning_rate": 1.966575614271181e-05,
+ "loss": 1.2527,
+ "step": 4039
+ },
+ {
+ "epoch": 11.008174386920981,
+ "grad_norm": 8.443275451660156,
+ "learning_rate": 1.9665529849588882e-05,
+ "loss": 1.2517,
+ "step": 4040
+ },
+ {
+ "epoch": 11.010899182561309,
+ "grad_norm": 10.50875473022461,
+ "learning_rate": 1.966530348119112e-05,
+ "loss": 1.0623,
+ "step": 4041
+ },
+ {
+ "epoch": 11.013623978201634,
+ "grad_norm": 10.328377723693848,
+ "learning_rate": 1.9665077037520283e-05,
+ "loss": 1.1433,
+ "step": 4042
+ },
+ {
+ "epoch": 11.016348773841962,
+ "grad_norm": 15.970246315002441,
+ "learning_rate": 1.966485051857814e-05,
+ "loss": 1.2085,
+ "step": 4043
+ },
+ {
+ "epoch": 11.01907356948229,
+ "grad_norm": 9.247635841369629,
+ "learning_rate": 1.9664623924366446e-05,
+ "loss": 1.3401,
+ "step": 4044
+ },
+ {
+ "epoch": 11.021798365122615,
+ "grad_norm": 8.929620742797852,
+ "learning_rate": 1.9664397254886975e-05,
+ "loss": 1.3857,
+ "step": 4045
+ },
+ {
+ "epoch": 11.024523160762943,
+ "grad_norm": 8.579508781433105,
+ "learning_rate": 1.9664170510141495e-05,
+ "loss": 1.2671,
+ "step": 4046
+ },
+ {
+ "epoch": 11.02724795640327,
+ "grad_norm": 8.783073425292969,
+ "learning_rate": 1.966394369013176e-05,
+ "loss": 1.2777,
+ "step": 4047
+ },
+ {
+ "epoch": 11.029972752043596,
+ "grad_norm": 9.716208457946777,
+ "learning_rate": 1.9663716794859543e-05,
+ "loss": 1.2649,
+ "step": 4048
+ },
+ {
+ "epoch": 11.032697547683924,
+ "grad_norm": 8.254244804382324,
+ "learning_rate": 1.9663489824326612e-05,
+ "loss": 1.137,
+ "step": 4049
+ },
+ {
+ "epoch": 11.035422343324251,
+ "grad_norm": 16.232574462890625,
+ "learning_rate": 1.966326277853473e-05,
+ "loss": 1.3208,
+ "step": 4050
+ },
+ {
+ "epoch": 11.038147138964577,
+ "grad_norm": 9.67200756072998,
+ "learning_rate": 1.9663035657485673e-05,
+ "loss": 1.1733,
+ "step": 4051
+ },
+ {
+ "epoch": 11.040871934604905,
+ "grad_norm": 8.065556526184082,
+ "learning_rate": 1.9662808461181206e-05,
+ "loss": 1.1406,
+ "step": 4052
+ },
+ {
+ "epoch": 11.043596730245232,
+ "grad_norm": 21.56169891357422,
+ "learning_rate": 1.9662581189623093e-05,
+ "loss": 1.158,
+ "step": 4053
+ },
+ {
+ "epoch": 11.046321525885558,
+ "grad_norm": 13.468238830566406,
+ "learning_rate": 1.9662353842813112e-05,
+ "loss": 1.3716,
+ "step": 4054
+ },
+ {
+ "epoch": 11.049046321525886,
+ "grad_norm": 20.729324340820312,
+ "learning_rate": 1.9662126420753026e-05,
+ "loss": 1.3013,
+ "step": 4055
+ },
+ {
+ "epoch": 11.051771117166213,
+ "grad_norm": 10.317609786987305,
+ "learning_rate": 1.9661898923444616e-05,
+ "loss": 1.094,
+ "step": 4056
+ },
+ {
+ "epoch": 11.054495912806539,
+ "grad_norm": 9.526543617248535,
+ "learning_rate": 1.9661671350889645e-05,
+ "loss": 1.0095,
+ "step": 4057
+ },
+ {
+ "epoch": 11.057220708446867,
+ "grad_norm": 9.82815170288086,
+ "learning_rate": 1.9661443703089888e-05,
+ "loss": 1.0662,
+ "step": 4058
+ },
+ {
+ "epoch": 11.059945504087194,
+ "grad_norm": 11.4994478225708,
+ "learning_rate": 1.966121598004712e-05,
+ "loss": 1.3569,
+ "step": 4059
+ },
+ {
+ "epoch": 11.06267029972752,
+ "grad_norm": 11.084864616394043,
+ "learning_rate": 1.9660988181763114e-05,
+ "loss": 1.2798,
+ "step": 4060
+ },
+ {
+ "epoch": 11.065395095367847,
+ "grad_norm": 9.071287155151367,
+ "learning_rate": 1.966076030823964e-05,
+ "loss": 1.093,
+ "step": 4061
+ },
+ {
+ "epoch": 11.068119891008175,
+ "grad_norm": 14.715372085571289,
+ "learning_rate": 1.9660532359478476e-05,
+ "loss": 1.2085,
+ "step": 4062
+ },
+ {
+ "epoch": 11.0708446866485,
+ "grad_norm": 11.17330551147461,
+ "learning_rate": 1.9660304335481398e-05,
+ "loss": 1.1809,
+ "step": 4063
+ },
+ {
+ "epoch": 11.073569482288828,
+ "grad_norm": 17.41897201538086,
+ "learning_rate": 1.966007623625018e-05,
+ "loss": 1.1323,
+ "step": 4064
+ },
+ {
+ "epoch": 11.076294277929156,
+ "grad_norm": 10.150404930114746,
+ "learning_rate": 1.96598480617866e-05,
+ "loss": 1.2778,
+ "step": 4065
+ },
+ {
+ "epoch": 11.079019073569482,
+ "grad_norm": 10.516081809997559,
+ "learning_rate": 1.9659619812092434e-05,
+ "loss": 1.2273,
+ "step": 4066
+ },
+ {
+ "epoch": 11.08174386920981,
+ "grad_norm": 9.161614418029785,
+ "learning_rate": 1.965939148716946e-05,
+ "loss": 1.0337,
+ "step": 4067
+ },
+ {
+ "epoch": 11.084468664850137,
+ "grad_norm": 10.477733612060547,
+ "learning_rate": 1.9659163087019454e-05,
+ "loss": 1.1277,
+ "step": 4068
+ },
+ {
+ "epoch": 11.087193460490463,
+ "grad_norm": 7.671123027801514,
+ "learning_rate": 1.96589346116442e-05,
+ "loss": 1.043,
+ "step": 4069
+ },
+ {
+ "epoch": 11.08991825613079,
+ "grad_norm": 9.864495277404785,
+ "learning_rate": 1.9658706061045473e-05,
+ "loss": 1.2415,
+ "step": 4070
+ },
+ {
+ "epoch": 11.092643051771118,
+ "grad_norm": 9.38493537902832,
+ "learning_rate": 1.9658477435225053e-05,
+ "loss": 1.2493,
+ "step": 4071
+ },
+ {
+ "epoch": 11.095367847411444,
+ "grad_norm": 10.206192016601562,
+ "learning_rate": 1.9658248734184725e-05,
+ "loss": 1.1704,
+ "step": 4072
+ },
+ {
+ "epoch": 11.098092643051771,
+ "grad_norm": 8.365642547607422,
+ "learning_rate": 1.9658019957926263e-05,
+ "loss": 1.0044,
+ "step": 4073
+ },
+ {
+ "epoch": 11.100817438692099,
+ "grad_norm": 8.866310119628906,
+ "learning_rate": 1.9657791106451454e-05,
+ "loss": 1.3228,
+ "step": 4074
+ },
+ {
+ "epoch": 11.103542234332425,
+ "grad_norm": 43.499473571777344,
+ "learning_rate": 1.9657562179762078e-05,
+ "loss": 1.3042,
+ "step": 4075
+ },
+ {
+ "epoch": 11.106267029972752,
+ "grad_norm": 13.006279945373535,
+ "learning_rate": 1.965733317785992e-05,
+ "loss": 1.5593,
+ "step": 4076
+ },
+ {
+ "epoch": 11.10899182561308,
+ "grad_norm": 13.291231155395508,
+ "learning_rate": 1.965710410074676e-05,
+ "loss": 1.3572,
+ "step": 4077
+ },
+ {
+ "epoch": 11.111716621253406,
+ "grad_norm": 9.592552185058594,
+ "learning_rate": 1.9656874948424384e-05,
+ "loss": 1.1603,
+ "step": 4078
+ },
+ {
+ "epoch": 11.114441416893733,
+ "grad_norm": 11.061075210571289,
+ "learning_rate": 1.9656645720894577e-05,
+ "loss": 1.209,
+ "step": 4079
+ },
+ {
+ "epoch": 11.11716621253406,
+ "grad_norm": 8.441675186157227,
+ "learning_rate": 1.9656416418159127e-05,
+ "loss": 1.0714,
+ "step": 4080
+ },
+ {
+ "epoch": 11.119891008174386,
+ "grad_norm": 11.681937217712402,
+ "learning_rate": 1.9656187040219812e-05,
+ "loss": 1.3994,
+ "step": 4081
+ },
+ {
+ "epoch": 11.122615803814714,
+ "grad_norm": 11.914758682250977,
+ "learning_rate": 1.9655957587078426e-05,
+ "loss": 1.2463,
+ "step": 4082
+ },
+ {
+ "epoch": 11.125340599455042,
+ "grad_norm": 8.07807445526123,
+ "learning_rate": 1.9655728058736753e-05,
+ "loss": 1.2039,
+ "step": 4083
+ },
+ {
+ "epoch": 11.128065395095367,
+ "grad_norm": 8.954924583435059,
+ "learning_rate": 1.9655498455196576e-05,
+ "loss": 1.1509,
+ "step": 4084
+ },
+ {
+ "epoch": 11.130790190735695,
+ "grad_norm": 10.02565860748291,
+ "learning_rate": 1.9655268776459694e-05,
+ "loss": 1.2639,
+ "step": 4085
+ },
+ {
+ "epoch": 11.133514986376023,
+ "grad_norm": 9.384295463562012,
+ "learning_rate": 1.965503902252789e-05,
+ "loss": 1.1588,
+ "step": 4086
+ },
+ {
+ "epoch": 11.136239782016348,
+ "grad_norm": 9.927639961242676,
+ "learning_rate": 1.965480919340295e-05,
+ "loss": 1.1903,
+ "step": 4087
+ },
+ {
+ "epoch": 11.138964577656676,
+ "grad_norm": 7.977211952209473,
+ "learning_rate": 1.9654579289086665e-05,
+ "loss": 1.1218,
+ "step": 4088
+ },
+ {
+ "epoch": 11.141689373297003,
+ "grad_norm": 13.479766845703125,
+ "learning_rate": 1.965434930958083e-05,
+ "loss": 1.0947,
+ "step": 4089
+ },
+ {
+ "epoch": 11.14441416893733,
+ "grad_norm": 10.667736053466797,
+ "learning_rate": 1.965411925488723e-05,
+ "loss": 1.2054,
+ "step": 4090
+ },
+ {
+ "epoch": 11.147138964577657,
+ "grad_norm": 16.211450576782227,
+ "learning_rate": 1.9653889125007665e-05,
+ "loss": 1.158,
+ "step": 4091
+ },
+ {
+ "epoch": 11.149863760217984,
+ "grad_norm": 9.036359786987305,
+ "learning_rate": 1.965365891994392e-05,
+ "loss": 0.9523,
+ "step": 4092
+ },
+ {
+ "epoch": 11.15258855585831,
+ "grad_norm": 9.005630493164062,
+ "learning_rate": 1.9653428639697788e-05,
+ "loss": 1.2079,
+ "step": 4093
+ },
+ {
+ "epoch": 11.155313351498638,
+ "grad_norm": 9.042786598205566,
+ "learning_rate": 1.9653198284271065e-05,
+ "loss": 1.3333,
+ "step": 4094
+ },
+ {
+ "epoch": 11.158038147138965,
+ "grad_norm": 9.039999008178711,
+ "learning_rate": 1.9652967853665547e-05,
+ "loss": 0.9956,
+ "step": 4095
+ },
+ {
+ "epoch": 11.160762942779291,
+ "grad_norm": 14.095746040344238,
+ "learning_rate": 1.9652737347883025e-05,
+ "loss": 1.147,
+ "step": 4096
+ },
+ {
+ "epoch": 11.163487738419619,
+ "grad_norm": 8.9838228225708,
+ "learning_rate": 1.9652506766925296e-05,
+ "loss": 1.1233,
+ "step": 4097
+ },
+ {
+ "epoch": 11.166212534059946,
+ "grad_norm": 9.379589080810547,
+ "learning_rate": 1.965227611079415e-05,
+ "loss": 1.0171,
+ "step": 4098
+ },
+ {
+ "epoch": 11.168937329700272,
+ "grad_norm": 13.760157585144043,
+ "learning_rate": 1.9652045379491395e-05,
+ "loss": 1.3872,
+ "step": 4099
+ },
+ {
+ "epoch": 11.1716621253406,
+ "grad_norm": 13.840320587158203,
+ "learning_rate": 1.9651814573018818e-05,
+ "loss": 1.2776,
+ "step": 4100
+ },
+ {
+ "epoch": 11.174386920980927,
+ "grad_norm": 11.532063484191895,
+ "learning_rate": 1.965158369137822e-05,
+ "loss": 1.4041,
+ "step": 4101
+ },
+ {
+ "epoch": 11.177111716621253,
+ "grad_norm": 11.299899101257324,
+ "learning_rate": 1.96513527345714e-05,
+ "loss": 1.3455,
+ "step": 4102
+ },
+ {
+ "epoch": 11.17983651226158,
+ "grad_norm": 9.078874588012695,
+ "learning_rate": 1.9651121702600155e-05,
+ "loss": 1.1794,
+ "step": 4103
+ },
+ {
+ "epoch": 11.182561307901908,
+ "grad_norm": 11.858445167541504,
+ "learning_rate": 1.9650890595466284e-05,
+ "loss": 1.0796,
+ "step": 4104
+ },
+ {
+ "epoch": 11.185286103542234,
+ "grad_norm": 10.78423023223877,
+ "learning_rate": 1.965065941317159e-05,
+ "loss": 1.2229,
+ "step": 4105
+ },
+ {
+ "epoch": 11.188010899182562,
+ "grad_norm": 11.808480262756348,
+ "learning_rate": 1.9650428155717867e-05,
+ "loss": 1.2874,
+ "step": 4106
+ },
+ {
+ "epoch": 11.190735694822889,
+ "grad_norm": 14.424799919128418,
+ "learning_rate": 1.965019682310692e-05,
+ "loss": 1.4639,
+ "step": 4107
+ },
+ {
+ "epoch": 11.193460490463215,
+ "grad_norm": 10.045002937316895,
+ "learning_rate": 1.9649965415340553e-05,
+ "loss": 1.1688,
+ "step": 4108
+ },
+ {
+ "epoch": 11.196185286103542,
+ "grad_norm": 11.161811828613281,
+ "learning_rate": 1.9649733932420566e-05,
+ "loss": 1.3177,
+ "step": 4109
+ },
+ {
+ "epoch": 11.19891008174387,
+ "grad_norm": 9.272212982177734,
+ "learning_rate": 1.9649502374348763e-05,
+ "loss": 1.0918,
+ "step": 4110
+ },
+ {
+ "epoch": 11.201634877384196,
+ "grad_norm": 10.659878730773926,
+ "learning_rate": 1.9649270741126944e-05,
+ "loss": 1.3677,
+ "step": 4111
+ },
+ {
+ "epoch": 11.204359673024523,
+ "grad_norm": 9.117798805236816,
+ "learning_rate": 1.9649039032756913e-05,
+ "loss": 1.2502,
+ "step": 4112
+ },
+ {
+ "epoch": 11.207084468664851,
+ "grad_norm": 12.927522659301758,
+ "learning_rate": 1.964880724924048e-05,
+ "loss": 1.2788,
+ "step": 4113
+ },
+ {
+ "epoch": 11.209809264305177,
+ "grad_norm": 11.339554786682129,
+ "learning_rate": 1.9648575390579447e-05,
+ "loss": 1.4341,
+ "step": 4114
+ },
+ {
+ "epoch": 11.212534059945504,
+ "grad_norm": 12.668943405151367,
+ "learning_rate": 1.964834345677562e-05,
+ "loss": 1.4468,
+ "step": 4115
+ },
+ {
+ "epoch": 11.215258855585832,
+ "grad_norm": 17.67973518371582,
+ "learning_rate": 1.96481114478308e-05,
+ "loss": 1.1472,
+ "step": 4116
+ },
+ {
+ "epoch": 11.217983651226158,
+ "grad_norm": 16.11754035949707,
+ "learning_rate": 1.96478793637468e-05,
+ "loss": 1.3931,
+ "step": 4117
+ },
+ {
+ "epoch": 11.220708446866485,
+ "grad_norm": 11.04246711730957,
+ "learning_rate": 1.964764720452543e-05,
+ "loss": 1.1917,
+ "step": 4118
+ },
+ {
+ "epoch": 11.223433242506813,
+ "grad_norm": 18.711198806762695,
+ "learning_rate": 1.964741497016849e-05,
+ "loss": 1.2371,
+ "step": 4119
+ },
+ {
+ "epoch": 11.226158038147139,
+ "grad_norm": 10.438543319702148,
+ "learning_rate": 1.9647182660677796e-05,
+ "loss": 1.0435,
+ "step": 4120
+ },
+ {
+ "epoch": 11.228882833787466,
+ "grad_norm": 15.964482307434082,
+ "learning_rate": 1.9646950276055153e-05,
+ "loss": 1.1743,
+ "step": 4121
+ },
+ {
+ "epoch": 11.231607629427794,
+ "grad_norm": 13.605895042419434,
+ "learning_rate": 1.964671781630237e-05,
+ "loss": 1.2588,
+ "step": 4122
+ },
+ {
+ "epoch": 11.23433242506812,
+ "grad_norm": 22.46067237854004,
+ "learning_rate": 1.964648528142126e-05,
+ "loss": 1.282,
+ "step": 4123
+ },
+ {
+ "epoch": 11.237057220708447,
+ "grad_norm": 10.966947555541992,
+ "learning_rate": 1.9646252671413633e-05,
+ "loss": 1.0828,
+ "step": 4124
+ },
+ {
+ "epoch": 11.239782016348773,
+ "grad_norm": 11.58065414428711,
+ "learning_rate": 1.96460199862813e-05,
+ "loss": 1.1797,
+ "step": 4125
+ },
+ {
+ "epoch": 11.2425068119891,
+ "grad_norm": 12.301233291625977,
+ "learning_rate": 1.9645787226026075e-05,
+ "loss": 1.2278,
+ "step": 4126
+ },
+ {
+ "epoch": 11.245231607629428,
+ "grad_norm": 16.46876335144043,
+ "learning_rate": 1.964555439064977e-05,
+ "loss": 1.1877,
+ "step": 4127
+ },
+ {
+ "epoch": 11.247956403269754,
+ "grad_norm": 12.894742965698242,
+ "learning_rate": 1.96453214801542e-05,
+ "loss": 1.2786,
+ "step": 4128
+ },
+ {
+ "epoch": 11.250681198910081,
+ "grad_norm": 14.421160697937012,
+ "learning_rate": 1.9645088494541172e-05,
+ "loss": 1.3118,
+ "step": 4129
+ },
+ {
+ "epoch": 11.253405994550409,
+ "grad_norm": 14.483222007751465,
+ "learning_rate": 1.9644855433812507e-05,
+ "loss": 1.4663,
+ "step": 4130
+ },
+ {
+ "epoch": 11.256130790190735,
+ "grad_norm": 31.697895050048828,
+ "learning_rate": 1.9644622297970018e-05,
+ "loss": 1.1819,
+ "step": 4131
+ },
+ {
+ "epoch": 11.258855585831062,
+ "grad_norm": 12.084939002990723,
+ "learning_rate": 1.964438908701552e-05,
+ "loss": 1.3225,
+ "step": 4132
+ },
+ {
+ "epoch": 11.26158038147139,
+ "grad_norm": 12.784135818481445,
+ "learning_rate": 1.9644155800950832e-05,
+ "loss": 1.3584,
+ "step": 4133
+ },
+ {
+ "epoch": 11.264305177111716,
+ "grad_norm": 8.929036140441895,
+ "learning_rate": 1.964392243977777e-05,
+ "loss": 1.2412,
+ "step": 4134
+ },
+ {
+ "epoch": 11.267029972752043,
+ "grad_norm": 12.572015762329102,
+ "learning_rate": 1.9643689003498147e-05,
+ "loss": 1.3308,
+ "step": 4135
+ },
+ {
+ "epoch": 11.269754768392371,
+ "grad_norm": 12.465352058410645,
+ "learning_rate": 1.964345549211379e-05,
+ "loss": 1.2808,
+ "step": 4136
+ },
+ {
+ "epoch": 11.272479564032697,
+ "grad_norm": 9.7542724609375,
+ "learning_rate": 1.9643221905626505e-05,
+ "loss": 1.0579,
+ "step": 4137
+ },
+ {
+ "epoch": 11.275204359673024,
+ "grad_norm": 18.65604591369629,
+ "learning_rate": 1.9642988244038122e-05,
+ "loss": 1.2966,
+ "step": 4138
+ },
+ {
+ "epoch": 11.277929155313352,
+ "grad_norm": 11.757242202758789,
+ "learning_rate": 1.9642754507350457e-05,
+ "loss": 1.2561,
+ "step": 4139
+ },
+ {
+ "epoch": 11.280653950953678,
+ "grad_norm": 8.50538444519043,
+ "learning_rate": 1.9642520695565328e-05,
+ "loss": 1.1646,
+ "step": 4140
+ },
+ {
+ "epoch": 11.283378746594005,
+ "grad_norm": 9.911194801330566,
+ "learning_rate": 1.9642286808684562e-05,
+ "loss": 1.4351,
+ "step": 4141
+ },
+ {
+ "epoch": 11.286103542234333,
+ "grad_norm": 10.260211944580078,
+ "learning_rate": 1.9642052846709975e-05,
+ "loss": 1.1672,
+ "step": 4142
+ },
+ {
+ "epoch": 11.288828337874659,
+ "grad_norm": 12.260438919067383,
+ "learning_rate": 1.964181880964339e-05,
+ "loss": 1.449,
+ "step": 4143
+ },
+ {
+ "epoch": 11.291553133514986,
+ "grad_norm": 14.704292297363281,
+ "learning_rate": 1.9641584697486632e-05,
+ "loss": 1.1729,
+ "step": 4144
+ },
+ {
+ "epoch": 11.294277929155314,
+ "grad_norm": 10.67501163482666,
+ "learning_rate": 1.964135051024152e-05,
+ "loss": 1.3525,
+ "step": 4145
+ },
+ {
+ "epoch": 11.29700272479564,
+ "grad_norm": 10.726551055908203,
+ "learning_rate": 1.964111624790988e-05,
+ "loss": 1.3108,
+ "step": 4146
+ },
+ {
+ "epoch": 11.299727520435967,
+ "grad_norm": 14.48544979095459,
+ "learning_rate": 1.964088191049354e-05,
+ "loss": 1.3015,
+ "step": 4147
+ },
+ {
+ "epoch": 11.302452316076295,
+ "grad_norm": 10.027518272399902,
+ "learning_rate": 1.964064749799432e-05,
+ "loss": 1.1862,
+ "step": 4148
+ },
+ {
+ "epoch": 11.30517711171662,
+ "grad_norm": 40.34449005126953,
+ "learning_rate": 1.9640413010414048e-05,
+ "loss": 1.1127,
+ "step": 4149
+ },
+ {
+ "epoch": 11.307901907356948,
+ "grad_norm": 9.3348970413208,
+ "learning_rate": 1.9640178447754554e-05,
+ "loss": 1.0125,
+ "step": 4150
+ },
+ {
+ "epoch": 11.310626702997276,
+ "grad_norm": 11.324419021606445,
+ "learning_rate": 1.9639943810017654e-05,
+ "loss": 1.2837,
+ "step": 4151
+ },
+ {
+ "epoch": 11.313351498637601,
+ "grad_norm": 12.872102737426758,
+ "learning_rate": 1.9639709097205185e-05,
+ "loss": 1.3274,
+ "step": 4152
+ },
+ {
+ "epoch": 11.316076294277929,
+ "grad_norm": 9.504002571105957,
+ "learning_rate": 1.963947430931897e-05,
+ "loss": 1.4272,
+ "step": 4153
+ },
+ {
+ "epoch": 11.318801089918257,
+ "grad_norm": 81.22502136230469,
+ "learning_rate": 1.963923944636084e-05,
+ "loss": 1.2947,
+ "step": 4154
+ },
+ {
+ "epoch": 11.321525885558582,
+ "grad_norm": 10.916065216064453,
+ "learning_rate": 1.9639004508332627e-05,
+ "loss": 1.1638,
+ "step": 4155
+ },
+ {
+ "epoch": 11.32425068119891,
+ "grad_norm": 10.57822322845459,
+ "learning_rate": 1.9638769495236154e-05,
+ "loss": 1.3083,
+ "step": 4156
+ },
+ {
+ "epoch": 11.326975476839237,
+ "grad_norm": 12.542110443115234,
+ "learning_rate": 1.963853440707325e-05,
+ "loss": 1.3452,
+ "step": 4157
+ },
+ {
+ "epoch": 11.329700272479563,
+ "grad_norm": 9.83530044555664,
+ "learning_rate": 1.9638299243845758e-05,
+ "loss": 1.2844,
+ "step": 4158
+ },
+ {
+ "epoch": 11.33242506811989,
+ "grad_norm": 11.479257583618164,
+ "learning_rate": 1.96380640055555e-05,
+ "loss": 1.1814,
+ "step": 4159
+ },
+ {
+ "epoch": 11.335149863760218,
+ "grad_norm": 10.582036018371582,
+ "learning_rate": 1.9637828692204307e-05,
+ "loss": 1.1533,
+ "step": 4160
+ },
+ {
+ "epoch": 11.337874659400544,
+ "grad_norm": 15.099767684936523,
+ "learning_rate": 1.9637593303794015e-05,
+ "loss": 1.3831,
+ "step": 4161
+ },
+ {
+ "epoch": 11.340599455040872,
+ "grad_norm": 10.092370986938477,
+ "learning_rate": 1.9637357840326457e-05,
+ "loss": 1.1663,
+ "step": 4162
+ },
+ {
+ "epoch": 11.3433242506812,
+ "grad_norm": 11.402278900146484,
+ "learning_rate": 1.9637122301803466e-05,
+ "loss": 1.1959,
+ "step": 4163
+ },
+ {
+ "epoch": 11.346049046321525,
+ "grad_norm": 9.97726058959961,
+ "learning_rate": 1.963688668822688e-05,
+ "loss": 1.1047,
+ "step": 4164
+ },
+ {
+ "epoch": 11.348773841961853,
+ "grad_norm": 9.727554321289062,
+ "learning_rate": 1.9636650999598527e-05,
+ "loss": 1.1803,
+ "step": 4165
+ },
+ {
+ "epoch": 11.35149863760218,
+ "grad_norm": 9.918126106262207,
+ "learning_rate": 1.9636415235920246e-05,
+ "loss": 1.3164,
+ "step": 4166
+ },
+ {
+ "epoch": 11.354223433242506,
+ "grad_norm": 8.939223289489746,
+ "learning_rate": 1.9636179397193874e-05,
+ "loss": 1.4137,
+ "step": 4167
+ },
+ {
+ "epoch": 11.356948228882834,
+ "grad_norm": 14.461063385009766,
+ "learning_rate": 1.9635943483421246e-05,
+ "loss": 1.168,
+ "step": 4168
+ },
+ {
+ "epoch": 11.359673024523161,
+ "grad_norm": 8.427556037902832,
+ "learning_rate": 1.9635707494604203e-05,
+ "loss": 1.0503,
+ "step": 4169
+ },
+ {
+ "epoch": 11.362397820163487,
+ "grad_norm": 8.970022201538086,
+ "learning_rate": 1.9635471430744578e-05,
+ "loss": 1.1821,
+ "step": 4170
+ },
+ {
+ "epoch": 11.365122615803815,
+ "grad_norm": 7.9704060554504395,
+ "learning_rate": 1.9635235291844213e-05,
+ "loss": 1.2388,
+ "step": 4171
+ },
+ {
+ "epoch": 11.367847411444142,
+ "grad_norm": 10.413139343261719,
+ "learning_rate": 1.9634999077904945e-05,
+ "loss": 1.3325,
+ "step": 4172
+ },
+ {
+ "epoch": 11.370572207084468,
+ "grad_norm": 11.076361656188965,
+ "learning_rate": 1.9634762788928615e-05,
+ "loss": 1.3113,
+ "step": 4173
+ },
+ {
+ "epoch": 11.373297002724795,
+ "grad_norm": 8.550765037536621,
+ "learning_rate": 1.963452642491706e-05,
+ "loss": 1.1122,
+ "step": 4174
+ },
+ {
+ "epoch": 11.376021798365123,
+ "grad_norm": 17.111282348632812,
+ "learning_rate": 1.9634289985872126e-05,
+ "loss": 1.1338,
+ "step": 4175
+ },
+ {
+ "epoch": 11.378746594005449,
+ "grad_norm": 11.5484619140625,
+ "learning_rate": 1.963405347179565e-05,
+ "loss": 1.3228,
+ "step": 4176
+ },
+ {
+ "epoch": 11.381471389645776,
+ "grad_norm": 9.316886901855469,
+ "learning_rate": 1.963381688268948e-05,
+ "loss": 1.1422,
+ "step": 4177
+ },
+ {
+ "epoch": 11.384196185286104,
+ "grad_norm": 12.380435943603516,
+ "learning_rate": 1.963358021855545e-05,
+ "loss": 1.3149,
+ "step": 4178
+ },
+ {
+ "epoch": 11.38692098092643,
+ "grad_norm": 10.483932495117188,
+ "learning_rate": 1.9633343479395405e-05,
+ "loss": 1.3203,
+ "step": 4179
+ },
+ {
+ "epoch": 11.389645776566757,
+ "grad_norm": 9.909773826599121,
+ "learning_rate": 1.9633106665211196e-05,
+ "loss": 1.2068,
+ "step": 4180
+ },
+ {
+ "epoch": 11.392370572207085,
+ "grad_norm": 9.947454452514648,
+ "learning_rate": 1.963286977600466e-05,
+ "loss": 1.3235,
+ "step": 4181
+ },
+ {
+ "epoch": 11.39509536784741,
+ "grad_norm": 9.787384986877441,
+ "learning_rate": 1.9632632811777644e-05,
+ "loss": 1.4629,
+ "step": 4182
+ },
+ {
+ "epoch": 11.397820163487738,
+ "grad_norm": 8.918498992919922,
+ "learning_rate": 1.9632395772531993e-05,
+ "loss": 1.3926,
+ "step": 4183
+ },
+ {
+ "epoch": 11.400544959128066,
+ "grad_norm": 8.588772773742676,
+ "learning_rate": 1.9632158658269554e-05,
+ "loss": 1.2854,
+ "step": 4184
+ },
+ {
+ "epoch": 11.403269754768392,
+ "grad_norm": 10.430420875549316,
+ "learning_rate": 1.9631921468992173e-05,
+ "loss": 1.1613,
+ "step": 4185
+ },
+ {
+ "epoch": 11.40599455040872,
+ "grad_norm": 11.09743881225586,
+ "learning_rate": 1.96316842047017e-05,
+ "loss": 1.2173,
+ "step": 4186
+ },
+ {
+ "epoch": 11.408719346049047,
+ "grad_norm": 9.371150970458984,
+ "learning_rate": 1.963144686539998e-05,
+ "loss": 1.0715,
+ "step": 4187
+ },
+ {
+ "epoch": 11.411444141689373,
+ "grad_norm": 9.642024993896484,
+ "learning_rate": 1.963120945108886e-05,
+ "loss": 1.0969,
+ "step": 4188
+ },
+ {
+ "epoch": 11.4141689373297,
+ "grad_norm": 8.411330223083496,
+ "learning_rate": 1.9630971961770194e-05,
+ "loss": 1.2397,
+ "step": 4189
+ },
+ {
+ "epoch": 11.416893732970028,
+ "grad_norm": 8.898776054382324,
+ "learning_rate": 1.9630734397445824e-05,
+ "loss": 1.2456,
+ "step": 4190
+ },
+ {
+ "epoch": 11.419618528610354,
+ "grad_norm": 10.948317527770996,
+ "learning_rate": 1.963049675811761e-05,
+ "loss": 1.2649,
+ "step": 4191
+ },
+ {
+ "epoch": 11.422343324250681,
+ "grad_norm": 9.487371444702148,
+ "learning_rate": 1.963025904378739e-05,
+ "loss": 1.1331,
+ "step": 4192
+ },
+ {
+ "epoch": 11.425068119891009,
+ "grad_norm": 9.217453002929688,
+ "learning_rate": 1.9630021254457026e-05,
+ "loss": 1.297,
+ "step": 4193
+ },
+ {
+ "epoch": 11.427792915531334,
+ "grad_norm": 7.42936372756958,
+ "learning_rate": 1.9629783390128366e-05,
+ "loss": 1.4397,
+ "step": 4194
+ },
+ {
+ "epoch": 11.430517711171662,
+ "grad_norm": 10.919928550720215,
+ "learning_rate": 1.9629545450803266e-05,
+ "loss": 1.3093,
+ "step": 4195
+ },
+ {
+ "epoch": 11.43324250681199,
+ "grad_norm": 9.25825309753418,
+ "learning_rate": 1.9629307436483573e-05,
+ "loss": 1.0737,
+ "step": 4196
+ },
+ {
+ "epoch": 11.435967302452315,
+ "grad_norm": 10.210301399230957,
+ "learning_rate": 1.9629069347171144e-05,
+ "loss": 1.4414,
+ "step": 4197
+ },
+ {
+ "epoch": 11.438692098092643,
+ "grad_norm": 7.53134822845459,
+ "learning_rate": 1.9628831182867833e-05,
+ "loss": 1.3176,
+ "step": 4198
+ },
+ {
+ "epoch": 11.44141689373297,
+ "grad_norm": 7.884014129638672,
+ "learning_rate": 1.9628592943575494e-05,
+ "loss": 1.1528,
+ "step": 4199
+ },
+ {
+ "epoch": 11.444141689373296,
+ "grad_norm": 11.789016723632812,
+ "learning_rate": 1.9628354629295983e-05,
+ "loss": 1.2783,
+ "step": 4200
+ },
+ {
+ "epoch": 11.446866485013624,
+ "grad_norm": 12.273369789123535,
+ "learning_rate": 1.962811624003116e-05,
+ "loss": 1.2969,
+ "step": 4201
+ },
+ {
+ "epoch": 11.449591280653951,
+ "grad_norm": 9.086417198181152,
+ "learning_rate": 1.9627877775782873e-05,
+ "loss": 1.1382,
+ "step": 4202
+ },
+ {
+ "epoch": 11.452316076294277,
+ "grad_norm": 7.977797031402588,
+ "learning_rate": 1.9627639236552983e-05,
+ "loss": 1.3462,
+ "step": 4203
+ },
+ {
+ "epoch": 11.455040871934605,
+ "grad_norm": 8.445021629333496,
+ "learning_rate": 1.9627400622343354e-05,
+ "loss": 1.2949,
+ "step": 4204
+ },
+ {
+ "epoch": 11.457765667574932,
+ "grad_norm": 8.467462539672852,
+ "learning_rate": 1.9627161933155833e-05,
+ "loss": 1.3215,
+ "step": 4205
+ },
+ {
+ "epoch": 11.460490463215258,
+ "grad_norm": 9.459888458251953,
+ "learning_rate": 1.962692316899229e-05,
+ "loss": 1.1018,
+ "step": 4206
+ },
+ {
+ "epoch": 11.463215258855586,
+ "grad_norm": 8.615829467773438,
+ "learning_rate": 1.9626684329854575e-05,
+ "loss": 1.1511,
+ "step": 4207
+ },
+ {
+ "epoch": 11.465940054495913,
+ "grad_norm": 9.40342903137207,
+ "learning_rate": 1.9626445415744552e-05,
+ "loss": 1.0793,
+ "step": 4208
+ },
+ {
+ "epoch": 11.46866485013624,
+ "grad_norm": 10.980266571044922,
+ "learning_rate": 1.9626206426664084e-05,
+ "loss": 1.1465,
+ "step": 4209
+ },
+ {
+ "epoch": 11.471389645776567,
+ "grad_norm": 8.530308723449707,
+ "learning_rate": 1.962596736261503e-05,
+ "loss": 1.1807,
+ "step": 4210
+ },
+ {
+ "epoch": 11.474114441416894,
+ "grad_norm": 8.508332252502441,
+ "learning_rate": 1.9625728223599253e-05,
+ "loss": 1.2659,
+ "step": 4211
+ },
+ {
+ "epoch": 11.47683923705722,
+ "grad_norm": 8.210857391357422,
+ "learning_rate": 1.962548900961861e-05,
+ "loss": 1.1379,
+ "step": 4212
+ },
+ {
+ "epoch": 11.479564032697548,
+ "grad_norm": 9.084643363952637,
+ "learning_rate": 1.9625249720674975e-05,
+ "loss": 1.377,
+ "step": 4213
+ },
+ {
+ "epoch": 11.482288828337875,
+ "grad_norm": 11.54325008392334,
+ "learning_rate": 1.96250103567702e-05,
+ "loss": 1.4338,
+ "step": 4214
+ },
+ {
+ "epoch": 11.485013623978201,
+ "grad_norm": 10.700432777404785,
+ "learning_rate": 1.9624770917906156e-05,
+ "loss": 1.0547,
+ "step": 4215
+ },
+ {
+ "epoch": 11.487738419618529,
+ "grad_norm": 8.42674446105957,
+ "learning_rate": 1.9624531404084704e-05,
+ "loss": 1.2573,
+ "step": 4216
+ },
+ {
+ "epoch": 11.490463215258856,
+ "grad_norm": 10.657425880432129,
+ "learning_rate": 1.962429181530771e-05,
+ "loss": 1.2754,
+ "step": 4217
+ },
+ {
+ "epoch": 11.493188010899182,
+ "grad_norm": 7.15110445022583,
+ "learning_rate": 1.9624052151577047e-05,
+ "loss": 1.0391,
+ "step": 4218
+ },
+ {
+ "epoch": 11.49591280653951,
+ "grad_norm": 8.82170295715332,
+ "learning_rate": 1.962381241289457e-05,
+ "loss": 1.4329,
+ "step": 4219
+ },
+ {
+ "epoch": 11.498637602179837,
+ "grad_norm": 10.280640602111816,
+ "learning_rate": 1.9623572599262156e-05,
+ "loss": 1.3613,
+ "step": 4220
+ },
+ {
+ "epoch": 11.501362397820163,
+ "grad_norm": 8.611913681030273,
+ "learning_rate": 1.9623332710681666e-05,
+ "loss": 1.1653,
+ "step": 4221
+ },
+ {
+ "epoch": 11.50408719346049,
+ "grad_norm": 7.79402494430542,
+ "learning_rate": 1.962309274715497e-05,
+ "loss": 1.1033,
+ "step": 4222
+ },
+ {
+ "epoch": 11.506811989100818,
+ "grad_norm": 9.2391939163208,
+ "learning_rate": 1.962285270868394e-05,
+ "loss": 1.2617,
+ "step": 4223
+ },
+ {
+ "epoch": 11.509536784741144,
+ "grad_norm": 8.58356761932373,
+ "learning_rate": 1.962261259527044e-05,
+ "loss": 1.2402,
+ "step": 4224
+ },
+ {
+ "epoch": 11.512261580381471,
+ "grad_norm": 10.11650562286377,
+ "learning_rate": 1.9622372406916343e-05,
+ "loss": 1.1157,
+ "step": 4225
+ },
+ {
+ "epoch": 11.514986376021799,
+ "grad_norm": 10.219006538391113,
+ "learning_rate": 1.9622132143623524e-05,
+ "loss": 1.2388,
+ "step": 4226
+ },
+ {
+ "epoch": 11.517711171662125,
+ "grad_norm": 10.135218620300293,
+ "learning_rate": 1.9621891805393846e-05,
+ "loss": 1.2124,
+ "step": 4227
+ },
+ {
+ "epoch": 11.520435967302452,
+ "grad_norm": 9.944450378417969,
+ "learning_rate": 1.9621651392229182e-05,
+ "loss": 1.3591,
+ "step": 4228
+ },
+ {
+ "epoch": 11.52316076294278,
+ "grad_norm": 8.386174201965332,
+ "learning_rate": 1.9621410904131407e-05,
+ "loss": 1.2812,
+ "step": 4229
+ },
+ {
+ "epoch": 11.525885558583106,
+ "grad_norm": 9.262544631958008,
+ "learning_rate": 1.9621170341102396e-05,
+ "loss": 1.436,
+ "step": 4230
+ },
+ {
+ "epoch": 11.528610354223433,
+ "grad_norm": 10.720914840698242,
+ "learning_rate": 1.962092970314402e-05,
+ "loss": 1.3401,
+ "step": 4231
+ },
+ {
+ "epoch": 11.53133514986376,
+ "grad_norm": 7.582281589508057,
+ "learning_rate": 1.9620688990258152e-05,
+ "loss": 1.2751,
+ "step": 4232
+ },
+ {
+ "epoch": 11.534059945504087,
+ "grad_norm": 9.216172218322754,
+ "learning_rate": 1.962044820244667e-05,
+ "loss": 1.1741,
+ "step": 4233
+ },
+ {
+ "epoch": 11.536784741144414,
+ "grad_norm": 8.738519668579102,
+ "learning_rate": 1.9620207339711442e-05,
+ "loss": 1.1365,
+ "step": 4234
+ },
+ {
+ "epoch": 11.539509536784742,
+ "grad_norm": 9.072188377380371,
+ "learning_rate": 1.9619966402054355e-05,
+ "loss": 1.3137,
+ "step": 4235
+ },
+ {
+ "epoch": 11.542234332425068,
+ "grad_norm": 8.85590648651123,
+ "learning_rate": 1.9619725389477275e-05,
+ "loss": 1.2622,
+ "step": 4236
+ },
+ {
+ "epoch": 11.544959128065395,
+ "grad_norm": 9.035333633422852,
+ "learning_rate": 1.9619484301982086e-05,
+ "loss": 1.2571,
+ "step": 4237
+ },
+ {
+ "epoch": 11.547683923705723,
+ "grad_norm": 7.747833251953125,
+ "learning_rate": 1.961924313957066e-05,
+ "loss": 1.323,
+ "step": 4238
+ },
+ {
+ "epoch": 11.550408719346049,
+ "grad_norm": 7.55806827545166,
+ "learning_rate": 1.961900190224488e-05,
+ "loss": 1.4465,
+ "step": 4239
+ },
+ {
+ "epoch": 11.553133514986376,
+ "grad_norm": 10.450825691223145,
+ "learning_rate": 1.9618760590006623e-05,
+ "loss": 1.2168,
+ "step": 4240
+ },
+ {
+ "epoch": 11.555858310626704,
+ "grad_norm": 9.569533348083496,
+ "learning_rate": 1.9618519202857768e-05,
+ "loss": 1.3794,
+ "step": 4241
+ },
+ {
+ "epoch": 11.55858310626703,
+ "grad_norm": 8.513108253479004,
+ "learning_rate": 1.9618277740800195e-05,
+ "loss": 1.082,
+ "step": 4242
+ },
+ {
+ "epoch": 11.561307901907357,
+ "grad_norm": 11.943915367126465,
+ "learning_rate": 1.961803620383578e-05,
+ "loss": 1.261,
+ "step": 4243
+ },
+ {
+ "epoch": 11.564032697547685,
+ "grad_norm": 8.429560661315918,
+ "learning_rate": 1.9617794591966418e-05,
+ "loss": 1.1899,
+ "step": 4244
+ },
+ {
+ "epoch": 11.56675749318801,
+ "grad_norm": 7.78025484085083,
+ "learning_rate": 1.9617552905193972e-05,
+ "loss": 1.2947,
+ "step": 4245
+ },
+ {
+ "epoch": 11.569482288828338,
+ "grad_norm": 11.231201171875,
+ "learning_rate": 1.961731114352034e-05,
+ "loss": 1.3087,
+ "step": 4246
+ },
+ {
+ "epoch": 11.572207084468666,
+ "grad_norm": 8.603983879089355,
+ "learning_rate": 1.9617069306947394e-05,
+ "loss": 1.2297,
+ "step": 4247
+ },
+ {
+ "epoch": 11.574931880108991,
+ "grad_norm": 9.307816505432129,
+ "learning_rate": 1.9616827395477026e-05,
+ "loss": 1.1334,
+ "step": 4248
+ },
+ {
+ "epoch": 11.577656675749319,
+ "grad_norm": 8.92887020111084,
+ "learning_rate": 1.961658540911111e-05,
+ "loss": 1.3169,
+ "step": 4249
+ },
+ {
+ "epoch": 11.580381471389646,
+ "grad_norm": 8.824298858642578,
+ "learning_rate": 1.961634334785154e-05,
+ "loss": 1.2552,
+ "step": 4250
+ },
+ {
+ "epoch": 11.583106267029972,
+ "grad_norm": 8.4943208694458,
+ "learning_rate": 1.9616101211700198e-05,
+ "loss": 1.1731,
+ "step": 4251
+ },
+ {
+ "epoch": 11.5858310626703,
+ "grad_norm": 11.546370506286621,
+ "learning_rate": 1.961585900065897e-05,
+ "loss": 1.259,
+ "step": 4252
+ },
+ {
+ "epoch": 11.588555858310627,
+ "grad_norm": 11.164836883544922,
+ "learning_rate": 1.961561671472974e-05,
+ "loss": 1.3291,
+ "step": 4253
+ },
+ {
+ "epoch": 11.591280653950953,
+ "grad_norm": 9.311529159545898,
+ "learning_rate": 1.9615374353914395e-05,
+ "loss": 1.4153,
+ "step": 4254
+ },
+ {
+ "epoch": 11.59400544959128,
+ "grad_norm": 10.316414833068848,
+ "learning_rate": 1.9615131918214824e-05,
+ "loss": 1.4077,
+ "step": 4255
+ },
+ {
+ "epoch": 11.596730245231608,
+ "grad_norm": 25.058340072631836,
+ "learning_rate": 1.961488940763292e-05,
+ "loss": 1.2662,
+ "step": 4256
+ },
+ {
+ "epoch": 11.599455040871934,
+ "grad_norm": 14.15247917175293,
+ "learning_rate": 1.961464682217056e-05,
+ "loss": 1.3037,
+ "step": 4257
+ },
+ {
+ "epoch": 11.602179836512262,
+ "grad_norm": 10.92613410949707,
+ "learning_rate": 1.9614404161829643e-05,
+ "loss": 1.3882,
+ "step": 4258
+ },
+ {
+ "epoch": 11.60490463215259,
+ "grad_norm": 8.810829162597656,
+ "learning_rate": 1.9614161426612056e-05,
+ "loss": 1.2002,
+ "step": 4259
+ },
+ {
+ "epoch": 11.607629427792915,
+ "grad_norm": 8.915725708007812,
+ "learning_rate": 1.9613918616519688e-05,
+ "loss": 1.2571,
+ "step": 4260
+ },
+ {
+ "epoch": 11.610354223433243,
+ "grad_norm": 10.085176467895508,
+ "learning_rate": 1.9613675731554435e-05,
+ "loss": 1.1372,
+ "step": 4261
+ },
+ {
+ "epoch": 11.61307901907357,
+ "grad_norm": 9.723475456237793,
+ "learning_rate": 1.961343277171818e-05,
+ "loss": 1.2898,
+ "step": 4262
+ },
+ {
+ "epoch": 11.615803814713896,
+ "grad_norm": 7.391706943511963,
+ "learning_rate": 1.9613189737012824e-05,
+ "loss": 1.0732,
+ "step": 4263
+ },
+ {
+ "epoch": 11.618528610354224,
+ "grad_norm": 8.334680557250977,
+ "learning_rate": 1.9612946627440254e-05,
+ "loss": 1.2378,
+ "step": 4264
+ },
+ {
+ "epoch": 11.621253405994551,
+ "grad_norm": 10.083943367004395,
+ "learning_rate": 1.9612703443002366e-05,
+ "loss": 1.4141,
+ "step": 4265
+ },
+ {
+ "epoch": 11.623978201634877,
+ "grad_norm": 8.957664489746094,
+ "learning_rate": 1.9612460183701053e-05,
+ "loss": 1.1027,
+ "step": 4266
+ },
+ {
+ "epoch": 11.626702997275205,
+ "grad_norm": 9.454508781433105,
+ "learning_rate": 1.9612216849538205e-05,
+ "loss": 1.1311,
+ "step": 4267
+ },
+ {
+ "epoch": 11.629427792915532,
+ "grad_norm": 10.544790267944336,
+ "learning_rate": 1.9611973440515724e-05,
+ "loss": 1.3735,
+ "step": 4268
+ },
+ {
+ "epoch": 11.632152588555858,
+ "grad_norm": 13.891005516052246,
+ "learning_rate": 1.9611729956635507e-05,
+ "loss": 1.0608,
+ "step": 4269
+ },
+ {
+ "epoch": 11.634877384196185,
+ "grad_norm": 12.7100830078125,
+ "learning_rate": 1.9611486397899445e-05,
+ "loss": 1.3298,
+ "step": 4270
+ },
+ {
+ "epoch": 11.637602179836513,
+ "grad_norm": 8.996678352355957,
+ "learning_rate": 1.9611242764309434e-05,
+ "loss": 1.4302,
+ "step": 4271
+ },
+ {
+ "epoch": 11.640326975476839,
+ "grad_norm": 9.974884986877441,
+ "learning_rate": 1.9610999055867376e-05,
+ "loss": 1.2512,
+ "step": 4272
+ },
+ {
+ "epoch": 11.643051771117166,
+ "grad_norm": 10.96886157989502,
+ "learning_rate": 1.9610755272575167e-05,
+ "loss": 1.3538,
+ "step": 4273
+ },
+ {
+ "epoch": 11.645776566757494,
+ "grad_norm": 9.486754417419434,
+ "learning_rate": 1.96105114144347e-05,
+ "loss": 1.1885,
+ "step": 4274
+ },
+ {
+ "epoch": 11.64850136239782,
+ "grad_norm": 9.534106254577637,
+ "learning_rate": 1.9610267481447883e-05,
+ "loss": 1.2775,
+ "step": 4275
+ },
+ {
+ "epoch": 11.651226158038147,
+ "grad_norm": 9.522997856140137,
+ "learning_rate": 1.9610023473616616e-05,
+ "loss": 1.1348,
+ "step": 4276
+ },
+ {
+ "epoch": 11.653950953678475,
+ "grad_norm": 10.608443260192871,
+ "learning_rate": 1.960977939094279e-05,
+ "loss": 1.3552,
+ "step": 4277
+ },
+ {
+ "epoch": 11.6566757493188,
+ "grad_norm": 10.006903648376465,
+ "learning_rate": 1.9609535233428313e-05,
+ "loss": 1.2917,
+ "step": 4278
+ },
+ {
+ "epoch": 11.659400544959128,
+ "grad_norm": 10.470991134643555,
+ "learning_rate": 1.9609291001075082e-05,
+ "loss": 1.3833,
+ "step": 4279
+ },
+ {
+ "epoch": 11.662125340599456,
+ "grad_norm": 9.588545799255371,
+ "learning_rate": 1.9609046693885007e-05,
+ "loss": 1.27,
+ "step": 4280
+ },
+ {
+ "epoch": 11.664850136239782,
+ "grad_norm": 19.973514556884766,
+ "learning_rate": 1.9608802311859984e-05,
+ "loss": 1.3926,
+ "step": 4281
+ },
+ {
+ "epoch": 11.66757493188011,
+ "grad_norm": 20.925952911376953,
+ "learning_rate": 1.9608557855001918e-05,
+ "loss": 1.2761,
+ "step": 4282
+ },
+ {
+ "epoch": 11.670299727520437,
+ "grad_norm": 9.654898643493652,
+ "learning_rate": 1.9608313323312712e-05,
+ "loss": 1.3579,
+ "step": 4283
+ },
+ {
+ "epoch": 11.673024523160763,
+ "grad_norm": 10.667916297912598,
+ "learning_rate": 1.960806871679427e-05,
+ "loss": 1.2363,
+ "step": 4284
+ },
+ {
+ "epoch": 11.67574931880109,
+ "grad_norm": 8.566445350646973,
+ "learning_rate": 1.96078240354485e-05,
+ "loss": 1.1454,
+ "step": 4285
+ },
+ {
+ "epoch": 11.678474114441418,
+ "grad_norm": 8.778693199157715,
+ "learning_rate": 1.9607579279277304e-05,
+ "loss": 1.177,
+ "step": 4286
+ },
+ {
+ "epoch": 11.681198910081743,
+ "grad_norm": 13.553953170776367,
+ "learning_rate": 1.960733444828259e-05,
+ "loss": 1.4387,
+ "step": 4287
+ },
+ {
+ "epoch": 11.683923705722071,
+ "grad_norm": 9.751891136169434,
+ "learning_rate": 1.9607089542466266e-05,
+ "loss": 1.2366,
+ "step": 4288
+ },
+ {
+ "epoch": 11.686648501362399,
+ "grad_norm": 10.268438339233398,
+ "learning_rate": 1.960684456183024e-05,
+ "loss": 1.3503,
+ "step": 4289
+ },
+ {
+ "epoch": 11.689373297002724,
+ "grad_norm": 13.085841178894043,
+ "learning_rate": 1.9606599506376415e-05,
+ "loss": 1.1855,
+ "step": 4290
+ },
+ {
+ "epoch": 11.692098092643052,
+ "grad_norm": 9.935746192932129,
+ "learning_rate": 1.96063543761067e-05,
+ "loss": 1.104,
+ "step": 4291
+ },
+ {
+ "epoch": 11.69482288828338,
+ "grad_norm": 10.535567283630371,
+ "learning_rate": 1.960610917102301e-05,
+ "loss": 1.2815,
+ "step": 4292
+ },
+ {
+ "epoch": 11.697547683923705,
+ "grad_norm": 10.67478084564209,
+ "learning_rate": 1.9605863891127247e-05,
+ "loss": 1.1548,
+ "step": 4293
+ },
+ {
+ "epoch": 11.700272479564033,
+ "grad_norm": 9.28094482421875,
+ "learning_rate": 1.960561853642133e-05,
+ "loss": 1.2197,
+ "step": 4294
+ },
+ {
+ "epoch": 11.70299727520436,
+ "grad_norm": 9.412829399108887,
+ "learning_rate": 1.960537310690716e-05,
+ "loss": 1.0266,
+ "step": 4295
+ },
+ {
+ "epoch": 11.705722070844686,
+ "grad_norm": 14.982603073120117,
+ "learning_rate": 1.9605127602586656e-05,
+ "loss": 1.3112,
+ "step": 4296
+ },
+ {
+ "epoch": 11.708446866485014,
+ "grad_norm": 12.387552261352539,
+ "learning_rate": 1.9604882023461725e-05,
+ "loss": 1.4277,
+ "step": 4297
+ },
+ {
+ "epoch": 11.711171662125341,
+ "grad_norm": 13.129229545593262,
+ "learning_rate": 1.9604636369534285e-05,
+ "loss": 1.2236,
+ "step": 4298
+ },
+ {
+ "epoch": 11.713896457765667,
+ "grad_norm": 11.800368309020996,
+ "learning_rate": 1.9604390640806246e-05,
+ "loss": 1.261,
+ "step": 4299
+ },
+ {
+ "epoch": 11.716621253405995,
+ "grad_norm": 15.784507751464844,
+ "learning_rate": 1.9604144837279523e-05,
+ "loss": 1.1934,
+ "step": 4300
+ },
+ {
+ "epoch": 11.719346049046322,
+ "grad_norm": 8.646052360534668,
+ "learning_rate": 1.9603898958956024e-05,
+ "loss": 1.166,
+ "step": 4301
+ },
+ {
+ "epoch": 11.722070844686648,
+ "grad_norm": 9.307878494262695,
+ "learning_rate": 1.960365300583767e-05,
+ "loss": 1.0243,
+ "step": 4302
+ },
+ {
+ "epoch": 11.724795640326976,
+ "grad_norm": 11.6644926071167,
+ "learning_rate": 1.960340697792638e-05,
+ "loss": 1.1243,
+ "step": 4303
+ },
+ {
+ "epoch": 11.727520435967303,
+ "grad_norm": 10.589908599853516,
+ "learning_rate": 1.9603160875224067e-05,
+ "loss": 1.4622,
+ "step": 4304
+ },
+ {
+ "epoch": 11.730245231607629,
+ "grad_norm": 8.321166038513184,
+ "learning_rate": 1.960291469773264e-05,
+ "loss": 1.2344,
+ "step": 4305
+ },
+ {
+ "epoch": 11.732970027247957,
+ "grad_norm": 11.593385696411133,
+ "learning_rate": 1.9602668445454024e-05,
+ "loss": 1.1692,
+ "step": 4306
+ },
+ {
+ "epoch": 11.735694822888284,
+ "grad_norm": 10.745800971984863,
+ "learning_rate": 1.9602422118390138e-05,
+ "loss": 1.3217,
+ "step": 4307
+ },
+ {
+ "epoch": 11.73841961852861,
+ "grad_norm": 8.608404159545898,
+ "learning_rate": 1.9602175716542895e-05,
+ "loss": 1.1926,
+ "step": 4308
+ },
+ {
+ "epoch": 11.741144414168938,
+ "grad_norm": 9.466004371643066,
+ "learning_rate": 1.9601929239914217e-05,
+ "loss": 1.2781,
+ "step": 4309
+ },
+ {
+ "epoch": 11.743869209809265,
+ "grad_norm": 9.192959785461426,
+ "learning_rate": 1.960168268850602e-05,
+ "loss": 1.2083,
+ "step": 4310
+ },
+ {
+ "epoch": 11.746594005449591,
+ "grad_norm": 17.6987361907959,
+ "learning_rate": 1.9601436062320232e-05,
+ "loss": 1.333,
+ "step": 4311
+ },
+ {
+ "epoch": 11.749318801089919,
+ "grad_norm": 8.098871231079102,
+ "learning_rate": 1.960118936135877e-05,
+ "loss": 1.2598,
+ "step": 4312
+ },
+ {
+ "epoch": 11.752043596730246,
+ "grad_norm": 11.7301607131958,
+ "learning_rate": 1.960094258562355e-05,
+ "loss": 1.4526,
+ "step": 4313
+ },
+ {
+ "epoch": 11.754768392370572,
+ "grad_norm": 9.770210266113281,
+ "learning_rate": 1.9600695735116503e-05,
+ "loss": 1.2316,
+ "step": 4314
+ },
+ {
+ "epoch": 11.7574931880109,
+ "grad_norm": 8.813011169433594,
+ "learning_rate": 1.9600448809839542e-05,
+ "loss": 1.3875,
+ "step": 4315
+ },
+ {
+ "epoch": 11.760217983651227,
+ "grad_norm": 10.773046493530273,
+ "learning_rate": 1.9600201809794596e-05,
+ "loss": 1.2832,
+ "step": 4316
+ },
+ {
+ "epoch": 11.762942779291553,
+ "grad_norm": 8.112799644470215,
+ "learning_rate": 1.9599954734983586e-05,
+ "loss": 1.3123,
+ "step": 4317
+ },
+ {
+ "epoch": 11.76566757493188,
+ "grad_norm": 24.07083511352539,
+ "learning_rate": 1.9599707585408438e-05,
+ "loss": 1.3369,
+ "step": 4318
+ },
+ {
+ "epoch": 11.768392370572208,
+ "grad_norm": 12.28234577178955,
+ "learning_rate": 1.959946036107108e-05,
+ "loss": 1.397,
+ "step": 4319
+ },
+ {
+ "epoch": 11.771117166212534,
+ "grad_norm": 10.630733489990234,
+ "learning_rate": 1.959921306197343e-05,
+ "loss": 1.2463,
+ "step": 4320
+ },
+ {
+ "epoch": 11.773841961852861,
+ "grad_norm": 12.136207580566406,
+ "learning_rate": 1.959896568811742e-05,
+ "loss": 1.1973,
+ "step": 4321
+ },
+ {
+ "epoch": 11.776566757493189,
+ "grad_norm": 12.15300464630127,
+ "learning_rate": 1.959871823950497e-05,
+ "loss": 1.1873,
+ "step": 4322
+ },
+ {
+ "epoch": 11.779291553133515,
+ "grad_norm": 9.693768501281738,
+ "learning_rate": 1.9598470716138015e-05,
+ "loss": 1.3191,
+ "step": 4323
+ },
+ {
+ "epoch": 11.782016348773842,
+ "grad_norm": 10.026284217834473,
+ "learning_rate": 1.9598223118018477e-05,
+ "loss": 1.3662,
+ "step": 4324
+ },
+ {
+ "epoch": 11.78474114441417,
+ "grad_norm": 9.156767845153809,
+ "learning_rate": 1.959797544514829e-05,
+ "loss": 1.241,
+ "step": 4325
+ },
+ {
+ "epoch": 11.787465940054496,
+ "grad_norm": 11.601896286010742,
+ "learning_rate": 1.9597727697529373e-05,
+ "loss": 1.281,
+ "step": 4326
+ },
+ {
+ "epoch": 11.790190735694823,
+ "grad_norm": 9.980677604675293,
+ "learning_rate": 1.9597479875163666e-05,
+ "loss": 1.2557,
+ "step": 4327
+ },
+ {
+ "epoch": 11.79291553133515,
+ "grad_norm": 10.158729553222656,
+ "learning_rate": 1.9597231978053095e-05,
+ "loss": 1.1277,
+ "step": 4328
+ },
+ {
+ "epoch": 11.795640326975477,
+ "grad_norm": 11.920785903930664,
+ "learning_rate": 1.9596984006199585e-05,
+ "loss": 1.3772,
+ "step": 4329
+ },
+ {
+ "epoch": 11.798365122615804,
+ "grad_norm": 12.154458045959473,
+ "learning_rate": 1.9596735959605077e-05,
+ "loss": 1.2166,
+ "step": 4330
+ },
+ {
+ "epoch": 11.80108991825613,
+ "grad_norm": 12.615863800048828,
+ "learning_rate": 1.95964878382715e-05,
+ "loss": 1.1858,
+ "step": 4331
+ },
+ {
+ "epoch": 11.803814713896458,
+ "grad_norm": 9.947614669799805,
+ "learning_rate": 1.9596239642200784e-05,
+ "loss": 1.5405,
+ "step": 4332
+ },
+ {
+ "epoch": 11.806539509536785,
+ "grad_norm": 16.928955078125,
+ "learning_rate": 1.959599137139486e-05,
+ "loss": 1.182,
+ "step": 4333
+ },
+ {
+ "epoch": 11.809264305177111,
+ "grad_norm": 7.814918041229248,
+ "learning_rate": 1.959574302585566e-05,
+ "loss": 1.1677,
+ "step": 4334
+ },
+ {
+ "epoch": 11.811989100817438,
+ "grad_norm": 9.805076599121094,
+ "learning_rate": 1.9595494605585127e-05,
+ "loss": 1.2236,
+ "step": 4335
+ },
+ {
+ "epoch": 11.814713896457766,
+ "grad_norm": 18.602846145629883,
+ "learning_rate": 1.9595246110585194e-05,
+ "loss": 1.3203,
+ "step": 4336
+ },
+ {
+ "epoch": 11.817438692098092,
+ "grad_norm": 9.417820930480957,
+ "learning_rate": 1.959499754085779e-05,
+ "loss": 1.2467,
+ "step": 4337
+ },
+ {
+ "epoch": 11.82016348773842,
+ "grad_norm": 8.117120742797852,
+ "learning_rate": 1.9594748896404853e-05,
+ "loss": 1.2739,
+ "step": 4338
+ },
+ {
+ "epoch": 11.822888283378747,
+ "grad_norm": 10.711532592773438,
+ "learning_rate": 1.9594500177228322e-05,
+ "loss": 1.3523,
+ "step": 4339
+ },
+ {
+ "epoch": 11.825613079019073,
+ "grad_norm": 11.009588241577148,
+ "learning_rate": 1.959425138333013e-05,
+ "loss": 1.4854,
+ "step": 4340
+ },
+ {
+ "epoch": 11.8283378746594,
+ "grad_norm": 13.619063377380371,
+ "learning_rate": 1.959400251471222e-05,
+ "loss": 1.3606,
+ "step": 4341
+ },
+ {
+ "epoch": 11.831062670299728,
+ "grad_norm": 8.956987380981445,
+ "learning_rate": 1.9593753571376524e-05,
+ "loss": 1.2725,
+ "step": 4342
+ },
+ {
+ "epoch": 11.833787465940054,
+ "grad_norm": 10.285244941711426,
+ "learning_rate": 1.9593504553324987e-05,
+ "loss": 1.198,
+ "step": 4343
+ },
+ {
+ "epoch": 11.836512261580381,
+ "grad_norm": 12.4805908203125,
+ "learning_rate": 1.9593255460559543e-05,
+ "loss": 1.2314,
+ "step": 4344
+ },
+ {
+ "epoch": 11.839237057220709,
+ "grad_norm": 33.98967361450195,
+ "learning_rate": 1.9593006293082134e-05,
+ "loss": 1.2979,
+ "step": 4345
+ },
+ {
+ "epoch": 11.841961852861035,
+ "grad_norm": 11.135168075561523,
+ "learning_rate": 1.9592757050894705e-05,
+ "loss": 1.2222,
+ "step": 4346
+ },
+ {
+ "epoch": 11.844686648501362,
+ "grad_norm": 8.834343910217285,
+ "learning_rate": 1.9592507733999187e-05,
+ "loss": 1.1731,
+ "step": 4347
+ },
+ {
+ "epoch": 11.84741144414169,
+ "grad_norm": 10.759552001953125,
+ "learning_rate": 1.959225834239753e-05,
+ "loss": 1.2273,
+ "step": 4348
+ },
+ {
+ "epoch": 11.850136239782016,
+ "grad_norm": 8.94282054901123,
+ "learning_rate": 1.9592008876091676e-05,
+ "loss": 1.3877,
+ "step": 4349
+ },
+ {
+ "epoch": 11.852861035422343,
+ "grad_norm": 8.68305778503418,
+ "learning_rate": 1.9591759335083563e-05,
+ "loss": 1.1846,
+ "step": 4350
+ },
+ {
+ "epoch": 11.85558583106267,
+ "grad_norm": 10.559568405151367,
+ "learning_rate": 1.9591509719375136e-05,
+ "loss": 1.2915,
+ "step": 4351
+ },
+ {
+ "epoch": 11.858310626702997,
+ "grad_norm": 10.871464729309082,
+ "learning_rate": 1.9591260028968344e-05,
+ "loss": 1.3989,
+ "step": 4352
+ },
+ {
+ "epoch": 11.861035422343324,
+ "grad_norm": 9.31416130065918,
+ "learning_rate": 1.9591010263865125e-05,
+ "loss": 1.0696,
+ "step": 4353
+ },
+ {
+ "epoch": 11.863760217983652,
+ "grad_norm": 11.239910125732422,
+ "learning_rate": 1.9590760424067424e-05,
+ "loss": 1.3904,
+ "step": 4354
+ },
+ {
+ "epoch": 11.866485013623977,
+ "grad_norm": 12.502378463745117,
+ "learning_rate": 1.9590510509577195e-05,
+ "loss": 1.4033,
+ "step": 4355
+ },
+ {
+ "epoch": 11.869209809264305,
+ "grad_norm": 13.228873252868652,
+ "learning_rate": 1.9590260520396377e-05,
+ "loss": 1.355,
+ "step": 4356
+ },
+ {
+ "epoch": 11.871934604904633,
+ "grad_norm": 8.481633186340332,
+ "learning_rate": 1.9590010456526917e-05,
+ "loss": 1.3428,
+ "step": 4357
+ },
+ {
+ "epoch": 11.874659400544958,
+ "grad_norm": 11.9637451171875,
+ "learning_rate": 1.9589760317970765e-05,
+ "loss": 1.1692,
+ "step": 4358
+ },
+ {
+ "epoch": 11.877384196185286,
+ "grad_norm": 12.829935073852539,
+ "learning_rate": 1.958951010472987e-05,
+ "loss": 1.1487,
+ "step": 4359
+ },
+ {
+ "epoch": 11.880108991825614,
+ "grad_norm": 8.80949878692627,
+ "learning_rate": 1.9589259816806177e-05,
+ "loss": 1.3743,
+ "step": 4360
+ },
+ {
+ "epoch": 11.88283378746594,
+ "grad_norm": 16.82501983642578,
+ "learning_rate": 1.9589009454201634e-05,
+ "loss": 1.3043,
+ "step": 4361
+ },
+ {
+ "epoch": 11.885558583106267,
+ "grad_norm": 16.30137825012207,
+ "learning_rate": 1.9588759016918198e-05,
+ "loss": 1.0549,
+ "step": 4362
+ },
+ {
+ "epoch": 11.888283378746594,
+ "grad_norm": 11.18465805053711,
+ "learning_rate": 1.9588508504957816e-05,
+ "loss": 1.2505,
+ "step": 4363
+ },
+ {
+ "epoch": 11.89100817438692,
+ "grad_norm": 10.844934463500977,
+ "learning_rate": 1.958825791832244e-05,
+ "loss": 1.2908,
+ "step": 4364
+ },
+ {
+ "epoch": 11.893732970027248,
+ "grad_norm": 8.732866287231445,
+ "learning_rate": 1.9588007257014013e-05,
+ "loss": 1.3306,
+ "step": 4365
+ },
+ {
+ "epoch": 11.896457765667575,
+ "grad_norm": 12.165096282958984,
+ "learning_rate": 1.95877565210345e-05,
+ "loss": 1.2432,
+ "step": 4366
+ },
+ {
+ "epoch": 11.899182561307901,
+ "grad_norm": 11.769744873046875,
+ "learning_rate": 1.9587505710385847e-05,
+ "loss": 1.3108,
+ "step": 4367
+ },
+ {
+ "epoch": 11.901907356948229,
+ "grad_norm": 14.404982566833496,
+ "learning_rate": 1.958725482507001e-05,
+ "loss": 1.2993,
+ "step": 4368
+ },
+ {
+ "epoch": 11.904632152588556,
+ "grad_norm": 10.435540199279785,
+ "learning_rate": 1.9587003865088937e-05,
+ "loss": 1.2786,
+ "step": 4369
+ },
+ {
+ "epoch": 11.907356948228882,
+ "grad_norm": 9.30897331237793,
+ "learning_rate": 1.9586752830444585e-05,
+ "loss": 1.3557,
+ "step": 4370
+ },
+ {
+ "epoch": 11.91008174386921,
+ "grad_norm": 16.349184036254883,
+ "learning_rate": 1.9586501721138914e-05,
+ "loss": 1.3054,
+ "step": 4371
+ },
+ {
+ "epoch": 11.912806539509537,
+ "grad_norm": 11.184679985046387,
+ "learning_rate": 1.9586250537173878e-05,
+ "loss": 1.2993,
+ "step": 4372
+ },
+ {
+ "epoch": 11.915531335149863,
+ "grad_norm": 11.601655006408691,
+ "learning_rate": 1.9585999278551426e-05,
+ "loss": 1.3396,
+ "step": 4373
+ },
+ {
+ "epoch": 11.91825613079019,
+ "grad_norm": 9.532584190368652,
+ "learning_rate": 1.9585747945273526e-05,
+ "loss": 1.4148,
+ "step": 4374
+ },
+ {
+ "epoch": 11.920980926430518,
+ "grad_norm": 13.469198226928711,
+ "learning_rate": 1.9585496537342123e-05,
+ "loss": 1.3572,
+ "step": 4375
+ },
+ {
+ "epoch": 11.923705722070844,
+ "grad_norm": 10.040478706359863,
+ "learning_rate": 1.958524505475919e-05,
+ "loss": 1.0967,
+ "step": 4376
+ },
+ {
+ "epoch": 11.926430517711172,
+ "grad_norm": 28.938920974731445,
+ "learning_rate": 1.958499349752667e-05,
+ "loss": 1.2146,
+ "step": 4377
+ },
+ {
+ "epoch": 11.9291553133515,
+ "grad_norm": 8.300970077514648,
+ "learning_rate": 1.958474186564653e-05,
+ "loss": 1.3777,
+ "step": 4378
+ },
+ {
+ "epoch": 11.931880108991825,
+ "grad_norm": 12.287845611572266,
+ "learning_rate": 1.958449015912073e-05,
+ "loss": 1.4329,
+ "step": 4379
+ },
+ {
+ "epoch": 11.934604904632153,
+ "grad_norm": 10.114580154418945,
+ "learning_rate": 1.958423837795123e-05,
+ "loss": 1.2354,
+ "step": 4380
+ },
+ {
+ "epoch": 11.93732970027248,
+ "grad_norm": 12.478697776794434,
+ "learning_rate": 1.958398652213999e-05,
+ "loss": 1.2632,
+ "step": 4381
+ },
+ {
+ "epoch": 11.940054495912806,
+ "grad_norm": 12.757806777954102,
+ "learning_rate": 1.9583734591688966e-05,
+ "loss": 1.2795,
+ "step": 4382
+ },
+ {
+ "epoch": 11.942779291553133,
+ "grad_norm": 12.535611152648926,
+ "learning_rate": 1.9583482586600132e-05,
+ "loss": 1.2043,
+ "step": 4383
+ },
+ {
+ "epoch": 11.945504087193461,
+ "grad_norm": 13.83928394317627,
+ "learning_rate": 1.958323050687544e-05,
+ "loss": 1.3303,
+ "step": 4384
+ },
+ {
+ "epoch": 11.948228882833787,
+ "grad_norm": 12.60389232635498,
+ "learning_rate": 1.9582978352516863e-05,
+ "loss": 1.2756,
+ "step": 4385
+ },
+ {
+ "epoch": 11.950953678474114,
+ "grad_norm": 13.583793640136719,
+ "learning_rate": 1.958272612352635e-05,
+ "loss": 1.2454,
+ "step": 4386
+ },
+ {
+ "epoch": 11.953678474114442,
+ "grad_norm": 9.803666114807129,
+ "learning_rate": 1.9582473819905884e-05,
+ "loss": 1.2583,
+ "step": 4387
+ },
+ {
+ "epoch": 11.956403269754768,
+ "grad_norm": 9.510045051574707,
+ "learning_rate": 1.9582221441657413e-05,
+ "loss": 1.2581,
+ "step": 4388
+ },
+ {
+ "epoch": 11.959128065395095,
+ "grad_norm": 11.14546012878418,
+ "learning_rate": 1.9581968988782914e-05,
+ "loss": 1.3142,
+ "step": 4389
+ },
+ {
+ "epoch": 11.961852861035423,
+ "grad_norm": 11.336246490478516,
+ "learning_rate": 1.9581716461284344e-05,
+ "loss": 1.3818,
+ "step": 4390
+ },
+ {
+ "epoch": 11.964577656675749,
+ "grad_norm": 9.391512870788574,
+ "learning_rate": 1.958146385916368e-05,
+ "loss": 1.2222,
+ "step": 4391
+ },
+ {
+ "epoch": 11.967302452316076,
+ "grad_norm": 10.746350288391113,
+ "learning_rate": 1.9581211182422882e-05,
+ "loss": 1.186,
+ "step": 4392
+ },
+ {
+ "epoch": 11.970027247956404,
+ "grad_norm": 8.70995044708252,
+ "learning_rate": 1.958095843106392e-05,
+ "loss": 1.1543,
+ "step": 4393
+ },
+ {
+ "epoch": 11.97275204359673,
+ "grad_norm": 10.364996910095215,
+ "learning_rate": 1.958070560508876e-05,
+ "loss": 1.196,
+ "step": 4394
+ },
+ {
+ "epoch": 11.975476839237057,
+ "grad_norm": 11.579974174499512,
+ "learning_rate": 1.9580452704499375e-05,
+ "loss": 1.2598,
+ "step": 4395
+ },
+ {
+ "epoch": 11.978201634877385,
+ "grad_norm": 37.31267166137695,
+ "learning_rate": 1.9580199729297736e-05,
+ "loss": 1.2881,
+ "step": 4396
+ },
+ {
+ "epoch": 11.98092643051771,
+ "grad_norm": 9.780526161193848,
+ "learning_rate": 1.9579946679485803e-05,
+ "loss": 1.3279,
+ "step": 4397
+ },
+ {
+ "epoch": 11.983651226158038,
+ "grad_norm": 8.573712348937988,
+ "learning_rate": 1.9579693555065558e-05,
+ "loss": 1.1371,
+ "step": 4398
+ },
+ {
+ "epoch": 11.986376021798366,
+ "grad_norm": 10.88554859161377,
+ "learning_rate": 1.9579440356038966e-05,
+ "loss": 1.5913,
+ "step": 4399
+ },
+ {
+ "epoch": 11.989100817438691,
+ "grad_norm": 14.26610279083252,
+ "learning_rate": 1.9579187082408003e-05,
+ "loss": 1.2529,
+ "step": 4400
+ },
+ {
+ "epoch": 11.991825613079019,
+ "grad_norm": 10.75584602355957,
+ "learning_rate": 1.957893373417464e-05,
+ "loss": 1.4375,
+ "step": 4401
+ },
+ {
+ "epoch": 11.994550408719347,
+ "grad_norm": 13.039530754089355,
+ "learning_rate": 1.9578680311340846e-05,
+ "loss": 1.2537,
+ "step": 4402
+ },
+ {
+ "epoch": 11.997275204359672,
+ "grad_norm": 9.510915756225586,
+ "learning_rate": 1.95784268139086e-05,
+ "loss": 1.2441,
+ "step": 4403
+ },
+ {
+ "epoch": 12.0,
+ "grad_norm": 11.786630630493164,
+ "learning_rate": 1.957817324187987e-05,
+ "loss": 1.1521,
+ "step": 4404
+ },
+ {
+ "epoch": 12.002724795640328,
+ "grad_norm": 15.739928245544434,
+ "learning_rate": 1.9577919595256642e-05,
+ "loss": 1.0649,
+ "step": 4405
+ },
+ {
+ "epoch": 12.005449591280653,
+ "grad_norm": 8.629070281982422,
+ "learning_rate": 1.9577665874040882e-05,
+ "loss": 1.1111,
+ "step": 4406
+ },
+ {
+ "epoch": 12.008174386920981,
+ "grad_norm": 8.434273719787598,
+ "learning_rate": 1.9577412078234565e-05,
+ "loss": 1.0261,
+ "step": 4407
+ },
+ {
+ "epoch": 12.010899182561309,
+ "grad_norm": 9.693862915039062,
+ "learning_rate": 1.9577158207839674e-05,
+ "loss": 1.1152,
+ "step": 4408
+ },
+ {
+ "epoch": 12.013623978201634,
+ "grad_norm": 6.749441146850586,
+ "learning_rate": 1.9576904262858183e-05,
+ "loss": 1.1797,
+ "step": 4409
+ },
+ {
+ "epoch": 12.016348773841962,
+ "grad_norm": 8.0995454788208,
+ "learning_rate": 1.957665024329207e-05,
+ "loss": 1.1367,
+ "step": 4410
+ },
+ {
+ "epoch": 12.01907356948229,
+ "grad_norm": 9.009051322937012,
+ "learning_rate": 1.9576396149143312e-05,
+ "loss": 1.1127,
+ "step": 4411
+ },
+ {
+ "epoch": 12.021798365122615,
+ "grad_norm": 9.048227310180664,
+ "learning_rate": 1.9576141980413893e-05,
+ "loss": 1.2572,
+ "step": 4412
+ },
+ {
+ "epoch": 12.024523160762943,
+ "grad_norm": 15.703821182250977,
+ "learning_rate": 1.957588773710578e-05,
+ "loss": 1.3508,
+ "step": 4413
+ },
+ {
+ "epoch": 12.02724795640327,
+ "grad_norm": 8.47426700592041,
+ "learning_rate": 1.957563341922097e-05,
+ "loss": 1.1946,
+ "step": 4414
+ },
+ {
+ "epoch": 12.029972752043596,
+ "grad_norm": 10.599610328674316,
+ "learning_rate": 1.957537902676143e-05,
+ "loss": 1.2874,
+ "step": 4415
+ },
+ {
+ "epoch": 12.032697547683924,
+ "grad_norm": 9.831764221191406,
+ "learning_rate": 1.9575124559729147e-05,
+ "loss": 1.0459,
+ "step": 4416
+ },
+ {
+ "epoch": 12.035422343324251,
+ "grad_norm": 8.489566802978516,
+ "learning_rate": 1.9574870018126108e-05,
+ "loss": 1.2295,
+ "step": 4417
+ },
+ {
+ "epoch": 12.038147138964577,
+ "grad_norm": 12.235746383666992,
+ "learning_rate": 1.9574615401954283e-05,
+ "loss": 1.2502,
+ "step": 4418
+ },
+ {
+ "epoch": 12.040871934604905,
+ "grad_norm": 14.411274909973145,
+ "learning_rate": 1.957436071121566e-05,
+ "loss": 1.1135,
+ "step": 4419
+ },
+ {
+ "epoch": 12.043596730245232,
+ "grad_norm": 8.343754768371582,
+ "learning_rate": 1.957410594591223e-05,
+ "loss": 1.0618,
+ "step": 4420
+ },
+ {
+ "epoch": 12.046321525885558,
+ "grad_norm": 8.101775169372559,
+ "learning_rate": 1.9573851106045965e-05,
+ "loss": 1.1919,
+ "step": 4421
+ },
+ {
+ "epoch": 12.049046321525886,
+ "grad_norm": 8.42682933807373,
+ "learning_rate": 1.957359619161886e-05,
+ "loss": 1.2458,
+ "step": 4422
+ },
+ {
+ "epoch": 12.051771117166213,
+ "grad_norm": 10.502134323120117,
+ "learning_rate": 1.9573341202632897e-05,
+ "loss": 1.1694,
+ "step": 4423
+ },
+ {
+ "epoch": 12.054495912806539,
+ "grad_norm": 8.5780611038208,
+ "learning_rate": 1.9573086139090056e-05,
+ "loss": 1.1309,
+ "step": 4424
+ },
+ {
+ "epoch": 12.057220708446867,
+ "grad_norm": 10.66483211517334,
+ "learning_rate": 1.957283100099233e-05,
+ "loss": 1.0049,
+ "step": 4425
+ },
+ {
+ "epoch": 12.059945504087194,
+ "grad_norm": 9.722137451171875,
+ "learning_rate": 1.9572575788341707e-05,
+ "loss": 1.2512,
+ "step": 4426
+ },
+ {
+ "epoch": 12.06267029972752,
+ "grad_norm": 11.696825981140137,
+ "learning_rate": 1.957232050114017e-05,
+ "loss": 1.1697,
+ "step": 4427
+ },
+ {
+ "epoch": 12.065395095367847,
+ "grad_norm": 9.30435848236084,
+ "learning_rate": 1.957206513938971e-05,
+ "loss": 1.1656,
+ "step": 4428
+ },
+ {
+ "epoch": 12.068119891008175,
+ "grad_norm": 7.531614780426025,
+ "learning_rate": 1.957180970309231e-05,
+ "loss": 1.1726,
+ "step": 4429
+ },
+ {
+ "epoch": 12.0708446866485,
+ "grad_norm": 10.614941596984863,
+ "learning_rate": 1.957155419224997e-05,
+ "loss": 1.4146,
+ "step": 4430
+ },
+ {
+ "epoch": 12.073569482288828,
+ "grad_norm": 10.960173606872559,
+ "learning_rate": 1.957129860686467e-05,
+ "loss": 1.136,
+ "step": 4431
+ },
+ {
+ "epoch": 12.076294277929156,
+ "grad_norm": 8.614213943481445,
+ "learning_rate": 1.9571042946938408e-05,
+ "loss": 1.1938,
+ "step": 4432
+ },
+ {
+ "epoch": 12.079019073569482,
+ "grad_norm": 9.550384521484375,
+ "learning_rate": 1.957078721247317e-05,
+ "loss": 1.2781,
+ "step": 4433
+ },
+ {
+ "epoch": 12.08174386920981,
+ "grad_norm": 48.99443054199219,
+ "learning_rate": 1.957053140347095e-05,
+ "loss": 0.9927,
+ "step": 4434
+ },
+ {
+ "epoch": 12.084468664850137,
+ "grad_norm": 10.192533493041992,
+ "learning_rate": 1.957027551993374e-05,
+ "loss": 1.1252,
+ "step": 4435
+ },
+ {
+ "epoch": 12.087193460490463,
+ "grad_norm": 9.485245704650879,
+ "learning_rate": 1.957001956186353e-05,
+ "loss": 1.2756,
+ "step": 4436
+ },
+ {
+ "epoch": 12.08991825613079,
+ "grad_norm": 11.191668510437012,
+ "learning_rate": 1.9569763529262315e-05,
+ "loss": 1.1938,
+ "step": 4437
+ },
+ {
+ "epoch": 12.092643051771118,
+ "grad_norm": 9.03013801574707,
+ "learning_rate": 1.9569507422132092e-05,
+ "loss": 1.1267,
+ "step": 4438
+ },
+ {
+ "epoch": 12.095367847411444,
+ "grad_norm": 11.902277946472168,
+ "learning_rate": 1.956925124047485e-05,
+ "loss": 1.2581,
+ "step": 4439
+ },
+ {
+ "epoch": 12.098092643051771,
+ "grad_norm": 10.63662052154541,
+ "learning_rate": 1.9568994984292592e-05,
+ "loss": 1.1394,
+ "step": 4440
+ },
+ {
+ "epoch": 12.100817438692099,
+ "grad_norm": 7.562166690826416,
+ "learning_rate": 1.9568738653587304e-05,
+ "loss": 1.186,
+ "step": 4441
+ },
+ {
+ "epoch": 12.103542234332425,
+ "grad_norm": 9.163925170898438,
+ "learning_rate": 1.9568482248360992e-05,
+ "loss": 1.0581,
+ "step": 4442
+ },
+ {
+ "epoch": 12.106267029972752,
+ "grad_norm": 10.432324409484863,
+ "learning_rate": 1.956822576861565e-05,
+ "loss": 1.1753,
+ "step": 4443
+ },
+ {
+ "epoch": 12.10899182561308,
+ "grad_norm": 10.020838737487793,
+ "learning_rate": 1.9567969214353266e-05,
+ "loss": 1.1882,
+ "step": 4444
+ },
+ {
+ "epoch": 12.111716621253406,
+ "grad_norm": 10.333386421203613,
+ "learning_rate": 1.956771258557585e-05,
+ "loss": 1.1543,
+ "step": 4445
+ },
+ {
+ "epoch": 12.114441416893733,
+ "grad_norm": 13.603619575500488,
+ "learning_rate": 1.9567455882285397e-05,
+ "loss": 1.3115,
+ "step": 4446
+ },
+ {
+ "epoch": 12.11716621253406,
+ "grad_norm": 8.085104942321777,
+ "learning_rate": 1.95671991044839e-05,
+ "loss": 1.0378,
+ "step": 4447
+ },
+ {
+ "epoch": 12.119891008174386,
+ "grad_norm": 10.977900505065918,
+ "learning_rate": 1.9566942252173373e-05,
+ "loss": 1.2616,
+ "step": 4448
+ },
+ {
+ "epoch": 12.122615803814714,
+ "grad_norm": 11.41482162475586,
+ "learning_rate": 1.9566685325355803e-05,
+ "loss": 1.3162,
+ "step": 4449
+ },
+ {
+ "epoch": 12.125340599455042,
+ "grad_norm": 23.697675704956055,
+ "learning_rate": 1.9566428324033192e-05,
+ "loss": 1.0796,
+ "step": 4450
+ },
+ {
+ "epoch": 12.128065395095367,
+ "grad_norm": 11.825977325439453,
+ "learning_rate": 1.9566171248207552e-05,
+ "loss": 1.2524,
+ "step": 4451
+ },
+ {
+ "epoch": 12.130790190735695,
+ "grad_norm": 9.793973922729492,
+ "learning_rate": 1.9565914097880874e-05,
+ "loss": 1.2634,
+ "step": 4452
+ },
+ {
+ "epoch": 12.133514986376023,
+ "grad_norm": 10.945475578308105,
+ "learning_rate": 1.956565687305517e-05,
+ "loss": 1.3218,
+ "step": 4453
+ },
+ {
+ "epoch": 12.136239782016348,
+ "grad_norm": 7.100282192230225,
+ "learning_rate": 1.9565399573732432e-05,
+ "loss": 1.1567,
+ "step": 4454
+ },
+ {
+ "epoch": 12.138964577656676,
+ "grad_norm": 11.469827651977539,
+ "learning_rate": 1.956514219991467e-05,
+ "loss": 1.1404,
+ "step": 4455
+ },
+ {
+ "epoch": 12.141689373297003,
+ "grad_norm": 8.892791748046875,
+ "learning_rate": 1.956488475160389e-05,
+ "loss": 1.2952,
+ "step": 4456
+ },
+ {
+ "epoch": 12.14441416893733,
+ "grad_norm": 7.216567039489746,
+ "learning_rate": 1.9564627228802098e-05,
+ "loss": 1.1753,
+ "step": 4457
+ },
+ {
+ "epoch": 12.147138964577657,
+ "grad_norm": 7.672146320343018,
+ "learning_rate": 1.9564369631511296e-05,
+ "loss": 1.3711,
+ "step": 4458
+ },
+ {
+ "epoch": 12.149863760217984,
+ "grad_norm": 7.896295547485352,
+ "learning_rate": 1.956411195973349e-05,
+ "loss": 1.0814,
+ "step": 4459
+ },
+ {
+ "epoch": 12.15258855585831,
+ "grad_norm": 9.343679428100586,
+ "learning_rate": 1.956385421347069e-05,
+ "loss": 1.1007,
+ "step": 4460
+ },
+ {
+ "epoch": 12.155313351498638,
+ "grad_norm": 11.700438499450684,
+ "learning_rate": 1.9563596392724897e-05,
+ "loss": 1.3137,
+ "step": 4461
+ },
+ {
+ "epoch": 12.158038147138965,
+ "grad_norm": 10.045361518859863,
+ "learning_rate": 1.9563338497498127e-05,
+ "loss": 1.3904,
+ "step": 4462
+ },
+ {
+ "epoch": 12.160762942779291,
+ "grad_norm": 11.074722290039062,
+ "learning_rate": 1.9563080527792383e-05,
+ "loss": 1.197,
+ "step": 4463
+ },
+ {
+ "epoch": 12.163487738419619,
+ "grad_norm": 15.348587036132812,
+ "learning_rate": 1.9562822483609675e-05,
+ "loss": 1.1335,
+ "step": 4464
+ },
+ {
+ "epoch": 12.166212534059946,
+ "grad_norm": 10.257996559143066,
+ "learning_rate": 1.9562564364952012e-05,
+ "loss": 1.2634,
+ "step": 4465
+ },
+ {
+ "epoch": 12.168937329700272,
+ "grad_norm": 8.52253246307373,
+ "learning_rate": 1.956230617182141e-05,
+ "loss": 1.0405,
+ "step": 4466
+ },
+ {
+ "epoch": 12.1716621253406,
+ "grad_norm": 10.670637130737305,
+ "learning_rate": 1.956204790421987e-05,
+ "loss": 1.271,
+ "step": 4467
+ },
+ {
+ "epoch": 12.174386920980927,
+ "grad_norm": 8.055587768554688,
+ "learning_rate": 1.956178956214941e-05,
+ "loss": 1.2493,
+ "step": 4468
+ },
+ {
+ "epoch": 12.177111716621253,
+ "grad_norm": 8.456838607788086,
+ "learning_rate": 1.9561531145612042e-05,
+ "loss": 0.9962,
+ "step": 4469
+ },
+ {
+ "epoch": 12.17983651226158,
+ "grad_norm": 8.796440124511719,
+ "learning_rate": 1.956127265460978e-05,
+ "loss": 1.1199,
+ "step": 4470
+ },
+ {
+ "epoch": 12.182561307901908,
+ "grad_norm": 8.285974502563477,
+ "learning_rate": 1.9561014089144634e-05,
+ "loss": 1.3137,
+ "step": 4471
+ },
+ {
+ "epoch": 12.185286103542234,
+ "grad_norm": 9.08488941192627,
+ "learning_rate": 1.9560755449218612e-05,
+ "loss": 1.0901,
+ "step": 4472
+ },
+ {
+ "epoch": 12.188010899182562,
+ "grad_norm": 9.358592987060547,
+ "learning_rate": 1.956049673483374e-05,
+ "loss": 1.1443,
+ "step": 4473
+ },
+ {
+ "epoch": 12.190735694822889,
+ "grad_norm": 9.08774471282959,
+ "learning_rate": 1.956023794599202e-05,
+ "loss": 1.2371,
+ "step": 4474
+ },
+ {
+ "epoch": 12.193460490463215,
+ "grad_norm": 16.300308227539062,
+ "learning_rate": 1.9559979082695483e-05,
+ "loss": 1.3635,
+ "step": 4475
+ },
+ {
+ "epoch": 12.196185286103542,
+ "grad_norm": 9.76804256439209,
+ "learning_rate": 1.955972014494613e-05,
+ "loss": 1.3032,
+ "step": 4476
+ },
+ {
+ "epoch": 12.19891008174387,
+ "grad_norm": 8.860701560974121,
+ "learning_rate": 1.955946113274599e-05,
+ "loss": 1.1211,
+ "step": 4477
+ },
+ {
+ "epoch": 12.201634877384196,
+ "grad_norm": 7.7827606201171875,
+ "learning_rate": 1.955920204609707e-05,
+ "loss": 1.2136,
+ "step": 4478
+ },
+ {
+ "epoch": 12.204359673024523,
+ "grad_norm": 9.018577575683594,
+ "learning_rate": 1.9558942885001394e-05,
+ "loss": 1.3269,
+ "step": 4479
+ },
+ {
+ "epoch": 12.207084468664851,
+ "grad_norm": 11.849574089050293,
+ "learning_rate": 1.9558683649460977e-05,
+ "loss": 1.2241,
+ "step": 4480
+ },
+ {
+ "epoch": 12.209809264305177,
+ "grad_norm": 14.160171508789062,
+ "learning_rate": 1.955842433947784e-05,
+ "loss": 1.1177,
+ "step": 4481
+ },
+ {
+ "epoch": 12.212534059945504,
+ "grad_norm": 39.62517547607422,
+ "learning_rate": 1.9558164955054005e-05,
+ "loss": 1.1292,
+ "step": 4482
+ },
+ {
+ "epoch": 12.215258855585832,
+ "grad_norm": 12.130826950073242,
+ "learning_rate": 1.9557905496191485e-05,
+ "loss": 1.1411,
+ "step": 4483
+ },
+ {
+ "epoch": 12.217983651226158,
+ "grad_norm": 9.747757911682129,
+ "learning_rate": 1.9557645962892306e-05,
+ "loss": 1.0795,
+ "step": 4484
+ },
+ {
+ "epoch": 12.220708446866485,
+ "grad_norm": 9.641395568847656,
+ "learning_rate": 1.9557386355158487e-05,
+ "loss": 1.0536,
+ "step": 4485
+ },
+ {
+ "epoch": 12.223433242506813,
+ "grad_norm": 7.763537406921387,
+ "learning_rate": 1.955712667299205e-05,
+ "loss": 1.1582,
+ "step": 4486
+ },
+ {
+ "epoch": 12.226158038147139,
+ "grad_norm": 9.421480178833008,
+ "learning_rate": 1.9556866916395025e-05,
+ "loss": 1.292,
+ "step": 4487
+ },
+ {
+ "epoch": 12.228882833787466,
+ "grad_norm": 19.76326560974121,
+ "learning_rate": 1.9556607085369423e-05,
+ "loss": 1.0522,
+ "step": 4488
+ },
+ {
+ "epoch": 12.231607629427794,
+ "grad_norm": 10.995299339294434,
+ "learning_rate": 1.955634717991727e-05,
+ "loss": 1.1641,
+ "step": 4489
+ },
+ {
+ "epoch": 12.23433242506812,
+ "grad_norm": 8.183566093444824,
+ "learning_rate": 1.9556087200040595e-05,
+ "loss": 1.2008,
+ "step": 4490
+ },
+ {
+ "epoch": 12.237057220708447,
+ "grad_norm": 8.867317199707031,
+ "learning_rate": 1.9555827145741418e-05,
+ "loss": 1.0337,
+ "step": 4491
+ },
+ {
+ "epoch": 12.239782016348773,
+ "grad_norm": 9.299468040466309,
+ "learning_rate": 1.955556701702177e-05,
+ "loss": 1.0896,
+ "step": 4492
+ },
+ {
+ "epoch": 12.2425068119891,
+ "grad_norm": 10.6619873046875,
+ "learning_rate": 1.955530681388367e-05,
+ "loss": 1.1201,
+ "step": 4493
+ },
+ {
+ "epoch": 12.245231607629428,
+ "grad_norm": 8.409582138061523,
+ "learning_rate": 1.9555046536329154e-05,
+ "loss": 1.1041,
+ "step": 4494
+ },
+ {
+ "epoch": 12.247956403269754,
+ "grad_norm": 13.844766616821289,
+ "learning_rate": 1.955478618436024e-05,
+ "loss": 1.2786,
+ "step": 4495
+ },
+ {
+ "epoch": 12.250681198910081,
+ "grad_norm": 9.929696083068848,
+ "learning_rate": 1.9554525757978958e-05,
+ "loss": 1.2646,
+ "step": 4496
+ },
+ {
+ "epoch": 12.253405994550409,
+ "grad_norm": 9.000109672546387,
+ "learning_rate": 1.9554265257187336e-05,
+ "loss": 1.1101,
+ "step": 4497
+ },
+ {
+ "epoch": 12.256130790190735,
+ "grad_norm": 11.595155715942383,
+ "learning_rate": 1.955400468198741e-05,
+ "loss": 1.0933,
+ "step": 4498
+ },
+ {
+ "epoch": 12.258855585831062,
+ "grad_norm": 11.236772537231445,
+ "learning_rate": 1.9553744032381198e-05,
+ "loss": 1.231,
+ "step": 4499
+ },
+ {
+ "epoch": 12.26158038147139,
+ "grad_norm": 9.075350761413574,
+ "learning_rate": 1.9553483308370732e-05,
+ "loss": 1.1371,
+ "step": 4500
+ },
+ {
+ "epoch": 12.264305177111716,
+ "grad_norm": 30.546899795532227,
+ "learning_rate": 1.955322250995805e-05,
+ "loss": 1.1213,
+ "step": 4501
+ },
+ {
+ "epoch": 12.267029972752043,
+ "grad_norm": 12.340591430664062,
+ "learning_rate": 1.9552961637145177e-05,
+ "loss": 1.1868,
+ "step": 4502
+ },
+ {
+ "epoch": 12.269754768392371,
+ "grad_norm": 10.846833229064941,
+ "learning_rate": 1.9552700689934146e-05,
+ "loss": 1.2559,
+ "step": 4503
+ },
+ {
+ "epoch": 12.272479564032697,
+ "grad_norm": 9.99949836730957,
+ "learning_rate": 1.9552439668326993e-05,
+ "loss": 1.1394,
+ "step": 4504
+ },
+ {
+ "epoch": 12.275204359673024,
+ "grad_norm": 10.80855655670166,
+ "learning_rate": 1.955217857232574e-05,
+ "loss": 1.2053,
+ "step": 4505
+ },
+ {
+ "epoch": 12.277929155313352,
+ "grad_norm": 10.59102725982666,
+ "learning_rate": 1.9551917401932436e-05,
+ "loss": 1.229,
+ "step": 4506
+ },
+ {
+ "epoch": 12.280653950953678,
+ "grad_norm": 9.98192310333252,
+ "learning_rate": 1.95516561571491e-05,
+ "loss": 1.1077,
+ "step": 4507
+ },
+ {
+ "epoch": 12.283378746594005,
+ "grad_norm": 10.518499374389648,
+ "learning_rate": 1.9551394837977776e-05,
+ "loss": 1.2952,
+ "step": 4508
+ },
+ {
+ "epoch": 12.286103542234333,
+ "grad_norm": 20.259326934814453,
+ "learning_rate": 1.9551133444420495e-05,
+ "loss": 1.1157,
+ "step": 4509
+ },
+ {
+ "epoch": 12.288828337874659,
+ "grad_norm": 17.111726760864258,
+ "learning_rate": 1.9550871976479297e-05,
+ "loss": 1.1477,
+ "step": 4510
+ },
+ {
+ "epoch": 12.291553133514986,
+ "grad_norm": 18.629878997802734,
+ "learning_rate": 1.9550610434156213e-05,
+ "loss": 1.078,
+ "step": 4511
+ },
+ {
+ "epoch": 12.294277929155314,
+ "grad_norm": 11.988139152526855,
+ "learning_rate": 1.9550348817453286e-05,
+ "loss": 1.2703,
+ "step": 4512
+ },
+ {
+ "epoch": 12.29700272479564,
+ "grad_norm": 10.327305793762207,
+ "learning_rate": 1.9550087126372544e-05,
+ "loss": 1.0684,
+ "step": 4513
+ },
+ {
+ "epoch": 12.299727520435967,
+ "grad_norm": 11.47162914276123,
+ "learning_rate": 1.9549825360916035e-05,
+ "loss": 1.0139,
+ "step": 4514
+ },
+ {
+ "epoch": 12.302452316076295,
+ "grad_norm": 11.214944839477539,
+ "learning_rate": 1.954956352108579e-05,
+ "loss": 1.0042,
+ "step": 4515
+ },
+ {
+ "epoch": 12.30517711171662,
+ "grad_norm": 19.47401237487793,
+ "learning_rate": 1.9549301606883855e-05,
+ "loss": 1.1846,
+ "step": 4516
+ },
+ {
+ "epoch": 12.307901907356948,
+ "grad_norm": 15.151413917541504,
+ "learning_rate": 1.9549039618312268e-05,
+ "loss": 1.1472,
+ "step": 4517
+ },
+ {
+ "epoch": 12.310626702997276,
+ "grad_norm": 16.04181671142578,
+ "learning_rate": 1.9548777555373065e-05,
+ "loss": 1.167,
+ "step": 4518
+ },
+ {
+ "epoch": 12.313351498637601,
+ "grad_norm": 13.755768775939941,
+ "learning_rate": 1.954851541806829e-05,
+ "loss": 1.1953,
+ "step": 4519
+ },
+ {
+ "epoch": 12.316076294277929,
+ "grad_norm": 8.122154235839844,
+ "learning_rate": 1.9548253206399983e-05,
+ "loss": 1.1219,
+ "step": 4520
+ },
+ {
+ "epoch": 12.318801089918257,
+ "grad_norm": 15.348465919494629,
+ "learning_rate": 1.954799092037019e-05,
+ "loss": 1.2222,
+ "step": 4521
+ },
+ {
+ "epoch": 12.321525885558582,
+ "grad_norm": 14.399018287658691,
+ "learning_rate": 1.9547728559980948e-05,
+ "loss": 1.2212,
+ "step": 4522
+ },
+ {
+ "epoch": 12.32425068119891,
+ "grad_norm": 16.025836944580078,
+ "learning_rate": 1.9547466125234305e-05,
+ "loss": 1.0447,
+ "step": 4523
+ },
+ {
+ "epoch": 12.326975476839237,
+ "grad_norm": 16.8812255859375,
+ "learning_rate": 1.95472036161323e-05,
+ "loss": 1.2146,
+ "step": 4524
+ },
+ {
+ "epoch": 12.329700272479563,
+ "grad_norm": 9.85257339477539,
+ "learning_rate": 1.9546941032676986e-05,
+ "loss": 1.5183,
+ "step": 4525
+ },
+ {
+ "epoch": 12.33242506811989,
+ "grad_norm": 9.414003372192383,
+ "learning_rate": 1.95466783748704e-05,
+ "loss": 1.3218,
+ "step": 4526
+ },
+ {
+ "epoch": 12.335149863760218,
+ "grad_norm": 12.69359016418457,
+ "learning_rate": 1.954641564271459e-05,
+ "loss": 1.0989,
+ "step": 4527
+ },
+ {
+ "epoch": 12.337874659400544,
+ "grad_norm": 13.881927490234375,
+ "learning_rate": 1.95461528362116e-05,
+ "loss": 1.2754,
+ "step": 4528
+ },
+ {
+ "epoch": 12.340599455040872,
+ "grad_norm": 20.145729064941406,
+ "learning_rate": 1.9545889955363483e-05,
+ "loss": 1.3813,
+ "step": 4529
+ },
+ {
+ "epoch": 12.3433242506812,
+ "grad_norm": 12.239202499389648,
+ "learning_rate": 1.954562700017228e-05,
+ "loss": 1.2983,
+ "step": 4530
+ },
+ {
+ "epoch": 12.346049046321525,
+ "grad_norm": 12.98681354522705,
+ "learning_rate": 1.954536397064004e-05,
+ "loss": 1.3801,
+ "step": 4531
+ },
+ {
+ "epoch": 12.348773841961853,
+ "grad_norm": 22.513046264648438,
+ "learning_rate": 1.954510086676882e-05,
+ "loss": 1.1106,
+ "step": 4532
+ },
+ {
+ "epoch": 12.35149863760218,
+ "grad_norm": 13.772794723510742,
+ "learning_rate": 1.9544837688560653e-05,
+ "loss": 1.0582,
+ "step": 4533
+ },
+ {
+ "epoch": 12.354223433242506,
+ "grad_norm": 10.135868072509766,
+ "learning_rate": 1.95445744360176e-05,
+ "loss": 1.4319,
+ "step": 4534
+ },
+ {
+ "epoch": 12.356948228882834,
+ "grad_norm": 9.674370765686035,
+ "learning_rate": 1.954431110914171e-05,
+ "loss": 1.1812,
+ "step": 4535
+ },
+ {
+ "epoch": 12.359673024523161,
+ "grad_norm": 11.166690826416016,
+ "learning_rate": 1.9544047707935026e-05,
+ "loss": 1.2947,
+ "step": 4536
+ },
+ {
+ "epoch": 12.362397820163487,
+ "grad_norm": 9.085147857666016,
+ "learning_rate": 1.954378423239961e-05,
+ "loss": 1.1365,
+ "step": 4537
+ },
+ {
+ "epoch": 12.365122615803815,
+ "grad_norm": 15.084121704101562,
+ "learning_rate": 1.9543520682537514e-05,
+ "loss": 1.2815,
+ "step": 4538
+ },
+ {
+ "epoch": 12.367847411444142,
+ "grad_norm": 43.925254821777344,
+ "learning_rate": 1.954325705835078e-05,
+ "loss": 1.313,
+ "step": 4539
+ },
+ {
+ "epoch": 12.370572207084468,
+ "grad_norm": 9.097298622131348,
+ "learning_rate": 1.954299335984147e-05,
+ "loss": 1.1218,
+ "step": 4540
+ },
+ {
+ "epoch": 12.373297002724795,
+ "grad_norm": 7.759567737579346,
+ "learning_rate": 1.9542729587011635e-05,
+ "loss": 1.1088,
+ "step": 4541
+ },
+ {
+ "epoch": 12.376021798365123,
+ "grad_norm": 8.935018539428711,
+ "learning_rate": 1.954246573986333e-05,
+ "loss": 1.0938,
+ "step": 4542
+ },
+ {
+ "epoch": 12.378746594005449,
+ "grad_norm": 12.664612770080566,
+ "learning_rate": 1.9542201818398606e-05,
+ "loss": 1.2271,
+ "step": 4543
+ },
+ {
+ "epoch": 12.381471389645776,
+ "grad_norm": 8.754498481750488,
+ "learning_rate": 1.9541937822619524e-05,
+ "loss": 1.1702,
+ "step": 4544
+ },
+ {
+ "epoch": 12.384196185286104,
+ "grad_norm": 11.0216646194458,
+ "learning_rate": 1.9541673752528135e-05,
+ "loss": 1.1772,
+ "step": 4545
+ },
+ {
+ "epoch": 12.38692098092643,
+ "grad_norm": 14.213191986083984,
+ "learning_rate": 1.95414096081265e-05,
+ "loss": 1.2859,
+ "step": 4546
+ },
+ {
+ "epoch": 12.389645776566757,
+ "grad_norm": 8.516196250915527,
+ "learning_rate": 1.954114538941667e-05,
+ "loss": 1.0405,
+ "step": 4547
+ },
+ {
+ "epoch": 12.392370572207085,
+ "grad_norm": 11.736917495727539,
+ "learning_rate": 1.954088109640071e-05,
+ "loss": 1.3147,
+ "step": 4548
+ },
+ {
+ "epoch": 12.39509536784741,
+ "grad_norm": 11.034043312072754,
+ "learning_rate": 1.9540616729080676e-05,
+ "loss": 1.3899,
+ "step": 4549
+ },
+ {
+ "epoch": 12.397820163487738,
+ "grad_norm": 9.75068187713623,
+ "learning_rate": 1.9540352287458624e-05,
+ "loss": 1.281,
+ "step": 4550
+ },
+ {
+ "epoch": 12.400544959128066,
+ "grad_norm": 12.010876655578613,
+ "learning_rate": 1.9540087771536617e-05,
+ "loss": 1.3296,
+ "step": 4551
+ },
+ {
+ "epoch": 12.403269754768392,
+ "grad_norm": 12.708393096923828,
+ "learning_rate": 1.953982318131671e-05,
+ "loss": 1.24,
+ "step": 4552
+ },
+ {
+ "epoch": 12.40599455040872,
+ "grad_norm": 8.05755615234375,
+ "learning_rate": 1.9539558516800968e-05,
+ "loss": 1.1244,
+ "step": 4553
+ },
+ {
+ "epoch": 12.408719346049047,
+ "grad_norm": 11.966116905212402,
+ "learning_rate": 1.9539293777991456e-05,
+ "loss": 1.281,
+ "step": 4554
+ },
+ {
+ "epoch": 12.411444141689373,
+ "grad_norm": 12.17050552368164,
+ "learning_rate": 1.9539028964890227e-05,
+ "loss": 1.2935,
+ "step": 4555
+ },
+ {
+ "epoch": 12.4141689373297,
+ "grad_norm": 10.085892677307129,
+ "learning_rate": 1.953876407749935e-05,
+ "loss": 1.2612,
+ "step": 4556
+ },
+ {
+ "epoch": 12.416893732970028,
+ "grad_norm": 8.45280647277832,
+ "learning_rate": 1.9538499115820883e-05,
+ "loss": 1.1785,
+ "step": 4557
+ },
+ {
+ "epoch": 12.419618528610354,
+ "grad_norm": 10.129697799682617,
+ "learning_rate": 1.9538234079856892e-05,
+ "loss": 1.5048,
+ "step": 4558
+ },
+ {
+ "epoch": 12.422343324250681,
+ "grad_norm": 6.851092338562012,
+ "learning_rate": 1.9537968969609444e-05,
+ "loss": 1.0962,
+ "step": 4559
+ },
+ {
+ "epoch": 12.425068119891009,
+ "grad_norm": 8.825153350830078,
+ "learning_rate": 1.9537703785080598e-05,
+ "loss": 1.0917,
+ "step": 4560
+ },
+ {
+ "epoch": 12.427792915531334,
+ "grad_norm": 10.525093078613281,
+ "learning_rate": 1.953743852627242e-05,
+ "loss": 1.2708,
+ "step": 4561
+ },
+ {
+ "epoch": 12.430517711171662,
+ "grad_norm": 18.500041961669922,
+ "learning_rate": 1.953717319318698e-05,
+ "loss": 1.1589,
+ "step": 4562
+ },
+ {
+ "epoch": 12.43324250681199,
+ "grad_norm": 9.579687118530273,
+ "learning_rate": 1.9536907785826345e-05,
+ "loss": 1.1946,
+ "step": 4563
+ },
+ {
+ "epoch": 12.435967302452315,
+ "grad_norm": 10.064245223999023,
+ "learning_rate": 1.9536642304192574e-05,
+ "loss": 1.4142,
+ "step": 4564
+ },
+ {
+ "epoch": 12.438692098092643,
+ "grad_norm": 8.188551902770996,
+ "learning_rate": 1.9536376748287743e-05,
+ "loss": 1.1736,
+ "step": 4565
+ },
+ {
+ "epoch": 12.44141689373297,
+ "grad_norm": 6.685877323150635,
+ "learning_rate": 1.9536111118113917e-05,
+ "loss": 1.0797,
+ "step": 4566
+ },
+ {
+ "epoch": 12.444141689373296,
+ "grad_norm": 7.987151622772217,
+ "learning_rate": 1.953584541367316e-05,
+ "loss": 1.2999,
+ "step": 4567
+ },
+ {
+ "epoch": 12.446866485013624,
+ "grad_norm": 9.174522399902344,
+ "learning_rate": 1.9535579634967548e-05,
+ "loss": 1.1052,
+ "step": 4568
+ },
+ {
+ "epoch": 12.449591280653951,
+ "grad_norm": 10.419933319091797,
+ "learning_rate": 1.9535313781999155e-05,
+ "loss": 1.1375,
+ "step": 4569
+ },
+ {
+ "epoch": 12.452316076294277,
+ "grad_norm": 7.917226314544678,
+ "learning_rate": 1.9535047854770038e-05,
+ "loss": 1.1587,
+ "step": 4570
+ },
+ {
+ "epoch": 12.455040871934605,
+ "grad_norm": 11.952027320861816,
+ "learning_rate": 1.9534781853282278e-05,
+ "loss": 1.2106,
+ "step": 4571
+ },
+ {
+ "epoch": 12.457765667574932,
+ "grad_norm": 15.018729209899902,
+ "learning_rate": 1.953451577753794e-05,
+ "loss": 1.3325,
+ "step": 4572
+ },
+ {
+ "epoch": 12.460490463215258,
+ "grad_norm": 10.02099609375,
+ "learning_rate": 1.9534249627539105e-05,
+ "loss": 1.0997,
+ "step": 4573
+ },
+ {
+ "epoch": 12.463215258855586,
+ "grad_norm": 8.177393913269043,
+ "learning_rate": 1.953398340328784e-05,
+ "loss": 1.0704,
+ "step": 4574
+ },
+ {
+ "epoch": 12.465940054495913,
+ "grad_norm": 8.423258781433105,
+ "learning_rate": 1.9533717104786218e-05,
+ "loss": 1.1108,
+ "step": 4575
+ },
+ {
+ "epoch": 12.46866485013624,
+ "grad_norm": 9.97563648223877,
+ "learning_rate": 1.953345073203631e-05,
+ "loss": 1.3052,
+ "step": 4576
+ },
+ {
+ "epoch": 12.471389645776567,
+ "grad_norm": 9.08750057220459,
+ "learning_rate": 1.95331842850402e-05,
+ "loss": 1.2687,
+ "step": 4577
+ },
+ {
+ "epoch": 12.474114441416894,
+ "grad_norm": 11.651878356933594,
+ "learning_rate": 1.9532917763799957e-05,
+ "loss": 1.2065,
+ "step": 4578
+ },
+ {
+ "epoch": 12.47683923705722,
+ "grad_norm": 8.31631088256836,
+ "learning_rate": 1.9532651168317657e-05,
+ "loss": 1.115,
+ "step": 4579
+ },
+ {
+ "epoch": 12.479564032697548,
+ "grad_norm": 8.28477668762207,
+ "learning_rate": 1.9532384498595376e-05,
+ "loss": 1.2628,
+ "step": 4580
+ },
+ {
+ "epoch": 12.482288828337875,
+ "grad_norm": 13.442248344421387,
+ "learning_rate": 1.953211775463519e-05,
+ "loss": 1.4312,
+ "step": 4581
+ },
+ {
+ "epoch": 12.485013623978201,
+ "grad_norm": 8.9275541305542,
+ "learning_rate": 1.9531850936439177e-05,
+ "loss": 1.2312,
+ "step": 4582
+ },
+ {
+ "epoch": 12.487738419618529,
+ "grad_norm": 8.316483497619629,
+ "learning_rate": 1.953158404400942e-05,
+ "loss": 1.1727,
+ "step": 4583
+ },
+ {
+ "epoch": 12.490463215258856,
+ "grad_norm": 8.06887149810791,
+ "learning_rate": 1.953131707734799e-05,
+ "loss": 1.144,
+ "step": 4584
+ },
+ {
+ "epoch": 12.493188010899182,
+ "grad_norm": 8.375883102416992,
+ "learning_rate": 1.9531050036456972e-05,
+ "loss": 1.2737,
+ "step": 4585
+ },
+ {
+ "epoch": 12.49591280653951,
+ "grad_norm": 8.302019119262695,
+ "learning_rate": 1.9530782921338442e-05,
+ "loss": 1.1799,
+ "step": 4586
+ },
+ {
+ "epoch": 12.498637602179837,
+ "grad_norm": 8.256749153137207,
+ "learning_rate": 1.953051573199448e-05,
+ "loss": 1.0681,
+ "step": 4587
+ },
+ {
+ "epoch": 12.501362397820163,
+ "grad_norm": 7.484298229217529,
+ "learning_rate": 1.9530248468427166e-05,
+ "loss": 1.2612,
+ "step": 4588
+ },
+ {
+ "epoch": 12.50408719346049,
+ "grad_norm": 8.9029541015625,
+ "learning_rate": 1.9529981130638585e-05,
+ "loss": 1.1285,
+ "step": 4589
+ },
+ {
+ "epoch": 12.506811989100818,
+ "grad_norm": 11.159380912780762,
+ "learning_rate": 1.952971371863082e-05,
+ "loss": 1.3145,
+ "step": 4590
+ },
+ {
+ "epoch": 12.509536784741144,
+ "grad_norm": 11.16989803314209,
+ "learning_rate": 1.952944623240595e-05,
+ "loss": 1.1538,
+ "step": 4591
+ },
+ {
+ "epoch": 12.512261580381471,
+ "grad_norm": 9.007346153259277,
+ "learning_rate": 1.952917867196606e-05,
+ "loss": 1.3169,
+ "step": 4592
+ },
+ {
+ "epoch": 12.514986376021799,
+ "grad_norm": 8.884353637695312,
+ "learning_rate": 1.9528911037313233e-05,
+ "loss": 1.1614,
+ "step": 4593
+ },
+ {
+ "epoch": 12.517711171662125,
+ "grad_norm": 8.167776107788086,
+ "learning_rate": 1.9528643328449554e-05,
+ "loss": 1.1514,
+ "step": 4594
+ },
+ {
+ "epoch": 12.520435967302452,
+ "grad_norm": 8.666801452636719,
+ "learning_rate": 1.9528375545377107e-05,
+ "loss": 1.0505,
+ "step": 4595
+ },
+ {
+ "epoch": 12.52316076294278,
+ "grad_norm": 6.815107822418213,
+ "learning_rate": 1.9528107688097978e-05,
+ "loss": 0.9323,
+ "step": 4596
+ },
+ {
+ "epoch": 12.525885558583106,
+ "grad_norm": 8.493805885314941,
+ "learning_rate": 1.9527839756614253e-05,
+ "loss": 1.1121,
+ "step": 4597
+ },
+ {
+ "epoch": 12.528610354223433,
+ "grad_norm": 8.735637664794922,
+ "learning_rate": 1.952757175092802e-05,
+ "loss": 1.208,
+ "step": 4598
+ },
+ {
+ "epoch": 12.53133514986376,
+ "grad_norm": 8.221902847290039,
+ "learning_rate": 1.952730367104136e-05,
+ "loss": 1.0355,
+ "step": 4599
+ },
+ {
+ "epoch": 12.534059945504087,
+ "grad_norm": 8.883963584899902,
+ "learning_rate": 1.9527035516956368e-05,
+ "loss": 1.3167,
+ "step": 4600
+ },
+ {
+ "epoch": 12.536784741144414,
+ "grad_norm": 9.42188549041748,
+ "learning_rate": 1.9526767288675134e-05,
+ "loss": 1.0435,
+ "step": 4601
+ },
+ {
+ "epoch": 12.539509536784742,
+ "grad_norm": 8.609175682067871,
+ "learning_rate": 1.952649898619974e-05,
+ "loss": 1.2488,
+ "step": 4602
+ },
+ {
+ "epoch": 12.542234332425068,
+ "grad_norm": 10.529431343078613,
+ "learning_rate": 1.952623060953228e-05,
+ "loss": 1.1753,
+ "step": 4603
+ },
+ {
+ "epoch": 12.544959128065395,
+ "grad_norm": 9.760684967041016,
+ "learning_rate": 1.952596215867484e-05,
+ "loss": 1.0697,
+ "step": 4604
+ },
+ {
+ "epoch": 12.547683923705723,
+ "grad_norm": 15.903693199157715,
+ "learning_rate": 1.9525693633629514e-05,
+ "loss": 1.171,
+ "step": 4605
+ },
+ {
+ "epoch": 12.550408719346049,
+ "grad_norm": 9.444087982177734,
+ "learning_rate": 1.9525425034398394e-05,
+ "loss": 1.2163,
+ "step": 4606
+ },
+ {
+ "epoch": 12.553133514986376,
+ "grad_norm": 9.362471580505371,
+ "learning_rate": 1.952515636098357e-05,
+ "loss": 1.0851,
+ "step": 4607
+ },
+ {
+ "epoch": 12.555858310626704,
+ "grad_norm": 8.800759315490723,
+ "learning_rate": 1.9524887613387133e-05,
+ "loss": 1.126,
+ "step": 4608
+ },
+ {
+ "epoch": 12.55858310626703,
+ "grad_norm": 14.719269752502441,
+ "learning_rate": 1.9524618791611177e-05,
+ "loss": 1.1335,
+ "step": 4609
+ },
+ {
+ "epoch": 12.561307901907357,
+ "grad_norm": 9.89954662322998,
+ "learning_rate": 1.9524349895657798e-05,
+ "loss": 1.2173,
+ "step": 4610
+ },
+ {
+ "epoch": 12.564032697547685,
+ "grad_norm": 7.570556640625,
+ "learning_rate": 1.9524080925529093e-05,
+ "loss": 1.283,
+ "step": 4611
+ },
+ {
+ "epoch": 12.56675749318801,
+ "grad_norm": 11.356952667236328,
+ "learning_rate": 1.9523811881227147e-05,
+ "loss": 1.2185,
+ "step": 4612
+ },
+ {
+ "epoch": 12.569482288828338,
+ "grad_norm": 56.742427825927734,
+ "learning_rate": 1.952354276275406e-05,
+ "loss": 1.0366,
+ "step": 4613
+ },
+ {
+ "epoch": 12.572207084468666,
+ "grad_norm": 9.515989303588867,
+ "learning_rate": 1.952327357011193e-05,
+ "loss": 1.184,
+ "step": 4614
+ },
+ {
+ "epoch": 12.574931880108991,
+ "grad_norm": 16.08742904663086,
+ "learning_rate": 1.9523004303302854e-05,
+ "loss": 1.4866,
+ "step": 4615
+ },
+ {
+ "epoch": 12.577656675749319,
+ "grad_norm": 8.824570655822754,
+ "learning_rate": 1.9522734962328926e-05,
+ "loss": 1.3364,
+ "step": 4616
+ },
+ {
+ "epoch": 12.580381471389646,
+ "grad_norm": 10.563802719116211,
+ "learning_rate": 1.952246554719224e-05,
+ "loss": 1.2041,
+ "step": 4617
+ },
+ {
+ "epoch": 12.583106267029972,
+ "grad_norm": 8.585123062133789,
+ "learning_rate": 1.9522196057894905e-05,
+ "loss": 0.9529,
+ "step": 4618
+ },
+ {
+ "epoch": 12.5858310626703,
+ "grad_norm": 8.832019805908203,
+ "learning_rate": 1.952192649443901e-05,
+ "loss": 1.0126,
+ "step": 4619
+ },
+ {
+ "epoch": 12.588555858310627,
+ "grad_norm": 9.905095100402832,
+ "learning_rate": 1.952165685682666e-05,
+ "loss": 1.1479,
+ "step": 4620
+ },
+ {
+ "epoch": 12.591280653950953,
+ "grad_norm": 8.778387069702148,
+ "learning_rate": 1.9521387145059952e-05,
+ "loss": 1.2529,
+ "step": 4621
+ },
+ {
+ "epoch": 12.59400544959128,
+ "grad_norm": 13.142505645751953,
+ "learning_rate": 1.9521117359140985e-05,
+ "loss": 1.2751,
+ "step": 4622
+ },
+ {
+ "epoch": 12.596730245231608,
+ "grad_norm": 14.675884246826172,
+ "learning_rate": 1.952084749907187e-05,
+ "loss": 1.2427,
+ "step": 4623
+ },
+ {
+ "epoch": 12.599455040871934,
+ "grad_norm": 9.52199649810791,
+ "learning_rate": 1.9520577564854696e-05,
+ "loss": 1.2654,
+ "step": 4624
+ },
+ {
+ "epoch": 12.602179836512262,
+ "grad_norm": 9.89417839050293,
+ "learning_rate": 1.952030755649157e-05,
+ "loss": 1.1506,
+ "step": 4625
+ },
+ {
+ "epoch": 12.60490463215259,
+ "grad_norm": 27.12210464477539,
+ "learning_rate": 1.952003747398459e-05,
+ "loss": 1.2183,
+ "step": 4626
+ },
+ {
+ "epoch": 12.607629427792915,
+ "grad_norm": 10.320030212402344,
+ "learning_rate": 1.9519767317335875e-05,
+ "loss": 1.2805,
+ "step": 4627
+ },
+ {
+ "epoch": 12.610354223433243,
+ "grad_norm": 11.5519380569458,
+ "learning_rate": 1.951949708654751e-05,
+ "loss": 1.3403,
+ "step": 4628
+ },
+ {
+ "epoch": 12.61307901907357,
+ "grad_norm": 12.985690116882324,
+ "learning_rate": 1.9519226781621613e-05,
+ "loss": 1.228,
+ "step": 4629
+ },
+ {
+ "epoch": 12.615803814713896,
+ "grad_norm": 9.530143737792969,
+ "learning_rate": 1.9518956402560282e-05,
+ "loss": 1.1143,
+ "step": 4630
+ },
+ {
+ "epoch": 12.618528610354224,
+ "grad_norm": 10.194968223571777,
+ "learning_rate": 1.9518685949365626e-05,
+ "loss": 1.1965,
+ "step": 4631
+ },
+ {
+ "epoch": 12.621253405994551,
+ "grad_norm": 8.98924446105957,
+ "learning_rate": 1.951841542203975e-05,
+ "loss": 1.2051,
+ "step": 4632
+ },
+ {
+ "epoch": 12.623978201634877,
+ "grad_norm": 8.00615119934082,
+ "learning_rate": 1.9518144820584763e-05,
+ "loss": 0.9694,
+ "step": 4633
+ },
+ {
+ "epoch": 12.626702997275205,
+ "grad_norm": 10.693278312683105,
+ "learning_rate": 1.9517874145002768e-05,
+ "loss": 1.1099,
+ "step": 4634
+ },
+ {
+ "epoch": 12.629427792915532,
+ "grad_norm": 10.002409934997559,
+ "learning_rate": 1.9517603395295873e-05,
+ "loss": 1.2314,
+ "step": 4635
+ },
+ {
+ "epoch": 12.632152588555858,
+ "grad_norm": 11.508398056030273,
+ "learning_rate": 1.951733257146619e-05,
+ "loss": 1.2388,
+ "step": 4636
+ },
+ {
+ "epoch": 12.634877384196185,
+ "grad_norm": 9.302984237670898,
+ "learning_rate": 1.9517061673515832e-05,
+ "loss": 1.176,
+ "step": 4637
+ },
+ {
+ "epoch": 12.637602179836513,
+ "grad_norm": 9.541932106018066,
+ "learning_rate": 1.95167907014469e-05,
+ "loss": 1.0867,
+ "step": 4638
+ },
+ {
+ "epoch": 12.640326975476839,
+ "grad_norm": 8.283167839050293,
+ "learning_rate": 1.951651965526151e-05,
+ "loss": 1.0667,
+ "step": 4639
+ },
+ {
+ "epoch": 12.643051771117166,
+ "grad_norm": 9.077845573425293,
+ "learning_rate": 1.9516248534961773e-05,
+ "loss": 1.1912,
+ "step": 4640
+ },
+ {
+ "epoch": 12.645776566757494,
+ "grad_norm": 8.404955863952637,
+ "learning_rate": 1.9515977340549794e-05,
+ "loss": 1.1189,
+ "step": 4641
+ },
+ {
+ "epoch": 12.64850136239782,
+ "grad_norm": 16.992172241210938,
+ "learning_rate": 1.9515706072027694e-05,
+ "loss": 1.3352,
+ "step": 4642
+ },
+ {
+ "epoch": 12.651226158038147,
+ "grad_norm": 9.835552215576172,
+ "learning_rate": 1.9515434729397577e-05,
+ "loss": 1.1182,
+ "step": 4643
+ },
+ {
+ "epoch": 12.653950953678475,
+ "grad_norm": 16.78769302368164,
+ "learning_rate": 1.9515163312661563e-05,
+ "loss": 1.2881,
+ "step": 4644
+ },
+ {
+ "epoch": 12.6566757493188,
+ "grad_norm": 10.720549583435059,
+ "learning_rate": 1.9514891821821768e-05,
+ "loss": 1.1658,
+ "step": 4645
+ },
+ {
+ "epoch": 12.659400544959128,
+ "grad_norm": 9.843253135681152,
+ "learning_rate": 1.9514620256880294e-05,
+ "loss": 1.4648,
+ "step": 4646
+ },
+ {
+ "epoch": 12.662125340599456,
+ "grad_norm": 10.77347183227539,
+ "learning_rate": 1.9514348617839268e-05,
+ "loss": 1.1985,
+ "step": 4647
+ },
+ {
+ "epoch": 12.664850136239782,
+ "grad_norm": 12.356215476989746,
+ "learning_rate": 1.95140769047008e-05,
+ "loss": 1.2772,
+ "step": 4648
+ },
+ {
+ "epoch": 12.66757493188011,
+ "grad_norm": 9.784097671508789,
+ "learning_rate": 1.9513805117467007e-05,
+ "loss": 1.2134,
+ "step": 4649
+ },
+ {
+ "epoch": 12.670299727520437,
+ "grad_norm": 9.46358871459961,
+ "learning_rate": 1.9513533256140004e-05,
+ "loss": 0.9877,
+ "step": 4650
+ },
+ {
+ "epoch": 12.673024523160763,
+ "grad_norm": 8.930076599121094,
+ "learning_rate": 1.9513261320721915e-05,
+ "loss": 1.1536,
+ "step": 4651
+ },
+ {
+ "epoch": 12.67574931880109,
+ "grad_norm": 13.492873191833496,
+ "learning_rate": 1.951298931121485e-05,
+ "loss": 1.1965,
+ "step": 4652
+ },
+ {
+ "epoch": 12.678474114441418,
+ "grad_norm": 15.724522590637207,
+ "learning_rate": 1.951271722762093e-05,
+ "loss": 1.3823,
+ "step": 4653
+ },
+ {
+ "epoch": 12.681198910081743,
+ "grad_norm": 10.186450004577637,
+ "learning_rate": 1.9512445069942275e-05,
+ "loss": 1.2336,
+ "step": 4654
+ },
+ {
+ "epoch": 12.683923705722071,
+ "grad_norm": 9.98702621459961,
+ "learning_rate": 1.9512172838181005e-05,
+ "loss": 1.1196,
+ "step": 4655
+ },
+ {
+ "epoch": 12.686648501362399,
+ "grad_norm": 11.274605751037598,
+ "learning_rate": 1.9511900532339237e-05,
+ "loss": 1.1848,
+ "step": 4656
+ },
+ {
+ "epoch": 12.689373297002724,
+ "grad_norm": 10.36972427368164,
+ "learning_rate": 1.9511628152419098e-05,
+ "loss": 1.0969,
+ "step": 4657
+ },
+ {
+ "epoch": 12.692098092643052,
+ "grad_norm": 53.64316177368164,
+ "learning_rate": 1.9511355698422702e-05,
+ "loss": 1.2065,
+ "step": 4658
+ },
+ {
+ "epoch": 12.69482288828338,
+ "grad_norm": 8.796631813049316,
+ "learning_rate": 1.9511083170352173e-05,
+ "loss": 1.4153,
+ "step": 4659
+ },
+ {
+ "epoch": 12.697547683923705,
+ "grad_norm": 10.043909072875977,
+ "learning_rate": 1.9510810568209634e-05,
+ "loss": 0.9744,
+ "step": 4660
+ },
+ {
+ "epoch": 12.700272479564033,
+ "grad_norm": 9.707660675048828,
+ "learning_rate": 1.9510537891997214e-05,
+ "loss": 1.1343,
+ "step": 4661
+ },
+ {
+ "epoch": 12.70299727520436,
+ "grad_norm": 15.499692916870117,
+ "learning_rate": 1.9510265141717024e-05,
+ "loss": 1.1963,
+ "step": 4662
+ },
+ {
+ "epoch": 12.705722070844686,
+ "grad_norm": 9.693360328674316,
+ "learning_rate": 1.9509992317371196e-05,
+ "loss": 1.2511,
+ "step": 4663
+ },
+ {
+ "epoch": 12.708446866485014,
+ "grad_norm": 9.773543357849121,
+ "learning_rate": 1.9509719418961858e-05,
+ "loss": 1.0464,
+ "step": 4664
+ },
+ {
+ "epoch": 12.711171662125341,
+ "grad_norm": 9.990696907043457,
+ "learning_rate": 1.9509446446491127e-05,
+ "loss": 1.0648,
+ "step": 4665
+ },
+ {
+ "epoch": 12.713896457765667,
+ "grad_norm": 9.596586227416992,
+ "learning_rate": 1.9509173399961137e-05,
+ "loss": 1.2563,
+ "step": 4666
+ },
+ {
+ "epoch": 12.716621253405995,
+ "grad_norm": 13.25296688079834,
+ "learning_rate": 1.950890027937401e-05,
+ "loss": 1.1661,
+ "step": 4667
+ },
+ {
+ "epoch": 12.719346049046322,
+ "grad_norm": 8.975726127624512,
+ "learning_rate": 1.9508627084731872e-05,
+ "loss": 1.1356,
+ "step": 4668
+ },
+ {
+ "epoch": 12.722070844686648,
+ "grad_norm": 8.937646865844727,
+ "learning_rate": 1.9508353816036853e-05,
+ "loss": 1.1023,
+ "step": 4669
+ },
+ {
+ "epoch": 12.724795640326976,
+ "grad_norm": 10.015127182006836,
+ "learning_rate": 1.950808047329108e-05,
+ "loss": 1.2043,
+ "step": 4670
+ },
+ {
+ "epoch": 12.727520435967303,
+ "grad_norm": 9.980385780334473,
+ "learning_rate": 1.9507807056496683e-05,
+ "loss": 1.1761,
+ "step": 4671
+ },
+ {
+ "epoch": 12.730245231607629,
+ "grad_norm": 11.312211036682129,
+ "learning_rate": 1.950753356565579e-05,
+ "loss": 1.2368,
+ "step": 4672
+ },
+ {
+ "epoch": 12.732970027247957,
+ "grad_norm": 8.812410354614258,
+ "learning_rate": 1.950726000077053e-05,
+ "loss": 1.5366,
+ "step": 4673
+ },
+ {
+ "epoch": 12.735694822888284,
+ "grad_norm": 13.870210647583008,
+ "learning_rate": 1.950698636184304e-05,
+ "loss": 1.2469,
+ "step": 4674
+ },
+ {
+ "epoch": 12.73841961852861,
+ "grad_norm": 11.117531776428223,
+ "learning_rate": 1.9506712648875444e-05,
+ "loss": 1.3184,
+ "step": 4675
+ },
+ {
+ "epoch": 12.741144414168938,
+ "grad_norm": 21.896833419799805,
+ "learning_rate": 1.9506438861869875e-05,
+ "loss": 1.2288,
+ "step": 4676
+ },
+ {
+ "epoch": 12.743869209809265,
+ "grad_norm": 9.635631561279297,
+ "learning_rate": 1.9506165000828467e-05,
+ "loss": 1.0354,
+ "step": 4677
+ },
+ {
+ "epoch": 12.746594005449591,
+ "grad_norm": 17.402633666992188,
+ "learning_rate": 1.950589106575335e-05,
+ "loss": 1.29,
+ "step": 4678
+ },
+ {
+ "epoch": 12.749318801089919,
+ "grad_norm": 8.623910903930664,
+ "learning_rate": 1.9505617056646658e-05,
+ "loss": 1.278,
+ "step": 4679
+ },
+ {
+ "epoch": 12.752043596730246,
+ "grad_norm": 8.760870933532715,
+ "learning_rate": 1.950534297351053e-05,
+ "loss": 1.156,
+ "step": 4680
+ },
+ {
+ "epoch": 12.754768392370572,
+ "grad_norm": 8.295570373535156,
+ "learning_rate": 1.9505068816347095e-05,
+ "loss": 1.2488,
+ "step": 4681
+ },
+ {
+ "epoch": 12.7574931880109,
+ "grad_norm": 8.168697357177734,
+ "learning_rate": 1.9504794585158492e-05,
+ "loss": 0.9883,
+ "step": 4682
+ },
+ {
+ "epoch": 12.760217983651227,
+ "grad_norm": 8.455802917480469,
+ "learning_rate": 1.9504520279946853e-05,
+ "loss": 1.1169,
+ "step": 4683
+ },
+ {
+ "epoch": 12.762942779291553,
+ "grad_norm": 10.661886215209961,
+ "learning_rate": 1.9504245900714313e-05,
+ "loss": 1.2681,
+ "step": 4684
+ },
+ {
+ "epoch": 12.76566757493188,
+ "grad_norm": 7.8510284423828125,
+ "learning_rate": 1.9503971447463016e-05,
+ "loss": 1.0563,
+ "step": 4685
+ },
+ {
+ "epoch": 12.768392370572208,
+ "grad_norm": 9.176054000854492,
+ "learning_rate": 1.9503696920195096e-05,
+ "loss": 1.1731,
+ "step": 4686
+ },
+ {
+ "epoch": 12.771117166212534,
+ "grad_norm": 10.042091369628906,
+ "learning_rate": 1.950342231891269e-05,
+ "loss": 1.2781,
+ "step": 4687
+ },
+ {
+ "epoch": 12.773841961852861,
+ "grad_norm": 8.199237823486328,
+ "learning_rate": 1.9503147643617932e-05,
+ "loss": 1.1545,
+ "step": 4688
+ },
+ {
+ "epoch": 12.776566757493189,
+ "grad_norm": 11.569225311279297,
+ "learning_rate": 1.950287289431297e-05,
+ "loss": 1.3064,
+ "step": 4689
+ },
+ {
+ "epoch": 12.779291553133515,
+ "grad_norm": 10.179621696472168,
+ "learning_rate": 1.950259807099994e-05,
+ "loss": 1.0471,
+ "step": 4690
+ },
+ {
+ "epoch": 12.782016348773842,
+ "grad_norm": 9.003026008605957,
+ "learning_rate": 1.9502323173680983e-05,
+ "loss": 1.1021,
+ "step": 4691
+ },
+ {
+ "epoch": 12.78474114441417,
+ "grad_norm": 11.675942420959473,
+ "learning_rate": 1.9502048202358236e-05,
+ "loss": 1.0442,
+ "step": 4692
+ },
+ {
+ "epoch": 12.787465940054496,
+ "grad_norm": 9.208623886108398,
+ "learning_rate": 1.9501773157033847e-05,
+ "loss": 1.0453,
+ "step": 4693
+ },
+ {
+ "epoch": 12.790190735694823,
+ "grad_norm": 8.950695991516113,
+ "learning_rate": 1.9501498037709948e-05,
+ "loss": 0.9741,
+ "step": 4694
+ },
+ {
+ "epoch": 12.79291553133515,
+ "grad_norm": 10.017278671264648,
+ "learning_rate": 1.9501222844388696e-05,
+ "loss": 1.1675,
+ "step": 4695
+ },
+ {
+ "epoch": 12.795640326975477,
+ "grad_norm": 8.59681510925293,
+ "learning_rate": 1.950094757707222e-05,
+ "loss": 1.2896,
+ "step": 4696
+ },
+ {
+ "epoch": 12.798365122615804,
+ "grad_norm": 12.797869682312012,
+ "learning_rate": 1.950067223576267e-05,
+ "loss": 1.2446,
+ "step": 4697
+ },
+ {
+ "epoch": 12.80108991825613,
+ "grad_norm": 11.969429969787598,
+ "learning_rate": 1.9500396820462194e-05,
+ "loss": 1.1785,
+ "step": 4698
+ },
+ {
+ "epoch": 12.803814713896458,
+ "grad_norm": 8.822981834411621,
+ "learning_rate": 1.9500121331172936e-05,
+ "loss": 1.0251,
+ "step": 4699
+ },
+ {
+ "epoch": 12.806539509536785,
+ "grad_norm": 15.670023918151855,
+ "learning_rate": 1.9499845767897033e-05,
+ "loss": 1.4297,
+ "step": 4700
+ },
+ {
+ "epoch": 12.809264305177111,
+ "grad_norm": 8.35623836517334,
+ "learning_rate": 1.9499570130636638e-05,
+ "loss": 1.0447,
+ "step": 4701
+ },
+ {
+ "epoch": 12.811989100817438,
+ "grad_norm": 9.654727935791016,
+ "learning_rate": 1.9499294419393898e-05,
+ "loss": 1.1633,
+ "step": 4702
+ },
+ {
+ "epoch": 12.814713896457766,
+ "grad_norm": 8.043304443359375,
+ "learning_rate": 1.949901863417096e-05,
+ "loss": 1.1345,
+ "step": 4703
+ },
+ {
+ "epoch": 12.817438692098092,
+ "grad_norm": 9.322258949279785,
+ "learning_rate": 1.9498742774969968e-05,
+ "loss": 1.0305,
+ "step": 4704
+ },
+ {
+ "epoch": 12.82016348773842,
+ "grad_norm": 13.219219207763672,
+ "learning_rate": 1.9498466841793073e-05,
+ "loss": 1.3967,
+ "step": 4705
+ },
+ {
+ "epoch": 12.822888283378747,
+ "grad_norm": 10.525544166564941,
+ "learning_rate": 1.9498190834642426e-05,
+ "loss": 1.0349,
+ "step": 4706
+ },
+ {
+ "epoch": 12.825613079019073,
+ "grad_norm": 9.625303268432617,
+ "learning_rate": 1.9497914753520175e-05,
+ "loss": 1.2478,
+ "step": 4707
+ },
+ {
+ "epoch": 12.8283378746594,
+ "grad_norm": 8.864691734313965,
+ "learning_rate": 1.9497638598428464e-05,
+ "loss": 1.0991,
+ "step": 4708
+ },
+ {
+ "epoch": 12.831062670299728,
+ "grad_norm": 11.785776138305664,
+ "learning_rate": 1.9497362369369456e-05,
+ "loss": 1.1125,
+ "step": 4709
+ },
+ {
+ "epoch": 12.833787465940054,
+ "grad_norm": 9.78260326385498,
+ "learning_rate": 1.949708606634529e-05,
+ "loss": 1.4175,
+ "step": 4710
+ },
+ {
+ "epoch": 12.836512261580381,
+ "grad_norm": 18.374671936035156,
+ "learning_rate": 1.9496809689358127e-05,
+ "loss": 1.1838,
+ "step": 4711
+ },
+ {
+ "epoch": 12.839237057220709,
+ "grad_norm": 10.118465423583984,
+ "learning_rate": 1.9496533238410117e-05,
+ "loss": 1.1545,
+ "step": 4712
+ },
+ {
+ "epoch": 12.841961852861035,
+ "grad_norm": 10.40396785736084,
+ "learning_rate": 1.949625671350341e-05,
+ "loss": 1.1724,
+ "step": 4713
+ },
+ {
+ "epoch": 12.844686648501362,
+ "grad_norm": 11.841177940368652,
+ "learning_rate": 1.949598011464016e-05,
+ "loss": 1.2544,
+ "step": 4714
+ },
+ {
+ "epoch": 12.84741144414169,
+ "grad_norm": 9.664090156555176,
+ "learning_rate": 1.949570344182252e-05,
+ "loss": 1.2993,
+ "step": 4715
+ },
+ {
+ "epoch": 12.850136239782016,
+ "grad_norm": 11.260235786437988,
+ "learning_rate": 1.9495426695052652e-05,
+ "loss": 1.2002,
+ "step": 4716
+ },
+ {
+ "epoch": 12.852861035422343,
+ "grad_norm": 9.741466522216797,
+ "learning_rate": 1.9495149874332707e-05,
+ "loss": 1.0798,
+ "step": 4717
+ },
+ {
+ "epoch": 12.85558583106267,
+ "grad_norm": 12.825498580932617,
+ "learning_rate": 1.9494872979664838e-05,
+ "loss": 1.176,
+ "step": 4718
+ },
+ {
+ "epoch": 12.858310626702997,
+ "grad_norm": 14.039491653442383,
+ "learning_rate": 1.9494596011051205e-05,
+ "loss": 1.1194,
+ "step": 4719
+ },
+ {
+ "epoch": 12.861035422343324,
+ "grad_norm": 8.56617546081543,
+ "learning_rate": 1.9494318968493965e-05,
+ "loss": 1.1135,
+ "step": 4720
+ },
+ {
+ "epoch": 12.863760217983652,
+ "grad_norm": 11.367093086242676,
+ "learning_rate": 1.949404185199527e-05,
+ "loss": 1.0955,
+ "step": 4721
+ },
+ {
+ "epoch": 12.866485013623977,
+ "grad_norm": 8.225251197814941,
+ "learning_rate": 1.9493764661557287e-05,
+ "loss": 1.1096,
+ "step": 4722
+ },
+ {
+ "epoch": 12.869209809264305,
+ "grad_norm": 18.134790420532227,
+ "learning_rate": 1.949348739718217e-05,
+ "loss": 1.2549,
+ "step": 4723
+ },
+ {
+ "epoch": 12.871934604904633,
+ "grad_norm": 14.881370544433594,
+ "learning_rate": 1.9493210058872075e-05,
+ "loss": 1.401,
+ "step": 4724
+ },
+ {
+ "epoch": 12.874659400544958,
+ "grad_norm": 10.585454940795898,
+ "learning_rate": 1.949293264662917e-05,
+ "loss": 1.0671,
+ "step": 4725
+ },
+ {
+ "epoch": 12.877384196185286,
+ "grad_norm": 11.371530532836914,
+ "learning_rate": 1.9492655160455607e-05,
+ "loss": 1.0669,
+ "step": 4726
+ },
+ {
+ "epoch": 12.880108991825614,
+ "grad_norm": 11.10936164855957,
+ "learning_rate": 1.9492377600353555e-05,
+ "loss": 1.1472,
+ "step": 4727
+ },
+ {
+ "epoch": 12.88283378746594,
+ "grad_norm": 10.045562744140625,
+ "learning_rate": 1.9492099966325168e-05,
+ "loss": 1.0927,
+ "step": 4728
+ },
+ {
+ "epoch": 12.885558583106267,
+ "grad_norm": 9.858827590942383,
+ "learning_rate": 1.9491822258372614e-05,
+ "loss": 1.1929,
+ "step": 4729
+ },
+ {
+ "epoch": 12.888283378746594,
+ "grad_norm": 12.741924285888672,
+ "learning_rate": 1.9491544476498054e-05,
+ "loss": 1.2134,
+ "step": 4730
+ },
+ {
+ "epoch": 12.89100817438692,
+ "grad_norm": 9.4379243850708,
+ "learning_rate": 1.949126662070365e-05,
+ "loss": 1.0623,
+ "step": 4731
+ },
+ {
+ "epoch": 12.893732970027248,
+ "grad_norm": 12.204022407531738,
+ "learning_rate": 1.949098869099157e-05,
+ "loss": 1.3323,
+ "step": 4732
+ },
+ {
+ "epoch": 12.896457765667575,
+ "grad_norm": 10.362288475036621,
+ "learning_rate": 1.949071068736397e-05,
+ "loss": 1.2102,
+ "step": 4733
+ },
+ {
+ "epoch": 12.899182561307901,
+ "grad_norm": 22.170654296875,
+ "learning_rate": 1.9490432609823027e-05,
+ "loss": 1.1755,
+ "step": 4734
+ },
+ {
+ "epoch": 12.901907356948229,
+ "grad_norm": 12.023188591003418,
+ "learning_rate": 1.94901544583709e-05,
+ "loss": 1.1824,
+ "step": 4735
+ },
+ {
+ "epoch": 12.904632152588556,
+ "grad_norm": 11.377690315246582,
+ "learning_rate": 1.9489876233009747e-05,
+ "loss": 1.4109,
+ "step": 4736
+ },
+ {
+ "epoch": 12.907356948228882,
+ "grad_norm": 17.193017959594727,
+ "learning_rate": 1.9489597933741754e-05,
+ "loss": 1.1846,
+ "step": 4737
+ },
+ {
+ "epoch": 12.91008174386921,
+ "grad_norm": 17.572160720825195,
+ "learning_rate": 1.948931956056907e-05,
+ "loss": 1.2808,
+ "step": 4738
+ },
+ {
+ "epoch": 12.912806539509537,
+ "grad_norm": 10.966382026672363,
+ "learning_rate": 1.9489041113493875e-05,
+ "loss": 1.2979,
+ "step": 4739
+ },
+ {
+ "epoch": 12.915531335149863,
+ "grad_norm": 12.861130714416504,
+ "learning_rate": 1.9488762592518332e-05,
+ "loss": 1.0878,
+ "step": 4740
+ },
+ {
+ "epoch": 12.91825613079019,
+ "grad_norm": 12.99240493774414,
+ "learning_rate": 1.9488483997644613e-05,
+ "loss": 1.1365,
+ "step": 4741
+ },
+ {
+ "epoch": 12.920980926430518,
+ "grad_norm": 15.539706230163574,
+ "learning_rate": 1.948820532887488e-05,
+ "loss": 1.2317,
+ "step": 4742
+ },
+ {
+ "epoch": 12.923705722070844,
+ "grad_norm": 10.954058647155762,
+ "learning_rate": 1.9487926586211314e-05,
+ "loss": 1.1658,
+ "step": 4743
+ },
+ {
+ "epoch": 12.926430517711172,
+ "grad_norm": 9.134175300598145,
+ "learning_rate": 1.9487647769656082e-05,
+ "loss": 1.3232,
+ "step": 4744
+ },
+ {
+ "epoch": 12.9291553133515,
+ "grad_norm": 10.19599437713623,
+ "learning_rate": 1.948736887921135e-05,
+ "loss": 1.1957,
+ "step": 4745
+ },
+ {
+ "epoch": 12.931880108991825,
+ "grad_norm": 9.151069641113281,
+ "learning_rate": 1.94870899148793e-05,
+ "loss": 1.2957,
+ "step": 4746
+ },
+ {
+ "epoch": 12.934604904632153,
+ "grad_norm": 10.090906143188477,
+ "learning_rate": 1.9486810876662097e-05,
+ "loss": 1.1069,
+ "step": 4747
+ },
+ {
+ "epoch": 12.93732970027248,
+ "grad_norm": 14.232126235961914,
+ "learning_rate": 1.9486531764561915e-05,
+ "loss": 1.2755,
+ "step": 4748
+ },
+ {
+ "epoch": 12.940054495912806,
+ "grad_norm": 12.848154067993164,
+ "learning_rate": 1.948625257858093e-05,
+ "loss": 1.1897,
+ "step": 4749
+ },
+ {
+ "epoch": 12.942779291553133,
+ "grad_norm": 10.731879234313965,
+ "learning_rate": 1.9485973318721316e-05,
+ "loss": 1.1263,
+ "step": 4750
+ },
+ {
+ "epoch": 12.945504087193461,
+ "grad_norm": 8.240216255187988,
+ "learning_rate": 1.9485693984985246e-05,
+ "loss": 1.1028,
+ "step": 4751
+ },
+ {
+ "epoch": 12.948228882833787,
+ "grad_norm": 7.984894752502441,
+ "learning_rate": 1.9485414577374896e-05,
+ "loss": 1.0601,
+ "step": 4752
+ },
+ {
+ "epoch": 12.950953678474114,
+ "grad_norm": 19.504682540893555,
+ "learning_rate": 1.9485135095892444e-05,
+ "loss": 1.1667,
+ "step": 4753
+ },
+ {
+ "epoch": 12.953678474114442,
+ "grad_norm": 12.880973815917969,
+ "learning_rate": 1.9484855540540063e-05,
+ "loss": 1.1313,
+ "step": 4754
+ },
+ {
+ "epoch": 12.956403269754768,
+ "grad_norm": 14.527582168579102,
+ "learning_rate": 1.9484575911319934e-05,
+ "loss": 1.2534,
+ "step": 4755
+ },
+ {
+ "epoch": 12.959128065395095,
+ "grad_norm": 12.558151245117188,
+ "learning_rate": 1.9484296208234232e-05,
+ "loss": 1.4653,
+ "step": 4756
+ },
+ {
+ "epoch": 12.961852861035423,
+ "grad_norm": 16.638273239135742,
+ "learning_rate": 1.9484016431285137e-05,
+ "loss": 1.2145,
+ "step": 4757
+ },
+ {
+ "epoch": 12.964577656675749,
+ "grad_norm": 11.54865550994873,
+ "learning_rate": 1.948373658047483e-05,
+ "loss": 1.1606,
+ "step": 4758
+ },
+ {
+ "epoch": 12.967302452316076,
+ "grad_norm": 28.242734909057617,
+ "learning_rate": 1.9483456655805485e-05,
+ "loss": 1.3115,
+ "step": 4759
+ },
+ {
+ "epoch": 12.970027247956404,
+ "grad_norm": 13.323819160461426,
+ "learning_rate": 1.9483176657279282e-05,
+ "loss": 1.4126,
+ "step": 4760
+ },
+ {
+ "epoch": 12.97275204359673,
+ "grad_norm": 14.263542175292969,
+ "learning_rate": 1.948289658489841e-05,
+ "loss": 1.2168,
+ "step": 4761
+ },
+ {
+ "epoch": 12.975476839237057,
+ "grad_norm": 11.75001335144043,
+ "learning_rate": 1.9482616438665037e-05,
+ "loss": 1.4028,
+ "step": 4762
+ },
+ {
+ "epoch": 12.978201634877385,
+ "grad_norm": 12.625207901000977,
+ "learning_rate": 1.9482336218581358e-05,
+ "loss": 1.2711,
+ "step": 4763
+ },
+ {
+ "epoch": 12.98092643051771,
+ "grad_norm": 12.272146224975586,
+ "learning_rate": 1.9482055924649552e-05,
+ "loss": 1.2874,
+ "step": 4764
+ },
+ {
+ "epoch": 12.983651226158038,
+ "grad_norm": 13.786018371582031,
+ "learning_rate": 1.9481775556871795e-05,
+ "loss": 1.2549,
+ "step": 4765
+ },
+ {
+ "epoch": 12.986376021798366,
+ "grad_norm": 10.136306762695312,
+ "learning_rate": 1.9481495115250277e-05,
+ "loss": 1.1978,
+ "step": 4766
+ },
+ {
+ "epoch": 12.989100817438691,
+ "grad_norm": 10.84641170501709,
+ "learning_rate": 1.9481214599787178e-05,
+ "loss": 1.2397,
+ "step": 4767
+ },
+ {
+ "epoch": 12.991825613079019,
+ "grad_norm": 10.182979583740234,
+ "learning_rate": 1.948093401048469e-05,
+ "loss": 1.1631,
+ "step": 4768
+ },
+ {
+ "epoch": 12.994550408719347,
+ "grad_norm": 9.386366844177246,
+ "learning_rate": 1.9480653347344992e-05,
+ "loss": 1.2756,
+ "step": 4769
+ },
+ {
+ "epoch": 12.997275204359672,
+ "grad_norm": 10.589299201965332,
+ "learning_rate": 1.9480372610370265e-05,
+ "loss": 0.9358,
+ "step": 4770
+ },
+ {
+ "epoch": 13.0,
+ "grad_norm": 9.844215393066406,
+ "learning_rate": 1.9480091799562706e-05,
+ "loss": 1.0752,
+ "step": 4771
+ },
+ {
+ "epoch": 13.002724795640328,
+ "grad_norm": 7.666797637939453,
+ "learning_rate": 1.9479810914924498e-05,
+ "loss": 0.9545,
+ "step": 4772
+ },
+ {
+ "epoch": 13.005449591280653,
+ "grad_norm": 7.6852946281433105,
+ "learning_rate": 1.9479529956457825e-05,
+ "loss": 1.082,
+ "step": 4773
+ },
+ {
+ "epoch": 13.008174386920981,
+ "grad_norm": 12.821184158325195,
+ "learning_rate": 1.9479248924164878e-05,
+ "loss": 1.1492,
+ "step": 4774
+ },
+ {
+ "epoch": 13.010899182561309,
+ "grad_norm": 8.613661766052246,
+ "learning_rate": 1.9478967818047846e-05,
+ "loss": 1.1296,
+ "step": 4775
+ },
+ {
+ "epoch": 13.013623978201634,
+ "grad_norm": 9.4019136428833,
+ "learning_rate": 1.947868663810892e-05,
+ "loss": 1.0706,
+ "step": 4776
+ },
+ {
+ "epoch": 13.016348773841962,
+ "grad_norm": 11.372208595275879,
+ "learning_rate": 1.9478405384350283e-05,
+ "loss": 0.9995,
+ "step": 4777
+ },
+ {
+ "epoch": 13.01907356948229,
+ "grad_norm": 8.624147415161133,
+ "learning_rate": 1.9478124056774133e-05,
+ "loss": 1.0875,
+ "step": 4778
+ },
+ {
+ "epoch": 13.021798365122615,
+ "grad_norm": 10.279169082641602,
+ "learning_rate": 1.9477842655382656e-05,
+ "loss": 1.126,
+ "step": 4779
+ },
+ {
+ "epoch": 13.024523160762943,
+ "grad_norm": 10.575634002685547,
+ "learning_rate": 1.9477561180178048e-05,
+ "loss": 1.1987,
+ "step": 4780
+ },
+ {
+ "epoch": 13.02724795640327,
+ "grad_norm": 11.488377571105957,
+ "learning_rate": 1.9477279631162494e-05,
+ "loss": 1.0762,
+ "step": 4781
+ },
+ {
+ "epoch": 13.029972752043596,
+ "grad_norm": 10.141093254089355,
+ "learning_rate": 1.9476998008338197e-05,
+ "loss": 1.0608,
+ "step": 4782
+ },
+ {
+ "epoch": 13.032697547683924,
+ "grad_norm": 9.139327049255371,
+ "learning_rate": 1.9476716311707342e-05,
+ "loss": 1.238,
+ "step": 4783
+ },
+ {
+ "epoch": 13.035422343324251,
+ "grad_norm": 8.857711791992188,
+ "learning_rate": 1.9476434541272127e-05,
+ "loss": 1.1503,
+ "step": 4784
+ },
+ {
+ "epoch": 13.038147138964577,
+ "grad_norm": 10.265288352966309,
+ "learning_rate": 1.9476152697034743e-05,
+ "loss": 1.0933,
+ "step": 4785
+ },
+ {
+ "epoch": 13.040871934604905,
+ "grad_norm": 9.10065746307373,
+ "learning_rate": 1.9475870778997386e-05,
+ "loss": 1.1567,
+ "step": 4786
+ },
+ {
+ "epoch": 13.043596730245232,
+ "grad_norm": 7.665113925933838,
+ "learning_rate": 1.947558878716225e-05,
+ "loss": 1.103,
+ "step": 4787
+ },
+ {
+ "epoch": 13.046321525885558,
+ "grad_norm": 8.798256874084473,
+ "learning_rate": 1.947530672153154e-05,
+ "loss": 1.1296,
+ "step": 4788
+ },
+ {
+ "epoch": 13.049046321525886,
+ "grad_norm": 8.013124465942383,
+ "learning_rate": 1.9475024582107443e-05,
+ "loss": 1.1741,
+ "step": 4789
+ },
+ {
+ "epoch": 13.051771117166213,
+ "grad_norm": 8.364792823791504,
+ "learning_rate": 1.9474742368892162e-05,
+ "loss": 1.1431,
+ "step": 4790
+ },
+ {
+ "epoch": 13.054495912806539,
+ "grad_norm": 7.662590026855469,
+ "learning_rate": 1.9474460081887888e-05,
+ "loss": 1.2012,
+ "step": 4791
+ },
+ {
+ "epoch": 13.057220708446867,
+ "grad_norm": 9.507669448852539,
+ "learning_rate": 1.9474177721096825e-05,
+ "loss": 1.1265,
+ "step": 4792
+ },
+ {
+ "epoch": 13.059945504087194,
+ "grad_norm": 10.31091594696045,
+ "learning_rate": 1.9473895286521173e-05,
+ "loss": 0.9613,
+ "step": 4793
+ },
+ {
+ "epoch": 13.06267029972752,
+ "grad_norm": 7.168553352355957,
+ "learning_rate": 1.9473612778163126e-05,
+ "loss": 0.9987,
+ "step": 4794
+ },
+ {
+ "epoch": 13.065395095367847,
+ "grad_norm": 9.055052757263184,
+ "learning_rate": 1.9473330196024892e-05,
+ "loss": 1.1428,
+ "step": 4795
+ },
+ {
+ "epoch": 13.068119891008175,
+ "grad_norm": 8.657708168029785,
+ "learning_rate": 1.947304754010866e-05,
+ "loss": 1.0333,
+ "step": 4796
+ },
+ {
+ "epoch": 13.0708446866485,
+ "grad_norm": 8.923104286193848,
+ "learning_rate": 1.9472764810416647e-05,
+ "loss": 1.1104,
+ "step": 4797
+ },
+ {
+ "epoch": 13.073569482288828,
+ "grad_norm": 7.689241886138916,
+ "learning_rate": 1.9472482006951045e-05,
+ "loss": 1.0107,
+ "step": 4798
+ },
+ {
+ "epoch": 13.076294277929156,
+ "grad_norm": 8.09443473815918,
+ "learning_rate": 1.9472199129714053e-05,
+ "loss": 0.9927,
+ "step": 4799
+ },
+ {
+ "epoch": 13.079019073569482,
+ "grad_norm": 9.916367530822754,
+ "learning_rate": 1.947191617870788e-05,
+ "loss": 1.1208,
+ "step": 4800
+ },
+ {
+ "epoch": 13.08174386920981,
+ "grad_norm": 7.7582106590271,
+ "learning_rate": 1.9471633153934735e-05,
+ "loss": 1.0,
+ "step": 4801
+ },
+ {
+ "epoch": 13.084468664850137,
+ "grad_norm": 8.89434814453125,
+ "learning_rate": 1.9471350055396813e-05,
+ "loss": 1.0178,
+ "step": 4802
+ },
+ {
+ "epoch": 13.087193460490463,
+ "grad_norm": 10.418031692504883,
+ "learning_rate": 1.9471066883096318e-05,
+ "loss": 1.1067,
+ "step": 4803
+ },
+ {
+ "epoch": 13.08991825613079,
+ "grad_norm": 8.61137866973877,
+ "learning_rate": 1.947078363703546e-05,
+ "loss": 1.058,
+ "step": 4804
+ },
+ {
+ "epoch": 13.092643051771118,
+ "grad_norm": 8.120413780212402,
+ "learning_rate": 1.9470500317216447e-05,
+ "loss": 1.09,
+ "step": 4805
+ },
+ {
+ "epoch": 13.095367847411444,
+ "grad_norm": 8.580293655395508,
+ "learning_rate": 1.947021692364148e-05,
+ "loss": 1.0365,
+ "step": 4806
+ },
+ {
+ "epoch": 13.098092643051771,
+ "grad_norm": 11.327431678771973,
+ "learning_rate": 1.9469933456312768e-05,
+ "loss": 1.1143,
+ "step": 4807
+ },
+ {
+ "epoch": 13.100817438692099,
+ "grad_norm": 8.277037620544434,
+ "learning_rate": 1.946964991523252e-05,
+ "loss": 1.1616,
+ "step": 4808
+ },
+ {
+ "epoch": 13.103542234332425,
+ "grad_norm": 16.122602462768555,
+ "learning_rate": 1.9469366300402943e-05,
+ "loss": 0.9401,
+ "step": 4809
+ },
+ {
+ "epoch": 13.106267029972752,
+ "grad_norm": 11.935078620910645,
+ "learning_rate": 1.9469082611826247e-05,
+ "loss": 1.2131,
+ "step": 4810
+ },
+ {
+ "epoch": 13.10899182561308,
+ "grad_norm": 9.547844886779785,
+ "learning_rate": 1.9468798849504637e-05,
+ "loss": 1.1139,
+ "step": 4811
+ },
+ {
+ "epoch": 13.111716621253406,
+ "grad_norm": 8.435270309448242,
+ "learning_rate": 1.946851501344033e-05,
+ "loss": 1.1428,
+ "step": 4812
+ },
+ {
+ "epoch": 13.114441416893733,
+ "grad_norm": 11.99997329711914,
+ "learning_rate": 1.946823110363553e-05,
+ "loss": 1.0203,
+ "step": 4813
+ },
+ {
+ "epoch": 13.11716621253406,
+ "grad_norm": 10.833842277526855,
+ "learning_rate": 1.9467947120092456e-05,
+ "loss": 1.2686,
+ "step": 4814
+ },
+ {
+ "epoch": 13.119891008174386,
+ "grad_norm": 10.036761283874512,
+ "learning_rate": 1.946766306281331e-05,
+ "loss": 1.2429,
+ "step": 4815
+ },
+ {
+ "epoch": 13.122615803814714,
+ "grad_norm": 12.2543306350708,
+ "learning_rate": 1.9467378931800307e-05,
+ "loss": 1.2078,
+ "step": 4816
+ },
+ {
+ "epoch": 13.125340599455042,
+ "grad_norm": 11.304621696472168,
+ "learning_rate": 1.9467094727055666e-05,
+ "loss": 1.0267,
+ "step": 4817
+ },
+ {
+ "epoch": 13.128065395095367,
+ "grad_norm": 7.782921314239502,
+ "learning_rate": 1.9466810448581593e-05,
+ "loss": 1.2629,
+ "step": 4818
+ },
+ {
+ "epoch": 13.130790190735695,
+ "grad_norm": 10.114357948303223,
+ "learning_rate": 1.9466526096380306e-05,
+ "loss": 1.1245,
+ "step": 4819
+ },
+ {
+ "epoch": 13.133514986376023,
+ "grad_norm": 12.20517349243164,
+ "learning_rate": 1.946624167045402e-05,
+ "loss": 1.1082,
+ "step": 4820
+ },
+ {
+ "epoch": 13.136239782016348,
+ "grad_norm": 7.676155090332031,
+ "learning_rate": 1.9465957170804945e-05,
+ "loss": 0.9092,
+ "step": 4821
+ },
+ {
+ "epoch": 13.138964577656676,
+ "grad_norm": 17.275049209594727,
+ "learning_rate": 1.9465672597435305e-05,
+ "loss": 1.0386,
+ "step": 4822
+ },
+ {
+ "epoch": 13.141689373297003,
+ "grad_norm": 9.47167682647705,
+ "learning_rate": 1.946538795034731e-05,
+ "loss": 1.1665,
+ "step": 4823
+ },
+ {
+ "epoch": 13.14441416893733,
+ "grad_norm": 10.40883731842041,
+ "learning_rate": 1.9465103229543177e-05,
+ "loss": 0.9478,
+ "step": 4824
+ },
+ {
+ "epoch": 13.147138964577657,
+ "grad_norm": 8.743013381958008,
+ "learning_rate": 1.9464818435025123e-05,
+ "loss": 1.0924,
+ "step": 4825
+ },
+ {
+ "epoch": 13.149863760217984,
+ "grad_norm": 9.411235809326172,
+ "learning_rate": 1.946453356679537e-05,
+ "loss": 1.4094,
+ "step": 4826
+ },
+ {
+ "epoch": 13.15258855585831,
+ "grad_norm": 7.757769584655762,
+ "learning_rate": 1.946424862485613e-05,
+ "loss": 1.0376,
+ "step": 4827
+ },
+ {
+ "epoch": 13.155313351498638,
+ "grad_norm": 11.2542142868042,
+ "learning_rate": 1.9463963609209634e-05,
+ "loss": 1.0562,
+ "step": 4828
+ },
+ {
+ "epoch": 13.158038147138965,
+ "grad_norm": 18.28806495666504,
+ "learning_rate": 1.946367851985809e-05,
+ "loss": 1.0532,
+ "step": 4829
+ },
+ {
+ "epoch": 13.160762942779291,
+ "grad_norm": 10.936038970947266,
+ "learning_rate": 1.946339335680372e-05,
+ "loss": 1.187,
+ "step": 4830
+ },
+ {
+ "epoch": 13.163487738419619,
+ "grad_norm": 9.41383171081543,
+ "learning_rate": 1.946310812004875e-05,
+ "loss": 1.1675,
+ "step": 4831
+ },
+ {
+ "epoch": 13.166212534059946,
+ "grad_norm": 8.845934867858887,
+ "learning_rate": 1.94628228095954e-05,
+ "loss": 1.0764,
+ "step": 4832
+ },
+ {
+ "epoch": 13.168937329700272,
+ "grad_norm": 8.47250747680664,
+ "learning_rate": 1.9462537425445886e-05,
+ "loss": 1.2778,
+ "step": 4833
+ },
+ {
+ "epoch": 13.1716621253406,
+ "grad_norm": 7.736001014709473,
+ "learning_rate": 1.946225196760244e-05,
+ "loss": 1.1509,
+ "step": 4834
+ },
+ {
+ "epoch": 13.174386920980927,
+ "grad_norm": 10.229379653930664,
+ "learning_rate": 1.9461966436067277e-05,
+ "loss": 1.1388,
+ "step": 4835
+ },
+ {
+ "epoch": 13.177111716621253,
+ "grad_norm": 7.262877941131592,
+ "learning_rate": 1.9461680830842623e-05,
+ "loss": 1.1038,
+ "step": 4836
+ },
+ {
+ "epoch": 13.17983651226158,
+ "grad_norm": 12.27935791015625,
+ "learning_rate": 1.9461395151930707e-05,
+ "loss": 1.2803,
+ "step": 4837
+ },
+ {
+ "epoch": 13.182561307901908,
+ "grad_norm": 9.038432121276855,
+ "learning_rate": 1.9461109399333748e-05,
+ "loss": 1.2936,
+ "step": 4838
+ },
+ {
+ "epoch": 13.185286103542234,
+ "grad_norm": 13.52312183380127,
+ "learning_rate": 1.9460823573053972e-05,
+ "loss": 1.2933,
+ "step": 4839
+ },
+ {
+ "epoch": 13.188010899182562,
+ "grad_norm": 10.074718475341797,
+ "learning_rate": 1.946053767309361e-05,
+ "loss": 1.0635,
+ "step": 4840
+ },
+ {
+ "epoch": 13.190735694822889,
+ "grad_norm": 8.525565147399902,
+ "learning_rate": 1.946025169945488e-05,
+ "loss": 1.052,
+ "step": 4841
+ },
+ {
+ "epoch": 13.193460490463215,
+ "grad_norm": 8.379159927368164,
+ "learning_rate": 1.945996565214002e-05,
+ "loss": 1.0662,
+ "step": 4842
+ },
+ {
+ "epoch": 13.196185286103542,
+ "grad_norm": 7.827342987060547,
+ "learning_rate": 1.9459679531151246e-05,
+ "loss": 1.02,
+ "step": 4843
+ },
+ {
+ "epoch": 13.19891008174387,
+ "grad_norm": 9.321455001831055,
+ "learning_rate": 1.9459393336490797e-05,
+ "loss": 1.0466,
+ "step": 4844
+ },
+ {
+ "epoch": 13.201634877384196,
+ "grad_norm": 8.47685432434082,
+ "learning_rate": 1.9459107068160898e-05,
+ "loss": 1.0537,
+ "step": 4845
+ },
+ {
+ "epoch": 13.204359673024523,
+ "grad_norm": 10.115507125854492,
+ "learning_rate": 1.9458820726163774e-05,
+ "loss": 1.1064,
+ "step": 4846
+ },
+ {
+ "epoch": 13.207084468664851,
+ "grad_norm": 9.728424072265625,
+ "learning_rate": 1.945853431050166e-05,
+ "loss": 1.0018,
+ "step": 4847
+ },
+ {
+ "epoch": 13.209809264305177,
+ "grad_norm": 8.614083290100098,
+ "learning_rate": 1.9458247821176787e-05,
+ "loss": 0.9924,
+ "step": 4848
+ },
+ {
+ "epoch": 13.212534059945504,
+ "grad_norm": 10.828216552734375,
+ "learning_rate": 1.945796125819138e-05,
+ "loss": 1.1628,
+ "step": 4849
+ },
+ {
+ "epoch": 13.215258855585832,
+ "grad_norm": 7.806414604187012,
+ "learning_rate": 1.9457674621547678e-05,
+ "loss": 1.1448,
+ "step": 4850
+ },
+ {
+ "epoch": 13.217983651226158,
+ "grad_norm": 10.824487686157227,
+ "learning_rate": 1.945738791124791e-05,
+ "loss": 1.1963,
+ "step": 4851
+ },
+ {
+ "epoch": 13.220708446866485,
+ "grad_norm": 9.565332412719727,
+ "learning_rate": 1.945710112729431e-05,
+ "loss": 1.0291,
+ "step": 4852
+ },
+ {
+ "epoch": 13.223433242506813,
+ "grad_norm": 9.20203685760498,
+ "learning_rate": 1.9456814269689112e-05,
+ "loss": 1.2798,
+ "step": 4853
+ },
+ {
+ "epoch": 13.226158038147139,
+ "grad_norm": 14.028481483459473,
+ "learning_rate": 1.9456527338434545e-05,
+ "loss": 1.0686,
+ "step": 4854
+ },
+ {
+ "epoch": 13.228882833787466,
+ "grad_norm": 8.253077507019043,
+ "learning_rate": 1.945624033353285e-05,
+ "loss": 1.2712,
+ "step": 4855
+ },
+ {
+ "epoch": 13.231607629427794,
+ "grad_norm": 12.524160385131836,
+ "learning_rate": 1.945595325498626e-05,
+ "loss": 1.1675,
+ "step": 4856
+ },
+ {
+ "epoch": 13.23433242506812,
+ "grad_norm": 9.643004417419434,
+ "learning_rate": 1.9455666102797007e-05,
+ "loss": 1.1772,
+ "step": 4857
+ },
+ {
+ "epoch": 13.237057220708447,
+ "grad_norm": 9.738412857055664,
+ "learning_rate": 1.9455378876967335e-05,
+ "loss": 1.032,
+ "step": 4858
+ },
+ {
+ "epoch": 13.239782016348773,
+ "grad_norm": 8.651823043823242,
+ "learning_rate": 1.9455091577499476e-05,
+ "loss": 1.1724,
+ "step": 4859
+ },
+ {
+ "epoch": 13.2425068119891,
+ "grad_norm": 11.075654029846191,
+ "learning_rate": 1.9454804204395667e-05,
+ "loss": 1.0635,
+ "step": 4860
+ },
+ {
+ "epoch": 13.245231607629428,
+ "grad_norm": 12.856353759765625,
+ "learning_rate": 1.9454516757658142e-05,
+ "loss": 1.1277,
+ "step": 4861
+ },
+ {
+ "epoch": 13.247956403269754,
+ "grad_norm": 8.579092979431152,
+ "learning_rate": 1.9454229237289152e-05,
+ "loss": 1.0472,
+ "step": 4862
+ },
+ {
+ "epoch": 13.250681198910081,
+ "grad_norm": 10.595727920532227,
+ "learning_rate": 1.9453941643290928e-05,
+ "loss": 1.1139,
+ "step": 4863
+ },
+ {
+ "epoch": 13.253405994550409,
+ "grad_norm": 11.85381031036377,
+ "learning_rate": 1.945365397566571e-05,
+ "loss": 1.0942,
+ "step": 4864
+ },
+ {
+ "epoch": 13.256130790190735,
+ "grad_norm": 14.746014595031738,
+ "learning_rate": 1.9453366234415737e-05,
+ "loss": 1.1694,
+ "step": 4865
+ },
+ {
+ "epoch": 13.258855585831062,
+ "grad_norm": 8.3314847946167,
+ "learning_rate": 1.9453078419543257e-05,
+ "loss": 0.9364,
+ "step": 4866
+ },
+ {
+ "epoch": 13.26158038147139,
+ "grad_norm": 10.424186706542969,
+ "learning_rate": 1.9452790531050502e-05,
+ "loss": 1.1519,
+ "step": 4867
+ },
+ {
+ "epoch": 13.264305177111716,
+ "grad_norm": 10.4879732131958,
+ "learning_rate": 1.945250256893972e-05,
+ "loss": 1.062,
+ "step": 4868
+ },
+ {
+ "epoch": 13.267029972752043,
+ "grad_norm": 9.179813385009766,
+ "learning_rate": 1.945221453321315e-05,
+ "loss": 1.2612,
+ "step": 4869
+ },
+ {
+ "epoch": 13.269754768392371,
+ "grad_norm": 11.862262725830078,
+ "learning_rate": 1.945192642387304e-05,
+ "loss": 1.2861,
+ "step": 4870
+ },
+ {
+ "epoch": 13.272479564032697,
+ "grad_norm": 15.201726913452148,
+ "learning_rate": 1.945163824092163e-05,
+ "loss": 1.2764,
+ "step": 4871
+ },
+ {
+ "epoch": 13.275204359673024,
+ "grad_norm": 9.373326301574707,
+ "learning_rate": 1.9451349984361168e-05,
+ "loss": 1.1027,
+ "step": 4872
+ },
+ {
+ "epoch": 13.277929155313352,
+ "grad_norm": 9.788365364074707,
+ "learning_rate": 1.9451061654193893e-05,
+ "loss": 1.0702,
+ "step": 4873
+ },
+ {
+ "epoch": 13.280653950953678,
+ "grad_norm": 10.5549955368042,
+ "learning_rate": 1.9450773250422058e-05,
+ "loss": 1.0361,
+ "step": 4874
+ },
+ {
+ "epoch": 13.283378746594005,
+ "grad_norm": 16.18577003479004,
+ "learning_rate": 1.9450484773047905e-05,
+ "loss": 0.9915,
+ "step": 4875
+ },
+ {
+ "epoch": 13.286103542234333,
+ "grad_norm": 9.295065879821777,
+ "learning_rate": 1.9450196222073676e-05,
+ "loss": 1.0227,
+ "step": 4876
+ },
+ {
+ "epoch": 13.288828337874659,
+ "grad_norm": 9.181978225708008,
+ "learning_rate": 1.9449907597501626e-05,
+ "loss": 1.218,
+ "step": 4877
+ },
+ {
+ "epoch": 13.291553133514986,
+ "grad_norm": 8.142616271972656,
+ "learning_rate": 1.9449618899334e-05,
+ "loss": 0.8522,
+ "step": 4878
+ },
+ {
+ "epoch": 13.294277929155314,
+ "grad_norm": 11.572206497192383,
+ "learning_rate": 1.9449330127573044e-05,
+ "loss": 1.0811,
+ "step": 4879
+ },
+ {
+ "epoch": 13.29700272479564,
+ "grad_norm": 9.058589935302734,
+ "learning_rate": 1.9449041282221012e-05,
+ "loss": 1.0762,
+ "step": 4880
+ },
+ {
+ "epoch": 13.299727520435967,
+ "grad_norm": 11.395737648010254,
+ "learning_rate": 1.9448752363280147e-05,
+ "loss": 1.343,
+ "step": 4881
+ },
+ {
+ "epoch": 13.302452316076295,
+ "grad_norm": 10.529814720153809,
+ "learning_rate": 1.9448463370752705e-05,
+ "loss": 0.9668,
+ "step": 4882
+ },
+ {
+ "epoch": 13.30517711171662,
+ "grad_norm": 7.888298034667969,
+ "learning_rate": 1.9448174304640936e-05,
+ "loss": 0.9543,
+ "step": 4883
+ },
+ {
+ "epoch": 13.307901907356948,
+ "grad_norm": 9.759827613830566,
+ "learning_rate": 1.944788516494709e-05,
+ "loss": 1.3025,
+ "step": 4884
+ },
+ {
+ "epoch": 13.310626702997276,
+ "grad_norm": 11.753057479858398,
+ "learning_rate": 1.9447595951673415e-05,
+ "loss": 1.0895,
+ "step": 4885
+ },
+ {
+ "epoch": 13.313351498637601,
+ "grad_norm": 10.756237983703613,
+ "learning_rate": 1.9447306664822166e-05,
+ "loss": 1.1907,
+ "step": 4886
+ },
+ {
+ "epoch": 13.316076294277929,
+ "grad_norm": 9.583301544189453,
+ "learning_rate": 1.94470173043956e-05,
+ "loss": 1.1617,
+ "step": 4887
+ },
+ {
+ "epoch": 13.318801089918257,
+ "grad_norm": 8.751459121704102,
+ "learning_rate": 1.9446727870395964e-05,
+ "loss": 0.9995,
+ "step": 4888
+ },
+ {
+ "epoch": 13.321525885558582,
+ "grad_norm": 12.962774276733398,
+ "learning_rate": 1.944643836282552e-05,
+ "loss": 1.1714,
+ "step": 4889
+ },
+ {
+ "epoch": 13.32425068119891,
+ "grad_norm": 9.904338836669922,
+ "learning_rate": 1.9446148781686515e-05,
+ "loss": 1.114,
+ "step": 4890
+ },
+ {
+ "epoch": 13.326975476839237,
+ "grad_norm": 8.514065742492676,
+ "learning_rate": 1.9445859126981207e-05,
+ "loss": 0.9292,
+ "step": 4891
+ },
+ {
+ "epoch": 13.329700272479563,
+ "grad_norm": 13.031332969665527,
+ "learning_rate": 1.9445569398711853e-05,
+ "loss": 1.1843,
+ "step": 4892
+ },
+ {
+ "epoch": 13.33242506811989,
+ "grad_norm": 8.385294914245605,
+ "learning_rate": 1.944527959688071e-05,
+ "loss": 1.3203,
+ "step": 4893
+ },
+ {
+ "epoch": 13.335149863760218,
+ "grad_norm": 10.21648120880127,
+ "learning_rate": 1.9444989721490034e-05,
+ "loss": 1.2075,
+ "step": 4894
+ },
+ {
+ "epoch": 13.337874659400544,
+ "grad_norm": 9.46163272857666,
+ "learning_rate": 1.9444699772542076e-05,
+ "loss": 1.0375,
+ "step": 4895
+ },
+ {
+ "epoch": 13.340599455040872,
+ "grad_norm": 7.836633205413818,
+ "learning_rate": 1.9444409750039107e-05,
+ "loss": 0.8973,
+ "step": 4896
+ },
+ {
+ "epoch": 13.3433242506812,
+ "grad_norm": 9.458667755126953,
+ "learning_rate": 1.9444119653983376e-05,
+ "loss": 1.175,
+ "step": 4897
+ },
+ {
+ "epoch": 13.346049046321525,
+ "grad_norm": 10.297599792480469,
+ "learning_rate": 1.9443829484377147e-05,
+ "loss": 1.1794,
+ "step": 4898
+ },
+ {
+ "epoch": 13.348773841961853,
+ "grad_norm": 8.998893737792969,
+ "learning_rate": 1.9443539241222672e-05,
+ "loss": 1.0908,
+ "step": 4899
+ },
+ {
+ "epoch": 13.35149863760218,
+ "grad_norm": 9.326870918273926,
+ "learning_rate": 1.9443248924522223e-05,
+ "loss": 0.962,
+ "step": 4900
+ },
+ {
+ "epoch": 13.354223433242506,
+ "grad_norm": 14.722137451171875,
+ "learning_rate": 1.9442958534278054e-05,
+ "loss": 1.2463,
+ "step": 4901
+ },
+ {
+ "epoch": 13.356948228882834,
+ "grad_norm": 11.660216331481934,
+ "learning_rate": 1.944266807049243e-05,
+ "loss": 1.0574,
+ "step": 4902
+ },
+ {
+ "epoch": 13.359673024523161,
+ "grad_norm": 9.365885734558105,
+ "learning_rate": 1.944237753316761e-05,
+ "loss": 1.0701,
+ "step": 4903
+ },
+ {
+ "epoch": 13.362397820163487,
+ "grad_norm": 10.935153007507324,
+ "learning_rate": 1.944208692230585e-05,
+ "loss": 1.0439,
+ "step": 4904
+ },
+ {
+ "epoch": 13.365122615803815,
+ "grad_norm": 8.973504066467285,
+ "learning_rate": 1.944179623790943e-05,
+ "loss": 0.9796,
+ "step": 4905
+ },
+ {
+ "epoch": 13.367847411444142,
+ "grad_norm": 12.400835037231445,
+ "learning_rate": 1.9441505479980602e-05,
+ "loss": 1.0642,
+ "step": 4906
+ },
+ {
+ "epoch": 13.370572207084468,
+ "grad_norm": 16.130796432495117,
+ "learning_rate": 1.9441214648521633e-05,
+ "loss": 1.3103,
+ "step": 4907
+ },
+ {
+ "epoch": 13.373297002724795,
+ "grad_norm": 10.828619003295898,
+ "learning_rate": 1.944092374353479e-05,
+ "loss": 1.0986,
+ "step": 4908
+ },
+ {
+ "epoch": 13.376021798365123,
+ "grad_norm": 10.00255012512207,
+ "learning_rate": 1.9440632765022332e-05,
+ "loss": 0.9907,
+ "step": 4909
+ },
+ {
+ "epoch": 13.378746594005449,
+ "grad_norm": 9.481042861938477,
+ "learning_rate": 1.9440341712986534e-05,
+ "loss": 1.1254,
+ "step": 4910
+ },
+ {
+ "epoch": 13.381471389645776,
+ "grad_norm": 9.945815086364746,
+ "learning_rate": 1.944005058742966e-05,
+ "loss": 1.1763,
+ "step": 4911
+ },
+ {
+ "epoch": 13.384196185286104,
+ "grad_norm": 12.883193969726562,
+ "learning_rate": 1.9439759388353972e-05,
+ "loss": 1.0884,
+ "step": 4912
+ },
+ {
+ "epoch": 13.38692098092643,
+ "grad_norm": 13.921396255493164,
+ "learning_rate": 1.9439468115761745e-05,
+ "loss": 1.2479,
+ "step": 4913
+ },
+ {
+ "epoch": 13.389645776566757,
+ "grad_norm": 8.882813453674316,
+ "learning_rate": 1.943917676965524e-05,
+ "loss": 1.1646,
+ "step": 4914
+ },
+ {
+ "epoch": 13.392370572207085,
+ "grad_norm": 12.870677947998047,
+ "learning_rate": 1.9438885350036735e-05,
+ "loss": 1.4008,
+ "step": 4915
+ },
+ {
+ "epoch": 13.39509536784741,
+ "grad_norm": 8.222795486450195,
+ "learning_rate": 1.943859385690849e-05,
+ "loss": 0.9674,
+ "step": 4916
+ },
+ {
+ "epoch": 13.397820163487738,
+ "grad_norm": 9.917922973632812,
+ "learning_rate": 1.9438302290272782e-05,
+ "loss": 1.0837,
+ "step": 4917
+ },
+ {
+ "epoch": 13.400544959128066,
+ "grad_norm": 13.1954927444458,
+ "learning_rate": 1.943801065013188e-05,
+ "loss": 1.3821,
+ "step": 4918
+ },
+ {
+ "epoch": 13.403269754768392,
+ "grad_norm": 8.951169967651367,
+ "learning_rate": 1.9437718936488054e-05,
+ "loss": 1.1001,
+ "step": 4919
+ },
+ {
+ "epoch": 13.40599455040872,
+ "grad_norm": 14.295671463012695,
+ "learning_rate": 1.9437427149343576e-05,
+ "loss": 1.103,
+ "step": 4920
+ },
+ {
+ "epoch": 13.408719346049047,
+ "grad_norm": 23.772388458251953,
+ "learning_rate": 1.943713528870072e-05,
+ "loss": 1.1239,
+ "step": 4921
+ },
+ {
+ "epoch": 13.411444141689373,
+ "grad_norm": 20.6263484954834,
+ "learning_rate": 1.943684335456176e-05,
+ "loss": 1.2134,
+ "step": 4922
+ },
+ {
+ "epoch": 13.4141689373297,
+ "grad_norm": 12.296714782714844,
+ "learning_rate": 1.9436551346928963e-05,
+ "loss": 1.2314,
+ "step": 4923
+ },
+ {
+ "epoch": 13.416893732970028,
+ "grad_norm": 9.434287071228027,
+ "learning_rate": 1.943625926580461e-05,
+ "loss": 1.0848,
+ "step": 4924
+ },
+ {
+ "epoch": 13.419618528610354,
+ "grad_norm": 8.973977088928223,
+ "learning_rate": 1.9435967111190975e-05,
+ "loss": 1.1523,
+ "step": 4925
+ },
+ {
+ "epoch": 13.422343324250681,
+ "grad_norm": 10.713934898376465,
+ "learning_rate": 1.9435674883090333e-05,
+ "loss": 1.241,
+ "step": 4926
+ },
+ {
+ "epoch": 13.425068119891009,
+ "grad_norm": 12.549975395202637,
+ "learning_rate": 1.9435382581504955e-05,
+ "loss": 1.1179,
+ "step": 4927
+ },
+ {
+ "epoch": 13.427792915531334,
+ "grad_norm": 12.254369735717773,
+ "learning_rate": 1.9435090206437124e-05,
+ "loss": 1.0909,
+ "step": 4928
+ },
+ {
+ "epoch": 13.430517711171662,
+ "grad_norm": 9.583385467529297,
+ "learning_rate": 1.9434797757889114e-05,
+ "loss": 0.9912,
+ "step": 4929
+ },
+ {
+ "epoch": 13.43324250681199,
+ "grad_norm": 12.13889217376709,
+ "learning_rate": 1.94345052358632e-05,
+ "loss": 1.3284,
+ "step": 4930
+ },
+ {
+ "epoch": 13.435967302452315,
+ "grad_norm": 10.6828031539917,
+ "learning_rate": 1.9434212640361662e-05,
+ "loss": 1.0371,
+ "step": 4931
+ },
+ {
+ "epoch": 13.438692098092643,
+ "grad_norm": 8.419368743896484,
+ "learning_rate": 1.9433919971386785e-05,
+ "loss": 1.0361,
+ "step": 4932
+ },
+ {
+ "epoch": 13.44141689373297,
+ "grad_norm": 9.591110229492188,
+ "learning_rate": 1.943362722894084e-05,
+ "loss": 1.3,
+ "step": 4933
+ },
+ {
+ "epoch": 13.444141689373296,
+ "grad_norm": 13.010809898376465,
+ "learning_rate": 1.943333441302611e-05,
+ "loss": 1.002,
+ "step": 4934
+ },
+ {
+ "epoch": 13.446866485013624,
+ "grad_norm": 7.335751056671143,
+ "learning_rate": 1.9433041523644873e-05,
+ "loss": 0.9941,
+ "step": 4935
+ },
+ {
+ "epoch": 13.449591280653951,
+ "grad_norm": 13.550209999084473,
+ "learning_rate": 1.9432748560799416e-05,
+ "loss": 1.3273,
+ "step": 4936
+ },
+ {
+ "epoch": 13.452316076294277,
+ "grad_norm": 10.893725395202637,
+ "learning_rate": 1.9432455524492014e-05,
+ "loss": 0.9391,
+ "step": 4937
+ },
+ {
+ "epoch": 13.455040871934605,
+ "grad_norm": 8.60975170135498,
+ "learning_rate": 1.9432162414724952e-05,
+ "loss": 1.0885,
+ "step": 4938
+ },
+ {
+ "epoch": 13.457765667574932,
+ "grad_norm": 10.962531089782715,
+ "learning_rate": 1.9431869231500516e-05,
+ "loss": 1.2214,
+ "step": 4939
+ },
+ {
+ "epoch": 13.460490463215258,
+ "grad_norm": 10.27914047241211,
+ "learning_rate": 1.9431575974820983e-05,
+ "loss": 1.1592,
+ "step": 4940
+ },
+ {
+ "epoch": 13.463215258855586,
+ "grad_norm": 8.277831077575684,
+ "learning_rate": 1.943128264468864e-05,
+ "loss": 1.0098,
+ "step": 4941
+ },
+ {
+ "epoch": 13.465940054495913,
+ "grad_norm": 8.443522453308105,
+ "learning_rate": 1.943098924110577e-05,
+ "loss": 1.1726,
+ "step": 4942
+ },
+ {
+ "epoch": 13.46866485013624,
+ "grad_norm": 9.645376205444336,
+ "learning_rate": 1.9430695764074662e-05,
+ "loss": 1.0812,
+ "step": 4943
+ },
+ {
+ "epoch": 13.471389645776567,
+ "grad_norm": 11.037893295288086,
+ "learning_rate": 1.9430402213597598e-05,
+ "loss": 1.0818,
+ "step": 4944
+ },
+ {
+ "epoch": 13.474114441416894,
+ "grad_norm": 13.38748836517334,
+ "learning_rate": 1.9430108589676868e-05,
+ "loss": 1.2874,
+ "step": 4945
+ },
+ {
+ "epoch": 13.47683923705722,
+ "grad_norm": 10.455015182495117,
+ "learning_rate": 1.9429814892314752e-05,
+ "loss": 1.1831,
+ "step": 4946
+ },
+ {
+ "epoch": 13.479564032697548,
+ "grad_norm": 11.289458274841309,
+ "learning_rate": 1.9429521121513542e-05,
+ "loss": 1.144,
+ "step": 4947
+ },
+ {
+ "epoch": 13.482288828337875,
+ "grad_norm": 9.35831356048584,
+ "learning_rate": 1.9429227277275525e-05,
+ "loss": 1.0409,
+ "step": 4948
+ },
+ {
+ "epoch": 13.485013623978201,
+ "grad_norm": 18.667573928833008,
+ "learning_rate": 1.942893335960299e-05,
+ "loss": 1.0792,
+ "step": 4949
+ },
+ {
+ "epoch": 13.487738419618529,
+ "grad_norm": 11.403008460998535,
+ "learning_rate": 1.9428639368498223e-05,
+ "loss": 1.2703,
+ "step": 4950
+ },
+ {
+ "epoch": 13.490463215258856,
+ "grad_norm": 9.828926086425781,
+ "learning_rate": 1.9428345303963517e-05,
+ "loss": 1.0442,
+ "step": 4951
+ },
+ {
+ "epoch": 13.493188010899182,
+ "grad_norm": 10.004315376281738,
+ "learning_rate": 1.9428051166001162e-05,
+ "loss": 1.1315,
+ "step": 4952
+ },
+ {
+ "epoch": 13.49591280653951,
+ "grad_norm": 8.655510902404785,
+ "learning_rate": 1.942775695461345e-05,
+ "loss": 0.9866,
+ "step": 4953
+ },
+ {
+ "epoch": 13.498637602179837,
+ "grad_norm": 7.741220951080322,
+ "learning_rate": 1.942746266980267e-05,
+ "loss": 1.1243,
+ "step": 4954
+ },
+ {
+ "epoch": 13.501362397820163,
+ "grad_norm": 7.098425388336182,
+ "learning_rate": 1.942716831157111e-05,
+ "loss": 0.8582,
+ "step": 4955
+ },
+ {
+ "epoch": 13.50408719346049,
+ "grad_norm": 13.48908519744873,
+ "learning_rate": 1.942687387992107e-05,
+ "loss": 1.1384,
+ "step": 4956
+ },
+ {
+ "epoch": 13.506811989100818,
+ "grad_norm": 14.542173385620117,
+ "learning_rate": 1.9426579374854838e-05,
+ "loss": 1.1768,
+ "step": 4957
+ },
+ {
+ "epoch": 13.509536784741144,
+ "grad_norm": 121.65567016601562,
+ "learning_rate": 1.9426284796374712e-05,
+ "loss": 1.3164,
+ "step": 4958
+ },
+ {
+ "epoch": 13.512261580381471,
+ "grad_norm": 11.893477439880371,
+ "learning_rate": 1.942599014448298e-05,
+ "loss": 1.2727,
+ "step": 4959
+ },
+ {
+ "epoch": 13.514986376021799,
+ "grad_norm": 11.721236228942871,
+ "learning_rate": 1.942569541918194e-05,
+ "loss": 0.9863,
+ "step": 4960
+ },
+ {
+ "epoch": 13.517711171662125,
+ "grad_norm": 9.663614273071289,
+ "learning_rate": 1.9425400620473893e-05,
+ "loss": 1.1519,
+ "step": 4961
+ },
+ {
+ "epoch": 13.520435967302452,
+ "grad_norm": 11.535460472106934,
+ "learning_rate": 1.9425105748361122e-05,
+ "loss": 1.1575,
+ "step": 4962
+ },
+ {
+ "epoch": 13.52316076294278,
+ "grad_norm": 15.516406059265137,
+ "learning_rate": 1.9424810802845937e-05,
+ "loss": 1.2666,
+ "step": 4963
+ },
+ {
+ "epoch": 13.525885558583106,
+ "grad_norm": 12.936622619628906,
+ "learning_rate": 1.9424515783930624e-05,
+ "loss": 1.2213,
+ "step": 4964
+ },
+ {
+ "epoch": 13.528610354223433,
+ "grad_norm": 16.40265464782715,
+ "learning_rate": 1.942422069161749e-05,
+ "loss": 1.1985,
+ "step": 4965
+ },
+ {
+ "epoch": 13.53133514986376,
+ "grad_norm": 17.725162506103516,
+ "learning_rate": 1.9423925525908826e-05,
+ "loss": 1.2993,
+ "step": 4966
+ },
+ {
+ "epoch": 13.534059945504087,
+ "grad_norm": 9.422935485839844,
+ "learning_rate": 1.9423630286806928e-05,
+ "loss": 1.166,
+ "step": 4967
+ },
+ {
+ "epoch": 13.536784741144414,
+ "grad_norm": 18.535873413085938,
+ "learning_rate": 1.942333497431411e-05,
+ "loss": 1.3313,
+ "step": 4968
+ },
+ {
+ "epoch": 13.539509536784742,
+ "grad_norm": 10.134592056274414,
+ "learning_rate": 1.9423039588432657e-05,
+ "loss": 1.1255,
+ "step": 4969
+ },
+ {
+ "epoch": 13.542234332425068,
+ "grad_norm": 11.532000541687012,
+ "learning_rate": 1.9422744129164877e-05,
+ "loss": 1.2673,
+ "step": 4970
+ },
+ {
+ "epoch": 13.544959128065395,
+ "grad_norm": 13.674302101135254,
+ "learning_rate": 1.9422448596513067e-05,
+ "loss": 1.2104,
+ "step": 4971
+ },
+ {
+ "epoch": 13.547683923705723,
+ "grad_norm": 9.66440200805664,
+ "learning_rate": 1.9422152990479533e-05,
+ "loss": 1.2751,
+ "step": 4972
+ },
+ {
+ "epoch": 13.550408719346049,
+ "grad_norm": 13.31756591796875,
+ "learning_rate": 1.9421857311066575e-05,
+ "loss": 1.3547,
+ "step": 4973
+ },
+ {
+ "epoch": 13.553133514986376,
+ "grad_norm": 12.21282958984375,
+ "learning_rate": 1.9421561558276495e-05,
+ "loss": 1.1848,
+ "step": 4974
+ },
+ {
+ "epoch": 13.555858310626704,
+ "grad_norm": 11.367598533630371,
+ "learning_rate": 1.942126573211159e-05,
+ "loss": 1.1157,
+ "step": 4975
+ },
+ {
+ "epoch": 13.55858310626703,
+ "grad_norm": 13.134461402893066,
+ "learning_rate": 1.942096983257418e-05,
+ "loss": 1.1757,
+ "step": 4976
+ },
+ {
+ "epoch": 13.561307901907357,
+ "grad_norm": 13.335122108459473,
+ "learning_rate": 1.9420673859666557e-05,
+ "loss": 1.3433,
+ "step": 4977
+ },
+ {
+ "epoch": 13.564032697547685,
+ "grad_norm": 13.226652145385742,
+ "learning_rate": 1.942037781339103e-05,
+ "loss": 1.439,
+ "step": 4978
+ },
+ {
+ "epoch": 13.56675749318801,
+ "grad_norm": 11.82116413116455,
+ "learning_rate": 1.9420081693749903e-05,
+ "loss": 0.9768,
+ "step": 4979
+ },
+ {
+ "epoch": 13.569482288828338,
+ "grad_norm": 10.326279640197754,
+ "learning_rate": 1.941978550074548e-05,
+ "loss": 1.1863,
+ "step": 4980
+ },
+ {
+ "epoch": 13.572207084468666,
+ "grad_norm": 15.456771850585938,
+ "learning_rate": 1.9419489234380077e-05,
+ "loss": 1.1077,
+ "step": 4981
+ },
+ {
+ "epoch": 13.574931880108991,
+ "grad_norm": 22.4259090423584,
+ "learning_rate": 1.941919289465599e-05,
+ "loss": 1.1985,
+ "step": 4982
+ },
+ {
+ "epoch": 13.577656675749319,
+ "grad_norm": 11.79200267791748,
+ "learning_rate": 1.9418896481575534e-05,
+ "loss": 1.1946,
+ "step": 4983
+ },
+ {
+ "epoch": 13.580381471389646,
+ "grad_norm": 12.975360870361328,
+ "learning_rate": 1.9418599995141013e-05,
+ "loss": 1.0375,
+ "step": 4984
+ },
+ {
+ "epoch": 13.583106267029972,
+ "grad_norm": 12.62851333618164,
+ "learning_rate": 1.941830343535474e-05,
+ "loss": 1.311,
+ "step": 4985
+ },
+ {
+ "epoch": 13.5858310626703,
+ "grad_norm": 14.895894050598145,
+ "learning_rate": 1.9418006802219022e-05,
+ "loss": 1.3494,
+ "step": 4986
+ },
+ {
+ "epoch": 13.588555858310627,
+ "grad_norm": 15.663689613342285,
+ "learning_rate": 1.9417710095736173e-05,
+ "loss": 1.1829,
+ "step": 4987
+ },
+ {
+ "epoch": 13.591280653950953,
+ "grad_norm": 8.505025863647461,
+ "learning_rate": 1.94174133159085e-05,
+ "loss": 1.0594,
+ "step": 4988
+ },
+ {
+ "epoch": 13.59400544959128,
+ "grad_norm": 10.836217880249023,
+ "learning_rate": 1.9417116462738312e-05,
+ "loss": 1.2996,
+ "step": 4989
+ },
+ {
+ "epoch": 13.596730245231608,
+ "grad_norm": 12.67309856414795,
+ "learning_rate": 1.9416819536227928e-05,
+ "loss": 1.2812,
+ "step": 4990
+ },
+ {
+ "epoch": 13.599455040871934,
+ "grad_norm": 37.39385223388672,
+ "learning_rate": 1.9416522536379653e-05,
+ "loss": 1.1196,
+ "step": 4991
+ },
+ {
+ "epoch": 13.602179836512262,
+ "grad_norm": 13.147069931030273,
+ "learning_rate": 1.9416225463195807e-05,
+ "loss": 1.3328,
+ "step": 4992
+ },
+ {
+ "epoch": 13.60490463215259,
+ "grad_norm": 14.431489944458008,
+ "learning_rate": 1.94159283166787e-05,
+ "loss": 1.074,
+ "step": 4993
+ },
+ {
+ "epoch": 13.607629427792915,
+ "grad_norm": 40.52897644042969,
+ "learning_rate": 1.9415631096830644e-05,
+ "loss": 1.2249,
+ "step": 4994
+ },
+ {
+ "epoch": 13.610354223433243,
+ "grad_norm": 11.68537425994873,
+ "learning_rate": 1.9415333803653955e-05,
+ "loss": 1.0654,
+ "step": 4995
+ },
+ {
+ "epoch": 13.61307901907357,
+ "grad_norm": 10.335807800292969,
+ "learning_rate": 1.941503643715095e-05,
+ "loss": 1.1626,
+ "step": 4996
+ },
+ {
+ "epoch": 13.615803814713896,
+ "grad_norm": 63.72047805786133,
+ "learning_rate": 1.9414738997323947e-05,
+ "loss": 1.1919,
+ "step": 4997
+ },
+ {
+ "epoch": 13.618528610354224,
+ "grad_norm": 10.672576904296875,
+ "learning_rate": 1.9414441484175258e-05,
+ "loss": 1.2578,
+ "step": 4998
+ },
+ {
+ "epoch": 13.621253405994551,
+ "grad_norm": 12.725996971130371,
+ "learning_rate": 1.9414143897707204e-05,
+ "loss": 1.2,
+ "step": 4999
+ },
+ {
+ "epoch": 13.623978201634877,
+ "grad_norm": 9.036222457885742,
+ "learning_rate": 1.9413846237922098e-05,
+ "loss": 1.3495,
+ "step": 5000
+ },
+ {
+ "epoch": 13.626702997275205,
+ "grad_norm": 20.720375061035156,
+ "learning_rate": 1.941354850482226e-05,
+ "loss": 1.2527,
+ "step": 5001
+ },
+ {
+ "epoch": 13.629427792915532,
+ "grad_norm": 15.53624153137207,
+ "learning_rate": 1.941325069841001e-05,
+ "loss": 1.4265,
+ "step": 5002
+ },
+ {
+ "epoch": 13.632152588555858,
+ "grad_norm": 13.139444351196289,
+ "learning_rate": 1.9412952818687665e-05,
+ "loss": 1.3018,
+ "step": 5003
+ },
+ {
+ "epoch": 13.634877384196185,
+ "grad_norm": 10.584000587463379,
+ "learning_rate": 1.941265486565755e-05,
+ "loss": 1.416,
+ "step": 5004
+ },
+ {
+ "epoch": 13.637602179836513,
+ "grad_norm": 9.378589630126953,
+ "learning_rate": 1.941235683932198e-05,
+ "loss": 1.271,
+ "step": 5005
+ },
+ {
+ "epoch": 13.640326975476839,
+ "grad_norm": 19.38829803466797,
+ "learning_rate": 1.9412058739683276e-05,
+ "loss": 1.4248,
+ "step": 5006
+ },
+ {
+ "epoch": 13.643051771117166,
+ "grad_norm": 11.798781394958496,
+ "learning_rate": 1.9411760566743765e-05,
+ "loss": 1.2646,
+ "step": 5007
+ },
+ {
+ "epoch": 13.645776566757494,
+ "grad_norm": 10.712326049804688,
+ "learning_rate": 1.941146232050576e-05,
+ "loss": 1.314,
+ "step": 5008
+ },
+ {
+ "epoch": 13.64850136239782,
+ "grad_norm": 10.130495071411133,
+ "learning_rate": 1.9411164000971597e-05,
+ "loss": 1.2925,
+ "step": 5009
+ },
+ {
+ "epoch": 13.651226158038147,
+ "grad_norm": 21.946491241455078,
+ "learning_rate": 1.9410865608143586e-05,
+ "loss": 1.2432,
+ "step": 5010
+ },
+ {
+ "epoch": 13.653950953678475,
+ "grad_norm": 9.57172966003418,
+ "learning_rate": 1.941056714202406e-05,
+ "loss": 1.2327,
+ "step": 5011
+ },
+ {
+ "epoch": 13.6566757493188,
+ "grad_norm": 12.476937294006348,
+ "learning_rate": 1.9410268602615338e-05,
+ "loss": 1.1344,
+ "step": 5012
+ },
+ {
+ "epoch": 13.659400544959128,
+ "grad_norm": 14.384178161621094,
+ "learning_rate": 1.9409969989919746e-05,
+ "loss": 1.2058,
+ "step": 5013
+ },
+ {
+ "epoch": 13.662125340599456,
+ "grad_norm": 13.131757736206055,
+ "learning_rate": 1.940967130393961e-05,
+ "loss": 1.1837,
+ "step": 5014
+ },
+ {
+ "epoch": 13.664850136239782,
+ "grad_norm": 13.937726974487305,
+ "learning_rate": 1.940937254467726e-05,
+ "loss": 1.2732,
+ "step": 5015
+ },
+ {
+ "epoch": 13.66757493188011,
+ "grad_norm": 12.27633285522461,
+ "learning_rate": 1.940907371213502e-05,
+ "loss": 1.1104,
+ "step": 5016
+ },
+ {
+ "epoch": 13.670299727520437,
+ "grad_norm": 14.232234001159668,
+ "learning_rate": 1.9408774806315215e-05,
+ "loss": 1.2317,
+ "step": 5017
+ },
+ {
+ "epoch": 13.673024523160763,
+ "grad_norm": 11.793499946594238,
+ "learning_rate": 1.9408475827220173e-05,
+ "loss": 1.2783,
+ "step": 5018
+ },
+ {
+ "epoch": 13.67574931880109,
+ "grad_norm": 14.1796293258667,
+ "learning_rate": 1.9408176774852224e-05,
+ "loss": 1.0769,
+ "step": 5019
+ },
+ {
+ "epoch": 13.678474114441418,
+ "grad_norm": 10.935534477233887,
+ "learning_rate": 1.9407877649213696e-05,
+ "loss": 0.9988,
+ "step": 5020
+ },
+ {
+ "epoch": 13.681198910081743,
+ "grad_norm": 10.10819149017334,
+ "learning_rate": 1.9407578450306926e-05,
+ "loss": 1.1537,
+ "step": 5021
+ },
+ {
+ "epoch": 13.683923705722071,
+ "grad_norm": 12.352477073669434,
+ "learning_rate": 1.9407279178134233e-05,
+ "loss": 1.046,
+ "step": 5022
+ },
+ {
+ "epoch": 13.686648501362399,
+ "grad_norm": 12.96524715423584,
+ "learning_rate": 1.9406979832697953e-05,
+ "loss": 1.261,
+ "step": 5023
+ },
+ {
+ "epoch": 13.689373297002724,
+ "grad_norm": 12.40776538848877,
+ "learning_rate": 1.9406680414000418e-05,
+ "loss": 1.2307,
+ "step": 5024
+ },
+ {
+ "epoch": 13.692098092643052,
+ "grad_norm": 9.899091720581055,
+ "learning_rate": 1.9406380922043955e-05,
+ "loss": 1.1104,
+ "step": 5025
+ },
+ {
+ "epoch": 13.69482288828338,
+ "grad_norm": 9.56047534942627,
+ "learning_rate": 1.9406081356830906e-05,
+ "loss": 1.0581,
+ "step": 5026
+ },
+ {
+ "epoch": 13.697547683923705,
+ "grad_norm": 8.775030136108398,
+ "learning_rate": 1.9405781718363595e-05,
+ "loss": 1.0488,
+ "step": 5027
+ },
+ {
+ "epoch": 13.700272479564033,
+ "grad_norm": 10.675580978393555,
+ "learning_rate": 1.940548200664436e-05,
+ "loss": 1.1741,
+ "step": 5028
+ },
+ {
+ "epoch": 13.70299727520436,
+ "grad_norm": 7.952402114868164,
+ "learning_rate": 1.9405182221675535e-05,
+ "loss": 1.1293,
+ "step": 5029
+ },
+ {
+ "epoch": 13.705722070844686,
+ "grad_norm": 9.325764656066895,
+ "learning_rate": 1.940488236345945e-05,
+ "loss": 1.157,
+ "step": 5030
+ },
+ {
+ "epoch": 13.708446866485014,
+ "grad_norm": 10.313379287719727,
+ "learning_rate": 1.9404582431998446e-05,
+ "loss": 1.1921,
+ "step": 5031
+ },
+ {
+ "epoch": 13.711171662125341,
+ "grad_norm": 10.060182571411133,
+ "learning_rate": 1.9404282427294854e-05,
+ "loss": 1.1826,
+ "step": 5032
+ },
+ {
+ "epoch": 13.713896457765667,
+ "grad_norm": 9.37794303894043,
+ "learning_rate": 1.9403982349351014e-05,
+ "loss": 1.1277,
+ "step": 5033
+ },
+ {
+ "epoch": 13.716621253405995,
+ "grad_norm": 12.922962188720703,
+ "learning_rate": 1.9403682198169266e-05,
+ "loss": 1.2212,
+ "step": 5034
+ },
+ {
+ "epoch": 13.719346049046322,
+ "grad_norm": 10.3358793258667,
+ "learning_rate": 1.940338197375194e-05,
+ "loss": 1.1089,
+ "step": 5035
+ },
+ {
+ "epoch": 13.722070844686648,
+ "grad_norm": 10.662749290466309,
+ "learning_rate": 1.940308167610138e-05,
+ "loss": 1.2673,
+ "step": 5036
+ },
+ {
+ "epoch": 13.724795640326976,
+ "grad_norm": 8.988673210144043,
+ "learning_rate": 1.940278130521992e-05,
+ "loss": 1.1497,
+ "step": 5037
+ },
+ {
+ "epoch": 13.727520435967303,
+ "grad_norm": 10.619245529174805,
+ "learning_rate": 1.94024808611099e-05,
+ "loss": 1.1885,
+ "step": 5038
+ },
+ {
+ "epoch": 13.730245231607629,
+ "grad_norm": 10.40213680267334,
+ "learning_rate": 1.9402180343773665e-05,
+ "loss": 1.1804,
+ "step": 5039
+ },
+ {
+ "epoch": 13.732970027247957,
+ "grad_norm": 8.468010902404785,
+ "learning_rate": 1.9401879753213556e-05,
+ "loss": 1.2205,
+ "step": 5040
+ },
+ {
+ "epoch": 13.735694822888284,
+ "grad_norm": 10.093297958374023,
+ "learning_rate": 1.9401579089431904e-05,
+ "loss": 0.8463,
+ "step": 5041
+ },
+ {
+ "epoch": 13.73841961852861,
+ "grad_norm": 10.707527160644531,
+ "learning_rate": 1.940127835243106e-05,
+ "loss": 1.1765,
+ "step": 5042
+ },
+ {
+ "epoch": 13.741144414168938,
+ "grad_norm": 8.857259750366211,
+ "learning_rate": 1.940097754221336e-05,
+ "loss": 1.4438,
+ "step": 5043
+ },
+ {
+ "epoch": 13.743869209809265,
+ "grad_norm": 11.06920051574707,
+ "learning_rate": 1.940067665878115e-05,
+ "loss": 1.3408,
+ "step": 5044
+ },
+ {
+ "epoch": 13.746594005449591,
+ "grad_norm": 8.317543029785156,
+ "learning_rate": 1.9400375702136777e-05,
+ "loss": 0.8645,
+ "step": 5045
+ },
+ {
+ "epoch": 13.749318801089919,
+ "grad_norm": 7.602947235107422,
+ "learning_rate": 1.9400074672282576e-05,
+ "loss": 1.2239,
+ "step": 5046
+ },
+ {
+ "epoch": 13.752043596730246,
+ "grad_norm": 10.72529411315918,
+ "learning_rate": 1.9399773569220896e-05,
+ "loss": 1.2053,
+ "step": 5047
+ },
+ {
+ "epoch": 13.754768392370572,
+ "grad_norm": 9.096590995788574,
+ "learning_rate": 1.939947239295408e-05,
+ "loss": 1.114,
+ "step": 5048
+ },
+ {
+ "epoch": 13.7574931880109,
+ "grad_norm": 8.262537002563477,
+ "learning_rate": 1.939917114348448e-05,
+ "loss": 1.1478,
+ "step": 5049
+ },
+ {
+ "epoch": 13.760217983651227,
+ "grad_norm": 7.784013271331787,
+ "learning_rate": 1.939886982081444e-05,
+ "loss": 1.1875,
+ "step": 5050
+ },
+ {
+ "epoch": 13.762942779291553,
+ "grad_norm": 8.267370223999023,
+ "learning_rate": 1.93985684249463e-05,
+ "loss": 1.0675,
+ "step": 5051
+ },
+ {
+ "epoch": 13.76566757493188,
+ "grad_norm": 7.184292316436768,
+ "learning_rate": 1.939826695588241e-05,
+ "loss": 1.1619,
+ "step": 5052
+ },
+ {
+ "epoch": 13.768392370572208,
+ "grad_norm": 14.374281883239746,
+ "learning_rate": 1.939796541362512e-05,
+ "loss": 1.2981,
+ "step": 5053
+ },
+ {
+ "epoch": 13.771117166212534,
+ "grad_norm": 11.208491325378418,
+ "learning_rate": 1.9397663798176783e-05,
+ "loss": 1.1274,
+ "step": 5054
+ },
+ {
+ "epoch": 13.773841961852861,
+ "grad_norm": 20.029939651489258,
+ "learning_rate": 1.939736210953974e-05,
+ "loss": 1.1852,
+ "step": 5055
+ },
+ {
+ "epoch": 13.776566757493189,
+ "grad_norm": 8.747542381286621,
+ "learning_rate": 1.939706034771634e-05,
+ "loss": 1.1677,
+ "step": 5056
+ },
+ {
+ "epoch": 13.779291553133515,
+ "grad_norm": 8.436010360717773,
+ "learning_rate": 1.9396758512708943e-05,
+ "loss": 1.156,
+ "step": 5057
+ },
+ {
+ "epoch": 13.782016348773842,
+ "grad_norm": 19.555360794067383,
+ "learning_rate": 1.9396456604519885e-05,
+ "loss": 1.2537,
+ "step": 5058
+ },
+ {
+ "epoch": 13.78474114441417,
+ "grad_norm": 9.587838172912598,
+ "learning_rate": 1.939615462315153e-05,
+ "loss": 1.1218,
+ "step": 5059
+ },
+ {
+ "epoch": 13.787465940054496,
+ "grad_norm": 8.060758590698242,
+ "learning_rate": 1.9395852568606225e-05,
+ "loss": 0.8926,
+ "step": 5060
+ },
+ {
+ "epoch": 13.790190735694823,
+ "grad_norm": 9.282258033752441,
+ "learning_rate": 1.9395550440886325e-05,
+ "loss": 1.3179,
+ "step": 5061
+ },
+ {
+ "epoch": 13.79291553133515,
+ "grad_norm": 9.416927337646484,
+ "learning_rate": 1.9395248239994177e-05,
+ "loss": 1.1321,
+ "step": 5062
+ },
+ {
+ "epoch": 13.795640326975477,
+ "grad_norm": 9.92941665649414,
+ "learning_rate": 1.939494596593214e-05,
+ "loss": 1.1082,
+ "step": 5063
+ },
+ {
+ "epoch": 13.798365122615804,
+ "grad_norm": 12.008455276489258,
+ "learning_rate": 1.939464361870256e-05,
+ "loss": 1.0618,
+ "step": 5064
+ },
+ {
+ "epoch": 13.80108991825613,
+ "grad_norm": 8.59157657623291,
+ "learning_rate": 1.9394341198307808e-05,
+ "loss": 0.9966,
+ "step": 5065
+ },
+ {
+ "epoch": 13.803814713896458,
+ "grad_norm": 10.721652030944824,
+ "learning_rate": 1.9394038704750225e-05,
+ "loss": 1.3184,
+ "step": 5066
+ },
+ {
+ "epoch": 13.806539509536785,
+ "grad_norm": 10.89718246459961,
+ "learning_rate": 1.939373613803217e-05,
+ "loss": 1.2522,
+ "step": 5067
+ },
+ {
+ "epoch": 13.809264305177111,
+ "grad_norm": 11.09522533416748,
+ "learning_rate": 1.9393433498155997e-05,
+ "loss": 0.9753,
+ "step": 5068
+ },
+ {
+ "epoch": 13.811989100817438,
+ "grad_norm": 9.063777923583984,
+ "learning_rate": 1.9393130785124073e-05,
+ "loss": 1.3086,
+ "step": 5069
+ },
+ {
+ "epoch": 13.814713896457766,
+ "grad_norm": 12.276968002319336,
+ "learning_rate": 1.9392827998938744e-05,
+ "loss": 1.1953,
+ "step": 5070
+ },
+ {
+ "epoch": 13.817438692098092,
+ "grad_norm": 11.270060539245605,
+ "learning_rate": 1.9392525139602373e-05,
+ "loss": 0.8892,
+ "step": 5071
+ },
+ {
+ "epoch": 13.82016348773842,
+ "grad_norm": 11.454496383666992,
+ "learning_rate": 1.939222220711732e-05,
+ "loss": 1.3066,
+ "step": 5072
+ },
+ {
+ "epoch": 13.822888283378747,
+ "grad_norm": 8.781437873840332,
+ "learning_rate": 1.9391919201485945e-05,
+ "loss": 1.2725,
+ "step": 5073
+ },
+ {
+ "epoch": 13.825613079019073,
+ "grad_norm": 8.515535354614258,
+ "learning_rate": 1.93916161227106e-05,
+ "loss": 0.9761,
+ "step": 5074
+ },
+ {
+ "epoch": 13.8283378746594,
+ "grad_norm": 8.936002731323242,
+ "learning_rate": 1.9391312970793654e-05,
+ "loss": 0.9933,
+ "step": 5075
+ },
+ {
+ "epoch": 13.831062670299728,
+ "grad_norm": 11.896123886108398,
+ "learning_rate": 1.9391009745737465e-05,
+ "loss": 1.0779,
+ "step": 5076
+ },
+ {
+ "epoch": 13.833787465940054,
+ "grad_norm": 8.316001892089844,
+ "learning_rate": 1.9390706447544393e-05,
+ "loss": 1.0015,
+ "step": 5077
+ },
+ {
+ "epoch": 13.836512261580381,
+ "grad_norm": 9.644735336303711,
+ "learning_rate": 1.9390403076216805e-05,
+ "loss": 1.2458,
+ "step": 5078
+ },
+ {
+ "epoch": 13.839237057220709,
+ "grad_norm": 9.578886032104492,
+ "learning_rate": 1.9390099631757057e-05,
+ "loss": 1.3386,
+ "step": 5079
+ },
+ {
+ "epoch": 13.841961852861035,
+ "grad_norm": 7.128910064697266,
+ "learning_rate": 1.938979611416752e-05,
+ "loss": 1.0,
+ "step": 5080
+ },
+ {
+ "epoch": 13.844686648501362,
+ "grad_norm": 8.676445960998535,
+ "learning_rate": 1.9389492523450545e-05,
+ "loss": 1.0251,
+ "step": 5081
+ },
+ {
+ "epoch": 13.84741144414169,
+ "grad_norm": 9.316558837890625,
+ "learning_rate": 1.938918885960851e-05,
+ "loss": 0.9949,
+ "step": 5082
+ },
+ {
+ "epoch": 13.850136239782016,
+ "grad_norm": 12.280668258666992,
+ "learning_rate": 1.9388885122643773e-05,
+ "loss": 1.1279,
+ "step": 5083
+ },
+ {
+ "epoch": 13.852861035422343,
+ "grad_norm": 9.22166633605957,
+ "learning_rate": 1.9388581312558702e-05,
+ "loss": 1.1763,
+ "step": 5084
+ },
+ {
+ "epoch": 13.85558583106267,
+ "grad_norm": 8.401951789855957,
+ "learning_rate": 1.938827742935566e-05,
+ "loss": 1.2942,
+ "step": 5085
+ },
+ {
+ "epoch": 13.858310626702997,
+ "grad_norm": 11.350404739379883,
+ "learning_rate": 1.9387973473037016e-05,
+ "loss": 1.1261,
+ "step": 5086
+ },
+ {
+ "epoch": 13.861035422343324,
+ "grad_norm": 10.082850456237793,
+ "learning_rate": 1.9387669443605137e-05,
+ "loss": 1.0293,
+ "step": 5087
+ },
+ {
+ "epoch": 13.863760217983652,
+ "grad_norm": 10.138223648071289,
+ "learning_rate": 1.938736534106239e-05,
+ "loss": 1.0718,
+ "step": 5088
+ },
+ {
+ "epoch": 13.866485013623977,
+ "grad_norm": 11.336297988891602,
+ "learning_rate": 1.938706116541114e-05,
+ "loss": 1.2708,
+ "step": 5089
+ },
+ {
+ "epoch": 13.869209809264305,
+ "grad_norm": 10.716597557067871,
+ "learning_rate": 1.9386756916653765e-05,
+ "loss": 1.1121,
+ "step": 5090
+ },
+ {
+ "epoch": 13.871934604904633,
+ "grad_norm": 16.344484329223633,
+ "learning_rate": 1.938645259479263e-05,
+ "loss": 1.3132,
+ "step": 5091
+ },
+ {
+ "epoch": 13.874659400544958,
+ "grad_norm": 11.688093185424805,
+ "learning_rate": 1.9386148199830104e-05,
+ "loss": 1.1921,
+ "step": 5092
+ },
+ {
+ "epoch": 13.877384196185286,
+ "grad_norm": 11.601099014282227,
+ "learning_rate": 1.9385843731768556e-05,
+ "loss": 1.0042,
+ "step": 5093
+ },
+ {
+ "epoch": 13.880108991825614,
+ "grad_norm": 14.272059440612793,
+ "learning_rate": 1.9385539190610358e-05,
+ "loss": 1.1868,
+ "step": 5094
+ },
+ {
+ "epoch": 13.88283378746594,
+ "grad_norm": 32.3015022277832,
+ "learning_rate": 1.9385234576357885e-05,
+ "loss": 1.2266,
+ "step": 5095
+ },
+ {
+ "epoch": 13.885558583106267,
+ "grad_norm": 10.42785358428955,
+ "learning_rate": 1.9384929889013507e-05,
+ "loss": 1.1726,
+ "step": 5096
+ },
+ {
+ "epoch": 13.888283378746594,
+ "grad_norm": 10.774063110351562,
+ "learning_rate": 1.9384625128579597e-05,
+ "loss": 1.0793,
+ "step": 5097
+ },
+ {
+ "epoch": 13.89100817438692,
+ "grad_norm": 13.434088706970215,
+ "learning_rate": 1.9384320295058528e-05,
+ "loss": 1.3506,
+ "step": 5098
+ },
+ {
+ "epoch": 13.893732970027248,
+ "grad_norm": 9.60982608795166,
+ "learning_rate": 1.9384015388452674e-05,
+ "loss": 1.2122,
+ "step": 5099
+ },
+ {
+ "epoch": 13.896457765667575,
+ "grad_norm": 9.065067291259766,
+ "learning_rate": 1.9383710408764412e-05,
+ "loss": 1.1741,
+ "step": 5100
+ },
+ {
+ "epoch": 13.899182561307901,
+ "grad_norm": 8.91007137298584,
+ "learning_rate": 1.938340535599611e-05,
+ "loss": 1.0735,
+ "step": 5101
+ },
+ {
+ "epoch": 13.901907356948229,
+ "grad_norm": 9.0178861618042,
+ "learning_rate": 1.938310023015016e-05,
+ "loss": 1.0222,
+ "step": 5102
+ },
+ {
+ "epoch": 13.904632152588556,
+ "grad_norm": 11.126150131225586,
+ "learning_rate": 1.9382795031228915e-05,
+ "loss": 1.3145,
+ "step": 5103
+ },
+ {
+ "epoch": 13.907356948228882,
+ "grad_norm": 15.351320266723633,
+ "learning_rate": 1.9382489759234773e-05,
+ "loss": 1.2039,
+ "step": 5104
+ },
+ {
+ "epoch": 13.91008174386921,
+ "grad_norm": 10.8551025390625,
+ "learning_rate": 1.93821844141701e-05,
+ "loss": 1.2683,
+ "step": 5105
+ },
+ {
+ "epoch": 13.912806539509537,
+ "grad_norm": 9.00561809539795,
+ "learning_rate": 1.9381878996037276e-05,
+ "loss": 1.3562,
+ "step": 5106
+ },
+ {
+ "epoch": 13.915531335149863,
+ "grad_norm": 9.64782428741455,
+ "learning_rate": 1.938157350483868e-05,
+ "loss": 1.0952,
+ "step": 5107
+ },
+ {
+ "epoch": 13.91825613079019,
+ "grad_norm": 19.437721252441406,
+ "learning_rate": 1.9381267940576694e-05,
+ "loss": 1.1235,
+ "step": 5108
+ },
+ {
+ "epoch": 13.920980926430518,
+ "grad_norm": 8.850643157958984,
+ "learning_rate": 1.9380962303253695e-05,
+ "loss": 1.2327,
+ "step": 5109
+ },
+ {
+ "epoch": 13.923705722070844,
+ "grad_norm": 11.061198234558105,
+ "learning_rate": 1.938065659287206e-05,
+ "loss": 1.4087,
+ "step": 5110
+ },
+ {
+ "epoch": 13.926430517711172,
+ "grad_norm": 8.402247428894043,
+ "learning_rate": 1.9380350809434176e-05,
+ "loss": 1.2124,
+ "step": 5111
+ },
+ {
+ "epoch": 13.9291553133515,
+ "grad_norm": 8.88551139831543,
+ "learning_rate": 1.938004495294242e-05,
+ "loss": 1.1362,
+ "step": 5112
+ },
+ {
+ "epoch": 13.931880108991825,
+ "grad_norm": 9.316143989562988,
+ "learning_rate": 1.9379739023399177e-05,
+ "loss": 1.0752,
+ "step": 5113
+ },
+ {
+ "epoch": 13.934604904632153,
+ "grad_norm": 8.615004539489746,
+ "learning_rate": 1.937943302080683e-05,
+ "loss": 1.2195,
+ "step": 5114
+ },
+ {
+ "epoch": 13.93732970027248,
+ "grad_norm": 14.729580879211426,
+ "learning_rate": 1.9379126945167755e-05,
+ "loss": 1.1555,
+ "step": 5115
+ },
+ {
+ "epoch": 13.940054495912806,
+ "grad_norm": 9.22382640838623,
+ "learning_rate": 1.9378820796484348e-05,
+ "loss": 1.0374,
+ "step": 5116
+ },
+ {
+ "epoch": 13.942779291553133,
+ "grad_norm": 14.224115371704102,
+ "learning_rate": 1.9378514574758983e-05,
+ "loss": 1.136,
+ "step": 5117
+ },
+ {
+ "epoch": 13.945504087193461,
+ "grad_norm": 11.138895034790039,
+ "learning_rate": 1.937820827999405e-05,
+ "loss": 0.9072,
+ "step": 5118
+ },
+ {
+ "epoch": 13.948228882833787,
+ "grad_norm": 12.33624267578125,
+ "learning_rate": 1.937790191219193e-05,
+ "loss": 1.3173,
+ "step": 5119
+ },
+ {
+ "epoch": 13.950953678474114,
+ "grad_norm": 9.658340454101562,
+ "learning_rate": 1.9377595471355016e-05,
+ "loss": 1.1707,
+ "step": 5120
+ },
+ {
+ "epoch": 13.953678474114442,
+ "grad_norm": 16.252883911132812,
+ "learning_rate": 1.9377288957485687e-05,
+ "loss": 1.3693,
+ "step": 5121
+ },
+ {
+ "epoch": 13.956403269754768,
+ "grad_norm": 9.234550476074219,
+ "learning_rate": 1.9376982370586335e-05,
+ "loss": 0.9656,
+ "step": 5122
+ },
+ {
+ "epoch": 13.959128065395095,
+ "grad_norm": 9.315324783325195,
+ "learning_rate": 1.9376675710659344e-05,
+ "loss": 1.1426,
+ "step": 5123
+ },
+ {
+ "epoch": 13.961852861035423,
+ "grad_norm": 10.235756874084473,
+ "learning_rate": 1.9376368977707107e-05,
+ "loss": 1.2695,
+ "step": 5124
+ },
+ {
+ "epoch": 13.964577656675749,
+ "grad_norm": 7.971922397613525,
+ "learning_rate": 1.9376062171732005e-05,
+ "loss": 0.9756,
+ "step": 5125
+ },
+ {
+ "epoch": 13.967302452316076,
+ "grad_norm": 13.746105194091797,
+ "learning_rate": 1.937575529273644e-05,
+ "loss": 1.3748,
+ "step": 5126
+ },
+ {
+ "epoch": 13.970027247956404,
+ "grad_norm": 10.527334213256836,
+ "learning_rate": 1.937544834072279e-05,
+ "loss": 1.2439,
+ "step": 5127
+ },
+ {
+ "epoch": 13.97275204359673,
+ "grad_norm": 10.209712982177734,
+ "learning_rate": 1.937514131569345e-05,
+ "loss": 1.0908,
+ "step": 5128
+ },
+ {
+ "epoch": 13.975476839237057,
+ "grad_norm": 11.231954574584961,
+ "learning_rate": 1.9374834217650814e-05,
+ "loss": 1.3093,
+ "step": 5129
+ },
+ {
+ "epoch": 13.978201634877385,
+ "grad_norm": 8.496438026428223,
+ "learning_rate": 1.9374527046597267e-05,
+ "loss": 1.05,
+ "step": 5130
+ },
+ {
+ "epoch": 13.98092643051771,
+ "grad_norm": 9.906559944152832,
+ "learning_rate": 1.9374219802535207e-05,
+ "loss": 1.3284,
+ "step": 5131
+ },
+ {
+ "epoch": 13.983651226158038,
+ "grad_norm": 9.432076454162598,
+ "learning_rate": 1.9373912485467027e-05,
+ "loss": 1.2576,
+ "step": 5132
+ },
+ {
+ "epoch": 13.986376021798366,
+ "grad_norm": 9.473461151123047,
+ "learning_rate": 1.9373605095395114e-05,
+ "loss": 1.0918,
+ "step": 5133
+ },
+ {
+ "epoch": 13.989100817438691,
+ "grad_norm": 8.349873542785645,
+ "learning_rate": 1.937329763232187e-05,
+ "loss": 1.261,
+ "step": 5134
+ },
+ {
+ "epoch": 13.991825613079019,
+ "grad_norm": 8.589016914367676,
+ "learning_rate": 1.9372990096249684e-05,
+ "loss": 1.1616,
+ "step": 5135
+ },
+ {
+ "epoch": 13.994550408719347,
+ "grad_norm": 9.705038070678711,
+ "learning_rate": 1.9372682487180953e-05,
+ "loss": 1.1487,
+ "step": 5136
+ },
+ {
+ "epoch": 13.997275204359672,
+ "grad_norm": 9.136675834655762,
+ "learning_rate": 1.937237480511807e-05,
+ "loss": 1.0737,
+ "step": 5137
+ },
+ {
+ "epoch": 14.0,
+ "grad_norm": 8.555794715881348,
+ "learning_rate": 1.937206705006344e-05,
+ "loss": 1.0691,
+ "step": 5138
+ },
+ {
+ "epoch": 14.002724795640328,
+ "grad_norm": 10.775039672851562,
+ "learning_rate": 1.9371759222019446e-05,
+ "loss": 1.1906,
+ "step": 5139
+ },
+ {
+ "epoch": 14.005449591280653,
+ "grad_norm": 10.422962188720703,
+ "learning_rate": 1.93714513209885e-05,
+ "loss": 1.2634,
+ "step": 5140
+ },
+ {
+ "epoch": 14.008174386920981,
+ "grad_norm": 11.841338157653809,
+ "learning_rate": 1.937114334697299e-05,
+ "loss": 1.0758,
+ "step": 5141
+ },
+ {
+ "epoch": 14.010899182561309,
+ "grad_norm": 7.517180919647217,
+ "learning_rate": 1.9370835299975312e-05,
+ "loss": 0.9236,
+ "step": 5142
+ },
+ {
+ "epoch": 14.013623978201634,
+ "grad_norm": 9.28675365447998,
+ "learning_rate": 1.9370527179997877e-05,
+ "loss": 1.0269,
+ "step": 5143
+ },
+ {
+ "epoch": 14.016348773841962,
+ "grad_norm": 8.840786933898926,
+ "learning_rate": 1.937021898704307e-05,
+ "loss": 0.9282,
+ "step": 5144
+ },
+ {
+ "epoch": 14.01907356948229,
+ "grad_norm": 11.340668678283691,
+ "learning_rate": 1.9369910721113307e-05,
+ "loss": 1.0544,
+ "step": 5145
+ },
+ {
+ "epoch": 14.021798365122615,
+ "grad_norm": 8.026557922363281,
+ "learning_rate": 1.936960238221098e-05,
+ "loss": 1.0471,
+ "step": 5146
+ },
+ {
+ "epoch": 14.024523160762943,
+ "grad_norm": 9.061466217041016,
+ "learning_rate": 1.936929397033849e-05,
+ "loss": 1.064,
+ "step": 5147
+ },
+ {
+ "epoch": 14.02724795640327,
+ "grad_norm": 9.586761474609375,
+ "learning_rate": 1.936898548549824e-05,
+ "loss": 1.1797,
+ "step": 5148
+ },
+ {
+ "epoch": 14.029972752043596,
+ "grad_norm": 7.718034267425537,
+ "learning_rate": 1.9368676927692633e-05,
+ "loss": 0.8347,
+ "step": 5149
+ },
+ {
+ "epoch": 14.032697547683924,
+ "grad_norm": 8.380197525024414,
+ "learning_rate": 1.936836829692407e-05,
+ "loss": 0.9882,
+ "step": 5150
+ },
+ {
+ "epoch": 14.035422343324251,
+ "grad_norm": 10.051340103149414,
+ "learning_rate": 1.9368059593194957e-05,
+ "loss": 0.9783,
+ "step": 5151
+ },
+ {
+ "epoch": 14.038147138964577,
+ "grad_norm": 6.907543659210205,
+ "learning_rate": 1.9367750816507697e-05,
+ "loss": 0.9395,
+ "step": 5152
+ },
+ {
+ "epoch": 14.040871934604905,
+ "grad_norm": 8.483818054199219,
+ "learning_rate": 1.9367441966864696e-05,
+ "loss": 1.1664,
+ "step": 5153
+ },
+ {
+ "epoch": 14.043596730245232,
+ "grad_norm": 8.694487571716309,
+ "learning_rate": 1.9367133044268357e-05,
+ "loss": 1.072,
+ "step": 5154
+ },
+ {
+ "epoch": 14.046321525885558,
+ "grad_norm": 9.576281547546387,
+ "learning_rate": 1.9366824048721092e-05,
+ "loss": 0.9762,
+ "step": 5155
+ },
+ {
+ "epoch": 14.049046321525886,
+ "grad_norm": 8.219457626342773,
+ "learning_rate": 1.9366514980225297e-05,
+ "loss": 0.9261,
+ "step": 5156
+ },
+ {
+ "epoch": 14.051771117166213,
+ "grad_norm": 17.113773345947266,
+ "learning_rate": 1.9366205838783386e-05,
+ "loss": 0.8933,
+ "step": 5157
+ },
+ {
+ "epoch": 14.054495912806539,
+ "grad_norm": 9.046813011169434,
+ "learning_rate": 1.9365896624397767e-05,
+ "loss": 1.0859,
+ "step": 5158
+ },
+ {
+ "epoch": 14.057220708446867,
+ "grad_norm": 16.562040328979492,
+ "learning_rate": 1.9365587337070847e-05,
+ "loss": 1.1587,
+ "step": 5159
+ },
+ {
+ "epoch": 14.059945504087194,
+ "grad_norm": 11.743142127990723,
+ "learning_rate": 1.936527797680503e-05,
+ "loss": 1.0215,
+ "step": 5160
+ },
+ {
+ "epoch": 14.06267029972752,
+ "grad_norm": 13.082555770874023,
+ "learning_rate": 1.9364968543602734e-05,
+ "loss": 1.2086,
+ "step": 5161
+ },
+ {
+ "epoch": 14.065395095367847,
+ "grad_norm": 9.03809642791748,
+ "learning_rate": 1.9364659037466363e-05,
+ "loss": 1.127,
+ "step": 5162
+ },
+ {
+ "epoch": 14.068119891008175,
+ "grad_norm": 10.348206520080566,
+ "learning_rate": 1.936434945839833e-05,
+ "loss": 0.9873,
+ "step": 5163
+ },
+ {
+ "epoch": 14.0708446866485,
+ "grad_norm": 9.243765830993652,
+ "learning_rate": 1.9364039806401044e-05,
+ "loss": 1.0645,
+ "step": 5164
+ },
+ {
+ "epoch": 14.073569482288828,
+ "grad_norm": 8.912335395812988,
+ "learning_rate": 1.9363730081476917e-05,
+ "loss": 1.0516,
+ "step": 5165
+ },
+ {
+ "epoch": 14.076294277929156,
+ "grad_norm": 11.13410758972168,
+ "learning_rate": 1.9363420283628362e-05,
+ "loss": 1.0215,
+ "step": 5166
+ },
+ {
+ "epoch": 14.079019073569482,
+ "grad_norm": 19.718351364135742,
+ "learning_rate": 1.9363110412857792e-05,
+ "loss": 1.218,
+ "step": 5167
+ },
+ {
+ "epoch": 14.08174386920981,
+ "grad_norm": 8.111212730407715,
+ "learning_rate": 1.9362800469167616e-05,
+ "loss": 0.9565,
+ "step": 5168
+ },
+ {
+ "epoch": 14.084468664850137,
+ "grad_norm": 21.195087432861328,
+ "learning_rate": 1.9362490452560253e-05,
+ "loss": 1.0968,
+ "step": 5169
+ },
+ {
+ "epoch": 14.087193460490463,
+ "grad_norm": 12.929117202758789,
+ "learning_rate": 1.936218036303812e-05,
+ "loss": 1.1819,
+ "step": 5170
+ },
+ {
+ "epoch": 14.08991825613079,
+ "grad_norm": 12.823680877685547,
+ "learning_rate": 1.9361870200603622e-05,
+ "loss": 0.9674,
+ "step": 5171
+ },
+ {
+ "epoch": 14.092643051771118,
+ "grad_norm": 8.026865005493164,
+ "learning_rate": 1.9361559965259183e-05,
+ "loss": 1.0482,
+ "step": 5172
+ },
+ {
+ "epoch": 14.095367847411444,
+ "grad_norm": 14.824681282043457,
+ "learning_rate": 1.9361249657007212e-05,
+ "loss": 1.175,
+ "step": 5173
+ },
+ {
+ "epoch": 14.098092643051771,
+ "grad_norm": 9.480208396911621,
+ "learning_rate": 1.9360939275850136e-05,
+ "loss": 0.9825,
+ "step": 5174
+ },
+ {
+ "epoch": 14.100817438692099,
+ "grad_norm": 10.715375900268555,
+ "learning_rate": 1.9360628821790365e-05,
+ "loss": 0.98,
+ "step": 5175
+ },
+ {
+ "epoch": 14.103542234332425,
+ "grad_norm": 8.420612335205078,
+ "learning_rate": 1.9360318294830316e-05,
+ "loss": 1.0737,
+ "step": 5176
+ },
+ {
+ "epoch": 14.106267029972752,
+ "grad_norm": 55.007171630859375,
+ "learning_rate": 1.936000769497241e-05,
+ "loss": 1.03,
+ "step": 5177
+ },
+ {
+ "epoch": 14.10899182561308,
+ "grad_norm": 10.606861114501953,
+ "learning_rate": 1.9359697022219065e-05,
+ "loss": 1.0549,
+ "step": 5178
+ },
+ {
+ "epoch": 14.111716621253406,
+ "grad_norm": 11.335735321044922,
+ "learning_rate": 1.93593862765727e-05,
+ "loss": 0.9281,
+ "step": 5179
+ },
+ {
+ "epoch": 14.114441416893733,
+ "grad_norm": 9.67910099029541,
+ "learning_rate": 1.9359075458035737e-05,
+ "loss": 1.0305,
+ "step": 5180
+ },
+ {
+ "epoch": 14.11716621253406,
+ "grad_norm": 11.689078330993652,
+ "learning_rate": 1.9358764566610598e-05,
+ "loss": 1.166,
+ "step": 5181
+ },
+ {
+ "epoch": 14.119891008174386,
+ "grad_norm": 9.712400436401367,
+ "learning_rate": 1.9358453602299697e-05,
+ "loss": 1.0057,
+ "step": 5182
+ },
+ {
+ "epoch": 14.122615803814714,
+ "grad_norm": 8.734127044677734,
+ "learning_rate": 1.9358142565105463e-05,
+ "loss": 1.1764,
+ "step": 5183
+ },
+ {
+ "epoch": 14.125340599455042,
+ "grad_norm": 11.82819938659668,
+ "learning_rate": 1.9357831455030315e-05,
+ "loss": 1.1128,
+ "step": 5184
+ },
+ {
+ "epoch": 14.128065395095367,
+ "grad_norm": 9.787619590759277,
+ "learning_rate": 1.9357520272076676e-05,
+ "loss": 1.0128,
+ "step": 5185
+ },
+ {
+ "epoch": 14.130790190735695,
+ "grad_norm": 10.834694862365723,
+ "learning_rate": 1.9357209016246972e-05,
+ "loss": 1.0073,
+ "step": 5186
+ },
+ {
+ "epoch": 14.133514986376023,
+ "grad_norm": 11.580232620239258,
+ "learning_rate": 1.9356897687543626e-05,
+ "loss": 1.1733,
+ "step": 5187
+ },
+ {
+ "epoch": 14.136239782016348,
+ "grad_norm": 10.885783195495605,
+ "learning_rate": 1.9356586285969062e-05,
+ "loss": 1.0463,
+ "step": 5188
+ },
+ {
+ "epoch": 14.138964577656676,
+ "grad_norm": 11.105716705322266,
+ "learning_rate": 1.9356274811525707e-05,
+ "loss": 1.0547,
+ "step": 5189
+ },
+ {
+ "epoch": 14.141689373297003,
+ "grad_norm": 10.251579284667969,
+ "learning_rate": 1.935596326421598e-05,
+ "loss": 1.0901,
+ "step": 5190
+ },
+ {
+ "epoch": 14.14441416893733,
+ "grad_norm": 9.170507431030273,
+ "learning_rate": 1.9355651644042312e-05,
+ "loss": 1.2407,
+ "step": 5191
+ },
+ {
+ "epoch": 14.147138964577657,
+ "grad_norm": 12.432571411132812,
+ "learning_rate": 1.9355339951007133e-05,
+ "loss": 1.2239,
+ "step": 5192
+ },
+ {
+ "epoch": 14.149863760217984,
+ "grad_norm": 9.303281784057617,
+ "learning_rate": 1.935502818511287e-05,
+ "loss": 1.1278,
+ "step": 5193
+ },
+ {
+ "epoch": 14.15258855585831,
+ "grad_norm": 9.055807113647461,
+ "learning_rate": 1.9354716346361947e-05,
+ "loss": 0.8248,
+ "step": 5194
+ },
+ {
+ "epoch": 14.155313351498638,
+ "grad_norm": 9.458588600158691,
+ "learning_rate": 1.935440443475679e-05,
+ "loss": 1.0507,
+ "step": 5195
+ },
+ {
+ "epoch": 14.158038147138965,
+ "grad_norm": 24.18316650390625,
+ "learning_rate": 1.9354092450299835e-05,
+ "loss": 1.2896,
+ "step": 5196
+ },
+ {
+ "epoch": 14.160762942779291,
+ "grad_norm": 8.916409492492676,
+ "learning_rate": 1.9353780392993512e-05,
+ "loss": 1.0306,
+ "step": 5197
+ },
+ {
+ "epoch": 14.163487738419619,
+ "grad_norm": 8.950216293334961,
+ "learning_rate": 1.9353468262840242e-05,
+ "loss": 1.0764,
+ "step": 5198
+ },
+ {
+ "epoch": 14.166212534059946,
+ "grad_norm": 10.580193519592285,
+ "learning_rate": 1.9353156059842467e-05,
+ "loss": 1.1387,
+ "step": 5199
+ },
+ {
+ "epoch": 14.168937329700272,
+ "grad_norm": 10.426873207092285,
+ "learning_rate": 1.9352843784002613e-05,
+ "loss": 0.9557,
+ "step": 5200
+ },
+ {
+ "epoch": 14.1716621253406,
+ "grad_norm": 14.51240348815918,
+ "learning_rate": 1.9352531435323113e-05,
+ "loss": 0.9541,
+ "step": 5201
+ },
+ {
+ "epoch": 14.174386920980927,
+ "grad_norm": 9.402112007141113,
+ "learning_rate": 1.9352219013806396e-05,
+ "loss": 1.006,
+ "step": 5202
+ },
+ {
+ "epoch": 14.177111716621253,
+ "grad_norm": 23.714242935180664,
+ "learning_rate": 1.93519065194549e-05,
+ "loss": 1.0583,
+ "step": 5203
+ },
+ {
+ "epoch": 14.17983651226158,
+ "grad_norm": 10.282632827758789,
+ "learning_rate": 1.935159395227106e-05,
+ "loss": 1.0785,
+ "step": 5204
+ },
+ {
+ "epoch": 14.182561307901908,
+ "grad_norm": 13.316774368286133,
+ "learning_rate": 1.9351281312257304e-05,
+ "loss": 1.032,
+ "step": 5205
+ },
+ {
+ "epoch": 14.185286103542234,
+ "grad_norm": 11.040825843811035,
+ "learning_rate": 1.9350968599416073e-05,
+ "loss": 1.3308,
+ "step": 5206
+ },
+ {
+ "epoch": 14.188010899182562,
+ "grad_norm": 9.174239158630371,
+ "learning_rate": 1.9350655813749795e-05,
+ "loss": 1.0178,
+ "step": 5207
+ },
+ {
+ "epoch": 14.190735694822889,
+ "grad_norm": 10.617894172668457,
+ "learning_rate": 1.9350342955260913e-05,
+ "loss": 0.8774,
+ "step": 5208
+ },
+ {
+ "epoch": 14.193460490463215,
+ "grad_norm": 7.703207015991211,
+ "learning_rate": 1.935003002395186e-05,
+ "loss": 1.0482,
+ "step": 5209
+ },
+ {
+ "epoch": 14.196185286103542,
+ "grad_norm": 9.032089233398438,
+ "learning_rate": 1.9349717019825076e-05,
+ "loss": 1.175,
+ "step": 5210
+ },
+ {
+ "epoch": 14.19891008174387,
+ "grad_norm": 10.903448104858398,
+ "learning_rate": 1.9349403942882995e-05,
+ "loss": 1.0756,
+ "step": 5211
+ },
+ {
+ "epoch": 14.201634877384196,
+ "grad_norm": 10.451948165893555,
+ "learning_rate": 1.934909079312806e-05,
+ "loss": 1.1343,
+ "step": 5212
+ },
+ {
+ "epoch": 14.204359673024523,
+ "grad_norm": 8.245926856994629,
+ "learning_rate": 1.9348777570562705e-05,
+ "loss": 1.23,
+ "step": 5213
+ },
+ {
+ "epoch": 14.207084468664851,
+ "grad_norm": 9.887392044067383,
+ "learning_rate": 1.934846427518937e-05,
+ "loss": 1.0542,
+ "step": 5214
+ },
+ {
+ "epoch": 14.209809264305177,
+ "grad_norm": 10.74023151397705,
+ "learning_rate": 1.9348150907010495e-05,
+ "loss": 1.0374,
+ "step": 5215
+ },
+ {
+ "epoch": 14.212534059945504,
+ "grad_norm": 12.305845260620117,
+ "learning_rate": 1.9347837466028524e-05,
+ "loss": 1.178,
+ "step": 5216
+ },
+ {
+ "epoch": 14.215258855585832,
+ "grad_norm": 9.770783424377441,
+ "learning_rate": 1.9347523952245898e-05,
+ "loss": 1.1133,
+ "step": 5217
+ },
+ {
+ "epoch": 14.217983651226158,
+ "grad_norm": 9.333532333374023,
+ "learning_rate": 1.9347210365665052e-05,
+ "loss": 0.9165,
+ "step": 5218
+ },
+ {
+ "epoch": 14.220708446866485,
+ "grad_norm": 9.938899040222168,
+ "learning_rate": 1.9346896706288433e-05,
+ "loss": 1.1858,
+ "step": 5219
+ },
+ {
+ "epoch": 14.223433242506813,
+ "grad_norm": 10.495904922485352,
+ "learning_rate": 1.9346582974118484e-05,
+ "loss": 1.28,
+ "step": 5220
+ },
+ {
+ "epoch": 14.226158038147139,
+ "grad_norm": 8.536820411682129,
+ "learning_rate": 1.934626916915765e-05,
+ "loss": 1.0775,
+ "step": 5221
+ },
+ {
+ "epoch": 14.228882833787466,
+ "grad_norm": 8.524038314819336,
+ "learning_rate": 1.9345955291408368e-05,
+ "loss": 1.0872,
+ "step": 5222
+ },
+ {
+ "epoch": 14.231607629427794,
+ "grad_norm": 7.942371845245361,
+ "learning_rate": 1.934564134087309e-05,
+ "loss": 1.166,
+ "step": 5223
+ },
+ {
+ "epoch": 14.23433242506812,
+ "grad_norm": 11.302346229553223,
+ "learning_rate": 1.9345327317554258e-05,
+ "loss": 0.9764,
+ "step": 5224
+ },
+ {
+ "epoch": 14.237057220708447,
+ "grad_norm": 7.489410400390625,
+ "learning_rate": 1.934501322145432e-05,
+ "loss": 0.9688,
+ "step": 5225
+ },
+ {
+ "epoch": 14.239782016348773,
+ "grad_norm": 9.616244316101074,
+ "learning_rate": 1.9344699052575713e-05,
+ "loss": 1.0598,
+ "step": 5226
+ },
+ {
+ "epoch": 14.2425068119891,
+ "grad_norm": 7.459101676940918,
+ "learning_rate": 1.9344384810920894e-05,
+ "loss": 0.9845,
+ "step": 5227
+ },
+ {
+ "epoch": 14.245231607629428,
+ "grad_norm": 7.418712139129639,
+ "learning_rate": 1.9344070496492307e-05,
+ "loss": 1.0337,
+ "step": 5228
+ },
+ {
+ "epoch": 14.247956403269754,
+ "grad_norm": 12.477212905883789,
+ "learning_rate": 1.93437561092924e-05,
+ "loss": 0.9674,
+ "step": 5229
+ },
+ {
+ "epoch": 14.250681198910081,
+ "grad_norm": 10.46294116973877,
+ "learning_rate": 1.9343441649323623e-05,
+ "loss": 1.1455,
+ "step": 5230
+ },
+ {
+ "epoch": 14.253405994550409,
+ "grad_norm": 11.074926376342773,
+ "learning_rate": 1.9343127116588422e-05,
+ "loss": 1.0607,
+ "step": 5231
+ },
+ {
+ "epoch": 14.256130790190735,
+ "grad_norm": 12.724575996398926,
+ "learning_rate": 1.9342812511089245e-05,
+ "loss": 1.0946,
+ "step": 5232
+ },
+ {
+ "epoch": 14.258855585831062,
+ "grad_norm": 11.567410469055176,
+ "learning_rate": 1.9342497832828545e-05,
+ "loss": 1.2377,
+ "step": 5233
+ },
+ {
+ "epoch": 14.26158038147139,
+ "grad_norm": 10.05311107635498,
+ "learning_rate": 1.9342183081808776e-05,
+ "loss": 0.9814,
+ "step": 5234
+ },
+ {
+ "epoch": 14.264305177111716,
+ "grad_norm": 12.47072696685791,
+ "learning_rate": 1.9341868258032383e-05,
+ "loss": 1.0944,
+ "step": 5235
+ },
+ {
+ "epoch": 14.267029972752043,
+ "grad_norm": 9.628125190734863,
+ "learning_rate": 1.9341553361501823e-05,
+ "loss": 0.9958,
+ "step": 5236
+ },
+ {
+ "epoch": 14.269754768392371,
+ "grad_norm": 8.3932523727417,
+ "learning_rate": 1.9341238392219546e-05,
+ "loss": 0.9589,
+ "step": 5237
+ },
+ {
+ "epoch": 14.272479564032697,
+ "grad_norm": 14.278056144714355,
+ "learning_rate": 1.9340923350188004e-05,
+ "loss": 1.0369,
+ "step": 5238
+ },
+ {
+ "epoch": 14.275204359673024,
+ "grad_norm": 13.667935371398926,
+ "learning_rate": 1.934060823540965e-05,
+ "loss": 1.0345,
+ "step": 5239
+ },
+ {
+ "epoch": 14.277929155313352,
+ "grad_norm": 9.29685115814209,
+ "learning_rate": 1.9340293047886943e-05,
+ "loss": 1.1643,
+ "step": 5240
+ },
+ {
+ "epoch": 14.280653950953678,
+ "grad_norm": 8.895401000976562,
+ "learning_rate": 1.9339977787622332e-05,
+ "loss": 1.0632,
+ "step": 5241
+ },
+ {
+ "epoch": 14.283378746594005,
+ "grad_norm": 8.890891075134277,
+ "learning_rate": 1.9339662454618277e-05,
+ "loss": 1.0703,
+ "step": 5242
+ },
+ {
+ "epoch": 14.286103542234333,
+ "grad_norm": 8.847053527832031,
+ "learning_rate": 1.9339347048877228e-05,
+ "loss": 0.9144,
+ "step": 5243
+ },
+ {
+ "epoch": 14.288828337874659,
+ "grad_norm": 9.546551704406738,
+ "learning_rate": 1.9339031570401647e-05,
+ "loss": 1.175,
+ "step": 5244
+ },
+ {
+ "epoch": 14.291553133514986,
+ "grad_norm": 10.097752571105957,
+ "learning_rate": 1.933871601919399e-05,
+ "loss": 1.637,
+ "step": 5245
+ },
+ {
+ "epoch": 14.294277929155314,
+ "grad_norm": 10.346940994262695,
+ "learning_rate": 1.9338400395256708e-05,
+ "loss": 1.2756,
+ "step": 5246
+ },
+ {
+ "epoch": 14.29700272479564,
+ "grad_norm": 12.138782501220703,
+ "learning_rate": 1.9338084698592266e-05,
+ "loss": 1.1531,
+ "step": 5247
+ },
+ {
+ "epoch": 14.299727520435967,
+ "grad_norm": 8.375985145568848,
+ "learning_rate": 1.9337768929203124e-05,
+ "loss": 0.8945,
+ "step": 5248
+ },
+ {
+ "epoch": 14.302452316076295,
+ "grad_norm": 13.717570304870605,
+ "learning_rate": 1.933745308709174e-05,
+ "loss": 0.981,
+ "step": 5249
+ },
+ {
+ "epoch": 14.30517711171662,
+ "grad_norm": 8.631799697875977,
+ "learning_rate": 1.9337137172260568e-05,
+ "loss": 1.1099,
+ "step": 5250
+ },
+ {
+ "epoch": 14.307901907356948,
+ "grad_norm": 7.853982448577881,
+ "learning_rate": 1.933682118471207e-05,
+ "loss": 1.0149,
+ "step": 5251
+ },
+ {
+ "epoch": 14.310626702997276,
+ "grad_norm": 10.202895164489746,
+ "learning_rate": 1.9336505124448714e-05,
+ "loss": 1.0979,
+ "step": 5252
+ },
+ {
+ "epoch": 14.313351498637601,
+ "grad_norm": 9.769791603088379,
+ "learning_rate": 1.9336188991472956e-05,
+ "loss": 1.1184,
+ "step": 5253
+ },
+ {
+ "epoch": 14.316076294277929,
+ "grad_norm": 8.059771537780762,
+ "learning_rate": 1.9335872785787257e-05,
+ "loss": 1.0947,
+ "step": 5254
+ },
+ {
+ "epoch": 14.318801089918257,
+ "grad_norm": 68.8738021850586,
+ "learning_rate": 1.933555650739408e-05,
+ "loss": 1.2471,
+ "step": 5255
+ },
+ {
+ "epoch": 14.321525885558582,
+ "grad_norm": 9.558309555053711,
+ "learning_rate": 1.933524015629589e-05,
+ "loss": 1.2317,
+ "step": 5256
+ },
+ {
+ "epoch": 14.32425068119891,
+ "grad_norm": 8.446417808532715,
+ "learning_rate": 1.9334923732495153e-05,
+ "loss": 1.1877,
+ "step": 5257
+ },
+ {
+ "epoch": 14.326975476839237,
+ "grad_norm": 8.942597389221191,
+ "learning_rate": 1.9334607235994328e-05,
+ "loss": 1.1284,
+ "step": 5258
+ },
+ {
+ "epoch": 14.329700272479563,
+ "grad_norm": 9.941106796264648,
+ "learning_rate": 1.933429066679588e-05,
+ "loss": 1.0425,
+ "step": 5259
+ },
+ {
+ "epoch": 14.33242506811989,
+ "grad_norm": 8.345467567443848,
+ "learning_rate": 1.9333974024902278e-05,
+ "loss": 1.0031,
+ "step": 5260
+ },
+ {
+ "epoch": 14.335149863760218,
+ "grad_norm": 8.661430358886719,
+ "learning_rate": 1.933365731031599e-05,
+ "loss": 1.1255,
+ "step": 5261
+ },
+ {
+ "epoch": 14.337874659400544,
+ "grad_norm": 8.243463516235352,
+ "learning_rate": 1.9333340523039477e-05,
+ "loss": 1.0671,
+ "step": 5262
+ },
+ {
+ "epoch": 14.340599455040872,
+ "grad_norm": 9.933423042297363,
+ "learning_rate": 1.9333023663075208e-05,
+ "loss": 0.934,
+ "step": 5263
+ },
+ {
+ "epoch": 14.3433242506812,
+ "grad_norm": 8.510039329528809,
+ "learning_rate": 1.9332706730425654e-05,
+ "loss": 1.0812,
+ "step": 5264
+ },
+ {
+ "epoch": 14.346049046321525,
+ "grad_norm": 9.866889953613281,
+ "learning_rate": 1.9332389725093276e-05,
+ "loss": 1.1134,
+ "step": 5265
+ },
+ {
+ "epoch": 14.348773841961853,
+ "grad_norm": 8.618088722229004,
+ "learning_rate": 1.9332072647080548e-05,
+ "loss": 0.9312,
+ "step": 5266
+ },
+ {
+ "epoch": 14.35149863760218,
+ "grad_norm": 9.735777854919434,
+ "learning_rate": 1.933175549638994e-05,
+ "loss": 0.9116,
+ "step": 5267
+ },
+ {
+ "epoch": 14.354223433242506,
+ "grad_norm": 13.522176742553711,
+ "learning_rate": 1.933143827302392e-05,
+ "loss": 0.99,
+ "step": 5268
+ },
+ {
+ "epoch": 14.356948228882834,
+ "grad_norm": 12.312538146972656,
+ "learning_rate": 1.9331120976984962e-05,
+ "loss": 0.9844,
+ "step": 5269
+ },
+ {
+ "epoch": 14.359673024523161,
+ "grad_norm": 9.45966625213623,
+ "learning_rate": 1.933080360827553e-05,
+ "loss": 1.1396,
+ "step": 5270
+ },
+ {
+ "epoch": 14.362397820163487,
+ "grad_norm": 9.67317008972168,
+ "learning_rate": 1.93304861668981e-05,
+ "loss": 1.0793,
+ "step": 5271
+ },
+ {
+ "epoch": 14.365122615803815,
+ "grad_norm": 11.211816787719727,
+ "learning_rate": 1.933016865285515e-05,
+ "loss": 1.2239,
+ "step": 5272
+ },
+ {
+ "epoch": 14.367847411444142,
+ "grad_norm": 9.201240539550781,
+ "learning_rate": 1.9329851066149138e-05,
+ "loss": 1.0579,
+ "step": 5273
+ },
+ {
+ "epoch": 14.370572207084468,
+ "grad_norm": 12.017439842224121,
+ "learning_rate": 1.932953340678255e-05,
+ "loss": 1.2026,
+ "step": 5274
+ },
+ {
+ "epoch": 14.373297002724795,
+ "grad_norm": 9.993738174438477,
+ "learning_rate": 1.9329215674757856e-05,
+ "loss": 0.9805,
+ "step": 5275
+ },
+ {
+ "epoch": 14.376021798365123,
+ "grad_norm": 8.909194946289062,
+ "learning_rate": 1.932889787007753e-05,
+ "loss": 1.0084,
+ "step": 5276
+ },
+ {
+ "epoch": 14.378746594005449,
+ "grad_norm": 19.06960105895996,
+ "learning_rate": 1.932857999274405e-05,
+ "loss": 1.1138,
+ "step": 5277
+ },
+ {
+ "epoch": 14.381471389645776,
+ "grad_norm": 10.438451766967773,
+ "learning_rate": 1.932826204275989e-05,
+ "loss": 1.0244,
+ "step": 5278
+ },
+ {
+ "epoch": 14.384196185286104,
+ "grad_norm": 11.111006736755371,
+ "learning_rate": 1.932794402012752e-05,
+ "loss": 1.0233,
+ "step": 5279
+ },
+ {
+ "epoch": 14.38692098092643,
+ "grad_norm": 11.95139217376709,
+ "learning_rate": 1.932762592484943e-05,
+ "loss": 1.3044,
+ "step": 5280
+ },
+ {
+ "epoch": 14.389645776566757,
+ "grad_norm": 12.746063232421875,
+ "learning_rate": 1.9327307756928082e-05,
+ "loss": 1.1691,
+ "step": 5281
+ },
+ {
+ "epoch": 14.392370572207085,
+ "grad_norm": 13.35183334350586,
+ "learning_rate": 1.9326989516365965e-05,
+ "loss": 1.2515,
+ "step": 5282
+ },
+ {
+ "epoch": 14.39509536784741,
+ "grad_norm": 7.97482442855835,
+ "learning_rate": 1.9326671203165555e-05,
+ "loss": 0.9849,
+ "step": 5283
+ },
+ {
+ "epoch": 14.397820163487738,
+ "grad_norm": 11.38698673248291,
+ "learning_rate": 1.9326352817329325e-05,
+ "loss": 1.2874,
+ "step": 5284
+ },
+ {
+ "epoch": 14.400544959128066,
+ "grad_norm": 8.816800117492676,
+ "learning_rate": 1.9326034358859763e-05,
+ "loss": 1.072,
+ "step": 5285
+ },
+ {
+ "epoch": 14.403269754768392,
+ "grad_norm": 9.06088638305664,
+ "learning_rate": 1.9325715827759347e-05,
+ "loss": 1.157,
+ "step": 5286
+ },
+ {
+ "epoch": 14.40599455040872,
+ "grad_norm": 12.826264381408691,
+ "learning_rate": 1.9325397224030556e-05,
+ "loss": 0.9587,
+ "step": 5287
+ },
+ {
+ "epoch": 14.408719346049047,
+ "grad_norm": 8.464082717895508,
+ "learning_rate": 1.932507854767587e-05,
+ "loss": 1.0815,
+ "step": 5288
+ },
+ {
+ "epoch": 14.411444141689373,
+ "grad_norm": 11.152374267578125,
+ "learning_rate": 1.932475979869777e-05,
+ "loss": 1.0793,
+ "step": 5289
+ },
+ {
+ "epoch": 14.4141689373297,
+ "grad_norm": 9.872017860412598,
+ "learning_rate": 1.9324440977098743e-05,
+ "loss": 1.2461,
+ "step": 5290
+ },
+ {
+ "epoch": 14.416893732970028,
+ "grad_norm": 8.444131851196289,
+ "learning_rate": 1.9324122082881273e-05,
+ "loss": 1.0906,
+ "step": 5291
+ },
+ {
+ "epoch": 14.419618528610354,
+ "grad_norm": 13.058818817138672,
+ "learning_rate": 1.9323803116047835e-05,
+ "loss": 1.0557,
+ "step": 5292
+ },
+ {
+ "epoch": 14.422343324250681,
+ "grad_norm": 9.907197952270508,
+ "learning_rate": 1.932348407660092e-05,
+ "loss": 1.2539,
+ "step": 5293
+ },
+ {
+ "epoch": 14.425068119891009,
+ "grad_norm": 8.678665161132812,
+ "learning_rate": 1.932316496454301e-05,
+ "loss": 0.843,
+ "step": 5294
+ },
+ {
+ "epoch": 14.427792915531334,
+ "grad_norm": 10.322772026062012,
+ "learning_rate": 1.9322845779876594e-05,
+ "loss": 1.1262,
+ "step": 5295
+ },
+ {
+ "epoch": 14.430517711171662,
+ "grad_norm": 24.07590103149414,
+ "learning_rate": 1.9322526522604158e-05,
+ "loss": 1.002,
+ "step": 5296
+ },
+ {
+ "epoch": 14.43324250681199,
+ "grad_norm": 11.389932632446289,
+ "learning_rate": 1.932220719272818e-05,
+ "loss": 1.0343,
+ "step": 5297
+ },
+ {
+ "epoch": 14.435967302452315,
+ "grad_norm": 9.001762390136719,
+ "learning_rate": 1.932188779025115e-05,
+ "loss": 1.0803,
+ "step": 5298
+ },
+ {
+ "epoch": 14.438692098092643,
+ "grad_norm": 10.911750793457031,
+ "learning_rate": 1.9321568315175566e-05,
+ "loss": 1.0684,
+ "step": 5299
+ },
+ {
+ "epoch": 14.44141689373297,
+ "grad_norm": 9.265901565551758,
+ "learning_rate": 1.93212487675039e-05,
+ "loss": 1.0171,
+ "step": 5300
+ },
+ {
+ "epoch": 14.444141689373296,
+ "grad_norm": 9.530998229980469,
+ "learning_rate": 1.9320929147238656e-05,
+ "loss": 0.9602,
+ "step": 5301
+ },
+ {
+ "epoch": 14.446866485013624,
+ "grad_norm": 10.691299438476562,
+ "learning_rate": 1.9320609454382314e-05,
+ "loss": 0.9978,
+ "step": 5302
+ },
+ {
+ "epoch": 14.449591280653951,
+ "grad_norm": 11.737393379211426,
+ "learning_rate": 1.932028968893736e-05,
+ "loss": 1.0564,
+ "step": 5303
+ },
+ {
+ "epoch": 14.452316076294277,
+ "grad_norm": 13.94564151763916,
+ "learning_rate": 1.9319969850906293e-05,
+ "loss": 1.05,
+ "step": 5304
+ },
+ {
+ "epoch": 14.455040871934605,
+ "grad_norm": 8.74657154083252,
+ "learning_rate": 1.9319649940291605e-05,
+ "loss": 1.0525,
+ "step": 5305
+ },
+ {
+ "epoch": 14.457765667574932,
+ "grad_norm": 10.81070327758789,
+ "learning_rate": 1.9319329957095777e-05,
+ "loss": 1.4153,
+ "step": 5306
+ },
+ {
+ "epoch": 14.460490463215258,
+ "grad_norm": 9.045839309692383,
+ "learning_rate": 1.9319009901321312e-05,
+ "loss": 0.9253,
+ "step": 5307
+ },
+ {
+ "epoch": 14.463215258855586,
+ "grad_norm": 20.913326263427734,
+ "learning_rate": 1.9318689772970695e-05,
+ "loss": 1.1169,
+ "step": 5308
+ },
+ {
+ "epoch": 14.465940054495913,
+ "grad_norm": 10.087102890014648,
+ "learning_rate": 1.9318369572046425e-05,
+ "loss": 1.0671,
+ "step": 5309
+ },
+ {
+ "epoch": 14.46866485013624,
+ "grad_norm": 8.336085319519043,
+ "learning_rate": 1.931804929855099e-05,
+ "loss": 1.223,
+ "step": 5310
+ },
+ {
+ "epoch": 14.471389645776567,
+ "grad_norm": 11.849065780639648,
+ "learning_rate": 1.931772895248689e-05,
+ "loss": 1.0393,
+ "step": 5311
+ },
+ {
+ "epoch": 14.474114441416894,
+ "grad_norm": 8.905378341674805,
+ "learning_rate": 1.931740853385661e-05,
+ "loss": 1.0046,
+ "step": 5312
+ },
+ {
+ "epoch": 14.47683923705722,
+ "grad_norm": 8.513957023620605,
+ "learning_rate": 1.9317088042662656e-05,
+ "loss": 1.1963,
+ "step": 5313
+ },
+ {
+ "epoch": 14.479564032697548,
+ "grad_norm": 9.680682182312012,
+ "learning_rate": 1.931676747890752e-05,
+ "loss": 0.9915,
+ "step": 5314
+ },
+ {
+ "epoch": 14.482288828337875,
+ "grad_norm": 9.793913841247559,
+ "learning_rate": 1.93164468425937e-05,
+ "loss": 1.2289,
+ "step": 5315
+ },
+ {
+ "epoch": 14.485013623978201,
+ "grad_norm": 8.151663780212402,
+ "learning_rate": 1.9316126133723694e-05,
+ "loss": 0.994,
+ "step": 5316
+ },
+ {
+ "epoch": 14.487738419618529,
+ "grad_norm": 8.099178314208984,
+ "learning_rate": 1.9315805352299996e-05,
+ "loss": 0.8774,
+ "step": 5317
+ },
+ {
+ "epoch": 14.490463215258856,
+ "grad_norm": 14.407559394836426,
+ "learning_rate": 1.9315484498325103e-05,
+ "loss": 1.0383,
+ "step": 5318
+ },
+ {
+ "epoch": 14.493188010899182,
+ "grad_norm": 11.349617004394531,
+ "learning_rate": 1.9315163571801517e-05,
+ "loss": 1.0759,
+ "step": 5319
+ },
+ {
+ "epoch": 14.49591280653951,
+ "grad_norm": 38.68876647949219,
+ "learning_rate": 1.9314842572731737e-05,
+ "loss": 1.156,
+ "step": 5320
+ },
+ {
+ "epoch": 14.498637602179837,
+ "grad_norm": 8.868889808654785,
+ "learning_rate": 1.9314521501118265e-05,
+ "loss": 1.0035,
+ "step": 5321
+ },
+ {
+ "epoch": 14.501362397820163,
+ "grad_norm": 8.173551559448242,
+ "learning_rate": 1.93142003569636e-05,
+ "loss": 1.1855,
+ "step": 5322
+ },
+ {
+ "epoch": 14.50408719346049,
+ "grad_norm": 8.55869197845459,
+ "learning_rate": 1.931387914027024e-05,
+ "loss": 1.0449,
+ "step": 5323
+ },
+ {
+ "epoch": 14.506811989100818,
+ "grad_norm": 12.509915351867676,
+ "learning_rate": 1.931355785104069e-05,
+ "loss": 1.0078,
+ "step": 5324
+ },
+ {
+ "epoch": 14.509536784741144,
+ "grad_norm": 10.232088088989258,
+ "learning_rate": 1.931323648927745e-05,
+ "loss": 1.0969,
+ "step": 5325
+ },
+ {
+ "epoch": 14.512261580381471,
+ "grad_norm": 10.29968547821045,
+ "learning_rate": 1.9312915054983023e-05,
+ "loss": 1.1525,
+ "step": 5326
+ },
+ {
+ "epoch": 14.514986376021799,
+ "grad_norm": 44.228973388671875,
+ "learning_rate": 1.9312593548159916e-05,
+ "loss": 1.2103,
+ "step": 5327
+ },
+ {
+ "epoch": 14.517711171662125,
+ "grad_norm": 20.510353088378906,
+ "learning_rate": 1.931227196881063e-05,
+ "loss": 1.0187,
+ "step": 5328
+ },
+ {
+ "epoch": 14.520435967302452,
+ "grad_norm": 12.056849479675293,
+ "learning_rate": 1.9311950316937666e-05,
+ "loss": 0.8915,
+ "step": 5329
+ },
+ {
+ "epoch": 14.52316076294278,
+ "grad_norm": 12.606382369995117,
+ "learning_rate": 1.9311628592543538e-05,
+ "loss": 1.1522,
+ "step": 5330
+ },
+ {
+ "epoch": 14.525885558583106,
+ "grad_norm": 14.394980430603027,
+ "learning_rate": 1.9311306795630745e-05,
+ "loss": 1.1936,
+ "step": 5331
+ },
+ {
+ "epoch": 14.528610354223433,
+ "grad_norm": 11.048859596252441,
+ "learning_rate": 1.931098492620179e-05,
+ "loss": 1.037,
+ "step": 5332
+ },
+ {
+ "epoch": 14.53133514986376,
+ "grad_norm": 14.999587059020996,
+ "learning_rate": 1.9310662984259187e-05,
+ "loss": 1.1234,
+ "step": 5333
+ },
+ {
+ "epoch": 14.534059945504087,
+ "grad_norm": 10.57614517211914,
+ "learning_rate": 1.931034096980544e-05,
+ "loss": 0.8899,
+ "step": 5334
+ },
+ {
+ "epoch": 14.536784741144414,
+ "grad_norm": 10.451554298400879,
+ "learning_rate": 1.931001888284306e-05,
+ "loss": 0.8661,
+ "step": 5335
+ },
+ {
+ "epoch": 14.539509536784742,
+ "grad_norm": 12.769274711608887,
+ "learning_rate": 1.9309696723374548e-05,
+ "loss": 1.1665,
+ "step": 5336
+ },
+ {
+ "epoch": 14.542234332425068,
+ "grad_norm": 13.212369918823242,
+ "learning_rate": 1.930937449140242e-05,
+ "loss": 1.1079,
+ "step": 5337
+ },
+ {
+ "epoch": 14.544959128065395,
+ "grad_norm": 16.784992218017578,
+ "learning_rate": 1.9309052186929184e-05,
+ "loss": 1.1338,
+ "step": 5338
+ },
+ {
+ "epoch": 14.547683923705723,
+ "grad_norm": 10.934957504272461,
+ "learning_rate": 1.930872980995735e-05,
+ "loss": 1.0775,
+ "step": 5339
+ },
+ {
+ "epoch": 14.550408719346049,
+ "grad_norm": 108.7918701171875,
+ "learning_rate": 1.930840736048942e-05,
+ "loss": 0.9453,
+ "step": 5340
+ },
+ {
+ "epoch": 14.553133514986376,
+ "grad_norm": 10.363018989562988,
+ "learning_rate": 1.9308084838527922e-05,
+ "loss": 1.1213,
+ "step": 5341
+ },
+ {
+ "epoch": 14.555858310626704,
+ "grad_norm": 10.330005645751953,
+ "learning_rate": 1.9307762244075357e-05,
+ "loss": 1.2231,
+ "step": 5342
+ },
+ {
+ "epoch": 14.55858310626703,
+ "grad_norm": 12.0515718460083,
+ "learning_rate": 1.9307439577134238e-05,
+ "loss": 1.2269,
+ "step": 5343
+ },
+ {
+ "epoch": 14.561307901907357,
+ "grad_norm": 9.661890983581543,
+ "learning_rate": 1.9307116837707078e-05,
+ "loss": 1.3032,
+ "step": 5344
+ },
+ {
+ "epoch": 14.564032697547685,
+ "grad_norm": 10.54574966430664,
+ "learning_rate": 1.9306794025796395e-05,
+ "loss": 1.1172,
+ "step": 5345
+ },
+ {
+ "epoch": 14.56675749318801,
+ "grad_norm": 8.823716163635254,
+ "learning_rate": 1.9306471141404696e-05,
+ "loss": 1.0186,
+ "step": 5346
+ },
+ {
+ "epoch": 14.569482288828338,
+ "grad_norm": 9.0007905960083,
+ "learning_rate": 1.93061481845345e-05,
+ "loss": 1.1873,
+ "step": 5347
+ },
+ {
+ "epoch": 14.572207084468666,
+ "grad_norm": 11.603144645690918,
+ "learning_rate": 1.9305825155188324e-05,
+ "loss": 1.1558,
+ "step": 5348
+ },
+ {
+ "epoch": 14.574931880108991,
+ "grad_norm": 11.087784767150879,
+ "learning_rate": 1.930550205336868e-05,
+ "loss": 1.1632,
+ "step": 5349
+ },
+ {
+ "epoch": 14.577656675749319,
+ "grad_norm": 11.974077224731445,
+ "learning_rate": 1.9305178879078083e-05,
+ "loss": 1.1041,
+ "step": 5350
+ },
+ {
+ "epoch": 14.580381471389646,
+ "grad_norm": 10.979742050170898,
+ "learning_rate": 1.9304855632319052e-05,
+ "loss": 1.1948,
+ "step": 5351
+ },
+ {
+ "epoch": 14.583106267029972,
+ "grad_norm": 9.695462226867676,
+ "learning_rate": 1.930453231309411e-05,
+ "loss": 1.0532,
+ "step": 5352
+ },
+ {
+ "epoch": 14.5858310626703,
+ "grad_norm": 16.92827606201172,
+ "learning_rate": 1.9304208921405766e-05,
+ "loss": 1.0894,
+ "step": 5353
+ },
+ {
+ "epoch": 14.588555858310627,
+ "grad_norm": 8.352365493774414,
+ "learning_rate": 1.9303885457256543e-05,
+ "loss": 0.8616,
+ "step": 5354
+ },
+ {
+ "epoch": 14.591280653950953,
+ "grad_norm": 14.493141174316406,
+ "learning_rate": 1.930356192064896e-05,
+ "loss": 1.083,
+ "step": 5355
+ },
+ {
+ "epoch": 14.59400544959128,
+ "grad_norm": 10.147053718566895,
+ "learning_rate": 1.9303238311585534e-05,
+ "loss": 1.1628,
+ "step": 5356
+ },
+ {
+ "epoch": 14.596730245231608,
+ "grad_norm": 10.885664939880371,
+ "learning_rate": 1.930291463006879e-05,
+ "loss": 1.1016,
+ "step": 5357
+ },
+ {
+ "epoch": 14.599455040871934,
+ "grad_norm": 13.00692081451416,
+ "learning_rate": 1.9302590876101248e-05,
+ "loss": 1.1027,
+ "step": 5358
+ },
+ {
+ "epoch": 14.602179836512262,
+ "grad_norm": 9.570802688598633,
+ "learning_rate": 1.9302267049685424e-05,
+ "loss": 1.0396,
+ "step": 5359
+ },
+ {
+ "epoch": 14.60490463215259,
+ "grad_norm": 12.471563339233398,
+ "learning_rate": 1.9301943150823845e-05,
+ "loss": 1.1912,
+ "step": 5360
+ },
+ {
+ "epoch": 14.607629427792915,
+ "grad_norm": 12.29695987701416,
+ "learning_rate": 1.930161917951903e-05,
+ "loss": 1.1016,
+ "step": 5361
+ },
+ {
+ "epoch": 14.610354223433243,
+ "grad_norm": 18.859411239624023,
+ "learning_rate": 1.9301295135773507e-05,
+ "loss": 1.21,
+ "step": 5362
+ },
+ {
+ "epoch": 14.61307901907357,
+ "grad_norm": 9.199820518493652,
+ "learning_rate": 1.9300971019589796e-05,
+ "loss": 1.0422,
+ "step": 5363
+ },
+ {
+ "epoch": 14.615803814713896,
+ "grad_norm": 15.703910827636719,
+ "learning_rate": 1.9300646830970423e-05,
+ "loss": 1.1895,
+ "step": 5364
+ },
+ {
+ "epoch": 14.618528610354224,
+ "grad_norm": 13.497588157653809,
+ "learning_rate": 1.930032256991791e-05,
+ "loss": 1.4207,
+ "step": 5365
+ },
+ {
+ "epoch": 14.621253405994551,
+ "grad_norm": 21.071622848510742,
+ "learning_rate": 1.9299998236434786e-05,
+ "loss": 1.1438,
+ "step": 5366
+ },
+ {
+ "epoch": 14.623978201634877,
+ "grad_norm": 11.96397876739502,
+ "learning_rate": 1.9299673830523574e-05,
+ "loss": 1.1494,
+ "step": 5367
+ },
+ {
+ "epoch": 14.626702997275205,
+ "grad_norm": 7.910435199737549,
+ "learning_rate": 1.9299349352186803e-05,
+ "loss": 1.3066,
+ "step": 5368
+ },
+ {
+ "epoch": 14.629427792915532,
+ "grad_norm": 11.785028457641602,
+ "learning_rate": 1.9299024801426994e-05,
+ "loss": 1.24,
+ "step": 5369
+ },
+ {
+ "epoch": 14.632152588555858,
+ "grad_norm": 13.936634063720703,
+ "learning_rate": 1.9298700178246685e-05,
+ "loss": 1.0817,
+ "step": 5370
+ },
+ {
+ "epoch": 14.634877384196185,
+ "grad_norm": 13.785355567932129,
+ "learning_rate": 1.9298375482648396e-05,
+ "loss": 1.0967,
+ "step": 5371
+ },
+ {
+ "epoch": 14.637602179836513,
+ "grad_norm": 14.386396408081055,
+ "learning_rate": 1.9298050714634654e-05,
+ "loss": 1.1433,
+ "step": 5372
+ },
+ {
+ "epoch": 14.640326975476839,
+ "grad_norm": 9.83299446105957,
+ "learning_rate": 1.9297725874208e-05,
+ "loss": 1.1227,
+ "step": 5373
+ },
+ {
+ "epoch": 14.643051771117166,
+ "grad_norm": 10.26580810546875,
+ "learning_rate": 1.9297400961370953e-05,
+ "loss": 1.0359,
+ "step": 5374
+ },
+ {
+ "epoch": 14.645776566757494,
+ "grad_norm": 8.300336837768555,
+ "learning_rate": 1.9297075976126044e-05,
+ "loss": 1.0693,
+ "step": 5375
+ },
+ {
+ "epoch": 14.64850136239782,
+ "grad_norm": 15.77609634399414,
+ "learning_rate": 1.9296750918475807e-05,
+ "loss": 1.1682,
+ "step": 5376
+ },
+ {
+ "epoch": 14.651226158038147,
+ "grad_norm": 13.076919555664062,
+ "learning_rate": 1.9296425788422776e-05,
+ "loss": 1.0071,
+ "step": 5377
+ },
+ {
+ "epoch": 14.653950953678475,
+ "grad_norm": 9.423595428466797,
+ "learning_rate": 1.9296100585969478e-05,
+ "loss": 0.8604,
+ "step": 5378
+ },
+ {
+ "epoch": 14.6566757493188,
+ "grad_norm": 11.712821006774902,
+ "learning_rate": 1.9295775311118445e-05,
+ "loss": 1.2681,
+ "step": 5379
+ },
+ {
+ "epoch": 14.659400544959128,
+ "grad_norm": 13.311676025390625,
+ "learning_rate": 1.9295449963872217e-05,
+ "loss": 1.0983,
+ "step": 5380
+ },
+ {
+ "epoch": 14.662125340599456,
+ "grad_norm": 11.761080741882324,
+ "learning_rate": 1.9295124544233322e-05,
+ "loss": 1.1125,
+ "step": 5381
+ },
+ {
+ "epoch": 14.664850136239782,
+ "grad_norm": 9.576361656188965,
+ "learning_rate": 1.92947990522043e-05,
+ "loss": 1.0984,
+ "step": 5382
+ },
+ {
+ "epoch": 14.66757493188011,
+ "grad_norm": 38.030128479003906,
+ "learning_rate": 1.929447348778768e-05,
+ "loss": 1.2019,
+ "step": 5383
+ },
+ {
+ "epoch": 14.670299727520437,
+ "grad_norm": 11.681124687194824,
+ "learning_rate": 1.9294147850985997e-05,
+ "loss": 0.9224,
+ "step": 5384
+ },
+ {
+ "epoch": 14.673024523160763,
+ "grad_norm": 11.757031440734863,
+ "learning_rate": 1.929382214180179e-05,
+ "loss": 0.9999,
+ "step": 5385
+ },
+ {
+ "epoch": 14.67574931880109,
+ "grad_norm": 16.173267364501953,
+ "learning_rate": 1.92934963602376e-05,
+ "loss": 1.1206,
+ "step": 5386
+ },
+ {
+ "epoch": 14.678474114441418,
+ "grad_norm": 10.76258659362793,
+ "learning_rate": 1.9293170506295955e-05,
+ "loss": 1.177,
+ "step": 5387
+ },
+ {
+ "epoch": 14.681198910081743,
+ "grad_norm": 12.828961372375488,
+ "learning_rate": 1.92928445799794e-05,
+ "loss": 1.079,
+ "step": 5388
+ },
+ {
+ "epoch": 14.683923705722071,
+ "grad_norm": 12.985787391662598,
+ "learning_rate": 1.929251858129047e-05,
+ "loss": 1.1857,
+ "step": 5389
+ },
+ {
+ "epoch": 14.686648501362399,
+ "grad_norm": 11.821076393127441,
+ "learning_rate": 1.92921925102317e-05,
+ "loss": 1.2253,
+ "step": 5390
+ },
+ {
+ "epoch": 14.689373297002724,
+ "grad_norm": 9.981273651123047,
+ "learning_rate": 1.929186636680564e-05,
+ "loss": 1.1775,
+ "step": 5391
+ },
+ {
+ "epoch": 14.692098092643052,
+ "grad_norm": 8.71783447265625,
+ "learning_rate": 1.929154015101482e-05,
+ "loss": 1.1611,
+ "step": 5392
+ },
+ {
+ "epoch": 14.69482288828338,
+ "grad_norm": 11.263312339782715,
+ "learning_rate": 1.9291213862861785e-05,
+ "loss": 1.094,
+ "step": 5393
+ },
+ {
+ "epoch": 14.697547683923705,
+ "grad_norm": 13.133688926696777,
+ "learning_rate": 1.9290887502349078e-05,
+ "loss": 1.167,
+ "step": 5394
+ },
+ {
+ "epoch": 14.700272479564033,
+ "grad_norm": 9.394452095031738,
+ "learning_rate": 1.9290561069479237e-05,
+ "loss": 1.0637,
+ "step": 5395
+ },
+ {
+ "epoch": 14.70299727520436,
+ "grad_norm": 13.00540542602539,
+ "learning_rate": 1.9290234564254803e-05,
+ "loss": 1.1196,
+ "step": 5396
+ },
+ {
+ "epoch": 14.705722070844686,
+ "grad_norm": 9.813802719116211,
+ "learning_rate": 1.928990798667832e-05,
+ "loss": 1.1252,
+ "step": 5397
+ },
+ {
+ "epoch": 14.708446866485014,
+ "grad_norm": 11.41059398651123,
+ "learning_rate": 1.9289581336752338e-05,
+ "loss": 1.0109,
+ "step": 5398
+ },
+ {
+ "epoch": 14.711171662125341,
+ "grad_norm": 9.798429489135742,
+ "learning_rate": 1.928925461447939e-05,
+ "loss": 1.1284,
+ "step": 5399
+ },
+ {
+ "epoch": 14.713896457765667,
+ "grad_norm": 8.876011848449707,
+ "learning_rate": 1.9288927819862033e-05,
+ "loss": 1.1147,
+ "step": 5400
+ },
+ {
+ "epoch": 14.716621253405995,
+ "grad_norm": 9.106521606445312,
+ "learning_rate": 1.92886009529028e-05,
+ "loss": 1.0334,
+ "step": 5401
+ },
+ {
+ "epoch": 14.719346049046322,
+ "grad_norm": 9.955561637878418,
+ "learning_rate": 1.9288274013604242e-05,
+ "loss": 1.1182,
+ "step": 5402
+ },
+ {
+ "epoch": 14.722070844686648,
+ "grad_norm": 9.079973220825195,
+ "learning_rate": 1.928794700196891e-05,
+ "loss": 1.1797,
+ "step": 5403
+ },
+ {
+ "epoch": 14.724795640326976,
+ "grad_norm": 12.39723014831543,
+ "learning_rate": 1.9287619917999336e-05,
+ "loss": 1.1438,
+ "step": 5404
+ },
+ {
+ "epoch": 14.727520435967303,
+ "grad_norm": 10.512011528015137,
+ "learning_rate": 1.9287292761698083e-05,
+ "loss": 1.0942,
+ "step": 5405
+ },
+ {
+ "epoch": 14.730245231607629,
+ "grad_norm": 12.560011863708496,
+ "learning_rate": 1.9286965533067694e-05,
+ "loss": 1.0437,
+ "step": 5406
+ },
+ {
+ "epoch": 14.732970027247957,
+ "grad_norm": 9.511140823364258,
+ "learning_rate": 1.9286638232110714e-05,
+ "loss": 1.1846,
+ "step": 5407
+ },
+ {
+ "epoch": 14.735694822888284,
+ "grad_norm": 10.107234001159668,
+ "learning_rate": 1.9286310858829696e-05,
+ "loss": 1.2512,
+ "step": 5408
+ },
+ {
+ "epoch": 14.73841961852861,
+ "grad_norm": 10.85128402709961,
+ "learning_rate": 1.9285983413227186e-05,
+ "loss": 0.8578,
+ "step": 5409
+ },
+ {
+ "epoch": 14.741144414168938,
+ "grad_norm": 11.938522338867188,
+ "learning_rate": 1.928565589530574e-05,
+ "loss": 1.0198,
+ "step": 5410
+ },
+ {
+ "epoch": 14.743869209809265,
+ "grad_norm": 11.250466346740723,
+ "learning_rate": 1.9285328305067898e-05,
+ "loss": 1.2422,
+ "step": 5411
+ },
+ {
+ "epoch": 14.746594005449591,
+ "grad_norm": 9.212725639343262,
+ "learning_rate": 1.928500064251622e-05,
+ "loss": 1.2889,
+ "step": 5412
+ },
+ {
+ "epoch": 14.749318801089919,
+ "grad_norm": 7.821893692016602,
+ "learning_rate": 1.9284672907653258e-05,
+ "loss": 1.0786,
+ "step": 5413
+ },
+ {
+ "epoch": 14.752043596730246,
+ "grad_norm": 9.918364524841309,
+ "learning_rate": 1.928434510048156e-05,
+ "loss": 1.1282,
+ "step": 5414
+ },
+ {
+ "epoch": 14.754768392370572,
+ "grad_norm": 9.928297996520996,
+ "learning_rate": 1.9284017221003686e-05,
+ "loss": 1.1211,
+ "step": 5415
+ },
+ {
+ "epoch": 14.7574931880109,
+ "grad_norm": 8.590800285339355,
+ "learning_rate": 1.928368926922218e-05,
+ "loss": 1.1864,
+ "step": 5416
+ },
+ {
+ "epoch": 14.760217983651227,
+ "grad_norm": 8.307841300964355,
+ "learning_rate": 1.92833612451396e-05,
+ "loss": 0.9934,
+ "step": 5417
+ },
+ {
+ "epoch": 14.762942779291553,
+ "grad_norm": 8.209846496582031,
+ "learning_rate": 1.9283033148758506e-05,
+ "loss": 1.0151,
+ "step": 5418
+ },
+ {
+ "epoch": 14.76566757493188,
+ "grad_norm": 9.439775466918945,
+ "learning_rate": 1.9282704980081446e-05,
+ "loss": 1.1469,
+ "step": 5419
+ },
+ {
+ "epoch": 14.768392370572208,
+ "grad_norm": 9.905940055847168,
+ "learning_rate": 1.928237673911098e-05,
+ "loss": 1.1277,
+ "step": 5420
+ },
+ {
+ "epoch": 14.771117166212534,
+ "grad_norm": 10.38306999206543,
+ "learning_rate": 1.928204842584966e-05,
+ "loss": 1.0771,
+ "step": 5421
+ },
+ {
+ "epoch": 14.773841961852861,
+ "grad_norm": 10.64194393157959,
+ "learning_rate": 1.928172004030005e-05,
+ "loss": 1.1511,
+ "step": 5422
+ },
+ {
+ "epoch": 14.776566757493189,
+ "grad_norm": 9.811735153198242,
+ "learning_rate": 1.9281391582464697e-05,
+ "loss": 1.2218,
+ "step": 5423
+ },
+ {
+ "epoch": 14.779291553133515,
+ "grad_norm": 10.465387344360352,
+ "learning_rate": 1.9281063052346168e-05,
+ "loss": 0.9645,
+ "step": 5424
+ },
+ {
+ "epoch": 14.782016348773842,
+ "grad_norm": 9.601802825927734,
+ "learning_rate": 1.928073444994702e-05,
+ "loss": 1.1152,
+ "step": 5425
+ },
+ {
+ "epoch": 14.78474114441417,
+ "grad_norm": 8.191433906555176,
+ "learning_rate": 1.928040577526981e-05,
+ "loss": 1.0205,
+ "step": 5426
+ },
+ {
+ "epoch": 14.787465940054496,
+ "grad_norm": 8.16183090209961,
+ "learning_rate": 1.9280077028317096e-05,
+ "loss": 1.1672,
+ "step": 5427
+ },
+ {
+ "epoch": 14.790190735694823,
+ "grad_norm": 13.249311447143555,
+ "learning_rate": 1.927974820909144e-05,
+ "loss": 1.1494,
+ "step": 5428
+ },
+ {
+ "epoch": 14.79291553133515,
+ "grad_norm": 7.822423458099365,
+ "learning_rate": 1.927941931759541e-05,
+ "loss": 1.1196,
+ "step": 5429
+ },
+ {
+ "epoch": 14.795640326975477,
+ "grad_norm": 7.371486186981201,
+ "learning_rate": 1.9279090353831557e-05,
+ "loss": 0.9851,
+ "step": 5430
+ },
+ {
+ "epoch": 14.798365122615804,
+ "grad_norm": 9.159686088562012,
+ "learning_rate": 1.9278761317802448e-05,
+ "loss": 1.1333,
+ "step": 5431
+ },
+ {
+ "epoch": 14.80108991825613,
+ "grad_norm": 14.047561645507812,
+ "learning_rate": 1.9278432209510644e-05,
+ "loss": 1.1741,
+ "step": 5432
+ },
+ {
+ "epoch": 14.803814713896458,
+ "grad_norm": 12.84555435180664,
+ "learning_rate": 1.9278103028958707e-05,
+ "loss": 1.0486,
+ "step": 5433
+ },
+ {
+ "epoch": 14.806539509536785,
+ "grad_norm": 8.609007835388184,
+ "learning_rate": 1.9277773776149208e-05,
+ "loss": 1.0444,
+ "step": 5434
+ },
+ {
+ "epoch": 14.809264305177111,
+ "grad_norm": 8.697768211364746,
+ "learning_rate": 1.92774444510847e-05,
+ "loss": 1.1321,
+ "step": 5435
+ },
+ {
+ "epoch": 14.811989100817438,
+ "grad_norm": 7.1575798988342285,
+ "learning_rate": 1.927711505376775e-05,
+ "loss": 1.1589,
+ "step": 5436
+ },
+ {
+ "epoch": 14.814713896457766,
+ "grad_norm": 32.84316635131836,
+ "learning_rate": 1.9276785584200935e-05,
+ "loss": 1.0726,
+ "step": 5437
+ },
+ {
+ "epoch": 14.817438692098092,
+ "grad_norm": 9.116987228393555,
+ "learning_rate": 1.9276456042386806e-05,
+ "loss": 1.0488,
+ "step": 5438
+ },
+ {
+ "epoch": 14.82016348773842,
+ "grad_norm": 8.860197067260742,
+ "learning_rate": 1.927612642832794e-05,
+ "loss": 1.098,
+ "step": 5439
+ },
+ {
+ "epoch": 14.822888283378747,
+ "grad_norm": 9.601526260375977,
+ "learning_rate": 1.9275796742026898e-05,
+ "loss": 1.1243,
+ "step": 5440
+ },
+ {
+ "epoch": 14.825613079019073,
+ "grad_norm": 11.47438907623291,
+ "learning_rate": 1.9275466983486247e-05,
+ "loss": 1.1287,
+ "step": 5441
+ },
+ {
+ "epoch": 14.8283378746594,
+ "grad_norm": 8.937363624572754,
+ "learning_rate": 1.9275137152708564e-05,
+ "loss": 0.9294,
+ "step": 5442
+ },
+ {
+ "epoch": 14.831062670299728,
+ "grad_norm": 9.600807189941406,
+ "learning_rate": 1.9274807249696405e-05,
+ "loss": 1.077,
+ "step": 5443
+ },
+ {
+ "epoch": 14.833787465940054,
+ "grad_norm": 8.64490795135498,
+ "learning_rate": 1.927447727445235e-05,
+ "loss": 0.9917,
+ "step": 5444
+ },
+ {
+ "epoch": 14.836512261580381,
+ "grad_norm": 9.722396850585938,
+ "learning_rate": 1.9274147226978962e-05,
+ "loss": 0.9272,
+ "step": 5445
+ },
+ {
+ "epoch": 14.839237057220709,
+ "grad_norm": 9.325379371643066,
+ "learning_rate": 1.9273817107278815e-05,
+ "loss": 1.0829,
+ "step": 5446
+ },
+ {
+ "epoch": 14.841961852861035,
+ "grad_norm": 9.744324684143066,
+ "learning_rate": 1.927348691535448e-05,
+ "loss": 1.0204,
+ "step": 5447
+ },
+ {
+ "epoch": 14.844686648501362,
+ "grad_norm": 10.210845947265625,
+ "learning_rate": 1.9273156651208525e-05,
+ "loss": 1.2598,
+ "step": 5448
+ },
+ {
+ "epoch": 14.84741144414169,
+ "grad_norm": 8.943734169006348,
+ "learning_rate": 1.9272826314843526e-05,
+ "loss": 1.0222,
+ "step": 5449
+ },
+ {
+ "epoch": 14.850136239782016,
+ "grad_norm": 7.680088520050049,
+ "learning_rate": 1.9272495906262053e-05,
+ "loss": 0.9257,
+ "step": 5450
+ },
+ {
+ "epoch": 14.852861035422343,
+ "grad_norm": 11.96497631072998,
+ "learning_rate": 1.927216542546668e-05,
+ "loss": 1.1292,
+ "step": 5451
+ },
+ {
+ "epoch": 14.85558583106267,
+ "grad_norm": 7.999666213989258,
+ "learning_rate": 1.9271834872459982e-05,
+ "loss": 1.0208,
+ "step": 5452
+ },
+ {
+ "epoch": 14.858310626702997,
+ "grad_norm": 10.969223976135254,
+ "learning_rate": 1.9271504247244534e-05,
+ "loss": 1.1418,
+ "step": 5453
+ },
+ {
+ "epoch": 14.861035422343324,
+ "grad_norm": 10.95656967163086,
+ "learning_rate": 1.927117354982291e-05,
+ "loss": 1.1616,
+ "step": 5454
+ },
+ {
+ "epoch": 14.863760217983652,
+ "grad_norm": 11.002049446105957,
+ "learning_rate": 1.927084278019768e-05,
+ "loss": 1.04,
+ "step": 5455
+ },
+ {
+ "epoch": 14.866485013623977,
+ "grad_norm": 9.948211669921875,
+ "learning_rate": 1.9270511938371425e-05,
+ "loss": 1.1589,
+ "step": 5456
+ },
+ {
+ "epoch": 14.869209809264305,
+ "grad_norm": 7.003767967224121,
+ "learning_rate": 1.9270181024346727e-05,
+ "loss": 1.054,
+ "step": 5457
+ },
+ {
+ "epoch": 14.871934604904633,
+ "grad_norm": 9.24045181274414,
+ "learning_rate": 1.9269850038126152e-05,
+ "loss": 0.9512,
+ "step": 5458
+ },
+ {
+ "epoch": 14.874659400544958,
+ "grad_norm": 9.06789493560791,
+ "learning_rate": 1.9269518979712285e-05,
+ "loss": 1.1877,
+ "step": 5459
+ },
+ {
+ "epoch": 14.877384196185286,
+ "grad_norm": 10.27806282043457,
+ "learning_rate": 1.9269187849107703e-05,
+ "loss": 1.1566,
+ "step": 5460
+ },
+ {
+ "epoch": 14.880108991825614,
+ "grad_norm": 8.048421859741211,
+ "learning_rate": 1.9268856646314983e-05,
+ "loss": 1.1638,
+ "step": 5461
+ },
+ {
+ "epoch": 14.88283378746594,
+ "grad_norm": 11.141575813293457,
+ "learning_rate": 1.926852537133671e-05,
+ "loss": 1.2466,
+ "step": 5462
+ },
+ {
+ "epoch": 14.885558583106267,
+ "grad_norm": 8.194379806518555,
+ "learning_rate": 1.926819402417546e-05,
+ "loss": 1.1511,
+ "step": 5463
+ },
+ {
+ "epoch": 14.888283378746594,
+ "grad_norm": 8.322203636169434,
+ "learning_rate": 1.9267862604833808e-05,
+ "loss": 1.0703,
+ "step": 5464
+ },
+ {
+ "epoch": 14.89100817438692,
+ "grad_norm": 8.79293155670166,
+ "learning_rate": 1.9267531113314343e-05,
+ "loss": 1.2595,
+ "step": 5465
+ },
+ {
+ "epoch": 14.893732970027248,
+ "grad_norm": 12.21040153503418,
+ "learning_rate": 1.9267199549619643e-05,
+ "loss": 1.0713,
+ "step": 5466
+ },
+ {
+ "epoch": 14.896457765667575,
+ "grad_norm": 13.462485313415527,
+ "learning_rate": 1.926686791375229e-05,
+ "loss": 1.0867,
+ "step": 5467
+ },
+ {
+ "epoch": 14.899182561307901,
+ "grad_norm": 8.758882522583008,
+ "learning_rate": 1.926653620571487e-05,
+ "loss": 1.1934,
+ "step": 5468
+ },
+ {
+ "epoch": 14.901907356948229,
+ "grad_norm": 8.370561599731445,
+ "learning_rate": 1.9266204425509962e-05,
+ "loss": 1.1484,
+ "step": 5469
+ },
+ {
+ "epoch": 14.904632152588556,
+ "grad_norm": 9.9232816696167,
+ "learning_rate": 1.9265872573140156e-05,
+ "loss": 1.0056,
+ "step": 5470
+ },
+ {
+ "epoch": 14.907356948228882,
+ "grad_norm": 9.87440013885498,
+ "learning_rate": 1.926554064860803e-05,
+ "loss": 1.1371,
+ "step": 5471
+ },
+ {
+ "epoch": 14.91008174386921,
+ "grad_norm": 9.33785343170166,
+ "learning_rate": 1.9265208651916172e-05,
+ "loss": 1.063,
+ "step": 5472
+ },
+ {
+ "epoch": 14.912806539509537,
+ "grad_norm": 16.72821044921875,
+ "learning_rate": 1.9264876583067167e-05,
+ "loss": 1.2517,
+ "step": 5473
+ },
+ {
+ "epoch": 14.915531335149863,
+ "grad_norm": 9.422157287597656,
+ "learning_rate": 1.92645444420636e-05,
+ "loss": 1.1331,
+ "step": 5474
+ },
+ {
+ "epoch": 14.91825613079019,
+ "grad_norm": 8.592704772949219,
+ "learning_rate": 1.9264212228908063e-05,
+ "loss": 1.0295,
+ "step": 5475
+ },
+ {
+ "epoch": 14.920980926430518,
+ "grad_norm": 8.709903717041016,
+ "learning_rate": 1.9263879943603136e-05,
+ "loss": 1.0198,
+ "step": 5476
+ },
+ {
+ "epoch": 14.923705722070844,
+ "grad_norm": 8.811495780944824,
+ "learning_rate": 1.9263547586151412e-05,
+ "loss": 0.9832,
+ "step": 5477
+ },
+ {
+ "epoch": 14.926430517711172,
+ "grad_norm": 10.670900344848633,
+ "learning_rate": 1.9263215156555477e-05,
+ "loss": 1.1501,
+ "step": 5478
+ },
+ {
+ "epoch": 14.9291553133515,
+ "grad_norm": 9.27827262878418,
+ "learning_rate": 1.9262882654817918e-05,
+ "loss": 1.157,
+ "step": 5479
+ },
+ {
+ "epoch": 14.931880108991825,
+ "grad_norm": 11.302102088928223,
+ "learning_rate": 1.926255008094133e-05,
+ "loss": 1.0518,
+ "step": 5480
+ },
+ {
+ "epoch": 14.934604904632153,
+ "grad_norm": 7.121042728424072,
+ "learning_rate": 1.92622174349283e-05,
+ "loss": 0.9431,
+ "step": 5481
+ },
+ {
+ "epoch": 14.93732970027248,
+ "grad_norm": 9.873361587524414,
+ "learning_rate": 1.9261884716781417e-05,
+ "loss": 1.1199,
+ "step": 5482
+ },
+ {
+ "epoch": 14.940054495912806,
+ "grad_norm": 10.81009578704834,
+ "learning_rate": 1.9261551926503277e-05,
+ "loss": 1.1157,
+ "step": 5483
+ },
+ {
+ "epoch": 14.942779291553133,
+ "grad_norm": 10.118577003479004,
+ "learning_rate": 1.9261219064096467e-05,
+ "loss": 1.0876,
+ "step": 5484
+ },
+ {
+ "epoch": 14.945504087193461,
+ "grad_norm": 9.304665565490723,
+ "learning_rate": 1.926088612956358e-05,
+ "loss": 1.1548,
+ "step": 5485
+ },
+ {
+ "epoch": 14.948228882833787,
+ "grad_norm": 8.310667991638184,
+ "learning_rate": 1.926055312290721e-05,
+ "loss": 1.0819,
+ "step": 5486
+ },
+ {
+ "epoch": 14.950953678474114,
+ "grad_norm": 10.15754508972168,
+ "learning_rate": 1.9260220044129953e-05,
+ "loss": 0.9282,
+ "step": 5487
+ },
+ {
+ "epoch": 14.953678474114442,
+ "grad_norm": 10.331604957580566,
+ "learning_rate": 1.9259886893234397e-05,
+ "loss": 1.1792,
+ "step": 5488
+ },
+ {
+ "epoch": 14.956403269754768,
+ "grad_norm": 10.211618423461914,
+ "learning_rate": 1.925955367022314e-05,
+ "loss": 1.0898,
+ "step": 5489
+ },
+ {
+ "epoch": 14.959128065395095,
+ "grad_norm": 11.046704292297363,
+ "learning_rate": 1.925922037509878e-05,
+ "loss": 1.0498,
+ "step": 5490
+ },
+ {
+ "epoch": 14.961852861035423,
+ "grad_norm": 13.784923553466797,
+ "learning_rate": 1.925888700786391e-05,
+ "loss": 0.9541,
+ "step": 5491
+ },
+ {
+ "epoch": 14.964577656675749,
+ "grad_norm": 14.446078300476074,
+ "learning_rate": 1.925855356852112e-05,
+ "loss": 1.0426,
+ "step": 5492
+ },
+ {
+ "epoch": 14.967302452316076,
+ "grad_norm": 13.812178611755371,
+ "learning_rate": 1.925822005707302e-05,
+ "loss": 1.2158,
+ "step": 5493
+ },
+ {
+ "epoch": 14.970027247956404,
+ "grad_norm": 9.299683570861816,
+ "learning_rate": 1.9257886473522194e-05,
+ "loss": 1.2102,
+ "step": 5494
+ },
+ {
+ "epoch": 14.97275204359673,
+ "grad_norm": 11.779254913330078,
+ "learning_rate": 1.925755281787125e-05,
+ "loss": 1.1792,
+ "step": 5495
+ },
+ {
+ "epoch": 14.975476839237057,
+ "grad_norm": 15.099937438964844,
+ "learning_rate": 1.9257219090122782e-05,
+ "loss": 1.0396,
+ "step": 5496
+ },
+ {
+ "epoch": 14.978201634877385,
+ "grad_norm": 21.414133071899414,
+ "learning_rate": 1.925688529027939e-05,
+ "loss": 1.3333,
+ "step": 5497
+ },
+ {
+ "epoch": 14.98092643051771,
+ "grad_norm": 12.682548522949219,
+ "learning_rate": 1.925655141834367e-05,
+ "loss": 1.3135,
+ "step": 5498
+ },
+ {
+ "epoch": 14.983651226158038,
+ "grad_norm": 9.636043548583984,
+ "learning_rate": 1.9256217474318227e-05,
+ "loss": 1.1958,
+ "step": 5499
+ },
+ {
+ "epoch": 14.986376021798366,
+ "grad_norm": 9.636250495910645,
+ "learning_rate": 1.9255883458205664e-05,
+ "loss": 0.9243,
+ "step": 5500
+ },
+ {
+ "epoch": 14.989100817438691,
+ "grad_norm": 17.597333908081055,
+ "learning_rate": 1.9255549370008575e-05,
+ "loss": 1.0493,
+ "step": 5501
+ },
+ {
+ "epoch": 14.991825613079019,
+ "grad_norm": 8.619144439697266,
+ "learning_rate": 1.925521520972957e-05,
+ "loss": 1.1733,
+ "step": 5502
+ },
+ {
+ "epoch": 14.994550408719347,
+ "grad_norm": 10.077827453613281,
+ "learning_rate": 1.925488097737124e-05,
+ "loss": 1.0237,
+ "step": 5503
+ },
+ {
+ "epoch": 14.997275204359672,
+ "grad_norm": 8.45253849029541,
+ "learning_rate": 1.92545466729362e-05,
+ "loss": 1.1523,
+ "step": 5504
+ },
+ {
+ "epoch": 15.0,
+ "grad_norm": 9.242919921875,
+ "learning_rate": 1.9254212296427043e-05,
+ "loss": 1.1511,
+ "step": 5505
+ },
+ {
+ "epoch": 15.002724795640328,
+ "grad_norm": 9.065591812133789,
+ "learning_rate": 1.925387784784638e-05,
+ "loss": 0.8765,
+ "step": 5506
+ },
+ {
+ "epoch": 15.005449591280653,
+ "grad_norm": 9.483454704284668,
+ "learning_rate": 1.925354332719682e-05,
+ "loss": 0.8127,
+ "step": 5507
+ },
+ {
+ "epoch": 15.008174386920981,
+ "grad_norm": 9.035008430480957,
+ "learning_rate": 1.9253208734480953e-05,
+ "loss": 1.0515,
+ "step": 5508
+ },
+ {
+ "epoch": 15.010899182561309,
+ "grad_norm": 10.661617279052734,
+ "learning_rate": 1.9252874069701405e-05,
+ "loss": 0.9171,
+ "step": 5509
+ },
+ {
+ "epoch": 15.013623978201634,
+ "grad_norm": 8.760483741760254,
+ "learning_rate": 1.9252539332860762e-05,
+ "loss": 1.2288,
+ "step": 5510
+ },
+ {
+ "epoch": 15.016348773841962,
+ "grad_norm": 7.86459493637085,
+ "learning_rate": 1.9252204523961645e-05,
+ "loss": 0.906,
+ "step": 5511
+ },
+ {
+ "epoch": 15.01907356948229,
+ "grad_norm": 10.616339683532715,
+ "learning_rate": 1.9251869643006657e-05,
+ "loss": 1.2582,
+ "step": 5512
+ },
+ {
+ "epoch": 15.021798365122615,
+ "grad_norm": 7.371670722961426,
+ "learning_rate": 1.9251534689998406e-05,
+ "loss": 1.0967,
+ "step": 5513
+ },
+ {
+ "epoch": 15.024523160762943,
+ "grad_norm": 6.8104567527771,
+ "learning_rate": 1.92511996649395e-05,
+ "loss": 0.828,
+ "step": 5514
+ },
+ {
+ "epoch": 15.02724795640327,
+ "grad_norm": 12.358208656311035,
+ "learning_rate": 1.925086456783255e-05,
+ "loss": 1.0417,
+ "step": 5515
+ },
+ {
+ "epoch": 15.029972752043596,
+ "grad_norm": 8.836557388305664,
+ "learning_rate": 1.925052939868016e-05,
+ "loss": 1.0027,
+ "step": 5516
+ },
+ {
+ "epoch": 15.032697547683924,
+ "grad_norm": 9.613363265991211,
+ "learning_rate": 1.925019415748495e-05,
+ "loss": 1.0148,
+ "step": 5517
+ },
+ {
+ "epoch": 15.035422343324251,
+ "grad_norm": 8.410662651062012,
+ "learning_rate": 1.924985884424952e-05,
+ "loss": 0.9382,
+ "step": 5518
+ },
+ {
+ "epoch": 15.038147138964577,
+ "grad_norm": 8.761898040771484,
+ "learning_rate": 1.9249523458976494e-05,
+ "loss": 0.9354,
+ "step": 5519
+ },
+ {
+ "epoch": 15.040871934604905,
+ "grad_norm": 10.815780639648438,
+ "learning_rate": 1.9249188001668474e-05,
+ "loss": 0.8989,
+ "step": 5520
+ },
+ {
+ "epoch": 15.043596730245232,
+ "grad_norm": 8.083906173706055,
+ "learning_rate": 1.9248852472328075e-05,
+ "loss": 1.0005,
+ "step": 5521
+ },
+ {
+ "epoch": 15.046321525885558,
+ "grad_norm": 7.896905422210693,
+ "learning_rate": 1.924851687095791e-05,
+ "loss": 1.0674,
+ "step": 5522
+ },
+ {
+ "epoch": 15.049046321525886,
+ "grad_norm": 7.164858818054199,
+ "learning_rate": 1.9248181197560594e-05,
+ "loss": 0.9547,
+ "step": 5523
+ },
+ {
+ "epoch": 15.051771117166213,
+ "grad_norm": 11.201558113098145,
+ "learning_rate": 1.924784545213874e-05,
+ "loss": 0.9178,
+ "step": 5524
+ },
+ {
+ "epoch": 15.054495912806539,
+ "grad_norm": 9.608845710754395,
+ "learning_rate": 1.9247509634694963e-05,
+ "loss": 0.993,
+ "step": 5525
+ },
+ {
+ "epoch": 15.057220708446867,
+ "grad_norm": 9.189961433410645,
+ "learning_rate": 1.924717374523188e-05,
+ "loss": 1.0779,
+ "step": 5526
+ },
+ {
+ "epoch": 15.059945504087194,
+ "grad_norm": 8.895902633666992,
+ "learning_rate": 1.9246837783752106e-05,
+ "loss": 1.0948,
+ "step": 5527
+ },
+ {
+ "epoch": 15.06267029972752,
+ "grad_norm": 8.975088119506836,
+ "learning_rate": 1.9246501750258256e-05,
+ "loss": 0.959,
+ "step": 5528
+ },
+ {
+ "epoch": 15.065395095367847,
+ "grad_norm": 11.457137107849121,
+ "learning_rate": 1.9246165644752944e-05,
+ "loss": 0.8561,
+ "step": 5529
+ },
+ {
+ "epoch": 15.068119891008175,
+ "grad_norm": 8.237933158874512,
+ "learning_rate": 1.92458294672388e-05,
+ "loss": 0.9904,
+ "step": 5530
+ },
+ {
+ "epoch": 15.0708446866485,
+ "grad_norm": 12.692983627319336,
+ "learning_rate": 1.9245493217718426e-05,
+ "loss": 1.02,
+ "step": 5531
+ },
+ {
+ "epoch": 15.073569482288828,
+ "grad_norm": 8.939153671264648,
+ "learning_rate": 1.924515689619445e-05,
+ "loss": 0.9595,
+ "step": 5532
+ },
+ {
+ "epoch": 15.076294277929156,
+ "grad_norm": 7.779260635375977,
+ "learning_rate": 1.9244820502669494e-05,
+ "loss": 1.1637,
+ "step": 5533
+ },
+ {
+ "epoch": 15.079019073569482,
+ "grad_norm": 13.962143898010254,
+ "learning_rate": 1.924448403714617e-05,
+ "loss": 1.0122,
+ "step": 5534
+ },
+ {
+ "epoch": 15.08174386920981,
+ "grad_norm": 27.474210739135742,
+ "learning_rate": 1.9244147499627103e-05,
+ "loss": 0.9863,
+ "step": 5535
+ },
+ {
+ "epoch": 15.084468664850137,
+ "grad_norm": 11.234265327453613,
+ "learning_rate": 1.924381089011491e-05,
+ "loss": 1.0011,
+ "step": 5536
+ },
+ {
+ "epoch": 15.087193460490463,
+ "grad_norm": 25.47540855407715,
+ "learning_rate": 1.924347420861222e-05,
+ "loss": 0.9214,
+ "step": 5537
+ },
+ {
+ "epoch": 15.08991825613079,
+ "grad_norm": 9.881484985351562,
+ "learning_rate": 1.9243137455121648e-05,
+ "loss": 0.9729,
+ "step": 5538
+ },
+ {
+ "epoch": 15.092643051771118,
+ "grad_norm": 7.067080497741699,
+ "learning_rate": 1.9242800629645815e-05,
+ "loss": 0.9155,
+ "step": 5539
+ },
+ {
+ "epoch": 15.095367847411444,
+ "grad_norm": 8.203058242797852,
+ "learning_rate": 1.9242463732187355e-05,
+ "loss": 0.9041,
+ "step": 5540
+ },
+ {
+ "epoch": 15.098092643051771,
+ "grad_norm": 11.838784217834473,
+ "learning_rate": 1.924212676274888e-05,
+ "loss": 1.014,
+ "step": 5541
+ },
+ {
+ "epoch": 15.100817438692099,
+ "grad_norm": 8.50169849395752,
+ "learning_rate": 1.9241789721333023e-05,
+ "loss": 0.9708,
+ "step": 5542
+ },
+ {
+ "epoch": 15.103542234332425,
+ "grad_norm": 9.780434608459473,
+ "learning_rate": 1.9241452607942405e-05,
+ "loss": 0.99,
+ "step": 5543
+ },
+ {
+ "epoch": 15.106267029972752,
+ "grad_norm": 10.974543571472168,
+ "learning_rate": 1.9241115422579647e-05,
+ "loss": 1.0862,
+ "step": 5544
+ },
+ {
+ "epoch": 15.10899182561308,
+ "grad_norm": 9.12978744506836,
+ "learning_rate": 1.9240778165247384e-05,
+ "loss": 1.0861,
+ "step": 5545
+ },
+ {
+ "epoch": 15.111716621253406,
+ "grad_norm": 10.310650825500488,
+ "learning_rate": 1.9240440835948236e-05,
+ "loss": 1.0051,
+ "step": 5546
+ },
+ {
+ "epoch": 15.114441416893733,
+ "grad_norm": 13.019513130187988,
+ "learning_rate": 1.924010343468483e-05,
+ "loss": 0.9302,
+ "step": 5547
+ },
+ {
+ "epoch": 15.11716621253406,
+ "grad_norm": 14.484766006469727,
+ "learning_rate": 1.92397659614598e-05,
+ "loss": 1.1006,
+ "step": 5548
+ },
+ {
+ "epoch": 15.119891008174386,
+ "grad_norm": 11.86329174041748,
+ "learning_rate": 1.923942841627577e-05,
+ "loss": 1.0583,
+ "step": 5549
+ },
+ {
+ "epoch": 15.122615803814714,
+ "grad_norm": 13.653573989868164,
+ "learning_rate": 1.9239090799135365e-05,
+ "loss": 1.0862,
+ "step": 5550
+ },
+ {
+ "epoch": 15.125340599455042,
+ "grad_norm": 13.406563758850098,
+ "learning_rate": 1.923875311004122e-05,
+ "loss": 0.9261,
+ "step": 5551
+ },
+ {
+ "epoch": 15.128065395095367,
+ "grad_norm": 13.019432067871094,
+ "learning_rate": 1.9238415348995965e-05,
+ "loss": 1.0138,
+ "step": 5552
+ },
+ {
+ "epoch": 15.130790190735695,
+ "grad_norm": 12.109644889831543,
+ "learning_rate": 1.9238077516002228e-05,
+ "loss": 1.1106,
+ "step": 5553
+ },
+ {
+ "epoch": 15.133514986376023,
+ "grad_norm": 13.985251426696777,
+ "learning_rate": 1.9237739611062637e-05,
+ "loss": 0.9958,
+ "step": 5554
+ },
+ {
+ "epoch": 15.136239782016348,
+ "grad_norm": 12.948760986328125,
+ "learning_rate": 1.923740163417983e-05,
+ "loss": 1.1196,
+ "step": 5555
+ },
+ {
+ "epoch": 15.138964577656676,
+ "grad_norm": 12.464645385742188,
+ "learning_rate": 1.9237063585356438e-05,
+ "loss": 0.9337,
+ "step": 5556
+ },
+ {
+ "epoch": 15.141689373297003,
+ "grad_norm": 19.540958404541016,
+ "learning_rate": 1.923672546459509e-05,
+ "loss": 1.0425,
+ "step": 5557
+ },
+ {
+ "epoch": 15.14441416893733,
+ "grad_norm": 11.664422988891602,
+ "learning_rate": 1.9236387271898422e-05,
+ "loss": 0.9451,
+ "step": 5558
+ },
+ {
+ "epoch": 15.147138964577657,
+ "grad_norm": 14.192788124084473,
+ "learning_rate": 1.9236049007269065e-05,
+ "loss": 1.0309,
+ "step": 5559
+ },
+ {
+ "epoch": 15.149863760217984,
+ "grad_norm": 10.858256340026855,
+ "learning_rate": 1.923571067070966e-05,
+ "loss": 0.983,
+ "step": 5560
+ },
+ {
+ "epoch": 15.15258855585831,
+ "grad_norm": 62.61029052734375,
+ "learning_rate": 1.9235372262222836e-05,
+ "loss": 1.1512,
+ "step": 5561
+ },
+ {
+ "epoch": 15.155313351498638,
+ "grad_norm": 13.153077125549316,
+ "learning_rate": 1.923503378181123e-05,
+ "loss": 1.0171,
+ "step": 5562
+ },
+ {
+ "epoch": 15.158038147138965,
+ "grad_norm": 14.244160652160645,
+ "learning_rate": 1.9234695229477475e-05,
+ "loss": 0.9473,
+ "step": 5563
+ },
+ {
+ "epoch": 15.160762942779291,
+ "grad_norm": 11.219650268554688,
+ "learning_rate": 1.9234356605224214e-05,
+ "loss": 1.182,
+ "step": 5564
+ },
+ {
+ "epoch": 15.163487738419619,
+ "grad_norm": 10.995183944702148,
+ "learning_rate": 1.923401790905408e-05,
+ "loss": 1.0027,
+ "step": 5565
+ },
+ {
+ "epoch": 15.166212534059946,
+ "grad_norm": 66.59759521484375,
+ "learning_rate": 1.9233679140969712e-05,
+ "loss": 1.0862,
+ "step": 5566
+ },
+ {
+ "epoch": 15.168937329700272,
+ "grad_norm": 10.47517204284668,
+ "learning_rate": 1.9233340300973748e-05,
+ "loss": 1.0009,
+ "step": 5567
+ },
+ {
+ "epoch": 15.1716621253406,
+ "grad_norm": 9.122160911560059,
+ "learning_rate": 1.923300138906883e-05,
+ "loss": 0.9331,
+ "step": 5568
+ },
+ {
+ "epoch": 15.174386920980927,
+ "grad_norm": 13.863876342773438,
+ "learning_rate": 1.9232662405257587e-05,
+ "loss": 1.0895,
+ "step": 5569
+ },
+ {
+ "epoch": 15.177111716621253,
+ "grad_norm": 30.79233169555664,
+ "learning_rate": 1.9232323349542672e-05,
+ "loss": 0.9667,
+ "step": 5570
+ },
+ {
+ "epoch": 15.17983651226158,
+ "grad_norm": 29.254474639892578,
+ "learning_rate": 1.923198422192672e-05,
+ "loss": 0.8047,
+ "step": 5571
+ },
+ {
+ "epoch": 15.182561307901908,
+ "grad_norm": 13.909764289855957,
+ "learning_rate": 1.9231645022412367e-05,
+ "loss": 1.157,
+ "step": 5572
+ },
+ {
+ "epoch": 15.185286103542234,
+ "grad_norm": 9.685226440429688,
+ "learning_rate": 1.9231305751002264e-05,
+ "loss": 1.0886,
+ "step": 5573
+ },
+ {
+ "epoch": 15.188010899182562,
+ "grad_norm": 11.024321556091309,
+ "learning_rate": 1.9230966407699048e-05,
+ "loss": 1.0128,
+ "step": 5574
+ },
+ {
+ "epoch": 15.190735694822889,
+ "grad_norm": 11.645596504211426,
+ "learning_rate": 1.9230626992505363e-05,
+ "loss": 1.0615,
+ "step": 5575
+ },
+ {
+ "epoch": 15.193460490463215,
+ "grad_norm": 34.92819595336914,
+ "learning_rate": 1.9230287505423854e-05,
+ "loss": 0.9623,
+ "step": 5576
+ },
+ {
+ "epoch": 15.196185286103542,
+ "grad_norm": 11.23338794708252,
+ "learning_rate": 1.922994794645716e-05,
+ "loss": 1.1057,
+ "step": 5577
+ },
+ {
+ "epoch": 15.19891008174387,
+ "grad_norm": 11.245293617248535,
+ "learning_rate": 1.9229608315607927e-05,
+ "loss": 1.0365,
+ "step": 5578
+ },
+ {
+ "epoch": 15.201634877384196,
+ "grad_norm": 9.669820785522461,
+ "learning_rate": 1.9229268612878805e-05,
+ "loss": 1.1202,
+ "step": 5579
+ },
+ {
+ "epoch": 15.204359673024523,
+ "grad_norm": 12.526248931884766,
+ "learning_rate": 1.9228928838272436e-05,
+ "loss": 0.9048,
+ "step": 5580
+ },
+ {
+ "epoch": 15.207084468664851,
+ "grad_norm": 9.201279640197754,
+ "learning_rate": 1.9228588991791462e-05,
+ "loss": 1.1516,
+ "step": 5581
+ },
+ {
+ "epoch": 15.209809264305177,
+ "grad_norm": 8.671073913574219,
+ "learning_rate": 1.922824907343854e-05,
+ "loss": 0.9691,
+ "step": 5582
+ },
+ {
+ "epoch": 15.212534059945504,
+ "grad_norm": 11.62646484375,
+ "learning_rate": 1.9227909083216305e-05,
+ "loss": 1.1575,
+ "step": 5583
+ },
+ {
+ "epoch": 15.215258855585832,
+ "grad_norm": 8.900074005126953,
+ "learning_rate": 1.9227569021127418e-05,
+ "loss": 1.0645,
+ "step": 5584
+ },
+ {
+ "epoch": 15.217983651226158,
+ "grad_norm": 11.487918853759766,
+ "learning_rate": 1.9227228887174517e-05,
+ "loss": 1.0321,
+ "step": 5585
+ },
+ {
+ "epoch": 15.220708446866485,
+ "grad_norm": 9.938650131225586,
+ "learning_rate": 1.9226888681360253e-05,
+ "loss": 1.1611,
+ "step": 5586
+ },
+ {
+ "epoch": 15.223433242506813,
+ "grad_norm": 12.60831356048584,
+ "learning_rate": 1.9226548403687277e-05,
+ "loss": 1.0646,
+ "step": 5587
+ },
+ {
+ "epoch": 15.226158038147139,
+ "grad_norm": 12.61571979522705,
+ "learning_rate": 1.922620805415824e-05,
+ "loss": 1.1956,
+ "step": 5588
+ },
+ {
+ "epoch": 15.228882833787466,
+ "grad_norm": 14.253225326538086,
+ "learning_rate": 1.9225867632775792e-05,
+ "loss": 1.0023,
+ "step": 5589
+ },
+ {
+ "epoch": 15.231607629427794,
+ "grad_norm": 9.755847930908203,
+ "learning_rate": 1.922552713954258e-05,
+ "loss": 1.2346,
+ "step": 5590
+ },
+ {
+ "epoch": 15.23433242506812,
+ "grad_norm": 8.390456199645996,
+ "learning_rate": 1.9225186574461267e-05,
+ "loss": 0.9659,
+ "step": 5591
+ },
+ {
+ "epoch": 15.237057220708447,
+ "grad_norm": 11.750336647033691,
+ "learning_rate": 1.9224845937534493e-05,
+ "loss": 0.9033,
+ "step": 5592
+ },
+ {
+ "epoch": 15.239782016348773,
+ "grad_norm": 8.2207612991333,
+ "learning_rate": 1.9224505228764916e-05,
+ "loss": 1.0713,
+ "step": 5593
+ },
+ {
+ "epoch": 15.2425068119891,
+ "grad_norm": 9.45234203338623,
+ "learning_rate": 1.9224164448155188e-05,
+ "loss": 0.9524,
+ "step": 5594
+ },
+ {
+ "epoch": 15.245231607629428,
+ "grad_norm": 12.078112602233887,
+ "learning_rate": 1.9223823595707965e-05,
+ "loss": 1.0212,
+ "step": 5595
+ },
+ {
+ "epoch": 15.247956403269754,
+ "grad_norm": 9.097121238708496,
+ "learning_rate": 1.9223482671425904e-05,
+ "loss": 0.9946,
+ "step": 5596
+ },
+ {
+ "epoch": 15.250681198910081,
+ "grad_norm": 10.710465431213379,
+ "learning_rate": 1.9223141675311655e-05,
+ "loss": 0.8982,
+ "step": 5597
+ },
+ {
+ "epoch": 15.253405994550409,
+ "grad_norm": 8.28371524810791,
+ "learning_rate": 1.9222800607367877e-05,
+ "loss": 1.0732,
+ "step": 5598
+ },
+ {
+ "epoch": 15.256130790190735,
+ "grad_norm": 9.326583862304688,
+ "learning_rate": 1.9222459467597222e-05,
+ "loss": 1.0354,
+ "step": 5599
+ },
+ {
+ "epoch": 15.258855585831062,
+ "grad_norm": 11.349653244018555,
+ "learning_rate": 1.9222118256002348e-05,
+ "loss": 1.0374,
+ "step": 5600
+ },
+ {
+ "epoch": 15.26158038147139,
+ "grad_norm": 23.970081329345703,
+ "learning_rate": 1.9221776972585917e-05,
+ "loss": 1.1165,
+ "step": 5601
+ },
+ {
+ "epoch": 15.264305177111716,
+ "grad_norm": 9.690476417541504,
+ "learning_rate": 1.9221435617350583e-05,
+ "loss": 0.9819,
+ "step": 5602
+ },
+ {
+ "epoch": 15.267029972752043,
+ "grad_norm": 9.96845531463623,
+ "learning_rate": 1.9221094190299004e-05,
+ "loss": 1.0791,
+ "step": 5603
+ },
+ {
+ "epoch": 15.269754768392371,
+ "grad_norm": 8.391413688659668,
+ "learning_rate": 1.922075269143384e-05,
+ "loss": 0.7684,
+ "step": 5604
+ },
+ {
+ "epoch": 15.272479564032697,
+ "grad_norm": 11.63350772857666,
+ "learning_rate": 1.9220411120757753e-05,
+ "loss": 0.844,
+ "step": 5605
+ },
+ {
+ "epoch": 15.275204359673024,
+ "grad_norm": 10.096068382263184,
+ "learning_rate": 1.92200694782734e-05,
+ "loss": 1.0132,
+ "step": 5606
+ },
+ {
+ "epoch": 15.277929155313352,
+ "grad_norm": 15.669937133789062,
+ "learning_rate": 1.9219727763983443e-05,
+ "loss": 0.9551,
+ "step": 5607
+ },
+ {
+ "epoch": 15.280653950953678,
+ "grad_norm": 11.468816757202148,
+ "learning_rate": 1.9219385977890542e-05,
+ "loss": 0.9557,
+ "step": 5608
+ },
+ {
+ "epoch": 15.283378746594005,
+ "grad_norm": 13.702680587768555,
+ "learning_rate": 1.9219044119997362e-05,
+ "loss": 1.2427,
+ "step": 5609
+ },
+ {
+ "epoch": 15.286103542234333,
+ "grad_norm": 9.633628845214844,
+ "learning_rate": 1.9218702190306563e-05,
+ "loss": 0.9138,
+ "step": 5610
+ },
+ {
+ "epoch": 15.288828337874659,
+ "grad_norm": 9.522684097290039,
+ "learning_rate": 1.9218360188820804e-05,
+ "loss": 1.0321,
+ "step": 5611
+ },
+ {
+ "epoch": 15.291553133514986,
+ "grad_norm": 10.326404571533203,
+ "learning_rate": 1.9218018115542755e-05,
+ "loss": 1.0386,
+ "step": 5612
+ },
+ {
+ "epoch": 15.294277929155314,
+ "grad_norm": 10.368290901184082,
+ "learning_rate": 1.9217675970475076e-05,
+ "loss": 1.1053,
+ "step": 5613
+ },
+ {
+ "epoch": 15.29700272479564,
+ "grad_norm": 9.028491973876953,
+ "learning_rate": 1.9217333753620436e-05,
+ "loss": 1.0016,
+ "step": 5614
+ },
+ {
+ "epoch": 15.299727520435967,
+ "grad_norm": 11.764110565185547,
+ "learning_rate": 1.9216991464981496e-05,
+ "loss": 1.1145,
+ "step": 5615
+ },
+ {
+ "epoch": 15.302452316076295,
+ "grad_norm": 12.641221046447754,
+ "learning_rate": 1.9216649104560924e-05,
+ "loss": 1.2463,
+ "step": 5616
+ },
+ {
+ "epoch": 15.30517711171662,
+ "grad_norm": 22.181150436401367,
+ "learning_rate": 1.9216306672361385e-05,
+ "loss": 0.9446,
+ "step": 5617
+ },
+ {
+ "epoch": 15.307901907356948,
+ "grad_norm": 8.716134071350098,
+ "learning_rate": 1.9215964168385547e-05,
+ "loss": 1.0924,
+ "step": 5618
+ },
+ {
+ "epoch": 15.310626702997276,
+ "grad_norm": 7.8823113441467285,
+ "learning_rate": 1.9215621592636075e-05,
+ "loss": 1.0894,
+ "step": 5619
+ },
+ {
+ "epoch": 15.313351498637601,
+ "grad_norm": 8.83913516998291,
+ "learning_rate": 1.9215278945115638e-05,
+ "loss": 1.0728,
+ "step": 5620
+ },
+ {
+ "epoch": 15.316076294277929,
+ "grad_norm": 9.809870719909668,
+ "learning_rate": 1.9214936225826905e-05,
+ "loss": 0.9838,
+ "step": 5621
+ },
+ {
+ "epoch": 15.318801089918257,
+ "grad_norm": 8.821391105651855,
+ "learning_rate": 1.9214593434772547e-05,
+ "loss": 0.9503,
+ "step": 5622
+ },
+ {
+ "epoch": 15.321525885558582,
+ "grad_norm": 11.356760025024414,
+ "learning_rate": 1.9214250571955233e-05,
+ "loss": 1.1288,
+ "step": 5623
+ },
+ {
+ "epoch": 15.32425068119891,
+ "grad_norm": 15.601412773132324,
+ "learning_rate": 1.921390763737763e-05,
+ "loss": 0.8372,
+ "step": 5624
+ },
+ {
+ "epoch": 15.326975476839237,
+ "grad_norm": 10.478775024414062,
+ "learning_rate": 1.9213564631042412e-05,
+ "loss": 1.1282,
+ "step": 5625
+ },
+ {
+ "epoch": 15.329700272479563,
+ "grad_norm": 9.698952674865723,
+ "learning_rate": 1.9213221552952248e-05,
+ "loss": 1.0259,
+ "step": 5626
+ },
+ {
+ "epoch": 15.33242506811989,
+ "grad_norm": 8.53939151763916,
+ "learning_rate": 1.921287840310981e-05,
+ "loss": 0.9272,
+ "step": 5627
+ },
+ {
+ "epoch": 15.335149863760218,
+ "grad_norm": 10.980330467224121,
+ "learning_rate": 1.9212535181517773e-05,
+ "loss": 0.9717,
+ "step": 5628
+ },
+ {
+ "epoch": 15.337874659400544,
+ "grad_norm": 18.005285263061523,
+ "learning_rate": 1.9212191888178807e-05,
+ "loss": 1.0106,
+ "step": 5629
+ },
+ {
+ "epoch": 15.340599455040872,
+ "grad_norm": 9.591465950012207,
+ "learning_rate": 1.9211848523095594e-05,
+ "loss": 1.0352,
+ "step": 5630
+ },
+ {
+ "epoch": 15.3433242506812,
+ "grad_norm": 8.144366264343262,
+ "learning_rate": 1.9211505086270795e-05,
+ "loss": 0.9304,
+ "step": 5631
+ },
+ {
+ "epoch": 15.346049046321525,
+ "grad_norm": 13.091651916503906,
+ "learning_rate": 1.9211161577707092e-05,
+ "loss": 1.0085,
+ "step": 5632
+ },
+ {
+ "epoch": 15.348773841961853,
+ "grad_norm": 10.374743461608887,
+ "learning_rate": 1.9210817997407156e-05,
+ "loss": 0.9946,
+ "step": 5633
+ },
+ {
+ "epoch": 15.35149863760218,
+ "grad_norm": 9.456803321838379,
+ "learning_rate": 1.921047434537367e-05,
+ "loss": 1.0366,
+ "step": 5634
+ },
+ {
+ "epoch": 15.354223433242506,
+ "grad_norm": 13.099303245544434,
+ "learning_rate": 1.9210130621609307e-05,
+ "loss": 0.9717,
+ "step": 5635
+ },
+ {
+ "epoch": 15.356948228882834,
+ "grad_norm": 48.675018310546875,
+ "learning_rate": 1.9209786826116738e-05,
+ "loss": 1.0432,
+ "step": 5636
+ },
+ {
+ "epoch": 15.359673024523161,
+ "grad_norm": 13.054349899291992,
+ "learning_rate": 1.920944295889865e-05,
+ "loss": 0.96,
+ "step": 5637
+ },
+ {
+ "epoch": 15.362397820163487,
+ "grad_norm": 10.781517028808594,
+ "learning_rate": 1.9209099019957715e-05,
+ "loss": 1.1687,
+ "step": 5638
+ },
+ {
+ "epoch": 15.365122615803815,
+ "grad_norm": 17.755901336669922,
+ "learning_rate": 1.9208755009296615e-05,
+ "loss": 0.9841,
+ "step": 5639
+ },
+ {
+ "epoch": 15.367847411444142,
+ "grad_norm": 18.320762634277344,
+ "learning_rate": 1.9208410926918025e-05,
+ "loss": 0.9952,
+ "step": 5640
+ },
+ {
+ "epoch": 15.370572207084468,
+ "grad_norm": 9.680475234985352,
+ "learning_rate": 1.9208066772824628e-05,
+ "loss": 0.8379,
+ "step": 5641
+ },
+ {
+ "epoch": 15.373297002724795,
+ "grad_norm": 12.532292366027832,
+ "learning_rate": 1.9207722547019104e-05,
+ "loss": 1.1055,
+ "step": 5642
+ },
+ {
+ "epoch": 15.376021798365123,
+ "grad_norm": 9.265933990478516,
+ "learning_rate": 1.9207378249504134e-05,
+ "loss": 0.9614,
+ "step": 5643
+ },
+ {
+ "epoch": 15.378746594005449,
+ "grad_norm": 21.329524993896484,
+ "learning_rate": 1.9207033880282397e-05,
+ "loss": 0.9939,
+ "step": 5644
+ },
+ {
+ "epoch": 15.381471389645776,
+ "grad_norm": 33.45063400268555,
+ "learning_rate": 1.9206689439356576e-05,
+ "loss": 1.0686,
+ "step": 5645
+ },
+ {
+ "epoch": 15.384196185286104,
+ "grad_norm": 27.425533294677734,
+ "learning_rate": 1.9206344926729355e-05,
+ "loss": 1.006,
+ "step": 5646
+ },
+ {
+ "epoch": 15.38692098092643,
+ "grad_norm": 10.662958145141602,
+ "learning_rate": 1.9206000342403415e-05,
+ "loss": 1.0957,
+ "step": 5647
+ },
+ {
+ "epoch": 15.389645776566757,
+ "grad_norm": 11.13443374633789,
+ "learning_rate": 1.920565568638144e-05,
+ "loss": 1.188,
+ "step": 5648
+ },
+ {
+ "epoch": 15.392370572207085,
+ "grad_norm": 11.14825439453125,
+ "learning_rate": 1.9205310958666118e-05,
+ "loss": 1.075,
+ "step": 5649
+ },
+ {
+ "epoch": 15.39509536784741,
+ "grad_norm": 14.481292724609375,
+ "learning_rate": 1.9204966159260128e-05,
+ "loss": 1.1101,
+ "step": 5650
+ },
+ {
+ "epoch": 15.397820163487738,
+ "grad_norm": 11.095571517944336,
+ "learning_rate": 1.9204621288166158e-05,
+ "loss": 0.9299,
+ "step": 5651
+ },
+ {
+ "epoch": 15.400544959128066,
+ "grad_norm": 11.267986297607422,
+ "learning_rate": 1.9204276345386893e-05,
+ "loss": 1.0908,
+ "step": 5652
+ },
+ {
+ "epoch": 15.403269754768392,
+ "grad_norm": 9.950570106506348,
+ "learning_rate": 1.9203931330925024e-05,
+ "loss": 1.1143,
+ "step": 5653
+ },
+ {
+ "epoch": 15.40599455040872,
+ "grad_norm": 13.616087913513184,
+ "learning_rate": 1.920358624478323e-05,
+ "loss": 1.1476,
+ "step": 5654
+ },
+ {
+ "epoch": 15.408719346049047,
+ "grad_norm": 9.59421443939209,
+ "learning_rate": 1.9203241086964203e-05,
+ "loss": 0.9622,
+ "step": 5655
+ },
+ {
+ "epoch": 15.411444141689373,
+ "grad_norm": 11.054874420166016,
+ "learning_rate": 1.920289585747063e-05,
+ "loss": 1.1445,
+ "step": 5656
+ },
+ {
+ "epoch": 15.4141689373297,
+ "grad_norm": 13.57754135131836,
+ "learning_rate": 1.9202550556305203e-05,
+ "loss": 0.9258,
+ "step": 5657
+ },
+ {
+ "epoch": 15.416893732970028,
+ "grad_norm": 17.204612731933594,
+ "learning_rate": 1.9202205183470607e-05,
+ "loss": 1.0242,
+ "step": 5658
+ },
+ {
+ "epoch": 15.419618528610354,
+ "grad_norm": 13.986005783081055,
+ "learning_rate": 1.9201859738969532e-05,
+ "loss": 1.0354,
+ "step": 5659
+ },
+ {
+ "epoch": 15.422343324250681,
+ "grad_norm": 16.004863739013672,
+ "learning_rate": 1.9201514222804672e-05,
+ "loss": 1.0708,
+ "step": 5660
+ },
+ {
+ "epoch": 15.425068119891009,
+ "grad_norm": 26.976064682006836,
+ "learning_rate": 1.9201168634978714e-05,
+ "loss": 1.1501,
+ "step": 5661
+ },
+ {
+ "epoch": 15.427792915531334,
+ "grad_norm": 11.839661598205566,
+ "learning_rate": 1.920082297549435e-05,
+ "loss": 1.0608,
+ "step": 5662
+ },
+ {
+ "epoch": 15.430517711171662,
+ "grad_norm": 10.757123947143555,
+ "learning_rate": 1.9200477244354274e-05,
+ "loss": 1.2283,
+ "step": 5663
+ },
+ {
+ "epoch": 15.43324250681199,
+ "grad_norm": 18.2895565032959,
+ "learning_rate": 1.920013144156118e-05,
+ "loss": 1.0442,
+ "step": 5664
+ },
+ {
+ "epoch": 15.435967302452315,
+ "grad_norm": 31.786094665527344,
+ "learning_rate": 1.9199785567117755e-05,
+ "loss": 1.1907,
+ "step": 5665
+ },
+ {
+ "epoch": 15.438692098092643,
+ "grad_norm": 72.43460083007812,
+ "learning_rate": 1.9199439621026696e-05,
+ "loss": 1.0413,
+ "step": 5666
+ },
+ {
+ "epoch": 15.44141689373297,
+ "grad_norm": 71.09246826171875,
+ "learning_rate": 1.9199093603290697e-05,
+ "loss": 1.1392,
+ "step": 5667
+ },
+ {
+ "epoch": 15.444141689373296,
+ "grad_norm": 10.77194595336914,
+ "learning_rate": 1.9198747513912455e-05,
+ "loss": 0.9873,
+ "step": 5668
+ },
+ {
+ "epoch": 15.446866485013624,
+ "grad_norm": 10.256016731262207,
+ "learning_rate": 1.9198401352894663e-05,
+ "loss": 0.88,
+ "step": 5669
+ },
+ {
+ "epoch": 15.449591280653951,
+ "grad_norm": 41.68864059448242,
+ "learning_rate": 1.9198055120240012e-05,
+ "loss": 1.0861,
+ "step": 5670
+ },
+ {
+ "epoch": 15.452316076294277,
+ "grad_norm": 13.512534141540527,
+ "learning_rate": 1.919770881595121e-05,
+ "loss": 0.9462,
+ "step": 5671
+ },
+ {
+ "epoch": 15.455040871934605,
+ "grad_norm": 11.331838607788086,
+ "learning_rate": 1.9197362440030946e-05,
+ "loss": 0.9468,
+ "step": 5672
+ },
+ {
+ "epoch": 15.457765667574932,
+ "grad_norm": 13.011062622070312,
+ "learning_rate": 1.9197015992481918e-05,
+ "loss": 1.0844,
+ "step": 5673
+ },
+ {
+ "epoch": 15.460490463215258,
+ "grad_norm": 24.373592376708984,
+ "learning_rate": 1.919666947330683e-05,
+ "loss": 0.9351,
+ "step": 5674
+ },
+ {
+ "epoch": 15.463215258855586,
+ "grad_norm": 17.608154296875,
+ "learning_rate": 1.9196322882508372e-05,
+ "loss": 0.9045,
+ "step": 5675
+ },
+ {
+ "epoch": 15.465940054495913,
+ "grad_norm": 13.437183380126953,
+ "learning_rate": 1.919597622008925e-05,
+ "loss": 1.1609,
+ "step": 5676
+ },
+ {
+ "epoch": 15.46866485013624,
+ "grad_norm": 13.064347267150879,
+ "learning_rate": 1.919562948605216e-05,
+ "loss": 1.0714,
+ "step": 5677
+ },
+ {
+ "epoch": 15.471389645776567,
+ "grad_norm": 27.0733642578125,
+ "learning_rate": 1.9195282680399804e-05,
+ "loss": 1.1477,
+ "step": 5678
+ },
+ {
+ "epoch": 15.474114441416894,
+ "grad_norm": 15.739130020141602,
+ "learning_rate": 1.919493580313488e-05,
+ "loss": 1.0966,
+ "step": 5679
+ },
+ {
+ "epoch": 15.47683923705722,
+ "grad_norm": 14.389317512512207,
+ "learning_rate": 1.919458885426009e-05,
+ "loss": 0.9873,
+ "step": 5680
+ },
+ {
+ "epoch": 15.479564032697548,
+ "grad_norm": 10.674415588378906,
+ "learning_rate": 1.9194241833778148e-05,
+ "loss": 1.1765,
+ "step": 5681
+ },
+ {
+ "epoch": 15.482288828337875,
+ "grad_norm": 33.03879928588867,
+ "learning_rate": 1.9193894741691735e-05,
+ "loss": 1.0614,
+ "step": 5682
+ },
+ {
+ "epoch": 15.485013623978201,
+ "grad_norm": 8.198208808898926,
+ "learning_rate": 1.9193547578003574e-05,
+ "loss": 1.0408,
+ "step": 5683
+ },
+ {
+ "epoch": 15.487738419618529,
+ "grad_norm": 10.565143585205078,
+ "learning_rate": 1.9193200342716355e-05,
+ "loss": 0.9724,
+ "step": 5684
+ },
+ {
+ "epoch": 15.490463215258856,
+ "grad_norm": 15.008692741394043,
+ "learning_rate": 1.919285303583279e-05,
+ "loss": 1.1655,
+ "step": 5685
+ },
+ {
+ "epoch": 15.493188010899182,
+ "grad_norm": 10.448790550231934,
+ "learning_rate": 1.919250565735558e-05,
+ "loss": 0.9971,
+ "step": 5686
+ },
+ {
+ "epoch": 15.49591280653951,
+ "grad_norm": 13.054065704345703,
+ "learning_rate": 1.9192158207287435e-05,
+ "loss": 1.0354,
+ "step": 5687
+ },
+ {
+ "epoch": 15.498637602179837,
+ "grad_norm": 12.612138748168945,
+ "learning_rate": 1.9191810685631055e-05,
+ "loss": 1.1664,
+ "step": 5688
+ },
+ {
+ "epoch": 15.501362397820163,
+ "grad_norm": 13.168205261230469,
+ "learning_rate": 1.919146309238915e-05,
+ "loss": 1.0864,
+ "step": 5689
+ },
+ {
+ "epoch": 15.50408719346049,
+ "grad_norm": 13.737235069274902,
+ "learning_rate": 1.9191115427564425e-05,
+ "loss": 1.0398,
+ "step": 5690
+ },
+ {
+ "epoch": 15.506811989100818,
+ "grad_norm": 10.856537818908691,
+ "learning_rate": 1.9190767691159592e-05,
+ "loss": 1.0736,
+ "step": 5691
+ },
+ {
+ "epoch": 15.509536784741144,
+ "grad_norm": 18.237037658691406,
+ "learning_rate": 1.9190419883177355e-05,
+ "loss": 0.9568,
+ "step": 5692
+ },
+ {
+ "epoch": 15.512261580381471,
+ "grad_norm": 9.727873802185059,
+ "learning_rate": 1.919007200362042e-05,
+ "loss": 1.1021,
+ "step": 5693
+ },
+ {
+ "epoch": 15.514986376021799,
+ "grad_norm": 9.597294807434082,
+ "learning_rate": 1.9189724052491502e-05,
+ "loss": 1.1595,
+ "step": 5694
+ },
+ {
+ "epoch": 15.517711171662125,
+ "grad_norm": 18.482219696044922,
+ "learning_rate": 1.918937602979331e-05,
+ "loss": 1.1152,
+ "step": 5695
+ },
+ {
+ "epoch": 15.520435967302452,
+ "grad_norm": 9.99679183959961,
+ "learning_rate": 1.9189027935528553e-05,
+ "loss": 0.9644,
+ "step": 5696
+ },
+ {
+ "epoch": 15.52316076294278,
+ "grad_norm": 9.244872093200684,
+ "learning_rate": 1.9188679769699944e-05,
+ "loss": 0.998,
+ "step": 5697
+ },
+ {
+ "epoch": 15.525885558583106,
+ "grad_norm": 24.489723205566406,
+ "learning_rate": 1.918833153231019e-05,
+ "loss": 0.972,
+ "step": 5698
+ },
+ {
+ "epoch": 15.528610354223433,
+ "grad_norm": 10.590883255004883,
+ "learning_rate": 1.9187983223362006e-05,
+ "loss": 1.0823,
+ "step": 5699
+ },
+ {
+ "epoch": 15.53133514986376,
+ "grad_norm": 10.565340995788574,
+ "learning_rate": 1.9187634842858104e-05,
+ "loss": 0.9884,
+ "step": 5700
+ },
+ {
+ "epoch": 15.534059945504087,
+ "grad_norm": 10.080450057983398,
+ "learning_rate": 1.91872863908012e-05,
+ "loss": 0.9827,
+ "step": 5701
+ },
+ {
+ "epoch": 15.536784741144414,
+ "grad_norm": 11.24704647064209,
+ "learning_rate": 1.9186937867194e-05,
+ "loss": 1.0967,
+ "step": 5702
+ },
+ {
+ "epoch": 15.539509536784742,
+ "grad_norm": 11.711875915527344,
+ "learning_rate": 1.9186589272039227e-05,
+ "loss": 1.1519,
+ "step": 5703
+ },
+ {
+ "epoch": 15.542234332425068,
+ "grad_norm": 10.722929954528809,
+ "learning_rate": 1.9186240605339596e-05,
+ "loss": 1.1758,
+ "step": 5704
+ },
+ {
+ "epoch": 15.544959128065395,
+ "grad_norm": 9.224250793457031,
+ "learning_rate": 1.9185891867097813e-05,
+ "loss": 0.9614,
+ "step": 5705
+ },
+ {
+ "epoch": 15.547683923705723,
+ "grad_norm": 14.218178749084473,
+ "learning_rate": 1.9185543057316604e-05,
+ "loss": 1.014,
+ "step": 5706
+ },
+ {
+ "epoch": 15.550408719346049,
+ "grad_norm": 9.43051815032959,
+ "learning_rate": 1.9185194175998682e-05,
+ "loss": 1.0627,
+ "step": 5707
+ },
+ {
+ "epoch": 15.553133514986376,
+ "grad_norm": 9.282830238342285,
+ "learning_rate": 1.9184845223146757e-05,
+ "loss": 1.162,
+ "step": 5708
+ },
+ {
+ "epoch": 15.555858310626704,
+ "grad_norm": 9.06210708618164,
+ "learning_rate": 1.9184496198763557e-05,
+ "loss": 1.0413,
+ "step": 5709
+ },
+ {
+ "epoch": 15.55858310626703,
+ "grad_norm": 10.454787254333496,
+ "learning_rate": 1.9184147102851796e-05,
+ "loss": 1.0507,
+ "step": 5710
+ },
+ {
+ "epoch": 15.561307901907357,
+ "grad_norm": 9.729334831237793,
+ "learning_rate": 1.9183797935414194e-05,
+ "loss": 0.9071,
+ "step": 5711
+ },
+ {
+ "epoch": 15.564032697547685,
+ "grad_norm": 11.212459564208984,
+ "learning_rate": 1.918344869645347e-05,
+ "loss": 0.8904,
+ "step": 5712
+ },
+ {
+ "epoch": 15.56675749318801,
+ "grad_norm": 9.800729751586914,
+ "learning_rate": 1.918309938597234e-05,
+ "loss": 1.1301,
+ "step": 5713
+ },
+ {
+ "epoch": 15.569482288828338,
+ "grad_norm": 11.547163009643555,
+ "learning_rate": 1.918275000397353e-05,
+ "loss": 1.1277,
+ "step": 5714
+ },
+ {
+ "epoch": 15.572207084468666,
+ "grad_norm": 11.262359619140625,
+ "learning_rate": 1.9182400550459758e-05,
+ "loss": 1.1111,
+ "step": 5715
+ },
+ {
+ "epoch": 15.574931880108991,
+ "grad_norm": 9.875480651855469,
+ "learning_rate": 1.9182051025433743e-05,
+ "loss": 1.0226,
+ "step": 5716
+ },
+ {
+ "epoch": 15.577656675749319,
+ "grad_norm": 10.523189544677734,
+ "learning_rate": 1.9181701428898215e-05,
+ "loss": 1.1477,
+ "step": 5717
+ },
+ {
+ "epoch": 15.580381471389646,
+ "grad_norm": 11.124797821044922,
+ "learning_rate": 1.9181351760855888e-05,
+ "loss": 1.2227,
+ "step": 5718
+ },
+ {
+ "epoch": 15.583106267029972,
+ "grad_norm": 9.22188949584961,
+ "learning_rate": 1.918100202130949e-05,
+ "loss": 1.1023,
+ "step": 5719
+ },
+ {
+ "epoch": 15.5858310626703,
+ "grad_norm": 12.09113883972168,
+ "learning_rate": 1.9180652210261743e-05,
+ "loss": 0.9634,
+ "step": 5720
+ },
+ {
+ "epoch": 15.588555858310627,
+ "grad_norm": 10.632393836975098,
+ "learning_rate": 1.9180302327715376e-05,
+ "loss": 1.2341,
+ "step": 5721
+ },
+ {
+ "epoch": 15.591280653950953,
+ "grad_norm": 60.9536247253418,
+ "learning_rate": 1.9179952373673106e-05,
+ "loss": 1.1792,
+ "step": 5722
+ },
+ {
+ "epoch": 15.59400544959128,
+ "grad_norm": 10.613637924194336,
+ "learning_rate": 1.9179602348137664e-05,
+ "loss": 1.0394,
+ "step": 5723
+ },
+ {
+ "epoch": 15.596730245231608,
+ "grad_norm": 11.657779693603516,
+ "learning_rate": 1.9179252251111774e-05,
+ "loss": 1.0682,
+ "step": 5724
+ },
+ {
+ "epoch": 15.599455040871934,
+ "grad_norm": 15.660120010375977,
+ "learning_rate": 1.917890208259816e-05,
+ "loss": 1.1211,
+ "step": 5725
+ },
+ {
+ "epoch": 15.602179836512262,
+ "grad_norm": 13.824321746826172,
+ "learning_rate": 1.917855184259956e-05,
+ "loss": 1.0676,
+ "step": 5726
+ },
+ {
+ "epoch": 15.60490463215259,
+ "grad_norm": 9.168793678283691,
+ "learning_rate": 1.9178201531118686e-05,
+ "loss": 0.9479,
+ "step": 5727
+ },
+ {
+ "epoch": 15.607629427792915,
+ "grad_norm": 9.639008522033691,
+ "learning_rate": 1.9177851148158274e-05,
+ "loss": 1.0037,
+ "step": 5728
+ },
+ {
+ "epoch": 15.610354223433243,
+ "grad_norm": 8.819302558898926,
+ "learning_rate": 1.917750069372106e-05,
+ "loss": 1.0223,
+ "step": 5729
+ },
+ {
+ "epoch": 15.61307901907357,
+ "grad_norm": 10.01408863067627,
+ "learning_rate": 1.9177150167809756e-05,
+ "loss": 1.2766,
+ "step": 5730
+ },
+ {
+ "epoch": 15.615803814713896,
+ "grad_norm": 12.288567543029785,
+ "learning_rate": 1.9176799570427108e-05,
+ "loss": 1.063,
+ "step": 5731
+ },
+ {
+ "epoch": 15.618528610354224,
+ "grad_norm": 9.187858581542969,
+ "learning_rate": 1.9176448901575838e-05,
+ "loss": 0.9091,
+ "step": 5732
+ },
+ {
+ "epoch": 15.621253405994551,
+ "grad_norm": 8.205780982971191,
+ "learning_rate": 1.9176098161258684e-05,
+ "loss": 0.8153,
+ "step": 5733
+ },
+ {
+ "epoch": 15.623978201634877,
+ "grad_norm": 9.210580825805664,
+ "learning_rate": 1.9175747349478366e-05,
+ "loss": 0.9578,
+ "step": 5734
+ },
+ {
+ "epoch": 15.626702997275205,
+ "grad_norm": 11.467032432556152,
+ "learning_rate": 1.917539646623763e-05,
+ "loss": 0.9211,
+ "step": 5735
+ },
+ {
+ "epoch": 15.629427792915532,
+ "grad_norm": 13.662873268127441,
+ "learning_rate": 1.9175045511539197e-05,
+ "loss": 0.8729,
+ "step": 5736
+ },
+ {
+ "epoch": 15.632152588555858,
+ "grad_norm": 8.510534286499023,
+ "learning_rate": 1.9174694485385805e-05,
+ "loss": 1.0953,
+ "step": 5737
+ },
+ {
+ "epoch": 15.634877384196185,
+ "grad_norm": 8.807907104492188,
+ "learning_rate": 1.917434338778019e-05,
+ "loss": 1.0469,
+ "step": 5738
+ },
+ {
+ "epoch": 15.637602179836513,
+ "grad_norm": 18.483234405517578,
+ "learning_rate": 1.917399221872508e-05,
+ "loss": 0.9,
+ "step": 5739
+ },
+ {
+ "epoch": 15.640326975476839,
+ "grad_norm": 7.845697402954102,
+ "learning_rate": 1.9173640978223214e-05,
+ "loss": 1.042,
+ "step": 5740
+ },
+ {
+ "epoch": 15.643051771117166,
+ "grad_norm": 14.4625883102417,
+ "learning_rate": 1.917328966627733e-05,
+ "loss": 1.0551,
+ "step": 5741
+ },
+ {
+ "epoch": 15.645776566757494,
+ "grad_norm": 9.872694969177246,
+ "learning_rate": 1.9172938282890164e-05,
+ "loss": 1.0273,
+ "step": 5742
+ },
+ {
+ "epoch": 15.64850136239782,
+ "grad_norm": 10.579270362854004,
+ "learning_rate": 1.9172586828064446e-05,
+ "loss": 1.0469,
+ "step": 5743
+ },
+ {
+ "epoch": 15.651226158038147,
+ "grad_norm": 8.047989845275879,
+ "learning_rate": 1.9172235301802916e-05,
+ "loss": 0.9785,
+ "step": 5744
+ },
+ {
+ "epoch": 15.653950953678475,
+ "grad_norm": 12.386167526245117,
+ "learning_rate": 1.9171883704108316e-05,
+ "loss": 1.1707,
+ "step": 5745
+ },
+ {
+ "epoch": 15.6566757493188,
+ "grad_norm": 7.95110559463501,
+ "learning_rate": 1.9171532034983377e-05,
+ "loss": 0.9547,
+ "step": 5746
+ },
+ {
+ "epoch": 15.659400544959128,
+ "grad_norm": 8.568359375,
+ "learning_rate": 1.9171180294430847e-05,
+ "loss": 1.0623,
+ "step": 5747
+ },
+ {
+ "epoch": 15.662125340599456,
+ "grad_norm": 9.228265762329102,
+ "learning_rate": 1.9170828482453456e-05,
+ "loss": 1.03,
+ "step": 5748
+ },
+ {
+ "epoch": 15.664850136239782,
+ "grad_norm": 14.048735618591309,
+ "learning_rate": 1.9170476599053952e-05,
+ "loss": 1.1896,
+ "step": 5749
+ },
+ {
+ "epoch": 15.66757493188011,
+ "grad_norm": 16.577896118164062,
+ "learning_rate": 1.9170124644235066e-05,
+ "loss": 1.2175,
+ "step": 5750
+ },
+ {
+ "epoch": 15.670299727520437,
+ "grad_norm": 13.842279434204102,
+ "learning_rate": 1.9169772617999545e-05,
+ "loss": 1.1901,
+ "step": 5751
+ },
+ {
+ "epoch": 15.673024523160763,
+ "grad_norm": 10.956024169921875,
+ "learning_rate": 1.9169420520350135e-05,
+ "loss": 1.0266,
+ "step": 5752
+ },
+ {
+ "epoch": 15.67574931880109,
+ "grad_norm": 10.104551315307617,
+ "learning_rate": 1.916906835128957e-05,
+ "loss": 0.9318,
+ "step": 5753
+ },
+ {
+ "epoch": 15.678474114441418,
+ "grad_norm": 11.581619262695312,
+ "learning_rate": 1.9168716110820592e-05,
+ "loss": 1.0981,
+ "step": 5754
+ },
+ {
+ "epoch": 15.681198910081743,
+ "grad_norm": 34.04673385620117,
+ "learning_rate": 1.9168363798945955e-05,
+ "loss": 1.1523,
+ "step": 5755
+ },
+ {
+ "epoch": 15.683923705722071,
+ "grad_norm": 9.896060943603516,
+ "learning_rate": 1.9168011415668392e-05,
+ "loss": 0.8792,
+ "step": 5756
+ },
+ {
+ "epoch": 15.686648501362399,
+ "grad_norm": 11.737502098083496,
+ "learning_rate": 1.916765896099065e-05,
+ "loss": 1.1477,
+ "step": 5757
+ },
+ {
+ "epoch": 15.689373297002724,
+ "grad_norm": 8.23998737335205,
+ "learning_rate": 1.9167306434915475e-05,
+ "loss": 0.9487,
+ "step": 5758
+ },
+ {
+ "epoch": 15.692098092643052,
+ "grad_norm": 8.44018840789795,
+ "learning_rate": 1.9166953837445618e-05,
+ "loss": 1.004,
+ "step": 5759
+ },
+ {
+ "epoch": 15.69482288828338,
+ "grad_norm": 10.327585220336914,
+ "learning_rate": 1.9166601168583815e-05,
+ "loss": 1.2854,
+ "step": 5760
+ },
+ {
+ "epoch": 15.697547683923705,
+ "grad_norm": 11.30803394317627,
+ "learning_rate": 1.9166248428332816e-05,
+ "loss": 1.1277,
+ "step": 5761
+ },
+ {
+ "epoch": 15.700272479564033,
+ "grad_norm": 15.84594440460205,
+ "learning_rate": 1.9165895616695373e-05,
+ "loss": 0.996,
+ "step": 5762
+ },
+ {
+ "epoch": 15.70299727520436,
+ "grad_norm": 20.89583396911621,
+ "learning_rate": 1.9165542733674226e-05,
+ "loss": 1.0647,
+ "step": 5763
+ },
+ {
+ "epoch": 15.705722070844686,
+ "grad_norm": 9.654314041137695,
+ "learning_rate": 1.916518977927213e-05,
+ "loss": 1.0873,
+ "step": 5764
+ },
+ {
+ "epoch": 15.708446866485014,
+ "grad_norm": 8.791511535644531,
+ "learning_rate": 1.9164836753491834e-05,
+ "loss": 1.0981,
+ "step": 5765
+ },
+ {
+ "epoch": 15.711171662125341,
+ "grad_norm": 9.795890808105469,
+ "learning_rate": 1.916448365633608e-05,
+ "loss": 1.1212,
+ "step": 5766
+ },
+ {
+ "epoch": 15.713896457765667,
+ "grad_norm": 8.347766876220703,
+ "learning_rate": 1.9164130487807623e-05,
+ "loss": 0.9233,
+ "step": 5767
+ },
+ {
+ "epoch": 15.716621253405995,
+ "grad_norm": 9.630997657775879,
+ "learning_rate": 1.916377724790921e-05,
+ "loss": 1.2072,
+ "step": 5768
+ },
+ {
+ "epoch": 15.719346049046322,
+ "grad_norm": 8.77739143371582,
+ "learning_rate": 1.9163423936643598e-05,
+ "loss": 1.1823,
+ "step": 5769
+ },
+ {
+ "epoch": 15.722070844686648,
+ "grad_norm": 8.231311798095703,
+ "learning_rate": 1.9163070554013535e-05,
+ "loss": 0.9652,
+ "step": 5770
+ },
+ {
+ "epoch": 15.724795640326976,
+ "grad_norm": 10.8486328125,
+ "learning_rate": 1.9162717100021772e-05,
+ "loss": 1.074,
+ "step": 5771
+ },
+ {
+ "epoch": 15.727520435967303,
+ "grad_norm": 8.435831069946289,
+ "learning_rate": 1.9162363574671062e-05,
+ "loss": 0.9534,
+ "step": 5772
+ },
+ {
+ "epoch": 15.730245231607629,
+ "grad_norm": 8.546896934509277,
+ "learning_rate": 1.9162009977964165e-05,
+ "loss": 1.0242,
+ "step": 5773
+ },
+ {
+ "epoch": 15.732970027247957,
+ "grad_norm": 16.247638702392578,
+ "learning_rate": 1.9161656309903825e-05,
+ "loss": 1.0422,
+ "step": 5774
+ },
+ {
+ "epoch": 15.735694822888284,
+ "grad_norm": 13.46705150604248,
+ "learning_rate": 1.91613025704928e-05,
+ "loss": 1.0439,
+ "step": 5775
+ },
+ {
+ "epoch": 15.73841961852861,
+ "grad_norm": 12.30317497253418,
+ "learning_rate": 1.916094875973385e-05,
+ "loss": 1.1267,
+ "step": 5776
+ },
+ {
+ "epoch": 15.741144414168938,
+ "grad_norm": 9.070901870727539,
+ "learning_rate": 1.916059487762972e-05,
+ "loss": 1.0928,
+ "step": 5777
+ },
+ {
+ "epoch": 15.743869209809265,
+ "grad_norm": 8.931979179382324,
+ "learning_rate": 1.9160240924183174e-05,
+ "loss": 1.1189,
+ "step": 5778
+ },
+ {
+ "epoch": 15.746594005449591,
+ "grad_norm": 9.261917114257812,
+ "learning_rate": 1.9159886899396966e-05,
+ "loss": 1.0011,
+ "step": 5779
+ },
+ {
+ "epoch": 15.749318801089919,
+ "grad_norm": 14.735495567321777,
+ "learning_rate": 1.9159532803273856e-05,
+ "loss": 0.8273,
+ "step": 5780
+ },
+ {
+ "epoch": 15.752043596730246,
+ "grad_norm": 12.524917602539062,
+ "learning_rate": 1.91591786358166e-05,
+ "loss": 1.0941,
+ "step": 5781
+ },
+ {
+ "epoch": 15.754768392370572,
+ "grad_norm": 9.117819786071777,
+ "learning_rate": 1.9158824397027954e-05,
+ "loss": 1.0586,
+ "step": 5782
+ },
+ {
+ "epoch": 15.7574931880109,
+ "grad_norm": 253.52011108398438,
+ "learning_rate": 1.9158470086910677e-05,
+ "loss": 1.1418,
+ "step": 5783
+ },
+ {
+ "epoch": 15.760217983651227,
+ "grad_norm": 11.384540557861328,
+ "learning_rate": 1.9158115705467528e-05,
+ "loss": 0.9756,
+ "step": 5784
+ },
+ {
+ "epoch": 15.762942779291553,
+ "grad_norm": 13.110880851745605,
+ "learning_rate": 1.9157761252701273e-05,
+ "loss": 0.955,
+ "step": 5785
+ },
+ {
+ "epoch": 15.76566757493188,
+ "grad_norm": 10.360495567321777,
+ "learning_rate": 1.915740672861467e-05,
+ "loss": 1.2449,
+ "step": 5786
+ },
+ {
+ "epoch": 15.768392370572208,
+ "grad_norm": 11.14963436126709,
+ "learning_rate": 1.915705213321047e-05,
+ "loss": 1.0106,
+ "step": 5787
+ },
+ {
+ "epoch": 15.771117166212534,
+ "grad_norm": 11.102007865905762,
+ "learning_rate": 1.9156697466491447e-05,
+ "loss": 1.11,
+ "step": 5788
+ },
+ {
+ "epoch": 15.773841961852861,
+ "grad_norm": 11.817999839782715,
+ "learning_rate": 1.915634272846036e-05,
+ "loss": 1.0494,
+ "step": 5789
+ },
+ {
+ "epoch": 15.776566757493189,
+ "grad_norm": 13.184379577636719,
+ "learning_rate": 1.9155987919119973e-05,
+ "loss": 1.1912,
+ "step": 5790
+ },
+ {
+ "epoch": 15.779291553133515,
+ "grad_norm": 10.445209503173828,
+ "learning_rate": 1.915563303847304e-05,
+ "loss": 1.0676,
+ "step": 5791
+ },
+ {
+ "epoch": 15.782016348773842,
+ "grad_norm": 17.510478973388672,
+ "learning_rate": 1.9155278086522334e-05,
+ "loss": 1.0464,
+ "step": 5792
+ },
+ {
+ "epoch": 15.78474114441417,
+ "grad_norm": 12.840875625610352,
+ "learning_rate": 1.915492306327062e-05,
+ "loss": 1.2336,
+ "step": 5793
+ },
+ {
+ "epoch": 15.787465940054496,
+ "grad_norm": 13.593019485473633,
+ "learning_rate": 1.9154567968720656e-05,
+ "loss": 0.9667,
+ "step": 5794
+ },
+ {
+ "epoch": 15.790190735694823,
+ "grad_norm": 13.132856369018555,
+ "learning_rate": 1.9154212802875215e-05,
+ "loss": 1.0829,
+ "step": 5795
+ },
+ {
+ "epoch": 15.79291553133515,
+ "grad_norm": 19.62708282470703,
+ "learning_rate": 1.9153857565737058e-05,
+ "loss": 1.007,
+ "step": 5796
+ },
+ {
+ "epoch": 15.795640326975477,
+ "grad_norm": 12.598803520202637,
+ "learning_rate": 1.9153502257308952e-05,
+ "loss": 1.0894,
+ "step": 5797
+ },
+ {
+ "epoch": 15.798365122615804,
+ "grad_norm": 12.247570991516113,
+ "learning_rate": 1.9153146877593666e-05,
+ "loss": 1.2468,
+ "step": 5798
+ },
+ {
+ "epoch": 15.80108991825613,
+ "grad_norm": 11.259017944335938,
+ "learning_rate": 1.9152791426593964e-05,
+ "loss": 0.8749,
+ "step": 5799
+ },
+ {
+ "epoch": 15.803814713896458,
+ "grad_norm": 15.317924499511719,
+ "learning_rate": 1.9152435904312617e-05,
+ "loss": 1.0837,
+ "step": 5800
+ },
+ {
+ "epoch": 15.806539509536785,
+ "grad_norm": 10.472589492797852,
+ "learning_rate": 1.9152080310752398e-05,
+ "loss": 1.1927,
+ "step": 5801
+ },
+ {
+ "epoch": 15.809264305177111,
+ "grad_norm": 8.946378707885742,
+ "learning_rate": 1.9151724645916067e-05,
+ "loss": 0.9634,
+ "step": 5802
+ },
+ {
+ "epoch": 15.811989100817438,
+ "grad_norm": 9.994170188903809,
+ "learning_rate": 1.9151368909806403e-05,
+ "loss": 1.1936,
+ "step": 5803
+ },
+ {
+ "epoch": 15.814713896457766,
+ "grad_norm": 9.011474609375,
+ "learning_rate": 1.9151013102426174e-05,
+ "loss": 0.9994,
+ "step": 5804
+ },
+ {
+ "epoch": 15.817438692098092,
+ "grad_norm": 13.082215309143066,
+ "learning_rate": 1.9150657223778144e-05,
+ "loss": 1.1785,
+ "step": 5805
+ },
+ {
+ "epoch": 15.82016348773842,
+ "grad_norm": 13.153779983520508,
+ "learning_rate": 1.9150301273865093e-05,
+ "loss": 1.2297,
+ "step": 5806
+ },
+ {
+ "epoch": 15.822888283378747,
+ "grad_norm": 12.095719337463379,
+ "learning_rate": 1.914994525268979e-05,
+ "loss": 1.0507,
+ "step": 5807
+ },
+ {
+ "epoch": 15.825613079019073,
+ "grad_norm": 14.634735107421875,
+ "learning_rate": 1.914958916025501e-05,
+ "loss": 1.0647,
+ "step": 5808
+ },
+ {
+ "epoch": 15.8283378746594,
+ "grad_norm": 19.04387855529785,
+ "learning_rate": 1.914923299656352e-05,
+ "loss": 1.1753,
+ "step": 5809
+ },
+ {
+ "epoch": 15.831062670299728,
+ "grad_norm": 12.531530380249023,
+ "learning_rate": 1.91488767616181e-05,
+ "loss": 0.8816,
+ "step": 5810
+ },
+ {
+ "epoch": 15.833787465940054,
+ "grad_norm": 15.612229347229004,
+ "learning_rate": 1.914852045542152e-05,
+ "loss": 1.1462,
+ "step": 5811
+ },
+ {
+ "epoch": 15.836512261580381,
+ "grad_norm": 8.871306419372559,
+ "learning_rate": 1.914816407797656e-05,
+ "loss": 1.1921,
+ "step": 5812
+ },
+ {
+ "epoch": 15.839237057220709,
+ "grad_norm": 9.51230525970459,
+ "learning_rate": 1.9147807629285993e-05,
+ "loss": 0.8789,
+ "step": 5813
+ },
+ {
+ "epoch": 15.841961852861035,
+ "grad_norm": 8.646533012390137,
+ "learning_rate": 1.9147451109352592e-05,
+ "loss": 0.8663,
+ "step": 5814
+ },
+ {
+ "epoch": 15.844686648501362,
+ "grad_norm": 14.684822082519531,
+ "learning_rate": 1.9147094518179136e-05,
+ "loss": 1.115,
+ "step": 5815
+ },
+ {
+ "epoch": 15.84741144414169,
+ "grad_norm": 11.252645492553711,
+ "learning_rate": 1.9146737855768407e-05,
+ "loss": 1.1289,
+ "step": 5816
+ },
+ {
+ "epoch": 15.850136239782016,
+ "grad_norm": 16.818647384643555,
+ "learning_rate": 1.9146381122123176e-05,
+ "loss": 1.0566,
+ "step": 5817
+ },
+ {
+ "epoch": 15.852861035422343,
+ "grad_norm": 12.027950286865234,
+ "learning_rate": 1.9146024317246217e-05,
+ "loss": 1.1055,
+ "step": 5818
+ },
+ {
+ "epoch": 15.85558583106267,
+ "grad_norm": 10.26107120513916,
+ "learning_rate": 1.914566744114032e-05,
+ "loss": 0.9465,
+ "step": 5819
+ },
+ {
+ "epoch": 15.858310626702997,
+ "grad_norm": 9.16214370727539,
+ "learning_rate": 1.9145310493808264e-05,
+ "loss": 0.881,
+ "step": 5820
+ },
+ {
+ "epoch": 15.861035422343324,
+ "grad_norm": 18.3576602935791,
+ "learning_rate": 1.9144953475252818e-05,
+ "loss": 0.9797,
+ "step": 5821
+ },
+ {
+ "epoch": 15.863760217983652,
+ "grad_norm": 11.488898277282715,
+ "learning_rate": 1.914459638547677e-05,
+ "loss": 1.2394,
+ "step": 5822
+ },
+ {
+ "epoch": 15.866485013623977,
+ "grad_norm": 10.461718559265137,
+ "learning_rate": 1.91442392244829e-05,
+ "loss": 0.8883,
+ "step": 5823
+ },
+ {
+ "epoch": 15.869209809264305,
+ "grad_norm": 12.152205467224121,
+ "learning_rate": 1.9143881992273988e-05,
+ "loss": 1.011,
+ "step": 5824
+ },
+ {
+ "epoch": 15.871934604904633,
+ "grad_norm": 12.241488456726074,
+ "learning_rate": 1.914352468885282e-05,
+ "loss": 1.0708,
+ "step": 5825
+ },
+ {
+ "epoch": 15.874659400544958,
+ "grad_norm": 9.718058586120605,
+ "learning_rate": 1.9143167314222172e-05,
+ "loss": 1.0092,
+ "step": 5826
+ },
+ {
+ "epoch": 15.877384196185286,
+ "grad_norm": 14.82849407196045,
+ "learning_rate": 1.9142809868384836e-05,
+ "loss": 1.0952,
+ "step": 5827
+ },
+ {
+ "epoch": 15.880108991825614,
+ "grad_norm": 9.937234878540039,
+ "learning_rate": 1.9142452351343585e-05,
+ "loss": 1.1174,
+ "step": 5828
+ },
+ {
+ "epoch": 15.88283378746594,
+ "grad_norm": 8.828649520874023,
+ "learning_rate": 1.9142094763101216e-05,
+ "loss": 1.2395,
+ "step": 5829
+ },
+ {
+ "epoch": 15.885558583106267,
+ "grad_norm": 13.135193824768066,
+ "learning_rate": 1.9141737103660503e-05,
+ "loss": 1.1481,
+ "step": 5830
+ },
+ {
+ "epoch": 15.888283378746594,
+ "grad_norm": 9.514058113098145,
+ "learning_rate": 1.9141379373024235e-05,
+ "loss": 0.9443,
+ "step": 5831
+ },
+ {
+ "epoch": 15.89100817438692,
+ "grad_norm": 10.643321990966797,
+ "learning_rate": 1.9141021571195204e-05,
+ "loss": 1.0137,
+ "step": 5832
+ },
+ {
+ "epoch": 15.893732970027248,
+ "grad_norm": 11.337188720703125,
+ "learning_rate": 1.9140663698176183e-05,
+ "loss": 1.0775,
+ "step": 5833
+ },
+ {
+ "epoch": 15.896457765667575,
+ "grad_norm": 12.842183113098145,
+ "learning_rate": 1.9140305753969977e-05,
+ "loss": 1.0387,
+ "step": 5834
+ },
+ {
+ "epoch": 15.899182561307901,
+ "grad_norm": 9.45815658569336,
+ "learning_rate": 1.913994773857936e-05,
+ "loss": 1.291,
+ "step": 5835
+ },
+ {
+ "epoch": 15.901907356948229,
+ "grad_norm": 10.153657913208008,
+ "learning_rate": 1.913958965200712e-05,
+ "loss": 1.1455,
+ "step": 5836
+ },
+ {
+ "epoch": 15.904632152588556,
+ "grad_norm": 11.954771041870117,
+ "learning_rate": 1.9139231494256054e-05,
+ "loss": 1.2424,
+ "step": 5837
+ },
+ {
+ "epoch": 15.907356948228882,
+ "grad_norm": 9.33283519744873,
+ "learning_rate": 1.9138873265328944e-05,
+ "loss": 0.9509,
+ "step": 5838
+ },
+ {
+ "epoch": 15.91008174386921,
+ "grad_norm": 11.959882736206055,
+ "learning_rate": 1.9138514965228587e-05,
+ "loss": 1.1006,
+ "step": 5839
+ },
+ {
+ "epoch": 15.912806539509537,
+ "grad_norm": 10.285158157348633,
+ "learning_rate": 1.9138156593957767e-05,
+ "loss": 1.1519,
+ "step": 5840
+ },
+ {
+ "epoch": 15.915531335149863,
+ "grad_norm": 11.74209213256836,
+ "learning_rate": 1.913779815151928e-05,
+ "loss": 1.0012,
+ "step": 5841
+ },
+ {
+ "epoch": 15.91825613079019,
+ "grad_norm": 15.43689250946045,
+ "learning_rate": 1.9137439637915912e-05,
+ "loss": 0.9618,
+ "step": 5842
+ },
+ {
+ "epoch": 15.920980926430518,
+ "grad_norm": 34.82831954956055,
+ "learning_rate": 1.9137081053150465e-05,
+ "loss": 1.1279,
+ "step": 5843
+ },
+ {
+ "epoch": 15.923705722070844,
+ "grad_norm": 17.277294158935547,
+ "learning_rate": 1.913672239722572e-05,
+ "loss": 1.1492,
+ "step": 5844
+ },
+ {
+ "epoch": 15.926430517711172,
+ "grad_norm": 11.406451225280762,
+ "learning_rate": 1.9136363670144472e-05,
+ "loss": 1.1479,
+ "step": 5845
+ },
+ {
+ "epoch": 15.9291553133515,
+ "grad_norm": 8.550233840942383,
+ "learning_rate": 1.913600487190952e-05,
+ "loss": 0.9703,
+ "step": 5846
+ },
+ {
+ "epoch": 15.931880108991825,
+ "grad_norm": 7.3839616775512695,
+ "learning_rate": 1.913564600252366e-05,
+ "loss": 0.9032,
+ "step": 5847
+ },
+ {
+ "epoch": 15.934604904632153,
+ "grad_norm": 12.862568855285645,
+ "learning_rate": 1.9135287061989677e-05,
+ "loss": 1.1243,
+ "step": 5848
+ },
+ {
+ "epoch": 15.93732970027248,
+ "grad_norm": 8.45930290222168,
+ "learning_rate": 1.9134928050310374e-05,
+ "loss": 1.1049,
+ "step": 5849
+ },
+ {
+ "epoch": 15.940054495912806,
+ "grad_norm": 8.572096824645996,
+ "learning_rate": 1.9134568967488548e-05,
+ "loss": 0.9646,
+ "step": 5850
+ },
+ {
+ "epoch": 15.942779291553133,
+ "grad_norm": 11.794368743896484,
+ "learning_rate": 1.9134209813526992e-05,
+ "loss": 1.0782,
+ "step": 5851
+ },
+ {
+ "epoch": 15.945504087193461,
+ "grad_norm": 10.465714454650879,
+ "learning_rate": 1.9133850588428503e-05,
+ "loss": 1.1124,
+ "step": 5852
+ },
+ {
+ "epoch": 15.948228882833787,
+ "grad_norm": 10.074355125427246,
+ "learning_rate": 1.9133491292195878e-05,
+ "loss": 1.0828,
+ "step": 5853
+ },
+ {
+ "epoch": 15.950953678474114,
+ "grad_norm": 26.048002243041992,
+ "learning_rate": 1.9133131924831917e-05,
+ "loss": 1.0967,
+ "step": 5854
+ },
+ {
+ "epoch": 15.953678474114442,
+ "grad_norm": 15.029605865478516,
+ "learning_rate": 1.913277248633942e-05,
+ "loss": 0.9686,
+ "step": 5855
+ },
+ {
+ "epoch": 15.956403269754768,
+ "grad_norm": 9.323305130004883,
+ "learning_rate": 1.9132412976721185e-05,
+ "loss": 1.1111,
+ "step": 5856
+ },
+ {
+ "epoch": 15.959128065395095,
+ "grad_norm": 11.37041187286377,
+ "learning_rate": 1.9132053395980013e-05,
+ "loss": 1.1589,
+ "step": 5857
+ },
+ {
+ "epoch": 15.961852861035423,
+ "grad_norm": 10.822033882141113,
+ "learning_rate": 1.91316937441187e-05,
+ "loss": 0.9663,
+ "step": 5858
+ },
+ {
+ "epoch": 15.964577656675749,
+ "grad_norm": 18.556129455566406,
+ "learning_rate": 1.9131334021140052e-05,
+ "loss": 0.9749,
+ "step": 5859
+ },
+ {
+ "epoch": 15.967302452316076,
+ "grad_norm": 9.88136100769043,
+ "learning_rate": 1.913097422704687e-05,
+ "loss": 1.0925,
+ "step": 5860
+ },
+ {
+ "epoch": 15.970027247956404,
+ "grad_norm": 10.482797622680664,
+ "learning_rate": 1.913061436184195e-05,
+ "loss": 1.2273,
+ "step": 5861
+ },
+ {
+ "epoch": 15.97275204359673,
+ "grad_norm": 8.020975112915039,
+ "learning_rate": 1.9130254425528102e-05,
+ "loss": 0.9597,
+ "step": 5862
+ },
+ {
+ "epoch": 15.975476839237057,
+ "grad_norm": 9.891862869262695,
+ "learning_rate": 1.912989441810813e-05,
+ "loss": 0.9469,
+ "step": 5863
+ },
+ {
+ "epoch": 15.978201634877385,
+ "grad_norm": 12.917484283447266,
+ "learning_rate": 1.912953433958483e-05,
+ "loss": 1.0291,
+ "step": 5864
+ },
+ {
+ "epoch": 15.98092643051771,
+ "grad_norm": 7.872670650482178,
+ "learning_rate": 1.9129174189961008e-05,
+ "loss": 1.1296,
+ "step": 5865
+ },
+ {
+ "epoch": 15.983651226158038,
+ "grad_norm": 10.53221607208252,
+ "learning_rate": 1.9128813969239477e-05,
+ "loss": 1.0547,
+ "step": 5866
+ },
+ {
+ "epoch": 15.986376021798366,
+ "grad_norm": 11.600288391113281,
+ "learning_rate": 1.9128453677423032e-05,
+ "loss": 1.1653,
+ "step": 5867
+ },
+ {
+ "epoch": 15.989100817438691,
+ "grad_norm": 8.572115898132324,
+ "learning_rate": 1.9128093314514485e-05,
+ "loss": 1.001,
+ "step": 5868
+ },
+ {
+ "epoch": 15.991825613079019,
+ "grad_norm": 9.913413047790527,
+ "learning_rate": 1.912773288051664e-05,
+ "loss": 0.8827,
+ "step": 5869
+ },
+ {
+ "epoch": 15.994550408719347,
+ "grad_norm": 11.46878719329834,
+ "learning_rate": 1.912737237543231e-05,
+ "loss": 1.1794,
+ "step": 5870
+ },
+ {
+ "epoch": 15.997275204359672,
+ "grad_norm": 9.363706588745117,
+ "learning_rate": 1.9127011799264292e-05,
+ "loss": 0.9863,
+ "step": 5871
+ },
+ {
+ "epoch": 16.0,
+ "grad_norm": 9.271892547607422,
+ "learning_rate": 1.9126651152015404e-05,
+ "loss": 0.953,
+ "step": 5872
+ },
+ {
+ "epoch": 16.002724795640326,
+ "grad_norm": 15.289605140686035,
+ "learning_rate": 1.9126290433688448e-05,
+ "loss": 1.0168,
+ "step": 5873
+ },
+ {
+ "epoch": 16.005449591280655,
+ "grad_norm": 9.585624694824219,
+ "learning_rate": 1.9125929644286235e-05,
+ "loss": 1.0023,
+ "step": 5874
+ },
+ {
+ "epoch": 16.00817438692098,
+ "grad_norm": 8.111566543579102,
+ "learning_rate": 1.9125568783811578e-05,
+ "loss": 0.8453,
+ "step": 5875
+ },
+ {
+ "epoch": 16.010899182561307,
+ "grad_norm": 9.225383758544922,
+ "learning_rate": 1.9125207852267286e-05,
+ "loss": 0.9338,
+ "step": 5876
+ },
+ {
+ "epoch": 16.013623978201636,
+ "grad_norm": 53.07051467895508,
+ "learning_rate": 1.9124846849656164e-05,
+ "loss": 0.988,
+ "step": 5877
+ },
+ {
+ "epoch": 16.016348773841962,
+ "grad_norm": 24.62909507751465,
+ "learning_rate": 1.9124485775981034e-05,
+ "loss": 1.0154,
+ "step": 5878
+ },
+ {
+ "epoch": 16.019073569482288,
+ "grad_norm": 8.376246452331543,
+ "learning_rate": 1.9124124631244698e-05,
+ "loss": 0.9277,
+ "step": 5879
+ },
+ {
+ "epoch": 16.021798365122617,
+ "grad_norm": 8.503561973571777,
+ "learning_rate": 1.9123763415449972e-05,
+ "loss": 1.1198,
+ "step": 5880
+ },
+ {
+ "epoch": 16.024523160762943,
+ "grad_norm": 20.052303314208984,
+ "learning_rate": 1.9123402128599675e-05,
+ "loss": 0.8531,
+ "step": 5881
+ },
+ {
+ "epoch": 16.02724795640327,
+ "grad_norm": 11.620841979980469,
+ "learning_rate": 1.9123040770696616e-05,
+ "loss": 0.9486,
+ "step": 5882
+ },
+ {
+ "epoch": 16.029972752043598,
+ "grad_norm": 9.297019004821777,
+ "learning_rate": 1.9122679341743606e-05,
+ "loss": 0.913,
+ "step": 5883
+ },
+ {
+ "epoch": 16.032697547683924,
+ "grad_norm": 7.423447132110596,
+ "learning_rate": 1.912231784174346e-05,
+ "loss": 0.9808,
+ "step": 5884
+ },
+ {
+ "epoch": 16.03542234332425,
+ "grad_norm": 9.530950546264648,
+ "learning_rate": 1.9121956270699005e-05,
+ "loss": 0.9365,
+ "step": 5885
+ },
+ {
+ "epoch": 16.03814713896458,
+ "grad_norm": 8.53531265258789,
+ "learning_rate": 1.9121594628613044e-05,
+ "loss": 0.8394,
+ "step": 5886
+ },
+ {
+ "epoch": 16.040871934604905,
+ "grad_norm": 9.881158828735352,
+ "learning_rate": 1.91212329154884e-05,
+ "loss": 1.0618,
+ "step": 5887
+ },
+ {
+ "epoch": 16.04359673024523,
+ "grad_norm": 7.604527950286865,
+ "learning_rate": 1.912087113132788e-05,
+ "loss": 0.8291,
+ "step": 5888
+ },
+ {
+ "epoch": 16.04632152588556,
+ "grad_norm": 9.686923027038574,
+ "learning_rate": 1.9120509276134315e-05,
+ "loss": 1.0725,
+ "step": 5889
+ },
+ {
+ "epoch": 16.049046321525886,
+ "grad_norm": 9.359725952148438,
+ "learning_rate": 1.9120147349910515e-05,
+ "loss": 1.0834,
+ "step": 5890
+ },
+ {
+ "epoch": 16.05177111716621,
+ "grad_norm": 21.178882598876953,
+ "learning_rate": 1.9119785352659303e-05,
+ "loss": 0.9655,
+ "step": 5891
+ },
+ {
+ "epoch": 16.05449591280654,
+ "grad_norm": 8.237728118896484,
+ "learning_rate": 1.9119423284383494e-05,
+ "loss": 1.085,
+ "step": 5892
+ },
+ {
+ "epoch": 16.057220708446867,
+ "grad_norm": 9.693185806274414,
+ "learning_rate": 1.9119061145085913e-05,
+ "loss": 0.8539,
+ "step": 5893
+ },
+ {
+ "epoch": 16.059945504087192,
+ "grad_norm": 8.249167442321777,
+ "learning_rate": 1.9118698934769374e-05,
+ "loss": 1.0244,
+ "step": 5894
+ },
+ {
+ "epoch": 16.06267029972752,
+ "grad_norm": 15.477276802062988,
+ "learning_rate": 1.91183366534367e-05,
+ "loss": 1.1104,
+ "step": 5895
+ },
+ {
+ "epoch": 16.065395095367847,
+ "grad_norm": 9.014497756958008,
+ "learning_rate": 1.911797430109072e-05,
+ "loss": 0.932,
+ "step": 5896
+ },
+ {
+ "epoch": 16.068119891008173,
+ "grad_norm": 21.939722061157227,
+ "learning_rate": 1.9117611877734244e-05,
+ "loss": 0.9706,
+ "step": 5897
+ },
+ {
+ "epoch": 16.070844686648503,
+ "grad_norm": 10.217493057250977,
+ "learning_rate": 1.9117249383370105e-05,
+ "loss": 0.9189,
+ "step": 5898
+ },
+ {
+ "epoch": 16.07356948228883,
+ "grad_norm": 9.95344066619873,
+ "learning_rate": 1.9116886818001118e-05,
+ "loss": 0.975,
+ "step": 5899
+ },
+ {
+ "epoch": 16.076294277929154,
+ "grad_norm": 18.62358283996582,
+ "learning_rate": 1.9116524181630106e-05,
+ "loss": 1.1211,
+ "step": 5900
+ },
+ {
+ "epoch": 16.079019073569484,
+ "grad_norm": 9.568658828735352,
+ "learning_rate": 1.9116161474259902e-05,
+ "loss": 1.1132,
+ "step": 5901
+ },
+ {
+ "epoch": 16.08174386920981,
+ "grad_norm": 11.954379081726074,
+ "learning_rate": 1.9115798695893327e-05,
+ "loss": 1.0265,
+ "step": 5902
+ },
+ {
+ "epoch": 16.084468664850135,
+ "grad_norm": 8.741806983947754,
+ "learning_rate": 1.9115435846533204e-05,
+ "loss": 1.0,
+ "step": 5903
+ },
+ {
+ "epoch": 16.087193460490465,
+ "grad_norm": 10.515434265136719,
+ "learning_rate": 1.9115072926182358e-05,
+ "loss": 0.886,
+ "step": 5904
+ },
+ {
+ "epoch": 16.08991825613079,
+ "grad_norm": 10.62269115447998,
+ "learning_rate": 1.911470993484362e-05,
+ "loss": 0.8505,
+ "step": 5905
+ },
+ {
+ "epoch": 16.092643051771116,
+ "grad_norm": 7.906174659729004,
+ "learning_rate": 1.911434687251981e-05,
+ "loss": 0.8514,
+ "step": 5906
+ },
+ {
+ "epoch": 16.095367847411445,
+ "grad_norm": 8.911808967590332,
+ "learning_rate": 1.9113983739213765e-05,
+ "loss": 0.9045,
+ "step": 5907
+ },
+ {
+ "epoch": 16.09809264305177,
+ "grad_norm": 8.223689079284668,
+ "learning_rate": 1.9113620534928307e-05,
+ "loss": 0.8833,
+ "step": 5908
+ },
+ {
+ "epoch": 16.100817438692097,
+ "grad_norm": 8.558938980102539,
+ "learning_rate": 1.9113257259666262e-05,
+ "loss": 1.0228,
+ "step": 5909
+ },
+ {
+ "epoch": 16.103542234332426,
+ "grad_norm": 19.754425048828125,
+ "learning_rate": 1.9112893913430466e-05,
+ "loss": 0.9375,
+ "step": 5910
+ },
+ {
+ "epoch": 16.106267029972752,
+ "grad_norm": 8.726752281188965,
+ "learning_rate": 1.9112530496223748e-05,
+ "loss": 1.1094,
+ "step": 5911
+ },
+ {
+ "epoch": 16.108991825613078,
+ "grad_norm": 44.32742691040039,
+ "learning_rate": 1.911216700804893e-05,
+ "loss": 0.84,
+ "step": 5912
+ },
+ {
+ "epoch": 16.111716621253407,
+ "grad_norm": 9.230029106140137,
+ "learning_rate": 1.911180344890885e-05,
+ "loss": 0.8795,
+ "step": 5913
+ },
+ {
+ "epoch": 16.114441416893733,
+ "grad_norm": 9.848237991333008,
+ "learning_rate": 1.9111439818806338e-05,
+ "loss": 0.9354,
+ "step": 5914
+ },
+ {
+ "epoch": 16.11716621253406,
+ "grad_norm": 8.80485725402832,
+ "learning_rate": 1.911107611774423e-05,
+ "loss": 0.7859,
+ "step": 5915
+ },
+ {
+ "epoch": 16.11989100817439,
+ "grad_norm": 8.519614219665527,
+ "learning_rate": 1.911071234572535e-05,
+ "loss": 0.9137,
+ "step": 5916
+ },
+ {
+ "epoch": 16.122615803814714,
+ "grad_norm": 7.780332088470459,
+ "learning_rate": 1.9110348502752537e-05,
+ "loss": 0.9954,
+ "step": 5917
+ },
+ {
+ "epoch": 16.12534059945504,
+ "grad_norm": 8.060101509094238,
+ "learning_rate": 1.9109984588828622e-05,
+ "loss": 0.8457,
+ "step": 5918
+ },
+ {
+ "epoch": 16.12806539509537,
+ "grad_norm": 11.73392391204834,
+ "learning_rate": 1.9109620603956442e-05,
+ "loss": 0.9453,
+ "step": 5919
+ },
+ {
+ "epoch": 16.130790190735695,
+ "grad_norm": 9.113224983215332,
+ "learning_rate": 1.9109256548138832e-05,
+ "loss": 0.9738,
+ "step": 5920
+ },
+ {
+ "epoch": 16.13351498637602,
+ "grad_norm": 10.089421272277832,
+ "learning_rate": 1.910889242137862e-05,
+ "loss": 0.968,
+ "step": 5921
+ },
+ {
+ "epoch": 16.13623978201635,
+ "grad_norm": 9.667669296264648,
+ "learning_rate": 1.9108528223678652e-05,
+ "loss": 0.9104,
+ "step": 5922
+ },
+ {
+ "epoch": 16.138964577656676,
+ "grad_norm": 8.784872055053711,
+ "learning_rate": 1.9108163955041754e-05,
+ "loss": 0.863,
+ "step": 5923
+ },
+ {
+ "epoch": 16.141689373297,
+ "grad_norm": 7.899500846862793,
+ "learning_rate": 1.9107799615470773e-05,
+ "loss": 1.0374,
+ "step": 5924
+ },
+ {
+ "epoch": 16.14441416893733,
+ "grad_norm": 8.752492904663086,
+ "learning_rate": 1.9107435204968538e-05,
+ "loss": 0.9602,
+ "step": 5925
+ },
+ {
+ "epoch": 16.147138964577657,
+ "grad_norm": 9.13194465637207,
+ "learning_rate": 1.910707072353789e-05,
+ "loss": 0.9746,
+ "step": 5926
+ },
+ {
+ "epoch": 16.149863760217983,
+ "grad_norm": 8.339265823364258,
+ "learning_rate": 1.9106706171181673e-05,
+ "loss": 0.9867,
+ "step": 5927
+ },
+ {
+ "epoch": 16.152588555858312,
+ "grad_norm": 10.599468231201172,
+ "learning_rate": 1.910634154790272e-05,
+ "loss": 1.0702,
+ "step": 5928
+ },
+ {
+ "epoch": 16.155313351498638,
+ "grad_norm": 9.619460105895996,
+ "learning_rate": 1.9105976853703875e-05,
+ "loss": 1.0261,
+ "step": 5929
+ },
+ {
+ "epoch": 16.158038147138964,
+ "grad_norm": 9.088080406188965,
+ "learning_rate": 1.910561208858797e-05,
+ "loss": 1.0629,
+ "step": 5930
+ },
+ {
+ "epoch": 16.160762942779293,
+ "grad_norm": 23.779102325439453,
+ "learning_rate": 1.910524725255785e-05,
+ "loss": 0.8628,
+ "step": 5931
+ },
+ {
+ "epoch": 16.16348773841962,
+ "grad_norm": 9.341630935668945,
+ "learning_rate": 1.9104882345616363e-05,
+ "loss": 0.972,
+ "step": 5932
+ },
+ {
+ "epoch": 16.166212534059945,
+ "grad_norm": 9.080842018127441,
+ "learning_rate": 1.9104517367766344e-05,
+ "loss": 0.9935,
+ "step": 5933
+ },
+ {
+ "epoch": 16.168937329700274,
+ "grad_norm": 8.801554679870605,
+ "learning_rate": 1.9104152319010634e-05,
+ "loss": 1.0988,
+ "step": 5934
+ },
+ {
+ "epoch": 16.1716621253406,
+ "grad_norm": 9.890647888183594,
+ "learning_rate": 1.9103787199352077e-05,
+ "loss": 0.8812,
+ "step": 5935
+ },
+ {
+ "epoch": 16.174386920980925,
+ "grad_norm": 8.447457313537598,
+ "learning_rate": 1.9103422008793524e-05,
+ "loss": 1.0991,
+ "step": 5936
+ },
+ {
+ "epoch": 16.177111716621255,
+ "grad_norm": 8.268943786621094,
+ "learning_rate": 1.9103056747337813e-05,
+ "loss": 1.067,
+ "step": 5937
+ },
+ {
+ "epoch": 16.17983651226158,
+ "grad_norm": 9.503392219543457,
+ "learning_rate": 1.9102691414987785e-05,
+ "loss": 0.9934,
+ "step": 5938
+ },
+ {
+ "epoch": 16.182561307901906,
+ "grad_norm": 9.845125198364258,
+ "learning_rate": 1.910232601174629e-05,
+ "loss": 0.9785,
+ "step": 5939
+ },
+ {
+ "epoch": 16.185286103542236,
+ "grad_norm": 11.63794231414795,
+ "learning_rate": 1.9101960537616174e-05,
+ "loss": 1.0958,
+ "step": 5940
+ },
+ {
+ "epoch": 16.18801089918256,
+ "grad_norm": 9.296601295471191,
+ "learning_rate": 1.9101594992600283e-05,
+ "loss": 1.1799,
+ "step": 5941
+ },
+ {
+ "epoch": 16.190735694822887,
+ "grad_norm": 10.46290397644043,
+ "learning_rate": 1.9101229376701463e-05,
+ "loss": 0.9753,
+ "step": 5942
+ },
+ {
+ "epoch": 16.193460490463217,
+ "grad_norm": 9.994993209838867,
+ "learning_rate": 1.910086368992256e-05,
+ "loss": 0.9448,
+ "step": 5943
+ },
+ {
+ "epoch": 16.196185286103542,
+ "grad_norm": 9.466861724853516,
+ "learning_rate": 1.9100497932266423e-05,
+ "loss": 0.9169,
+ "step": 5944
+ },
+ {
+ "epoch": 16.19891008174387,
+ "grad_norm": 8.074040412902832,
+ "learning_rate": 1.9100132103735906e-05,
+ "loss": 0.8988,
+ "step": 5945
+ },
+ {
+ "epoch": 16.201634877384198,
+ "grad_norm": 8.387664794921875,
+ "learning_rate": 1.9099766204333847e-05,
+ "loss": 1.0031,
+ "step": 5946
+ },
+ {
+ "epoch": 16.204359673024523,
+ "grad_norm": 18.077465057373047,
+ "learning_rate": 1.9099400234063107e-05,
+ "loss": 1.0066,
+ "step": 5947
+ },
+ {
+ "epoch": 16.20708446866485,
+ "grad_norm": 13.21737289428711,
+ "learning_rate": 1.9099034192926527e-05,
+ "loss": 1.0029,
+ "step": 5948
+ },
+ {
+ "epoch": 16.20980926430518,
+ "grad_norm": 8.066934585571289,
+ "learning_rate": 1.909866808092696e-05,
+ "loss": 1.0518,
+ "step": 5949
+ },
+ {
+ "epoch": 16.212534059945504,
+ "grad_norm": 9.0236177444458,
+ "learning_rate": 1.9098301898067264e-05,
+ "loss": 0.8417,
+ "step": 5950
+ },
+ {
+ "epoch": 16.21525885558583,
+ "grad_norm": 9.770105361938477,
+ "learning_rate": 1.9097935644350284e-05,
+ "loss": 0.9471,
+ "step": 5951
+ },
+ {
+ "epoch": 16.21798365122616,
+ "grad_norm": 8.485394477844238,
+ "learning_rate": 1.909756931977887e-05,
+ "loss": 0.9606,
+ "step": 5952
+ },
+ {
+ "epoch": 16.220708446866485,
+ "grad_norm": 8.218755722045898,
+ "learning_rate": 1.9097202924355884e-05,
+ "loss": 1.0961,
+ "step": 5953
+ },
+ {
+ "epoch": 16.22343324250681,
+ "grad_norm": 9.037432670593262,
+ "learning_rate": 1.909683645808417e-05,
+ "loss": 1.0549,
+ "step": 5954
+ },
+ {
+ "epoch": 16.22615803814714,
+ "grad_norm": 11.103666305541992,
+ "learning_rate": 1.9096469920966592e-05,
+ "loss": 1.0444,
+ "step": 5955
+ },
+ {
+ "epoch": 16.228882833787466,
+ "grad_norm": 7.901222229003906,
+ "learning_rate": 1.9096103313005992e-05,
+ "loss": 0.9113,
+ "step": 5956
+ },
+ {
+ "epoch": 16.231607629427792,
+ "grad_norm": 8.758397102355957,
+ "learning_rate": 1.909573663420524e-05,
+ "loss": 0.8389,
+ "step": 5957
+ },
+ {
+ "epoch": 16.23433242506812,
+ "grad_norm": 9.530460357666016,
+ "learning_rate": 1.9095369884567178e-05,
+ "loss": 0.9973,
+ "step": 5958
+ },
+ {
+ "epoch": 16.237057220708447,
+ "grad_norm": 9.2470703125,
+ "learning_rate": 1.909500306409467e-05,
+ "loss": 1.0751,
+ "step": 5959
+ },
+ {
+ "epoch": 16.239782016348773,
+ "grad_norm": 8.239962577819824,
+ "learning_rate": 1.909463617279057e-05,
+ "loss": 0.7488,
+ "step": 5960
+ },
+ {
+ "epoch": 16.242506811989102,
+ "grad_norm": 9.150911331176758,
+ "learning_rate": 1.9094269210657737e-05,
+ "loss": 1.0393,
+ "step": 5961
+ },
+ {
+ "epoch": 16.245231607629428,
+ "grad_norm": 8.832514762878418,
+ "learning_rate": 1.9093902177699028e-05,
+ "loss": 1.0737,
+ "step": 5962
+ },
+ {
+ "epoch": 16.247956403269754,
+ "grad_norm": 25.83500862121582,
+ "learning_rate": 1.9093535073917304e-05,
+ "loss": 1.0029,
+ "step": 5963
+ },
+ {
+ "epoch": 16.250681198910083,
+ "grad_norm": 9.633893966674805,
+ "learning_rate": 1.9093167899315417e-05,
+ "loss": 1.0497,
+ "step": 5964
+ },
+ {
+ "epoch": 16.25340599455041,
+ "grad_norm": 10.280200004577637,
+ "learning_rate": 1.9092800653896236e-05,
+ "loss": 0.9462,
+ "step": 5965
+ },
+ {
+ "epoch": 16.256130790190735,
+ "grad_norm": 8.123982429504395,
+ "learning_rate": 1.9092433337662614e-05,
+ "loss": 0.8857,
+ "step": 5966
+ },
+ {
+ "epoch": 16.258855585831064,
+ "grad_norm": 7.409641742706299,
+ "learning_rate": 1.909206595061741e-05,
+ "loss": 0.8341,
+ "step": 5967
+ },
+ {
+ "epoch": 16.26158038147139,
+ "grad_norm": 10.250338554382324,
+ "learning_rate": 1.9091698492763494e-05,
+ "loss": 1.106,
+ "step": 5968
+ },
+ {
+ "epoch": 16.264305177111716,
+ "grad_norm": 7.752365589141846,
+ "learning_rate": 1.909133096410372e-05,
+ "loss": 0.9622,
+ "step": 5969
+ },
+ {
+ "epoch": 16.267029972752045,
+ "grad_norm": 8.367024421691895,
+ "learning_rate": 1.9090963364640954e-05,
+ "loss": 0.9623,
+ "step": 5970
+ },
+ {
+ "epoch": 16.26975476839237,
+ "grad_norm": 9.059532165527344,
+ "learning_rate": 1.909059569437806e-05,
+ "loss": 1.0144,
+ "step": 5971
+ },
+ {
+ "epoch": 16.272479564032697,
+ "grad_norm": 8.470860481262207,
+ "learning_rate": 1.9090227953317896e-05,
+ "loss": 0.9541,
+ "step": 5972
+ },
+ {
+ "epoch": 16.275204359673026,
+ "grad_norm": 8.233183860778809,
+ "learning_rate": 1.908986014146333e-05,
+ "loss": 0.9636,
+ "step": 5973
+ },
+ {
+ "epoch": 16.277929155313352,
+ "grad_norm": 8.340307235717773,
+ "learning_rate": 1.9089492258817225e-05,
+ "loss": 0.9459,
+ "step": 5974
+ },
+ {
+ "epoch": 16.280653950953678,
+ "grad_norm": 8.482439994812012,
+ "learning_rate": 1.908912430538245e-05,
+ "loss": 0.9739,
+ "step": 5975
+ },
+ {
+ "epoch": 16.283378746594007,
+ "grad_norm": 8.190013885498047,
+ "learning_rate": 1.9088756281161866e-05,
+ "loss": 0.876,
+ "step": 5976
+ },
+ {
+ "epoch": 16.286103542234333,
+ "grad_norm": 8.862380027770996,
+ "learning_rate": 1.908838818615834e-05,
+ "loss": 1.0016,
+ "step": 5977
+ },
+ {
+ "epoch": 16.28882833787466,
+ "grad_norm": 9.875590324401855,
+ "learning_rate": 1.908802002037474e-05,
+ "loss": 0.9709,
+ "step": 5978
+ },
+ {
+ "epoch": 16.291553133514988,
+ "grad_norm": 8.948189735412598,
+ "learning_rate": 1.908765178381393e-05,
+ "loss": 0.7603,
+ "step": 5979
+ },
+ {
+ "epoch": 16.294277929155314,
+ "grad_norm": 7.790036678314209,
+ "learning_rate": 1.9087283476478784e-05,
+ "loss": 1.0806,
+ "step": 5980
+ },
+ {
+ "epoch": 16.29700272479564,
+ "grad_norm": 19.806018829345703,
+ "learning_rate": 1.9086915098372166e-05,
+ "loss": 1.0457,
+ "step": 5981
+ },
+ {
+ "epoch": 16.29972752043597,
+ "grad_norm": 9.134679794311523,
+ "learning_rate": 1.9086546649496943e-05,
+ "loss": 0.8326,
+ "step": 5982
+ },
+ {
+ "epoch": 16.302452316076295,
+ "grad_norm": 9.624375343322754,
+ "learning_rate": 1.908617812985599e-05,
+ "loss": 1.0908,
+ "step": 5983
+ },
+ {
+ "epoch": 16.30517711171662,
+ "grad_norm": 8.333988189697266,
+ "learning_rate": 1.9085809539452174e-05,
+ "loss": 0.9963,
+ "step": 5984
+ },
+ {
+ "epoch": 16.30790190735695,
+ "grad_norm": 8.44038200378418,
+ "learning_rate": 1.9085440878288363e-05,
+ "loss": 0.9639,
+ "step": 5985
+ },
+ {
+ "epoch": 16.310626702997276,
+ "grad_norm": 7.278705596923828,
+ "learning_rate": 1.9085072146367434e-05,
+ "loss": 1.0146,
+ "step": 5986
+ },
+ {
+ "epoch": 16.3133514986376,
+ "grad_norm": 6.198719024658203,
+ "learning_rate": 1.9084703343692253e-05,
+ "loss": 0.9016,
+ "step": 5987
+ },
+ {
+ "epoch": 16.31607629427793,
+ "grad_norm": 8.337554931640625,
+ "learning_rate": 1.90843344702657e-05,
+ "loss": 0.8571,
+ "step": 5988
+ },
+ {
+ "epoch": 16.318801089918257,
+ "grad_norm": 8.546713829040527,
+ "learning_rate": 1.9083965526090635e-05,
+ "loss": 1.0874,
+ "step": 5989
+ },
+ {
+ "epoch": 16.321525885558582,
+ "grad_norm": 8.65063762664795,
+ "learning_rate": 1.908359651116994e-05,
+ "loss": 1.2061,
+ "step": 5990
+ },
+ {
+ "epoch": 16.32425068119891,
+ "grad_norm": 7.996217250823975,
+ "learning_rate": 1.908322742550649e-05,
+ "loss": 0.8696,
+ "step": 5991
+ },
+ {
+ "epoch": 16.326975476839237,
+ "grad_norm": 8.911670684814453,
+ "learning_rate": 1.9082858269103162e-05,
+ "loss": 1.0651,
+ "step": 5992
+ },
+ {
+ "epoch": 16.329700272479563,
+ "grad_norm": 23.596555709838867,
+ "learning_rate": 1.908248904196282e-05,
+ "loss": 1.0306,
+ "step": 5993
+ },
+ {
+ "epoch": 16.332425068119893,
+ "grad_norm": 7.521470069885254,
+ "learning_rate": 1.9082119744088348e-05,
+ "loss": 1.0576,
+ "step": 5994
+ },
+ {
+ "epoch": 16.33514986376022,
+ "grad_norm": 7.754633903503418,
+ "learning_rate": 1.9081750375482618e-05,
+ "loss": 0.8788,
+ "step": 5995
+ },
+ {
+ "epoch": 16.337874659400544,
+ "grad_norm": 9.71580982208252,
+ "learning_rate": 1.908138093614851e-05,
+ "loss": 1.104,
+ "step": 5996
+ },
+ {
+ "epoch": 16.340599455040874,
+ "grad_norm": 8.19369888305664,
+ "learning_rate": 1.90810114260889e-05,
+ "loss": 0.972,
+ "step": 5997
+ },
+ {
+ "epoch": 16.3433242506812,
+ "grad_norm": 7.382881164550781,
+ "learning_rate": 1.908064184530666e-05,
+ "loss": 0.8334,
+ "step": 5998
+ },
+ {
+ "epoch": 16.346049046321525,
+ "grad_norm": 11.877547264099121,
+ "learning_rate": 1.908027219380468e-05,
+ "loss": 0.861,
+ "step": 5999
+ },
+ {
+ "epoch": 16.348773841961854,
+ "grad_norm": 7.584044933319092,
+ "learning_rate": 1.907990247158583e-05,
+ "loss": 0.8782,
+ "step": 6000
+ },
+ {
+ "epoch": 16.35149863760218,
+ "grad_norm": 7.831441879272461,
+ "learning_rate": 1.907953267865299e-05,
+ "loss": 0.9613,
+ "step": 6001
+ },
+ {
+ "epoch": 16.354223433242506,
+ "grad_norm": 8.159957885742188,
+ "learning_rate": 1.9079162815009045e-05,
+ "loss": 1.0771,
+ "step": 6002
+ },
+ {
+ "epoch": 16.356948228882835,
+ "grad_norm": 8.454666137695312,
+ "learning_rate": 1.9078792880656868e-05,
+ "loss": 0.821,
+ "step": 6003
+ },
+ {
+ "epoch": 16.35967302452316,
+ "grad_norm": 7.667445659637451,
+ "learning_rate": 1.907842287559935e-05,
+ "loss": 1.0226,
+ "step": 6004
+ },
+ {
+ "epoch": 16.362397820163487,
+ "grad_norm": 8.185620307922363,
+ "learning_rate": 1.9078052799839363e-05,
+ "loss": 0.9062,
+ "step": 6005
+ },
+ {
+ "epoch": 16.365122615803816,
+ "grad_norm": 9.708785057067871,
+ "learning_rate": 1.9077682653379795e-05,
+ "loss": 0.9871,
+ "step": 6006
+ },
+ {
+ "epoch": 16.367847411444142,
+ "grad_norm": 8.769133567810059,
+ "learning_rate": 1.9077312436223524e-05,
+ "loss": 0.9122,
+ "step": 6007
+ },
+ {
+ "epoch": 16.370572207084468,
+ "grad_norm": 8.197275161743164,
+ "learning_rate": 1.907694214837344e-05,
+ "loss": 0.9888,
+ "step": 6008
+ },
+ {
+ "epoch": 16.373297002724797,
+ "grad_norm": 7.544145584106445,
+ "learning_rate": 1.9076571789832416e-05,
+ "loss": 1.0267,
+ "step": 6009
+ },
+ {
+ "epoch": 16.376021798365123,
+ "grad_norm": 8.935723304748535,
+ "learning_rate": 1.9076201360603347e-05,
+ "loss": 0.9645,
+ "step": 6010
+ },
+ {
+ "epoch": 16.37874659400545,
+ "grad_norm": 9.968594551086426,
+ "learning_rate": 1.9075830860689114e-05,
+ "loss": 1.0848,
+ "step": 6011
+ },
+ {
+ "epoch": 16.381471389645778,
+ "grad_norm": 8.968193054199219,
+ "learning_rate": 1.9075460290092604e-05,
+ "loss": 0.9851,
+ "step": 6012
+ },
+ {
+ "epoch": 16.384196185286104,
+ "grad_norm": 9.305635452270508,
+ "learning_rate": 1.9075089648816697e-05,
+ "loss": 1.1685,
+ "step": 6013
+ },
+ {
+ "epoch": 16.38692098092643,
+ "grad_norm": 11.007704734802246,
+ "learning_rate": 1.907471893686429e-05,
+ "loss": 0.8275,
+ "step": 6014
+ },
+ {
+ "epoch": 16.38964577656676,
+ "grad_norm": 9.118929862976074,
+ "learning_rate": 1.907434815423826e-05,
+ "loss": 1.014,
+ "step": 6015
+ },
+ {
+ "epoch": 16.392370572207085,
+ "grad_norm": 8.24226188659668,
+ "learning_rate": 1.9073977300941497e-05,
+ "loss": 0.8677,
+ "step": 6016
+ },
+ {
+ "epoch": 16.39509536784741,
+ "grad_norm": 7.754024505615234,
+ "learning_rate": 1.9073606376976895e-05,
+ "loss": 1.0286,
+ "step": 6017
+ },
+ {
+ "epoch": 16.39782016348774,
+ "grad_norm": 9.166144371032715,
+ "learning_rate": 1.9073235382347336e-05,
+ "loss": 1.0774,
+ "step": 6018
+ },
+ {
+ "epoch": 16.400544959128066,
+ "grad_norm": 7.809909343719482,
+ "learning_rate": 1.907286431705571e-05,
+ "loss": 0.8898,
+ "step": 6019
+ },
+ {
+ "epoch": 16.40326975476839,
+ "grad_norm": 8.78017807006836,
+ "learning_rate": 1.9072493181104916e-05,
+ "loss": 0.9423,
+ "step": 6020
+ },
+ {
+ "epoch": 16.40599455040872,
+ "grad_norm": 10.937439918518066,
+ "learning_rate": 1.907212197449783e-05,
+ "loss": 0.9635,
+ "step": 6021
+ },
+ {
+ "epoch": 16.408719346049047,
+ "grad_norm": 8.849957466125488,
+ "learning_rate": 1.907175069723735e-05,
+ "loss": 1.0122,
+ "step": 6022
+ },
+ {
+ "epoch": 16.411444141689373,
+ "grad_norm": 8.172831535339355,
+ "learning_rate": 1.9071379349326373e-05,
+ "loss": 0.9895,
+ "step": 6023
+ },
+ {
+ "epoch": 16.414168937329702,
+ "grad_norm": 8.49582290649414,
+ "learning_rate": 1.9071007930767782e-05,
+ "loss": 0.9797,
+ "step": 6024
+ },
+ {
+ "epoch": 16.416893732970028,
+ "grad_norm": 9.933019638061523,
+ "learning_rate": 1.9070636441564474e-05,
+ "loss": 1.2769,
+ "step": 6025
+ },
+ {
+ "epoch": 16.419618528610354,
+ "grad_norm": 8.22047233581543,
+ "learning_rate": 1.907026488171934e-05,
+ "loss": 0.8754,
+ "step": 6026
+ },
+ {
+ "epoch": 16.422343324250683,
+ "grad_norm": 8.400115013122559,
+ "learning_rate": 1.9069893251235277e-05,
+ "loss": 1.0231,
+ "step": 6027
+ },
+ {
+ "epoch": 16.42506811989101,
+ "grad_norm": 7.147830963134766,
+ "learning_rate": 1.9069521550115175e-05,
+ "loss": 1.0021,
+ "step": 6028
+ },
+ {
+ "epoch": 16.427792915531334,
+ "grad_norm": 7.267785549163818,
+ "learning_rate": 1.9069149778361934e-05,
+ "loss": 0.8904,
+ "step": 6029
+ },
+ {
+ "epoch": 16.430517711171664,
+ "grad_norm": 9.049951553344727,
+ "learning_rate": 1.9068777935978444e-05,
+ "loss": 0.9927,
+ "step": 6030
+ },
+ {
+ "epoch": 16.43324250681199,
+ "grad_norm": 9.180093765258789,
+ "learning_rate": 1.9068406022967605e-05,
+ "loss": 1.0958,
+ "step": 6031
+ },
+ {
+ "epoch": 16.435967302452315,
+ "grad_norm": 8.235403060913086,
+ "learning_rate": 1.906803403933231e-05,
+ "loss": 1.249,
+ "step": 6032
+ },
+ {
+ "epoch": 16.438692098092645,
+ "grad_norm": 10.791427612304688,
+ "learning_rate": 1.906766198507546e-05,
+ "loss": 1.0869,
+ "step": 6033
+ },
+ {
+ "epoch": 16.44141689373297,
+ "grad_norm": 6.91215705871582,
+ "learning_rate": 1.9067289860199945e-05,
+ "loss": 1.085,
+ "step": 6034
+ },
+ {
+ "epoch": 16.444141689373296,
+ "grad_norm": 8.863093376159668,
+ "learning_rate": 1.9066917664708674e-05,
+ "loss": 0.99,
+ "step": 6035
+ },
+ {
+ "epoch": 16.446866485013626,
+ "grad_norm": 7.740184307098389,
+ "learning_rate": 1.9066545398604538e-05,
+ "loss": 0.9575,
+ "step": 6036
+ },
+ {
+ "epoch": 16.44959128065395,
+ "grad_norm": 7.676769733428955,
+ "learning_rate": 1.9066173061890438e-05,
+ "loss": 1.0483,
+ "step": 6037
+ },
+ {
+ "epoch": 16.452316076294277,
+ "grad_norm": 15.380928993225098,
+ "learning_rate": 1.9065800654569277e-05,
+ "loss": 0.8556,
+ "step": 6038
+ },
+ {
+ "epoch": 16.455040871934607,
+ "grad_norm": 9.415081977844238,
+ "learning_rate": 1.906542817664395e-05,
+ "loss": 0.8867,
+ "step": 6039
+ },
+ {
+ "epoch": 16.457765667574932,
+ "grad_norm": 7.816688537597656,
+ "learning_rate": 1.9065055628117358e-05,
+ "loss": 0.9417,
+ "step": 6040
+ },
+ {
+ "epoch": 16.460490463215258,
+ "grad_norm": 8.097055435180664,
+ "learning_rate": 1.9064683008992407e-05,
+ "loss": 0.8629,
+ "step": 6041
+ },
+ {
+ "epoch": 16.463215258855588,
+ "grad_norm": 9.544647216796875,
+ "learning_rate": 1.9064310319271997e-05,
+ "loss": 1.0793,
+ "step": 6042
+ },
+ {
+ "epoch": 16.465940054495913,
+ "grad_norm": 8.068865776062012,
+ "learning_rate": 1.906393755895903e-05,
+ "loss": 0.9089,
+ "step": 6043
+ },
+ {
+ "epoch": 16.46866485013624,
+ "grad_norm": 9.3299560546875,
+ "learning_rate": 1.906356472805641e-05,
+ "loss": 1.1665,
+ "step": 6044
+ },
+ {
+ "epoch": 16.47138964577657,
+ "grad_norm": 9.5327730178833,
+ "learning_rate": 1.9063191826567035e-05,
+ "loss": 0.8313,
+ "step": 6045
+ },
+ {
+ "epoch": 16.474114441416894,
+ "grad_norm": 8.465132713317871,
+ "learning_rate": 1.9062818854493816e-05,
+ "loss": 0.9471,
+ "step": 6046
+ },
+ {
+ "epoch": 16.47683923705722,
+ "grad_norm": 7.73591947555542,
+ "learning_rate": 1.9062445811839655e-05,
+ "loss": 0.8947,
+ "step": 6047
+ },
+ {
+ "epoch": 16.479564032697546,
+ "grad_norm": 8.444184303283691,
+ "learning_rate": 1.9062072698607457e-05,
+ "loss": 1.0015,
+ "step": 6048
+ },
+ {
+ "epoch": 16.482288828337875,
+ "grad_norm": 7.189904689788818,
+ "learning_rate": 1.9061699514800128e-05,
+ "loss": 0.8428,
+ "step": 6049
+ },
+ {
+ "epoch": 16.4850136239782,
+ "grad_norm": 10.970808029174805,
+ "learning_rate": 1.906132626042058e-05,
+ "loss": 0.9288,
+ "step": 6050
+ },
+ {
+ "epoch": 16.48773841961853,
+ "grad_norm": 9.308109283447266,
+ "learning_rate": 1.906095293547171e-05,
+ "loss": 0.89,
+ "step": 6051
+ },
+ {
+ "epoch": 16.490463215258856,
+ "grad_norm": 8.384902000427246,
+ "learning_rate": 1.906057953995643e-05,
+ "loss": 0.9181,
+ "step": 6052
+ },
+ {
+ "epoch": 16.493188010899182,
+ "grad_norm": 9.699617385864258,
+ "learning_rate": 1.9060206073877655e-05,
+ "loss": 0.9622,
+ "step": 6053
+ },
+ {
+ "epoch": 16.495912806539508,
+ "grad_norm": 10.59549331665039,
+ "learning_rate": 1.9059832537238278e-05,
+ "loss": 0.9661,
+ "step": 6054
+ },
+ {
+ "epoch": 16.498637602179837,
+ "grad_norm": 8.202498435974121,
+ "learning_rate": 1.9059458930041222e-05,
+ "loss": 0.9198,
+ "step": 6055
+ },
+ {
+ "epoch": 16.501362397820163,
+ "grad_norm": 10.255706787109375,
+ "learning_rate": 1.9059085252289388e-05,
+ "loss": 0.8696,
+ "step": 6056
+ },
+ {
+ "epoch": 16.504087193460492,
+ "grad_norm": 7.805537700653076,
+ "learning_rate": 1.9058711503985692e-05,
+ "loss": 0.9667,
+ "step": 6057
+ },
+ {
+ "epoch": 16.506811989100818,
+ "grad_norm": 8.793238639831543,
+ "learning_rate": 1.9058337685133043e-05,
+ "loss": 0.952,
+ "step": 6058
+ },
+ {
+ "epoch": 16.509536784741144,
+ "grad_norm": 9.71096134185791,
+ "learning_rate": 1.905796379573435e-05,
+ "loss": 1.3391,
+ "step": 6059
+ },
+ {
+ "epoch": 16.51226158038147,
+ "grad_norm": 9.125404357910156,
+ "learning_rate": 1.9057589835792524e-05,
+ "loss": 1.2024,
+ "step": 6060
+ },
+ {
+ "epoch": 16.5149863760218,
+ "grad_norm": 7.917983531951904,
+ "learning_rate": 1.9057215805310485e-05,
+ "loss": 0.9601,
+ "step": 6061
+ },
+ {
+ "epoch": 16.517711171662125,
+ "grad_norm": 8.468579292297363,
+ "learning_rate": 1.9056841704291137e-05,
+ "loss": 0.9695,
+ "step": 6062
+ },
+ {
+ "epoch": 16.520435967302454,
+ "grad_norm": 8.051939964294434,
+ "learning_rate": 1.90564675327374e-05,
+ "loss": 0.9247,
+ "step": 6063
+ },
+ {
+ "epoch": 16.52316076294278,
+ "grad_norm": 8.476173400878906,
+ "learning_rate": 1.9056093290652186e-05,
+ "loss": 0.9005,
+ "step": 6064
+ },
+ {
+ "epoch": 16.525885558583106,
+ "grad_norm": 9.824795722961426,
+ "learning_rate": 1.9055718978038404e-05,
+ "loss": 0.9658,
+ "step": 6065
+ },
+ {
+ "epoch": 16.52861035422343,
+ "grad_norm": 9.040727615356445,
+ "learning_rate": 1.9055344594898978e-05,
+ "loss": 1.0005,
+ "step": 6066
+ },
+ {
+ "epoch": 16.53133514986376,
+ "grad_norm": 9.851045608520508,
+ "learning_rate": 1.905497014123682e-05,
+ "loss": 0.8988,
+ "step": 6067
+ },
+ {
+ "epoch": 16.534059945504087,
+ "grad_norm": 8.072575569152832,
+ "learning_rate": 1.9054595617054844e-05,
+ "loss": 0.9775,
+ "step": 6068
+ },
+ {
+ "epoch": 16.536784741144416,
+ "grad_norm": 10.031383514404297,
+ "learning_rate": 1.905422102235597e-05,
+ "loss": 1.0728,
+ "step": 6069
+ },
+ {
+ "epoch": 16.539509536784742,
+ "grad_norm": 11.542708396911621,
+ "learning_rate": 1.9053846357143114e-05,
+ "loss": 0.9026,
+ "step": 6070
+ },
+ {
+ "epoch": 16.542234332425068,
+ "grad_norm": 8.84055233001709,
+ "learning_rate": 1.9053471621419193e-05,
+ "loss": 1.0281,
+ "step": 6071
+ },
+ {
+ "epoch": 16.544959128065393,
+ "grad_norm": 9.412172317504883,
+ "learning_rate": 1.9053096815187125e-05,
+ "loss": 1.2434,
+ "step": 6072
+ },
+ {
+ "epoch": 16.547683923705723,
+ "grad_norm": 10.151601791381836,
+ "learning_rate": 1.9052721938449834e-05,
+ "loss": 1.189,
+ "step": 6073
+ },
+ {
+ "epoch": 16.55040871934605,
+ "grad_norm": 13.779661178588867,
+ "learning_rate": 1.9052346991210237e-05,
+ "loss": 1.0056,
+ "step": 6074
+ },
+ {
+ "epoch": 16.553133514986374,
+ "grad_norm": 8.894524574279785,
+ "learning_rate": 1.905197197347125e-05,
+ "loss": 1.0266,
+ "step": 6075
+ },
+ {
+ "epoch": 16.555858310626704,
+ "grad_norm": 13.412213325500488,
+ "learning_rate": 1.9051596885235795e-05,
+ "loss": 0.9729,
+ "step": 6076
+ },
+ {
+ "epoch": 16.55858310626703,
+ "grad_norm": 8.03742504119873,
+ "learning_rate": 1.9051221726506795e-05,
+ "loss": 0.9557,
+ "step": 6077
+ },
+ {
+ "epoch": 16.561307901907355,
+ "grad_norm": 11.525594711303711,
+ "learning_rate": 1.9050846497287175e-05,
+ "loss": 0.9634,
+ "step": 6078
+ },
+ {
+ "epoch": 16.564032697547685,
+ "grad_norm": 9.7057523727417,
+ "learning_rate": 1.905047119757985e-05,
+ "loss": 1.1147,
+ "step": 6079
+ },
+ {
+ "epoch": 16.56675749318801,
+ "grad_norm": 8.049863815307617,
+ "learning_rate": 1.9050095827387748e-05,
+ "loss": 1.092,
+ "step": 6080
+ },
+ {
+ "epoch": 16.569482288828336,
+ "grad_norm": 8.248735427856445,
+ "learning_rate": 1.9049720386713796e-05,
+ "loss": 1.0129,
+ "step": 6081
+ },
+ {
+ "epoch": 16.572207084468666,
+ "grad_norm": 9.346665382385254,
+ "learning_rate": 1.9049344875560906e-05,
+ "loss": 0.9362,
+ "step": 6082
+ },
+ {
+ "epoch": 16.57493188010899,
+ "grad_norm": 9.57408332824707,
+ "learning_rate": 1.9048969293932012e-05,
+ "loss": 1.2029,
+ "step": 6083
+ },
+ {
+ "epoch": 16.577656675749317,
+ "grad_norm": 8.063798904418945,
+ "learning_rate": 1.9048593641830034e-05,
+ "loss": 0.9291,
+ "step": 6084
+ },
+ {
+ "epoch": 16.580381471389646,
+ "grad_norm": 7.972892761230469,
+ "learning_rate": 1.9048217919257907e-05,
+ "loss": 1.1289,
+ "step": 6085
+ },
+ {
+ "epoch": 16.583106267029972,
+ "grad_norm": 7.366415977478027,
+ "learning_rate": 1.9047842126218544e-05,
+ "loss": 0.8733,
+ "step": 6086
+ },
+ {
+ "epoch": 16.585831062670298,
+ "grad_norm": 8.68867015838623,
+ "learning_rate": 1.904746626271488e-05,
+ "loss": 0.8827,
+ "step": 6087
+ },
+ {
+ "epoch": 16.588555858310627,
+ "grad_norm": 9.911465644836426,
+ "learning_rate": 1.9047090328749837e-05,
+ "loss": 0.8958,
+ "step": 6088
+ },
+ {
+ "epoch": 16.591280653950953,
+ "grad_norm": 7.827071189880371,
+ "learning_rate": 1.9046714324326347e-05,
+ "loss": 1.0327,
+ "step": 6089
+ },
+ {
+ "epoch": 16.59400544959128,
+ "grad_norm": 7.7089409828186035,
+ "learning_rate": 1.9046338249447335e-05,
+ "loss": 1.0076,
+ "step": 6090
+ },
+ {
+ "epoch": 16.59673024523161,
+ "grad_norm": 8.589584350585938,
+ "learning_rate": 1.9045962104115738e-05,
+ "loss": 0.9946,
+ "step": 6091
+ },
+ {
+ "epoch": 16.599455040871934,
+ "grad_norm": 8.614899635314941,
+ "learning_rate": 1.9045585888334475e-05,
+ "loss": 0.8456,
+ "step": 6092
+ },
+ {
+ "epoch": 16.60217983651226,
+ "grad_norm": 8.168996810913086,
+ "learning_rate": 1.904520960210648e-05,
+ "loss": 1.0383,
+ "step": 6093
+ },
+ {
+ "epoch": 16.60490463215259,
+ "grad_norm": 6.833440780639648,
+ "learning_rate": 1.9044833245434686e-05,
+ "loss": 0.8608,
+ "step": 6094
+ },
+ {
+ "epoch": 16.607629427792915,
+ "grad_norm": 8.260551452636719,
+ "learning_rate": 1.904445681832202e-05,
+ "loss": 1.0952,
+ "step": 6095
+ },
+ {
+ "epoch": 16.61035422343324,
+ "grad_norm": 7.668336391448975,
+ "learning_rate": 1.9044080320771416e-05,
+ "loss": 1.1274,
+ "step": 6096
+ },
+ {
+ "epoch": 16.61307901907357,
+ "grad_norm": 6.161644458770752,
+ "learning_rate": 1.9043703752785804e-05,
+ "loss": 0.8849,
+ "step": 6097
+ },
+ {
+ "epoch": 16.615803814713896,
+ "grad_norm": 8.076497077941895,
+ "learning_rate": 1.9043327114368118e-05,
+ "loss": 0.9469,
+ "step": 6098
+ },
+ {
+ "epoch": 16.618528610354222,
+ "grad_norm": 13.970622062683105,
+ "learning_rate": 1.9042950405521296e-05,
+ "loss": 1.0378,
+ "step": 6099
+ },
+ {
+ "epoch": 16.62125340599455,
+ "grad_norm": 7.201518535614014,
+ "learning_rate": 1.9042573626248266e-05,
+ "loss": 0.9572,
+ "step": 6100
+ },
+ {
+ "epoch": 16.623978201634877,
+ "grad_norm": 9.967567443847656,
+ "learning_rate": 1.904219677655196e-05,
+ "loss": 1.0217,
+ "step": 6101
+ },
+ {
+ "epoch": 16.626702997275203,
+ "grad_norm": 7.625209808349609,
+ "learning_rate": 1.9041819856435318e-05,
+ "loss": 1.0759,
+ "step": 6102
+ },
+ {
+ "epoch": 16.629427792915532,
+ "grad_norm": 8.119585037231445,
+ "learning_rate": 1.9041442865901276e-05,
+ "loss": 1.0013,
+ "step": 6103
+ },
+ {
+ "epoch": 16.632152588555858,
+ "grad_norm": 8.203313827514648,
+ "learning_rate": 1.9041065804952764e-05,
+ "loss": 1.0774,
+ "step": 6104
+ },
+ {
+ "epoch": 16.634877384196184,
+ "grad_norm": 10.273894309997559,
+ "learning_rate": 1.9040688673592725e-05,
+ "loss": 1.0244,
+ "step": 6105
+ },
+ {
+ "epoch": 16.637602179836513,
+ "grad_norm": 6.8131103515625,
+ "learning_rate": 1.9040311471824092e-05,
+ "loss": 0.97,
+ "step": 6106
+ },
+ {
+ "epoch": 16.64032697547684,
+ "grad_norm": 10.750165939331055,
+ "learning_rate": 1.903993419964981e-05,
+ "loss": 1.0129,
+ "step": 6107
+ },
+ {
+ "epoch": 16.643051771117165,
+ "grad_norm": 8.18924331665039,
+ "learning_rate": 1.9039556857072808e-05,
+ "loss": 0.959,
+ "step": 6108
+ },
+ {
+ "epoch": 16.645776566757494,
+ "grad_norm": 7.18798303604126,
+ "learning_rate": 1.9039179444096025e-05,
+ "loss": 1.1155,
+ "step": 6109
+ },
+ {
+ "epoch": 16.64850136239782,
+ "grad_norm": 8.120108604431152,
+ "learning_rate": 1.9038801960722405e-05,
+ "loss": 1.0562,
+ "step": 6110
+ },
+ {
+ "epoch": 16.651226158038146,
+ "grad_norm": 9.277802467346191,
+ "learning_rate": 1.903842440695489e-05,
+ "loss": 0.9187,
+ "step": 6111
+ },
+ {
+ "epoch": 16.653950953678475,
+ "grad_norm": 9.661819458007812,
+ "learning_rate": 1.903804678279641e-05,
+ "loss": 1.0353,
+ "step": 6112
+ },
+ {
+ "epoch": 16.6566757493188,
+ "grad_norm": 7.471489906311035,
+ "learning_rate": 1.903766908824992e-05,
+ "loss": 0.9988,
+ "step": 6113
+ },
+ {
+ "epoch": 16.659400544959126,
+ "grad_norm": 8.371833801269531,
+ "learning_rate": 1.9037291323318348e-05,
+ "loss": 0.9868,
+ "step": 6114
+ },
+ {
+ "epoch": 16.662125340599456,
+ "grad_norm": 7.713346004486084,
+ "learning_rate": 1.9036913488004646e-05,
+ "loss": 0.8154,
+ "step": 6115
+ },
+ {
+ "epoch": 16.66485013623978,
+ "grad_norm": 7.333027362823486,
+ "learning_rate": 1.903653558231175e-05,
+ "loss": 1.0903,
+ "step": 6116
+ },
+ {
+ "epoch": 16.667574931880107,
+ "grad_norm": 7.406708717346191,
+ "learning_rate": 1.9036157606242603e-05,
+ "loss": 0.9045,
+ "step": 6117
+ },
+ {
+ "epoch": 16.670299727520437,
+ "grad_norm": 10.05079174041748,
+ "learning_rate": 1.903577955980016e-05,
+ "loss": 1.0574,
+ "step": 6118
+ },
+ {
+ "epoch": 16.673024523160763,
+ "grad_norm": 7.7181878089904785,
+ "learning_rate": 1.903540144298735e-05,
+ "loss": 1.1055,
+ "step": 6119
+ },
+ {
+ "epoch": 16.67574931880109,
+ "grad_norm": 8.098625183105469,
+ "learning_rate": 1.9035023255807124e-05,
+ "loss": 0.8563,
+ "step": 6120
+ },
+ {
+ "epoch": 16.678474114441418,
+ "grad_norm": 8.74626636505127,
+ "learning_rate": 1.903464499826243e-05,
+ "loss": 0.9667,
+ "step": 6121
+ },
+ {
+ "epoch": 16.681198910081743,
+ "grad_norm": 8.023555755615234,
+ "learning_rate": 1.903426667035621e-05,
+ "loss": 0.8154,
+ "step": 6122
+ },
+ {
+ "epoch": 16.68392370572207,
+ "grad_norm": 9.104249954223633,
+ "learning_rate": 1.9033888272091416e-05,
+ "loss": 0.967,
+ "step": 6123
+ },
+ {
+ "epoch": 16.6866485013624,
+ "grad_norm": 8.570528030395508,
+ "learning_rate": 1.9033509803470986e-05,
+ "loss": 1.1956,
+ "step": 6124
+ },
+ {
+ "epoch": 16.689373297002724,
+ "grad_norm": 8.387625694274902,
+ "learning_rate": 1.9033131264497876e-05,
+ "loss": 1.1216,
+ "step": 6125
+ },
+ {
+ "epoch": 16.69209809264305,
+ "grad_norm": 6.991154193878174,
+ "learning_rate": 1.9032752655175025e-05,
+ "loss": 0.9769,
+ "step": 6126
+ },
+ {
+ "epoch": 16.69482288828338,
+ "grad_norm": 8.776601791381836,
+ "learning_rate": 1.9032373975505393e-05,
+ "loss": 1.0464,
+ "step": 6127
+ },
+ {
+ "epoch": 16.697547683923705,
+ "grad_norm": 9.082233428955078,
+ "learning_rate": 1.903199522549192e-05,
+ "loss": 0.864,
+ "step": 6128
+ },
+ {
+ "epoch": 16.70027247956403,
+ "grad_norm": 10.216814994812012,
+ "learning_rate": 1.9031616405137563e-05,
+ "loss": 1.1111,
+ "step": 6129
+ },
+ {
+ "epoch": 16.70299727520436,
+ "grad_norm": 8.663824081420898,
+ "learning_rate": 1.9031237514445264e-05,
+ "loss": 0.897,
+ "step": 6130
+ },
+ {
+ "epoch": 16.705722070844686,
+ "grad_norm": 8.798577308654785,
+ "learning_rate": 1.9030858553417978e-05,
+ "loss": 0.8569,
+ "step": 6131
+ },
+ {
+ "epoch": 16.708446866485012,
+ "grad_norm": 9.070158958435059,
+ "learning_rate": 1.9030479522058656e-05,
+ "loss": 1.0791,
+ "step": 6132
+ },
+ {
+ "epoch": 16.71117166212534,
+ "grad_norm": 8.712905883789062,
+ "learning_rate": 1.9030100420370254e-05,
+ "loss": 0.8652,
+ "step": 6133
+ },
+ {
+ "epoch": 16.713896457765667,
+ "grad_norm": 8.393935203552246,
+ "learning_rate": 1.9029721248355718e-05,
+ "loss": 0.9224,
+ "step": 6134
+ },
+ {
+ "epoch": 16.716621253405993,
+ "grad_norm": 7.922507286071777,
+ "learning_rate": 1.9029342006018002e-05,
+ "loss": 0.8901,
+ "step": 6135
+ },
+ {
+ "epoch": 16.719346049046322,
+ "grad_norm": 8.726856231689453,
+ "learning_rate": 1.9028962693360062e-05,
+ "loss": 1.0376,
+ "step": 6136
+ },
+ {
+ "epoch": 16.722070844686648,
+ "grad_norm": 7.232251167297363,
+ "learning_rate": 1.9028583310384852e-05,
+ "loss": 0.8041,
+ "step": 6137
+ },
+ {
+ "epoch": 16.724795640326974,
+ "grad_norm": 8.879591941833496,
+ "learning_rate": 1.9028203857095326e-05,
+ "loss": 1.2061,
+ "step": 6138
+ },
+ {
+ "epoch": 16.727520435967303,
+ "grad_norm": 8.938133239746094,
+ "learning_rate": 1.902782433349444e-05,
+ "loss": 0.9741,
+ "step": 6139
+ },
+ {
+ "epoch": 16.73024523160763,
+ "grad_norm": 9.896289825439453,
+ "learning_rate": 1.9027444739585145e-05,
+ "loss": 0.905,
+ "step": 6140
+ },
+ {
+ "epoch": 16.732970027247955,
+ "grad_norm": 8.938760757446289,
+ "learning_rate": 1.9027065075370405e-05,
+ "loss": 0.8906,
+ "step": 6141
+ },
+ {
+ "epoch": 16.735694822888284,
+ "grad_norm": 7.5377984046936035,
+ "learning_rate": 1.9026685340853167e-05,
+ "loss": 0.8879,
+ "step": 6142
+ },
+ {
+ "epoch": 16.73841961852861,
+ "grad_norm": 8.72514533996582,
+ "learning_rate": 1.90263055360364e-05,
+ "loss": 1.0676,
+ "step": 6143
+ },
+ {
+ "epoch": 16.741144414168936,
+ "grad_norm": 8.462060928344727,
+ "learning_rate": 1.9025925660923053e-05,
+ "loss": 1.0444,
+ "step": 6144
+ },
+ {
+ "epoch": 16.743869209809265,
+ "grad_norm": 8.33977222442627,
+ "learning_rate": 1.902554571551609e-05,
+ "loss": 0.8572,
+ "step": 6145
+ },
+ {
+ "epoch": 16.74659400544959,
+ "grad_norm": 8.435555458068848,
+ "learning_rate": 1.902516569981846e-05,
+ "loss": 1.0098,
+ "step": 6146
+ },
+ {
+ "epoch": 16.749318801089917,
+ "grad_norm": 8.936212539672852,
+ "learning_rate": 1.902478561383314e-05,
+ "loss": 0.9421,
+ "step": 6147
+ },
+ {
+ "epoch": 16.752043596730246,
+ "grad_norm": 7.517622947692871,
+ "learning_rate": 1.9024405457563072e-05,
+ "loss": 0.9481,
+ "step": 6148
+ },
+ {
+ "epoch": 16.754768392370572,
+ "grad_norm": 8.736359596252441,
+ "learning_rate": 1.902402523101123e-05,
+ "loss": 1.2015,
+ "step": 6149
+ },
+ {
+ "epoch": 16.757493188010898,
+ "grad_norm": 9.770566940307617,
+ "learning_rate": 1.9023644934180568e-05,
+ "loss": 0.8751,
+ "step": 6150
+ },
+ {
+ "epoch": 16.760217983651227,
+ "grad_norm": 6.670861721038818,
+ "learning_rate": 1.902326456707405e-05,
+ "loss": 0.9161,
+ "step": 6151
+ },
+ {
+ "epoch": 16.762942779291553,
+ "grad_norm": 10.840482711791992,
+ "learning_rate": 1.902288412969464e-05,
+ "loss": 0.8964,
+ "step": 6152
+ },
+ {
+ "epoch": 16.76566757493188,
+ "grad_norm": 8.162219047546387,
+ "learning_rate": 1.9022503622045297e-05,
+ "loss": 0.9651,
+ "step": 6153
+ },
+ {
+ "epoch": 16.768392370572208,
+ "grad_norm": 10.338919639587402,
+ "learning_rate": 1.9022123044128985e-05,
+ "loss": 1.0435,
+ "step": 6154
+ },
+ {
+ "epoch": 16.771117166212534,
+ "grad_norm": 7.12001371383667,
+ "learning_rate": 1.9021742395948668e-05,
+ "loss": 0.944,
+ "step": 6155
+ },
+ {
+ "epoch": 16.77384196185286,
+ "grad_norm": 8.560159683227539,
+ "learning_rate": 1.9021361677507316e-05,
+ "loss": 1.1262,
+ "step": 6156
+ },
+ {
+ "epoch": 16.77656675749319,
+ "grad_norm": 18.946989059448242,
+ "learning_rate": 1.902098088880789e-05,
+ "loss": 0.8376,
+ "step": 6157
+ },
+ {
+ "epoch": 16.779291553133515,
+ "grad_norm": 9.131311416625977,
+ "learning_rate": 1.902060002985335e-05,
+ "loss": 0.9604,
+ "step": 6158
+ },
+ {
+ "epoch": 16.78201634877384,
+ "grad_norm": 7.698740005493164,
+ "learning_rate": 1.9020219100646667e-05,
+ "loss": 0.9002,
+ "step": 6159
+ },
+ {
+ "epoch": 16.78474114441417,
+ "grad_norm": 14.020658493041992,
+ "learning_rate": 1.9019838101190812e-05,
+ "loss": 1.1304,
+ "step": 6160
+ },
+ {
+ "epoch": 16.787465940054496,
+ "grad_norm": 17.247962951660156,
+ "learning_rate": 1.9019457031488747e-05,
+ "loss": 0.9744,
+ "step": 6161
+ },
+ {
+ "epoch": 16.79019073569482,
+ "grad_norm": 9.009391784667969,
+ "learning_rate": 1.901907589154344e-05,
+ "loss": 0.786,
+ "step": 6162
+ },
+ {
+ "epoch": 16.79291553133515,
+ "grad_norm": 11.710041999816895,
+ "learning_rate": 1.9018694681357865e-05,
+ "loss": 1.1375,
+ "step": 6163
+ },
+ {
+ "epoch": 16.795640326975477,
+ "grad_norm": 8.075738906860352,
+ "learning_rate": 1.901831340093498e-05,
+ "loss": 0.9253,
+ "step": 6164
+ },
+ {
+ "epoch": 16.798365122615802,
+ "grad_norm": 8.50547981262207,
+ "learning_rate": 1.9017932050277762e-05,
+ "loss": 0.9177,
+ "step": 6165
+ },
+ {
+ "epoch": 16.80108991825613,
+ "grad_norm": 8.390825271606445,
+ "learning_rate": 1.901755062938918e-05,
+ "loss": 0.9508,
+ "step": 6166
+ },
+ {
+ "epoch": 16.803814713896458,
+ "grad_norm": 7.8770599365234375,
+ "learning_rate": 1.9017169138272203e-05,
+ "loss": 0.9116,
+ "step": 6167
+ },
+ {
+ "epoch": 16.806539509536783,
+ "grad_norm": 7.977993011474609,
+ "learning_rate": 1.9016787576929805e-05,
+ "loss": 0.9384,
+ "step": 6168
+ },
+ {
+ "epoch": 16.809264305177113,
+ "grad_norm": 8.234292984008789,
+ "learning_rate": 1.901640594536495e-05,
+ "loss": 0.9983,
+ "step": 6169
+ },
+ {
+ "epoch": 16.81198910081744,
+ "grad_norm": 16.994550704956055,
+ "learning_rate": 1.9016024243580626e-05,
+ "loss": 0.8649,
+ "step": 6170
+ },
+ {
+ "epoch": 16.814713896457764,
+ "grad_norm": 7.928983211517334,
+ "learning_rate": 1.9015642471579786e-05,
+ "loss": 1.0641,
+ "step": 6171
+ },
+ {
+ "epoch": 16.817438692098094,
+ "grad_norm": 6.782833576202393,
+ "learning_rate": 1.9015260629365417e-05,
+ "loss": 0.978,
+ "step": 6172
+ },
+ {
+ "epoch": 16.82016348773842,
+ "grad_norm": 7.612330436706543,
+ "learning_rate": 1.9014878716940487e-05,
+ "loss": 0.9536,
+ "step": 6173
+ },
+ {
+ "epoch": 16.822888283378745,
+ "grad_norm": 9.662505149841309,
+ "learning_rate": 1.9014496734307974e-05,
+ "loss": 0.8308,
+ "step": 6174
+ },
+ {
+ "epoch": 16.825613079019075,
+ "grad_norm": 9.241847038269043,
+ "learning_rate": 1.9014114681470847e-05,
+ "loss": 1.126,
+ "step": 6175
+ },
+ {
+ "epoch": 16.8283378746594,
+ "grad_norm": 11.356974601745605,
+ "learning_rate": 1.9013732558432086e-05,
+ "loss": 1.1019,
+ "step": 6176
+ },
+ {
+ "epoch": 16.831062670299726,
+ "grad_norm": 8.605137825012207,
+ "learning_rate": 1.901335036519467e-05,
+ "loss": 0.9619,
+ "step": 6177
+ },
+ {
+ "epoch": 16.833787465940055,
+ "grad_norm": 9.019730567932129,
+ "learning_rate": 1.9012968101761567e-05,
+ "loss": 1.014,
+ "step": 6178
+ },
+ {
+ "epoch": 16.83651226158038,
+ "grad_norm": 8.747864723205566,
+ "learning_rate": 1.901258576813576e-05,
+ "loss": 1.1597,
+ "step": 6179
+ },
+ {
+ "epoch": 16.839237057220707,
+ "grad_norm": 8.210248947143555,
+ "learning_rate": 1.9012203364320223e-05,
+ "loss": 0.9534,
+ "step": 6180
+ },
+ {
+ "epoch": 16.841961852861036,
+ "grad_norm": 8.457579612731934,
+ "learning_rate": 1.901182089031794e-05,
+ "loss": 0.9187,
+ "step": 6181
+ },
+ {
+ "epoch": 16.844686648501362,
+ "grad_norm": 7.20169734954834,
+ "learning_rate": 1.9011438346131882e-05,
+ "loss": 0.9009,
+ "step": 6182
+ },
+ {
+ "epoch": 16.847411444141688,
+ "grad_norm": 7.486141681671143,
+ "learning_rate": 1.9011055731765036e-05,
+ "loss": 0.894,
+ "step": 6183
+ },
+ {
+ "epoch": 16.850136239782017,
+ "grad_norm": 7.9857177734375,
+ "learning_rate": 1.9010673047220373e-05,
+ "loss": 1.1331,
+ "step": 6184
+ },
+ {
+ "epoch": 16.852861035422343,
+ "grad_norm": 11.257291793823242,
+ "learning_rate": 1.9010290292500883e-05,
+ "loss": 0.9967,
+ "step": 6185
+ },
+ {
+ "epoch": 16.85558583106267,
+ "grad_norm": 8.070331573486328,
+ "learning_rate": 1.9009907467609544e-05,
+ "loss": 0.8953,
+ "step": 6186
+ },
+ {
+ "epoch": 16.858310626703,
+ "grad_norm": 7.690113067626953,
+ "learning_rate": 1.900952457254933e-05,
+ "loss": 1.0862,
+ "step": 6187
+ },
+ {
+ "epoch": 16.861035422343324,
+ "grad_norm": 8.162193298339844,
+ "learning_rate": 1.900914160732323e-05,
+ "loss": 1.0521,
+ "step": 6188
+ },
+ {
+ "epoch": 16.86376021798365,
+ "grad_norm": 8.463749885559082,
+ "learning_rate": 1.900875857193423e-05,
+ "loss": 0.9612,
+ "step": 6189
+ },
+ {
+ "epoch": 16.86648501362398,
+ "grad_norm": 7.926802158355713,
+ "learning_rate": 1.90083754663853e-05,
+ "loss": 1.0518,
+ "step": 6190
+ },
+ {
+ "epoch": 16.869209809264305,
+ "grad_norm": 9.436305046081543,
+ "learning_rate": 1.9007992290679437e-05,
+ "loss": 0.9889,
+ "step": 6191
+ },
+ {
+ "epoch": 16.87193460490463,
+ "grad_norm": 6.777631759643555,
+ "learning_rate": 1.900760904481962e-05,
+ "loss": 0.861,
+ "step": 6192
+ },
+ {
+ "epoch": 16.87465940054496,
+ "grad_norm": 6.63100528717041,
+ "learning_rate": 1.900722572880883e-05,
+ "loss": 0.9363,
+ "step": 6193
+ },
+ {
+ "epoch": 16.877384196185286,
+ "grad_norm": 9.927841186523438,
+ "learning_rate": 1.900684234265006e-05,
+ "loss": 1.0352,
+ "step": 6194
+ },
+ {
+ "epoch": 16.88010899182561,
+ "grad_norm": 9.591605186462402,
+ "learning_rate": 1.900645888634629e-05,
+ "loss": 1.0769,
+ "step": 6195
+ },
+ {
+ "epoch": 16.88283378746594,
+ "grad_norm": 8.075156211853027,
+ "learning_rate": 1.9006075359900507e-05,
+ "loss": 0.8705,
+ "step": 6196
+ },
+ {
+ "epoch": 16.885558583106267,
+ "grad_norm": 8.7380952835083,
+ "learning_rate": 1.9005691763315703e-05,
+ "loss": 0.8654,
+ "step": 6197
+ },
+ {
+ "epoch": 16.888283378746593,
+ "grad_norm": 9.685803413391113,
+ "learning_rate": 1.9005308096594856e-05,
+ "loss": 0.9965,
+ "step": 6198
+ },
+ {
+ "epoch": 16.891008174386922,
+ "grad_norm": 9.106147766113281,
+ "learning_rate": 1.9004924359740965e-05,
+ "loss": 0.9927,
+ "step": 6199
+ },
+ {
+ "epoch": 16.893732970027248,
+ "grad_norm": 9.183213233947754,
+ "learning_rate": 1.9004540552757008e-05,
+ "loss": 0.9373,
+ "step": 6200
+ },
+ {
+ "epoch": 16.896457765667574,
+ "grad_norm": 10.00035572052002,
+ "learning_rate": 1.900415667564598e-05,
+ "loss": 1.0916,
+ "step": 6201
+ },
+ {
+ "epoch": 16.899182561307903,
+ "grad_norm": 7.394097805023193,
+ "learning_rate": 1.900377272841087e-05,
+ "loss": 0.856,
+ "step": 6202
+ },
+ {
+ "epoch": 16.90190735694823,
+ "grad_norm": 8.062369346618652,
+ "learning_rate": 1.900338871105467e-05,
+ "loss": 1.0668,
+ "step": 6203
+ },
+ {
+ "epoch": 16.904632152588555,
+ "grad_norm": 9.141656875610352,
+ "learning_rate": 1.9003004623580365e-05,
+ "loss": 1.0283,
+ "step": 6204
+ },
+ {
+ "epoch": 16.907356948228884,
+ "grad_norm": 9.296113967895508,
+ "learning_rate": 1.9002620465990952e-05,
+ "loss": 0.9728,
+ "step": 6205
+ },
+ {
+ "epoch": 16.91008174386921,
+ "grad_norm": 7.998512268066406,
+ "learning_rate": 1.900223623828942e-05,
+ "loss": 0.99,
+ "step": 6206
+ },
+ {
+ "epoch": 16.912806539509535,
+ "grad_norm": 6.6857829093933105,
+ "learning_rate": 1.9001851940478765e-05,
+ "loss": 0.9277,
+ "step": 6207
+ },
+ {
+ "epoch": 16.915531335149865,
+ "grad_norm": 8.054292678833008,
+ "learning_rate": 1.9001467572561974e-05,
+ "loss": 1.0079,
+ "step": 6208
+ },
+ {
+ "epoch": 16.91825613079019,
+ "grad_norm": 7.670961380004883,
+ "learning_rate": 1.900108313454204e-05,
+ "loss": 0.8792,
+ "step": 6209
+ },
+ {
+ "epoch": 16.920980926430516,
+ "grad_norm": 12.54238510131836,
+ "learning_rate": 1.9000698626421966e-05,
+ "loss": 1.0015,
+ "step": 6210
+ },
+ {
+ "epoch": 16.923705722070846,
+ "grad_norm": 8.54481029510498,
+ "learning_rate": 1.9000314048204736e-05,
+ "loss": 0.9761,
+ "step": 6211
+ },
+ {
+ "epoch": 16.92643051771117,
+ "grad_norm": 7.279057025909424,
+ "learning_rate": 1.899992939989335e-05,
+ "loss": 1.0864,
+ "step": 6212
+ },
+ {
+ "epoch": 16.929155313351497,
+ "grad_norm": 11.931070327758789,
+ "learning_rate": 1.8999544681490807e-05,
+ "loss": 0.9958,
+ "step": 6213
+ },
+ {
+ "epoch": 16.931880108991827,
+ "grad_norm": 8.158348083496094,
+ "learning_rate": 1.89991598930001e-05,
+ "loss": 0.9166,
+ "step": 6214
+ },
+ {
+ "epoch": 16.934604904632153,
+ "grad_norm": 9.551117897033691,
+ "learning_rate": 1.8998775034424222e-05,
+ "loss": 1.1122,
+ "step": 6215
+ },
+ {
+ "epoch": 16.93732970027248,
+ "grad_norm": 8.071077346801758,
+ "learning_rate": 1.8998390105766175e-05,
+ "loss": 0.8949,
+ "step": 6216
+ },
+ {
+ "epoch": 16.940054495912808,
+ "grad_norm": 8.414925575256348,
+ "learning_rate": 1.8998005107028956e-05,
+ "loss": 0.8184,
+ "step": 6217
+ },
+ {
+ "epoch": 16.942779291553133,
+ "grad_norm": 8.011565208435059,
+ "learning_rate": 1.8997620038215562e-05,
+ "loss": 0.9697,
+ "step": 6218
+ },
+ {
+ "epoch": 16.94550408719346,
+ "grad_norm": 15.543701171875,
+ "learning_rate": 1.8997234899328997e-05,
+ "loss": 0.9996,
+ "step": 6219
+ },
+ {
+ "epoch": 16.94822888283379,
+ "grad_norm": 18.687339782714844,
+ "learning_rate": 1.899684969037225e-05,
+ "loss": 0.816,
+ "step": 6220
+ },
+ {
+ "epoch": 16.950953678474114,
+ "grad_norm": 9.535623550415039,
+ "learning_rate": 1.899646441134833e-05,
+ "loss": 0.9839,
+ "step": 6221
+ },
+ {
+ "epoch": 16.95367847411444,
+ "grad_norm": 9.265975952148438,
+ "learning_rate": 1.8996079062260234e-05,
+ "loss": 1.0645,
+ "step": 6222
+ },
+ {
+ "epoch": 16.95640326975477,
+ "grad_norm": 8.745752334594727,
+ "learning_rate": 1.8995693643110964e-05,
+ "loss": 1.0349,
+ "step": 6223
+ },
+ {
+ "epoch": 16.959128065395095,
+ "grad_norm": 7.420135498046875,
+ "learning_rate": 1.899530815390352e-05,
+ "loss": 0.8781,
+ "step": 6224
+ },
+ {
+ "epoch": 16.96185286103542,
+ "grad_norm": 8.341424942016602,
+ "learning_rate": 1.8994922594640907e-05,
+ "loss": 0.9097,
+ "step": 6225
+ },
+ {
+ "epoch": 16.96457765667575,
+ "grad_norm": 7.917690753936768,
+ "learning_rate": 1.899453696532613e-05,
+ "loss": 1.1034,
+ "step": 6226
+ },
+ {
+ "epoch": 16.967302452316076,
+ "grad_norm": 8.074682235717773,
+ "learning_rate": 1.8994151265962184e-05,
+ "loss": 1.0903,
+ "step": 6227
+ },
+ {
+ "epoch": 16.970027247956402,
+ "grad_norm": 7.362932205200195,
+ "learning_rate": 1.8993765496552078e-05,
+ "loss": 0.9917,
+ "step": 6228
+ },
+ {
+ "epoch": 16.97275204359673,
+ "grad_norm": 8.595783233642578,
+ "learning_rate": 1.8993379657098815e-05,
+ "loss": 0.8716,
+ "step": 6229
+ },
+ {
+ "epoch": 16.975476839237057,
+ "grad_norm": 9.306862831115723,
+ "learning_rate": 1.89929937476054e-05,
+ "loss": 0.9995,
+ "step": 6230
+ },
+ {
+ "epoch": 16.978201634877383,
+ "grad_norm": 8.560187339782715,
+ "learning_rate": 1.899260776807484e-05,
+ "loss": 1.1692,
+ "step": 6231
+ },
+ {
+ "epoch": 16.980926430517712,
+ "grad_norm": 20.176673889160156,
+ "learning_rate": 1.8992221718510143e-05,
+ "loss": 0.8344,
+ "step": 6232
+ },
+ {
+ "epoch": 16.983651226158038,
+ "grad_norm": 8.303386688232422,
+ "learning_rate": 1.8991835598914313e-05,
+ "loss": 1.0613,
+ "step": 6233
+ },
+ {
+ "epoch": 16.986376021798364,
+ "grad_norm": 9.151183128356934,
+ "learning_rate": 1.8991449409290355e-05,
+ "loss": 1.098,
+ "step": 6234
+ },
+ {
+ "epoch": 16.989100817438693,
+ "grad_norm": 7.211446285247803,
+ "learning_rate": 1.8991063149641276e-05,
+ "loss": 1.0529,
+ "step": 6235
+ },
+ {
+ "epoch": 16.99182561307902,
+ "grad_norm": 9.654312133789062,
+ "learning_rate": 1.8990676819970087e-05,
+ "loss": 1.0745,
+ "step": 6236
+ },
+ {
+ "epoch": 16.994550408719345,
+ "grad_norm": 7.851251602172852,
+ "learning_rate": 1.89902904202798e-05,
+ "loss": 0.7695,
+ "step": 6237
+ },
+ {
+ "epoch": 16.997275204359674,
+ "grad_norm": 9.32390022277832,
+ "learning_rate": 1.8989903950573422e-05,
+ "loss": 1.0144,
+ "step": 6238
+ },
+ {
+ "epoch": 17.0,
+ "grad_norm": 8.421369552612305,
+ "learning_rate": 1.8989517410853956e-05,
+ "loss": 0.8492,
+ "step": 6239
+ },
+ {
+ "epoch": 17.002724795640326,
+ "grad_norm": 10.002796173095703,
+ "learning_rate": 1.898913080112442e-05,
+ "loss": 0.9569,
+ "step": 6240
+ },
+ {
+ "epoch": 17.005449591280655,
+ "grad_norm": 13.980656623840332,
+ "learning_rate": 1.898874412138782e-05,
+ "loss": 0.9341,
+ "step": 6241
+ },
+ {
+ "epoch": 17.00817438692098,
+ "grad_norm": 7.3156561851501465,
+ "learning_rate": 1.8988357371647173e-05,
+ "loss": 0.8428,
+ "step": 6242
+ },
+ {
+ "epoch": 17.010899182561307,
+ "grad_norm": 7.414515018463135,
+ "learning_rate": 1.898797055190549e-05,
+ "loss": 0.8074,
+ "step": 6243
+ },
+ {
+ "epoch": 17.013623978201636,
+ "grad_norm": 8.65429401397705,
+ "learning_rate": 1.8987583662165775e-05,
+ "loss": 0.7615,
+ "step": 6244
+ },
+ {
+ "epoch": 17.016348773841962,
+ "grad_norm": 7.639221668243408,
+ "learning_rate": 1.8987196702431053e-05,
+ "loss": 0.7936,
+ "step": 6245
+ },
+ {
+ "epoch": 17.019073569482288,
+ "grad_norm": 7.511865615844727,
+ "learning_rate": 1.8986809672704328e-05,
+ "loss": 0.7023,
+ "step": 6246
+ },
+ {
+ "epoch": 17.021798365122617,
+ "grad_norm": 6.386614799499512,
+ "learning_rate": 1.8986422572988626e-05,
+ "loss": 0.8512,
+ "step": 6247
+ },
+ {
+ "epoch": 17.024523160762943,
+ "grad_norm": 8.6180419921875,
+ "learning_rate": 1.8986035403286948e-05,
+ "loss": 1.0215,
+ "step": 6248
+ },
+ {
+ "epoch": 17.02724795640327,
+ "grad_norm": 9.61176872253418,
+ "learning_rate": 1.8985648163602318e-05,
+ "loss": 0.9308,
+ "step": 6249
+ },
+ {
+ "epoch": 17.029972752043598,
+ "grad_norm": 7.482372283935547,
+ "learning_rate": 1.898526085393775e-05,
+ "loss": 0.9282,
+ "step": 6250
+ },
+ {
+ "epoch": 17.032697547683924,
+ "grad_norm": 8.454015731811523,
+ "learning_rate": 1.8984873474296256e-05,
+ "loss": 0.7462,
+ "step": 6251
+ },
+ {
+ "epoch": 17.03542234332425,
+ "grad_norm": 7.860104560852051,
+ "learning_rate": 1.898448602468086e-05,
+ "loss": 0.9888,
+ "step": 6252
+ },
+ {
+ "epoch": 17.03814713896458,
+ "grad_norm": 8.912753105163574,
+ "learning_rate": 1.8984098505094574e-05,
+ "loss": 0.6791,
+ "step": 6253
+ },
+ {
+ "epoch": 17.040871934604905,
+ "grad_norm": 8.656185150146484,
+ "learning_rate": 1.898371091554042e-05,
+ "loss": 0.8683,
+ "step": 6254
+ },
+ {
+ "epoch": 17.04359673024523,
+ "grad_norm": 7.228968143463135,
+ "learning_rate": 1.8983323256021412e-05,
+ "loss": 0.8091,
+ "step": 6255
+ },
+ {
+ "epoch": 17.04632152588556,
+ "grad_norm": 7.749083995819092,
+ "learning_rate": 1.8982935526540572e-05,
+ "loss": 0.901,
+ "step": 6256
+ },
+ {
+ "epoch": 17.049046321525886,
+ "grad_norm": 8.07095718383789,
+ "learning_rate": 1.898254772710092e-05,
+ "loss": 0.8671,
+ "step": 6257
+ },
+ {
+ "epoch": 17.05177111716621,
+ "grad_norm": 8.128870010375977,
+ "learning_rate": 1.8982159857705475e-05,
+ "loss": 0.8062,
+ "step": 6258
+ },
+ {
+ "epoch": 17.05449591280654,
+ "grad_norm": 8.751575469970703,
+ "learning_rate": 1.8981771918357257e-05,
+ "loss": 0.9467,
+ "step": 6259
+ },
+ {
+ "epoch": 17.057220708446867,
+ "grad_norm": 6.564663410186768,
+ "learning_rate": 1.898138390905929e-05,
+ "loss": 1.0685,
+ "step": 6260
+ },
+ {
+ "epoch": 17.059945504087192,
+ "grad_norm": 11.437712669372559,
+ "learning_rate": 1.8980995829814593e-05,
+ "loss": 1.0762,
+ "step": 6261
+ },
+ {
+ "epoch": 17.06267029972752,
+ "grad_norm": 9.941190719604492,
+ "learning_rate": 1.8980607680626194e-05,
+ "loss": 0.713,
+ "step": 6262
+ },
+ {
+ "epoch": 17.065395095367847,
+ "grad_norm": 8.763118743896484,
+ "learning_rate": 1.8980219461497106e-05,
+ "loss": 0.7267,
+ "step": 6263
+ },
+ {
+ "epoch": 17.068119891008173,
+ "grad_norm": 8.583393096923828,
+ "learning_rate": 1.8979831172430364e-05,
+ "loss": 0.9388,
+ "step": 6264
+ },
+ {
+ "epoch": 17.070844686648503,
+ "grad_norm": 10.55490779876709,
+ "learning_rate": 1.897944281342898e-05,
+ "loss": 0.8036,
+ "step": 6265
+ },
+ {
+ "epoch": 17.07356948228883,
+ "grad_norm": 6.606943130493164,
+ "learning_rate": 1.8979054384495987e-05,
+ "loss": 0.8143,
+ "step": 6266
+ },
+ {
+ "epoch": 17.076294277929154,
+ "grad_norm": 8.044092178344727,
+ "learning_rate": 1.8978665885634406e-05,
+ "loss": 0.8848,
+ "step": 6267
+ },
+ {
+ "epoch": 17.079019073569484,
+ "grad_norm": 8.02966594696045,
+ "learning_rate": 1.8978277316847265e-05,
+ "loss": 0.8705,
+ "step": 6268
+ },
+ {
+ "epoch": 17.08174386920981,
+ "grad_norm": 7.176367282867432,
+ "learning_rate": 1.897788867813759e-05,
+ "loss": 0.874,
+ "step": 6269
+ },
+ {
+ "epoch": 17.084468664850135,
+ "grad_norm": 8.880574226379395,
+ "learning_rate": 1.8977499969508405e-05,
+ "loss": 0.9612,
+ "step": 6270
+ },
+ {
+ "epoch": 17.087193460490465,
+ "grad_norm": 8.524381637573242,
+ "learning_rate": 1.897711119096274e-05,
+ "loss": 0.7632,
+ "step": 6271
+ },
+ {
+ "epoch": 17.08991825613079,
+ "grad_norm": 7.7911810874938965,
+ "learning_rate": 1.897672234250362e-05,
+ "loss": 0.8545,
+ "step": 6272
+ },
+ {
+ "epoch": 17.092643051771116,
+ "grad_norm": 6.824251174926758,
+ "learning_rate": 1.897633342413408e-05,
+ "loss": 0.7018,
+ "step": 6273
+ },
+ {
+ "epoch": 17.095367847411445,
+ "grad_norm": 8.821577072143555,
+ "learning_rate": 1.897594443585714e-05,
+ "loss": 0.916,
+ "step": 6274
+ },
+ {
+ "epoch": 17.09809264305177,
+ "grad_norm": 10.299895286560059,
+ "learning_rate": 1.8975555377675835e-05,
+ "loss": 0.8342,
+ "step": 6275
+ },
+ {
+ "epoch": 17.100817438692097,
+ "grad_norm": 17.8612117767334,
+ "learning_rate": 1.8975166249593194e-05,
+ "loss": 0.8192,
+ "step": 6276
+ },
+ {
+ "epoch": 17.103542234332426,
+ "grad_norm": 8.529385566711426,
+ "learning_rate": 1.897477705161225e-05,
+ "loss": 0.858,
+ "step": 6277
+ },
+ {
+ "epoch": 17.106267029972752,
+ "grad_norm": 6.327038288116455,
+ "learning_rate": 1.8974387783736022e-05,
+ "loss": 0.9072,
+ "step": 6278
+ },
+ {
+ "epoch": 17.108991825613078,
+ "grad_norm": 7.227954864501953,
+ "learning_rate": 1.897399844596756e-05,
+ "loss": 0.9475,
+ "step": 6279
+ },
+ {
+ "epoch": 17.111716621253407,
+ "grad_norm": 8.278307914733887,
+ "learning_rate": 1.8973609038309883e-05,
+ "loss": 0.8021,
+ "step": 6280
+ },
+ {
+ "epoch": 17.114441416893733,
+ "grad_norm": 8.912012100219727,
+ "learning_rate": 1.897321956076603e-05,
+ "loss": 0.8528,
+ "step": 6281
+ },
+ {
+ "epoch": 17.11716621253406,
+ "grad_norm": 8.555465698242188,
+ "learning_rate": 1.897283001333903e-05,
+ "loss": 0.7938,
+ "step": 6282
+ },
+ {
+ "epoch": 17.11989100817439,
+ "grad_norm": 11.952853202819824,
+ "learning_rate": 1.8972440396031916e-05,
+ "loss": 0.96,
+ "step": 6283
+ },
+ {
+ "epoch": 17.122615803814714,
+ "grad_norm": 7.701216220855713,
+ "learning_rate": 1.897205070884773e-05,
+ "loss": 0.8625,
+ "step": 6284
+ },
+ {
+ "epoch": 17.12534059945504,
+ "grad_norm": 9.567951202392578,
+ "learning_rate": 1.89716609517895e-05,
+ "loss": 1.071,
+ "step": 6285
+ },
+ {
+ "epoch": 17.12806539509537,
+ "grad_norm": 7.93927526473999,
+ "learning_rate": 1.8971271124860263e-05,
+ "loss": 1.0347,
+ "step": 6286
+ },
+ {
+ "epoch": 17.130790190735695,
+ "grad_norm": 8.100805282592773,
+ "learning_rate": 1.8970881228063055e-05,
+ "loss": 0.7579,
+ "step": 6287
+ },
+ {
+ "epoch": 17.13351498637602,
+ "grad_norm": 8.478625297546387,
+ "learning_rate": 1.8970491261400913e-05,
+ "loss": 0.9678,
+ "step": 6288
+ },
+ {
+ "epoch": 17.13623978201635,
+ "grad_norm": 8.492572784423828,
+ "learning_rate": 1.8970101224876872e-05,
+ "loss": 0.8484,
+ "step": 6289
+ },
+ {
+ "epoch": 17.138964577656676,
+ "grad_norm": 8.242562294006348,
+ "learning_rate": 1.8969711118493976e-05,
+ "loss": 0.9191,
+ "step": 6290
+ },
+ {
+ "epoch": 17.141689373297,
+ "grad_norm": 9.903480529785156,
+ "learning_rate": 1.8969320942255252e-05,
+ "loss": 0.9205,
+ "step": 6291
+ },
+ {
+ "epoch": 17.14441416893733,
+ "grad_norm": 8.240567207336426,
+ "learning_rate": 1.896893069616375e-05,
+ "loss": 0.8055,
+ "step": 6292
+ },
+ {
+ "epoch": 17.147138964577657,
+ "grad_norm": 9.593177795410156,
+ "learning_rate": 1.89685403802225e-05,
+ "loss": 1.0905,
+ "step": 6293
+ },
+ {
+ "epoch": 17.149863760217983,
+ "grad_norm": 7.517264366149902,
+ "learning_rate": 1.8968149994434552e-05,
+ "loss": 0.8064,
+ "step": 6294
+ },
+ {
+ "epoch": 17.152588555858312,
+ "grad_norm": 8.686984062194824,
+ "learning_rate": 1.896775953880294e-05,
+ "loss": 0.9446,
+ "step": 6295
+ },
+ {
+ "epoch": 17.155313351498638,
+ "grad_norm": 8.225557327270508,
+ "learning_rate": 1.8967369013330702e-05,
+ "loss": 0.8792,
+ "step": 6296
+ },
+ {
+ "epoch": 17.158038147138964,
+ "grad_norm": 8.14830493927002,
+ "learning_rate": 1.8966978418020883e-05,
+ "loss": 0.924,
+ "step": 6297
+ },
+ {
+ "epoch": 17.160762942779293,
+ "grad_norm": 7.562781810760498,
+ "learning_rate": 1.8966587752876524e-05,
+ "loss": 0.895,
+ "step": 6298
+ },
+ {
+ "epoch": 17.16348773841962,
+ "grad_norm": 8.645089149475098,
+ "learning_rate": 1.8966197017900672e-05,
+ "loss": 0.9468,
+ "step": 6299
+ },
+ {
+ "epoch": 17.166212534059945,
+ "grad_norm": 10.737967491149902,
+ "learning_rate": 1.8965806213096363e-05,
+ "loss": 0.8529,
+ "step": 6300
+ },
+ {
+ "epoch": 17.168937329700274,
+ "grad_norm": 9.399730682373047,
+ "learning_rate": 1.8965415338466645e-05,
+ "loss": 0.9579,
+ "step": 6301
+ },
+ {
+ "epoch": 17.1716621253406,
+ "grad_norm": 7.219324588775635,
+ "learning_rate": 1.896502439401456e-05,
+ "loss": 0.8975,
+ "step": 6302
+ },
+ {
+ "epoch": 17.174386920980925,
+ "grad_norm": 9.04008960723877,
+ "learning_rate": 1.8964633379743154e-05,
+ "loss": 0.927,
+ "step": 6303
+ },
+ {
+ "epoch": 17.177111716621255,
+ "grad_norm": 7.370367527008057,
+ "learning_rate": 1.8964242295655473e-05,
+ "loss": 0.7427,
+ "step": 6304
+ },
+ {
+ "epoch": 17.17983651226158,
+ "grad_norm": 9.304048538208008,
+ "learning_rate": 1.8963851141754558e-05,
+ "loss": 1.1201,
+ "step": 6305
+ },
+ {
+ "epoch": 17.182561307901906,
+ "grad_norm": 7.377665042877197,
+ "learning_rate": 1.8963459918043463e-05,
+ "loss": 0.9453,
+ "step": 6306
+ },
+ {
+ "epoch": 17.185286103542236,
+ "grad_norm": 7.910454273223877,
+ "learning_rate": 1.896306862452523e-05,
+ "loss": 0.7621,
+ "step": 6307
+ },
+ {
+ "epoch": 17.18801089918256,
+ "grad_norm": 10.67541790008545,
+ "learning_rate": 1.8962677261202905e-05,
+ "loss": 1.0029,
+ "step": 6308
+ },
+ {
+ "epoch": 17.190735694822887,
+ "grad_norm": 9.604737281799316,
+ "learning_rate": 1.896228582807954e-05,
+ "loss": 0.876,
+ "step": 6309
+ },
+ {
+ "epoch": 17.193460490463217,
+ "grad_norm": 10.053817749023438,
+ "learning_rate": 1.896189432515818e-05,
+ "loss": 0.8694,
+ "step": 6310
+ },
+ {
+ "epoch": 17.196185286103542,
+ "grad_norm": 9.115626335144043,
+ "learning_rate": 1.8961502752441875e-05,
+ "loss": 0.9108,
+ "step": 6311
+ },
+ {
+ "epoch": 17.19891008174387,
+ "grad_norm": 7.803097724914551,
+ "learning_rate": 1.8961111109933673e-05,
+ "loss": 1.002,
+ "step": 6312
+ },
+ {
+ "epoch": 17.201634877384198,
+ "grad_norm": 9.898059844970703,
+ "learning_rate": 1.896071939763663e-05,
+ "loss": 0.9833,
+ "step": 6313
+ },
+ {
+ "epoch": 17.204359673024523,
+ "grad_norm": 9.695001602172852,
+ "learning_rate": 1.8960327615553794e-05,
+ "loss": 0.8746,
+ "step": 6314
+ },
+ {
+ "epoch": 17.20708446866485,
+ "grad_norm": 7.691354274749756,
+ "learning_rate": 1.8959935763688212e-05,
+ "loss": 0.991,
+ "step": 6315
+ },
+ {
+ "epoch": 17.20980926430518,
+ "grad_norm": 9.531713485717773,
+ "learning_rate": 1.895954384204294e-05,
+ "loss": 0.8604,
+ "step": 6316
+ },
+ {
+ "epoch": 17.212534059945504,
+ "grad_norm": 8.945476531982422,
+ "learning_rate": 1.8959151850621025e-05,
+ "loss": 0.9231,
+ "step": 6317
+ },
+ {
+ "epoch": 17.21525885558583,
+ "grad_norm": 8.44931411743164,
+ "learning_rate": 1.895875978942553e-05,
+ "loss": 0.9095,
+ "step": 6318
+ },
+ {
+ "epoch": 17.21798365122616,
+ "grad_norm": 12.240138053894043,
+ "learning_rate": 1.8958367658459494e-05,
+ "loss": 0.8,
+ "step": 6319
+ },
+ {
+ "epoch": 17.220708446866485,
+ "grad_norm": 9.020398139953613,
+ "learning_rate": 1.8957975457725985e-05,
+ "loss": 0.9055,
+ "step": 6320
+ },
+ {
+ "epoch": 17.22343324250681,
+ "grad_norm": 10.042925834655762,
+ "learning_rate": 1.895758318722805e-05,
+ "loss": 1.037,
+ "step": 6321
+ },
+ {
+ "epoch": 17.22615803814714,
+ "grad_norm": 10.284613609313965,
+ "learning_rate": 1.8957190846968747e-05,
+ "loss": 0.8844,
+ "step": 6322
+ },
+ {
+ "epoch": 17.228882833787466,
+ "grad_norm": 8.101875305175781,
+ "learning_rate": 1.895679843695113e-05,
+ "loss": 0.8673,
+ "step": 6323
+ },
+ {
+ "epoch": 17.231607629427792,
+ "grad_norm": 8.890040397644043,
+ "learning_rate": 1.8956405957178253e-05,
+ "loss": 1.0253,
+ "step": 6324
+ },
+ {
+ "epoch": 17.23433242506812,
+ "grad_norm": 9.763956069946289,
+ "learning_rate": 1.8956013407653175e-05,
+ "loss": 0.7611,
+ "step": 6325
+ },
+ {
+ "epoch": 17.237057220708447,
+ "grad_norm": 11.538614273071289,
+ "learning_rate": 1.895562078837895e-05,
+ "loss": 1.0217,
+ "step": 6326
+ },
+ {
+ "epoch": 17.239782016348773,
+ "grad_norm": 7.710923194885254,
+ "learning_rate": 1.8955228099358646e-05,
+ "loss": 0.9299,
+ "step": 6327
+ },
+ {
+ "epoch": 17.242506811989102,
+ "grad_norm": 7.830203056335449,
+ "learning_rate": 1.8954835340595305e-05,
+ "loss": 0.8936,
+ "step": 6328
+ },
+ {
+ "epoch": 17.245231607629428,
+ "grad_norm": 8.240415573120117,
+ "learning_rate": 1.8954442512092e-05,
+ "loss": 0.7858,
+ "step": 6329
+ },
+ {
+ "epoch": 17.247956403269754,
+ "grad_norm": 9.944801330566406,
+ "learning_rate": 1.8954049613851783e-05,
+ "loss": 1.1096,
+ "step": 6330
+ },
+ {
+ "epoch": 17.250681198910083,
+ "grad_norm": 11.277527809143066,
+ "learning_rate": 1.895365664587772e-05,
+ "loss": 1.0118,
+ "step": 6331
+ },
+ {
+ "epoch": 17.25340599455041,
+ "grad_norm": 8.25351619720459,
+ "learning_rate": 1.8953263608172864e-05,
+ "loss": 0.9305,
+ "step": 6332
+ },
+ {
+ "epoch": 17.256130790190735,
+ "grad_norm": 13.284163475036621,
+ "learning_rate": 1.895287050074028e-05,
+ "loss": 0.9869,
+ "step": 6333
+ },
+ {
+ "epoch": 17.258855585831064,
+ "grad_norm": 11.260553359985352,
+ "learning_rate": 1.8952477323583024e-05,
+ "loss": 0.864,
+ "step": 6334
+ },
+ {
+ "epoch": 17.26158038147139,
+ "grad_norm": 6.351672649383545,
+ "learning_rate": 1.895208407670417e-05,
+ "loss": 0.811,
+ "step": 6335
+ },
+ {
+ "epoch": 17.264305177111716,
+ "grad_norm": 9.822250366210938,
+ "learning_rate": 1.895169076010677e-05,
+ "loss": 0.9417,
+ "step": 6336
+ },
+ {
+ "epoch": 17.267029972752045,
+ "grad_norm": 8.968976974487305,
+ "learning_rate": 1.895129737379389e-05,
+ "loss": 1.0801,
+ "step": 6337
+ },
+ {
+ "epoch": 17.26975476839237,
+ "grad_norm": 9.320754051208496,
+ "learning_rate": 1.8950903917768594e-05,
+ "loss": 0.9358,
+ "step": 6338
+ },
+ {
+ "epoch": 17.272479564032697,
+ "grad_norm": 9.100393295288086,
+ "learning_rate": 1.8950510392033945e-05,
+ "loss": 1.0525,
+ "step": 6339
+ },
+ {
+ "epoch": 17.275204359673026,
+ "grad_norm": 10.278422355651855,
+ "learning_rate": 1.8950116796593013e-05,
+ "loss": 0.8978,
+ "step": 6340
+ },
+ {
+ "epoch": 17.277929155313352,
+ "grad_norm": 9.044394493103027,
+ "learning_rate": 1.894972313144886e-05,
+ "loss": 0.8734,
+ "step": 6341
+ },
+ {
+ "epoch": 17.280653950953678,
+ "grad_norm": 9.296480178833008,
+ "learning_rate": 1.8949329396604544e-05,
+ "loss": 0.8167,
+ "step": 6342
+ },
+ {
+ "epoch": 17.283378746594007,
+ "grad_norm": 10.087651252746582,
+ "learning_rate": 1.8948935592063145e-05,
+ "loss": 0.9,
+ "step": 6343
+ },
+ {
+ "epoch": 17.286103542234333,
+ "grad_norm": 9.543252944946289,
+ "learning_rate": 1.8948541717827723e-05,
+ "loss": 0.995,
+ "step": 6344
+ },
+ {
+ "epoch": 17.28882833787466,
+ "grad_norm": 7.406209468841553,
+ "learning_rate": 1.8948147773901343e-05,
+ "loss": 0.9407,
+ "step": 6345
+ },
+ {
+ "epoch": 17.291553133514988,
+ "grad_norm": 10.631805419921875,
+ "learning_rate": 1.894775376028708e-05,
+ "loss": 0.8137,
+ "step": 6346
+ },
+ {
+ "epoch": 17.294277929155314,
+ "grad_norm": 7.886234283447266,
+ "learning_rate": 1.8947359676988e-05,
+ "loss": 0.7477,
+ "step": 6347
+ },
+ {
+ "epoch": 17.29700272479564,
+ "grad_norm": 7.540974140167236,
+ "learning_rate": 1.8946965524007166e-05,
+ "loss": 0.8324,
+ "step": 6348
+ },
+ {
+ "epoch": 17.29972752043597,
+ "grad_norm": 8.333446502685547,
+ "learning_rate": 1.8946571301347654e-05,
+ "loss": 0.8212,
+ "step": 6349
+ },
+ {
+ "epoch": 17.302452316076295,
+ "grad_norm": 8.617403030395508,
+ "learning_rate": 1.894617700901253e-05,
+ "loss": 1.0049,
+ "step": 6350
+ },
+ {
+ "epoch": 17.30517711171662,
+ "grad_norm": 9.715551376342773,
+ "learning_rate": 1.894578264700487e-05,
+ "loss": 0.8395,
+ "step": 6351
+ },
+ {
+ "epoch": 17.30790190735695,
+ "grad_norm": 10.217767715454102,
+ "learning_rate": 1.8945388215327746e-05,
+ "loss": 0.9055,
+ "step": 6352
+ },
+ {
+ "epoch": 17.310626702997276,
+ "grad_norm": 102.19203186035156,
+ "learning_rate": 1.8944993713984224e-05,
+ "loss": 1.031,
+ "step": 6353
+ },
+ {
+ "epoch": 17.3133514986376,
+ "grad_norm": 8.108960151672363,
+ "learning_rate": 1.8944599142977378e-05,
+ "loss": 0.8411,
+ "step": 6354
+ },
+ {
+ "epoch": 17.31607629427793,
+ "grad_norm": 9.639787673950195,
+ "learning_rate": 1.8944204502310282e-05,
+ "loss": 0.9253,
+ "step": 6355
+ },
+ {
+ "epoch": 17.318801089918257,
+ "grad_norm": 8.786418914794922,
+ "learning_rate": 1.894380979198601e-05,
+ "loss": 0.9468,
+ "step": 6356
+ },
+ {
+ "epoch": 17.321525885558582,
+ "grad_norm": 9.127197265625,
+ "learning_rate": 1.8943415012007634e-05,
+ "loss": 0.9567,
+ "step": 6357
+ },
+ {
+ "epoch": 17.32425068119891,
+ "grad_norm": 9.39046859741211,
+ "learning_rate": 1.8943020162378228e-05,
+ "loss": 0.8103,
+ "step": 6358
+ },
+ {
+ "epoch": 17.326975476839237,
+ "grad_norm": 9.742119789123535,
+ "learning_rate": 1.8942625243100874e-05,
+ "loss": 0.9304,
+ "step": 6359
+ },
+ {
+ "epoch": 17.329700272479563,
+ "grad_norm": 7.917878150939941,
+ "learning_rate": 1.8942230254178638e-05,
+ "loss": 0.8494,
+ "step": 6360
+ },
+ {
+ "epoch": 17.332425068119893,
+ "grad_norm": 8.42175579071045,
+ "learning_rate": 1.8941835195614603e-05,
+ "loss": 0.9329,
+ "step": 6361
+ },
+ {
+ "epoch": 17.33514986376022,
+ "grad_norm": 10.603105545043945,
+ "learning_rate": 1.894144006741184e-05,
+ "loss": 0.9562,
+ "step": 6362
+ },
+ {
+ "epoch": 17.337874659400544,
+ "grad_norm": 8.681341171264648,
+ "learning_rate": 1.8941044869573433e-05,
+ "loss": 0.9583,
+ "step": 6363
+ },
+ {
+ "epoch": 17.340599455040874,
+ "grad_norm": 10.419084548950195,
+ "learning_rate": 1.8940649602102454e-05,
+ "loss": 0.8289,
+ "step": 6364
+ },
+ {
+ "epoch": 17.3433242506812,
+ "grad_norm": 10.981396675109863,
+ "learning_rate": 1.8940254265001986e-05,
+ "loss": 0.92,
+ "step": 6365
+ },
+ {
+ "epoch": 17.346049046321525,
+ "grad_norm": 11.663156509399414,
+ "learning_rate": 1.8939858858275104e-05,
+ "loss": 1.0793,
+ "step": 6366
+ },
+ {
+ "epoch": 17.348773841961854,
+ "grad_norm": 8.68185043334961,
+ "learning_rate": 1.893946338192489e-05,
+ "loss": 1.0023,
+ "step": 6367
+ },
+ {
+ "epoch": 17.35149863760218,
+ "grad_norm": 8.913244247436523,
+ "learning_rate": 1.8939067835954423e-05,
+ "loss": 0.8899,
+ "step": 6368
+ },
+ {
+ "epoch": 17.354223433242506,
+ "grad_norm": 10.504867553710938,
+ "learning_rate": 1.8938672220366784e-05,
+ "loss": 0.8185,
+ "step": 6369
+ },
+ {
+ "epoch": 17.356948228882835,
+ "grad_norm": 9.94072437286377,
+ "learning_rate": 1.893827653516505e-05,
+ "loss": 0.9678,
+ "step": 6370
+ },
+ {
+ "epoch": 17.35967302452316,
+ "grad_norm": 8.40544605255127,
+ "learning_rate": 1.8937880780352307e-05,
+ "loss": 1.281,
+ "step": 6371
+ },
+ {
+ "epoch": 17.362397820163487,
+ "grad_norm": 8.515037536621094,
+ "learning_rate": 1.893748495593164e-05,
+ "loss": 0.9246,
+ "step": 6372
+ },
+ {
+ "epoch": 17.365122615803816,
+ "grad_norm": 10.380634307861328,
+ "learning_rate": 1.8937089061906123e-05,
+ "loss": 1.0804,
+ "step": 6373
+ },
+ {
+ "epoch": 17.367847411444142,
+ "grad_norm": 8.567737579345703,
+ "learning_rate": 1.8936693098278846e-05,
+ "loss": 1.0319,
+ "step": 6374
+ },
+ {
+ "epoch": 17.370572207084468,
+ "grad_norm": 9.313538551330566,
+ "learning_rate": 1.893629706505289e-05,
+ "loss": 1.0248,
+ "step": 6375
+ },
+ {
+ "epoch": 17.373297002724797,
+ "grad_norm": 7.999496936798096,
+ "learning_rate": 1.8935900962231342e-05,
+ "loss": 0.9978,
+ "step": 6376
+ },
+ {
+ "epoch": 17.376021798365123,
+ "grad_norm": 64.70576477050781,
+ "learning_rate": 1.8935504789817284e-05,
+ "loss": 0.8835,
+ "step": 6377
+ },
+ {
+ "epoch": 17.37874659400545,
+ "grad_norm": 7.945390224456787,
+ "learning_rate": 1.89351085478138e-05,
+ "loss": 0.891,
+ "step": 6378
+ },
+ {
+ "epoch": 17.381471389645778,
+ "grad_norm": 10.59921932220459,
+ "learning_rate": 1.8934712236223984e-05,
+ "loss": 0.8534,
+ "step": 6379
+ },
+ {
+ "epoch": 17.384196185286104,
+ "grad_norm": 9.016999244689941,
+ "learning_rate": 1.893431585505091e-05,
+ "loss": 0.8776,
+ "step": 6380
+ },
+ {
+ "epoch": 17.38692098092643,
+ "grad_norm": 9.705224990844727,
+ "learning_rate": 1.8933919404297676e-05,
+ "loss": 0.9087,
+ "step": 6381
+ },
+ {
+ "epoch": 17.38964577656676,
+ "grad_norm": 8.3832426071167,
+ "learning_rate": 1.8933522883967363e-05,
+ "loss": 0.8979,
+ "step": 6382
+ },
+ {
+ "epoch": 17.392370572207085,
+ "grad_norm": 8.460915565490723,
+ "learning_rate": 1.893312629406306e-05,
+ "loss": 0.9712,
+ "step": 6383
+ },
+ {
+ "epoch": 17.39509536784741,
+ "grad_norm": 11.178568840026855,
+ "learning_rate": 1.8932729634587863e-05,
+ "loss": 0.9543,
+ "step": 6384
+ },
+ {
+ "epoch": 17.39782016348774,
+ "grad_norm": 8.727524757385254,
+ "learning_rate": 1.893233290554485e-05,
+ "loss": 0.9111,
+ "step": 6385
+ },
+ {
+ "epoch": 17.400544959128066,
+ "grad_norm": 9.653977394104004,
+ "learning_rate": 1.8931936106937116e-05,
+ "loss": 0.8831,
+ "step": 6386
+ },
+ {
+ "epoch": 17.40326975476839,
+ "grad_norm": 8.617438316345215,
+ "learning_rate": 1.8931539238767753e-05,
+ "loss": 0.8729,
+ "step": 6387
+ },
+ {
+ "epoch": 17.40599455040872,
+ "grad_norm": 11.906661033630371,
+ "learning_rate": 1.893114230103985e-05,
+ "loss": 0.8965,
+ "step": 6388
+ },
+ {
+ "epoch": 17.408719346049047,
+ "grad_norm": 8.372017860412598,
+ "learning_rate": 1.8930745293756496e-05,
+ "loss": 0.9081,
+ "step": 6389
+ },
+ {
+ "epoch": 17.411444141689373,
+ "grad_norm": 10.073421478271484,
+ "learning_rate": 1.8930348216920786e-05,
+ "loss": 0.8654,
+ "step": 6390
+ },
+ {
+ "epoch": 17.414168937329702,
+ "grad_norm": 10.309469223022461,
+ "learning_rate": 1.8929951070535814e-05,
+ "loss": 1.1105,
+ "step": 6391
+ },
+ {
+ "epoch": 17.416893732970028,
+ "grad_norm": 8.19256591796875,
+ "learning_rate": 1.8929553854604667e-05,
+ "loss": 0.9758,
+ "step": 6392
+ },
+ {
+ "epoch": 17.419618528610354,
+ "grad_norm": 8.794842720031738,
+ "learning_rate": 1.892915656913044e-05,
+ "loss": 0.8052,
+ "step": 6393
+ },
+ {
+ "epoch": 17.422343324250683,
+ "grad_norm": 9.917633056640625,
+ "learning_rate": 1.8928759214116236e-05,
+ "loss": 1.0466,
+ "step": 6394
+ },
+ {
+ "epoch": 17.42506811989101,
+ "grad_norm": 7.508038520812988,
+ "learning_rate": 1.8928361789565136e-05,
+ "loss": 0.8617,
+ "step": 6395
+ },
+ {
+ "epoch": 17.427792915531334,
+ "grad_norm": 10.217451095581055,
+ "learning_rate": 1.8927964295480244e-05,
+ "loss": 0.9473,
+ "step": 6396
+ },
+ {
+ "epoch": 17.430517711171664,
+ "grad_norm": 9.991721153259277,
+ "learning_rate": 1.8927566731864658e-05,
+ "loss": 1.0593,
+ "step": 6397
+ },
+ {
+ "epoch": 17.43324250681199,
+ "grad_norm": 7.884134292602539,
+ "learning_rate": 1.8927169098721462e-05,
+ "loss": 1.0217,
+ "step": 6398
+ },
+ {
+ "epoch": 17.435967302452315,
+ "grad_norm": 9.229854583740234,
+ "learning_rate": 1.892677139605377e-05,
+ "loss": 1.0544,
+ "step": 6399
+ },
+ {
+ "epoch": 17.438692098092645,
+ "grad_norm": 10.268136024475098,
+ "learning_rate": 1.892637362386466e-05,
+ "loss": 0.9286,
+ "step": 6400
+ },
+ {
+ "epoch": 17.44141689373297,
+ "grad_norm": 10.877610206604004,
+ "learning_rate": 1.8925975782157243e-05,
+ "loss": 1.0356,
+ "step": 6401
+ },
+ {
+ "epoch": 17.444141689373296,
+ "grad_norm": 10.455604553222656,
+ "learning_rate": 1.8925577870934612e-05,
+ "loss": 0.809,
+ "step": 6402
+ },
+ {
+ "epoch": 17.446866485013626,
+ "grad_norm": 8.860418319702148,
+ "learning_rate": 1.8925179890199873e-05,
+ "loss": 0.9276,
+ "step": 6403
+ },
+ {
+ "epoch": 17.44959128065395,
+ "grad_norm": 8.77723503112793,
+ "learning_rate": 1.8924781839956116e-05,
+ "loss": 1.0107,
+ "step": 6404
+ },
+ {
+ "epoch": 17.452316076294277,
+ "grad_norm": 9.204261779785156,
+ "learning_rate": 1.8924383720206445e-05,
+ "loss": 1.035,
+ "step": 6405
+ },
+ {
+ "epoch": 17.455040871934607,
+ "grad_norm": 10.360713005065918,
+ "learning_rate": 1.8923985530953963e-05,
+ "loss": 0.999,
+ "step": 6406
+ },
+ {
+ "epoch": 17.457765667574932,
+ "grad_norm": 12.03943920135498,
+ "learning_rate": 1.892358727220177e-05,
+ "loss": 0.9657,
+ "step": 6407
+ },
+ {
+ "epoch": 17.460490463215258,
+ "grad_norm": 9.930057525634766,
+ "learning_rate": 1.892318894395296e-05,
+ "loss": 1.1375,
+ "step": 6408
+ },
+ {
+ "epoch": 17.463215258855588,
+ "grad_norm": 7.339794158935547,
+ "learning_rate": 1.892279054621065e-05,
+ "loss": 0.7582,
+ "step": 6409
+ },
+ {
+ "epoch": 17.465940054495913,
+ "grad_norm": 13.046171188354492,
+ "learning_rate": 1.892239207897793e-05,
+ "loss": 0.934,
+ "step": 6410
+ },
+ {
+ "epoch": 17.46866485013624,
+ "grad_norm": 8.831766128540039,
+ "learning_rate": 1.892199354225791e-05,
+ "loss": 0.9197,
+ "step": 6411
+ },
+ {
+ "epoch": 17.47138964577657,
+ "grad_norm": 8.978260040283203,
+ "learning_rate": 1.8921594936053686e-05,
+ "loss": 1.1469,
+ "step": 6412
+ },
+ {
+ "epoch": 17.474114441416894,
+ "grad_norm": 8.057010650634766,
+ "learning_rate": 1.8921196260368374e-05,
+ "loss": 0.7601,
+ "step": 6413
+ },
+ {
+ "epoch": 17.47683923705722,
+ "grad_norm": 10.006945610046387,
+ "learning_rate": 1.892079751520507e-05,
+ "loss": 0.7833,
+ "step": 6414
+ },
+ {
+ "epoch": 17.479564032697546,
+ "grad_norm": 9.494051933288574,
+ "learning_rate": 1.8920398700566884e-05,
+ "loss": 0.8442,
+ "step": 6415
+ },
+ {
+ "epoch": 17.482288828337875,
+ "grad_norm": 10.400253295898438,
+ "learning_rate": 1.8919999816456917e-05,
+ "loss": 0.9158,
+ "step": 6416
+ },
+ {
+ "epoch": 17.4850136239782,
+ "grad_norm": 10.488839149475098,
+ "learning_rate": 1.8919600862878282e-05,
+ "loss": 0.8466,
+ "step": 6417
+ },
+ {
+ "epoch": 17.48773841961853,
+ "grad_norm": 7.895549774169922,
+ "learning_rate": 1.8919201839834078e-05,
+ "loss": 1.0416,
+ "step": 6418
+ },
+ {
+ "epoch": 17.490463215258856,
+ "grad_norm": 9.203743934631348,
+ "learning_rate": 1.891880274732742e-05,
+ "loss": 0.908,
+ "step": 6419
+ },
+ {
+ "epoch": 17.493188010899182,
+ "grad_norm": 6.967998027801514,
+ "learning_rate": 1.891840358536141e-05,
+ "loss": 0.7302,
+ "step": 6420
+ },
+ {
+ "epoch": 17.495912806539508,
+ "grad_norm": 7.7992329597473145,
+ "learning_rate": 1.8918004353939166e-05,
+ "loss": 0.8354,
+ "step": 6421
+ },
+ {
+ "epoch": 17.498637602179837,
+ "grad_norm": 10.46932315826416,
+ "learning_rate": 1.891760505306379e-05,
+ "loss": 0.958,
+ "step": 6422
+ },
+ {
+ "epoch": 17.501362397820163,
+ "grad_norm": 10.07521915435791,
+ "learning_rate": 1.8917205682738387e-05,
+ "loss": 0.8993,
+ "step": 6423
+ },
+ {
+ "epoch": 17.504087193460492,
+ "grad_norm": 8.106224060058594,
+ "learning_rate": 1.891680624296608e-05,
+ "loss": 0.9456,
+ "step": 6424
+ },
+ {
+ "epoch": 17.506811989100818,
+ "grad_norm": 14.495341300964355,
+ "learning_rate": 1.891640673374997e-05,
+ "loss": 1.0131,
+ "step": 6425
+ },
+ {
+ "epoch": 17.509536784741144,
+ "grad_norm": 9.03091049194336,
+ "learning_rate": 1.8916007155093168e-05,
+ "loss": 0.9318,
+ "step": 6426
+ },
+ {
+ "epoch": 17.51226158038147,
+ "grad_norm": 9.570588111877441,
+ "learning_rate": 1.8915607506998796e-05,
+ "loss": 1.0874,
+ "step": 6427
+ },
+ {
+ "epoch": 17.5149863760218,
+ "grad_norm": 13.135885238647461,
+ "learning_rate": 1.8915207789469954e-05,
+ "loss": 0.9535,
+ "step": 6428
+ },
+ {
+ "epoch": 17.517711171662125,
+ "grad_norm": 7.8600664138793945,
+ "learning_rate": 1.891480800250976e-05,
+ "loss": 0.8834,
+ "step": 6429
+ },
+ {
+ "epoch": 17.520435967302454,
+ "grad_norm": 12.449604034423828,
+ "learning_rate": 1.8914408146121333e-05,
+ "loss": 0.9648,
+ "step": 6430
+ },
+ {
+ "epoch": 17.52316076294278,
+ "grad_norm": 8.533634185791016,
+ "learning_rate": 1.891400822030778e-05,
+ "loss": 1.0886,
+ "step": 6431
+ },
+ {
+ "epoch": 17.525885558583106,
+ "grad_norm": 9.208283424377441,
+ "learning_rate": 1.891360822507222e-05,
+ "loss": 0.9509,
+ "step": 6432
+ },
+ {
+ "epoch": 17.52861035422343,
+ "grad_norm": 8.09561824798584,
+ "learning_rate": 1.8913208160417763e-05,
+ "loss": 0.9425,
+ "step": 6433
+ },
+ {
+ "epoch": 17.53133514986376,
+ "grad_norm": 10.107198715209961,
+ "learning_rate": 1.8912808026347527e-05,
+ "loss": 0.9836,
+ "step": 6434
+ },
+ {
+ "epoch": 17.534059945504087,
+ "grad_norm": 8.906506538391113,
+ "learning_rate": 1.8912407822864632e-05,
+ "loss": 0.8306,
+ "step": 6435
+ },
+ {
+ "epoch": 17.536784741144416,
+ "grad_norm": 8.324662208557129,
+ "learning_rate": 1.891200754997219e-05,
+ "loss": 0.9647,
+ "step": 6436
+ },
+ {
+ "epoch": 17.539509536784742,
+ "grad_norm": 6.878514289855957,
+ "learning_rate": 1.8911607207673318e-05,
+ "loss": 0.7291,
+ "step": 6437
+ },
+ {
+ "epoch": 17.542234332425068,
+ "grad_norm": 9.264095306396484,
+ "learning_rate": 1.891120679597114e-05,
+ "loss": 1.0203,
+ "step": 6438
+ },
+ {
+ "epoch": 17.544959128065393,
+ "grad_norm": 10.99022102355957,
+ "learning_rate": 1.891080631486877e-05,
+ "loss": 0.9336,
+ "step": 6439
+ },
+ {
+ "epoch": 17.547683923705723,
+ "grad_norm": 9.272268295288086,
+ "learning_rate": 1.8910405764369326e-05,
+ "loss": 1.0581,
+ "step": 6440
+ },
+ {
+ "epoch": 17.55040871934605,
+ "grad_norm": 10.952085494995117,
+ "learning_rate": 1.891000514447593e-05,
+ "loss": 0.8505,
+ "step": 6441
+ },
+ {
+ "epoch": 17.553133514986374,
+ "grad_norm": 8.9260892868042,
+ "learning_rate": 1.8909604455191698e-05,
+ "loss": 0.7598,
+ "step": 6442
+ },
+ {
+ "epoch": 17.555858310626704,
+ "grad_norm": 9.91944408416748,
+ "learning_rate": 1.8909203696519753e-05,
+ "loss": 0.9639,
+ "step": 6443
+ },
+ {
+ "epoch": 17.55858310626703,
+ "grad_norm": 10.126349449157715,
+ "learning_rate": 1.890880286846322e-05,
+ "loss": 1.0109,
+ "step": 6444
+ },
+ {
+ "epoch": 17.561307901907355,
+ "grad_norm": 7.965224742889404,
+ "learning_rate": 1.8908401971025214e-05,
+ "loss": 0.7958,
+ "step": 6445
+ },
+ {
+ "epoch": 17.564032697547685,
+ "grad_norm": 9.00943374633789,
+ "learning_rate": 1.890800100420886e-05,
+ "loss": 0.8862,
+ "step": 6446
+ },
+ {
+ "epoch": 17.56675749318801,
+ "grad_norm": 12.013262748718262,
+ "learning_rate": 1.8907599968017284e-05,
+ "loss": 0.9553,
+ "step": 6447
+ },
+ {
+ "epoch": 17.569482288828336,
+ "grad_norm": 8.990498542785645,
+ "learning_rate": 1.8907198862453604e-05,
+ "loss": 1.1107,
+ "step": 6448
+ },
+ {
+ "epoch": 17.572207084468666,
+ "grad_norm": 9.534433364868164,
+ "learning_rate": 1.8906797687520944e-05,
+ "loss": 0.9305,
+ "step": 6449
+ },
+ {
+ "epoch": 17.57493188010899,
+ "grad_norm": 8.413612365722656,
+ "learning_rate": 1.8906396443222436e-05,
+ "loss": 0.8855,
+ "step": 6450
+ },
+ {
+ "epoch": 17.577656675749317,
+ "grad_norm": 9.258137702941895,
+ "learning_rate": 1.8905995129561195e-05,
+ "loss": 1.0669,
+ "step": 6451
+ },
+ {
+ "epoch": 17.580381471389646,
+ "grad_norm": 8.99902057647705,
+ "learning_rate": 1.890559374654035e-05,
+ "loss": 0.9724,
+ "step": 6452
+ },
+ {
+ "epoch": 17.583106267029972,
+ "grad_norm": 8.523558616638184,
+ "learning_rate": 1.8905192294163028e-05,
+ "loss": 0.8833,
+ "step": 6453
+ },
+ {
+ "epoch": 17.585831062670298,
+ "grad_norm": 8.714370727539062,
+ "learning_rate": 1.8904790772432355e-05,
+ "loss": 1.0326,
+ "step": 6454
+ },
+ {
+ "epoch": 17.588555858310627,
+ "grad_norm": 10.08273696899414,
+ "learning_rate": 1.890438918135146e-05,
+ "loss": 1.0527,
+ "step": 6455
+ },
+ {
+ "epoch": 17.591280653950953,
+ "grad_norm": 8.469697952270508,
+ "learning_rate": 1.8903987520923465e-05,
+ "loss": 0.9312,
+ "step": 6456
+ },
+ {
+ "epoch": 17.59400544959128,
+ "grad_norm": 8.257137298583984,
+ "learning_rate": 1.8903585791151506e-05,
+ "loss": 0.998,
+ "step": 6457
+ },
+ {
+ "epoch": 17.59673024523161,
+ "grad_norm": 8.074660301208496,
+ "learning_rate": 1.8903183992038705e-05,
+ "loss": 0.8622,
+ "step": 6458
+ },
+ {
+ "epoch": 17.599455040871934,
+ "grad_norm": 18.93331527709961,
+ "learning_rate": 1.8902782123588194e-05,
+ "loss": 1.0923,
+ "step": 6459
+ },
+ {
+ "epoch": 17.60217983651226,
+ "grad_norm": 6.862919807434082,
+ "learning_rate": 1.8902380185803103e-05,
+ "loss": 0.8423,
+ "step": 6460
+ },
+ {
+ "epoch": 17.60490463215259,
+ "grad_norm": 6.449989318847656,
+ "learning_rate": 1.8901978178686563e-05,
+ "loss": 0.962,
+ "step": 6461
+ },
+ {
+ "epoch": 17.607629427792915,
+ "grad_norm": 7.540862083435059,
+ "learning_rate": 1.8901576102241698e-05,
+ "loss": 0.9778,
+ "step": 6462
+ },
+ {
+ "epoch": 17.61035422343324,
+ "grad_norm": 8.875688552856445,
+ "learning_rate": 1.890117395647165e-05,
+ "loss": 0.9824,
+ "step": 6463
+ },
+ {
+ "epoch": 17.61307901907357,
+ "grad_norm": 8.375256538391113,
+ "learning_rate": 1.8900771741379544e-05,
+ "loss": 1.0098,
+ "step": 6464
+ },
+ {
+ "epoch": 17.615803814713896,
+ "grad_norm": 9.36380386352539,
+ "learning_rate": 1.8900369456968513e-05,
+ "loss": 0.9539,
+ "step": 6465
+ },
+ {
+ "epoch": 17.618528610354222,
+ "grad_norm": 8.860440254211426,
+ "learning_rate": 1.8899967103241693e-05,
+ "loss": 0.8457,
+ "step": 6466
+ },
+ {
+ "epoch": 17.62125340599455,
+ "grad_norm": 7.205599784851074,
+ "learning_rate": 1.8899564680202215e-05,
+ "loss": 1.0072,
+ "step": 6467
+ },
+ {
+ "epoch": 17.623978201634877,
+ "grad_norm": 9.090911865234375,
+ "learning_rate": 1.8899162187853215e-05,
+ "loss": 0.9652,
+ "step": 6468
+ },
+ {
+ "epoch": 17.626702997275203,
+ "grad_norm": 11.18416976928711,
+ "learning_rate": 1.889875962619782e-05,
+ "loss": 0.9319,
+ "step": 6469
+ },
+ {
+ "epoch": 17.629427792915532,
+ "grad_norm": 7.465579986572266,
+ "learning_rate": 1.889835699523918e-05,
+ "loss": 0.9143,
+ "step": 6470
+ },
+ {
+ "epoch": 17.632152588555858,
+ "grad_norm": 8.837275505065918,
+ "learning_rate": 1.889795429498042e-05,
+ "loss": 0.9601,
+ "step": 6471
+ },
+ {
+ "epoch": 17.634877384196184,
+ "grad_norm": 8.674745559692383,
+ "learning_rate": 1.8897551525424674e-05,
+ "loss": 0.9813,
+ "step": 6472
+ },
+ {
+ "epoch": 17.637602179836513,
+ "grad_norm": 7.9291839599609375,
+ "learning_rate": 1.889714868657509e-05,
+ "loss": 0.9471,
+ "step": 6473
+ },
+ {
+ "epoch": 17.64032697547684,
+ "grad_norm": 9.651131629943848,
+ "learning_rate": 1.8896745778434793e-05,
+ "loss": 0.8705,
+ "step": 6474
+ },
+ {
+ "epoch": 17.643051771117165,
+ "grad_norm": 7.559269428253174,
+ "learning_rate": 1.8896342801006927e-05,
+ "loss": 0.8284,
+ "step": 6475
+ },
+ {
+ "epoch": 17.645776566757494,
+ "grad_norm": 10.888666152954102,
+ "learning_rate": 1.8895939754294627e-05,
+ "loss": 0.8474,
+ "step": 6476
+ },
+ {
+ "epoch": 17.64850136239782,
+ "grad_norm": 8.872111320495605,
+ "learning_rate": 1.889553663830104e-05,
+ "loss": 0.9799,
+ "step": 6477
+ },
+ {
+ "epoch": 17.651226158038146,
+ "grad_norm": 11.895491600036621,
+ "learning_rate": 1.88951334530293e-05,
+ "loss": 1.1519,
+ "step": 6478
+ },
+ {
+ "epoch": 17.653950953678475,
+ "grad_norm": 17.710891723632812,
+ "learning_rate": 1.8894730198482543e-05,
+ "loss": 1.0701,
+ "step": 6479
+ },
+ {
+ "epoch": 17.6566757493188,
+ "grad_norm": 8.096800804138184,
+ "learning_rate": 1.889432687466391e-05,
+ "loss": 0.7501,
+ "step": 6480
+ },
+ {
+ "epoch": 17.659400544959126,
+ "grad_norm": 9.141026496887207,
+ "learning_rate": 1.8893923481576555e-05,
+ "loss": 0.9192,
+ "step": 6481
+ },
+ {
+ "epoch": 17.662125340599456,
+ "grad_norm": 8.910099029541016,
+ "learning_rate": 1.8893520019223605e-05,
+ "loss": 0.9043,
+ "step": 6482
+ },
+ {
+ "epoch": 17.66485013623978,
+ "grad_norm": 8.54745101928711,
+ "learning_rate": 1.889311648760821e-05,
+ "loss": 1.0664,
+ "step": 6483
+ },
+ {
+ "epoch": 17.667574931880107,
+ "grad_norm": 7.215934753417969,
+ "learning_rate": 1.8892712886733506e-05,
+ "loss": 1.1074,
+ "step": 6484
+ },
+ {
+ "epoch": 17.670299727520437,
+ "grad_norm": 10.302400588989258,
+ "learning_rate": 1.8892309216602642e-05,
+ "loss": 0.9835,
+ "step": 6485
+ },
+ {
+ "epoch": 17.673024523160763,
+ "grad_norm": 7.602528095245361,
+ "learning_rate": 1.889190547721876e-05,
+ "loss": 0.9707,
+ "step": 6486
+ },
+ {
+ "epoch": 17.67574931880109,
+ "grad_norm": 9.652894020080566,
+ "learning_rate": 1.8891501668585006e-05,
+ "loss": 0.9296,
+ "step": 6487
+ },
+ {
+ "epoch": 17.678474114441418,
+ "grad_norm": 7.052173614501953,
+ "learning_rate": 1.8891097790704522e-05,
+ "loss": 0.9863,
+ "step": 6488
+ },
+ {
+ "epoch": 17.681198910081743,
+ "grad_norm": 9.30596923828125,
+ "learning_rate": 1.8890693843580454e-05,
+ "loss": 0.8997,
+ "step": 6489
+ },
+ {
+ "epoch": 17.68392370572207,
+ "grad_norm": 11.857169151306152,
+ "learning_rate": 1.8890289827215952e-05,
+ "loss": 1.0737,
+ "step": 6490
+ },
+ {
+ "epoch": 17.6866485013624,
+ "grad_norm": 11.911252975463867,
+ "learning_rate": 1.8889885741614153e-05,
+ "loss": 1.144,
+ "step": 6491
+ },
+ {
+ "epoch": 17.689373297002724,
+ "grad_norm": 8.49942398071289,
+ "learning_rate": 1.8889481586778212e-05,
+ "loss": 1.0328,
+ "step": 6492
+ },
+ {
+ "epoch": 17.69209809264305,
+ "grad_norm": 7.845510959625244,
+ "learning_rate": 1.8889077362711277e-05,
+ "loss": 0.7596,
+ "step": 6493
+ },
+ {
+ "epoch": 17.69482288828338,
+ "grad_norm": 11.397034645080566,
+ "learning_rate": 1.888867306941649e-05,
+ "loss": 1.0274,
+ "step": 6494
+ },
+ {
+ "epoch": 17.697547683923705,
+ "grad_norm": 9.5137357711792,
+ "learning_rate": 1.8888268706897007e-05,
+ "loss": 1.0266,
+ "step": 6495
+ },
+ {
+ "epoch": 17.70027247956403,
+ "grad_norm": 8.97117805480957,
+ "learning_rate": 1.888786427515597e-05,
+ "loss": 0.8964,
+ "step": 6496
+ },
+ {
+ "epoch": 17.70299727520436,
+ "grad_norm": 8.997941970825195,
+ "learning_rate": 1.8887459774196536e-05,
+ "loss": 1.072,
+ "step": 6497
+ },
+ {
+ "epoch": 17.705722070844686,
+ "grad_norm": 7.437220573425293,
+ "learning_rate": 1.888705520402185e-05,
+ "loss": 0.8298,
+ "step": 6498
+ },
+ {
+ "epoch": 17.708446866485012,
+ "grad_norm": 7.677548408508301,
+ "learning_rate": 1.888665056463506e-05,
+ "loss": 1.0582,
+ "step": 6499
+ },
+ {
+ "epoch": 17.71117166212534,
+ "grad_norm": 8.739337921142578,
+ "learning_rate": 1.888624585603933e-05,
+ "loss": 0.9309,
+ "step": 6500
+ },
+ {
+ "epoch": 17.713896457765667,
+ "grad_norm": 10.512234687805176,
+ "learning_rate": 1.888584107823779e-05,
+ "loss": 0.9874,
+ "step": 6501
+ },
+ {
+ "epoch": 17.716621253405993,
+ "grad_norm": 9.074308395385742,
+ "learning_rate": 1.8885436231233617e-05,
+ "loss": 1.1477,
+ "step": 6502
+ },
+ {
+ "epoch": 17.719346049046322,
+ "grad_norm": 9.153244972229004,
+ "learning_rate": 1.888503131502995e-05,
+ "loss": 0.9447,
+ "step": 6503
+ },
+ {
+ "epoch": 17.722070844686648,
+ "grad_norm": 8.506519317626953,
+ "learning_rate": 1.8884626329629942e-05,
+ "loss": 1.1488,
+ "step": 6504
+ },
+ {
+ "epoch": 17.724795640326974,
+ "grad_norm": 11.738155364990234,
+ "learning_rate": 1.8884221275036753e-05,
+ "loss": 0.743,
+ "step": 6505
+ },
+ {
+ "epoch": 17.727520435967303,
+ "grad_norm": 7.9107489585876465,
+ "learning_rate": 1.8883816151253532e-05,
+ "loss": 0.8867,
+ "step": 6506
+ },
+ {
+ "epoch": 17.73024523160763,
+ "grad_norm": 7.033042907714844,
+ "learning_rate": 1.888341095828344e-05,
+ "loss": 0.9698,
+ "step": 6507
+ },
+ {
+ "epoch": 17.732970027247955,
+ "grad_norm": 10.325312614440918,
+ "learning_rate": 1.888300569612963e-05,
+ "loss": 0.9685,
+ "step": 6508
+ },
+ {
+ "epoch": 17.735694822888284,
+ "grad_norm": 8.544760704040527,
+ "learning_rate": 1.8882600364795255e-05,
+ "loss": 1.1158,
+ "step": 6509
+ },
+ {
+ "epoch": 17.73841961852861,
+ "grad_norm": 8.458165168762207,
+ "learning_rate": 1.8882194964283473e-05,
+ "loss": 0.7937,
+ "step": 6510
+ },
+ {
+ "epoch": 17.741144414168936,
+ "grad_norm": 7.65460205078125,
+ "learning_rate": 1.888178949459745e-05,
+ "loss": 0.7695,
+ "step": 6511
+ },
+ {
+ "epoch": 17.743869209809265,
+ "grad_norm": 17.94519805908203,
+ "learning_rate": 1.8881383955740324e-05,
+ "loss": 1.012,
+ "step": 6512
+ },
+ {
+ "epoch": 17.74659400544959,
+ "grad_norm": 8.303767204284668,
+ "learning_rate": 1.8880978347715272e-05,
+ "loss": 0.8011,
+ "step": 6513
+ },
+ {
+ "epoch": 17.749318801089917,
+ "grad_norm": 9.062012672424316,
+ "learning_rate": 1.888057267052545e-05,
+ "loss": 0.9065,
+ "step": 6514
+ },
+ {
+ "epoch": 17.752043596730246,
+ "grad_norm": 9.889007568359375,
+ "learning_rate": 1.888016692417401e-05,
+ "loss": 0.9719,
+ "step": 6515
+ },
+ {
+ "epoch": 17.754768392370572,
+ "grad_norm": 9.427414894104004,
+ "learning_rate": 1.8879761108664114e-05,
+ "loss": 0.9438,
+ "step": 6516
+ },
+ {
+ "epoch": 17.757493188010898,
+ "grad_norm": 12.378963470458984,
+ "learning_rate": 1.8879355223998928e-05,
+ "loss": 0.8348,
+ "step": 6517
+ },
+ {
+ "epoch": 17.760217983651227,
+ "grad_norm": 7.321284770965576,
+ "learning_rate": 1.8878949270181606e-05,
+ "loss": 0.9183,
+ "step": 6518
+ },
+ {
+ "epoch": 17.762942779291553,
+ "grad_norm": 12.255606651306152,
+ "learning_rate": 1.8878543247215314e-05,
+ "loss": 1.0635,
+ "step": 6519
+ },
+ {
+ "epoch": 17.76566757493188,
+ "grad_norm": 7.989128589630127,
+ "learning_rate": 1.8878137155103214e-05,
+ "loss": 0.8168,
+ "step": 6520
+ },
+ {
+ "epoch": 17.768392370572208,
+ "grad_norm": 7.796993732452393,
+ "learning_rate": 1.887773099384847e-05,
+ "loss": 0.8943,
+ "step": 6521
+ },
+ {
+ "epoch": 17.771117166212534,
+ "grad_norm": 9.63947582244873,
+ "learning_rate": 1.887732476345424e-05,
+ "loss": 1.1299,
+ "step": 6522
+ },
+ {
+ "epoch": 17.77384196185286,
+ "grad_norm": 9.127558708190918,
+ "learning_rate": 1.887691846392369e-05,
+ "loss": 0.9191,
+ "step": 6523
+ },
+ {
+ "epoch": 17.77656675749319,
+ "grad_norm": 6.981589317321777,
+ "learning_rate": 1.8876512095259986e-05,
+ "loss": 0.7831,
+ "step": 6524
+ },
+ {
+ "epoch": 17.779291553133515,
+ "grad_norm": 10.201642036437988,
+ "learning_rate": 1.8876105657466287e-05,
+ "loss": 0.8218,
+ "step": 6525
+ },
+ {
+ "epoch": 17.78201634877384,
+ "grad_norm": 7.945437908172607,
+ "learning_rate": 1.8875699150545768e-05,
+ "loss": 0.9926,
+ "step": 6526
+ },
+ {
+ "epoch": 17.78474114441417,
+ "grad_norm": 13.129316329956055,
+ "learning_rate": 1.887529257450159e-05,
+ "loss": 1.011,
+ "step": 6527
+ },
+ {
+ "epoch": 17.787465940054496,
+ "grad_norm": 7.099358558654785,
+ "learning_rate": 1.8874885929336916e-05,
+ "loss": 0.9521,
+ "step": 6528
+ },
+ {
+ "epoch": 17.79019073569482,
+ "grad_norm": 8.41981029510498,
+ "learning_rate": 1.8874479215054916e-05,
+ "loss": 0.8042,
+ "step": 6529
+ },
+ {
+ "epoch": 17.79291553133515,
+ "grad_norm": 7.612015247344971,
+ "learning_rate": 1.887407243165876e-05,
+ "loss": 1.0214,
+ "step": 6530
+ },
+ {
+ "epoch": 17.795640326975477,
+ "grad_norm": 7.234619140625,
+ "learning_rate": 1.887366557915161e-05,
+ "loss": 1.1766,
+ "step": 6531
+ },
+ {
+ "epoch": 17.798365122615802,
+ "grad_norm": 10.151055335998535,
+ "learning_rate": 1.8873258657536643e-05,
+ "loss": 0.7668,
+ "step": 6532
+ },
+ {
+ "epoch": 17.80108991825613,
+ "grad_norm": 11.343910217285156,
+ "learning_rate": 1.8872851666817017e-05,
+ "loss": 0.9978,
+ "step": 6533
+ },
+ {
+ "epoch": 17.803814713896458,
+ "grad_norm": 7.596022605895996,
+ "learning_rate": 1.8872444606995915e-05,
+ "loss": 0.8854,
+ "step": 6534
+ },
+ {
+ "epoch": 17.806539509536783,
+ "grad_norm": 11.584070205688477,
+ "learning_rate": 1.8872037478076494e-05,
+ "loss": 1.0798,
+ "step": 6535
+ },
+ {
+ "epoch": 17.809264305177113,
+ "grad_norm": 11.176453590393066,
+ "learning_rate": 1.8871630280061933e-05,
+ "loss": 0.9156,
+ "step": 6536
+ },
+ {
+ "epoch": 17.81198910081744,
+ "grad_norm": 7.551270961761475,
+ "learning_rate": 1.8871223012955402e-05,
+ "loss": 0.813,
+ "step": 6537
+ },
+ {
+ "epoch": 17.814713896457764,
+ "grad_norm": 7.892640113830566,
+ "learning_rate": 1.887081567676007e-05,
+ "loss": 0.7803,
+ "step": 6538
+ },
+ {
+ "epoch": 17.817438692098094,
+ "grad_norm": 8.432889938354492,
+ "learning_rate": 1.887040827147911e-05,
+ "loss": 1.0027,
+ "step": 6539
+ },
+ {
+ "epoch": 17.82016348773842,
+ "grad_norm": 10.599292755126953,
+ "learning_rate": 1.88700007971157e-05,
+ "loss": 0.9885,
+ "step": 6540
+ },
+ {
+ "epoch": 17.822888283378745,
+ "grad_norm": 13.277148246765137,
+ "learning_rate": 1.8869593253673005e-05,
+ "loss": 0.8337,
+ "step": 6541
+ },
+ {
+ "epoch": 17.825613079019075,
+ "grad_norm": 10.260055541992188,
+ "learning_rate": 1.8869185641154204e-05,
+ "loss": 1.01,
+ "step": 6542
+ },
+ {
+ "epoch": 17.8283378746594,
+ "grad_norm": 11.372323989868164,
+ "learning_rate": 1.8868777959562472e-05,
+ "loss": 1.0792,
+ "step": 6543
+ },
+ {
+ "epoch": 17.831062670299726,
+ "grad_norm": 9.509187698364258,
+ "learning_rate": 1.886837020890098e-05,
+ "loss": 0.9797,
+ "step": 6544
+ },
+ {
+ "epoch": 17.833787465940055,
+ "grad_norm": 7.478908538818359,
+ "learning_rate": 1.8867962389172912e-05,
+ "loss": 0.8768,
+ "step": 6545
+ },
+ {
+ "epoch": 17.83651226158038,
+ "grad_norm": 7.537795543670654,
+ "learning_rate": 1.8867554500381433e-05,
+ "loss": 0.9341,
+ "step": 6546
+ },
+ {
+ "epoch": 17.839237057220707,
+ "grad_norm": 6.650048732757568,
+ "learning_rate": 1.886714654252973e-05,
+ "loss": 0.697,
+ "step": 6547
+ },
+ {
+ "epoch": 17.841961852861036,
+ "grad_norm": 8.197768211364746,
+ "learning_rate": 1.886673851562097e-05,
+ "loss": 0.8198,
+ "step": 6548
+ },
+ {
+ "epoch": 17.844686648501362,
+ "grad_norm": 7.36025333404541,
+ "learning_rate": 1.8866330419658338e-05,
+ "loss": 1.0024,
+ "step": 6549
+ },
+ {
+ "epoch": 17.847411444141688,
+ "grad_norm": 7.918854236602783,
+ "learning_rate": 1.8865922254645008e-05,
+ "loss": 0.9758,
+ "step": 6550
+ },
+ {
+ "epoch": 17.850136239782017,
+ "grad_norm": 11.31563663482666,
+ "learning_rate": 1.8865514020584164e-05,
+ "loss": 1.0156,
+ "step": 6551
+ },
+ {
+ "epoch": 17.852861035422343,
+ "grad_norm": 9.666770935058594,
+ "learning_rate": 1.886510571747898e-05,
+ "loss": 1.0446,
+ "step": 6552
+ },
+ {
+ "epoch": 17.85558583106267,
+ "grad_norm": 10.833832740783691,
+ "learning_rate": 1.886469734533264e-05,
+ "loss": 0.8052,
+ "step": 6553
+ },
+ {
+ "epoch": 17.858310626703,
+ "grad_norm": 9.465039253234863,
+ "learning_rate": 1.886428890414832e-05,
+ "loss": 0.9031,
+ "step": 6554
+ },
+ {
+ "epoch": 17.861035422343324,
+ "grad_norm": 12.025474548339844,
+ "learning_rate": 1.8863880393929202e-05,
+ "loss": 0.8853,
+ "step": 6555
+ },
+ {
+ "epoch": 17.86376021798365,
+ "grad_norm": 9.478365898132324,
+ "learning_rate": 1.8863471814678475e-05,
+ "loss": 0.9048,
+ "step": 6556
+ },
+ {
+ "epoch": 17.86648501362398,
+ "grad_norm": 8.645143508911133,
+ "learning_rate": 1.886306316639931e-05,
+ "loss": 0.9694,
+ "step": 6557
+ },
+ {
+ "epoch": 17.869209809264305,
+ "grad_norm": 9.461164474487305,
+ "learning_rate": 1.8862654449094892e-05,
+ "loss": 0.9735,
+ "step": 6558
+ },
+ {
+ "epoch": 17.87193460490463,
+ "grad_norm": 7.370994567871094,
+ "learning_rate": 1.886224566276841e-05,
+ "loss": 0.7737,
+ "step": 6559
+ },
+ {
+ "epoch": 17.87465940054496,
+ "grad_norm": 8.07332992553711,
+ "learning_rate": 1.8861836807423045e-05,
+ "loss": 0.8976,
+ "step": 6560
+ },
+ {
+ "epoch": 17.877384196185286,
+ "grad_norm": 8.453144073486328,
+ "learning_rate": 1.8861427883061977e-05,
+ "loss": 0.9255,
+ "step": 6561
+ },
+ {
+ "epoch": 17.88010899182561,
+ "grad_norm": 7.679013252258301,
+ "learning_rate": 1.8861018889688395e-05,
+ "loss": 0.7972,
+ "step": 6562
+ },
+ {
+ "epoch": 17.88283378746594,
+ "grad_norm": 9.931220054626465,
+ "learning_rate": 1.8860609827305487e-05,
+ "loss": 1.0492,
+ "step": 6563
+ },
+ {
+ "epoch": 17.885558583106267,
+ "grad_norm": 8.279606819152832,
+ "learning_rate": 1.886020069591643e-05,
+ "loss": 1.0369,
+ "step": 6564
+ },
+ {
+ "epoch": 17.888283378746593,
+ "grad_norm": 10.057707786560059,
+ "learning_rate": 1.885979149552442e-05,
+ "loss": 1.0364,
+ "step": 6565
+ },
+ {
+ "epoch": 17.891008174386922,
+ "grad_norm": 7.192422866821289,
+ "learning_rate": 1.8859382226132635e-05,
+ "loss": 0.9194,
+ "step": 6566
+ },
+ {
+ "epoch": 17.893732970027248,
+ "grad_norm": 9.681727409362793,
+ "learning_rate": 1.8858972887744268e-05,
+ "loss": 1.0321,
+ "step": 6567
+ },
+ {
+ "epoch": 17.896457765667574,
+ "grad_norm": 18.173507690429688,
+ "learning_rate": 1.8858563480362503e-05,
+ "loss": 0.9209,
+ "step": 6568
+ },
+ {
+ "epoch": 17.899182561307903,
+ "grad_norm": 8.38066291809082,
+ "learning_rate": 1.885815400399053e-05,
+ "loss": 0.908,
+ "step": 6569
+ },
+ {
+ "epoch": 17.90190735694823,
+ "grad_norm": 8.17420482635498,
+ "learning_rate": 1.885774445863154e-05,
+ "loss": 0.939,
+ "step": 6570
+ },
+ {
+ "epoch": 17.904632152588555,
+ "grad_norm": 7.61351203918457,
+ "learning_rate": 1.8857334844288723e-05,
+ "loss": 0.9016,
+ "step": 6571
+ },
+ {
+ "epoch": 17.907356948228884,
+ "grad_norm": 7.483287811279297,
+ "learning_rate": 1.8856925160965267e-05,
+ "loss": 0.9607,
+ "step": 6572
+ },
+ {
+ "epoch": 17.91008174386921,
+ "grad_norm": 8.12373161315918,
+ "learning_rate": 1.8856515408664363e-05,
+ "loss": 0.9045,
+ "step": 6573
+ },
+ {
+ "epoch": 17.912806539509535,
+ "grad_norm": 10.766953468322754,
+ "learning_rate": 1.88561055873892e-05,
+ "loss": 1.0854,
+ "step": 6574
+ },
+ {
+ "epoch": 17.915531335149865,
+ "grad_norm": 7.82476806640625,
+ "learning_rate": 1.8855695697142972e-05,
+ "loss": 1.0293,
+ "step": 6575
+ },
+ {
+ "epoch": 17.91825613079019,
+ "grad_norm": 13.205169677734375,
+ "learning_rate": 1.8855285737928874e-05,
+ "loss": 1.1251,
+ "step": 6576
+ },
+ {
+ "epoch": 17.920980926430516,
+ "grad_norm": 8.568056106567383,
+ "learning_rate": 1.8854875709750092e-05,
+ "loss": 0.9249,
+ "step": 6577
+ },
+ {
+ "epoch": 17.923705722070846,
+ "grad_norm": 9.343592643737793,
+ "learning_rate": 1.8854465612609828e-05,
+ "loss": 1.0399,
+ "step": 6578
+ },
+ {
+ "epoch": 17.92643051771117,
+ "grad_norm": 8.471595764160156,
+ "learning_rate": 1.8854055446511267e-05,
+ "loss": 0.7042,
+ "step": 6579
+ },
+ {
+ "epoch": 17.929155313351497,
+ "grad_norm": 8.00652027130127,
+ "learning_rate": 1.8853645211457606e-05,
+ "loss": 1.0095,
+ "step": 6580
+ },
+ {
+ "epoch": 17.931880108991827,
+ "grad_norm": 8.351338386535645,
+ "learning_rate": 1.8853234907452042e-05,
+ "loss": 1.0315,
+ "step": 6581
+ },
+ {
+ "epoch": 17.934604904632153,
+ "grad_norm": 9.317249298095703,
+ "learning_rate": 1.8852824534497772e-05,
+ "loss": 0.9215,
+ "step": 6582
+ },
+ {
+ "epoch": 17.93732970027248,
+ "grad_norm": 10.584437370300293,
+ "learning_rate": 1.8852414092597985e-05,
+ "loss": 0.7916,
+ "step": 6583
+ },
+ {
+ "epoch": 17.940054495912808,
+ "grad_norm": 6.993414402008057,
+ "learning_rate": 1.8852003581755886e-05,
+ "loss": 0.9595,
+ "step": 6584
+ },
+ {
+ "epoch": 17.942779291553133,
+ "grad_norm": 7.56000280380249,
+ "learning_rate": 1.8851593001974663e-05,
+ "loss": 0.8101,
+ "step": 6585
+ },
+ {
+ "epoch": 17.94550408719346,
+ "grad_norm": 9.294096946716309,
+ "learning_rate": 1.8851182353257524e-05,
+ "loss": 1.0363,
+ "step": 6586
+ },
+ {
+ "epoch": 17.94822888283379,
+ "grad_norm": 7.075156211853027,
+ "learning_rate": 1.885077163560766e-05,
+ "loss": 0.7717,
+ "step": 6587
+ },
+ {
+ "epoch": 17.950953678474114,
+ "grad_norm": 8.787549018859863,
+ "learning_rate": 1.885036084902827e-05,
+ "loss": 0.8955,
+ "step": 6588
+ },
+ {
+ "epoch": 17.95367847411444,
+ "grad_norm": 9.324135780334473,
+ "learning_rate": 1.8849949993522557e-05,
+ "loss": 1.0061,
+ "step": 6589
+ },
+ {
+ "epoch": 17.95640326975477,
+ "grad_norm": 12.604859352111816,
+ "learning_rate": 1.8849539069093717e-05,
+ "loss": 0.9661,
+ "step": 6590
+ },
+ {
+ "epoch": 17.959128065395095,
+ "grad_norm": 8.067110061645508,
+ "learning_rate": 1.884912807574495e-05,
+ "loss": 0.9313,
+ "step": 6591
+ },
+ {
+ "epoch": 17.96185286103542,
+ "grad_norm": 8.262900352478027,
+ "learning_rate": 1.884871701347946e-05,
+ "loss": 0.9541,
+ "step": 6592
+ },
+ {
+ "epoch": 17.96457765667575,
+ "grad_norm": 9.744215965270996,
+ "learning_rate": 1.884830588230045e-05,
+ "loss": 0.989,
+ "step": 6593
+ },
+ {
+ "epoch": 17.967302452316076,
+ "grad_norm": 7.75123405456543,
+ "learning_rate": 1.8847894682211113e-05,
+ "loss": 0.9637,
+ "step": 6594
+ },
+ {
+ "epoch": 17.970027247956402,
+ "grad_norm": 8.812027931213379,
+ "learning_rate": 1.884748341321466e-05,
+ "loss": 0.925,
+ "step": 6595
+ },
+ {
+ "epoch": 17.97275204359673,
+ "grad_norm": 7.7459588050842285,
+ "learning_rate": 1.8847072075314288e-05,
+ "loss": 0.9319,
+ "step": 6596
+ },
+ {
+ "epoch": 17.975476839237057,
+ "grad_norm": 8.137155532836914,
+ "learning_rate": 1.8846660668513206e-05,
+ "loss": 0.8538,
+ "step": 6597
+ },
+ {
+ "epoch": 17.978201634877383,
+ "grad_norm": 10.407999992370605,
+ "learning_rate": 1.8846249192814613e-05,
+ "loss": 1.0244,
+ "step": 6598
+ },
+ {
+ "epoch": 17.980926430517712,
+ "grad_norm": 8.504861831665039,
+ "learning_rate": 1.884583764822172e-05,
+ "loss": 0.8186,
+ "step": 6599
+ },
+ {
+ "epoch": 17.983651226158038,
+ "grad_norm": 8.649380683898926,
+ "learning_rate": 1.8845426034737724e-05,
+ "loss": 0.7762,
+ "step": 6600
+ },
+ {
+ "epoch": 17.986376021798364,
+ "grad_norm": 7.561326503753662,
+ "learning_rate": 1.8845014352365836e-05,
+ "loss": 0.8407,
+ "step": 6601
+ },
+ {
+ "epoch": 17.989100817438693,
+ "grad_norm": 7.720953464508057,
+ "learning_rate": 1.8844602601109265e-05,
+ "loss": 0.9877,
+ "step": 6602
+ },
+ {
+ "epoch": 17.99182561307902,
+ "grad_norm": 9.713851928710938,
+ "learning_rate": 1.884419078097121e-05,
+ "loss": 1.0118,
+ "step": 6603
+ },
+ {
+ "epoch": 17.994550408719345,
+ "grad_norm": 8.336447715759277,
+ "learning_rate": 1.8843778891954883e-05,
+ "loss": 0.8303,
+ "step": 6604
+ },
+ {
+ "epoch": 17.997275204359674,
+ "grad_norm": 8.688618659973145,
+ "learning_rate": 1.884336693406349e-05,
+ "loss": 1.0134,
+ "step": 6605
+ },
+ {
+ "epoch": 18.0,
+ "grad_norm": 12.853461265563965,
+ "learning_rate": 1.8842954907300236e-05,
+ "loss": 1.071,
+ "step": 6606
+ },
+ {
+ "epoch": 18.002724795640326,
+ "grad_norm": 7.621571063995361,
+ "learning_rate": 1.884254281166834e-05,
+ "loss": 0.8401,
+ "step": 6607
+ },
+ {
+ "epoch": 18.005449591280655,
+ "grad_norm": 6.969585418701172,
+ "learning_rate": 1.8842130647171003e-05,
+ "loss": 0.7584,
+ "step": 6608
+ },
+ {
+ "epoch": 18.00817438692098,
+ "grad_norm": 9.190740585327148,
+ "learning_rate": 1.8841718413811433e-05,
+ "loss": 0.9208,
+ "step": 6609
+ },
+ {
+ "epoch": 18.010899182561307,
+ "grad_norm": 7.002579689025879,
+ "learning_rate": 1.884130611159285e-05,
+ "loss": 0.8711,
+ "step": 6610
+ },
+ {
+ "epoch": 18.013623978201636,
+ "grad_norm": 9.554093360900879,
+ "learning_rate": 1.8840893740518458e-05,
+ "loss": 0.8696,
+ "step": 6611
+ },
+ {
+ "epoch": 18.016348773841962,
+ "grad_norm": 7.839029788970947,
+ "learning_rate": 1.8840481300591473e-05,
+ "loss": 0.691,
+ "step": 6612
+ },
+ {
+ "epoch": 18.019073569482288,
+ "grad_norm": 9.62078857421875,
+ "learning_rate": 1.88400687918151e-05,
+ "loss": 1.0929,
+ "step": 6613
+ },
+ {
+ "epoch": 18.021798365122617,
+ "grad_norm": 8.053839683532715,
+ "learning_rate": 1.8839656214192557e-05,
+ "loss": 0.7987,
+ "step": 6614
+ },
+ {
+ "epoch": 18.024523160762943,
+ "grad_norm": 7.5099663734436035,
+ "learning_rate": 1.8839243567727053e-05,
+ "loss": 0.8634,
+ "step": 6615
+ },
+ {
+ "epoch": 18.02724795640327,
+ "grad_norm": 7.961956024169922,
+ "learning_rate": 1.8838830852421807e-05,
+ "loss": 0.816,
+ "step": 6616
+ },
+ {
+ "epoch": 18.029972752043598,
+ "grad_norm": 7.8157958984375,
+ "learning_rate": 1.8838418068280032e-05,
+ "loss": 0.7692,
+ "step": 6617
+ },
+ {
+ "epoch": 18.032697547683924,
+ "grad_norm": 8.519083976745605,
+ "learning_rate": 1.883800521530494e-05,
+ "loss": 0.8165,
+ "step": 6618
+ },
+ {
+ "epoch": 18.03542234332425,
+ "grad_norm": 8.912421226501465,
+ "learning_rate": 1.8837592293499747e-05,
+ "loss": 0.8987,
+ "step": 6619
+ },
+ {
+ "epoch": 18.03814713896458,
+ "grad_norm": 7.688618183135986,
+ "learning_rate": 1.883717930286767e-05,
+ "loss": 0.8966,
+ "step": 6620
+ },
+ {
+ "epoch": 18.040871934604905,
+ "grad_norm": 8.02383804321289,
+ "learning_rate": 1.8836766243411932e-05,
+ "loss": 0.8664,
+ "step": 6621
+ },
+ {
+ "epoch": 18.04359673024523,
+ "grad_norm": 7.162313461303711,
+ "learning_rate": 1.8836353115135735e-05,
+ "loss": 0.764,
+ "step": 6622
+ },
+ {
+ "epoch": 18.04632152588556,
+ "grad_norm": 8.650481224060059,
+ "learning_rate": 1.8835939918042308e-05,
+ "loss": 0.8461,
+ "step": 6623
+ },
+ {
+ "epoch": 18.049046321525886,
+ "grad_norm": 9.792577743530273,
+ "learning_rate": 1.883552665213486e-05,
+ "loss": 0.903,
+ "step": 6624
+ },
+ {
+ "epoch": 18.05177111716621,
+ "grad_norm": 9.125471115112305,
+ "learning_rate": 1.883511331741662e-05,
+ "loss": 0.837,
+ "step": 6625
+ },
+ {
+ "epoch": 18.05449591280654,
+ "grad_norm": 7.903054237365723,
+ "learning_rate": 1.88346999138908e-05,
+ "loss": 0.7997,
+ "step": 6626
+ },
+ {
+ "epoch": 18.057220708446867,
+ "grad_norm": 7.64015007019043,
+ "learning_rate": 1.8834286441560622e-05,
+ "loss": 0.8661,
+ "step": 6627
+ },
+ {
+ "epoch": 18.059945504087192,
+ "grad_norm": 7.844747543334961,
+ "learning_rate": 1.8833872900429307e-05,
+ "loss": 1.0045,
+ "step": 6628
+ },
+ {
+ "epoch": 18.06267029972752,
+ "grad_norm": 7.97361946105957,
+ "learning_rate": 1.8833459290500073e-05,
+ "loss": 0.8038,
+ "step": 6629
+ },
+ {
+ "epoch": 18.065395095367847,
+ "grad_norm": 8.794074058532715,
+ "learning_rate": 1.8833045611776143e-05,
+ "loss": 1.0504,
+ "step": 6630
+ },
+ {
+ "epoch": 18.068119891008173,
+ "grad_norm": 7.852278709411621,
+ "learning_rate": 1.883263186426073e-05,
+ "loss": 0.8947,
+ "step": 6631
+ },
+ {
+ "epoch": 18.070844686648503,
+ "grad_norm": 9.553807258605957,
+ "learning_rate": 1.8832218047957072e-05,
+ "loss": 0.7778,
+ "step": 6632
+ },
+ {
+ "epoch": 18.07356948228883,
+ "grad_norm": 8.006525039672852,
+ "learning_rate": 1.883180416286839e-05,
+ "loss": 0.936,
+ "step": 6633
+ },
+ {
+ "epoch": 18.076294277929154,
+ "grad_norm": 8.542932510375977,
+ "learning_rate": 1.8831390208997892e-05,
+ "loss": 0.6926,
+ "step": 6634
+ },
+ {
+ "epoch": 18.079019073569484,
+ "grad_norm": 7.582610130310059,
+ "learning_rate": 1.883097618634881e-05,
+ "loss": 0.7317,
+ "step": 6635
+ },
+ {
+ "epoch": 18.08174386920981,
+ "grad_norm": 7.989914894104004,
+ "learning_rate": 1.8830562094924375e-05,
+ "loss": 0.8495,
+ "step": 6636
+ },
+ {
+ "epoch": 18.084468664850135,
+ "grad_norm": 8.978856086730957,
+ "learning_rate": 1.8830147934727806e-05,
+ "loss": 0.8517,
+ "step": 6637
+ },
+ {
+ "epoch": 18.087193460490465,
+ "grad_norm": 8.952409744262695,
+ "learning_rate": 1.882973370576233e-05,
+ "loss": 0.8947,
+ "step": 6638
+ },
+ {
+ "epoch": 18.08991825613079,
+ "grad_norm": 7.963160037994385,
+ "learning_rate": 1.882931940803117e-05,
+ "loss": 0.7739,
+ "step": 6639
+ },
+ {
+ "epoch": 18.092643051771116,
+ "grad_norm": 8.281893730163574,
+ "learning_rate": 1.8828905041537556e-05,
+ "loss": 0.7975,
+ "step": 6640
+ },
+ {
+ "epoch": 18.095367847411445,
+ "grad_norm": 8.743407249450684,
+ "learning_rate": 1.882849060628471e-05,
+ "loss": 0.8799,
+ "step": 6641
+ },
+ {
+ "epoch": 18.09809264305177,
+ "grad_norm": 9.185464859008789,
+ "learning_rate": 1.882807610227587e-05,
+ "loss": 0.9502,
+ "step": 6642
+ },
+ {
+ "epoch": 18.100817438692097,
+ "grad_norm": 10.43502426147461,
+ "learning_rate": 1.882766152951425e-05,
+ "loss": 0.9673,
+ "step": 6643
+ },
+ {
+ "epoch": 18.103542234332426,
+ "grad_norm": 7.852787971496582,
+ "learning_rate": 1.882724688800309e-05,
+ "loss": 0.9082,
+ "step": 6644
+ },
+ {
+ "epoch": 18.106267029972752,
+ "grad_norm": 8.680418014526367,
+ "learning_rate": 1.8826832177745617e-05,
+ "loss": 0.9612,
+ "step": 6645
+ },
+ {
+ "epoch": 18.108991825613078,
+ "grad_norm": 11.557866096496582,
+ "learning_rate": 1.882641739874506e-05,
+ "loss": 0.8992,
+ "step": 6646
+ },
+ {
+ "epoch": 18.111716621253407,
+ "grad_norm": 9.403258323669434,
+ "learning_rate": 1.882600255100464e-05,
+ "loss": 0.8704,
+ "step": 6647
+ },
+ {
+ "epoch": 18.114441416893733,
+ "grad_norm": 6.144392013549805,
+ "learning_rate": 1.8825587634527603e-05,
+ "loss": 0.8552,
+ "step": 6648
+ },
+ {
+ "epoch": 18.11716621253406,
+ "grad_norm": 7.077390670776367,
+ "learning_rate": 1.8825172649317172e-05,
+ "loss": 0.8794,
+ "step": 6649
+ },
+ {
+ "epoch": 18.11989100817439,
+ "grad_norm": 8.0903902053833,
+ "learning_rate": 1.882475759537658e-05,
+ "loss": 0.958,
+ "step": 6650
+ },
+ {
+ "epoch": 18.122615803814714,
+ "grad_norm": 7.654234409332275,
+ "learning_rate": 1.882434247270906e-05,
+ "loss": 0.9238,
+ "step": 6651
+ },
+ {
+ "epoch": 18.12534059945504,
+ "grad_norm": 7.101521015167236,
+ "learning_rate": 1.8823927281317848e-05,
+ "loss": 0.9688,
+ "step": 6652
+ },
+ {
+ "epoch": 18.12806539509537,
+ "grad_norm": 7.770018577575684,
+ "learning_rate": 1.882351202120617e-05,
+ "loss": 0.6746,
+ "step": 6653
+ },
+ {
+ "epoch": 18.130790190735695,
+ "grad_norm": 10.246801376342773,
+ "learning_rate": 1.882309669237727e-05,
+ "loss": 0.908,
+ "step": 6654
+ },
+ {
+ "epoch": 18.13351498637602,
+ "grad_norm": 7.705492973327637,
+ "learning_rate": 1.882268129483437e-05,
+ "loss": 0.7057,
+ "step": 6655
+ },
+ {
+ "epoch": 18.13623978201635,
+ "grad_norm": 10.161961555480957,
+ "learning_rate": 1.8822265828580716e-05,
+ "loss": 0.8679,
+ "step": 6656
+ },
+ {
+ "epoch": 18.138964577656676,
+ "grad_norm": 7.283121585845947,
+ "learning_rate": 1.8821850293619536e-05,
+ "loss": 0.9399,
+ "step": 6657
+ },
+ {
+ "epoch": 18.141689373297,
+ "grad_norm": 8.794880867004395,
+ "learning_rate": 1.8821434689954074e-05,
+ "loss": 0.7854,
+ "step": 6658
+ },
+ {
+ "epoch": 18.14441416893733,
+ "grad_norm": 7.504270553588867,
+ "learning_rate": 1.8821019017587562e-05,
+ "loss": 0.8784,
+ "step": 6659
+ },
+ {
+ "epoch": 18.147138964577657,
+ "grad_norm": 7.3743438720703125,
+ "learning_rate": 1.882060327652324e-05,
+ "loss": 0.9117,
+ "step": 6660
+ },
+ {
+ "epoch": 18.149863760217983,
+ "grad_norm": 8.664271354675293,
+ "learning_rate": 1.8820187466764337e-05,
+ "loss": 0.849,
+ "step": 6661
+ },
+ {
+ "epoch": 18.152588555858312,
+ "grad_norm": 8.355574607849121,
+ "learning_rate": 1.88197715883141e-05,
+ "loss": 0.8354,
+ "step": 6662
+ },
+ {
+ "epoch": 18.155313351498638,
+ "grad_norm": 7.7394514083862305,
+ "learning_rate": 1.8819355641175767e-05,
+ "loss": 0.7986,
+ "step": 6663
+ },
+ {
+ "epoch": 18.158038147138964,
+ "grad_norm": 8.34272575378418,
+ "learning_rate": 1.8818939625352577e-05,
+ "loss": 0.7178,
+ "step": 6664
+ },
+ {
+ "epoch": 18.160762942779293,
+ "grad_norm": 7.23603630065918,
+ "learning_rate": 1.8818523540847768e-05,
+ "loss": 0.8145,
+ "step": 6665
+ },
+ {
+ "epoch": 18.16348773841962,
+ "grad_norm": 7.129431247711182,
+ "learning_rate": 1.8818107387664582e-05,
+ "loss": 0.6943,
+ "step": 6666
+ },
+ {
+ "epoch": 18.166212534059945,
+ "grad_norm": 9.455894470214844,
+ "learning_rate": 1.881769116580626e-05,
+ "loss": 0.9041,
+ "step": 6667
+ },
+ {
+ "epoch": 18.168937329700274,
+ "grad_norm": 8.3630952835083,
+ "learning_rate": 1.881727487527604e-05,
+ "loss": 1.0199,
+ "step": 6668
+ },
+ {
+ "epoch": 18.1716621253406,
+ "grad_norm": 9.230984687805176,
+ "learning_rate": 1.881685851607717e-05,
+ "loss": 0.9042,
+ "step": 6669
+ },
+ {
+ "epoch": 18.174386920980925,
+ "grad_norm": 6.956221580505371,
+ "learning_rate": 1.881644208821289e-05,
+ "loss": 0.6833,
+ "step": 6670
+ },
+ {
+ "epoch": 18.177111716621255,
+ "grad_norm": 8.737435340881348,
+ "learning_rate": 1.881602559168644e-05,
+ "loss": 1.0133,
+ "step": 6671
+ },
+ {
+ "epoch": 18.17983651226158,
+ "grad_norm": 7.035590171813965,
+ "learning_rate": 1.881560902650107e-05,
+ "loss": 0.8278,
+ "step": 6672
+ },
+ {
+ "epoch": 18.182561307901906,
+ "grad_norm": 13.982083320617676,
+ "learning_rate": 1.881519239266002e-05,
+ "loss": 1.0471,
+ "step": 6673
+ },
+ {
+ "epoch": 18.185286103542236,
+ "grad_norm": 7.48789119720459,
+ "learning_rate": 1.8814775690166535e-05,
+ "loss": 0.8416,
+ "step": 6674
+ },
+ {
+ "epoch": 18.18801089918256,
+ "grad_norm": 6.988489627838135,
+ "learning_rate": 1.8814358919023855e-05,
+ "loss": 0.7903,
+ "step": 6675
+ },
+ {
+ "epoch": 18.190735694822887,
+ "grad_norm": 13.37846851348877,
+ "learning_rate": 1.8813942079235237e-05,
+ "loss": 0.6805,
+ "step": 6676
+ },
+ {
+ "epoch": 18.193460490463217,
+ "grad_norm": 9.722649574279785,
+ "learning_rate": 1.881352517080392e-05,
+ "loss": 1.0209,
+ "step": 6677
+ },
+ {
+ "epoch": 18.196185286103542,
+ "grad_norm": 9.827420234680176,
+ "learning_rate": 1.8813108193733155e-05,
+ "loss": 0.83,
+ "step": 6678
+ },
+ {
+ "epoch": 18.19891008174387,
+ "grad_norm": 8.813655853271484,
+ "learning_rate": 1.8812691148026186e-05,
+ "loss": 0.828,
+ "step": 6679
+ },
+ {
+ "epoch": 18.201634877384198,
+ "grad_norm": 7.097906112670898,
+ "learning_rate": 1.881227403368626e-05,
+ "loss": 0.7917,
+ "step": 6680
+ },
+ {
+ "epoch": 18.204359673024523,
+ "grad_norm": 7.607766151428223,
+ "learning_rate": 1.881185685071663e-05,
+ "loss": 0.8481,
+ "step": 6681
+ },
+ {
+ "epoch": 18.20708446866485,
+ "grad_norm": 7.371726036071777,
+ "learning_rate": 1.8811439599120543e-05,
+ "loss": 0.8933,
+ "step": 6682
+ },
+ {
+ "epoch": 18.20980926430518,
+ "grad_norm": 7.199708938598633,
+ "learning_rate": 1.8811022278901244e-05,
+ "loss": 0.9622,
+ "step": 6683
+ },
+ {
+ "epoch": 18.212534059945504,
+ "grad_norm": 7.4748663902282715,
+ "learning_rate": 1.881060489006199e-05,
+ "loss": 1.014,
+ "step": 6684
+ },
+ {
+ "epoch": 18.21525885558583,
+ "grad_norm": 8.907736778259277,
+ "learning_rate": 1.881018743260603e-05,
+ "loss": 0.7926,
+ "step": 6685
+ },
+ {
+ "epoch": 18.21798365122616,
+ "grad_norm": 6.982027530670166,
+ "learning_rate": 1.880976990653661e-05,
+ "loss": 0.9241,
+ "step": 6686
+ },
+ {
+ "epoch": 18.220708446866485,
+ "grad_norm": 8.772224426269531,
+ "learning_rate": 1.8809352311856987e-05,
+ "loss": 0.7861,
+ "step": 6687
+ },
+ {
+ "epoch": 18.22343324250681,
+ "grad_norm": 9.9409818649292,
+ "learning_rate": 1.8808934648570412e-05,
+ "loss": 0.7244,
+ "step": 6688
+ },
+ {
+ "epoch": 18.22615803814714,
+ "grad_norm": 7.434682846069336,
+ "learning_rate": 1.8808516916680138e-05,
+ "loss": 0.9373,
+ "step": 6689
+ },
+ {
+ "epoch": 18.228882833787466,
+ "grad_norm": 7.6927642822265625,
+ "learning_rate": 1.880809911618942e-05,
+ "loss": 0.9325,
+ "step": 6690
+ },
+ {
+ "epoch": 18.231607629427792,
+ "grad_norm": 10.556446075439453,
+ "learning_rate": 1.8807681247101507e-05,
+ "loss": 0.9557,
+ "step": 6691
+ },
+ {
+ "epoch": 18.23433242506812,
+ "grad_norm": 8.532793998718262,
+ "learning_rate": 1.8807263309419656e-05,
+ "loss": 0.7985,
+ "step": 6692
+ },
+ {
+ "epoch": 18.237057220708447,
+ "grad_norm": 6.721668243408203,
+ "learning_rate": 1.8806845303147123e-05,
+ "loss": 0.902,
+ "step": 6693
+ },
+ {
+ "epoch": 18.239782016348773,
+ "grad_norm": 8.049880981445312,
+ "learning_rate": 1.880642722828716e-05,
+ "loss": 0.8823,
+ "step": 6694
+ },
+ {
+ "epoch": 18.242506811989102,
+ "grad_norm": 10.84933853149414,
+ "learning_rate": 1.8806009084843025e-05,
+ "loss": 0.8455,
+ "step": 6695
+ },
+ {
+ "epoch": 18.245231607629428,
+ "grad_norm": 9.497926712036133,
+ "learning_rate": 1.8805590872817976e-05,
+ "loss": 0.8737,
+ "step": 6696
+ },
+ {
+ "epoch": 18.247956403269754,
+ "grad_norm": 8.234804153442383,
+ "learning_rate": 1.880517259221527e-05,
+ "loss": 0.724,
+ "step": 6697
+ },
+ {
+ "epoch": 18.250681198910083,
+ "grad_norm": 8.508273124694824,
+ "learning_rate": 1.880475424303816e-05,
+ "loss": 0.7722,
+ "step": 6698
+ },
+ {
+ "epoch": 18.25340599455041,
+ "grad_norm": 9.23184871673584,
+ "learning_rate": 1.880433582528991e-05,
+ "loss": 0.8793,
+ "step": 6699
+ },
+ {
+ "epoch": 18.256130790190735,
+ "grad_norm": 8.031156539916992,
+ "learning_rate": 1.8803917338973778e-05,
+ "loss": 0.7725,
+ "step": 6700
+ },
+ {
+ "epoch": 18.258855585831064,
+ "grad_norm": 8.23066520690918,
+ "learning_rate": 1.8803498784093014e-05,
+ "loss": 0.9756,
+ "step": 6701
+ },
+ {
+ "epoch": 18.26158038147139,
+ "grad_norm": 8.178288459777832,
+ "learning_rate": 1.880308016065089e-05,
+ "loss": 0.835,
+ "step": 6702
+ },
+ {
+ "epoch": 18.264305177111716,
+ "grad_norm": 7.084980487823486,
+ "learning_rate": 1.880266146865066e-05,
+ "loss": 0.6921,
+ "step": 6703
+ },
+ {
+ "epoch": 18.267029972752045,
+ "grad_norm": 7.853808403015137,
+ "learning_rate": 1.8802242708095586e-05,
+ "loss": 0.8521,
+ "step": 6704
+ },
+ {
+ "epoch": 18.26975476839237,
+ "grad_norm": 9.48322582244873,
+ "learning_rate": 1.880182387898893e-05,
+ "loss": 0.9736,
+ "step": 6705
+ },
+ {
+ "epoch": 18.272479564032697,
+ "grad_norm": 8.77895450592041,
+ "learning_rate": 1.880140498133395e-05,
+ "loss": 0.963,
+ "step": 6706
+ },
+ {
+ "epoch": 18.275204359673026,
+ "grad_norm": 7.374267101287842,
+ "learning_rate": 1.8800986015133914e-05,
+ "loss": 0.9132,
+ "step": 6707
+ },
+ {
+ "epoch": 18.277929155313352,
+ "grad_norm": 8.246108055114746,
+ "learning_rate": 1.8800566980392082e-05,
+ "loss": 0.8914,
+ "step": 6708
+ },
+ {
+ "epoch": 18.280653950953678,
+ "grad_norm": 8.349637985229492,
+ "learning_rate": 1.8800147877111716e-05,
+ "loss": 0.7456,
+ "step": 6709
+ },
+ {
+ "epoch": 18.283378746594007,
+ "grad_norm": 9.123753547668457,
+ "learning_rate": 1.8799728705296084e-05,
+ "loss": 0.8217,
+ "step": 6710
+ },
+ {
+ "epoch": 18.286103542234333,
+ "grad_norm": 6.784246444702148,
+ "learning_rate": 1.8799309464948446e-05,
+ "loss": 0.8553,
+ "step": 6711
+ },
+ {
+ "epoch": 18.28882833787466,
+ "grad_norm": 7.580383777618408,
+ "learning_rate": 1.8798890156072068e-05,
+ "loss": 0.7469,
+ "step": 6712
+ },
+ {
+ "epoch": 18.291553133514988,
+ "grad_norm": 11.182293891906738,
+ "learning_rate": 1.879847077867022e-05,
+ "loss": 0.8315,
+ "step": 6713
+ },
+ {
+ "epoch": 18.294277929155314,
+ "grad_norm": 9.869726181030273,
+ "learning_rate": 1.879805133274616e-05,
+ "loss": 0.8164,
+ "step": 6714
+ },
+ {
+ "epoch": 18.29700272479564,
+ "grad_norm": 7.502408504486084,
+ "learning_rate": 1.8797631818303164e-05,
+ "loss": 0.9302,
+ "step": 6715
+ },
+ {
+ "epoch": 18.29972752043597,
+ "grad_norm": 8.410951614379883,
+ "learning_rate": 1.8797212235344492e-05,
+ "loss": 0.774,
+ "step": 6716
+ },
+ {
+ "epoch": 18.302452316076295,
+ "grad_norm": 7.368539333343506,
+ "learning_rate": 1.8796792583873418e-05,
+ "loss": 1.0969,
+ "step": 6717
+ },
+ {
+ "epoch": 18.30517711171662,
+ "grad_norm": 8.469276428222656,
+ "learning_rate": 1.87963728638932e-05,
+ "loss": 0.9127,
+ "step": 6718
+ },
+ {
+ "epoch": 18.30790190735695,
+ "grad_norm": 11.788848876953125,
+ "learning_rate": 1.8795953075407117e-05,
+ "loss": 0.8334,
+ "step": 6719
+ },
+ {
+ "epoch": 18.310626702997276,
+ "grad_norm": 7.8592047691345215,
+ "learning_rate": 1.8795533218418437e-05,
+ "loss": 0.8579,
+ "step": 6720
+ },
+ {
+ "epoch": 18.3133514986376,
+ "grad_norm": 8.544289588928223,
+ "learning_rate": 1.8795113292930425e-05,
+ "loss": 0.8611,
+ "step": 6721
+ },
+ {
+ "epoch": 18.31607629427793,
+ "grad_norm": 8.519726753234863,
+ "learning_rate": 1.8794693298946352e-05,
+ "loss": 0.8892,
+ "step": 6722
+ },
+ {
+ "epoch": 18.318801089918257,
+ "grad_norm": 10.280699729919434,
+ "learning_rate": 1.8794273236469495e-05,
+ "loss": 0.9015,
+ "step": 6723
+ },
+ {
+ "epoch": 18.321525885558582,
+ "grad_norm": 8.979537010192871,
+ "learning_rate": 1.8793853105503118e-05,
+ "loss": 0.9293,
+ "step": 6724
+ },
+ {
+ "epoch": 18.32425068119891,
+ "grad_norm": 6.912249565124512,
+ "learning_rate": 1.8793432906050496e-05,
+ "loss": 0.84,
+ "step": 6725
+ },
+ {
+ "epoch": 18.326975476839237,
+ "grad_norm": 6.5656256675720215,
+ "learning_rate": 1.87930126381149e-05,
+ "loss": 0.7482,
+ "step": 6726
+ },
+ {
+ "epoch": 18.329700272479563,
+ "grad_norm": 6.806774616241455,
+ "learning_rate": 1.879259230169961e-05,
+ "loss": 0.8,
+ "step": 6727
+ },
+ {
+ "epoch": 18.332425068119893,
+ "grad_norm": 15.59570026397705,
+ "learning_rate": 1.8792171896807886e-05,
+ "loss": 0.9402,
+ "step": 6728
+ },
+ {
+ "epoch": 18.33514986376022,
+ "grad_norm": 8.757286071777344,
+ "learning_rate": 1.879175142344302e-05,
+ "loss": 0.9177,
+ "step": 6729
+ },
+ {
+ "epoch": 18.337874659400544,
+ "grad_norm": 8.42879867553711,
+ "learning_rate": 1.8791330881608266e-05,
+ "loss": 0.8497,
+ "step": 6730
+ },
+ {
+ "epoch": 18.340599455040874,
+ "grad_norm": 7.903569221496582,
+ "learning_rate": 1.879091027130692e-05,
+ "loss": 0.7772,
+ "step": 6731
+ },
+ {
+ "epoch": 18.3433242506812,
+ "grad_norm": 6.854870319366455,
+ "learning_rate": 1.8790489592542243e-05,
+ "loss": 1.0813,
+ "step": 6732
+ },
+ {
+ "epoch": 18.346049046321525,
+ "grad_norm": 12.01852798461914,
+ "learning_rate": 1.8790068845317516e-05,
+ "loss": 0.9101,
+ "step": 6733
+ },
+ {
+ "epoch": 18.348773841961854,
+ "grad_norm": 8.10268497467041,
+ "learning_rate": 1.8789648029636014e-05,
+ "loss": 0.8087,
+ "step": 6734
+ },
+ {
+ "epoch": 18.35149863760218,
+ "grad_norm": 7.030385494232178,
+ "learning_rate": 1.8789227145501023e-05,
+ "loss": 0.6307,
+ "step": 6735
+ },
+ {
+ "epoch": 18.354223433242506,
+ "grad_norm": 8.755697250366211,
+ "learning_rate": 1.8788806192915804e-05,
+ "loss": 0.8468,
+ "step": 6736
+ },
+ {
+ "epoch": 18.356948228882835,
+ "grad_norm": 7.640406608581543,
+ "learning_rate": 1.8788385171883653e-05,
+ "loss": 1.0275,
+ "step": 6737
+ },
+ {
+ "epoch": 18.35967302452316,
+ "grad_norm": 6.8547515869140625,
+ "learning_rate": 1.878796408240784e-05,
+ "loss": 0.7567,
+ "step": 6738
+ },
+ {
+ "epoch": 18.362397820163487,
+ "grad_norm": 13.387345314025879,
+ "learning_rate": 1.878754292449164e-05,
+ "loss": 0.9679,
+ "step": 6739
+ },
+ {
+ "epoch": 18.365122615803816,
+ "grad_norm": 8.199585914611816,
+ "learning_rate": 1.8787121698138344e-05,
+ "loss": 0.8151,
+ "step": 6740
+ },
+ {
+ "epoch": 18.367847411444142,
+ "grad_norm": 9.504558563232422,
+ "learning_rate": 1.8786700403351226e-05,
+ "loss": 0.983,
+ "step": 6741
+ },
+ {
+ "epoch": 18.370572207084468,
+ "grad_norm": 7.679377555847168,
+ "learning_rate": 1.878627904013357e-05,
+ "loss": 0.8545,
+ "step": 6742
+ },
+ {
+ "epoch": 18.373297002724797,
+ "grad_norm": 11.670575141906738,
+ "learning_rate": 1.878585760848865e-05,
+ "loss": 0.7836,
+ "step": 6743
+ },
+ {
+ "epoch": 18.376021798365123,
+ "grad_norm": 8.45013427734375,
+ "learning_rate": 1.878543610841976e-05,
+ "loss": 0.8475,
+ "step": 6744
+ },
+ {
+ "epoch": 18.37874659400545,
+ "grad_norm": 9.006660461425781,
+ "learning_rate": 1.878501453993017e-05,
+ "loss": 0.9005,
+ "step": 6745
+ },
+ {
+ "epoch": 18.381471389645778,
+ "grad_norm": 7.631886005401611,
+ "learning_rate": 1.8784592903023175e-05,
+ "loss": 0.8474,
+ "step": 6746
+ },
+ {
+ "epoch": 18.384196185286104,
+ "grad_norm": 6.807475566864014,
+ "learning_rate": 1.8784171197702053e-05,
+ "loss": 0.7784,
+ "step": 6747
+ },
+ {
+ "epoch": 18.38692098092643,
+ "grad_norm": 8.734243392944336,
+ "learning_rate": 1.8783749423970085e-05,
+ "loss": 0.8893,
+ "step": 6748
+ },
+ {
+ "epoch": 18.38964577656676,
+ "grad_norm": 10.451774597167969,
+ "learning_rate": 1.878332758183056e-05,
+ "loss": 0.9891,
+ "step": 6749
+ },
+ {
+ "epoch": 18.392370572207085,
+ "grad_norm": 7.548184394836426,
+ "learning_rate": 1.8782905671286763e-05,
+ "loss": 0.9047,
+ "step": 6750
+ },
+ {
+ "epoch": 18.39509536784741,
+ "grad_norm": 7.679628849029541,
+ "learning_rate": 1.878248369234198e-05,
+ "loss": 0.9084,
+ "step": 6751
+ },
+ {
+ "epoch": 18.39782016348774,
+ "grad_norm": 7.905241966247559,
+ "learning_rate": 1.8782061644999497e-05,
+ "loss": 0.9534,
+ "step": 6752
+ },
+ {
+ "epoch": 18.400544959128066,
+ "grad_norm": 7.051769733428955,
+ "learning_rate": 1.8781639529262598e-05,
+ "loss": 0.7361,
+ "step": 6753
+ },
+ {
+ "epoch": 18.40326975476839,
+ "grad_norm": 10.122602462768555,
+ "learning_rate": 1.8781217345134574e-05,
+ "loss": 0.8901,
+ "step": 6754
+ },
+ {
+ "epoch": 18.40599455040872,
+ "grad_norm": 9.768773078918457,
+ "learning_rate": 1.8780795092618717e-05,
+ "loss": 0.8539,
+ "step": 6755
+ },
+ {
+ "epoch": 18.408719346049047,
+ "grad_norm": 9.212475776672363,
+ "learning_rate": 1.8780372771718302e-05,
+ "loss": 1.0101,
+ "step": 6756
+ },
+ {
+ "epoch": 18.411444141689373,
+ "grad_norm": 6.382621765136719,
+ "learning_rate": 1.8779950382436632e-05,
+ "loss": 0.7898,
+ "step": 6757
+ },
+ {
+ "epoch": 18.414168937329702,
+ "grad_norm": 8.457864761352539,
+ "learning_rate": 1.8779527924776988e-05,
+ "loss": 0.948,
+ "step": 6758
+ },
+ {
+ "epoch": 18.416893732970028,
+ "grad_norm": 8.18539810180664,
+ "learning_rate": 1.877910539874267e-05,
+ "loss": 0.8048,
+ "step": 6759
+ },
+ {
+ "epoch": 18.419618528610354,
+ "grad_norm": 7.24704122543335,
+ "learning_rate": 1.877868280433695e-05,
+ "loss": 0.8054,
+ "step": 6760
+ },
+ {
+ "epoch": 18.422343324250683,
+ "grad_norm": 10.048449516296387,
+ "learning_rate": 1.877826014156314e-05,
+ "loss": 0.9694,
+ "step": 6761
+ },
+ {
+ "epoch": 18.42506811989101,
+ "grad_norm": 8.157830238342285,
+ "learning_rate": 1.877783741042452e-05,
+ "loss": 0.9662,
+ "step": 6762
+ },
+ {
+ "epoch": 18.427792915531334,
+ "grad_norm": 7.6305928230285645,
+ "learning_rate": 1.8777414610924386e-05,
+ "loss": 0.7234,
+ "step": 6763
+ },
+ {
+ "epoch": 18.430517711171664,
+ "grad_norm": 9.370262145996094,
+ "learning_rate": 1.8776991743066025e-05,
+ "loss": 0.9136,
+ "step": 6764
+ },
+ {
+ "epoch": 18.43324250681199,
+ "grad_norm": 8.10416030883789,
+ "learning_rate": 1.8776568806852738e-05,
+ "loss": 0.7332,
+ "step": 6765
+ },
+ {
+ "epoch": 18.435967302452315,
+ "grad_norm": 7.520824909210205,
+ "learning_rate": 1.8776145802287816e-05,
+ "loss": 0.8267,
+ "step": 6766
+ },
+ {
+ "epoch": 18.438692098092645,
+ "grad_norm": 8.330543518066406,
+ "learning_rate": 1.8775722729374552e-05,
+ "loss": 0.8585,
+ "step": 6767
+ },
+ {
+ "epoch": 18.44141689373297,
+ "grad_norm": 7.984499931335449,
+ "learning_rate": 1.8775299588116243e-05,
+ "loss": 0.7097,
+ "step": 6768
+ },
+ {
+ "epoch": 18.444141689373296,
+ "grad_norm": 7.713501453399658,
+ "learning_rate": 1.877487637851618e-05,
+ "loss": 0.8645,
+ "step": 6769
+ },
+ {
+ "epoch": 18.446866485013626,
+ "grad_norm": 7.1620283126831055,
+ "learning_rate": 1.8774453100577664e-05,
+ "loss": 1.0524,
+ "step": 6770
+ },
+ {
+ "epoch": 18.44959128065395,
+ "grad_norm": 7.688859462738037,
+ "learning_rate": 1.8774029754303995e-05,
+ "loss": 0.833,
+ "step": 6771
+ },
+ {
+ "epoch": 18.452316076294277,
+ "grad_norm": 7.874576568603516,
+ "learning_rate": 1.877360633969846e-05,
+ "loss": 0.8827,
+ "step": 6772
+ },
+ {
+ "epoch": 18.455040871934607,
+ "grad_norm": 8.26817512512207,
+ "learning_rate": 1.877318285676436e-05,
+ "loss": 0.8549,
+ "step": 6773
+ },
+ {
+ "epoch": 18.457765667574932,
+ "grad_norm": 7.061283111572266,
+ "learning_rate": 1.8772759305504996e-05,
+ "loss": 0.7936,
+ "step": 6774
+ },
+ {
+ "epoch": 18.460490463215258,
+ "grad_norm": 12.622628211975098,
+ "learning_rate": 1.877233568592366e-05,
+ "loss": 0.9607,
+ "step": 6775
+ },
+ {
+ "epoch": 18.463215258855588,
+ "grad_norm": 8.405427932739258,
+ "learning_rate": 1.877191199802366e-05,
+ "loss": 0.9612,
+ "step": 6776
+ },
+ {
+ "epoch": 18.465940054495913,
+ "grad_norm": 9.933815956115723,
+ "learning_rate": 1.8771488241808295e-05,
+ "loss": 0.7939,
+ "step": 6777
+ },
+ {
+ "epoch": 18.46866485013624,
+ "grad_norm": 6.550434112548828,
+ "learning_rate": 1.8771064417280856e-05,
+ "loss": 0.9353,
+ "step": 6778
+ },
+ {
+ "epoch": 18.47138964577657,
+ "grad_norm": 10.655665397644043,
+ "learning_rate": 1.8770640524444653e-05,
+ "loss": 0.9561,
+ "step": 6779
+ },
+ {
+ "epoch": 18.474114441416894,
+ "grad_norm": 7.041699409484863,
+ "learning_rate": 1.8770216563302984e-05,
+ "loss": 0.7959,
+ "step": 6780
+ },
+ {
+ "epoch": 18.47683923705722,
+ "grad_norm": 8.465987205505371,
+ "learning_rate": 1.876979253385915e-05,
+ "loss": 0.8094,
+ "step": 6781
+ },
+ {
+ "epoch": 18.479564032697546,
+ "grad_norm": 9.416106224060059,
+ "learning_rate": 1.8769368436116454e-05,
+ "loss": 0.7689,
+ "step": 6782
+ },
+ {
+ "epoch": 18.482288828337875,
+ "grad_norm": 9.46136474609375,
+ "learning_rate": 1.87689442700782e-05,
+ "loss": 0.9694,
+ "step": 6783
+ },
+ {
+ "epoch": 18.4850136239782,
+ "grad_norm": 9.132607460021973,
+ "learning_rate": 1.876852003574769e-05,
+ "loss": 0.8503,
+ "step": 6784
+ },
+ {
+ "epoch": 18.48773841961853,
+ "grad_norm": 10.33657169342041,
+ "learning_rate": 1.8768095733128226e-05,
+ "loss": 0.907,
+ "step": 6785
+ },
+ {
+ "epoch": 18.490463215258856,
+ "grad_norm": 8.639205932617188,
+ "learning_rate": 1.8767671362223117e-05,
+ "loss": 0.8226,
+ "step": 6786
+ },
+ {
+ "epoch": 18.493188010899182,
+ "grad_norm": 8.91231632232666,
+ "learning_rate": 1.8767246923035663e-05,
+ "loss": 0.9209,
+ "step": 6787
+ },
+ {
+ "epoch": 18.495912806539508,
+ "grad_norm": 7.934805393218994,
+ "learning_rate": 1.8766822415569175e-05,
+ "loss": 0.8568,
+ "step": 6788
+ },
+ {
+ "epoch": 18.498637602179837,
+ "grad_norm": 8.37930965423584,
+ "learning_rate": 1.8766397839826952e-05,
+ "loss": 0.886,
+ "step": 6789
+ },
+ {
+ "epoch": 18.501362397820163,
+ "grad_norm": 8.110930442810059,
+ "learning_rate": 1.876597319581231e-05,
+ "loss": 0.8521,
+ "step": 6790
+ },
+ {
+ "epoch": 18.504087193460492,
+ "grad_norm": 7.500209331512451,
+ "learning_rate": 1.8765548483528548e-05,
+ "loss": 0.8661,
+ "step": 6791
+ },
+ {
+ "epoch": 18.506811989100818,
+ "grad_norm": 7.315430641174316,
+ "learning_rate": 1.876512370297898e-05,
+ "loss": 0.78,
+ "step": 6792
+ },
+ {
+ "epoch": 18.509536784741144,
+ "grad_norm": 7.014491081237793,
+ "learning_rate": 1.8764698854166904e-05,
+ "loss": 0.9225,
+ "step": 6793
+ },
+ {
+ "epoch": 18.51226158038147,
+ "grad_norm": 6.934720039367676,
+ "learning_rate": 1.8764273937095642e-05,
+ "loss": 0.8499,
+ "step": 6794
+ },
+ {
+ "epoch": 18.5149863760218,
+ "grad_norm": 7.059356689453125,
+ "learning_rate": 1.876384895176849e-05,
+ "loss": 0.8367,
+ "step": 6795
+ },
+ {
+ "epoch": 18.517711171662125,
+ "grad_norm": 9.518843650817871,
+ "learning_rate": 1.876342389818877e-05,
+ "loss": 0.8096,
+ "step": 6796
+ },
+ {
+ "epoch": 18.520435967302454,
+ "grad_norm": 7.209913730621338,
+ "learning_rate": 1.8762998776359785e-05,
+ "loss": 0.8041,
+ "step": 6797
+ },
+ {
+ "epoch": 18.52316076294278,
+ "grad_norm": 7.684715747833252,
+ "learning_rate": 1.8762573586284847e-05,
+ "loss": 0.9806,
+ "step": 6798
+ },
+ {
+ "epoch": 18.525885558583106,
+ "grad_norm": 7.682023048400879,
+ "learning_rate": 1.876214832796727e-05,
+ "loss": 0.7159,
+ "step": 6799
+ },
+ {
+ "epoch": 18.52861035422343,
+ "grad_norm": 9.923916816711426,
+ "learning_rate": 1.876172300141036e-05,
+ "loss": 0.9024,
+ "step": 6800
+ },
+ {
+ "epoch": 18.53133514986376,
+ "grad_norm": 8.820189476013184,
+ "learning_rate": 1.8761297606617436e-05,
+ "loss": 0.8292,
+ "step": 6801
+ },
+ {
+ "epoch": 18.534059945504087,
+ "grad_norm": 9.852216720581055,
+ "learning_rate": 1.876087214359181e-05,
+ "loss": 0.8995,
+ "step": 6802
+ },
+ {
+ "epoch": 18.536784741144416,
+ "grad_norm": 7.489625453948975,
+ "learning_rate": 1.876044661233679e-05,
+ "loss": 0.9141,
+ "step": 6803
+ },
+ {
+ "epoch": 18.539509536784742,
+ "grad_norm": 8.809782981872559,
+ "learning_rate": 1.8760021012855694e-05,
+ "loss": 1.0233,
+ "step": 6804
+ },
+ {
+ "epoch": 18.542234332425068,
+ "grad_norm": 8.199651718139648,
+ "learning_rate": 1.875959534515184e-05,
+ "loss": 0.8774,
+ "step": 6805
+ },
+ {
+ "epoch": 18.544959128065393,
+ "grad_norm": 10.005997657775879,
+ "learning_rate": 1.8759169609228536e-05,
+ "loss": 0.8667,
+ "step": 6806
+ },
+ {
+ "epoch": 18.547683923705723,
+ "grad_norm": 8.236612319946289,
+ "learning_rate": 1.8758743805089104e-05,
+ "loss": 0.7457,
+ "step": 6807
+ },
+ {
+ "epoch": 18.55040871934605,
+ "grad_norm": 8.340702056884766,
+ "learning_rate": 1.8758317932736855e-05,
+ "loss": 0.8894,
+ "step": 6808
+ },
+ {
+ "epoch": 18.553133514986374,
+ "grad_norm": 8.727513313293457,
+ "learning_rate": 1.8757891992175106e-05,
+ "loss": 0.9464,
+ "step": 6809
+ },
+ {
+ "epoch": 18.555858310626704,
+ "grad_norm": 8.727365493774414,
+ "learning_rate": 1.875746598340718e-05,
+ "loss": 0.9033,
+ "step": 6810
+ },
+ {
+ "epoch": 18.55858310626703,
+ "grad_norm": 8.104939460754395,
+ "learning_rate": 1.8757039906436388e-05,
+ "loss": 0.8466,
+ "step": 6811
+ },
+ {
+ "epoch": 18.561307901907355,
+ "grad_norm": 7.656373500823975,
+ "learning_rate": 1.8756613761266052e-05,
+ "loss": 0.9034,
+ "step": 6812
+ },
+ {
+ "epoch": 18.564032697547685,
+ "grad_norm": 10.777390480041504,
+ "learning_rate": 1.875618754789949e-05,
+ "loss": 0.9558,
+ "step": 6813
+ },
+ {
+ "epoch": 18.56675749318801,
+ "grad_norm": 7.567367076873779,
+ "learning_rate": 1.8755761266340018e-05,
+ "loss": 0.8656,
+ "step": 6814
+ },
+ {
+ "epoch": 18.569482288828336,
+ "grad_norm": 7.490059852600098,
+ "learning_rate": 1.8755334916590964e-05,
+ "loss": 0.9022,
+ "step": 6815
+ },
+ {
+ "epoch": 18.572207084468666,
+ "grad_norm": 8.64775276184082,
+ "learning_rate": 1.875490849865564e-05,
+ "loss": 1.0067,
+ "step": 6816
+ },
+ {
+ "epoch": 18.57493188010899,
+ "grad_norm": 8.965628623962402,
+ "learning_rate": 1.8754482012537374e-05,
+ "loss": 0.921,
+ "step": 6817
+ },
+ {
+ "epoch": 18.577656675749317,
+ "grad_norm": 9.244271278381348,
+ "learning_rate": 1.875405545823948e-05,
+ "loss": 0.6953,
+ "step": 6818
+ },
+ {
+ "epoch": 18.580381471389646,
+ "grad_norm": 8.459924697875977,
+ "learning_rate": 1.8753628835765284e-05,
+ "loss": 0.8523,
+ "step": 6819
+ },
+ {
+ "epoch": 18.583106267029972,
+ "grad_norm": 8.601913452148438,
+ "learning_rate": 1.875320214511811e-05,
+ "loss": 0.8688,
+ "step": 6820
+ },
+ {
+ "epoch": 18.585831062670298,
+ "grad_norm": 8.533843994140625,
+ "learning_rate": 1.875277538630128e-05,
+ "loss": 0.7902,
+ "step": 6821
+ },
+ {
+ "epoch": 18.588555858310627,
+ "grad_norm": 7.612013339996338,
+ "learning_rate": 1.8752348559318116e-05,
+ "loss": 0.7195,
+ "step": 6822
+ },
+ {
+ "epoch": 18.591280653950953,
+ "grad_norm": 7.308195114135742,
+ "learning_rate": 1.8751921664171944e-05,
+ "loss": 0.6616,
+ "step": 6823
+ },
+ {
+ "epoch": 18.59400544959128,
+ "grad_norm": 8.093254089355469,
+ "learning_rate": 1.8751494700866088e-05,
+ "loss": 0.8279,
+ "step": 6824
+ },
+ {
+ "epoch": 18.59673024523161,
+ "grad_norm": 7.823365688323975,
+ "learning_rate": 1.875106766940387e-05,
+ "loss": 1.1262,
+ "step": 6825
+ },
+ {
+ "epoch": 18.599455040871934,
+ "grad_norm": 7.550796985626221,
+ "learning_rate": 1.8750640569788624e-05,
+ "loss": 0.8933,
+ "step": 6826
+ },
+ {
+ "epoch": 18.60217983651226,
+ "grad_norm": 7.996880054473877,
+ "learning_rate": 1.8750213402023664e-05,
+ "loss": 0.8503,
+ "step": 6827
+ },
+ {
+ "epoch": 18.60490463215259,
+ "grad_norm": 9.51594066619873,
+ "learning_rate": 1.874978616611233e-05,
+ "loss": 0.9055,
+ "step": 6828
+ },
+ {
+ "epoch": 18.607629427792915,
+ "grad_norm": 8.002632141113281,
+ "learning_rate": 1.874935886205794e-05,
+ "loss": 0.797,
+ "step": 6829
+ },
+ {
+ "epoch": 18.61035422343324,
+ "grad_norm": 7.839196681976318,
+ "learning_rate": 1.8748931489863823e-05,
+ "loss": 0.932,
+ "step": 6830
+ },
+ {
+ "epoch": 18.61307901907357,
+ "grad_norm": 8.164216995239258,
+ "learning_rate": 1.874850404953331e-05,
+ "loss": 0.8767,
+ "step": 6831
+ },
+ {
+ "epoch": 18.615803814713896,
+ "grad_norm": 9.41263198852539,
+ "learning_rate": 1.8748076541069734e-05,
+ "loss": 0.9336,
+ "step": 6832
+ },
+ {
+ "epoch": 18.618528610354222,
+ "grad_norm": 8.057923316955566,
+ "learning_rate": 1.874764896447641e-05,
+ "loss": 0.8961,
+ "step": 6833
+ },
+ {
+ "epoch": 18.62125340599455,
+ "grad_norm": 8.388008117675781,
+ "learning_rate": 1.8747221319756686e-05,
+ "loss": 0.8668,
+ "step": 6834
+ },
+ {
+ "epoch": 18.623978201634877,
+ "grad_norm": 8.542396545410156,
+ "learning_rate": 1.874679360691388e-05,
+ "loss": 0.9678,
+ "step": 6835
+ },
+ {
+ "epoch": 18.626702997275203,
+ "grad_norm": 8.668232917785645,
+ "learning_rate": 1.874636582595133e-05,
+ "loss": 0.976,
+ "step": 6836
+ },
+ {
+ "epoch": 18.629427792915532,
+ "grad_norm": 6.552305698394775,
+ "learning_rate": 1.874593797687236e-05,
+ "loss": 0.72,
+ "step": 6837
+ },
+ {
+ "epoch": 18.632152588555858,
+ "grad_norm": 9.538304328918457,
+ "learning_rate": 1.874551005968031e-05,
+ "loss": 0.91,
+ "step": 6838
+ },
+ {
+ "epoch": 18.634877384196184,
+ "grad_norm": 8.393935203552246,
+ "learning_rate": 1.8745082074378507e-05,
+ "loss": 0.9698,
+ "step": 6839
+ },
+ {
+ "epoch": 18.637602179836513,
+ "grad_norm": 8.084198951721191,
+ "learning_rate": 1.8744654020970284e-05,
+ "loss": 0.9087,
+ "step": 6840
+ },
+ {
+ "epoch": 18.64032697547684,
+ "grad_norm": 7.184995651245117,
+ "learning_rate": 1.8744225899458982e-05,
+ "loss": 0.6638,
+ "step": 6841
+ },
+ {
+ "epoch": 18.643051771117165,
+ "grad_norm": 7.042233467102051,
+ "learning_rate": 1.874379770984793e-05,
+ "loss": 0.7306,
+ "step": 6842
+ },
+ {
+ "epoch": 18.645776566757494,
+ "grad_norm": 7.042173385620117,
+ "learning_rate": 1.8743369452140457e-05,
+ "loss": 0.879,
+ "step": 6843
+ },
+ {
+ "epoch": 18.64850136239782,
+ "grad_norm": 7.013894081115723,
+ "learning_rate": 1.874294112633991e-05,
+ "loss": 0.8345,
+ "step": 6844
+ },
+ {
+ "epoch": 18.651226158038146,
+ "grad_norm": 8.85759162902832,
+ "learning_rate": 1.874251273244962e-05,
+ "loss": 0.8652,
+ "step": 6845
+ },
+ {
+ "epoch": 18.653950953678475,
+ "grad_norm": 7.782415866851807,
+ "learning_rate": 1.874208427047292e-05,
+ "loss": 0.9827,
+ "step": 6846
+ },
+ {
+ "epoch": 18.6566757493188,
+ "grad_norm": 7.596438884735107,
+ "learning_rate": 1.8741655740413143e-05,
+ "loss": 0.9199,
+ "step": 6847
+ },
+ {
+ "epoch": 18.659400544959126,
+ "grad_norm": 7.295292854309082,
+ "learning_rate": 1.874122714227364e-05,
+ "loss": 1.0024,
+ "step": 6848
+ },
+ {
+ "epoch": 18.662125340599456,
+ "grad_norm": 7.571012496948242,
+ "learning_rate": 1.8740798476057737e-05,
+ "loss": 0.9304,
+ "step": 6849
+ },
+ {
+ "epoch": 18.66485013623978,
+ "grad_norm": 7.809437274932861,
+ "learning_rate": 1.874036974176878e-05,
+ "loss": 0.755,
+ "step": 6850
+ },
+ {
+ "epoch": 18.667574931880107,
+ "grad_norm": 8.06397533416748,
+ "learning_rate": 1.8739940939410102e-05,
+ "loss": 0.8961,
+ "step": 6851
+ },
+ {
+ "epoch": 18.670299727520437,
+ "grad_norm": 8.416884422302246,
+ "learning_rate": 1.8739512068985052e-05,
+ "loss": 0.9575,
+ "step": 6852
+ },
+ {
+ "epoch": 18.673024523160763,
+ "grad_norm": 9.632649421691895,
+ "learning_rate": 1.8739083130496957e-05,
+ "loss": 0.9338,
+ "step": 6853
+ },
+ {
+ "epoch": 18.67574931880109,
+ "grad_norm": 7.96435546875,
+ "learning_rate": 1.8738654123949165e-05,
+ "loss": 0.9298,
+ "step": 6854
+ },
+ {
+ "epoch": 18.678474114441418,
+ "grad_norm": 9.763521194458008,
+ "learning_rate": 1.8738225049345017e-05,
+ "loss": 0.7675,
+ "step": 6855
+ },
+ {
+ "epoch": 18.681198910081743,
+ "grad_norm": 7.3949384689331055,
+ "learning_rate": 1.873779590668785e-05,
+ "loss": 0.7509,
+ "step": 6856
+ },
+ {
+ "epoch": 18.68392370572207,
+ "grad_norm": 7.49371862411499,
+ "learning_rate": 1.873736669598101e-05,
+ "loss": 0.7791,
+ "step": 6857
+ },
+ {
+ "epoch": 18.6866485013624,
+ "grad_norm": 8.469500541687012,
+ "learning_rate": 1.8736937417227845e-05,
+ "loss": 1.0149,
+ "step": 6858
+ },
+ {
+ "epoch": 18.689373297002724,
+ "grad_norm": 6.933372497558594,
+ "learning_rate": 1.873650807043169e-05,
+ "loss": 0.7024,
+ "step": 6859
+ },
+ {
+ "epoch": 18.69209809264305,
+ "grad_norm": 7.969101428985596,
+ "learning_rate": 1.873607865559589e-05,
+ "loss": 1.2202,
+ "step": 6860
+ },
+ {
+ "epoch": 18.69482288828338,
+ "grad_norm": 8.198660850524902,
+ "learning_rate": 1.8735649172723792e-05,
+ "loss": 0.8574,
+ "step": 6861
+ },
+ {
+ "epoch": 18.697547683923705,
+ "grad_norm": 8.389801025390625,
+ "learning_rate": 1.8735219621818737e-05,
+ "loss": 0.807,
+ "step": 6862
+ },
+ {
+ "epoch": 18.70027247956403,
+ "grad_norm": 7.781229019165039,
+ "learning_rate": 1.8734790002884074e-05,
+ "loss": 0.7609,
+ "step": 6863
+ },
+ {
+ "epoch": 18.70299727520436,
+ "grad_norm": 8.59720516204834,
+ "learning_rate": 1.8734360315923146e-05,
+ "loss": 0.8466,
+ "step": 6864
+ },
+ {
+ "epoch": 18.705722070844686,
+ "grad_norm": 16.442710876464844,
+ "learning_rate": 1.8733930560939305e-05,
+ "loss": 0.9008,
+ "step": 6865
+ },
+ {
+ "epoch": 18.708446866485012,
+ "grad_norm": 9.491679191589355,
+ "learning_rate": 1.873350073793589e-05,
+ "loss": 0.9946,
+ "step": 6866
+ },
+ {
+ "epoch": 18.71117166212534,
+ "grad_norm": 7.669342994689941,
+ "learning_rate": 1.8733070846916253e-05,
+ "loss": 0.8419,
+ "step": 6867
+ },
+ {
+ "epoch": 18.713896457765667,
+ "grad_norm": 7.897876262664795,
+ "learning_rate": 1.8732640887883744e-05,
+ "loss": 0.8983,
+ "step": 6868
+ },
+ {
+ "epoch": 18.716621253405993,
+ "grad_norm": 7.866222381591797,
+ "learning_rate": 1.8732210860841706e-05,
+ "loss": 0.882,
+ "step": 6869
+ },
+ {
+ "epoch": 18.719346049046322,
+ "grad_norm": 7.729693412780762,
+ "learning_rate": 1.8731780765793493e-05,
+ "loss": 0.9286,
+ "step": 6870
+ },
+ {
+ "epoch": 18.722070844686648,
+ "grad_norm": 6.747142314910889,
+ "learning_rate": 1.8731350602742453e-05,
+ "loss": 0.975,
+ "step": 6871
+ },
+ {
+ "epoch": 18.724795640326974,
+ "grad_norm": 7.245094299316406,
+ "learning_rate": 1.8730920371691934e-05,
+ "loss": 0.9503,
+ "step": 6872
+ },
+ {
+ "epoch": 18.727520435967303,
+ "grad_norm": 9.75373649597168,
+ "learning_rate": 1.8730490072645285e-05,
+ "loss": 0.8794,
+ "step": 6873
+ },
+ {
+ "epoch": 18.73024523160763,
+ "grad_norm": 8.557443618774414,
+ "learning_rate": 1.8730059705605862e-05,
+ "loss": 0.7939,
+ "step": 6874
+ },
+ {
+ "epoch": 18.732970027247955,
+ "grad_norm": 8.528529167175293,
+ "learning_rate": 1.8729629270577018e-05,
+ "loss": 0.8118,
+ "step": 6875
+ },
+ {
+ "epoch": 18.735694822888284,
+ "grad_norm": 8.50214958190918,
+ "learning_rate": 1.8729198767562102e-05,
+ "loss": 0.8206,
+ "step": 6876
+ },
+ {
+ "epoch": 18.73841961852861,
+ "grad_norm": 7.377909183502197,
+ "learning_rate": 1.8728768196564467e-05,
+ "loss": 0.724,
+ "step": 6877
+ },
+ {
+ "epoch": 18.741144414168936,
+ "grad_norm": 9.095946311950684,
+ "learning_rate": 1.8728337557587464e-05,
+ "loss": 0.89,
+ "step": 6878
+ },
+ {
+ "epoch": 18.743869209809265,
+ "grad_norm": 6.619362831115723,
+ "learning_rate": 1.872790685063445e-05,
+ "loss": 0.8712,
+ "step": 6879
+ },
+ {
+ "epoch": 18.74659400544959,
+ "grad_norm": 8.90834903717041,
+ "learning_rate": 1.8727476075708778e-05,
+ "loss": 0.9437,
+ "step": 6880
+ },
+ {
+ "epoch": 18.749318801089917,
+ "grad_norm": 7.974592685699463,
+ "learning_rate": 1.8727045232813804e-05,
+ "loss": 0.7578,
+ "step": 6881
+ },
+ {
+ "epoch": 18.752043596730246,
+ "grad_norm": 15.871769905090332,
+ "learning_rate": 1.872661432195288e-05,
+ "loss": 0.8325,
+ "step": 6882
+ },
+ {
+ "epoch": 18.754768392370572,
+ "grad_norm": 7.1992692947387695,
+ "learning_rate": 1.8726183343129368e-05,
+ "loss": 0.9443,
+ "step": 6883
+ },
+ {
+ "epoch": 18.757493188010898,
+ "grad_norm": 8.193685531616211,
+ "learning_rate": 1.872575229634662e-05,
+ "loss": 1.0295,
+ "step": 6884
+ },
+ {
+ "epoch": 18.760217983651227,
+ "grad_norm": 7.6046342849731445,
+ "learning_rate": 1.8725321181607993e-05,
+ "loss": 0.8723,
+ "step": 6885
+ },
+ {
+ "epoch": 18.762942779291553,
+ "grad_norm": 9.461565017700195,
+ "learning_rate": 1.8724889998916845e-05,
+ "loss": 1.074,
+ "step": 6886
+ },
+ {
+ "epoch": 18.76566757493188,
+ "grad_norm": 9.257078170776367,
+ "learning_rate": 1.8724458748276534e-05,
+ "loss": 0.9036,
+ "step": 6887
+ },
+ {
+ "epoch": 18.768392370572208,
+ "grad_norm": 8.74255657196045,
+ "learning_rate": 1.8724027429690422e-05,
+ "loss": 0.7805,
+ "step": 6888
+ },
+ {
+ "epoch": 18.771117166212534,
+ "grad_norm": 8.370862007141113,
+ "learning_rate": 1.8723596043161865e-05,
+ "loss": 0.7791,
+ "step": 6889
+ },
+ {
+ "epoch": 18.77384196185286,
+ "grad_norm": 11.671736717224121,
+ "learning_rate": 1.872316458869422e-05,
+ "loss": 0.8114,
+ "step": 6890
+ },
+ {
+ "epoch": 18.77656675749319,
+ "grad_norm": 7.444977283477783,
+ "learning_rate": 1.872273306629085e-05,
+ "loss": 0.9426,
+ "step": 6891
+ },
+ {
+ "epoch": 18.779291553133515,
+ "grad_norm": 8.131038665771484,
+ "learning_rate": 1.872230147595512e-05,
+ "loss": 0.8264,
+ "step": 6892
+ },
+ {
+ "epoch": 18.78201634877384,
+ "grad_norm": 13.566511154174805,
+ "learning_rate": 1.872186981769038e-05,
+ "loss": 0.7626,
+ "step": 6893
+ },
+ {
+ "epoch": 18.78474114441417,
+ "grad_norm": 8.058342933654785,
+ "learning_rate": 1.8721438091500003e-05,
+ "loss": 0.9114,
+ "step": 6894
+ },
+ {
+ "epoch": 18.787465940054496,
+ "grad_norm": 7.539575099945068,
+ "learning_rate": 1.8721006297387348e-05,
+ "loss": 1.0406,
+ "step": 6895
+ },
+ {
+ "epoch": 18.79019073569482,
+ "grad_norm": 9.61542797088623,
+ "learning_rate": 1.8720574435355776e-05,
+ "loss": 0.8738,
+ "step": 6896
+ },
+ {
+ "epoch": 18.79291553133515,
+ "grad_norm": 7.583422660827637,
+ "learning_rate": 1.8720142505408648e-05,
+ "loss": 0.9052,
+ "step": 6897
+ },
+ {
+ "epoch": 18.795640326975477,
+ "grad_norm": 7.3413472175598145,
+ "learning_rate": 1.8719710507549332e-05,
+ "loss": 0.8181,
+ "step": 6898
+ },
+ {
+ "epoch": 18.798365122615802,
+ "grad_norm": 8.460395812988281,
+ "learning_rate": 1.8719278441781193e-05,
+ "loss": 0.9628,
+ "step": 6899
+ },
+ {
+ "epoch": 18.80108991825613,
+ "grad_norm": 8.27148151397705,
+ "learning_rate": 1.871884630810759e-05,
+ "loss": 0.8704,
+ "step": 6900
+ },
+ {
+ "epoch": 18.803814713896458,
+ "grad_norm": 8.32595443725586,
+ "learning_rate": 1.8718414106531898e-05,
+ "loss": 0.8131,
+ "step": 6901
+ },
+ {
+ "epoch": 18.806539509536783,
+ "grad_norm": 8.904982566833496,
+ "learning_rate": 1.8717981837057475e-05,
+ "loss": 0.939,
+ "step": 6902
+ },
+ {
+ "epoch": 18.809264305177113,
+ "grad_norm": 7.2709221839904785,
+ "learning_rate": 1.871754949968769e-05,
+ "loss": 0.8385,
+ "step": 6903
+ },
+ {
+ "epoch": 18.81198910081744,
+ "grad_norm": 8.22236442565918,
+ "learning_rate": 1.871711709442591e-05,
+ "loss": 0.814,
+ "step": 6904
+ },
+ {
+ "epoch": 18.814713896457764,
+ "grad_norm": 8.144975662231445,
+ "learning_rate": 1.87166846212755e-05,
+ "loss": 0.9263,
+ "step": 6905
+ },
+ {
+ "epoch": 18.817438692098094,
+ "grad_norm": 10.323326110839844,
+ "learning_rate": 1.8716252080239835e-05,
+ "loss": 0.8673,
+ "step": 6906
+ },
+ {
+ "epoch": 18.82016348773842,
+ "grad_norm": 10.343846321105957,
+ "learning_rate": 1.8715819471322278e-05,
+ "loss": 1.0734,
+ "step": 6907
+ },
+ {
+ "epoch": 18.822888283378745,
+ "grad_norm": 13.378046989440918,
+ "learning_rate": 1.87153867945262e-05,
+ "loss": 0.9152,
+ "step": 6908
+ },
+ {
+ "epoch": 18.825613079019075,
+ "grad_norm": 8.570001602172852,
+ "learning_rate": 1.871495404985497e-05,
+ "loss": 0.8552,
+ "step": 6909
+ },
+ {
+ "epoch": 18.8283378746594,
+ "grad_norm": 8.434952735900879,
+ "learning_rate": 1.8714521237311956e-05,
+ "loss": 0.8588,
+ "step": 6910
+ },
+ {
+ "epoch": 18.831062670299726,
+ "grad_norm": 6.612369060516357,
+ "learning_rate": 1.8714088356900536e-05,
+ "loss": 1.0029,
+ "step": 6911
+ },
+ {
+ "epoch": 18.833787465940055,
+ "grad_norm": 12.763958930969238,
+ "learning_rate": 1.8713655408624073e-05,
+ "loss": 0.8953,
+ "step": 6912
+ },
+ {
+ "epoch": 18.83651226158038,
+ "grad_norm": 11.677885055541992,
+ "learning_rate": 1.8713222392485943e-05,
+ "loss": 0.751,
+ "step": 6913
+ },
+ {
+ "epoch": 18.839237057220707,
+ "grad_norm": 8.051769256591797,
+ "learning_rate": 1.8712789308489516e-05,
+ "loss": 0.9045,
+ "step": 6914
+ },
+ {
+ "epoch": 18.841961852861036,
+ "grad_norm": 10.129505157470703,
+ "learning_rate": 1.8712356156638164e-05,
+ "loss": 0.9486,
+ "step": 6915
+ },
+ {
+ "epoch": 18.844686648501362,
+ "grad_norm": 7.85394287109375,
+ "learning_rate": 1.871192293693527e-05,
+ "loss": 0.9458,
+ "step": 6916
+ },
+ {
+ "epoch": 18.847411444141688,
+ "grad_norm": 11.273139953613281,
+ "learning_rate": 1.8711489649384194e-05,
+ "loss": 0.8696,
+ "step": 6917
+ },
+ {
+ "epoch": 18.850136239782017,
+ "grad_norm": 8.475065231323242,
+ "learning_rate": 1.8711056293988318e-05,
+ "loss": 0.9227,
+ "step": 6918
+ },
+ {
+ "epoch": 18.852861035422343,
+ "grad_norm": 8.927240371704102,
+ "learning_rate": 1.871062287075102e-05,
+ "loss": 0.7208,
+ "step": 6919
+ },
+ {
+ "epoch": 18.85558583106267,
+ "grad_norm": 10.094076156616211,
+ "learning_rate": 1.8710189379675667e-05,
+ "loss": 0.9561,
+ "step": 6920
+ },
+ {
+ "epoch": 18.858310626703,
+ "grad_norm": 8.230749130249023,
+ "learning_rate": 1.870975582076564e-05,
+ "loss": 0.9272,
+ "step": 6921
+ },
+ {
+ "epoch": 18.861035422343324,
+ "grad_norm": 8.077170372009277,
+ "learning_rate": 1.870932219402432e-05,
+ "loss": 0.947,
+ "step": 6922
+ },
+ {
+ "epoch": 18.86376021798365,
+ "grad_norm": 9.002728462219238,
+ "learning_rate": 1.8708888499455075e-05,
+ "loss": 0.8989,
+ "step": 6923
+ },
+ {
+ "epoch": 18.86648501362398,
+ "grad_norm": 8.719640731811523,
+ "learning_rate": 1.8708454737061284e-05,
+ "loss": 0.8878,
+ "step": 6924
+ },
+ {
+ "epoch": 18.869209809264305,
+ "grad_norm": 8.23000431060791,
+ "learning_rate": 1.870802090684633e-05,
+ "loss": 0.7559,
+ "step": 6925
+ },
+ {
+ "epoch": 18.87193460490463,
+ "grad_norm": 7.957650184631348,
+ "learning_rate": 1.8707587008813593e-05,
+ "loss": 0.8157,
+ "step": 6926
+ },
+ {
+ "epoch": 18.87465940054496,
+ "grad_norm": 9.691078186035156,
+ "learning_rate": 1.8707153042966445e-05,
+ "loss": 0.9717,
+ "step": 6927
+ },
+ {
+ "epoch": 18.877384196185286,
+ "grad_norm": 7.17464017868042,
+ "learning_rate": 1.870671900930827e-05,
+ "loss": 0.989,
+ "step": 6928
+ },
+ {
+ "epoch": 18.88010899182561,
+ "grad_norm": 8.259840965270996,
+ "learning_rate": 1.8706284907842446e-05,
+ "loss": 0.9609,
+ "step": 6929
+ },
+ {
+ "epoch": 18.88283378746594,
+ "grad_norm": 7.825801372528076,
+ "learning_rate": 1.8705850738572357e-05,
+ "loss": 0.7622,
+ "step": 6930
+ },
+ {
+ "epoch": 18.885558583106267,
+ "grad_norm": 9.720499038696289,
+ "learning_rate": 1.8705416501501383e-05,
+ "loss": 0.7961,
+ "step": 6931
+ },
+ {
+ "epoch": 18.888283378746593,
+ "grad_norm": 8.514625549316406,
+ "learning_rate": 1.8704982196632904e-05,
+ "loss": 0.7432,
+ "step": 6932
+ },
+ {
+ "epoch": 18.891008174386922,
+ "grad_norm": 9.289460182189941,
+ "learning_rate": 1.8704547823970306e-05,
+ "loss": 0.8408,
+ "step": 6933
+ },
+ {
+ "epoch": 18.893732970027248,
+ "grad_norm": 10.373196601867676,
+ "learning_rate": 1.8704113383516967e-05,
+ "loss": 0.9124,
+ "step": 6934
+ },
+ {
+ "epoch": 18.896457765667574,
+ "grad_norm": 9.915992736816406,
+ "learning_rate": 1.8703678875276277e-05,
+ "loss": 0.8114,
+ "step": 6935
+ },
+ {
+ "epoch": 18.899182561307903,
+ "grad_norm": 8.494244575500488,
+ "learning_rate": 1.8703244299251612e-05,
+ "loss": 0.9077,
+ "step": 6936
+ },
+ {
+ "epoch": 18.90190735694823,
+ "grad_norm": 8.14223575592041,
+ "learning_rate": 1.8702809655446364e-05,
+ "loss": 1.0366,
+ "step": 6937
+ },
+ {
+ "epoch": 18.904632152588555,
+ "grad_norm": 9.234797477722168,
+ "learning_rate": 1.8702374943863912e-05,
+ "loss": 0.825,
+ "step": 6938
+ },
+ {
+ "epoch": 18.907356948228884,
+ "grad_norm": 10.01010513305664,
+ "learning_rate": 1.8701940164507646e-05,
+ "loss": 1.0437,
+ "step": 6939
+ },
+ {
+ "epoch": 18.91008174386921,
+ "grad_norm": 8.667445182800293,
+ "learning_rate": 1.870150531738095e-05,
+ "loss": 0.9082,
+ "step": 6940
+ },
+ {
+ "epoch": 18.912806539509535,
+ "grad_norm": 8.761026382446289,
+ "learning_rate": 1.8701070402487208e-05,
+ "loss": 0.8855,
+ "step": 6941
+ },
+ {
+ "epoch": 18.915531335149865,
+ "grad_norm": 9.522194862365723,
+ "learning_rate": 1.8700635419829808e-05,
+ "loss": 1.02,
+ "step": 6942
+ },
+ {
+ "epoch": 18.91825613079019,
+ "grad_norm": 9.89741325378418,
+ "learning_rate": 1.8700200369412143e-05,
+ "loss": 1.1108,
+ "step": 6943
+ },
+ {
+ "epoch": 18.920980926430516,
+ "grad_norm": 7.780826568603516,
+ "learning_rate": 1.86997652512376e-05,
+ "loss": 0.8074,
+ "step": 6944
+ },
+ {
+ "epoch": 18.923705722070846,
+ "grad_norm": 6.950511455535889,
+ "learning_rate": 1.869933006530956e-05,
+ "loss": 0.8043,
+ "step": 6945
+ },
+ {
+ "epoch": 18.92643051771117,
+ "grad_norm": 7.270721912384033,
+ "learning_rate": 1.869889481163142e-05,
+ "loss": 0.8287,
+ "step": 6946
+ },
+ {
+ "epoch": 18.929155313351497,
+ "grad_norm": 9.197299003601074,
+ "learning_rate": 1.8698459490206568e-05,
+ "loss": 0.8691,
+ "step": 6947
+ },
+ {
+ "epoch": 18.931880108991827,
+ "grad_norm": 7.520884037017822,
+ "learning_rate": 1.8698024101038395e-05,
+ "loss": 0.7726,
+ "step": 6948
+ },
+ {
+ "epoch": 18.934604904632153,
+ "grad_norm": 8.074854850769043,
+ "learning_rate": 1.8697588644130283e-05,
+ "loss": 0.8833,
+ "step": 6949
+ },
+ {
+ "epoch": 18.93732970027248,
+ "grad_norm": 11.02020263671875,
+ "learning_rate": 1.8697153119485638e-05,
+ "loss": 1.0754,
+ "step": 6950
+ },
+ {
+ "epoch": 18.940054495912808,
+ "grad_norm": 10.82308578491211,
+ "learning_rate": 1.869671752710784e-05,
+ "loss": 1.0528,
+ "step": 6951
+ },
+ {
+ "epoch": 18.942779291553133,
+ "grad_norm": 8.439906120300293,
+ "learning_rate": 1.869628186700029e-05,
+ "loss": 0.812,
+ "step": 6952
+ },
+ {
+ "epoch": 18.94550408719346,
+ "grad_norm": 9.263603210449219,
+ "learning_rate": 1.8695846139166372e-05,
+ "loss": 0.9401,
+ "step": 6953
+ },
+ {
+ "epoch": 18.94822888283379,
+ "grad_norm": 8.745004653930664,
+ "learning_rate": 1.8695410343609487e-05,
+ "loss": 0.8589,
+ "step": 6954
+ },
+ {
+ "epoch": 18.950953678474114,
+ "grad_norm": 8.685702323913574,
+ "learning_rate": 1.8694974480333027e-05,
+ "loss": 0.8623,
+ "step": 6955
+ },
+ {
+ "epoch": 18.95367847411444,
+ "grad_norm": 8.876229286193848,
+ "learning_rate": 1.8694538549340385e-05,
+ "loss": 0.6804,
+ "step": 6956
+ },
+ {
+ "epoch": 18.95640326975477,
+ "grad_norm": 10.44974136352539,
+ "learning_rate": 1.8694102550634953e-05,
+ "loss": 0.9973,
+ "step": 6957
+ },
+ {
+ "epoch": 18.959128065395095,
+ "grad_norm": 9.667427062988281,
+ "learning_rate": 1.8693666484220134e-05,
+ "loss": 1.0387,
+ "step": 6958
+ },
+ {
+ "epoch": 18.96185286103542,
+ "grad_norm": 7.096478462219238,
+ "learning_rate": 1.8693230350099318e-05,
+ "loss": 0.7067,
+ "step": 6959
+ },
+ {
+ "epoch": 18.96457765667575,
+ "grad_norm": 7.511812686920166,
+ "learning_rate": 1.8692794148275904e-05,
+ "loss": 0.7866,
+ "step": 6960
+ },
+ {
+ "epoch": 18.967302452316076,
+ "grad_norm": 10.978753089904785,
+ "learning_rate": 1.869235787875329e-05,
+ "loss": 0.761,
+ "step": 6961
+ },
+ {
+ "epoch": 18.970027247956402,
+ "grad_norm": 7.78998327255249,
+ "learning_rate": 1.8691921541534876e-05,
+ "loss": 0.8462,
+ "step": 6962
+ },
+ {
+ "epoch": 18.97275204359673,
+ "grad_norm": 7.815904140472412,
+ "learning_rate": 1.869148513662405e-05,
+ "loss": 0.9651,
+ "step": 6963
+ },
+ {
+ "epoch": 18.975476839237057,
+ "grad_norm": 8.173052787780762,
+ "learning_rate": 1.869104866402422e-05,
+ "loss": 0.85,
+ "step": 6964
+ },
+ {
+ "epoch": 18.978201634877383,
+ "grad_norm": 10.576380729675293,
+ "learning_rate": 1.8690612123738784e-05,
+ "loss": 0.9049,
+ "step": 6965
+ },
+ {
+ "epoch": 18.980926430517712,
+ "grad_norm": 8.267260551452637,
+ "learning_rate": 1.869017551577114e-05,
+ "loss": 0.8013,
+ "step": 6966
+ },
+ {
+ "epoch": 18.983651226158038,
+ "grad_norm": 7.477278709411621,
+ "learning_rate": 1.8689738840124688e-05,
+ "loss": 0.7417,
+ "step": 6967
+ },
+ {
+ "epoch": 18.986376021798364,
+ "grad_norm": 10.80232048034668,
+ "learning_rate": 1.868930209680283e-05,
+ "loss": 0.7968,
+ "step": 6968
+ },
+ {
+ "epoch": 18.989100817438693,
+ "grad_norm": 9.751068115234375,
+ "learning_rate": 1.8688865285808968e-05,
+ "loss": 1.0911,
+ "step": 6969
+ },
+ {
+ "epoch": 18.99182561307902,
+ "grad_norm": 8.407898902893066,
+ "learning_rate": 1.8688428407146504e-05,
+ "loss": 0.8999,
+ "step": 6970
+ },
+ {
+ "epoch": 18.994550408719345,
+ "grad_norm": 9.125184059143066,
+ "learning_rate": 1.8687991460818836e-05,
+ "loss": 0.7819,
+ "step": 6971
+ },
+ {
+ "epoch": 18.997275204359674,
+ "grad_norm": 10.857903480529785,
+ "learning_rate": 1.868755444682937e-05,
+ "loss": 0.8312,
+ "step": 6972
+ },
+ {
+ "epoch": 19.0,
+ "grad_norm": 7.471215724945068,
+ "learning_rate": 1.8687117365181514e-05,
+ "loss": 0.8665,
+ "step": 6973
+ },
+ {
+ "epoch": 19.002724795640326,
+ "grad_norm": 7.7133469581604,
+ "learning_rate": 1.8686680215878663e-05,
+ "loss": 0.8215,
+ "step": 6974
+ },
+ {
+ "epoch": 19.005449591280655,
+ "grad_norm": 8.016887664794922,
+ "learning_rate": 1.8686242998924226e-05,
+ "loss": 0.7863,
+ "step": 6975
+ },
+ {
+ "epoch": 19.00817438692098,
+ "grad_norm": 9.045573234558105,
+ "learning_rate": 1.868580571432161e-05,
+ "loss": 0.9286,
+ "step": 6976
+ },
+ {
+ "epoch": 19.010899182561307,
+ "grad_norm": 8.61864185333252,
+ "learning_rate": 1.868536836207422e-05,
+ "loss": 0.9485,
+ "step": 6977
+ },
+ {
+ "epoch": 19.013623978201636,
+ "grad_norm": 9.215364456176758,
+ "learning_rate": 1.8684930942185457e-05,
+ "loss": 0.8007,
+ "step": 6978
+ },
+ {
+ "epoch": 19.016348773841962,
+ "grad_norm": 9.163359642028809,
+ "learning_rate": 1.8684493454658736e-05,
+ "loss": 0.795,
+ "step": 6979
+ },
+ {
+ "epoch": 19.019073569482288,
+ "grad_norm": 6.857732772827148,
+ "learning_rate": 1.8684055899497456e-05,
+ "loss": 0.65,
+ "step": 6980
+ },
+ {
+ "epoch": 19.021798365122617,
+ "grad_norm": 9.368291854858398,
+ "learning_rate": 1.8683618276705028e-05,
+ "loss": 0.8838,
+ "step": 6981
+ },
+ {
+ "epoch": 19.024523160762943,
+ "grad_norm": 8.756336212158203,
+ "learning_rate": 1.8683180586284862e-05,
+ "loss": 0.8461,
+ "step": 6982
+ },
+ {
+ "epoch": 19.02724795640327,
+ "grad_norm": 6.407591342926025,
+ "learning_rate": 1.8682742828240364e-05,
+ "loss": 0.855,
+ "step": 6983
+ },
+ {
+ "epoch": 19.029972752043598,
+ "grad_norm": 6.976788520812988,
+ "learning_rate": 1.8682305002574942e-05,
+ "loss": 0.9747,
+ "step": 6984
+ },
+ {
+ "epoch": 19.032697547683924,
+ "grad_norm": 11.912771224975586,
+ "learning_rate": 1.8681867109292012e-05,
+ "loss": 0.7258,
+ "step": 6985
+ },
+ {
+ "epoch": 19.03542234332425,
+ "grad_norm": 10.014404296875,
+ "learning_rate": 1.868142914839498e-05,
+ "loss": 0.8751,
+ "step": 6986
+ },
+ {
+ "epoch": 19.03814713896458,
+ "grad_norm": 10.036844253540039,
+ "learning_rate": 1.8680991119887256e-05,
+ "loss": 0.8563,
+ "step": 6987
+ },
+ {
+ "epoch": 19.040871934604905,
+ "grad_norm": 7.314995288848877,
+ "learning_rate": 1.868055302377225e-05,
+ "loss": 0.8879,
+ "step": 6988
+ },
+ {
+ "epoch": 19.04359673024523,
+ "grad_norm": 11.716142654418945,
+ "learning_rate": 1.8680114860053384e-05,
+ "loss": 0.7828,
+ "step": 6989
+ },
+ {
+ "epoch": 19.04632152588556,
+ "grad_norm": 7.671077251434326,
+ "learning_rate": 1.867967662873406e-05,
+ "loss": 0.8896,
+ "step": 6990
+ },
+ {
+ "epoch": 19.049046321525886,
+ "grad_norm": 7.949674129486084,
+ "learning_rate": 1.867923832981769e-05,
+ "loss": 0.8278,
+ "step": 6991
+ },
+ {
+ "epoch": 19.05177111716621,
+ "grad_norm": 9.292261123657227,
+ "learning_rate": 1.8678799963307693e-05,
+ "loss": 0.7715,
+ "step": 6992
+ },
+ {
+ "epoch": 19.05449591280654,
+ "grad_norm": 12.970134735107422,
+ "learning_rate": 1.867836152920748e-05,
+ "loss": 0.7914,
+ "step": 6993
+ },
+ {
+ "epoch": 19.057220708446867,
+ "grad_norm": 7.971855640411377,
+ "learning_rate": 1.867792302752047e-05,
+ "loss": 0.844,
+ "step": 6994
+ },
+ {
+ "epoch": 19.059945504087192,
+ "grad_norm": 9.02824878692627,
+ "learning_rate": 1.867748445825007e-05,
+ "loss": 0.6703,
+ "step": 6995
+ },
+ {
+ "epoch": 19.06267029972752,
+ "grad_norm": 7.739848613739014,
+ "learning_rate": 1.8677045821399705e-05,
+ "loss": 0.7098,
+ "step": 6996
+ },
+ {
+ "epoch": 19.065395095367847,
+ "grad_norm": 7.71321439743042,
+ "learning_rate": 1.8676607116972786e-05,
+ "loss": 0.871,
+ "step": 6997
+ },
+ {
+ "epoch": 19.068119891008173,
+ "grad_norm": 9.267059326171875,
+ "learning_rate": 1.8676168344972726e-05,
+ "loss": 0.8959,
+ "step": 6998
+ },
+ {
+ "epoch": 19.070844686648503,
+ "grad_norm": 7.251643180847168,
+ "learning_rate": 1.867572950540295e-05,
+ "loss": 0.8425,
+ "step": 6999
+ },
+ {
+ "epoch": 19.07356948228883,
+ "grad_norm": 8.379535675048828,
+ "learning_rate": 1.8675290598266872e-05,
+ "loss": 0.7917,
+ "step": 7000
+ },
+ {
+ "epoch": 19.076294277929154,
+ "grad_norm": 10.302045822143555,
+ "learning_rate": 1.8674851623567908e-05,
+ "loss": 0.879,
+ "step": 7001
+ },
+ {
+ "epoch": 19.079019073569484,
+ "grad_norm": 10.175151824951172,
+ "learning_rate": 1.8674412581309477e-05,
+ "loss": 0.9104,
+ "step": 7002
+ },
+ {
+ "epoch": 19.08174386920981,
+ "grad_norm": 8.297521591186523,
+ "learning_rate": 1.8673973471495005e-05,
+ "loss": 0.7986,
+ "step": 7003
+ },
+ {
+ "epoch": 19.084468664850135,
+ "grad_norm": 11.142738342285156,
+ "learning_rate": 1.8673534294127905e-05,
+ "loss": 0.9346,
+ "step": 7004
+ },
+ {
+ "epoch": 19.087193460490465,
+ "grad_norm": 7.376419544219971,
+ "learning_rate": 1.8673095049211597e-05,
+ "loss": 0.6486,
+ "step": 7005
+ },
+ {
+ "epoch": 19.08991825613079,
+ "grad_norm": 7.580418586730957,
+ "learning_rate": 1.8672655736749507e-05,
+ "loss": 0.918,
+ "step": 7006
+ },
+ {
+ "epoch": 19.092643051771116,
+ "grad_norm": 8.258780479431152,
+ "learning_rate": 1.867221635674505e-05,
+ "loss": 0.8269,
+ "step": 7007
+ },
+ {
+ "epoch": 19.095367847411445,
+ "grad_norm": 12.455347061157227,
+ "learning_rate": 1.867177690920165e-05,
+ "loss": 0.9009,
+ "step": 7008
+ },
+ {
+ "epoch": 19.09809264305177,
+ "grad_norm": 6.943690776824951,
+ "learning_rate": 1.8671337394122733e-05,
+ "loss": 0.6227,
+ "step": 7009
+ },
+ {
+ "epoch": 19.100817438692097,
+ "grad_norm": 8.154997825622559,
+ "learning_rate": 1.867089781151172e-05,
+ "loss": 0.7135,
+ "step": 7010
+ },
+ {
+ "epoch": 19.103542234332426,
+ "grad_norm": 7.797388553619385,
+ "learning_rate": 1.8670458161372033e-05,
+ "loss": 0.89,
+ "step": 7011
+ },
+ {
+ "epoch": 19.106267029972752,
+ "grad_norm": 10.197694778442383,
+ "learning_rate": 1.8670018443707098e-05,
+ "loss": 0.8024,
+ "step": 7012
+ },
+ {
+ "epoch": 19.108991825613078,
+ "grad_norm": 7.500790596008301,
+ "learning_rate": 1.866957865852034e-05,
+ "loss": 0.7478,
+ "step": 7013
+ },
+ {
+ "epoch": 19.111716621253407,
+ "grad_norm": 8.322009086608887,
+ "learning_rate": 1.866913880581518e-05,
+ "loss": 0.8334,
+ "step": 7014
+ },
+ {
+ "epoch": 19.114441416893733,
+ "grad_norm": 8.339186668395996,
+ "learning_rate": 1.8668698885595045e-05,
+ "loss": 0.8549,
+ "step": 7015
+ },
+ {
+ "epoch": 19.11716621253406,
+ "grad_norm": 7.383385181427002,
+ "learning_rate": 1.866825889786336e-05,
+ "loss": 0.8645,
+ "step": 7016
+ },
+ {
+ "epoch": 19.11989100817439,
+ "grad_norm": 7.881433486938477,
+ "learning_rate": 1.866781884262356e-05,
+ "loss": 0.7115,
+ "step": 7017
+ },
+ {
+ "epoch": 19.122615803814714,
+ "grad_norm": 7.964922904968262,
+ "learning_rate": 1.866737871987906e-05,
+ "loss": 0.808,
+ "step": 7018
+ },
+ {
+ "epoch": 19.12534059945504,
+ "grad_norm": 7.4784650802612305,
+ "learning_rate": 1.86669385296333e-05,
+ "loss": 0.7885,
+ "step": 7019
+ },
+ {
+ "epoch": 19.12806539509537,
+ "grad_norm": 9.835017204284668,
+ "learning_rate": 1.8666498271889698e-05,
+ "loss": 0.6842,
+ "step": 7020
+ },
+ {
+ "epoch": 19.130790190735695,
+ "grad_norm": 9.407984733581543,
+ "learning_rate": 1.8666057946651682e-05,
+ "loss": 0.6931,
+ "step": 7021
+ },
+ {
+ "epoch": 19.13351498637602,
+ "grad_norm": 9.08998966217041,
+ "learning_rate": 1.866561755392269e-05,
+ "loss": 0.8494,
+ "step": 7022
+ },
+ {
+ "epoch": 19.13623978201635,
+ "grad_norm": 8.443471908569336,
+ "learning_rate": 1.866517709370615e-05,
+ "loss": 0.6473,
+ "step": 7023
+ },
+ {
+ "epoch": 19.138964577656676,
+ "grad_norm": 10.57610034942627,
+ "learning_rate": 1.8664736566005487e-05,
+ "loss": 0.7864,
+ "step": 7024
+ },
+ {
+ "epoch": 19.141689373297,
+ "grad_norm": 8.669187545776367,
+ "learning_rate": 1.8664295970824136e-05,
+ "loss": 0.7316,
+ "step": 7025
+ },
+ {
+ "epoch": 19.14441416893733,
+ "grad_norm": 8.262614250183105,
+ "learning_rate": 1.8663855308165524e-05,
+ "loss": 0.9006,
+ "step": 7026
+ },
+ {
+ "epoch": 19.147138964577657,
+ "grad_norm": 7.1119842529296875,
+ "learning_rate": 1.8663414578033084e-05,
+ "loss": 0.8217,
+ "step": 7027
+ },
+ {
+ "epoch": 19.149863760217983,
+ "grad_norm": 10.65214729309082,
+ "learning_rate": 1.8662973780430256e-05,
+ "loss": 0.9548,
+ "step": 7028
+ },
+ {
+ "epoch": 19.152588555858312,
+ "grad_norm": 9.513092041015625,
+ "learning_rate": 1.8662532915360466e-05,
+ "loss": 0.8422,
+ "step": 7029
+ },
+ {
+ "epoch": 19.155313351498638,
+ "grad_norm": 11.064226150512695,
+ "learning_rate": 1.8662091982827142e-05,
+ "loss": 0.7493,
+ "step": 7030
+ },
+ {
+ "epoch": 19.158038147138964,
+ "grad_norm": 8.788904190063477,
+ "learning_rate": 1.8661650982833733e-05,
+ "loss": 0.6814,
+ "step": 7031
+ },
+ {
+ "epoch": 19.160762942779293,
+ "grad_norm": 8.584736824035645,
+ "learning_rate": 1.866120991538366e-05,
+ "loss": 0.8593,
+ "step": 7032
+ },
+ {
+ "epoch": 19.16348773841962,
+ "grad_norm": 10.5648832321167,
+ "learning_rate": 1.8660768780480364e-05,
+ "loss": 0.6584,
+ "step": 7033
+ },
+ {
+ "epoch": 19.166212534059945,
+ "grad_norm": 10.726306915283203,
+ "learning_rate": 1.866032757812728e-05,
+ "loss": 0.7759,
+ "step": 7034
+ },
+ {
+ "epoch": 19.168937329700274,
+ "grad_norm": 7.508849620819092,
+ "learning_rate": 1.8659886308327842e-05,
+ "loss": 0.6902,
+ "step": 7035
+ },
+ {
+ "epoch": 19.1716621253406,
+ "grad_norm": 9.58052921295166,
+ "learning_rate": 1.865944497108549e-05,
+ "loss": 0.8102,
+ "step": 7036
+ },
+ {
+ "epoch": 19.174386920980925,
+ "grad_norm": 15.089922904968262,
+ "learning_rate": 1.8659003566403658e-05,
+ "loss": 0.8425,
+ "step": 7037
+ },
+ {
+ "epoch": 19.177111716621255,
+ "grad_norm": 9.278483390808105,
+ "learning_rate": 1.8658562094285786e-05,
+ "loss": 0.7423,
+ "step": 7038
+ },
+ {
+ "epoch": 19.17983651226158,
+ "grad_norm": 7.667381763458252,
+ "learning_rate": 1.865812055473531e-05,
+ "loss": 0.7751,
+ "step": 7039
+ },
+ {
+ "epoch": 19.182561307901906,
+ "grad_norm": 8.727204322814941,
+ "learning_rate": 1.865767894775567e-05,
+ "loss": 0.9486,
+ "step": 7040
+ },
+ {
+ "epoch": 19.185286103542236,
+ "grad_norm": 8.394052505493164,
+ "learning_rate": 1.8657237273350305e-05,
+ "loss": 1.0408,
+ "step": 7041
+ },
+ {
+ "epoch": 19.18801089918256,
+ "grad_norm": 7.457240104675293,
+ "learning_rate": 1.8656795531522655e-05,
+ "loss": 0.6155,
+ "step": 7042
+ },
+ {
+ "epoch": 19.190735694822887,
+ "grad_norm": 11.908757209777832,
+ "learning_rate": 1.865635372227616e-05,
+ "loss": 0.9937,
+ "step": 7043
+ },
+ {
+ "epoch": 19.193460490463217,
+ "grad_norm": 9.040936470031738,
+ "learning_rate": 1.865591184561426e-05,
+ "loss": 0.7816,
+ "step": 7044
+ },
+ {
+ "epoch": 19.196185286103542,
+ "grad_norm": 6.818192958831787,
+ "learning_rate": 1.8655469901540398e-05,
+ "loss": 0.7806,
+ "step": 7045
+ },
+ {
+ "epoch": 19.19891008174387,
+ "grad_norm": 8.640161514282227,
+ "learning_rate": 1.8655027890058014e-05,
+ "loss": 0.7217,
+ "step": 7046
+ },
+ {
+ "epoch": 19.201634877384198,
+ "grad_norm": 9.699905395507812,
+ "learning_rate": 1.8654585811170553e-05,
+ "loss": 0.8181,
+ "step": 7047
+ },
+ {
+ "epoch": 19.204359673024523,
+ "grad_norm": 8.94979190826416,
+ "learning_rate": 1.8654143664881455e-05,
+ "loss": 0.9097,
+ "step": 7048
+ },
+ {
+ "epoch": 19.20708446866485,
+ "grad_norm": 7.599967956542969,
+ "learning_rate": 1.8653701451194166e-05,
+ "loss": 0.8625,
+ "step": 7049
+ },
+ {
+ "epoch": 19.20980926430518,
+ "grad_norm": 7.219893932342529,
+ "learning_rate": 1.8653259170112128e-05,
+ "loss": 0.8013,
+ "step": 7050
+ },
+ {
+ "epoch": 19.212534059945504,
+ "grad_norm": 9.76356029510498,
+ "learning_rate": 1.8652816821638783e-05,
+ "loss": 0.8273,
+ "step": 7051
+ },
+ {
+ "epoch": 19.21525885558583,
+ "grad_norm": 9.20617961883545,
+ "learning_rate": 1.8652374405777584e-05,
+ "loss": 0.8942,
+ "step": 7052
+ },
+ {
+ "epoch": 19.21798365122616,
+ "grad_norm": 8.287347793579102,
+ "learning_rate": 1.865193192253197e-05,
+ "loss": 0.7924,
+ "step": 7053
+ },
+ {
+ "epoch": 19.220708446866485,
+ "grad_norm": 6.710139751434326,
+ "learning_rate": 1.8651489371905386e-05,
+ "loss": 0.6537,
+ "step": 7054
+ },
+ {
+ "epoch": 19.22343324250681,
+ "grad_norm": 9.382214546203613,
+ "learning_rate": 1.8651046753901286e-05,
+ "loss": 0.8285,
+ "step": 7055
+ },
+ {
+ "epoch": 19.22615803814714,
+ "grad_norm": 7.651352882385254,
+ "learning_rate": 1.8650604068523107e-05,
+ "loss": 0.8624,
+ "step": 7056
+ },
+ {
+ "epoch": 19.228882833787466,
+ "grad_norm": 7.876631736755371,
+ "learning_rate": 1.8650161315774306e-05,
+ "loss": 0.8689,
+ "step": 7057
+ },
+ {
+ "epoch": 19.231607629427792,
+ "grad_norm": 8.066032409667969,
+ "learning_rate": 1.8649718495658325e-05,
+ "loss": 0.9088,
+ "step": 7058
+ },
+ {
+ "epoch": 19.23433242506812,
+ "grad_norm": 8.066088676452637,
+ "learning_rate": 1.8649275608178617e-05,
+ "loss": 0.8839,
+ "step": 7059
+ },
+ {
+ "epoch": 19.237057220708447,
+ "grad_norm": 7.8374481201171875,
+ "learning_rate": 1.8648832653338628e-05,
+ "loss": 0.9174,
+ "step": 7060
+ },
+ {
+ "epoch": 19.239782016348773,
+ "grad_norm": 9.005922317504883,
+ "learning_rate": 1.864838963114181e-05,
+ "loss": 0.7836,
+ "step": 7061
+ },
+ {
+ "epoch": 19.242506811989102,
+ "grad_norm": 8.517781257629395,
+ "learning_rate": 1.8647946541591607e-05,
+ "loss": 0.9065,
+ "step": 7062
+ },
+ {
+ "epoch": 19.245231607629428,
+ "grad_norm": 7.555675506591797,
+ "learning_rate": 1.8647503384691477e-05,
+ "loss": 0.6729,
+ "step": 7063
+ },
+ {
+ "epoch": 19.247956403269754,
+ "grad_norm": 10.002867698669434,
+ "learning_rate": 1.864706016044487e-05,
+ "loss": 0.8395,
+ "step": 7064
+ },
+ {
+ "epoch": 19.250681198910083,
+ "grad_norm": 8.23402214050293,
+ "learning_rate": 1.8646616868855236e-05,
+ "loss": 0.7773,
+ "step": 7065
+ },
+ {
+ "epoch": 19.25340599455041,
+ "grad_norm": 7.119266510009766,
+ "learning_rate": 1.864617350992603e-05,
+ "loss": 0.7239,
+ "step": 7066
+ },
+ {
+ "epoch": 19.256130790190735,
+ "grad_norm": 10.741050720214844,
+ "learning_rate": 1.86457300836607e-05,
+ "loss": 0.7881,
+ "step": 7067
+ },
+ {
+ "epoch": 19.258855585831064,
+ "grad_norm": 8.45600414276123,
+ "learning_rate": 1.8645286590062705e-05,
+ "loss": 0.6841,
+ "step": 7068
+ },
+ {
+ "epoch": 19.26158038147139,
+ "grad_norm": 8.414836883544922,
+ "learning_rate": 1.8644843029135496e-05,
+ "loss": 0.7979,
+ "step": 7069
+ },
+ {
+ "epoch": 19.264305177111716,
+ "grad_norm": 9.2487154006958,
+ "learning_rate": 1.8644399400882525e-05,
+ "loss": 0.7239,
+ "step": 7070
+ },
+ {
+ "epoch": 19.267029972752045,
+ "grad_norm": 9.046351432800293,
+ "learning_rate": 1.8643955705307252e-05,
+ "loss": 0.7223,
+ "step": 7071
+ },
+ {
+ "epoch": 19.26975476839237,
+ "grad_norm": 12.175895690917969,
+ "learning_rate": 1.864351194241313e-05,
+ "loss": 0.9025,
+ "step": 7072
+ },
+ {
+ "epoch": 19.272479564032697,
+ "grad_norm": 8.9979248046875,
+ "learning_rate": 1.8643068112203612e-05,
+ "loss": 0.8207,
+ "step": 7073
+ },
+ {
+ "epoch": 19.275204359673026,
+ "grad_norm": 13.657709121704102,
+ "learning_rate": 1.864262421468216e-05,
+ "loss": 0.8423,
+ "step": 7074
+ },
+ {
+ "epoch": 19.277929155313352,
+ "grad_norm": 14.252540588378906,
+ "learning_rate": 1.864218024985223e-05,
+ "loss": 0.8728,
+ "step": 7075
+ },
+ {
+ "epoch": 19.280653950953678,
+ "grad_norm": 11.971515655517578,
+ "learning_rate": 1.864173621771728e-05,
+ "loss": 0.7352,
+ "step": 7076
+ },
+ {
+ "epoch": 19.283378746594007,
+ "grad_norm": 9.648859024047852,
+ "learning_rate": 1.8641292118280764e-05,
+ "loss": 0.8773,
+ "step": 7077
+ },
+ {
+ "epoch": 19.286103542234333,
+ "grad_norm": 11.207634925842285,
+ "learning_rate": 1.8640847951546145e-05,
+ "loss": 0.8191,
+ "step": 7078
+ },
+ {
+ "epoch": 19.28882833787466,
+ "grad_norm": 9.115625381469727,
+ "learning_rate": 1.8640403717516877e-05,
+ "loss": 0.7565,
+ "step": 7079
+ },
+ {
+ "epoch": 19.291553133514988,
+ "grad_norm": 8.175503730773926,
+ "learning_rate": 1.8639959416196424e-05,
+ "loss": 0.7382,
+ "step": 7080
+ },
+ {
+ "epoch": 19.294277929155314,
+ "grad_norm": 8.28620719909668,
+ "learning_rate": 1.8639515047588247e-05,
+ "loss": 0.689,
+ "step": 7081
+ },
+ {
+ "epoch": 19.29700272479564,
+ "grad_norm": 10.554699897766113,
+ "learning_rate": 1.86390706116958e-05,
+ "loss": 0.7982,
+ "step": 7082
+ },
+ {
+ "epoch": 19.29972752043597,
+ "grad_norm": 12.142552375793457,
+ "learning_rate": 1.863862610852255e-05,
+ "loss": 0.9542,
+ "step": 7083
+ },
+ {
+ "epoch": 19.302452316076295,
+ "grad_norm": 9.547401428222656,
+ "learning_rate": 1.8638181538071966e-05,
+ "loss": 0.7208,
+ "step": 7084
+ },
+ {
+ "epoch": 19.30517711171662,
+ "grad_norm": 9.361517906188965,
+ "learning_rate": 1.8637736900347496e-05,
+ "loss": 0.861,
+ "step": 7085
+ },
+ {
+ "epoch": 19.30790190735695,
+ "grad_norm": 8.348713874816895,
+ "learning_rate": 1.863729219535261e-05,
+ "loss": 0.9124,
+ "step": 7086
+ },
+ {
+ "epoch": 19.310626702997276,
+ "grad_norm": 7.464922904968262,
+ "learning_rate": 1.8636847423090768e-05,
+ "loss": 0.8086,
+ "step": 7087
+ },
+ {
+ "epoch": 19.3133514986376,
+ "grad_norm": 9.388986587524414,
+ "learning_rate": 1.863640258356544e-05,
+ "loss": 0.8484,
+ "step": 7088
+ },
+ {
+ "epoch": 19.31607629427793,
+ "grad_norm": 12.31118106842041,
+ "learning_rate": 1.8635957676780085e-05,
+ "loss": 0.8545,
+ "step": 7089
+ },
+ {
+ "epoch": 19.318801089918257,
+ "grad_norm": 7.389854431152344,
+ "learning_rate": 1.8635512702738168e-05,
+ "loss": 0.8845,
+ "step": 7090
+ },
+ {
+ "epoch": 19.321525885558582,
+ "grad_norm": 9.636378288269043,
+ "learning_rate": 1.8635067661443157e-05,
+ "loss": 0.858,
+ "step": 7091
+ },
+ {
+ "epoch": 19.32425068119891,
+ "grad_norm": 12.663843154907227,
+ "learning_rate": 1.8634622552898516e-05,
+ "loss": 1.1116,
+ "step": 7092
+ },
+ {
+ "epoch": 19.326975476839237,
+ "grad_norm": 8.857486724853516,
+ "learning_rate": 1.8634177377107717e-05,
+ "loss": 0.8301,
+ "step": 7093
+ },
+ {
+ "epoch": 19.329700272479563,
+ "grad_norm": 7.673715591430664,
+ "learning_rate": 1.863373213407422e-05,
+ "loss": 0.6119,
+ "step": 7094
+ },
+ {
+ "epoch": 19.332425068119893,
+ "grad_norm": 8.896916389465332,
+ "learning_rate": 1.8633286823801495e-05,
+ "loss": 0.869,
+ "step": 7095
+ },
+ {
+ "epoch": 19.33514986376022,
+ "grad_norm": 7.086410045623779,
+ "learning_rate": 1.8632841446293008e-05,
+ "loss": 0.8376,
+ "step": 7096
+ },
+ {
+ "epoch": 19.337874659400544,
+ "grad_norm": 8.21198558807373,
+ "learning_rate": 1.8632396001552232e-05,
+ "loss": 0.741,
+ "step": 7097
+ },
+ {
+ "epoch": 19.340599455040874,
+ "grad_norm": 11.218838691711426,
+ "learning_rate": 1.863195048958263e-05,
+ "loss": 0.9675,
+ "step": 7098
+ },
+ {
+ "epoch": 19.3433242506812,
+ "grad_norm": 14.552414894104004,
+ "learning_rate": 1.863150491038768e-05,
+ "loss": 0.848,
+ "step": 7099
+ },
+ {
+ "epoch": 19.346049046321525,
+ "grad_norm": 8.315683364868164,
+ "learning_rate": 1.863105926397085e-05,
+ "loss": 0.8341,
+ "step": 7100
+ },
+ {
+ "epoch": 19.348773841961854,
+ "grad_norm": 8.802910804748535,
+ "learning_rate": 1.86306135503356e-05,
+ "loss": 0.7502,
+ "step": 7101
+ },
+ {
+ "epoch": 19.35149863760218,
+ "grad_norm": 9.626164436340332,
+ "learning_rate": 1.8630167769485417e-05,
+ "loss": 0.8588,
+ "step": 7102
+ },
+ {
+ "epoch": 19.354223433242506,
+ "grad_norm": 7.273528099060059,
+ "learning_rate": 1.862972192142376e-05,
+ "loss": 0.8357,
+ "step": 7103
+ },
+ {
+ "epoch": 19.356948228882835,
+ "grad_norm": 12.616958618164062,
+ "learning_rate": 1.862927600615411e-05,
+ "loss": 0.8398,
+ "step": 7104
+ },
+ {
+ "epoch": 19.35967302452316,
+ "grad_norm": 8.385083198547363,
+ "learning_rate": 1.862883002367993e-05,
+ "loss": 0.7583,
+ "step": 7105
+ },
+ {
+ "epoch": 19.362397820163487,
+ "grad_norm": 7.05576229095459,
+ "learning_rate": 1.8628383974004707e-05,
+ "loss": 0.8187,
+ "step": 7106
+ },
+ {
+ "epoch": 19.365122615803816,
+ "grad_norm": 10.724347114562988,
+ "learning_rate": 1.8627937857131904e-05,
+ "loss": 0.8776,
+ "step": 7107
+ },
+ {
+ "epoch": 19.367847411444142,
+ "grad_norm": 8.391908645629883,
+ "learning_rate": 1.8627491673065e-05,
+ "loss": 0.8613,
+ "step": 7108
+ },
+ {
+ "epoch": 19.370572207084468,
+ "grad_norm": 8.110748291015625,
+ "learning_rate": 1.8627045421807466e-05,
+ "loss": 0.8065,
+ "step": 7109
+ },
+ {
+ "epoch": 19.373297002724797,
+ "grad_norm": 8.11498737335205,
+ "learning_rate": 1.8626599103362783e-05,
+ "loss": 0.719,
+ "step": 7110
+ },
+ {
+ "epoch": 19.376021798365123,
+ "grad_norm": 9.259939193725586,
+ "learning_rate": 1.862615271773442e-05,
+ "loss": 0.7861,
+ "step": 7111
+ },
+ {
+ "epoch": 19.37874659400545,
+ "grad_norm": 7.308506965637207,
+ "learning_rate": 1.862570626492586e-05,
+ "loss": 0.653,
+ "step": 7112
+ },
+ {
+ "epoch": 19.381471389645778,
+ "grad_norm": 6.963586807250977,
+ "learning_rate": 1.8625259744940578e-05,
+ "loss": 0.8174,
+ "step": 7113
+ },
+ {
+ "epoch": 19.384196185286104,
+ "grad_norm": 8.394465446472168,
+ "learning_rate": 1.862481315778205e-05,
+ "loss": 0.8184,
+ "step": 7114
+ },
+ {
+ "epoch": 19.38692098092643,
+ "grad_norm": 8.269073486328125,
+ "learning_rate": 1.8624366503453752e-05,
+ "loss": 0.9324,
+ "step": 7115
+ },
+ {
+ "epoch": 19.38964577656676,
+ "grad_norm": 9.482769966125488,
+ "learning_rate": 1.862391978195917e-05,
+ "loss": 0.8301,
+ "step": 7116
+ },
+ {
+ "epoch": 19.392370572207085,
+ "grad_norm": 10.183133125305176,
+ "learning_rate": 1.8623472993301774e-05,
+ "loss": 0.7036,
+ "step": 7117
+ },
+ {
+ "epoch": 19.39509536784741,
+ "grad_norm": 8.745038986206055,
+ "learning_rate": 1.8623026137485047e-05,
+ "loss": 0.9237,
+ "step": 7118
+ },
+ {
+ "epoch": 19.39782016348774,
+ "grad_norm": 12.041457176208496,
+ "learning_rate": 1.8622579214512476e-05,
+ "loss": 0.8619,
+ "step": 7119
+ },
+ {
+ "epoch": 19.400544959128066,
+ "grad_norm": 8.609764099121094,
+ "learning_rate": 1.862213222438753e-05,
+ "loss": 0.8923,
+ "step": 7120
+ },
+ {
+ "epoch": 19.40326975476839,
+ "grad_norm": 9.28745174407959,
+ "learning_rate": 1.86216851671137e-05,
+ "loss": 0.745,
+ "step": 7121
+ },
+ {
+ "epoch": 19.40599455040872,
+ "grad_norm": 11.696236610412598,
+ "learning_rate": 1.862123804269446e-05,
+ "loss": 0.8381,
+ "step": 7122
+ },
+ {
+ "epoch": 19.408719346049047,
+ "grad_norm": 10.133161544799805,
+ "learning_rate": 1.8620790851133294e-05,
+ "loss": 1.0443,
+ "step": 7123
+ },
+ {
+ "epoch": 19.411444141689373,
+ "grad_norm": 10.21315860748291,
+ "learning_rate": 1.862034359243369e-05,
+ "loss": 0.9352,
+ "step": 7124
+ },
+ {
+ "epoch": 19.414168937329702,
+ "grad_norm": 8.50641918182373,
+ "learning_rate": 1.8619896266599128e-05,
+ "loss": 0.8772,
+ "step": 7125
+ },
+ {
+ "epoch": 19.416893732970028,
+ "grad_norm": 9.827706336975098,
+ "learning_rate": 1.861944887363309e-05,
+ "loss": 0.7192,
+ "step": 7126
+ },
+ {
+ "epoch": 19.419618528610354,
+ "grad_norm": 10.437112808227539,
+ "learning_rate": 1.861900141353906e-05,
+ "loss": 0.7804,
+ "step": 7127
+ },
+ {
+ "epoch": 19.422343324250683,
+ "grad_norm": 11.694056510925293,
+ "learning_rate": 1.8618553886320527e-05,
+ "loss": 0.858,
+ "step": 7128
+ },
+ {
+ "epoch": 19.42506811989101,
+ "grad_norm": 9.052674293518066,
+ "learning_rate": 1.861810629198097e-05,
+ "loss": 0.9775,
+ "step": 7129
+ },
+ {
+ "epoch": 19.427792915531334,
+ "grad_norm": 8.512746810913086,
+ "learning_rate": 1.8617658630523884e-05,
+ "loss": 1.0008,
+ "step": 7130
+ },
+ {
+ "epoch": 19.430517711171664,
+ "grad_norm": 9.113412857055664,
+ "learning_rate": 1.8617210901952747e-05,
+ "loss": 0.849,
+ "step": 7131
+ },
+ {
+ "epoch": 19.43324250681199,
+ "grad_norm": 7.726861476898193,
+ "learning_rate": 1.861676310627105e-05,
+ "loss": 0.7202,
+ "step": 7132
+ },
+ {
+ "epoch": 19.435967302452315,
+ "grad_norm": 9.574609756469727,
+ "learning_rate": 1.8616315243482278e-05,
+ "loss": 0.8007,
+ "step": 7133
+ },
+ {
+ "epoch": 19.438692098092645,
+ "grad_norm": 8.07555866241455,
+ "learning_rate": 1.861586731358992e-05,
+ "loss": 0.8369,
+ "step": 7134
+ },
+ {
+ "epoch": 19.44141689373297,
+ "grad_norm": 8.209267616271973,
+ "learning_rate": 1.8615419316597466e-05,
+ "loss": 0.9718,
+ "step": 7135
+ },
+ {
+ "epoch": 19.444141689373296,
+ "grad_norm": 8.566980361938477,
+ "learning_rate": 1.8614971252508404e-05,
+ "loss": 0.7947,
+ "step": 7136
+ },
+ {
+ "epoch": 19.446866485013626,
+ "grad_norm": 8.924108505249023,
+ "learning_rate": 1.861452312132622e-05,
+ "loss": 0.7556,
+ "step": 7137
+ },
+ {
+ "epoch": 19.44959128065395,
+ "grad_norm": 7.728081703186035,
+ "learning_rate": 1.861407492305441e-05,
+ "loss": 0.8705,
+ "step": 7138
+ },
+ {
+ "epoch": 19.452316076294277,
+ "grad_norm": 9.532186508178711,
+ "learning_rate": 1.861362665769646e-05,
+ "loss": 0.7142,
+ "step": 7139
+ },
+ {
+ "epoch": 19.455040871934607,
+ "grad_norm": 10.082612991333008,
+ "learning_rate": 1.8613178325255864e-05,
+ "loss": 0.8036,
+ "step": 7140
+ },
+ {
+ "epoch": 19.457765667574932,
+ "grad_norm": 7.684032917022705,
+ "learning_rate": 1.861272992573611e-05,
+ "loss": 0.7967,
+ "step": 7141
+ },
+ {
+ "epoch": 19.460490463215258,
+ "grad_norm": 9.457315444946289,
+ "learning_rate": 1.8612281459140697e-05,
+ "loss": 0.9214,
+ "step": 7142
+ },
+ {
+ "epoch": 19.463215258855588,
+ "grad_norm": 10.618170738220215,
+ "learning_rate": 1.861183292547311e-05,
+ "loss": 0.7838,
+ "step": 7143
+ },
+ {
+ "epoch": 19.465940054495913,
+ "grad_norm": 8.46899700164795,
+ "learning_rate": 1.8611384324736846e-05,
+ "loss": 0.8322,
+ "step": 7144
+ },
+ {
+ "epoch": 19.46866485013624,
+ "grad_norm": 14.252891540527344,
+ "learning_rate": 1.8610935656935397e-05,
+ "loss": 0.7529,
+ "step": 7145
+ },
+ {
+ "epoch": 19.47138964577657,
+ "grad_norm": 8.75171947479248,
+ "learning_rate": 1.8610486922072263e-05,
+ "loss": 0.9302,
+ "step": 7146
+ },
+ {
+ "epoch": 19.474114441416894,
+ "grad_norm": 9.981742858886719,
+ "learning_rate": 1.861003812015093e-05,
+ "loss": 0.8142,
+ "step": 7147
+ },
+ {
+ "epoch": 19.47683923705722,
+ "grad_norm": 8.651573181152344,
+ "learning_rate": 1.8609589251174897e-05,
+ "loss": 0.7855,
+ "step": 7148
+ },
+ {
+ "epoch": 19.479564032697546,
+ "grad_norm": 8.043776512145996,
+ "learning_rate": 1.860914031514766e-05,
+ "loss": 0.8999,
+ "step": 7149
+ },
+ {
+ "epoch": 19.482288828337875,
+ "grad_norm": 8.118514060974121,
+ "learning_rate": 1.8608691312072714e-05,
+ "loss": 0.696,
+ "step": 7150
+ },
+ {
+ "epoch": 19.4850136239782,
+ "grad_norm": 9.851868629455566,
+ "learning_rate": 1.8608242241953563e-05,
+ "loss": 0.8085,
+ "step": 7151
+ },
+ {
+ "epoch": 19.48773841961853,
+ "grad_norm": 9.400286674499512,
+ "learning_rate": 1.8607793104793696e-05,
+ "loss": 0.9197,
+ "step": 7152
+ },
+ {
+ "epoch": 19.490463215258856,
+ "grad_norm": 10.697088241577148,
+ "learning_rate": 1.8607343900596612e-05,
+ "loss": 0.8051,
+ "step": 7153
+ },
+ {
+ "epoch": 19.493188010899182,
+ "grad_norm": 8.79265022277832,
+ "learning_rate": 1.860689462936581e-05,
+ "loss": 0.9979,
+ "step": 7154
+ },
+ {
+ "epoch": 19.495912806539508,
+ "grad_norm": 10.787165641784668,
+ "learning_rate": 1.860644529110479e-05,
+ "loss": 0.9614,
+ "step": 7155
+ },
+ {
+ "epoch": 19.498637602179837,
+ "grad_norm": 15.625445365905762,
+ "learning_rate": 1.860599588581705e-05,
+ "loss": 0.9706,
+ "step": 7156
+ },
+ {
+ "epoch": 19.501362397820163,
+ "grad_norm": 8.949894905090332,
+ "learning_rate": 1.8605546413506092e-05,
+ "loss": 0.7184,
+ "step": 7157
+ },
+ {
+ "epoch": 19.504087193460492,
+ "grad_norm": 10.700446128845215,
+ "learning_rate": 1.8605096874175418e-05,
+ "loss": 0.7781,
+ "step": 7158
+ },
+ {
+ "epoch": 19.506811989100818,
+ "grad_norm": 10.570991516113281,
+ "learning_rate": 1.860464726782852e-05,
+ "loss": 0.8612,
+ "step": 7159
+ },
+ {
+ "epoch": 19.509536784741144,
+ "grad_norm": 6.78163480758667,
+ "learning_rate": 1.860419759446891e-05,
+ "loss": 0.7797,
+ "step": 7160
+ },
+ {
+ "epoch": 19.51226158038147,
+ "grad_norm": 7.994595527648926,
+ "learning_rate": 1.860374785410009e-05,
+ "loss": 0.8046,
+ "step": 7161
+ },
+ {
+ "epoch": 19.5149863760218,
+ "grad_norm": 7.7101616859436035,
+ "learning_rate": 1.8603298046725556e-05,
+ "loss": 0.7093,
+ "step": 7162
+ },
+ {
+ "epoch": 19.517711171662125,
+ "grad_norm": 8.135588645935059,
+ "learning_rate": 1.860284817234881e-05,
+ "loss": 0.9785,
+ "step": 7163
+ },
+ {
+ "epoch": 19.520435967302454,
+ "grad_norm": 8.23460578918457,
+ "learning_rate": 1.8602398230973363e-05,
+ "loss": 0.8845,
+ "step": 7164
+ },
+ {
+ "epoch": 19.52316076294278,
+ "grad_norm": 8.690340995788574,
+ "learning_rate": 1.8601948222602715e-05,
+ "loss": 0.782,
+ "step": 7165
+ },
+ {
+ "epoch": 19.525885558583106,
+ "grad_norm": 8.22935962677002,
+ "learning_rate": 1.860149814724037e-05,
+ "loss": 0.7798,
+ "step": 7166
+ },
+ {
+ "epoch": 19.52861035422343,
+ "grad_norm": 8.305482864379883,
+ "learning_rate": 1.8601048004889835e-05,
+ "loss": 0.9558,
+ "step": 7167
+ },
+ {
+ "epoch": 19.53133514986376,
+ "grad_norm": 8.000179290771484,
+ "learning_rate": 1.8600597795554613e-05,
+ "loss": 0.8922,
+ "step": 7168
+ },
+ {
+ "epoch": 19.534059945504087,
+ "grad_norm": 7.575944900512695,
+ "learning_rate": 1.8600147519238217e-05,
+ "loss": 0.5796,
+ "step": 7169
+ },
+ {
+ "epoch": 19.536784741144416,
+ "grad_norm": 7.775625228881836,
+ "learning_rate": 1.8599697175944145e-05,
+ "loss": 0.6722,
+ "step": 7170
+ },
+ {
+ "epoch": 19.539509536784742,
+ "grad_norm": 13.651352882385254,
+ "learning_rate": 1.859924676567591e-05,
+ "loss": 0.8679,
+ "step": 7171
+ },
+ {
+ "epoch": 19.542234332425068,
+ "grad_norm": 8.39905071258545,
+ "learning_rate": 1.8598796288437017e-05,
+ "loss": 0.991,
+ "step": 7172
+ },
+ {
+ "epoch": 19.544959128065393,
+ "grad_norm": 7.791860580444336,
+ "learning_rate": 1.8598345744230975e-05,
+ "loss": 0.6833,
+ "step": 7173
+ },
+ {
+ "epoch": 19.547683923705723,
+ "grad_norm": 9.090578079223633,
+ "learning_rate": 1.8597895133061293e-05,
+ "loss": 0.6956,
+ "step": 7174
+ },
+ {
+ "epoch": 19.55040871934605,
+ "grad_norm": 9.28824234008789,
+ "learning_rate": 1.859744445493148e-05,
+ "loss": 1.0017,
+ "step": 7175
+ },
+ {
+ "epoch": 19.553133514986374,
+ "grad_norm": 8.328651428222656,
+ "learning_rate": 1.8596993709845047e-05,
+ "loss": 0.817,
+ "step": 7176
+ },
+ {
+ "epoch": 19.555858310626704,
+ "grad_norm": 9.966940879821777,
+ "learning_rate": 1.8596542897805504e-05,
+ "loss": 0.9116,
+ "step": 7177
+ },
+ {
+ "epoch": 19.55858310626703,
+ "grad_norm": 8.67443561553955,
+ "learning_rate": 1.8596092018816364e-05,
+ "loss": 0.824,
+ "step": 7178
+ },
+ {
+ "epoch": 19.561307901907355,
+ "grad_norm": 8.581880569458008,
+ "learning_rate": 1.859564107288113e-05,
+ "loss": 0.7651,
+ "step": 7179
+ },
+ {
+ "epoch": 19.564032697547685,
+ "grad_norm": 6.821385383605957,
+ "learning_rate": 1.8595190060003327e-05,
+ "loss": 0.8549,
+ "step": 7180
+ },
+ {
+ "epoch": 19.56675749318801,
+ "grad_norm": 7.707915306091309,
+ "learning_rate": 1.8594738980186456e-05,
+ "loss": 0.7549,
+ "step": 7181
+ },
+ {
+ "epoch": 19.569482288828336,
+ "grad_norm": 9.711687088012695,
+ "learning_rate": 1.8594287833434033e-05,
+ "loss": 0.7441,
+ "step": 7182
+ },
+ {
+ "epoch": 19.572207084468666,
+ "grad_norm": 6.779923439025879,
+ "learning_rate": 1.8593836619749576e-05,
+ "loss": 0.9248,
+ "step": 7183
+ },
+ {
+ "epoch": 19.57493188010899,
+ "grad_norm": 8.128297805786133,
+ "learning_rate": 1.8593385339136596e-05,
+ "loss": 1.0179,
+ "step": 7184
+ },
+ {
+ "epoch": 19.577656675749317,
+ "grad_norm": 7.063774108886719,
+ "learning_rate": 1.8592933991598605e-05,
+ "loss": 0.7955,
+ "step": 7185
+ },
+ {
+ "epoch": 19.580381471389646,
+ "grad_norm": 8.919217109680176,
+ "learning_rate": 1.8592482577139125e-05,
+ "loss": 0.8444,
+ "step": 7186
+ },
+ {
+ "epoch": 19.583106267029972,
+ "grad_norm": 8.478561401367188,
+ "learning_rate": 1.8592031095761665e-05,
+ "loss": 0.7125,
+ "step": 7187
+ },
+ {
+ "epoch": 19.585831062670298,
+ "grad_norm": 8.336913108825684,
+ "learning_rate": 1.8591579547469743e-05,
+ "loss": 0.8051,
+ "step": 7188
+ },
+ {
+ "epoch": 19.588555858310627,
+ "grad_norm": 8.41412353515625,
+ "learning_rate": 1.8591127932266874e-05,
+ "loss": 0.7394,
+ "step": 7189
+ },
+ {
+ "epoch": 19.591280653950953,
+ "grad_norm": 9.4815034866333,
+ "learning_rate": 1.859067625015658e-05,
+ "loss": 0.85,
+ "step": 7190
+ },
+ {
+ "epoch": 19.59400544959128,
+ "grad_norm": 9.293360710144043,
+ "learning_rate": 1.8590224501142377e-05,
+ "loss": 0.832,
+ "step": 7191
+ },
+ {
+ "epoch": 19.59673024523161,
+ "grad_norm": 8.675623893737793,
+ "learning_rate": 1.8589772685227777e-05,
+ "loss": 1.0309,
+ "step": 7192
+ },
+ {
+ "epoch": 19.599455040871934,
+ "grad_norm": 7.507985591888428,
+ "learning_rate": 1.858932080241631e-05,
+ "loss": 0.6049,
+ "step": 7193
+ },
+ {
+ "epoch": 19.60217983651226,
+ "grad_norm": 9.1579008102417,
+ "learning_rate": 1.8588868852711487e-05,
+ "loss": 0.7317,
+ "step": 7194
+ },
+ {
+ "epoch": 19.60490463215259,
+ "grad_norm": 9.267694473266602,
+ "learning_rate": 1.8588416836116824e-05,
+ "loss": 0.9226,
+ "step": 7195
+ },
+ {
+ "epoch": 19.607629427792915,
+ "grad_norm": 8.240072250366211,
+ "learning_rate": 1.8587964752635856e-05,
+ "loss": 0.684,
+ "step": 7196
+ },
+ {
+ "epoch": 19.61035422343324,
+ "grad_norm": 7.696627616882324,
+ "learning_rate": 1.8587512602272088e-05,
+ "loss": 0.8578,
+ "step": 7197
+ },
+ {
+ "epoch": 19.61307901907357,
+ "grad_norm": 8.939593315124512,
+ "learning_rate": 1.8587060385029052e-05,
+ "loss": 0.8292,
+ "step": 7198
+ },
+ {
+ "epoch": 19.615803814713896,
+ "grad_norm": 8.204903602600098,
+ "learning_rate": 1.8586608100910265e-05,
+ "loss": 0.7584,
+ "step": 7199
+ },
+ {
+ "epoch": 19.618528610354222,
+ "grad_norm": 7.829612731933594,
+ "learning_rate": 1.858615574991925e-05,
+ "loss": 0.7552,
+ "step": 7200
+ },
+ {
+ "epoch": 19.62125340599455,
+ "grad_norm": 9.322164535522461,
+ "learning_rate": 1.858570333205953e-05,
+ "loss": 0.8754,
+ "step": 7201
+ },
+ {
+ "epoch": 19.623978201634877,
+ "grad_norm": 7.925443172454834,
+ "learning_rate": 1.858525084733463e-05,
+ "loss": 0.7184,
+ "step": 7202
+ },
+ {
+ "epoch": 19.626702997275203,
+ "grad_norm": 7.421473979949951,
+ "learning_rate": 1.8584798295748072e-05,
+ "loss": 0.8631,
+ "step": 7203
+ },
+ {
+ "epoch": 19.629427792915532,
+ "grad_norm": 8.25426197052002,
+ "learning_rate": 1.8584345677303385e-05,
+ "loss": 0.8169,
+ "step": 7204
+ },
+ {
+ "epoch": 19.632152588555858,
+ "grad_norm": 9.868017196655273,
+ "learning_rate": 1.8583892992004084e-05,
+ "loss": 0.7183,
+ "step": 7205
+ },
+ {
+ "epoch": 19.634877384196184,
+ "grad_norm": 11.133771896362305,
+ "learning_rate": 1.8583440239853705e-05,
+ "loss": 0.797,
+ "step": 7206
+ },
+ {
+ "epoch": 19.637602179836513,
+ "grad_norm": 7.968581676483154,
+ "learning_rate": 1.8582987420855766e-05,
+ "loss": 0.9005,
+ "step": 7207
+ },
+ {
+ "epoch": 19.64032697547684,
+ "grad_norm": 8.879183769226074,
+ "learning_rate": 1.8582534535013802e-05,
+ "loss": 0.8459,
+ "step": 7208
+ },
+ {
+ "epoch": 19.643051771117165,
+ "grad_norm": 9.460929870605469,
+ "learning_rate": 1.858208158233133e-05,
+ "loss": 0.8223,
+ "step": 7209
+ },
+ {
+ "epoch": 19.645776566757494,
+ "grad_norm": 10.924003601074219,
+ "learning_rate": 1.8581628562811887e-05,
+ "loss": 1.0322,
+ "step": 7210
+ },
+ {
+ "epoch": 19.64850136239782,
+ "grad_norm": 9.068217277526855,
+ "learning_rate": 1.8581175476458993e-05,
+ "loss": 0.9371,
+ "step": 7211
+ },
+ {
+ "epoch": 19.651226158038146,
+ "grad_norm": 8.336944580078125,
+ "learning_rate": 1.8580722323276186e-05,
+ "loss": 0.8612,
+ "step": 7212
+ },
+ {
+ "epoch": 19.653950953678475,
+ "grad_norm": 7.832804203033447,
+ "learning_rate": 1.8580269103266985e-05,
+ "loss": 0.7006,
+ "step": 7213
+ },
+ {
+ "epoch": 19.6566757493188,
+ "grad_norm": 11.483506202697754,
+ "learning_rate": 1.8579815816434928e-05,
+ "loss": 0.962,
+ "step": 7214
+ },
+ {
+ "epoch": 19.659400544959126,
+ "grad_norm": 9.328773498535156,
+ "learning_rate": 1.857936246278354e-05,
+ "loss": 0.7187,
+ "step": 7215
+ },
+ {
+ "epoch": 19.662125340599456,
+ "grad_norm": 9.086725234985352,
+ "learning_rate": 1.857890904231635e-05,
+ "loss": 0.8785,
+ "step": 7216
+ },
+ {
+ "epoch": 19.66485013623978,
+ "grad_norm": 8.559444427490234,
+ "learning_rate": 1.8578455555036898e-05,
+ "loss": 0.9489,
+ "step": 7217
+ },
+ {
+ "epoch": 19.667574931880107,
+ "grad_norm": 11.644548416137695,
+ "learning_rate": 1.8578002000948707e-05,
+ "loss": 0.9829,
+ "step": 7218
+ },
+ {
+ "epoch": 19.670299727520437,
+ "grad_norm": 8.787369728088379,
+ "learning_rate": 1.8577548380055312e-05,
+ "loss": 0.7469,
+ "step": 7219
+ },
+ {
+ "epoch": 19.673024523160763,
+ "grad_norm": 9.432893753051758,
+ "learning_rate": 1.8577094692360248e-05,
+ "loss": 0.8535,
+ "step": 7220
+ },
+ {
+ "epoch": 19.67574931880109,
+ "grad_norm": 8.616509437561035,
+ "learning_rate": 1.8576640937867047e-05,
+ "loss": 0.7623,
+ "step": 7221
+ },
+ {
+ "epoch": 19.678474114441418,
+ "grad_norm": 10.964095115661621,
+ "learning_rate": 1.857618711657924e-05,
+ "loss": 0.7573,
+ "step": 7222
+ },
+ {
+ "epoch": 19.681198910081743,
+ "grad_norm": 8.31070327758789,
+ "learning_rate": 1.8575733228500364e-05,
+ "loss": 0.8906,
+ "step": 7223
+ },
+ {
+ "epoch": 19.68392370572207,
+ "grad_norm": 7.251931667327881,
+ "learning_rate": 1.8575279273633957e-05,
+ "loss": 0.8314,
+ "step": 7224
+ },
+ {
+ "epoch": 19.6866485013624,
+ "grad_norm": 10.5338134765625,
+ "learning_rate": 1.857482525198355e-05,
+ "loss": 0.9138,
+ "step": 7225
+ },
+ {
+ "epoch": 19.689373297002724,
+ "grad_norm": 8.392162322998047,
+ "learning_rate": 1.8574371163552677e-05,
+ "loss": 0.6933,
+ "step": 7226
+ },
+ {
+ "epoch": 19.69209809264305,
+ "grad_norm": 9.30006217956543,
+ "learning_rate": 1.857391700834488e-05,
+ "loss": 0.824,
+ "step": 7227
+ },
+ {
+ "epoch": 19.69482288828338,
+ "grad_norm": 8.00703239440918,
+ "learning_rate": 1.857346278636369e-05,
+ "loss": 0.8078,
+ "step": 7228
+ },
+ {
+ "epoch": 19.697547683923705,
+ "grad_norm": 8.627029418945312,
+ "learning_rate": 1.857300849761265e-05,
+ "loss": 0.7823,
+ "step": 7229
+ },
+ {
+ "epoch": 19.70027247956403,
+ "grad_norm": 8.846247673034668,
+ "learning_rate": 1.8572554142095296e-05,
+ "loss": 0.8359,
+ "step": 7230
+ },
+ {
+ "epoch": 19.70299727520436,
+ "grad_norm": 9.047361373901367,
+ "learning_rate": 1.8572099719815167e-05,
+ "loss": 0.749,
+ "step": 7231
+ },
+ {
+ "epoch": 19.705722070844686,
+ "grad_norm": 7.625607490539551,
+ "learning_rate": 1.85716452307758e-05,
+ "loss": 0.8597,
+ "step": 7232
+ },
+ {
+ "epoch": 19.708446866485012,
+ "grad_norm": 9.168447494506836,
+ "learning_rate": 1.8571190674980734e-05,
+ "loss": 0.8319,
+ "step": 7233
+ },
+ {
+ "epoch": 19.71117166212534,
+ "grad_norm": 8.939648628234863,
+ "learning_rate": 1.8570736052433515e-05,
+ "loss": 0.7706,
+ "step": 7234
+ },
+ {
+ "epoch": 19.713896457765667,
+ "grad_norm": 9.04534912109375,
+ "learning_rate": 1.8570281363137677e-05,
+ "loss": 0.86,
+ "step": 7235
+ },
+ {
+ "epoch": 19.716621253405993,
+ "grad_norm": 9.590156555175781,
+ "learning_rate": 1.8569826607096764e-05,
+ "loss": 0.8484,
+ "step": 7236
+ },
+ {
+ "epoch": 19.719346049046322,
+ "grad_norm": 8.071600914001465,
+ "learning_rate": 1.8569371784314318e-05,
+ "loss": 0.7587,
+ "step": 7237
+ },
+ {
+ "epoch": 19.722070844686648,
+ "grad_norm": 7.5778703689575195,
+ "learning_rate": 1.856891689479388e-05,
+ "loss": 0.9353,
+ "step": 7238
+ },
+ {
+ "epoch": 19.724795640326974,
+ "grad_norm": 8.062702178955078,
+ "learning_rate": 1.8568461938538994e-05,
+ "loss": 0.7383,
+ "step": 7239
+ },
+ {
+ "epoch": 19.727520435967303,
+ "grad_norm": 8.187978744506836,
+ "learning_rate": 1.8568006915553202e-05,
+ "loss": 0.774,
+ "step": 7240
+ },
+ {
+ "epoch": 19.73024523160763,
+ "grad_norm": 7.880321502685547,
+ "learning_rate": 1.856755182584004e-05,
+ "loss": 0.6434,
+ "step": 7241
+ },
+ {
+ "epoch": 19.732970027247955,
+ "grad_norm": 8.603689193725586,
+ "learning_rate": 1.856709666940307e-05,
+ "loss": 0.9297,
+ "step": 7242
+ },
+ {
+ "epoch": 19.735694822888284,
+ "grad_norm": 8.921660423278809,
+ "learning_rate": 1.8566641446245825e-05,
+ "loss": 0.9548,
+ "step": 7243
+ },
+ {
+ "epoch": 19.73841961852861,
+ "grad_norm": 8.69922924041748,
+ "learning_rate": 1.856618615637185e-05,
+ "loss": 0.9243,
+ "step": 7244
+ },
+ {
+ "epoch": 19.741144414168936,
+ "grad_norm": 8.331897735595703,
+ "learning_rate": 1.8565730799784693e-05,
+ "loss": 0.8177,
+ "step": 7245
+ },
+ {
+ "epoch": 19.743869209809265,
+ "grad_norm": 8.047229766845703,
+ "learning_rate": 1.85652753764879e-05,
+ "loss": 0.7662,
+ "step": 7246
+ },
+ {
+ "epoch": 19.74659400544959,
+ "grad_norm": 11.7498140335083,
+ "learning_rate": 1.856481988648502e-05,
+ "loss": 0.77,
+ "step": 7247
+ },
+ {
+ "epoch": 19.749318801089917,
+ "grad_norm": 7.757480144500732,
+ "learning_rate": 1.85643643297796e-05,
+ "loss": 0.9216,
+ "step": 7248
+ },
+ {
+ "epoch": 19.752043596730246,
+ "grad_norm": 8.10046672821045,
+ "learning_rate": 1.8563908706375183e-05,
+ "loss": 0.916,
+ "step": 7249
+ },
+ {
+ "epoch": 19.754768392370572,
+ "grad_norm": 7.660522937774658,
+ "learning_rate": 1.8563453016275322e-05,
+ "loss": 0.7997,
+ "step": 7250
+ },
+ {
+ "epoch": 19.757493188010898,
+ "grad_norm": 8.821773529052734,
+ "learning_rate": 1.8562997259483563e-05,
+ "loss": 0.947,
+ "step": 7251
+ },
+ {
+ "epoch": 19.760217983651227,
+ "grad_norm": 7.833026885986328,
+ "learning_rate": 1.856254143600346e-05,
+ "loss": 1.0444,
+ "step": 7252
+ },
+ {
+ "epoch": 19.762942779291553,
+ "grad_norm": 9.46402359008789,
+ "learning_rate": 1.8562085545838557e-05,
+ "loss": 0.8815,
+ "step": 7253
+ },
+ {
+ "epoch": 19.76566757493188,
+ "grad_norm": 10.266973495483398,
+ "learning_rate": 1.8561629588992405e-05,
+ "loss": 0.7732,
+ "step": 7254
+ },
+ {
+ "epoch": 19.768392370572208,
+ "grad_norm": 8.80599594116211,
+ "learning_rate": 1.856117356546856e-05,
+ "loss": 0.7681,
+ "step": 7255
+ },
+ {
+ "epoch": 19.771117166212534,
+ "grad_norm": 8.57168197631836,
+ "learning_rate": 1.8560717475270573e-05,
+ "loss": 0.7834,
+ "step": 7256
+ },
+ {
+ "epoch": 19.77384196185286,
+ "grad_norm": 7.505406379699707,
+ "learning_rate": 1.856026131840199e-05,
+ "loss": 0.7225,
+ "step": 7257
+ },
+ {
+ "epoch": 19.77656675749319,
+ "grad_norm": 7.946703910827637,
+ "learning_rate": 1.855980509486637e-05,
+ "loss": 0.8301,
+ "step": 7258
+ },
+ {
+ "epoch": 19.779291553133515,
+ "grad_norm": 10.383882522583008,
+ "learning_rate": 1.8559348804667265e-05,
+ "loss": 0.7971,
+ "step": 7259
+ },
+ {
+ "epoch": 19.78201634877384,
+ "grad_norm": 7.882511615753174,
+ "learning_rate": 1.8558892447808224e-05,
+ "loss": 0.8564,
+ "step": 7260
+ },
+ {
+ "epoch": 19.78474114441417,
+ "grad_norm": 11.38111400604248,
+ "learning_rate": 1.8558436024292803e-05,
+ "loss": 0.9023,
+ "step": 7261
+ },
+ {
+ "epoch": 19.787465940054496,
+ "grad_norm": 7.0735249519348145,
+ "learning_rate": 1.855797953412456e-05,
+ "loss": 0.7559,
+ "step": 7262
+ },
+ {
+ "epoch": 19.79019073569482,
+ "grad_norm": 9.781344413757324,
+ "learning_rate": 1.8557522977307045e-05,
+ "loss": 0.8533,
+ "step": 7263
+ },
+ {
+ "epoch": 19.79291553133515,
+ "grad_norm": 8.610528945922852,
+ "learning_rate": 1.8557066353843822e-05,
+ "loss": 0.6511,
+ "step": 7264
+ },
+ {
+ "epoch": 19.795640326975477,
+ "grad_norm": 8.943483352661133,
+ "learning_rate": 1.8556609663738435e-05,
+ "loss": 0.9783,
+ "step": 7265
+ },
+ {
+ "epoch": 19.798365122615802,
+ "grad_norm": 8.305816650390625,
+ "learning_rate": 1.8556152906994453e-05,
+ "loss": 0.892,
+ "step": 7266
+ },
+ {
+ "epoch": 19.80108991825613,
+ "grad_norm": 7.825862407684326,
+ "learning_rate": 1.8555696083615425e-05,
+ "loss": 0.8247,
+ "step": 7267
+ },
+ {
+ "epoch": 19.803814713896458,
+ "grad_norm": 7.026774883270264,
+ "learning_rate": 1.8555239193604913e-05,
+ "loss": 0.7625,
+ "step": 7268
+ },
+ {
+ "epoch": 19.806539509536783,
+ "grad_norm": 10.513520240783691,
+ "learning_rate": 1.855478223696647e-05,
+ "loss": 0.8748,
+ "step": 7269
+ },
+ {
+ "epoch": 19.809264305177113,
+ "grad_norm": 8.773707389831543,
+ "learning_rate": 1.8554325213703663e-05,
+ "loss": 0.813,
+ "step": 7270
+ },
+ {
+ "epoch": 19.81198910081744,
+ "grad_norm": 46.05637741088867,
+ "learning_rate": 1.8553868123820043e-05,
+ "loss": 0.8654,
+ "step": 7271
+ },
+ {
+ "epoch": 19.814713896457764,
+ "grad_norm": 9.854783058166504,
+ "learning_rate": 1.8553410967319173e-05,
+ "loss": 1.0159,
+ "step": 7272
+ },
+ {
+ "epoch": 19.817438692098094,
+ "grad_norm": 7.48112678527832,
+ "learning_rate": 1.8552953744204613e-05,
+ "loss": 0.818,
+ "step": 7273
+ },
+ {
+ "epoch": 19.82016348773842,
+ "grad_norm": 8.394046783447266,
+ "learning_rate": 1.855249645447993e-05,
+ "loss": 0.8461,
+ "step": 7274
+ },
+ {
+ "epoch": 19.822888283378745,
+ "grad_norm": 8.375469207763672,
+ "learning_rate": 1.8552039098148677e-05,
+ "loss": 0.8241,
+ "step": 7275
+ },
+ {
+ "epoch": 19.825613079019075,
+ "grad_norm": 8.33053970336914,
+ "learning_rate": 1.8551581675214416e-05,
+ "loss": 0.8422,
+ "step": 7276
+ },
+ {
+ "epoch": 19.8283378746594,
+ "grad_norm": 9.191420555114746,
+ "learning_rate": 1.8551124185680716e-05,
+ "loss": 0.7114,
+ "step": 7277
+ },
+ {
+ "epoch": 19.831062670299726,
+ "grad_norm": 9.85604476928711,
+ "learning_rate": 1.855066662955113e-05,
+ "loss": 0.8715,
+ "step": 7278
+ },
+ {
+ "epoch": 19.833787465940055,
+ "grad_norm": 7.668471813201904,
+ "learning_rate": 1.8550209006829236e-05,
+ "loss": 1.1304,
+ "step": 7279
+ },
+ {
+ "epoch": 19.83651226158038,
+ "grad_norm": 9.162517547607422,
+ "learning_rate": 1.8549751317518583e-05,
+ "loss": 0.9307,
+ "step": 7280
+ },
+ {
+ "epoch": 19.839237057220707,
+ "grad_norm": 7.64418888092041,
+ "learning_rate": 1.8549293561622742e-05,
+ "loss": 0.7964,
+ "step": 7281
+ },
+ {
+ "epoch": 19.841961852861036,
+ "grad_norm": 10.020888328552246,
+ "learning_rate": 1.854883573914528e-05,
+ "loss": 0.8617,
+ "step": 7282
+ },
+ {
+ "epoch": 19.844686648501362,
+ "grad_norm": 8.746636390686035,
+ "learning_rate": 1.8548377850089764e-05,
+ "loss": 0.7571,
+ "step": 7283
+ },
+ {
+ "epoch": 19.847411444141688,
+ "grad_norm": 8.420528411865234,
+ "learning_rate": 1.8547919894459753e-05,
+ "loss": 0.7667,
+ "step": 7284
+ },
+ {
+ "epoch": 19.850136239782017,
+ "grad_norm": 10.011277198791504,
+ "learning_rate": 1.8547461872258816e-05,
+ "loss": 0.8011,
+ "step": 7285
+ },
+ {
+ "epoch": 19.852861035422343,
+ "grad_norm": 10.89472484588623,
+ "learning_rate": 1.854700378349052e-05,
+ "loss": 1.0264,
+ "step": 7286
+ },
+ {
+ "epoch": 19.85558583106267,
+ "grad_norm": 9.870013236999512,
+ "learning_rate": 1.854654562815844e-05,
+ "loss": 0.9823,
+ "step": 7287
+ },
+ {
+ "epoch": 19.858310626703,
+ "grad_norm": 24.940608978271484,
+ "learning_rate": 1.854608740626613e-05,
+ "loss": 1.1353,
+ "step": 7288
+ },
+ {
+ "epoch": 19.861035422343324,
+ "grad_norm": 6.848790168762207,
+ "learning_rate": 1.854562911781717e-05,
+ "loss": 0.7698,
+ "step": 7289
+ },
+ {
+ "epoch": 19.86376021798365,
+ "grad_norm": 9.606679916381836,
+ "learning_rate": 1.8545170762815122e-05,
+ "loss": 0.9084,
+ "step": 7290
+ },
+ {
+ "epoch": 19.86648501362398,
+ "grad_norm": 12.181947708129883,
+ "learning_rate": 1.8544712341263566e-05,
+ "loss": 0.9169,
+ "step": 7291
+ },
+ {
+ "epoch": 19.869209809264305,
+ "grad_norm": 8.039779663085938,
+ "learning_rate": 1.854425385316606e-05,
+ "loss": 1.0466,
+ "step": 7292
+ },
+ {
+ "epoch": 19.87193460490463,
+ "grad_norm": 8.474559783935547,
+ "learning_rate": 1.854379529852618e-05,
+ "loss": 0.912,
+ "step": 7293
+ },
+ {
+ "epoch": 19.87465940054496,
+ "grad_norm": 7.942590713500977,
+ "learning_rate": 1.85433366773475e-05,
+ "loss": 0.8755,
+ "step": 7294
+ },
+ {
+ "epoch": 19.877384196185286,
+ "grad_norm": 9.164682388305664,
+ "learning_rate": 1.854287798963359e-05,
+ "loss": 0.8634,
+ "step": 7295
+ },
+ {
+ "epoch": 19.88010899182561,
+ "grad_norm": 7.278963088989258,
+ "learning_rate": 1.8542419235388016e-05,
+ "loss": 0.8492,
+ "step": 7296
+ },
+ {
+ "epoch": 19.88283378746594,
+ "grad_norm": 9.253836631774902,
+ "learning_rate": 1.854196041461436e-05,
+ "loss": 1.0032,
+ "step": 7297
+ },
+ {
+ "epoch": 19.885558583106267,
+ "grad_norm": 10.022604942321777,
+ "learning_rate": 1.854150152731619e-05,
+ "loss": 0.7737,
+ "step": 7298
+ },
+ {
+ "epoch": 19.888283378746593,
+ "grad_norm": 6.893654823303223,
+ "learning_rate": 1.854104257349708e-05,
+ "loss": 0.8645,
+ "step": 7299
+ },
+ {
+ "epoch": 19.891008174386922,
+ "grad_norm": 6.988736152648926,
+ "learning_rate": 1.8540583553160606e-05,
+ "loss": 0.8486,
+ "step": 7300
+ },
+ {
+ "epoch": 19.893732970027248,
+ "grad_norm": 9.518927574157715,
+ "learning_rate": 1.8540124466310345e-05,
+ "loss": 0.8699,
+ "step": 7301
+ },
+ {
+ "epoch": 19.896457765667574,
+ "grad_norm": 13.948290824890137,
+ "learning_rate": 1.8539665312949864e-05,
+ "loss": 0.9276,
+ "step": 7302
+ },
+ {
+ "epoch": 19.899182561307903,
+ "grad_norm": 8.599923133850098,
+ "learning_rate": 1.8539206093082748e-05,
+ "loss": 0.7977,
+ "step": 7303
+ },
+ {
+ "epoch": 19.90190735694823,
+ "grad_norm": 10.82606029510498,
+ "learning_rate": 1.8538746806712568e-05,
+ "loss": 0.767,
+ "step": 7304
+ },
+ {
+ "epoch": 19.904632152588555,
+ "grad_norm": 9.037323951721191,
+ "learning_rate": 1.8538287453842906e-05,
+ "loss": 0.9191,
+ "step": 7305
+ },
+ {
+ "epoch": 19.907356948228884,
+ "grad_norm": 7.831912994384766,
+ "learning_rate": 1.853782803447733e-05,
+ "loss": 0.7819,
+ "step": 7306
+ },
+ {
+ "epoch": 19.91008174386921,
+ "grad_norm": 10.063775062561035,
+ "learning_rate": 1.853736854861943e-05,
+ "loss": 0.8586,
+ "step": 7307
+ },
+ {
+ "epoch": 19.912806539509535,
+ "grad_norm": 8.359786033630371,
+ "learning_rate": 1.8536908996272777e-05,
+ "loss": 0.8816,
+ "step": 7308
+ },
+ {
+ "epoch": 19.915531335149865,
+ "grad_norm": 7.736542701721191,
+ "learning_rate": 1.853644937744095e-05,
+ "loss": 0.7466,
+ "step": 7309
+ },
+ {
+ "epoch": 19.91825613079019,
+ "grad_norm": 7.516117095947266,
+ "learning_rate": 1.853598969212753e-05,
+ "loss": 0.9105,
+ "step": 7310
+ },
+ {
+ "epoch": 19.920980926430516,
+ "grad_norm": 10.034730911254883,
+ "learning_rate": 1.8535529940336098e-05,
+ "loss": 0.8567,
+ "step": 7311
+ },
+ {
+ "epoch": 19.923705722070846,
+ "grad_norm": 7.54212760925293,
+ "learning_rate": 1.8535070122070237e-05,
+ "loss": 0.7722,
+ "step": 7312
+ },
+ {
+ "epoch": 19.92643051771117,
+ "grad_norm": 7.285183429718018,
+ "learning_rate": 1.853461023733352e-05,
+ "loss": 0.7952,
+ "step": 7313
+ },
+ {
+ "epoch": 19.929155313351497,
+ "grad_norm": 7.934067726135254,
+ "learning_rate": 1.853415028612953e-05,
+ "loss": 0.7682,
+ "step": 7314
+ },
+ {
+ "epoch": 19.931880108991827,
+ "grad_norm": 9.840912818908691,
+ "learning_rate": 1.8533690268461862e-05,
+ "loss": 0.8525,
+ "step": 7315
+ },
+ {
+ "epoch": 19.934604904632153,
+ "grad_norm": 9.348376274108887,
+ "learning_rate": 1.853323018433408e-05,
+ "loss": 0.9363,
+ "step": 7316
+ },
+ {
+ "epoch": 19.93732970027248,
+ "grad_norm": 8.461465835571289,
+ "learning_rate": 1.853277003374978e-05,
+ "loss": 0.8999,
+ "step": 7317
+ },
+ {
+ "epoch": 19.940054495912808,
+ "grad_norm": 8.06180191040039,
+ "learning_rate": 1.8532309816712542e-05,
+ "loss": 0.7518,
+ "step": 7318
+ },
+ {
+ "epoch": 19.942779291553133,
+ "grad_norm": 9.115461349487305,
+ "learning_rate": 1.8531849533225948e-05,
+ "loss": 0.9355,
+ "step": 7319
+ },
+ {
+ "epoch": 19.94550408719346,
+ "grad_norm": 9.954212188720703,
+ "learning_rate": 1.8531389183293583e-05,
+ "loss": 0.8217,
+ "step": 7320
+ },
+ {
+ "epoch": 19.94822888283379,
+ "grad_norm": 8.282428741455078,
+ "learning_rate": 1.853092876691904e-05,
+ "loss": 1.0406,
+ "step": 7321
+ },
+ {
+ "epoch": 19.950953678474114,
+ "grad_norm": 8.437095642089844,
+ "learning_rate": 1.853046828410589e-05,
+ "loss": 0.8442,
+ "step": 7322
+ },
+ {
+ "epoch": 19.95367847411444,
+ "grad_norm": 7.819126129150391,
+ "learning_rate": 1.8530007734857734e-05,
+ "loss": 0.7717,
+ "step": 7323
+ },
+ {
+ "epoch": 19.95640326975477,
+ "grad_norm": 8.74654483795166,
+ "learning_rate": 1.852954711917815e-05,
+ "loss": 0.817,
+ "step": 7324
+ },
+ {
+ "epoch": 19.959128065395095,
+ "grad_norm": 8.207504272460938,
+ "learning_rate": 1.8529086437070726e-05,
+ "loss": 0.8737,
+ "step": 7325
+ },
+ {
+ "epoch": 19.96185286103542,
+ "grad_norm": 9.41775131225586,
+ "learning_rate": 1.8528625688539055e-05,
+ "loss": 0.9446,
+ "step": 7326
+ },
+ {
+ "epoch": 19.96457765667575,
+ "grad_norm": 9.330113410949707,
+ "learning_rate": 1.8528164873586717e-05,
+ "loss": 0.8481,
+ "step": 7327
+ },
+ {
+ "epoch": 19.967302452316076,
+ "grad_norm": 8.378766059875488,
+ "learning_rate": 1.852770399221731e-05,
+ "loss": 0.9222,
+ "step": 7328
+ },
+ {
+ "epoch": 19.970027247956402,
+ "grad_norm": 11.528024673461914,
+ "learning_rate": 1.8527243044434415e-05,
+ "loss": 0.7509,
+ "step": 7329
+ },
+ {
+ "epoch": 19.97275204359673,
+ "grad_norm": 7.323259353637695,
+ "learning_rate": 1.852678203024163e-05,
+ "loss": 0.9354,
+ "step": 7330
+ },
+ {
+ "epoch": 19.975476839237057,
+ "grad_norm": 7.935391902923584,
+ "learning_rate": 1.8526320949642536e-05,
+ "loss": 0.9752,
+ "step": 7331
+ },
+ {
+ "epoch": 19.978201634877383,
+ "grad_norm": 7.215292930603027,
+ "learning_rate": 1.8525859802640733e-05,
+ "loss": 0.7661,
+ "step": 7332
+ },
+ {
+ "epoch": 19.980926430517712,
+ "grad_norm": 7.696983814239502,
+ "learning_rate": 1.8525398589239803e-05,
+ "loss": 0.9115,
+ "step": 7333
+ },
+ {
+ "epoch": 19.983651226158038,
+ "grad_norm": 10.614715576171875,
+ "learning_rate": 1.8524937309443346e-05,
+ "loss": 0.6874,
+ "step": 7334
+ },
+ {
+ "epoch": 19.986376021798364,
+ "grad_norm": 9.582474708557129,
+ "learning_rate": 1.8524475963254955e-05,
+ "loss": 0.939,
+ "step": 7335
+ },
+ {
+ "epoch": 19.989100817438693,
+ "grad_norm": 7.234864711761475,
+ "learning_rate": 1.8524014550678212e-05,
+ "loss": 0.7971,
+ "step": 7336
+ },
+ {
+ "epoch": 19.99182561307902,
+ "grad_norm": 8.474017143249512,
+ "learning_rate": 1.8523553071716726e-05,
+ "loss": 0.7489,
+ "step": 7337
+ },
+ {
+ "epoch": 19.994550408719345,
+ "grad_norm": 8.070943832397461,
+ "learning_rate": 1.852309152637408e-05,
+ "loss": 0.8862,
+ "step": 7338
+ },
+ {
+ "epoch": 19.997275204359674,
+ "grad_norm": 8.766613006591797,
+ "learning_rate": 1.852262991465387e-05,
+ "loss": 0.8653,
+ "step": 7339
+ },
+ {
+ "epoch": 20.0,
+ "grad_norm": 8.434788703918457,
+ "learning_rate": 1.8522168236559693e-05,
+ "loss": 0.7374,
+ "step": 7340
+ },
+ {
+ "epoch": 20.002724795640326,
+ "grad_norm": 10.932939529418945,
+ "learning_rate": 1.8521706492095147e-05,
+ "loss": 0.8364,
+ "step": 7341
+ },
+ {
+ "epoch": 20.005449591280655,
+ "grad_norm": 7.836805820465088,
+ "learning_rate": 1.852124468126382e-05,
+ "loss": 0.8916,
+ "step": 7342
+ },
+ {
+ "epoch": 20.00817438692098,
+ "grad_norm": 7.299636363983154,
+ "learning_rate": 1.8520782804069317e-05,
+ "loss": 0.619,
+ "step": 7343
+ },
+ {
+ "epoch": 20.010899182561307,
+ "grad_norm": 6.49599027633667,
+ "learning_rate": 1.8520320860515233e-05,
+ "loss": 0.745,
+ "step": 7344
+ },
+ {
+ "epoch": 20.013623978201636,
+ "grad_norm": 7.857719421386719,
+ "learning_rate": 1.851985885060516e-05,
+ "loss": 0.7843,
+ "step": 7345
+ },
+ {
+ "epoch": 20.016348773841962,
+ "grad_norm": 6.397619247436523,
+ "learning_rate": 1.8519396774342707e-05,
+ "loss": 0.6598,
+ "step": 7346
+ },
+ {
+ "epoch": 20.019073569482288,
+ "grad_norm": 6.885274410247803,
+ "learning_rate": 1.8518934631731463e-05,
+ "loss": 0.8165,
+ "step": 7347
+ },
+ {
+ "epoch": 20.021798365122617,
+ "grad_norm": 10.903122901916504,
+ "learning_rate": 1.8518472422775027e-05,
+ "loss": 0.7291,
+ "step": 7348
+ },
+ {
+ "epoch": 20.024523160762943,
+ "grad_norm": 7.2153425216674805,
+ "learning_rate": 1.8518010147477007e-05,
+ "loss": 0.8179,
+ "step": 7349
+ },
+ {
+ "epoch": 20.02724795640327,
+ "grad_norm": 12.313626289367676,
+ "learning_rate": 1.8517547805840995e-05,
+ "loss": 0.9888,
+ "step": 7350
+ },
+ {
+ "epoch": 20.029972752043598,
+ "grad_norm": 7.701757431030273,
+ "learning_rate": 1.8517085397870594e-05,
+ "loss": 0.7278,
+ "step": 7351
+ },
+ {
+ "epoch": 20.032697547683924,
+ "grad_norm": 7.067673206329346,
+ "learning_rate": 1.8516622923569406e-05,
+ "loss": 0.7112,
+ "step": 7352
+ },
+ {
+ "epoch": 20.03542234332425,
+ "grad_norm": 16.146074295043945,
+ "learning_rate": 1.8516160382941035e-05,
+ "loss": 0.8728,
+ "step": 7353
+ },
+ {
+ "epoch": 20.03814713896458,
+ "grad_norm": 9.322784423828125,
+ "learning_rate": 1.851569777598908e-05,
+ "loss": 0.6955,
+ "step": 7354
+ },
+ {
+ "epoch": 20.040871934604905,
+ "grad_norm": 7.918156147003174,
+ "learning_rate": 1.8515235102717145e-05,
+ "loss": 0.7109,
+ "step": 7355
+ },
+ {
+ "epoch": 20.04359673024523,
+ "grad_norm": 7.2958574295043945,
+ "learning_rate": 1.8514772363128833e-05,
+ "loss": 0.8171,
+ "step": 7356
+ },
+ {
+ "epoch": 20.04632152588556,
+ "grad_norm": 7.862805366516113,
+ "learning_rate": 1.851430955722775e-05,
+ "loss": 0.5814,
+ "step": 7357
+ },
+ {
+ "epoch": 20.049046321525886,
+ "grad_norm": 7.682487964630127,
+ "learning_rate": 1.8513846685017498e-05,
+ "loss": 0.7802,
+ "step": 7358
+ },
+ {
+ "epoch": 20.05177111716621,
+ "grad_norm": 8.207341194152832,
+ "learning_rate": 1.8513383746501678e-05,
+ "loss": 0.8322,
+ "step": 7359
+ },
+ {
+ "epoch": 20.05449591280654,
+ "grad_norm": 8.06595230102539,
+ "learning_rate": 1.85129207416839e-05,
+ "loss": 0.7709,
+ "step": 7360
+ },
+ {
+ "epoch": 20.057220708446867,
+ "grad_norm": 7.644371032714844,
+ "learning_rate": 1.8512457670567773e-05,
+ "loss": 0.7821,
+ "step": 7361
+ },
+ {
+ "epoch": 20.059945504087192,
+ "grad_norm": 8.130538940429688,
+ "learning_rate": 1.8511994533156898e-05,
+ "loss": 0.8824,
+ "step": 7362
+ },
+ {
+ "epoch": 20.06267029972752,
+ "grad_norm": 8.64433479309082,
+ "learning_rate": 1.8511531329454883e-05,
+ "loss": 0.7031,
+ "step": 7363
+ },
+ {
+ "epoch": 20.065395095367847,
+ "grad_norm": 8.260018348693848,
+ "learning_rate": 1.8511068059465334e-05,
+ "loss": 0.7408,
+ "step": 7364
+ },
+ {
+ "epoch": 20.068119891008173,
+ "grad_norm": 8.091988563537598,
+ "learning_rate": 1.8510604723191865e-05,
+ "loss": 0.7526,
+ "step": 7365
+ },
+ {
+ "epoch": 20.070844686648503,
+ "grad_norm": 8.094756126403809,
+ "learning_rate": 1.8510141320638078e-05,
+ "loss": 0.7114,
+ "step": 7366
+ },
+ {
+ "epoch": 20.07356948228883,
+ "grad_norm": 10.249007225036621,
+ "learning_rate": 1.8509677851807584e-05,
+ "loss": 0.8809,
+ "step": 7367
+ },
+ {
+ "epoch": 20.076294277929154,
+ "grad_norm": 7.930947303771973,
+ "learning_rate": 1.8509214316703993e-05,
+ "loss": 0.8882,
+ "step": 7368
+ },
+ {
+ "epoch": 20.079019073569484,
+ "grad_norm": 8.538778305053711,
+ "learning_rate": 1.8508750715330913e-05,
+ "loss": 0.6705,
+ "step": 7369
+ },
+ {
+ "epoch": 20.08174386920981,
+ "grad_norm": 7.569141864776611,
+ "learning_rate": 1.850828704769196e-05,
+ "loss": 0.7793,
+ "step": 7370
+ },
+ {
+ "epoch": 20.084468664850135,
+ "grad_norm": 11.548090934753418,
+ "learning_rate": 1.850782331379074e-05,
+ "loss": 0.8179,
+ "step": 7371
+ },
+ {
+ "epoch": 20.087193460490465,
+ "grad_norm": 7.210183143615723,
+ "learning_rate": 1.8507359513630865e-05,
+ "loss": 0.7361,
+ "step": 7372
+ },
+ {
+ "epoch": 20.08991825613079,
+ "grad_norm": 7.356325149536133,
+ "learning_rate": 1.850689564721595e-05,
+ "loss": 0.7419,
+ "step": 7373
+ },
+ {
+ "epoch": 20.092643051771116,
+ "grad_norm": 8.463406562805176,
+ "learning_rate": 1.8506431714549606e-05,
+ "loss": 0.9131,
+ "step": 7374
+ },
+ {
+ "epoch": 20.095367847411445,
+ "grad_norm": 11.675747871398926,
+ "learning_rate": 1.850596771563544e-05,
+ "loss": 0.8203,
+ "step": 7375
+ },
+ {
+ "epoch": 20.09809264305177,
+ "grad_norm": 7.034526348114014,
+ "learning_rate": 1.8505503650477074e-05,
+ "loss": 0.7858,
+ "step": 7376
+ },
+ {
+ "epoch": 20.100817438692097,
+ "grad_norm": 7.410828113555908,
+ "learning_rate": 1.850503951907812e-05,
+ "loss": 0.8191,
+ "step": 7377
+ },
+ {
+ "epoch": 20.103542234332426,
+ "grad_norm": 8.026698112487793,
+ "learning_rate": 1.8504575321442194e-05,
+ "loss": 0.7474,
+ "step": 7378
+ },
+ {
+ "epoch": 20.106267029972752,
+ "grad_norm": 7.907639503479004,
+ "learning_rate": 1.8504111057572905e-05,
+ "loss": 0.7725,
+ "step": 7379
+ },
+ {
+ "epoch": 20.108991825613078,
+ "grad_norm": 6.920834064483643,
+ "learning_rate": 1.8503646727473877e-05,
+ "loss": 0.7247,
+ "step": 7380
+ },
+ {
+ "epoch": 20.111716621253407,
+ "grad_norm": 7.789642810821533,
+ "learning_rate": 1.850318233114872e-05,
+ "loss": 0.6345,
+ "step": 7381
+ },
+ {
+ "epoch": 20.114441416893733,
+ "grad_norm": 7.425340175628662,
+ "learning_rate": 1.8502717868601054e-05,
+ "loss": 0.6998,
+ "step": 7382
+ },
+ {
+ "epoch": 20.11716621253406,
+ "grad_norm": 8.662664413452148,
+ "learning_rate": 1.850225333983449e-05,
+ "loss": 0.795,
+ "step": 7383
+ },
+ {
+ "epoch": 20.11989100817439,
+ "grad_norm": 7.657357215881348,
+ "learning_rate": 1.8501788744852652e-05,
+ "loss": 0.7484,
+ "step": 7384
+ },
+ {
+ "epoch": 20.122615803814714,
+ "grad_norm": 7.295523643493652,
+ "learning_rate": 1.850132408365916e-05,
+ "loss": 0.624,
+ "step": 7385
+ },
+ {
+ "epoch": 20.12534059945504,
+ "grad_norm": 8.386079788208008,
+ "learning_rate": 1.850085935625763e-05,
+ "loss": 0.8629,
+ "step": 7386
+ },
+ {
+ "epoch": 20.12806539509537,
+ "grad_norm": 9.70673942565918,
+ "learning_rate": 1.850039456265168e-05,
+ "loss": 0.9041,
+ "step": 7387
+ },
+ {
+ "epoch": 20.130790190735695,
+ "grad_norm": 7.998185157775879,
+ "learning_rate": 1.8499929702844932e-05,
+ "loss": 0.7749,
+ "step": 7388
+ },
+ {
+ "epoch": 20.13351498637602,
+ "grad_norm": 7.6672444343566895,
+ "learning_rate": 1.8499464776841e-05,
+ "loss": 0.7769,
+ "step": 7389
+ },
+ {
+ "epoch": 20.13623978201635,
+ "grad_norm": 9.27935791015625,
+ "learning_rate": 1.8498999784643517e-05,
+ "loss": 0.8093,
+ "step": 7390
+ },
+ {
+ "epoch": 20.138964577656676,
+ "grad_norm": 7.795583724975586,
+ "learning_rate": 1.8498534726256094e-05,
+ "loss": 0.8046,
+ "step": 7391
+ },
+ {
+ "epoch": 20.141689373297,
+ "grad_norm": 7.7575273513793945,
+ "learning_rate": 1.8498069601682353e-05,
+ "loss": 0.7775,
+ "step": 7392
+ },
+ {
+ "epoch": 20.14441416893733,
+ "grad_norm": 8.204751968383789,
+ "learning_rate": 1.8497604410925923e-05,
+ "loss": 0.741,
+ "step": 7393
+ },
+ {
+ "epoch": 20.147138964577657,
+ "grad_norm": 7.928032875061035,
+ "learning_rate": 1.849713915399042e-05,
+ "loss": 0.8253,
+ "step": 7394
+ },
+ {
+ "epoch": 20.149863760217983,
+ "grad_norm": 8.550969123840332,
+ "learning_rate": 1.8496673830879475e-05,
+ "loss": 0.6736,
+ "step": 7395
+ },
+ {
+ "epoch": 20.152588555858312,
+ "grad_norm": 6.771650791168213,
+ "learning_rate": 1.8496208441596706e-05,
+ "loss": 0.7365,
+ "step": 7396
+ },
+ {
+ "epoch": 20.155313351498638,
+ "grad_norm": 8.69344425201416,
+ "learning_rate": 1.8495742986145737e-05,
+ "loss": 0.6356,
+ "step": 7397
+ },
+ {
+ "epoch": 20.158038147138964,
+ "grad_norm": 8.5400390625,
+ "learning_rate": 1.8495277464530198e-05,
+ "loss": 0.7332,
+ "step": 7398
+ },
+ {
+ "epoch": 20.160762942779293,
+ "grad_norm": 8.132911682128906,
+ "learning_rate": 1.8494811876753712e-05,
+ "loss": 0.7512,
+ "step": 7399
+ },
+ {
+ "epoch": 20.16348773841962,
+ "grad_norm": 7.471899032592773,
+ "learning_rate": 1.84943462228199e-05,
+ "loss": 0.7015,
+ "step": 7400
+ },
+ {
+ "epoch": 20.166212534059945,
+ "grad_norm": 7.605429649353027,
+ "learning_rate": 1.84938805027324e-05,
+ "loss": 0.7745,
+ "step": 7401
+ },
+ {
+ "epoch": 20.168937329700274,
+ "grad_norm": 8.774757385253906,
+ "learning_rate": 1.8493414716494826e-05,
+ "loss": 0.7217,
+ "step": 7402
+ },
+ {
+ "epoch": 20.1716621253406,
+ "grad_norm": 7.752110481262207,
+ "learning_rate": 1.849294886411081e-05,
+ "loss": 0.675,
+ "step": 7403
+ },
+ {
+ "epoch": 20.174386920980925,
+ "grad_norm": 7.987790107727051,
+ "learning_rate": 1.849248294558399e-05,
+ "loss": 0.7279,
+ "step": 7404
+ },
+ {
+ "epoch": 20.177111716621255,
+ "grad_norm": 7.009028434753418,
+ "learning_rate": 1.849201696091798e-05,
+ "loss": 0.6802,
+ "step": 7405
+ },
+ {
+ "epoch": 20.17983651226158,
+ "grad_norm": 7.810697078704834,
+ "learning_rate": 1.8491550910116415e-05,
+ "loss": 0.8302,
+ "step": 7406
+ },
+ {
+ "epoch": 20.182561307901906,
+ "grad_norm": 9.02009105682373,
+ "learning_rate": 1.8491084793182925e-05,
+ "loss": 0.8419,
+ "step": 7407
+ },
+ {
+ "epoch": 20.185286103542236,
+ "grad_norm": 9.22038459777832,
+ "learning_rate": 1.8490618610121144e-05,
+ "loss": 0.6157,
+ "step": 7408
+ },
+ {
+ "epoch": 20.18801089918256,
+ "grad_norm": 6.129733562469482,
+ "learning_rate": 1.8490152360934695e-05,
+ "loss": 0.6604,
+ "step": 7409
+ },
+ {
+ "epoch": 20.190735694822887,
+ "grad_norm": 6.585142612457275,
+ "learning_rate": 1.848968604562721e-05,
+ "loss": 0.7493,
+ "step": 7410
+ },
+ {
+ "epoch": 20.193460490463217,
+ "grad_norm": 13.595898628234863,
+ "learning_rate": 1.848921966420233e-05,
+ "loss": 0.7126,
+ "step": 7411
+ },
+ {
+ "epoch": 20.196185286103542,
+ "grad_norm": 9.962562561035156,
+ "learning_rate": 1.8488753216663675e-05,
+ "loss": 0.826,
+ "step": 7412
+ },
+ {
+ "epoch": 20.19891008174387,
+ "grad_norm": 8.39643383026123,
+ "learning_rate": 1.848828670301489e-05,
+ "loss": 0.6631,
+ "step": 7413
+ },
+ {
+ "epoch": 20.201634877384198,
+ "grad_norm": 8.44212532043457,
+ "learning_rate": 1.8487820123259595e-05,
+ "loss": 0.6271,
+ "step": 7414
+ },
+ {
+ "epoch": 20.204359673024523,
+ "grad_norm": 7.178295135498047,
+ "learning_rate": 1.848735347740143e-05,
+ "loss": 0.8287,
+ "step": 7415
+ },
+ {
+ "epoch": 20.20708446866485,
+ "grad_norm": 14.088622093200684,
+ "learning_rate": 1.848688676544403e-05,
+ "loss": 0.9037,
+ "step": 7416
+ },
+ {
+ "epoch": 20.20980926430518,
+ "grad_norm": 9.695867538452148,
+ "learning_rate": 1.848641998739103e-05,
+ "loss": 0.8507,
+ "step": 7417
+ },
+ {
+ "epoch": 20.212534059945504,
+ "grad_norm": 8.77767276763916,
+ "learning_rate": 1.8485953143246065e-05,
+ "loss": 0.6851,
+ "step": 7418
+ },
+ {
+ "epoch": 20.21525885558583,
+ "grad_norm": 7.242414474487305,
+ "learning_rate": 1.848548623301277e-05,
+ "loss": 0.6465,
+ "step": 7419
+ },
+ {
+ "epoch": 20.21798365122616,
+ "grad_norm": 11.707669258117676,
+ "learning_rate": 1.848501925669478e-05,
+ "loss": 0.7872,
+ "step": 7420
+ },
+ {
+ "epoch": 20.220708446866485,
+ "grad_norm": 8.391408920288086,
+ "learning_rate": 1.8484552214295735e-05,
+ "loss": 0.6744,
+ "step": 7421
+ },
+ {
+ "epoch": 20.22343324250681,
+ "grad_norm": 7.5969767570495605,
+ "learning_rate": 1.8484085105819267e-05,
+ "loss": 0.7931,
+ "step": 7422
+ },
+ {
+ "epoch": 20.22615803814714,
+ "grad_norm": 8.797009468078613,
+ "learning_rate": 1.8483617931269022e-05,
+ "loss": 0.7268,
+ "step": 7423
+ },
+ {
+ "epoch": 20.228882833787466,
+ "grad_norm": 8.09107780456543,
+ "learning_rate": 1.848315069064863e-05,
+ "loss": 0.7107,
+ "step": 7424
+ },
+ {
+ "epoch": 20.231607629427792,
+ "grad_norm": 10.13934326171875,
+ "learning_rate": 1.8482683383961734e-05,
+ "loss": 0.6779,
+ "step": 7425
+ },
+ {
+ "epoch": 20.23433242506812,
+ "grad_norm": 7.996647834777832,
+ "learning_rate": 1.8482216011211976e-05,
+ "loss": 0.7646,
+ "step": 7426
+ },
+ {
+ "epoch": 20.237057220708447,
+ "grad_norm": 7.624180793762207,
+ "learning_rate": 1.8481748572402986e-05,
+ "loss": 0.7559,
+ "step": 7427
+ },
+ {
+ "epoch": 20.239782016348773,
+ "grad_norm": 11.821518898010254,
+ "learning_rate": 1.8481281067538416e-05,
+ "loss": 0.7444,
+ "step": 7428
+ },
+ {
+ "epoch": 20.242506811989102,
+ "grad_norm": 9.72706413269043,
+ "learning_rate": 1.8480813496621902e-05,
+ "loss": 0.833,
+ "step": 7429
+ },
+ {
+ "epoch": 20.245231607629428,
+ "grad_norm": 13.47059154510498,
+ "learning_rate": 1.8480345859657085e-05,
+ "loss": 0.8408,
+ "step": 7430
+ },
+ {
+ "epoch": 20.247956403269754,
+ "grad_norm": 8.498688697814941,
+ "learning_rate": 1.8479878156647606e-05,
+ "loss": 0.7551,
+ "step": 7431
+ },
+ {
+ "epoch": 20.250681198910083,
+ "grad_norm": 7.454466342926025,
+ "learning_rate": 1.847941038759711e-05,
+ "loss": 0.8337,
+ "step": 7432
+ },
+ {
+ "epoch": 20.25340599455041,
+ "grad_norm": 7.318837642669678,
+ "learning_rate": 1.847894255250924e-05,
+ "loss": 0.6942,
+ "step": 7433
+ },
+ {
+ "epoch": 20.256130790190735,
+ "grad_norm": 8.633078575134277,
+ "learning_rate": 1.8478474651387633e-05,
+ "loss": 0.774,
+ "step": 7434
+ },
+ {
+ "epoch": 20.258855585831064,
+ "grad_norm": 17.29705238342285,
+ "learning_rate": 1.8478006684235944e-05,
+ "loss": 0.826,
+ "step": 7435
+ },
+ {
+ "epoch": 20.26158038147139,
+ "grad_norm": 7.4252848625183105,
+ "learning_rate": 1.8477538651057812e-05,
+ "loss": 0.6229,
+ "step": 7436
+ },
+ {
+ "epoch": 20.264305177111716,
+ "grad_norm": 7.693795680999756,
+ "learning_rate": 1.847707055185688e-05,
+ "loss": 0.6783,
+ "step": 7437
+ },
+ {
+ "epoch": 20.267029972752045,
+ "grad_norm": 10.12563705444336,
+ "learning_rate": 1.8476602386636795e-05,
+ "loss": 0.7482,
+ "step": 7438
+ },
+ {
+ "epoch": 20.26975476839237,
+ "grad_norm": 7.601416110992432,
+ "learning_rate": 1.8476134155401202e-05,
+ "loss": 0.6664,
+ "step": 7439
+ },
+ {
+ "epoch": 20.272479564032697,
+ "grad_norm": 8.094047546386719,
+ "learning_rate": 1.8475665858153752e-05,
+ "loss": 0.734,
+ "step": 7440
+ },
+ {
+ "epoch": 20.275204359673026,
+ "grad_norm": 6.953584671020508,
+ "learning_rate": 1.847519749489809e-05,
+ "loss": 0.7358,
+ "step": 7441
+ },
+ {
+ "epoch": 20.277929155313352,
+ "grad_norm": 8.376222610473633,
+ "learning_rate": 1.8474729065637858e-05,
+ "loss": 0.8031,
+ "step": 7442
+ },
+ {
+ "epoch": 20.280653950953678,
+ "grad_norm": 10.219070434570312,
+ "learning_rate": 1.847426057037671e-05,
+ "loss": 0.8011,
+ "step": 7443
+ },
+ {
+ "epoch": 20.283378746594007,
+ "grad_norm": 10.703056335449219,
+ "learning_rate": 1.8473792009118297e-05,
+ "loss": 0.7283,
+ "step": 7444
+ },
+ {
+ "epoch": 20.286103542234333,
+ "grad_norm": 8.556020736694336,
+ "learning_rate": 1.8473323381866262e-05,
+ "loss": 0.7957,
+ "step": 7445
+ },
+ {
+ "epoch": 20.28882833787466,
+ "grad_norm": 9.588483810424805,
+ "learning_rate": 1.8472854688624255e-05,
+ "loss": 0.6652,
+ "step": 7446
+ },
+ {
+ "epoch": 20.291553133514988,
+ "grad_norm": 7.484055042266846,
+ "learning_rate": 1.847238592939593e-05,
+ "loss": 0.7836,
+ "step": 7447
+ },
+ {
+ "epoch": 20.294277929155314,
+ "grad_norm": 7.0402421951293945,
+ "learning_rate": 1.847191710418494e-05,
+ "loss": 0.7645,
+ "step": 7448
+ },
+ {
+ "epoch": 20.29700272479564,
+ "grad_norm": 7.735825061798096,
+ "learning_rate": 1.8471448212994927e-05,
+ "loss": 0.7928,
+ "step": 7449
+ },
+ {
+ "epoch": 20.29972752043597,
+ "grad_norm": 8.195221900939941,
+ "learning_rate": 1.847097925582955e-05,
+ "loss": 0.8018,
+ "step": 7450
+ },
+ {
+ "epoch": 20.302452316076295,
+ "grad_norm": 8.101825714111328,
+ "learning_rate": 1.847051023269246e-05,
+ "loss": 0.6886,
+ "step": 7451
+ },
+ {
+ "epoch": 20.30517711171662,
+ "grad_norm": 9.327179908752441,
+ "learning_rate": 1.8470041143587307e-05,
+ "loss": 0.9258,
+ "step": 7452
+ },
+ {
+ "epoch": 20.30790190735695,
+ "grad_norm": 8.218055725097656,
+ "learning_rate": 1.846957198851775e-05,
+ "loss": 0.8246,
+ "step": 7453
+ },
+ {
+ "epoch": 20.310626702997276,
+ "grad_norm": 6.9764580726623535,
+ "learning_rate": 1.8469102767487434e-05,
+ "loss": 0.7168,
+ "step": 7454
+ },
+ {
+ "epoch": 20.3133514986376,
+ "grad_norm": 9.409618377685547,
+ "learning_rate": 1.8468633480500024e-05,
+ "loss": 0.8809,
+ "step": 7455
+ },
+ {
+ "epoch": 20.31607629427793,
+ "grad_norm": 7.560911178588867,
+ "learning_rate": 1.8468164127559162e-05,
+ "loss": 0.7257,
+ "step": 7456
+ },
+ {
+ "epoch": 20.318801089918257,
+ "grad_norm": 7.362529277801514,
+ "learning_rate": 1.8467694708668516e-05,
+ "loss": 0.8376,
+ "step": 7457
+ },
+ {
+ "epoch": 20.321525885558582,
+ "grad_norm": 8.374099731445312,
+ "learning_rate": 1.8467225223831733e-05,
+ "loss": 0.7881,
+ "step": 7458
+ },
+ {
+ "epoch": 20.32425068119891,
+ "grad_norm": 9.146530151367188,
+ "learning_rate": 1.8466755673052472e-05,
+ "loss": 0.781,
+ "step": 7459
+ },
+ {
+ "epoch": 20.326975476839237,
+ "grad_norm": 8.215435981750488,
+ "learning_rate": 1.8466286056334394e-05,
+ "loss": 0.9,
+ "step": 7460
+ },
+ {
+ "epoch": 20.329700272479563,
+ "grad_norm": 8.195052146911621,
+ "learning_rate": 1.846581637368115e-05,
+ "loss": 0.7197,
+ "step": 7461
+ },
+ {
+ "epoch": 20.332425068119893,
+ "grad_norm": 8.552736282348633,
+ "learning_rate": 1.84653466250964e-05,
+ "loss": 0.7437,
+ "step": 7462
+ },
+ {
+ "epoch": 20.33514986376022,
+ "grad_norm": 7.810488224029541,
+ "learning_rate": 1.8464876810583806e-05,
+ "loss": 0.7225,
+ "step": 7463
+ },
+ {
+ "epoch": 20.337874659400544,
+ "grad_norm": 9.693074226379395,
+ "learning_rate": 1.846440693014702e-05,
+ "loss": 0.9473,
+ "step": 7464
+ },
+ {
+ "epoch": 20.340599455040874,
+ "grad_norm": 8.138737678527832,
+ "learning_rate": 1.8463936983789706e-05,
+ "loss": 0.8163,
+ "step": 7465
+ },
+ {
+ "epoch": 20.3433242506812,
+ "grad_norm": 9.098084449768066,
+ "learning_rate": 1.8463466971515525e-05,
+ "loss": 0.7632,
+ "step": 7466
+ },
+ {
+ "epoch": 20.346049046321525,
+ "grad_norm": 8.016382217407227,
+ "learning_rate": 1.8462996893328134e-05,
+ "loss": 0.7781,
+ "step": 7467
+ },
+ {
+ "epoch": 20.348773841961854,
+ "grad_norm": 9.49134349822998,
+ "learning_rate": 1.84625267492312e-05,
+ "loss": 0.8644,
+ "step": 7468
+ },
+ {
+ "epoch": 20.35149863760218,
+ "grad_norm": 7.997730255126953,
+ "learning_rate": 1.8462056539228378e-05,
+ "loss": 0.7477,
+ "step": 7469
+ },
+ {
+ "epoch": 20.354223433242506,
+ "grad_norm": 7.561858177185059,
+ "learning_rate": 1.8461586263323327e-05,
+ "loss": 0.876,
+ "step": 7470
+ },
+ {
+ "epoch": 20.356948228882835,
+ "grad_norm": 9.587177276611328,
+ "learning_rate": 1.846111592151972e-05,
+ "loss": 0.5931,
+ "step": 7471
+ },
+ {
+ "epoch": 20.35967302452316,
+ "grad_norm": 10.550204277038574,
+ "learning_rate": 1.846064551382121e-05,
+ "loss": 0.9094,
+ "step": 7472
+ },
+ {
+ "epoch": 20.362397820163487,
+ "grad_norm": 9.21194839477539,
+ "learning_rate": 1.8460175040231468e-05,
+ "loss": 0.8365,
+ "step": 7473
+ },
+ {
+ "epoch": 20.365122615803816,
+ "grad_norm": 8.397749900817871,
+ "learning_rate": 1.8459704500754155e-05,
+ "loss": 0.7267,
+ "step": 7474
+ },
+ {
+ "epoch": 20.367847411444142,
+ "grad_norm": 8.124926567077637,
+ "learning_rate": 1.8459233895392933e-05,
+ "loss": 0.7791,
+ "step": 7475
+ },
+ {
+ "epoch": 20.370572207084468,
+ "grad_norm": 7.280975341796875,
+ "learning_rate": 1.8458763224151476e-05,
+ "loss": 1.043,
+ "step": 7476
+ },
+ {
+ "epoch": 20.373297002724797,
+ "grad_norm": 8.212790489196777,
+ "learning_rate": 1.845829248703344e-05,
+ "loss": 0.7695,
+ "step": 7477
+ },
+ {
+ "epoch": 20.376021798365123,
+ "grad_norm": 8.955096244812012,
+ "learning_rate": 1.8457821684042492e-05,
+ "loss": 0.8295,
+ "step": 7478
+ },
+ {
+ "epoch": 20.37874659400545,
+ "grad_norm": 8.780290603637695,
+ "learning_rate": 1.8457350815182303e-05,
+ "loss": 0.7451,
+ "step": 7479
+ },
+ {
+ "epoch": 20.381471389645778,
+ "grad_norm": 7.5337090492248535,
+ "learning_rate": 1.8456879880456537e-05,
+ "loss": 0.7841,
+ "step": 7480
+ },
+ {
+ "epoch": 20.384196185286104,
+ "grad_norm": 8.871101379394531,
+ "learning_rate": 1.8456408879868864e-05,
+ "loss": 0.8707,
+ "step": 7481
+ },
+ {
+ "epoch": 20.38692098092643,
+ "grad_norm": 16.11921501159668,
+ "learning_rate": 1.845593781342295e-05,
+ "loss": 0.6917,
+ "step": 7482
+ },
+ {
+ "epoch": 20.38964577656676,
+ "grad_norm": 8.842729568481445,
+ "learning_rate": 1.8455466681122463e-05,
+ "loss": 0.785,
+ "step": 7483
+ },
+ {
+ "epoch": 20.392370572207085,
+ "grad_norm": 8.087883949279785,
+ "learning_rate": 1.8454995482971077e-05,
+ "loss": 0.8903,
+ "step": 7484
+ },
+ {
+ "epoch": 20.39509536784741,
+ "grad_norm": 8.730992317199707,
+ "learning_rate": 1.8454524218972457e-05,
+ "loss": 0.8339,
+ "step": 7485
+ },
+ {
+ "epoch": 20.39782016348774,
+ "grad_norm": 8.91746997833252,
+ "learning_rate": 1.8454052889130273e-05,
+ "loss": 0.8063,
+ "step": 7486
+ },
+ {
+ "epoch": 20.400544959128066,
+ "grad_norm": 9.099474906921387,
+ "learning_rate": 1.84535814934482e-05,
+ "loss": 0.787,
+ "step": 7487
+ },
+ {
+ "epoch": 20.40326975476839,
+ "grad_norm": 10.209683418273926,
+ "learning_rate": 1.84531100319299e-05,
+ "loss": 0.9791,
+ "step": 7488
+ },
+ {
+ "epoch": 20.40599455040872,
+ "grad_norm": 7.775052070617676,
+ "learning_rate": 1.8452638504579056e-05,
+ "loss": 0.6804,
+ "step": 7489
+ },
+ {
+ "epoch": 20.408719346049047,
+ "grad_norm": 9.734155654907227,
+ "learning_rate": 1.8452166911399336e-05,
+ "loss": 0.7009,
+ "step": 7490
+ },
+ {
+ "epoch": 20.411444141689373,
+ "grad_norm": 7.811398506164551,
+ "learning_rate": 1.8451695252394413e-05,
+ "loss": 0.8672,
+ "step": 7491
+ },
+ {
+ "epoch": 20.414168937329702,
+ "grad_norm": 9.408904075622559,
+ "learning_rate": 1.8451223527567956e-05,
+ "loss": 0.9297,
+ "step": 7492
+ },
+ {
+ "epoch": 20.416893732970028,
+ "grad_norm": 12.2958402633667,
+ "learning_rate": 1.8450751736923644e-05,
+ "loss": 0.8146,
+ "step": 7493
+ },
+ {
+ "epoch": 20.419618528610354,
+ "grad_norm": 8.134531021118164,
+ "learning_rate": 1.845027988046515e-05,
+ "loss": 0.8298,
+ "step": 7494
+ },
+ {
+ "epoch": 20.422343324250683,
+ "grad_norm": 11.866950035095215,
+ "learning_rate": 1.844980795819615e-05,
+ "loss": 0.9991,
+ "step": 7495
+ },
+ {
+ "epoch": 20.42506811989101,
+ "grad_norm": 9.131204605102539,
+ "learning_rate": 1.844933597012031e-05,
+ "loss": 0.8635,
+ "step": 7496
+ },
+ {
+ "epoch": 20.427792915531334,
+ "grad_norm": 7.015655040740967,
+ "learning_rate": 1.8448863916241324e-05,
+ "loss": 0.6737,
+ "step": 7497
+ },
+ {
+ "epoch": 20.430517711171664,
+ "grad_norm": 8.82425308227539,
+ "learning_rate": 1.844839179656285e-05,
+ "loss": 0.7856,
+ "step": 7498
+ },
+ {
+ "epoch": 20.43324250681199,
+ "grad_norm": 8.597686767578125,
+ "learning_rate": 1.8447919611088574e-05,
+ "loss": 0.8732,
+ "step": 7499
+ },
+ {
+ "epoch": 20.435967302452315,
+ "grad_norm": 8.5596342086792,
+ "learning_rate": 1.8447447359822172e-05,
+ "loss": 0.7124,
+ "step": 7500
+ },
+ {
+ "epoch": 20.438692098092645,
+ "grad_norm": 10.065719604492188,
+ "learning_rate": 1.844697504276732e-05,
+ "loss": 0.8853,
+ "step": 7501
+ },
+ {
+ "epoch": 20.44141689373297,
+ "grad_norm": 7.822795867919922,
+ "learning_rate": 1.8446502659927702e-05,
+ "loss": 0.7365,
+ "step": 7502
+ },
+ {
+ "epoch": 20.444141689373296,
+ "grad_norm": 9.746071815490723,
+ "learning_rate": 1.8446030211306993e-05,
+ "loss": 0.6361,
+ "step": 7503
+ },
+ {
+ "epoch": 20.446866485013626,
+ "grad_norm": 8.904976844787598,
+ "learning_rate": 1.8445557696908874e-05,
+ "loss": 0.8429,
+ "step": 7504
+ },
+ {
+ "epoch": 20.44959128065395,
+ "grad_norm": 14.334179878234863,
+ "learning_rate": 1.844508511673702e-05,
+ "loss": 0.7555,
+ "step": 7505
+ },
+ {
+ "epoch": 20.452316076294277,
+ "grad_norm": 8.744474411010742,
+ "learning_rate": 1.8444612470795114e-05,
+ "loss": 0.8788,
+ "step": 7506
+ },
+ {
+ "epoch": 20.455040871934607,
+ "grad_norm": 8.65246295928955,
+ "learning_rate": 1.844413975908684e-05,
+ "loss": 0.7695,
+ "step": 7507
+ },
+ {
+ "epoch": 20.457765667574932,
+ "grad_norm": 8.80207633972168,
+ "learning_rate": 1.844366698161588e-05,
+ "loss": 0.6603,
+ "step": 7508
+ },
+ {
+ "epoch": 20.460490463215258,
+ "grad_norm": 8.420857429504395,
+ "learning_rate": 1.844319413838591e-05,
+ "loss": 0.8613,
+ "step": 7509
+ },
+ {
+ "epoch": 20.463215258855588,
+ "grad_norm": 9.497468948364258,
+ "learning_rate": 1.8442721229400615e-05,
+ "loss": 0.7391,
+ "step": 7510
+ },
+ {
+ "epoch": 20.465940054495913,
+ "grad_norm": 16.942873001098633,
+ "learning_rate": 1.844224825466368e-05,
+ "loss": 0.8069,
+ "step": 7511
+ },
+ {
+ "epoch": 20.46866485013624,
+ "grad_norm": 9.093857765197754,
+ "learning_rate": 1.8441775214178784e-05,
+ "loss": 0.7908,
+ "step": 7512
+ },
+ {
+ "epoch": 20.47138964577657,
+ "grad_norm": 8.484370231628418,
+ "learning_rate": 1.844130210794962e-05,
+ "loss": 0.8571,
+ "step": 7513
+ },
+ {
+ "epoch": 20.474114441416894,
+ "grad_norm": 7.775330066680908,
+ "learning_rate": 1.8440828935979865e-05,
+ "loss": 0.795,
+ "step": 7514
+ },
+ {
+ "epoch": 20.47683923705722,
+ "grad_norm": 10.508936882019043,
+ "learning_rate": 1.8440355698273203e-05,
+ "loss": 0.8212,
+ "step": 7515
+ },
+ {
+ "epoch": 20.479564032697546,
+ "grad_norm": 9.015315055847168,
+ "learning_rate": 1.843988239483333e-05,
+ "loss": 0.6935,
+ "step": 7516
+ },
+ {
+ "epoch": 20.482288828337875,
+ "grad_norm": 9.50527286529541,
+ "learning_rate": 1.8439409025663915e-05,
+ "loss": 0.8352,
+ "step": 7517
+ },
+ {
+ "epoch": 20.4850136239782,
+ "grad_norm": 10.273641586303711,
+ "learning_rate": 1.8438935590768658e-05,
+ "loss": 0.8578,
+ "step": 7518
+ },
+ {
+ "epoch": 20.48773841961853,
+ "grad_norm": 7.911138534545898,
+ "learning_rate": 1.8438462090151247e-05,
+ "loss": 0.8323,
+ "step": 7519
+ },
+ {
+ "epoch": 20.490463215258856,
+ "grad_norm": 8.356745719909668,
+ "learning_rate": 1.843798852381536e-05,
+ "loss": 0.7462,
+ "step": 7520
+ },
+ {
+ "epoch": 20.493188010899182,
+ "grad_norm": 9.9681978225708,
+ "learning_rate": 1.843751489176469e-05,
+ "loss": 0.7948,
+ "step": 7521
+ },
+ {
+ "epoch": 20.495912806539508,
+ "grad_norm": 8.1953763961792,
+ "learning_rate": 1.8437041194002924e-05,
+ "loss": 0.6564,
+ "step": 7522
+ },
+ {
+ "epoch": 20.498637602179837,
+ "grad_norm": 10.268936157226562,
+ "learning_rate": 1.8436567430533757e-05,
+ "loss": 0.8291,
+ "step": 7523
+ },
+ {
+ "epoch": 20.501362397820163,
+ "grad_norm": 11.004013061523438,
+ "learning_rate": 1.8436093601360872e-05,
+ "loss": 0.9343,
+ "step": 7524
+ },
+ {
+ "epoch": 20.504087193460492,
+ "grad_norm": 10.917760848999023,
+ "learning_rate": 1.843561970648796e-05,
+ "loss": 0.7391,
+ "step": 7525
+ },
+ {
+ "epoch": 20.506811989100818,
+ "grad_norm": 11.350653648376465,
+ "learning_rate": 1.8435145745918713e-05,
+ "loss": 0.6913,
+ "step": 7526
+ },
+ {
+ "epoch": 20.509536784741144,
+ "grad_norm": 10.579289436340332,
+ "learning_rate": 1.8434671719656826e-05,
+ "loss": 0.7494,
+ "step": 7527
+ },
+ {
+ "epoch": 20.51226158038147,
+ "grad_norm": 11.816920280456543,
+ "learning_rate": 1.843419762770599e-05,
+ "loss": 1.0459,
+ "step": 7528
+ },
+ {
+ "epoch": 20.5149863760218,
+ "grad_norm": 11.840269088745117,
+ "learning_rate": 1.8433723470069888e-05,
+ "loss": 0.8867,
+ "step": 7529
+ },
+ {
+ "epoch": 20.517711171662125,
+ "grad_norm": 8.952495574951172,
+ "learning_rate": 1.843324924675222e-05,
+ "loss": 0.7943,
+ "step": 7530
+ },
+ {
+ "epoch": 20.520435967302454,
+ "grad_norm": 9.813703536987305,
+ "learning_rate": 1.8432774957756677e-05,
+ "loss": 0.797,
+ "step": 7531
+ },
+ {
+ "epoch": 20.52316076294278,
+ "grad_norm": 16.976900100708008,
+ "learning_rate": 1.8432300603086957e-05,
+ "loss": 0.9147,
+ "step": 7532
+ },
+ {
+ "epoch": 20.525885558583106,
+ "grad_norm": 9.287324905395508,
+ "learning_rate": 1.843182618274675e-05,
+ "loss": 0.8871,
+ "step": 7533
+ },
+ {
+ "epoch": 20.52861035422343,
+ "grad_norm": 13.709163665771484,
+ "learning_rate": 1.8431351696739755e-05,
+ "loss": 0.7975,
+ "step": 7534
+ },
+ {
+ "epoch": 20.53133514986376,
+ "grad_norm": 9.606921195983887,
+ "learning_rate": 1.843087714506966e-05,
+ "loss": 0.8434,
+ "step": 7535
+ },
+ {
+ "epoch": 20.534059945504087,
+ "grad_norm": 12.49398422241211,
+ "learning_rate": 1.843040252774017e-05,
+ "loss": 0.7167,
+ "step": 7536
+ },
+ {
+ "epoch": 20.536784741144416,
+ "grad_norm": 7.58212423324585,
+ "learning_rate": 1.8429927844754972e-05,
+ "loss": 0.8987,
+ "step": 7537
+ },
+ {
+ "epoch": 20.539509536784742,
+ "grad_norm": 12.724702835083008,
+ "learning_rate": 1.842945309611777e-05,
+ "loss": 0.8319,
+ "step": 7538
+ },
+ {
+ "epoch": 20.542234332425068,
+ "grad_norm": 8.409048080444336,
+ "learning_rate": 1.8428978281832255e-05,
+ "loss": 0.7396,
+ "step": 7539
+ },
+ {
+ "epoch": 20.544959128065393,
+ "grad_norm": 9.053321838378906,
+ "learning_rate": 1.842850340190213e-05,
+ "loss": 0.8324,
+ "step": 7540
+ },
+ {
+ "epoch": 20.547683923705723,
+ "grad_norm": 7.629400730133057,
+ "learning_rate": 1.8428028456331093e-05,
+ "loss": 0.6138,
+ "step": 7541
+ },
+ {
+ "epoch": 20.55040871934605,
+ "grad_norm": 12.569177627563477,
+ "learning_rate": 1.8427553445122842e-05,
+ "loss": 0.7177,
+ "step": 7542
+ },
+ {
+ "epoch": 20.553133514986374,
+ "grad_norm": 7.9694132804870605,
+ "learning_rate": 1.8427078368281077e-05,
+ "loss": 0.8976,
+ "step": 7543
+ },
+ {
+ "epoch": 20.555858310626704,
+ "grad_norm": 8.255053520202637,
+ "learning_rate": 1.8426603225809493e-05,
+ "loss": 0.8405,
+ "step": 7544
+ },
+ {
+ "epoch": 20.55858310626703,
+ "grad_norm": 8.747611999511719,
+ "learning_rate": 1.8426128017711797e-05,
+ "loss": 0.9238,
+ "step": 7545
+ },
+ {
+ "epoch": 20.561307901907355,
+ "grad_norm": 10.35474681854248,
+ "learning_rate": 1.8425652743991688e-05,
+ "loss": 0.7651,
+ "step": 7546
+ },
+ {
+ "epoch": 20.564032697547685,
+ "grad_norm": 8.243481636047363,
+ "learning_rate": 1.8425177404652865e-05,
+ "loss": 0.7662,
+ "step": 7547
+ },
+ {
+ "epoch": 20.56675749318801,
+ "grad_norm": 10.073675155639648,
+ "learning_rate": 1.842470199969903e-05,
+ "loss": 0.6719,
+ "step": 7548
+ },
+ {
+ "epoch": 20.569482288828336,
+ "grad_norm": 7.270785808563232,
+ "learning_rate": 1.842422652913389e-05,
+ "loss": 0.6927,
+ "step": 7549
+ },
+ {
+ "epoch": 20.572207084468666,
+ "grad_norm": 11.287145614624023,
+ "learning_rate": 1.8423750992961143e-05,
+ "loss": 0.8513,
+ "step": 7550
+ },
+ {
+ "epoch": 20.57493188010899,
+ "grad_norm": 8.997488021850586,
+ "learning_rate": 1.8423275391184496e-05,
+ "loss": 0.795,
+ "step": 7551
+ },
+ {
+ "epoch": 20.577656675749317,
+ "grad_norm": 11.46519660949707,
+ "learning_rate": 1.842279972380765e-05,
+ "loss": 0.7411,
+ "step": 7552
+ },
+ {
+ "epoch": 20.580381471389646,
+ "grad_norm": 9.471609115600586,
+ "learning_rate": 1.842232399083431e-05,
+ "loss": 0.812,
+ "step": 7553
+ },
+ {
+ "epoch": 20.583106267029972,
+ "grad_norm": 9.562443733215332,
+ "learning_rate": 1.8421848192268187e-05,
+ "loss": 0.743,
+ "step": 7554
+ },
+ {
+ "epoch": 20.585831062670298,
+ "grad_norm": 8.251599311828613,
+ "learning_rate": 1.8421372328112974e-05,
+ "loss": 0.7606,
+ "step": 7555
+ },
+ {
+ "epoch": 20.588555858310627,
+ "grad_norm": 8.16517162322998,
+ "learning_rate": 1.842089639837239e-05,
+ "loss": 0.8248,
+ "step": 7556
+ },
+ {
+ "epoch": 20.591280653950953,
+ "grad_norm": 8.494513511657715,
+ "learning_rate": 1.8420420403050134e-05,
+ "loss": 0.7952,
+ "step": 7557
+ },
+ {
+ "epoch": 20.59400544959128,
+ "grad_norm": 9.98038387298584,
+ "learning_rate": 1.8419944342149913e-05,
+ "loss": 0.8759,
+ "step": 7558
+ },
+ {
+ "epoch": 20.59673024523161,
+ "grad_norm": 10.59455680847168,
+ "learning_rate": 1.8419468215675437e-05,
+ "loss": 0.962,
+ "step": 7559
+ },
+ {
+ "epoch": 20.599455040871934,
+ "grad_norm": 10.139543533325195,
+ "learning_rate": 1.8418992023630416e-05,
+ "loss": 0.778,
+ "step": 7560
+ },
+ {
+ "epoch": 20.60217983651226,
+ "grad_norm": 8.193345069885254,
+ "learning_rate": 1.8418515766018553e-05,
+ "loss": 0.6841,
+ "step": 7561
+ },
+ {
+ "epoch": 20.60490463215259,
+ "grad_norm": 8.825242042541504,
+ "learning_rate": 1.8418039442843562e-05,
+ "loss": 0.8464,
+ "step": 7562
+ },
+ {
+ "epoch": 20.607629427792915,
+ "grad_norm": 9.617834091186523,
+ "learning_rate": 1.8417563054109153e-05,
+ "loss": 0.7627,
+ "step": 7563
+ },
+ {
+ "epoch": 20.61035422343324,
+ "grad_norm": 12.968689918518066,
+ "learning_rate": 1.8417086599819028e-05,
+ "loss": 0.847,
+ "step": 7564
+ },
+ {
+ "epoch": 20.61307901907357,
+ "grad_norm": 7.965363025665283,
+ "learning_rate": 1.841661007997691e-05,
+ "loss": 0.7997,
+ "step": 7565
+ },
+ {
+ "epoch": 20.615803814713896,
+ "grad_norm": 8.659131050109863,
+ "learning_rate": 1.84161334945865e-05,
+ "loss": 0.745,
+ "step": 7566
+ },
+ {
+ "epoch": 20.618528610354222,
+ "grad_norm": 11.7770357131958,
+ "learning_rate": 1.8415656843651514e-05,
+ "loss": 0.6655,
+ "step": 7567
+ },
+ {
+ "epoch": 20.62125340599455,
+ "grad_norm": 8.190646171569824,
+ "learning_rate": 1.841518012717566e-05,
+ "loss": 0.8326,
+ "step": 7568
+ },
+ {
+ "epoch": 20.623978201634877,
+ "grad_norm": 6.952454090118408,
+ "learning_rate": 1.8414703345162656e-05,
+ "loss": 0.765,
+ "step": 7569
+ },
+ {
+ "epoch": 20.626702997275203,
+ "grad_norm": 8.603614807128906,
+ "learning_rate": 1.8414226497616215e-05,
+ "loss": 0.7329,
+ "step": 7570
+ },
+ {
+ "epoch": 20.629427792915532,
+ "grad_norm": 11.186273574829102,
+ "learning_rate": 1.841374958454005e-05,
+ "loss": 0.9298,
+ "step": 7571
+ },
+ {
+ "epoch": 20.632152588555858,
+ "grad_norm": 15.902365684509277,
+ "learning_rate": 1.8413272605937872e-05,
+ "loss": 0.9056,
+ "step": 7572
+ },
+ {
+ "epoch": 20.634877384196184,
+ "grad_norm": 9.482760429382324,
+ "learning_rate": 1.8412795561813397e-05,
+ "loss": 0.7537,
+ "step": 7573
+ },
+ {
+ "epoch": 20.637602179836513,
+ "grad_norm": 7.537638187408447,
+ "learning_rate": 1.8412318452170344e-05,
+ "loss": 0.7407,
+ "step": 7574
+ },
+ {
+ "epoch": 20.64032697547684,
+ "grad_norm": 8.906112670898438,
+ "learning_rate": 1.8411841277012423e-05,
+ "loss": 0.8531,
+ "step": 7575
+ },
+ {
+ "epoch": 20.643051771117165,
+ "grad_norm": 9.597343444824219,
+ "learning_rate": 1.841136403634335e-05,
+ "loss": 0.7976,
+ "step": 7576
+ },
+ {
+ "epoch": 20.645776566757494,
+ "grad_norm": 8.042146682739258,
+ "learning_rate": 1.8410886730166848e-05,
+ "loss": 0.7957,
+ "step": 7577
+ },
+ {
+ "epoch": 20.64850136239782,
+ "grad_norm": 10.171354293823242,
+ "learning_rate": 1.841040935848663e-05,
+ "loss": 0.7577,
+ "step": 7578
+ },
+ {
+ "epoch": 20.651226158038146,
+ "grad_norm": 9.854966163635254,
+ "learning_rate": 1.840993192130642e-05,
+ "loss": 0.6897,
+ "step": 7579
+ },
+ {
+ "epoch": 20.653950953678475,
+ "grad_norm": 9.036667823791504,
+ "learning_rate": 1.8409454418629925e-05,
+ "loss": 0.6295,
+ "step": 7580
+ },
+ {
+ "epoch": 20.6566757493188,
+ "grad_norm": 13.81934642791748,
+ "learning_rate": 1.840897685046087e-05,
+ "loss": 0.8835,
+ "step": 7581
+ },
+ {
+ "epoch": 20.659400544959126,
+ "grad_norm": 12.976028442382812,
+ "learning_rate": 1.8408499216802974e-05,
+ "loss": 0.8418,
+ "step": 7582
+ },
+ {
+ "epoch": 20.662125340599456,
+ "grad_norm": 9.331933975219727,
+ "learning_rate": 1.840802151765996e-05,
+ "loss": 0.6176,
+ "step": 7583
+ },
+ {
+ "epoch": 20.66485013623978,
+ "grad_norm": 10.498309135437012,
+ "learning_rate": 1.840754375303554e-05,
+ "loss": 0.8578,
+ "step": 7584
+ },
+ {
+ "epoch": 20.667574931880107,
+ "grad_norm": 9.227131843566895,
+ "learning_rate": 1.840706592293344e-05,
+ "loss": 0.848,
+ "step": 7585
+ },
+ {
+ "epoch": 20.670299727520437,
+ "grad_norm": 9.691853523254395,
+ "learning_rate": 1.8406588027357383e-05,
+ "loss": 0.9496,
+ "step": 7586
+ },
+ {
+ "epoch": 20.673024523160763,
+ "grad_norm": 8.21297550201416,
+ "learning_rate": 1.8406110066311093e-05,
+ "loss": 0.835,
+ "step": 7587
+ },
+ {
+ "epoch": 20.67574931880109,
+ "grad_norm": 8.179823875427246,
+ "learning_rate": 1.8405632039798283e-05,
+ "loss": 0.892,
+ "step": 7588
+ },
+ {
+ "epoch": 20.678474114441418,
+ "grad_norm": 12.935137748718262,
+ "learning_rate": 1.840515394782268e-05,
+ "loss": 0.8531,
+ "step": 7589
+ },
+ {
+ "epoch": 20.681198910081743,
+ "grad_norm": 11.246734619140625,
+ "learning_rate": 1.8404675790388017e-05,
+ "loss": 1.0269,
+ "step": 7590
+ },
+ {
+ "epoch": 20.68392370572207,
+ "grad_norm": 9.77748966217041,
+ "learning_rate": 1.8404197567498e-05,
+ "loss": 0.9647,
+ "step": 7591
+ },
+ {
+ "epoch": 20.6866485013624,
+ "grad_norm": 9.248991966247559,
+ "learning_rate": 1.840371927915637e-05,
+ "loss": 0.7554,
+ "step": 7592
+ },
+ {
+ "epoch": 20.689373297002724,
+ "grad_norm": 10.35046100616455,
+ "learning_rate": 1.8403240925366842e-05,
+ "loss": 0.7442,
+ "step": 7593
+ },
+ {
+ "epoch": 20.69209809264305,
+ "grad_norm": 8.65871524810791,
+ "learning_rate": 1.8402762506133145e-05,
+ "loss": 0.7538,
+ "step": 7594
+ },
+ {
+ "epoch": 20.69482288828338,
+ "grad_norm": 13.182056427001953,
+ "learning_rate": 1.8402284021459e-05,
+ "loss": 0.7523,
+ "step": 7595
+ },
+ {
+ "epoch": 20.697547683923705,
+ "grad_norm": 9.477316856384277,
+ "learning_rate": 1.840180547134814e-05,
+ "loss": 0.864,
+ "step": 7596
+ },
+ {
+ "epoch": 20.70027247956403,
+ "grad_norm": 9.479179382324219,
+ "learning_rate": 1.8401326855804293e-05,
+ "loss": 0.7625,
+ "step": 7597
+ },
+ {
+ "epoch": 20.70299727520436,
+ "grad_norm": 10.778131484985352,
+ "learning_rate": 1.8400848174831178e-05,
+ "loss": 0.7231,
+ "step": 7598
+ },
+ {
+ "epoch": 20.705722070844686,
+ "grad_norm": 9.457087516784668,
+ "learning_rate": 1.840036942843253e-05,
+ "loss": 0.9269,
+ "step": 7599
+ },
+ {
+ "epoch": 20.708446866485012,
+ "grad_norm": 8.120590209960938,
+ "learning_rate": 1.8399890616612073e-05,
+ "loss": 0.8187,
+ "step": 7600
+ },
+ {
+ "epoch": 20.71117166212534,
+ "grad_norm": 9.013141632080078,
+ "learning_rate": 1.839941173937354e-05,
+ "loss": 0.7363,
+ "step": 7601
+ },
+ {
+ "epoch": 20.713896457765667,
+ "grad_norm": 11.750839233398438,
+ "learning_rate": 1.839893279672066e-05,
+ "loss": 0.8936,
+ "step": 7602
+ },
+ {
+ "epoch": 20.716621253405993,
+ "grad_norm": 8.871647834777832,
+ "learning_rate": 1.839845378865716e-05,
+ "loss": 0.9536,
+ "step": 7603
+ },
+ {
+ "epoch": 20.719346049046322,
+ "grad_norm": 8.749375343322754,
+ "learning_rate": 1.839797471518677e-05,
+ "loss": 0.9968,
+ "step": 7604
+ },
+ {
+ "epoch": 20.722070844686648,
+ "grad_norm": 10.805994987487793,
+ "learning_rate": 1.8397495576313226e-05,
+ "loss": 0.8442,
+ "step": 7605
+ },
+ {
+ "epoch": 20.724795640326974,
+ "grad_norm": 11.166732788085938,
+ "learning_rate": 1.8397016372040256e-05,
+ "loss": 0.7979,
+ "step": 7606
+ },
+ {
+ "epoch": 20.727520435967303,
+ "grad_norm": 7.917816638946533,
+ "learning_rate": 1.8396537102371593e-05,
+ "loss": 0.6642,
+ "step": 7607
+ },
+ {
+ "epoch": 20.73024523160763,
+ "grad_norm": 8.999839782714844,
+ "learning_rate": 1.839605776731097e-05,
+ "loss": 0.8108,
+ "step": 7608
+ },
+ {
+ "epoch": 20.732970027247955,
+ "grad_norm": 11.270936965942383,
+ "learning_rate": 1.839557836686212e-05,
+ "loss": 0.8053,
+ "step": 7609
+ },
+ {
+ "epoch": 20.735694822888284,
+ "grad_norm": 8.101061820983887,
+ "learning_rate": 1.8395098901028774e-05,
+ "loss": 0.7604,
+ "step": 7610
+ },
+ {
+ "epoch": 20.73841961852861,
+ "grad_norm": 9.721184730529785,
+ "learning_rate": 1.8394619369814666e-05,
+ "loss": 0.9728,
+ "step": 7611
+ },
+ {
+ "epoch": 20.741144414168936,
+ "grad_norm": 8.81428337097168,
+ "learning_rate": 1.8394139773223537e-05,
+ "loss": 0.8023,
+ "step": 7612
+ },
+ {
+ "epoch": 20.743869209809265,
+ "grad_norm": 9.245955467224121,
+ "learning_rate": 1.8393660111259116e-05,
+ "loss": 0.8396,
+ "step": 7613
+ },
+ {
+ "epoch": 20.74659400544959,
+ "grad_norm": 15.609857559204102,
+ "learning_rate": 1.839318038392514e-05,
+ "loss": 0.9071,
+ "step": 7614
+ },
+ {
+ "epoch": 20.749318801089917,
+ "grad_norm": 7.997469902038574,
+ "learning_rate": 1.8392700591225346e-05,
+ "loss": 0.8051,
+ "step": 7615
+ },
+ {
+ "epoch": 20.752043596730246,
+ "grad_norm": 7.729000091552734,
+ "learning_rate": 1.8392220733163467e-05,
+ "loss": 0.7467,
+ "step": 7616
+ },
+ {
+ "epoch": 20.754768392370572,
+ "grad_norm": 7.590522766113281,
+ "learning_rate": 1.8391740809743245e-05,
+ "loss": 0.8373,
+ "step": 7617
+ },
+ {
+ "epoch": 20.757493188010898,
+ "grad_norm": 8.049286842346191,
+ "learning_rate": 1.8391260820968417e-05,
+ "loss": 0.7924,
+ "step": 7618
+ },
+ {
+ "epoch": 20.760217983651227,
+ "grad_norm": 8.123289108276367,
+ "learning_rate": 1.8390780766842717e-05,
+ "loss": 0.8227,
+ "step": 7619
+ },
+ {
+ "epoch": 20.762942779291553,
+ "grad_norm": 8.064492225646973,
+ "learning_rate": 1.839030064736989e-05,
+ "loss": 0.7632,
+ "step": 7620
+ },
+ {
+ "epoch": 20.76566757493188,
+ "grad_norm": 11.855932235717773,
+ "learning_rate": 1.838982046255367e-05,
+ "loss": 0.6485,
+ "step": 7621
+ },
+ {
+ "epoch": 20.768392370572208,
+ "grad_norm": 8.009469032287598,
+ "learning_rate": 1.8389340212397797e-05,
+ "loss": 0.6338,
+ "step": 7622
+ },
+ {
+ "epoch": 20.771117166212534,
+ "grad_norm": 8.831151008605957,
+ "learning_rate": 1.8388859896906014e-05,
+ "loss": 0.6919,
+ "step": 7623
+ },
+ {
+ "epoch": 20.77384196185286,
+ "grad_norm": 7.897984504699707,
+ "learning_rate": 1.838837951608206e-05,
+ "loss": 0.8043,
+ "step": 7624
+ },
+ {
+ "epoch": 20.77656675749319,
+ "grad_norm": 7.134253025054932,
+ "learning_rate": 1.8387899069929673e-05,
+ "loss": 0.8281,
+ "step": 7625
+ },
+ {
+ "epoch": 20.779291553133515,
+ "grad_norm": 8.043962478637695,
+ "learning_rate": 1.8387418558452602e-05,
+ "loss": 1.0161,
+ "step": 7626
+ },
+ {
+ "epoch": 20.78201634877384,
+ "grad_norm": 9.967580795288086,
+ "learning_rate": 1.8386937981654583e-05,
+ "loss": 0.7574,
+ "step": 7627
+ },
+ {
+ "epoch": 20.78474114441417,
+ "grad_norm": 9.644227981567383,
+ "learning_rate": 1.8386457339539364e-05,
+ "loss": 0.6687,
+ "step": 7628
+ },
+ {
+ "epoch": 20.787465940054496,
+ "grad_norm": 8.344680786132812,
+ "learning_rate": 1.8385976632110684e-05,
+ "loss": 0.7148,
+ "step": 7629
+ },
+ {
+ "epoch": 20.79019073569482,
+ "grad_norm": 9.260910034179688,
+ "learning_rate": 1.8385495859372288e-05,
+ "loss": 0.9921,
+ "step": 7630
+ },
+ {
+ "epoch": 20.79291553133515,
+ "grad_norm": 6.6078314781188965,
+ "learning_rate": 1.8385015021327916e-05,
+ "loss": 0.9178,
+ "step": 7631
+ },
+ {
+ "epoch": 20.795640326975477,
+ "grad_norm": 10.556445121765137,
+ "learning_rate": 1.838453411798132e-05,
+ "loss": 0.8213,
+ "step": 7632
+ },
+ {
+ "epoch": 20.798365122615802,
+ "grad_norm": 8.5899019241333,
+ "learning_rate": 1.8384053149336243e-05,
+ "loss": 0.6635,
+ "step": 7633
+ },
+ {
+ "epoch": 20.80108991825613,
+ "grad_norm": 7.8474650382995605,
+ "learning_rate": 1.838357211539643e-05,
+ "loss": 0.7745,
+ "step": 7634
+ },
+ {
+ "epoch": 20.803814713896458,
+ "grad_norm": 7.122204303741455,
+ "learning_rate": 1.8383091016165626e-05,
+ "loss": 0.7743,
+ "step": 7635
+ },
+ {
+ "epoch": 20.806539509536783,
+ "grad_norm": 9.272528648376465,
+ "learning_rate": 1.838260985164758e-05,
+ "loss": 0.8671,
+ "step": 7636
+ },
+ {
+ "epoch": 20.809264305177113,
+ "grad_norm": 7.35139274597168,
+ "learning_rate": 1.8382128621846034e-05,
+ "loss": 0.9444,
+ "step": 7637
+ },
+ {
+ "epoch": 20.81198910081744,
+ "grad_norm": 9.256814956665039,
+ "learning_rate": 1.8381647326764744e-05,
+ "loss": 0.651,
+ "step": 7638
+ },
+ {
+ "epoch": 20.814713896457764,
+ "grad_norm": 8.758612632751465,
+ "learning_rate": 1.8381165966407456e-05,
+ "loss": 0.7474,
+ "step": 7639
+ },
+ {
+ "epoch": 20.817438692098094,
+ "grad_norm": 8.256421089172363,
+ "learning_rate": 1.8380684540777914e-05,
+ "loss": 0.6742,
+ "step": 7640
+ },
+ {
+ "epoch": 20.82016348773842,
+ "grad_norm": 7.075945854187012,
+ "learning_rate": 1.8380203049879872e-05,
+ "loss": 0.8121,
+ "step": 7641
+ },
+ {
+ "epoch": 20.822888283378745,
+ "grad_norm": 7.424861431121826,
+ "learning_rate": 1.8379721493717077e-05,
+ "loss": 0.7523,
+ "step": 7642
+ },
+ {
+ "epoch": 20.825613079019075,
+ "grad_norm": 8.83095932006836,
+ "learning_rate": 1.837923987229328e-05,
+ "loss": 0.8737,
+ "step": 7643
+ },
+ {
+ "epoch": 20.8283378746594,
+ "grad_norm": 9.214203834533691,
+ "learning_rate": 1.8378758185612237e-05,
+ "loss": 0.8524,
+ "step": 7644
+ },
+ {
+ "epoch": 20.831062670299726,
+ "grad_norm": 8.21826457977295,
+ "learning_rate": 1.8378276433677692e-05,
+ "loss": 0.7117,
+ "step": 7645
+ },
+ {
+ "epoch": 20.833787465940055,
+ "grad_norm": 8.080403327941895,
+ "learning_rate": 1.83777946164934e-05,
+ "loss": 0.7695,
+ "step": 7646
+ },
+ {
+ "epoch": 20.83651226158038,
+ "grad_norm": 7.988407611846924,
+ "learning_rate": 1.8377312734063113e-05,
+ "loss": 0.7418,
+ "step": 7647
+ },
+ {
+ "epoch": 20.839237057220707,
+ "grad_norm": 9.077837944030762,
+ "learning_rate": 1.8376830786390584e-05,
+ "loss": 0.6626,
+ "step": 7648
+ },
+ {
+ "epoch": 20.841961852861036,
+ "grad_norm": 8.081254959106445,
+ "learning_rate": 1.8376348773479568e-05,
+ "loss": 0.8218,
+ "step": 7649
+ },
+ {
+ "epoch": 20.844686648501362,
+ "grad_norm": 7.435146331787109,
+ "learning_rate": 1.8375866695333814e-05,
+ "loss": 0.9399,
+ "step": 7650
+ },
+ {
+ "epoch": 20.847411444141688,
+ "grad_norm": 7.113531112670898,
+ "learning_rate": 1.8375384551957084e-05,
+ "loss": 0.8247,
+ "step": 7651
+ },
+ {
+ "epoch": 20.850136239782017,
+ "grad_norm": 7.996152400970459,
+ "learning_rate": 1.8374902343353124e-05,
+ "loss": 0.5957,
+ "step": 7652
+ },
+ {
+ "epoch": 20.852861035422343,
+ "grad_norm": 8.345686912536621,
+ "learning_rate": 1.8374420069525697e-05,
+ "loss": 0.7369,
+ "step": 7653
+ },
+ {
+ "epoch": 20.85558583106267,
+ "grad_norm": 9.157774925231934,
+ "learning_rate": 1.8373937730478556e-05,
+ "loss": 0.8046,
+ "step": 7654
+ },
+ {
+ "epoch": 20.858310626703,
+ "grad_norm": 8.734550476074219,
+ "learning_rate": 1.8373455326215458e-05,
+ "loss": 0.8349,
+ "step": 7655
+ },
+ {
+ "epoch": 20.861035422343324,
+ "grad_norm": 9.237524032592773,
+ "learning_rate": 1.8372972856740157e-05,
+ "loss": 0.7737,
+ "step": 7656
+ },
+ {
+ "epoch": 20.86376021798365,
+ "grad_norm": 7.846309661865234,
+ "learning_rate": 1.8372490322056414e-05,
+ "loss": 0.7671,
+ "step": 7657
+ },
+ {
+ "epoch": 20.86648501362398,
+ "grad_norm": 7.726889610290527,
+ "learning_rate": 1.8372007722167987e-05,
+ "loss": 0.8007,
+ "step": 7658
+ },
+ {
+ "epoch": 20.869209809264305,
+ "grad_norm": 7.21893310546875,
+ "learning_rate": 1.8371525057078633e-05,
+ "loss": 0.7676,
+ "step": 7659
+ },
+ {
+ "epoch": 20.87193460490463,
+ "grad_norm": 7.970730304718018,
+ "learning_rate": 1.837104232679211e-05,
+ "loss": 0.8494,
+ "step": 7660
+ },
+ {
+ "epoch": 20.87465940054496,
+ "grad_norm": 6.842720031738281,
+ "learning_rate": 1.837055953131218e-05,
+ "loss": 0.9396,
+ "step": 7661
+ },
+ {
+ "epoch": 20.877384196185286,
+ "grad_norm": 8.219659805297852,
+ "learning_rate": 1.83700766706426e-05,
+ "loss": 0.9392,
+ "step": 7662
+ },
+ {
+ "epoch": 20.88010899182561,
+ "grad_norm": 7.09730863571167,
+ "learning_rate": 1.8369593744787135e-05,
+ "loss": 0.7419,
+ "step": 7663
+ },
+ {
+ "epoch": 20.88283378746594,
+ "grad_norm": 7.974386215209961,
+ "learning_rate": 1.836911075374954e-05,
+ "loss": 0.7454,
+ "step": 7664
+ },
+ {
+ "epoch": 20.885558583106267,
+ "grad_norm": 7.594198226928711,
+ "learning_rate": 1.8368627697533583e-05,
+ "loss": 0.7988,
+ "step": 7665
+ },
+ {
+ "epoch": 20.888283378746593,
+ "grad_norm": 8.172731399536133,
+ "learning_rate": 1.836814457614302e-05,
+ "loss": 0.9724,
+ "step": 7666
+ },
+ {
+ "epoch": 20.891008174386922,
+ "grad_norm": 9.023299217224121,
+ "learning_rate": 1.836766138958162e-05,
+ "loss": 0.7821,
+ "step": 7667
+ },
+ {
+ "epoch": 20.893732970027248,
+ "grad_norm": 9.135993957519531,
+ "learning_rate": 1.836717813785314e-05,
+ "loss": 0.7178,
+ "step": 7668
+ },
+ {
+ "epoch": 20.896457765667574,
+ "grad_norm": 8.075799942016602,
+ "learning_rate": 1.8366694820961346e-05,
+ "loss": 0.9333,
+ "step": 7669
+ },
+ {
+ "epoch": 20.899182561307903,
+ "grad_norm": 8.042290687561035,
+ "learning_rate": 1.8366211438910004e-05,
+ "loss": 0.9171,
+ "step": 7670
+ },
+ {
+ "epoch": 20.90190735694823,
+ "grad_norm": 8.95767593383789,
+ "learning_rate": 1.8365727991702874e-05,
+ "loss": 0.7039,
+ "step": 7671
+ },
+ {
+ "epoch": 20.904632152588555,
+ "grad_norm": 10.070302963256836,
+ "learning_rate": 1.8365244479343723e-05,
+ "loss": 0.8101,
+ "step": 7672
+ },
+ {
+ "epoch": 20.907356948228884,
+ "grad_norm": 7.303725719451904,
+ "learning_rate": 1.836476090183632e-05,
+ "loss": 0.8423,
+ "step": 7673
+ },
+ {
+ "epoch": 20.91008174386921,
+ "grad_norm": 8.69246768951416,
+ "learning_rate": 1.8364277259184428e-05,
+ "loss": 0.7401,
+ "step": 7674
+ },
+ {
+ "epoch": 20.912806539509535,
+ "grad_norm": 9.71865463256836,
+ "learning_rate": 1.8363793551391814e-05,
+ "loss": 0.881,
+ "step": 7675
+ },
+ {
+ "epoch": 20.915531335149865,
+ "grad_norm": 8.502640724182129,
+ "learning_rate": 1.836330977846224e-05,
+ "loss": 0.5955,
+ "step": 7676
+ },
+ {
+ "epoch": 20.91825613079019,
+ "grad_norm": 9.499765396118164,
+ "learning_rate": 1.8362825940399483e-05,
+ "loss": 0.7382,
+ "step": 7677
+ },
+ {
+ "epoch": 20.920980926430516,
+ "grad_norm": 8.114084243774414,
+ "learning_rate": 1.8362342037207308e-05,
+ "loss": 0.9603,
+ "step": 7678
+ },
+ {
+ "epoch": 20.923705722070846,
+ "grad_norm": 10.1805419921875,
+ "learning_rate": 1.836185806888948e-05,
+ "loss": 0.8999,
+ "step": 7679
+ },
+ {
+ "epoch": 20.92643051771117,
+ "grad_norm": 7.986012935638428,
+ "learning_rate": 1.836137403544977e-05,
+ "loss": 0.8367,
+ "step": 7680
+ },
+ {
+ "epoch": 20.929155313351497,
+ "grad_norm": 9.502193450927734,
+ "learning_rate": 1.836088993689195e-05,
+ "loss": 0.6833,
+ "step": 7681
+ },
+ {
+ "epoch": 20.931880108991827,
+ "grad_norm": 8.042461395263672,
+ "learning_rate": 1.836040577321979e-05,
+ "loss": 0.7908,
+ "step": 7682
+ },
+ {
+ "epoch": 20.934604904632153,
+ "grad_norm": 8.619714736938477,
+ "learning_rate": 1.8359921544437055e-05,
+ "loss": 0.7698,
+ "step": 7683
+ },
+ {
+ "epoch": 20.93732970027248,
+ "grad_norm": 7.86964750289917,
+ "learning_rate": 1.835943725054752e-05,
+ "loss": 0.8191,
+ "step": 7684
+ },
+ {
+ "epoch": 20.940054495912808,
+ "grad_norm": 8.827571868896484,
+ "learning_rate": 1.835895289155496e-05,
+ "loss": 0.8391,
+ "step": 7685
+ },
+ {
+ "epoch": 20.942779291553133,
+ "grad_norm": 8.40529727935791,
+ "learning_rate": 1.835846846746314e-05,
+ "loss": 0.7603,
+ "step": 7686
+ },
+ {
+ "epoch": 20.94550408719346,
+ "grad_norm": 8.676128387451172,
+ "learning_rate": 1.835798397827584e-05,
+ "loss": 0.7245,
+ "step": 7687
+ },
+ {
+ "epoch": 20.94822888283379,
+ "grad_norm": 9.562548637390137,
+ "learning_rate": 1.835749942399683e-05,
+ "loss": 0.7974,
+ "step": 7688
+ },
+ {
+ "epoch": 20.950953678474114,
+ "grad_norm": 8.225702285766602,
+ "learning_rate": 1.835701480462988e-05,
+ "loss": 0.7402,
+ "step": 7689
+ },
+ {
+ "epoch": 20.95367847411444,
+ "grad_norm": 6.749309062957764,
+ "learning_rate": 1.8356530120178767e-05,
+ "loss": 0.7914,
+ "step": 7690
+ },
+ {
+ "epoch": 20.95640326975477,
+ "grad_norm": 8.198533058166504,
+ "learning_rate": 1.835604537064727e-05,
+ "loss": 0.8502,
+ "step": 7691
+ },
+ {
+ "epoch": 20.959128065395095,
+ "grad_norm": 6.520903587341309,
+ "learning_rate": 1.8355560556039164e-05,
+ "loss": 0.6687,
+ "step": 7692
+ },
+ {
+ "epoch": 20.96185286103542,
+ "grad_norm": 8.739531517028809,
+ "learning_rate": 1.8355075676358215e-05,
+ "loss": 0.9065,
+ "step": 7693
+ },
+ {
+ "epoch": 20.96457765667575,
+ "grad_norm": 7.634159564971924,
+ "learning_rate": 1.835459073160821e-05,
+ "loss": 0.6198,
+ "step": 7694
+ },
+ {
+ "epoch": 20.967302452316076,
+ "grad_norm": 9.236230850219727,
+ "learning_rate": 1.8354105721792917e-05,
+ "loss": 0.8596,
+ "step": 7695
+ },
+ {
+ "epoch": 20.970027247956402,
+ "grad_norm": 7.2085113525390625,
+ "learning_rate": 1.8353620646916116e-05,
+ "loss": 0.8096,
+ "step": 7696
+ },
+ {
+ "epoch": 20.97275204359673,
+ "grad_norm": 7.414519786834717,
+ "learning_rate": 1.835313550698159e-05,
+ "loss": 0.8225,
+ "step": 7697
+ },
+ {
+ "epoch": 20.975476839237057,
+ "grad_norm": 8.842377662658691,
+ "learning_rate": 1.8352650301993112e-05,
+ "loss": 0.6714,
+ "step": 7698
+ },
+ {
+ "epoch": 20.978201634877383,
+ "grad_norm": 8.369305610656738,
+ "learning_rate": 1.8352165031954468e-05,
+ "loss": 0.7489,
+ "step": 7699
+ },
+ {
+ "epoch": 20.980926430517712,
+ "grad_norm": 11.194235801696777,
+ "learning_rate": 1.8351679696869427e-05,
+ "loss": 0.8214,
+ "step": 7700
+ },
+ {
+ "epoch": 20.983651226158038,
+ "grad_norm": 7.6760663986206055,
+ "learning_rate": 1.835119429674177e-05,
+ "loss": 0.734,
+ "step": 7701
+ },
+ {
+ "epoch": 20.986376021798364,
+ "grad_norm": 8.03299331665039,
+ "learning_rate": 1.8350708831575286e-05,
+ "loss": 0.8882,
+ "step": 7702
+ },
+ {
+ "epoch": 20.989100817438693,
+ "grad_norm": 8.684178352355957,
+ "learning_rate": 1.835022330137375e-05,
+ "loss": 0.7222,
+ "step": 7703
+ },
+ {
+ "epoch": 20.99182561307902,
+ "grad_norm": 11.191232681274414,
+ "learning_rate": 1.834973770614094e-05,
+ "loss": 0.9777,
+ "step": 7704
+ },
+ {
+ "epoch": 20.994550408719345,
+ "grad_norm": 7.9103007316589355,
+ "learning_rate": 1.834925204588064e-05,
+ "loss": 0.649,
+ "step": 7705
+ },
+ {
+ "epoch": 20.997275204359674,
+ "grad_norm": 8.560781478881836,
+ "learning_rate": 1.8348766320596638e-05,
+ "loss": 0.8652,
+ "step": 7706
+ },
+ {
+ "epoch": 21.0,
+ "grad_norm": 7.691993236541748,
+ "learning_rate": 1.8348280530292712e-05,
+ "loss": 0.7366,
+ "step": 7707
+ },
+ {
+ "epoch": 21.002724795640326,
+ "grad_norm": 7.323371410369873,
+ "learning_rate": 1.834779467497265e-05,
+ "loss": 0.6414,
+ "step": 7708
+ },
+ {
+ "epoch": 21.005449591280655,
+ "grad_norm": 8.487759590148926,
+ "learning_rate": 1.834730875464022e-05,
+ "loss": 0.7064,
+ "step": 7709
+ },
+ {
+ "epoch": 21.00817438692098,
+ "grad_norm": 7.555262088775635,
+ "learning_rate": 1.834682276929923e-05,
+ "loss": 0.9084,
+ "step": 7710
+ },
+ {
+ "epoch": 21.010899182561307,
+ "grad_norm": 7.268922805786133,
+ "learning_rate": 1.8346336718953447e-05,
+ "loss": 0.6943,
+ "step": 7711
+ },
+ {
+ "epoch": 21.013623978201636,
+ "grad_norm": 6.138815402984619,
+ "learning_rate": 1.8345850603606666e-05,
+ "loss": 0.7697,
+ "step": 7712
+ },
+ {
+ "epoch": 21.016348773841962,
+ "grad_norm": 7.12817907333374,
+ "learning_rate": 1.8345364423262666e-05,
+ "loss": 0.6686,
+ "step": 7713
+ },
+ {
+ "epoch": 21.019073569482288,
+ "grad_norm": 6.738901615142822,
+ "learning_rate": 1.8344878177925238e-05,
+ "loss": 0.6882,
+ "step": 7714
+ },
+ {
+ "epoch": 21.021798365122617,
+ "grad_norm": 7.405285358428955,
+ "learning_rate": 1.8344391867598164e-05,
+ "loss": 0.6643,
+ "step": 7715
+ },
+ {
+ "epoch": 21.024523160762943,
+ "grad_norm": 8.851975440979004,
+ "learning_rate": 1.8343905492285238e-05,
+ "loss": 0.7656,
+ "step": 7716
+ },
+ {
+ "epoch": 21.02724795640327,
+ "grad_norm": 8.151577949523926,
+ "learning_rate": 1.8343419051990245e-05,
+ "loss": 0.7937,
+ "step": 7717
+ },
+ {
+ "epoch": 21.029972752043598,
+ "grad_norm": 7.610278606414795,
+ "learning_rate": 1.8342932546716973e-05,
+ "loss": 0.6821,
+ "step": 7718
+ },
+ {
+ "epoch": 21.032697547683924,
+ "grad_norm": 49.263816833496094,
+ "learning_rate": 1.8342445976469206e-05,
+ "loss": 0.7039,
+ "step": 7719
+ },
+ {
+ "epoch": 21.03542234332425,
+ "grad_norm": 6.417880058288574,
+ "learning_rate": 1.8341959341250743e-05,
+ "loss": 0.6281,
+ "step": 7720
+ },
+ {
+ "epoch": 21.03814713896458,
+ "grad_norm": 7.054736614227295,
+ "learning_rate": 1.834147264106537e-05,
+ "loss": 0.6315,
+ "step": 7721
+ },
+ {
+ "epoch": 21.040871934604905,
+ "grad_norm": 7.179330825805664,
+ "learning_rate": 1.8340985875916874e-05,
+ "loss": 0.6987,
+ "step": 7722
+ },
+ {
+ "epoch": 21.04359673024523,
+ "grad_norm": 8.369280815124512,
+ "learning_rate": 1.834049904580905e-05,
+ "loss": 0.8383,
+ "step": 7723
+ },
+ {
+ "epoch": 21.04632152588556,
+ "grad_norm": 8.203306198120117,
+ "learning_rate": 1.8340012150745685e-05,
+ "loss": 0.6147,
+ "step": 7724
+ },
+ {
+ "epoch": 21.049046321525886,
+ "grad_norm": 8.10911750793457,
+ "learning_rate": 1.8339525190730577e-05,
+ "loss": 0.8666,
+ "step": 7725
+ },
+ {
+ "epoch": 21.05177111716621,
+ "grad_norm": 8.598569869995117,
+ "learning_rate": 1.833903816576751e-05,
+ "loss": 0.6295,
+ "step": 7726
+ },
+ {
+ "epoch": 21.05449591280654,
+ "grad_norm": 8.309627532958984,
+ "learning_rate": 1.8338551075860288e-05,
+ "loss": 0.6552,
+ "step": 7727
+ },
+ {
+ "epoch": 21.057220708446867,
+ "grad_norm": 7.313740253448486,
+ "learning_rate": 1.83380639210127e-05,
+ "loss": 0.7542,
+ "step": 7728
+ },
+ {
+ "epoch": 21.059945504087192,
+ "grad_norm": 7.313722133636475,
+ "learning_rate": 1.833757670122853e-05,
+ "loss": 0.647,
+ "step": 7729
+ },
+ {
+ "epoch": 21.06267029972752,
+ "grad_norm": 7.183590412139893,
+ "learning_rate": 1.833708941651159e-05,
+ "loss": 0.7993,
+ "step": 7730
+ },
+ {
+ "epoch": 21.065395095367847,
+ "grad_norm": 20.81493377685547,
+ "learning_rate": 1.833660206686566e-05,
+ "loss": 0.8202,
+ "step": 7731
+ },
+ {
+ "epoch": 21.068119891008173,
+ "grad_norm": 8.982355117797852,
+ "learning_rate": 1.8336114652294547e-05,
+ "loss": 0.7061,
+ "step": 7732
+ },
+ {
+ "epoch": 21.070844686648503,
+ "grad_norm": 8.355277061462402,
+ "learning_rate": 1.8335627172802034e-05,
+ "loss": 0.7621,
+ "step": 7733
+ },
+ {
+ "epoch": 21.07356948228883,
+ "grad_norm": 11.035460472106934,
+ "learning_rate": 1.833513962839193e-05,
+ "loss": 0.6851,
+ "step": 7734
+ },
+ {
+ "epoch": 21.076294277929154,
+ "grad_norm": 10.80052375793457,
+ "learning_rate": 1.8334652019068024e-05,
+ "loss": 0.7092,
+ "step": 7735
+ },
+ {
+ "epoch": 21.079019073569484,
+ "grad_norm": 8.625014305114746,
+ "learning_rate": 1.833416434483412e-05,
+ "loss": 0.707,
+ "step": 7736
+ },
+ {
+ "epoch": 21.08174386920981,
+ "grad_norm": 9.866307258605957,
+ "learning_rate": 1.833367660569401e-05,
+ "loss": 0.8092,
+ "step": 7737
+ },
+ {
+ "epoch": 21.084468664850135,
+ "grad_norm": 7.818713188171387,
+ "learning_rate": 1.8333188801651497e-05,
+ "loss": 0.8223,
+ "step": 7738
+ },
+ {
+ "epoch": 21.087193460490465,
+ "grad_norm": 6.951756954193115,
+ "learning_rate": 1.8332700932710375e-05,
+ "loss": 0.6738,
+ "step": 7739
+ },
+ {
+ "epoch": 21.08991825613079,
+ "grad_norm": 8.046797752380371,
+ "learning_rate": 1.8332212998874445e-05,
+ "loss": 0.7175,
+ "step": 7740
+ },
+ {
+ "epoch": 21.092643051771116,
+ "grad_norm": 7.292179107666016,
+ "learning_rate": 1.833172500014751e-05,
+ "loss": 0.6885,
+ "step": 7741
+ },
+ {
+ "epoch": 21.095367847411445,
+ "grad_norm": 7.999224662780762,
+ "learning_rate": 1.8331236936533372e-05,
+ "loss": 0.6877,
+ "step": 7742
+ },
+ {
+ "epoch": 21.09809264305177,
+ "grad_norm": 7.979372501373291,
+ "learning_rate": 1.8330748808035827e-05,
+ "loss": 0.6896,
+ "step": 7743
+ },
+ {
+ "epoch": 21.100817438692097,
+ "grad_norm": 8.748741149902344,
+ "learning_rate": 1.8330260614658674e-05,
+ "loss": 0.7583,
+ "step": 7744
+ },
+ {
+ "epoch": 21.103542234332426,
+ "grad_norm": 6.686682224273682,
+ "learning_rate": 1.8329772356405723e-05,
+ "loss": 0.906,
+ "step": 7745
+ },
+ {
+ "epoch": 21.106267029972752,
+ "grad_norm": 6.980701923370361,
+ "learning_rate": 1.8329284033280775e-05,
+ "loss": 0.523,
+ "step": 7746
+ },
+ {
+ "epoch": 21.108991825613078,
+ "grad_norm": 11.001998901367188,
+ "learning_rate": 1.832879564528763e-05,
+ "loss": 0.8516,
+ "step": 7747
+ },
+ {
+ "epoch": 21.111716621253407,
+ "grad_norm": 8.298548698425293,
+ "learning_rate": 1.832830719243009e-05,
+ "loss": 0.6667,
+ "step": 7748
+ },
+ {
+ "epoch": 21.114441416893733,
+ "grad_norm": 11.617433547973633,
+ "learning_rate": 1.8327818674711965e-05,
+ "loss": 0.7035,
+ "step": 7749
+ },
+ {
+ "epoch": 21.11716621253406,
+ "grad_norm": 6.781091213226318,
+ "learning_rate": 1.832733009213705e-05,
+ "loss": 0.7485,
+ "step": 7750
+ },
+ {
+ "epoch": 21.11989100817439,
+ "grad_norm": 8.314715385437012,
+ "learning_rate": 1.832684144470916e-05,
+ "loss": 0.8,
+ "step": 7751
+ },
+ {
+ "epoch": 21.122615803814714,
+ "grad_norm": 7.875467300415039,
+ "learning_rate": 1.8326352732432103e-05,
+ "loss": 0.6787,
+ "step": 7752
+ },
+ {
+ "epoch": 21.12534059945504,
+ "grad_norm": 12.015420913696289,
+ "learning_rate": 1.8325863955309673e-05,
+ "loss": 0.7911,
+ "step": 7753
+ },
+ {
+ "epoch": 21.12806539509537,
+ "grad_norm": 8.246016502380371,
+ "learning_rate": 1.8325375113345684e-05,
+ "loss": 0.7249,
+ "step": 7754
+ },
+ {
+ "epoch": 21.130790190735695,
+ "grad_norm": 7.11991024017334,
+ "learning_rate": 1.832488620654394e-05,
+ "loss": 0.7421,
+ "step": 7755
+ },
+ {
+ "epoch": 21.13351498637602,
+ "grad_norm": 9.072060585021973,
+ "learning_rate": 1.8324397234908252e-05,
+ "loss": 0.8292,
+ "step": 7756
+ },
+ {
+ "epoch": 21.13623978201635,
+ "grad_norm": 10.79595947265625,
+ "learning_rate": 1.8323908198442423e-05,
+ "loss": 0.7333,
+ "step": 7757
+ },
+ {
+ "epoch": 21.138964577656676,
+ "grad_norm": 9.850205421447754,
+ "learning_rate": 1.8323419097150264e-05,
+ "loss": 0.786,
+ "step": 7758
+ },
+ {
+ "epoch": 21.141689373297,
+ "grad_norm": 8.980114936828613,
+ "learning_rate": 1.832292993103559e-05,
+ "loss": 0.675,
+ "step": 7759
+ },
+ {
+ "epoch": 21.14441416893733,
+ "grad_norm": 6.9589009284973145,
+ "learning_rate": 1.8322440700102203e-05,
+ "loss": 0.7552,
+ "step": 7760
+ },
+ {
+ "epoch": 21.147138964577657,
+ "grad_norm": 9.685104370117188,
+ "learning_rate": 1.8321951404353916e-05,
+ "loss": 0.7158,
+ "step": 7761
+ },
+ {
+ "epoch": 21.149863760217983,
+ "grad_norm": 7.686063289642334,
+ "learning_rate": 1.8321462043794538e-05,
+ "loss": 0.9153,
+ "step": 7762
+ },
+ {
+ "epoch": 21.152588555858312,
+ "grad_norm": 7.35426664352417,
+ "learning_rate": 1.8320972618427885e-05,
+ "loss": 0.7068,
+ "step": 7763
+ },
+ {
+ "epoch": 21.155313351498638,
+ "grad_norm": 8.867984771728516,
+ "learning_rate": 1.832048312825776e-05,
+ "loss": 0.8534,
+ "step": 7764
+ },
+ {
+ "epoch": 21.158038147138964,
+ "grad_norm": 7.1844096183776855,
+ "learning_rate": 1.8319993573287984e-05,
+ "loss": 0.9589,
+ "step": 7765
+ },
+ {
+ "epoch": 21.160762942779293,
+ "grad_norm": 8.416938781738281,
+ "learning_rate": 1.8319503953522368e-05,
+ "loss": 0.6345,
+ "step": 7766
+ },
+ {
+ "epoch": 21.16348773841962,
+ "grad_norm": 7.446508407592773,
+ "learning_rate": 1.8319014268964718e-05,
+ "loss": 0.667,
+ "step": 7767
+ },
+ {
+ "epoch": 21.166212534059945,
+ "grad_norm": 8.560457229614258,
+ "learning_rate": 1.8318524519618853e-05,
+ "loss": 0.6437,
+ "step": 7768
+ },
+ {
+ "epoch": 21.168937329700274,
+ "grad_norm": 7.70897102355957,
+ "learning_rate": 1.831803470548859e-05,
+ "loss": 0.5842,
+ "step": 7769
+ },
+ {
+ "epoch": 21.1716621253406,
+ "grad_norm": 7.899026393890381,
+ "learning_rate": 1.8317544826577738e-05,
+ "loss": 0.7852,
+ "step": 7770
+ },
+ {
+ "epoch": 21.174386920980925,
+ "grad_norm": 7.9237823486328125,
+ "learning_rate": 1.8317054882890114e-05,
+ "loss": 0.7289,
+ "step": 7771
+ },
+ {
+ "epoch": 21.177111716621255,
+ "grad_norm": 8.078022956848145,
+ "learning_rate": 1.8316564874429535e-05,
+ "loss": 0.7711,
+ "step": 7772
+ },
+ {
+ "epoch": 21.17983651226158,
+ "grad_norm": 6.839797019958496,
+ "learning_rate": 1.831607480119982e-05,
+ "loss": 0.5835,
+ "step": 7773
+ },
+ {
+ "epoch": 21.182561307901906,
+ "grad_norm": 8.098297119140625,
+ "learning_rate": 1.8315584663204776e-05,
+ "loss": 0.7346,
+ "step": 7774
+ },
+ {
+ "epoch": 21.185286103542236,
+ "grad_norm": 7.693576812744141,
+ "learning_rate": 1.8315094460448232e-05,
+ "loss": 0.6617,
+ "step": 7775
+ },
+ {
+ "epoch": 21.18801089918256,
+ "grad_norm": 8.116175651550293,
+ "learning_rate": 1.8314604192933997e-05,
+ "loss": 0.7086,
+ "step": 7776
+ },
+ {
+ "epoch": 21.190735694822887,
+ "grad_norm": 8.301321983337402,
+ "learning_rate": 1.8314113860665892e-05,
+ "loss": 0.8246,
+ "step": 7777
+ },
+ {
+ "epoch": 21.193460490463217,
+ "grad_norm": 12.183932304382324,
+ "learning_rate": 1.8313623463647736e-05,
+ "loss": 0.77,
+ "step": 7778
+ },
+ {
+ "epoch": 21.196185286103542,
+ "grad_norm": 7.684350490570068,
+ "learning_rate": 1.831313300188335e-05,
+ "loss": 0.7761,
+ "step": 7779
+ },
+ {
+ "epoch": 21.19891008174387,
+ "grad_norm": 8.239131927490234,
+ "learning_rate": 1.8312642475376547e-05,
+ "loss": 0.7188,
+ "step": 7780
+ },
+ {
+ "epoch": 21.201634877384198,
+ "grad_norm": 9.018391609191895,
+ "learning_rate": 1.8312151884131157e-05,
+ "loss": 0.7761,
+ "step": 7781
+ },
+ {
+ "epoch": 21.204359673024523,
+ "grad_norm": 8.890396118164062,
+ "learning_rate": 1.8311661228150994e-05,
+ "loss": 0.6096,
+ "step": 7782
+ },
+ {
+ "epoch": 21.20708446866485,
+ "grad_norm": 7.6317548751831055,
+ "learning_rate": 1.8311170507439878e-05,
+ "loss": 0.8057,
+ "step": 7783
+ },
+ {
+ "epoch": 21.20980926430518,
+ "grad_norm": 7.228536128997803,
+ "learning_rate": 1.8310679722001638e-05,
+ "loss": 0.6051,
+ "step": 7784
+ },
+ {
+ "epoch": 21.212534059945504,
+ "grad_norm": 9.289490699768066,
+ "learning_rate": 1.831018887184009e-05,
+ "loss": 0.8712,
+ "step": 7785
+ },
+ {
+ "epoch": 21.21525885558583,
+ "grad_norm": 8.295319557189941,
+ "learning_rate": 1.8309697956959057e-05,
+ "loss": 0.6566,
+ "step": 7786
+ },
+ {
+ "epoch": 21.21798365122616,
+ "grad_norm": 9.994537353515625,
+ "learning_rate": 1.8309206977362367e-05,
+ "loss": 1.0121,
+ "step": 7787
+ },
+ {
+ "epoch": 21.220708446866485,
+ "grad_norm": 9.828986167907715,
+ "learning_rate": 1.8308715933053836e-05,
+ "loss": 0.6002,
+ "step": 7788
+ },
+ {
+ "epoch": 21.22343324250681,
+ "grad_norm": 8.134908676147461,
+ "learning_rate": 1.8308224824037295e-05,
+ "loss": 0.8085,
+ "step": 7789
+ },
+ {
+ "epoch": 21.22615803814714,
+ "grad_norm": 8.998791694641113,
+ "learning_rate": 1.8307733650316567e-05,
+ "loss": 0.6447,
+ "step": 7790
+ },
+ {
+ "epoch": 21.228882833787466,
+ "grad_norm": 6.333938121795654,
+ "learning_rate": 1.8307242411895478e-05,
+ "loss": 0.8348,
+ "step": 7791
+ },
+ {
+ "epoch": 21.231607629427792,
+ "grad_norm": 6.362037658691406,
+ "learning_rate": 1.8306751108777853e-05,
+ "loss": 0.6097,
+ "step": 7792
+ },
+ {
+ "epoch": 21.23433242506812,
+ "grad_norm": 6.66240930557251,
+ "learning_rate": 1.8306259740967515e-05,
+ "loss": 0.6624,
+ "step": 7793
+ },
+ {
+ "epoch": 21.237057220708447,
+ "grad_norm": 9.169851303100586,
+ "learning_rate": 1.8305768308468294e-05,
+ "loss": 0.7953,
+ "step": 7794
+ },
+ {
+ "epoch": 21.239782016348773,
+ "grad_norm": 8.247089385986328,
+ "learning_rate": 1.8305276811284013e-05,
+ "loss": 0.6312,
+ "step": 7795
+ },
+ {
+ "epoch": 21.242506811989102,
+ "grad_norm": 7.682947158813477,
+ "learning_rate": 1.8304785249418508e-05,
+ "loss": 0.7508,
+ "step": 7796
+ },
+ {
+ "epoch": 21.245231607629428,
+ "grad_norm": 7.679996013641357,
+ "learning_rate": 1.8304293622875603e-05,
+ "loss": 0.6304,
+ "step": 7797
+ },
+ {
+ "epoch": 21.247956403269754,
+ "grad_norm": 7.897690773010254,
+ "learning_rate": 1.8303801931659127e-05,
+ "loss": 0.9888,
+ "step": 7798
+ },
+ {
+ "epoch": 21.250681198910083,
+ "grad_norm": 7.268885612487793,
+ "learning_rate": 1.8303310175772905e-05,
+ "loss": 0.7899,
+ "step": 7799
+ },
+ {
+ "epoch": 21.25340599455041,
+ "grad_norm": 7.545280456542969,
+ "learning_rate": 1.8302818355220776e-05,
+ "loss": 0.6075,
+ "step": 7800
+ },
+ {
+ "epoch": 21.256130790190735,
+ "grad_norm": 7.544144630432129,
+ "learning_rate": 1.8302326470006562e-05,
+ "loss": 0.8575,
+ "step": 7801
+ },
+ {
+ "epoch": 21.258855585831064,
+ "grad_norm": 6.4075164794921875,
+ "learning_rate": 1.8301834520134098e-05,
+ "loss": 0.7751,
+ "step": 7802
+ },
+ {
+ "epoch": 21.26158038147139,
+ "grad_norm": 7.582212448120117,
+ "learning_rate": 1.830134250560721e-05,
+ "loss": 0.6442,
+ "step": 7803
+ },
+ {
+ "epoch": 21.264305177111716,
+ "grad_norm": 9.166476249694824,
+ "learning_rate": 1.8300850426429738e-05,
+ "loss": 0.7045,
+ "step": 7804
+ },
+ {
+ "epoch": 21.267029972752045,
+ "grad_norm": 8.270711898803711,
+ "learning_rate": 1.830035828260551e-05,
+ "loss": 0.5986,
+ "step": 7805
+ },
+ {
+ "epoch": 21.26975476839237,
+ "grad_norm": 8.354194641113281,
+ "learning_rate": 1.8299866074138356e-05,
+ "loss": 0.672,
+ "step": 7806
+ },
+ {
+ "epoch": 21.272479564032697,
+ "grad_norm": 7.5973896980285645,
+ "learning_rate": 1.829937380103211e-05,
+ "loss": 0.6956,
+ "step": 7807
+ },
+ {
+ "epoch": 21.275204359673026,
+ "grad_norm": 9.056324005126953,
+ "learning_rate": 1.8298881463290613e-05,
+ "loss": 0.8167,
+ "step": 7808
+ },
+ {
+ "epoch": 21.277929155313352,
+ "grad_norm": 8.447535514831543,
+ "learning_rate": 1.8298389060917696e-05,
+ "loss": 0.6823,
+ "step": 7809
+ },
+ {
+ "epoch": 21.280653950953678,
+ "grad_norm": 6.850573539733887,
+ "learning_rate": 1.8297896593917187e-05,
+ "loss": 0.6815,
+ "step": 7810
+ },
+ {
+ "epoch": 21.283378746594007,
+ "grad_norm": 9.523035049438477,
+ "learning_rate": 1.8297404062292927e-05,
+ "loss": 0.6124,
+ "step": 7811
+ },
+ {
+ "epoch": 21.286103542234333,
+ "grad_norm": 8.456561088562012,
+ "learning_rate": 1.8296911466048754e-05,
+ "loss": 0.7413,
+ "step": 7812
+ },
+ {
+ "epoch": 21.28882833787466,
+ "grad_norm": 6.094063758850098,
+ "learning_rate": 1.82964188051885e-05,
+ "loss": 0.6749,
+ "step": 7813
+ },
+ {
+ "epoch": 21.291553133514988,
+ "grad_norm": 7.415526866912842,
+ "learning_rate": 1.8295926079716002e-05,
+ "loss": 0.7262,
+ "step": 7814
+ },
+ {
+ "epoch": 21.294277929155314,
+ "grad_norm": 6.7150654792785645,
+ "learning_rate": 1.82954332896351e-05,
+ "loss": 0.6599,
+ "step": 7815
+ },
+ {
+ "epoch": 21.29700272479564,
+ "grad_norm": 8.221084594726562,
+ "learning_rate": 1.829494043494963e-05,
+ "loss": 0.7855,
+ "step": 7816
+ },
+ {
+ "epoch": 21.29972752043597,
+ "grad_norm": 7.059593200683594,
+ "learning_rate": 1.829444751566343e-05,
+ "loss": 0.7522,
+ "step": 7817
+ },
+ {
+ "epoch": 21.302452316076295,
+ "grad_norm": 8.087608337402344,
+ "learning_rate": 1.829395453178034e-05,
+ "loss": 0.6614,
+ "step": 7818
+ },
+ {
+ "epoch": 21.30517711171662,
+ "grad_norm": 7.509298801422119,
+ "learning_rate": 1.8293461483304203e-05,
+ "loss": 0.8376,
+ "step": 7819
+ },
+ {
+ "epoch": 21.30790190735695,
+ "grad_norm": 8.698942184448242,
+ "learning_rate": 1.8292968370238852e-05,
+ "loss": 0.6471,
+ "step": 7820
+ },
+ {
+ "epoch": 21.310626702997276,
+ "grad_norm": 7.400518417358398,
+ "learning_rate": 1.829247519258813e-05,
+ "loss": 0.7327,
+ "step": 7821
+ },
+ {
+ "epoch": 21.3133514986376,
+ "grad_norm": 7.770204067230225,
+ "learning_rate": 1.8291981950355878e-05,
+ "loss": 0.7166,
+ "step": 7822
+ },
+ {
+ "epoch": 21.31607629427793,
+ "grad_norm": 9.752872467041016,
+ "learning_rate": 1.829148864354594e-05,
+ "loss": 0.6592,
+ "step": 7823
+ },
+ {
+ "epoch": 21.318801089918257,
+ "grad_norm": 8.794660568237305,
+ "learning_rate": 1.829099527216215e-05,
+ "loss": 0.6592,
+ "step": 7824
+ },
+ {
+ "epoch": 21.321525885558582,
+ "grad_norm": 8.04993724822998,
+ "learning_rate": 1.8290501836208357e-05,
+ "loss": 0.7495,
+ "step": 7825
+ },
+ {
+ "epoch": 21.32425068119891,
+ "grad_norm": 9.428915023803711,
+ "learning_rate": 1.8290008335688404e-05,
+ "loss": 0.7839,
+ "step": 7826
+ },
+ {
+ "epoch": 21.326975476839237,
+ "grad_norm": 8.758989334106445,
+ "learning_rate": 1.8289514770606133e-05,
+ "loss": 0.7225,
+ "step": 7827
+ },
+ {
+ "epoch": 21.329700272479563,
+ "grad_norm": 7.357696056365967,
+ "learning_rate": 1.828902114096539e-05,
+ "loss": 0.7797,
+ "step": 7828
+ },
+ {
+ "epoch": 21.332425068119893,
+ "grad_norm": 7.127198696136475,
+ "learning_rate": 1.8288527446770015e-05,
+ "loss": 0.6018,
+ "step": 7829
+ },
+ {
+ "epoch": 21.33514986376022,
+ "grad_norm": 8.083072662353516,
+ "learning_rate": 1.8288033688023855e-05,
+ "loss": 0.7021,
+ "step": 7830
+ },
+ {
+ "epoch": 21.337874659400544,
+ "grad_norm": 39.04533767700195,
+ "learning_rate": 1.8287539864730756e-05,
+ "loss": 0.6806,
+ "step": 7831
+ },
+ {
+ "epoch": 21.340599455040874,
+ "grad_norm": 7.802813529968262,
+ "learning_rate": 1.8287045976894563e-05,
+ "loss": 0.7299,
+ "step": 7832
+ },
+ {
+ "epoch": 21.3433242506812,
+ "grad_norm": 7.451691627502441,
+ "learning_rate": 1.828655202451912e-05,
+ "loss": 0.7479,
+ "step": 7833
+ },
+ {
+ "epoch": 21.346049046321525,
+ "grad_norm": 8.16508960723877,
+ "learning_rate": 1.828605800760828e-05,
+ "loss": 0.6664,
+ "step": 7834
+ },
+ {
+ "epoch": 21.348773841961854,
+ "grad_norm": 8.571643829345703,
+ "learning_rate": 1.8285563926165884e-05,
+ "loss": 0.7836,
+ "step": 7835
+ },
+ {
+ "epoch": 21.35149863760218,
+ "grad_norm": 8.905378341674805,
+ "learning_rate": 1.8285069780195787e-05,
+ "loss": 0.7247,
+ "step": 7836
+ },
+ {
+ "epoch": 21.354223433242506,
+ "grad_norm": 8.476143836975098,
+ "learning_rate": 1.828457556970183e-05,
+ "loss": 0.9014,
+ "step": 7837
+ },
+ {
+ "epoch": 21.356948228882835,
+ "grad_norm": 9.995495796203613,
+ "learning_rate": 1.8284081294687866e-05,
+ "loss": 0.7649,
+ "step": 7838
+ },
+ {
+ "epoch": 21.35967302452316,
+ "grad_norm": 7.34924840927124,
+ "learning_rate": 1.8283586955157744e-05,
+ "loss": 0.6138,
+ "step": 7839
+ },
+ {
+ "epoch": 21.362397820163487,
+ "grad_norm": 8.554211616516113,
+ "learning_rate": 1.8283092551115312e-05,
+ "loss": 0.6246,
+ "step": 7840
+ },
+ {
+ "epoch": 21.365122615803816,
+ "grad_norm": 9.853658676147461,
+ "learning_rate": 1.8282598082564423e-05,
+ "loss": 0.6639,
+ "step": 7841
+ },
+ {
+ "epoch": 21.367847411444142,
+ "grad_norm": 9.210776329040527,
+ "learning_rate": 1.828210354950893e-05,
+ "loss": 0.7076,
+ "step": 7842
+ },
+ {
+ "epoch": 21.370572207084468,
+ "grad_norm": 10.371861457824707,
+ "learning_rate": 1.8281608951952675e-05,
+ "loss": 0.7557,
+ "step": 7843
+ },
+ {
+ "epoch": 21.373297002724797,
+ "grad_norm": 9.623146057128906,
+ "learning_rate": 1.8281114289899515e-05,
+ "loss": 0.8533,
+ "step": 7844
+ },
+ {
+ "epoch": 21.376021798365123,
+ "grad_norm": 14.123766899108887,
+ "learning_rate": 1.8280619563353307e-05,
+ "loss": 0.7615,
+ "step": 7845
+ },
+ {
+ "epoch": 21.37874659400545,
+ "grad_norm": 8.241548538208008,
+ "learning_rate": 1.8280124772317903e-05,
+ "loss": 0.7469,
+ "step": 7846
+ },
+ {
+ "epoch": 21.381471389645778,
+ "grad_norm": 9.194026947021484,
+ "learning_rate": 1.827962991679715e-05,
+ "loss": 0.8611,
+ "step": 7847
+ },
+ {
+ "epoch": 21.384196185286104,
+ "grad_norm": 9.951804161071777,
+ "learning_rate": 1.8279134996794904e-05,
+ "loss": 0.7452,
+ "step": 7848
+ },
+ {
+ "epoch": 21.38692098092643,
+ "grad_norm": 9.589630126953125,
+ "learning_rate": 1.8278640012315026e-05,
+ "loss": 0.8759,
+ "step": 7849
+ },
+ {
+ "epoch": 21.38964577656676,
+ "grad_norm": 8.136022567749023,
+ "learning_rate": 1.8278144963361363e-05,
+ "loss": 0.8513,
+ "step": 7850
+ },
+ {
+ "epoch": 21.392370572207085,
+ "grad_norm": 7.128570079803467,
+ "learning_rate": 1.8277649849937776e-05,
+ "loss": 0.601,
+ "step": 7851
+ },
+ {
+ "epoch": 21.39509536784741,
+ "grad_norm": 8.721702575683594,
+ "learning_rate": 1.8277154672048117e-05,
+ "loss": 0.8491,
+ "step": 7852
+ },
+ {
+ "epoch": 21.39782016348774,
+ "grad_norm": 10.861640930175781,
+ "learning_rate": 1.827665942969624e-05,
+ "loss": 0.8474,
+ "step": 7853
+ },
+ {
+ "epoch": 21.400544959128066,
+ "grad_norm": 9.07026195526123,
+ "learning_rate": 1.827616412288601e-05,
+ "loss": 0.7765,
+ "step": 7854
+ },
+ {
+ "epoch": 21.40326975476839,
+ "grad_norm": 10.966297149658203,
+ "learning_rate": 1.827566875162128e-05,
+ "loss": 0.7677,
+ "step": 7855
+ },
+ {
+ "epoch": 21.40599455040872,
+ "grad_norm": 7.402095317840576,
+ "learning_rate": 1.827517331590591e-05,
+ "loss": 0.6769,
+ "step": 7856
+ },
+ {
+ "epoch": 21.408719346049047,
+ "grad_norm": 9.250561714172363,
+ "learning_rate": 1.827467781574375e-05,
+ "loss": 0.7842,
+ "step": 7857
+ },
+ {
+ "epoch": 21.411444141689373,
+ "grad_norm": 8.343886375427246,
+ "learning_rate": 1.827418225113867e-05,
+ "loss": 0.7271,
+ "step": 7858
+ },
+ {
+ "epoch": 21.414168937329702,
+ "grad_norm": 9.130738258361816,
+ "learning_rate": 1.8273686622094528e-05,
+ "loss": 0.9478,
+ "step": 7859
+ },
+ {
+ "epoch": 21.416893732970028,
+ "grad_norm": 8.603825569152832,
+ "learning_rate": 1.8273190928615175e-05,
+ "loss": 0.723,
+ "step": 7860
+ },
+ {
+ "epoch": 21.419618528610354,
+ "grad_norm": 8.468642234802246,
+ "learning_rate": 1.827269517070448e-05,
+ "loss": 0.8052,
+ "step": 7861
+ },
+ {
+ "epoch": 21.422343324250683,
+ "grad_norm": 9.678513526916504,
+ "learning_rate": 1.82721993483663e-05,
+ "loss": 0.7749,
+ "step": 7862
+ },
+ {
+ "epoch": 21.42506811989101,
+ "grad_norm": 8.318564414978027,
+ "learning_rate": 1.82717034616045e-05,
+ "loss": 0.8833,
+ "step": 7863
+ },
+ {
+ "epoch": 21.427792915531334,
+ "grad_norm": 9.165751457214355,
+ "learning_rate": 1.8271207510422936e-05,
+ "loss": 0.6578,
+ "step": 7864
+ },
+ {
+ "epoch": 21.430517711171664,
+ "grad_norm": 9.25309944152832,
+ "learning_rate": 1.827071149482548e-05,
+ "loss": 0.8782,
+ "step": 7865
+ },
+ {
+ "epoch": 21.43324250681199,
+ "grad_norm": 7.358325481414795,
+ "learning_rate": 1.8270215414815983e-05,
+ "loss": 0.7503,
+ "step": 7866
+ },
+ {
+ "epoch": 21.435967302452315,
+ "grad_norm": 10.131277084350586,
+ "learning_rate": 1.826971927039832e-05,
+ "loss": 0.8035,
+ "step": 7867
+ },
+ {
+ "epoch": 21.438692098092645,
+ "grad_norm": 6.802368640899658,
+ "learning_rate": 1.8269223061576345e-05,
+ "loss": 0.5909,
+ "step": 7868
+ },
+ {
+ "epoch": 21.44141689373297,
+ "grad_norm": 7.230935573577881,
+ "learning_rate": 1.8268726788353928e-05,
+ "loss": 0.6816,
+ "step": 7869
+ },
+ {
+ "epoch": 21.444141689373296,
+ "grad_norm": 8.83212947845459,
+ "learning_rate": 1.8268230450734933e-05,
+ "loss": 0.7934,
+ "step": 7870
+ },
+ {
+ "epoch": 21.446866485013626,
+ "grad_norm": 10.197222709655762,
+ "learning_rate": 1.8267734048723227e-05,
+ "loss": 0.7797,
+ "step": 7871
+ },
+ {
+ "epoch": 21.44959128065395,
+ "grad_norm": 7.890384197235107,
+ "learning_rate": 1.826723758232267e-05,
+ "loss": 0.7396,
+ "step": 7872
+ },
+ {
+ "epoch": 21.452316076294277,
+ "grad_norm": 22.438573837280273,
+ "learning_rate": 1.8266741051537138e-05,
+ "loss": 0.7768,
+ "step": 7873
+ },
+ {
+ "epoch": 21.455040871934607,
+ "grad_norm": 8.331838607788086,
+ "learning_rate": 1.826624445637049e-05,
+ "loss": 0.7235,
+ "step": 7874
+ },
+ {
+ "epoch": 21.457765667574932,
+ "grad_norm": 8.330008506774902,
+ "learning_rate": 1.82657477968266e-05,
+ "loss": 0.794,
+ "step": 7875
+ },
+ {
+ "epoch": 21.460490463215258,
+ "grad_norm": 8.820117950439453,
+ "learning_rate": 1.8265251072909325e-05,
+ "loss": 0.726,
+ "step": 7876
+ },
+ {
+ "epoch": 21.463215258855588,
+ "grad_norm": 8.135759353637695,
+ "learning_rate": 1.8264754284622544e-05,
+ "loss": 0.7684,
+ "step": 7877
+ },
+ {
+ "epoch": 21.465940054495913,
+ "grad_norm": 8.72147274017334,
+ "learning_rate": 1.8264257431970126e-05,
+ "loss": 0.6674,
+ "step": 7878
+ },
+ {
+ "epoch": 21.46866485013624,
+ "grad_norm": 9.059609413146973,
+ "learning_rate": 1.8263760514955934e-05,
+ "loss": 0.6546,
+ "step": 7879
+ },
+ {
+ "epoch": 21.47138964577657,
+ "grad_norm": 8.65694522857666,
+ "learning_rate": 1.826326353358384e-05,
+ "loss": 0.6604,
+ "step": 7880
+ },
+ {
+ "epoch": 21.474114441416894,
+ "grad_norm": 16.3781795501709,
+ "learning_rate": 1.826276648785772e-05,
+ "loss": 0.79,
+ "step": 7881
+ },
+ {
+ "epoch": 21.47683923705722,
+ "grad_norm": 8.262587547302246,
+ "learning_rate": 1.8262269377781433e-05,
+ "loss": 0.8599,
+ "step": 7882
+ },
+ {
+ "epoch": 21.479564032697546,
+ "grad_norm": 10.127559661865234,
+ "learning_rate": 1.8261772203358864e-05,
+ "loss": 0.806,
+ "step": 7883
+ },
+ {
+ "epoch": 21.482288828337875,
+ "grad_norm": 8.68094253540039,
+ "learning_rate": 1.826127496459388e-05,
+ "loss": 0.8834,
+ "step": 7884
+ },
+ {
+ "epoch": 21.4850136239782,
+ "grad_norm": 10.492690086364746,
+ "learning_rate": 1.8260777661490346e-05,
+ "loss": 0.8959,
+ "step": 7885
+ },
+ {
+ "epoch": 21.48773841961853,
+ "grad_norm": 9.7289457321167,
+ "learning_rate": 1.8260280294052147e-05,
+ "loss": 0.6808,
+ "step": 7886
+ },
+ {
+ "epoch": 21.490463215258856,
+ "grad_norm": 8.183979988098145,
+ "learning_rate": 1.825978286228315e-05,
+ "loss": 0.6351,
+ "step": 7887
+ },
+ {
+ "epoch": 21.493188010899182,
+ "grad_norm": 7.9571452140808105,
+ "learning_rate": 1.825928536618723e-05,
+ "loss": 0.884,
+ "step": 7888
+ },
+ {
+ "epoch": 21.495912806539508,
+ "grad_norm": 7.1114678382873535,
+ "learning_rate": 1.825878780576826e-05,
+ "loss": 0.7722,
+ "step": 7889
+ },
+ {
+ "epoch": 21.498637602179837,
+ "grad_norm": 9.125557899475098,
+ "learning_rate": 1.8258290181030118e-05,
+ "loss": 0.7119,
+ "step": 7890
+ },
+ {
+ "epoch": 21.501362397820163,
+ "grad_norm": 8.275768280029297,
+ "learning_rate": 1.8257792491976676e-05,
+ "loss": 0.7316,
+ "step": 7891
+ },
+ {
+ "epoch": 21.504087193460492,
+ "grad_norm": 6.560149669647217,
+ "learning_rate": 1.8257294738611814e-05,
+ "loss": 0.6208,
+ "step": 7892
+ },
+ {
+ "epoch": 21.506811989100818,
+ "grad_norm": 11.462034225463867,
+ "learning_rate": 1.8256796920939405e-05,
+ "loss": 0.6605,
+ "step": 7893
+ },
+ {
+ "epoch": 21.509536784741144,
+ "grad_norm": 9.567168235778809,
+ "learning_rate": 1.8256299038963326e-05,
+ "loss": 0.7499,
+ "step": 7894
+ },
+ {
+ "epoch": 21.51226158038147,
+ "grad_norm": 8.80770492553711,
+ "learning_rate": 1.8255801092687456e-05,
+ "loss": 0.6636,
+ "step": 7895
+ },
+ {
+ "epoch": 21.5149863760218,
+ "grad_norm": 7.371953010559082,
+ "learning_rate": 1.8255303082115676e-05,
+ "loss": 0.666,
+ "step": 7896
+ },
+ {
+ "epoch": 21.517711171662125,
+ "grad_norm": 9.620489120483398,
+ "learning_rate": 1.825480500725186e-05,
+ "loss": 0.9453,
+ "step": 7897
+ },
+ {
+ "epoch": 21.520435967302454,
+ "grad_norm": 10.59334945678711,
+ "learning_rate": 1.8254306868099885e-05,
+ "loss": 0.9546,
+ "step": 7898
+ },
+ {
+ "epoch": 21.52316076294278,
+ "grad_norm": 8.24769115447998,
+ "learning_rate": 1.8253808664663636e-05,
+ "loss": 0.582,
+ "step": 7899
+ },
+ {
+ "epoch": 21.525885558583106,
+ "grad_norm": 8.952377319335938,
+ "learning_rate": 1.8253310396946992e-05,
+ "loss": 0.7687,
+ "step": 7900
+ },
+ {
+ "epoch": 21.52861035422343,
+ "grad_norm": 8.575875282287598,
+ "learning_rate": 1.8252812064953832e-05,
+ "loss": 0.7123,
+ "step": 7901
+ },
+ {
+ "epoch": 21.53133514986376,
+ "grad_norm": 8.191732406616211,
+ "learning_rate": 1.8252313668688036e-05,
+ "loss": 0.7455,
+ "step": 7902
+ },
+ {
+ "epoch": 21.534059945504087,
+ "grad_norm": 8.31759262084961,
+ "learning_rate": 1.825181520815349e-05,
+ "loss": 0.7352,
+ "step": 7903
+ },
+ {
+ "epoch": 21.536784741144416,
+ "grad_norm": 7.698764324188232,
+ "learning_rate": 1.825131668335407e-05,
+ "loss": 0.6262,
+ "step": 7904
+ },
+ {
+ "epoch": 21.539509536784742,
+ "grad_norm": 8.273205757141113,
+ "learning_rate": 1.825081809429366e-05,
+ "loss": 0.6234,
+ "step": 7905
+ },
+ {
+ "epoch": 21.542234332425068,
+ "grad_norm": 8.954992294311523,
+ "learning_rate": 1.8250319440976146e-05,
+ "loss": 0.6729,
+ "step": 7906
+ },
+ {
+ "epoch": 21.544959128065393,
+ "grad_norm": 6.745213985443115,
+ "learning_rate": 1.824982072340541e-05,
+ "loss": 0.6978,
+ "step": 7907
+ },
+ {
+ "epoch": 21.547683923705723,
+ "grad_norm": 10.402472496032715,
+ "learning_rate": 1.8249321941585333e-05,
+ "loss": 0.6672,
+ "step": 7908
+ },
+ {
+ "epoch": 21.55040871934605,
+ "grad_norm": 11.216215133666992,
+ "learning_rate": 1.8248823095519804e-05,
+ "loss": 0.9177,
+ "step": 7909
+ },
+ {
+ "epoch": 21.553133514986374,
+ "grad_norm": 8.769536018371582,
+ "learning_rate": 1.824832418521271e-05,
+ "loss": 0.812,
+ "step": 7910
+ },
+ {
+ "epoch": 21.555858310626704,
+ "grad_norm": 8.631336212158203,
+ "learning_rate": 1.8247825210667926e-05,
+ "loss": 0.772,
+ "step": 7911
+ },
+ {
+ "epoch": 21.55858310626703,
+ "grad_norm": 10.451501846313477,
+ "learning_rate": 1.8247326171889346e-05,
+ "loss": 0.7401,
+ "step": 7912
+ },
+ {
+ "epoch": 21.561307901907355,
+ "grad_norm": 7.815615653991699,
+ "learning_rate": 1.824682706888086e-05,
+ "loss": 0.7202,
+ "step": 7913
+ },
+ {
+ "epoch": 21.564032697547685,
+ "grad_norm": 7.0563740730285645,
+ "learning_rate": 1.8246327901646344e-05,
+ "loss": 0.8525,
+ "step": 7914
+ },
+ {
+ "epoch": 21.56675749318801,
+ "grad_norm": 8.432811737060547,
+ "learning_rate": 1.8245828670189697e-05,
+ "loss": 0.6382,
+ "step": 7915
+ },
+ {
+ "epoch": 21.569482288828336,
+ "grad_norm": 10.904496192932129,
+ "learning_rate": 1.8245329374514803e-05,
+ "loss": 0.6903,
+ "step": 7916
+ },
+ {
+ "epoch": 21.572207084468666,
+ "grad_norm": 7.396626949310303,
+ "learning_rate": 1.8244830014625546e-05,
+ "loss": 0.6741,
+ "step": 7917
+ },
+ {
+ "epoch": 21.57493188010899,
+ "grad_norm": 7.294145584106445,
+ "learning_rate": 1.8244330590525817e-05,
+ "loss": 0.6677,
+ "step": 7918
+ },
+ {
+ "epoch": 21.577656675749317,
+ "grad_norm": 8.535848617553711,
+ "learning_rate": 1.8243831102219507e-05,
+ "loss": 0.871,
+ "step": 7919
+ },
+ {
+ "epoch": 21.580381471389646,
+ "grad_norm": 8.005303382873535,
+ "learning_rate": 1.8243331549710505e-05,
+ "loss": 0.5657,
+ "step": 7920
+ },
+ {
+ "epoch": 21.583106267029972,
+ "grad_norm": 10.448698997497559,
+ "learning_rate": 1.8242831933002704e-05,
+ "loss": 0.5724,
+ "step": 7921
+ },
+ {
+ "epoch": 21.585831062670298,
+ "grad_norm": 8.847328186035156,
+ "learning_rate": 1.8242332252099994e-05,
+ "loss": 0.8586,
+ "step": 7922
+ },
+ {
+ "epoch": 21.588555858310627,
+ "grad_norm": 8.258277893066406,
+ "learning_rate": 1.8241832507006265e-05,
+ "loss": 0.718,
+ "step": 7923
+ },
+ {
+ "epoch": 21.591280653950953,
+ "grad_norm": 9.496620178222656,
+ "learning_rate": 1.824133269772541e-05,
+ "loss": 0.8494,
+ "step": 7924
+ },
+ {
+ "epoch": 21.59400544959128,
+ "grad_norm": 14.107674598693848,
+ "learning_rate": 1.824083282426132e-05,
+ "loss": 0.6569,
+ "step": 7925
+ },
+ {
+ "epoch": 21.59673024523161,
+ "grad_norm": 9.128961563110352,
+ "learning_rate": 1.824033288661789e-05,
+ "loss": 0.7015,
+ "step": 7926
+ },
+ {
+ "epoch": 21.599455040871934,
+ "grad_norm": 10.131857872009277,
+ "learning_rate": 1.823983288479901e-05,
+ "loss": 0.6528,
+ "step": 7927
+ },
+ {
+ "epoch": 21.60217983651226,
+ "grad_norm": 9.59658145904541,
+ "learning_rate": 1.823933281880858e-05,
+ "loss": 0.8142,
+ "step": 7928
+ },
+ {
+ "epoch": 21.60490463215259,
+ "grad_norm": 8.79918098449707,
+ "learning_rate": 1.823883268865049e-05,
+ "loss": 0.7122,
+ "step": 7929
+ },
+ {
+ "epoch": 21.607629427792915,
+ "grad_norm": 7.878252029418945,
+ "learning_rate": 1.823833249432864e-05,
+ "loss": 0.7546,
+ "step": 7930
+ },
+ {
+ "epoch": 21.61035422343324,
+ "grad_norm": 9.626506805419922,
+ "learning_rate": 1.8237832235846916e-05,
+ "loss": 0.7728,
+ "step": 7931
+ },
+ {
+ "epoch": 21.61307901907357,
+ "grad_norm": 9.732280731201172,
+ "learning_rate": 1.8237331913209223e-05,
+ "loss": 0.7407,
+ "step": 7932
+ },
+ {
+ "epoch": 21.615803814713896,
+ "grad_norm": 7.609302997589111,
+ "learning_rate": 1.8236831526419453e-05,
+ "loss": 0.5814,
+ "step": 7933
+ },
+ {
+ "epoch": 21.618528610354222,
+ "grad_norm": 9.080131530761719,
+ "learning_rate": 1.8236331075481503e-05,
+ "loss": 0.6292,
+ "step": 7934
+ },
+ {
+ "epoch": 21.62125340599455,
+ "grad_norm": 9.119004249572754,
+ "learning_rate": 1.8235830560399273e-05,
+ "loss": 0.6587,
+ "step": 7935
+ },
+ {
+ "epoch": 21.623978201634877,
+ "grad_norm": 9.003334999084473,
+ "learning_rate": 1.823532998117666e-05,
+ "loss": 0.7407,
+ "step": 7936
+ },
+ {
+ "epoch": 21.626702997275203,
+ "grad_norm": 11.348891258239746,
+ "learning_rate": 1.8234829337817562e-05,
+ "loss": 0.739,
+ "step": 7937
+ },
+ {
+ "epoch": 21.629427792915532,
+ "grad_norm": 7.240442752838135,
+ "learning_rate": 1.8234328630325876e-05,
+ "loss": 0.8259,
+ "step": 7938
+ },
+ {
+ "epoch": 21.632152588555858,
+ "grad_norm": 12.556734085083008,
+ "learning_rate": 1.8233827858705507e-05,
+ "loss": 0.8721,
+ "step": 7939
+ },
+ {
+ "epoch": 21.634877384196184,
+ "grad_norm": 8.399681091308594,
+ "learning_rate": 1.823332702296035e-05,
+ "loss": 0.7849,
+ "step": 7940
+ },
+ {
+ "epoch": 21.637602179836513,
+ "grad_norm": 9.10388469696045,
+ "learning_rate": 1.8232826123094308e-05,
+ "loss": 0.6383,
+ "step": 7941
+ },
+ {
+ "epoch": 21.64032697547684,
+ "grad_norm": 7.981561183929443,
+ "learning_rate": 1.823232515911128e-05,
+ "loss": 0.8083,
+ "step": 7942
+ },
+ {
+ "epoch": 21.643051771117165,
+ "grad_norm": 7.688388347625732,
+ "learning_rate": 1.8231824131015166e-05,
+ "loss": 0.5851,
+ "step": 7943
+ },
+ {
+ "epoch": 21.645776566757494,
+ "grad_norm": 7.962990760803223,
+ "learning_rate": 1.823132303880988e-05,
+ "loss": 0.6984,
+ "step": 7944
+ },
+ {
+ "epoch": 21.64850136239782,
+ "grad_norm": 8.506324768066406,
+ "learning_rate": 1.8230821882499307e-05,
+ "loss": 0.8352,
+ "step": 7945
+ },
+ {
+ "epoch": 21.651226158038146,
+ "grad_norm": 9.10961627960205,
+ "learning_rate": 1.823032066208736e-05,
+ "loss": 0.8057,
+ "step": 7946
+ },
+ {
+ "epoch": 21.653950953678475,
+ "grad_norm": 8.348368644714355,
+ "learning_rate": 1.8229819377577938e-05,
+ "loss": 0.6708,
+ "step": 7947
+ },
+ {
+ "epoch": 21.6566757493188,
+ "grad_norm": 7.474180698394775,
+ "learning_rate": 1.822931802897495e-05,
+ "loss": 0.6534,
+ "step": 7948
+ },
+ {
+ "epoch": 21.659400544959126,
+ "grad_norm": 11.66097640991211,
+ "learning_rate": 1.8228816616282298e-05,
+ "loss": 0.7632,
+ "step": 7949
+ },
+ {
+ "epoch": 21.662125340599456,
+ "grad_norm": 14.725122451782227,
+ "learning_rate": 1.822831513950389e-05,
+ "loss": 0.8108,
+ "step": 7950
+ },
+ {
+ "epoch": 21.66485013623978,
+ "grad_norm": 7.565695285797119,
+ "learning_rate": 1.8227813598643623e-05,
+ "loss": 0.6025,
+ "step": 7951
+ },
+ {
+ "epoch": 21.667574931880107,
+ "grad_norm": 11.076896667480469,
+ "learning_rate": 1.822731199370541e-05,
+ "loss": 0.7438,
+ "step": 7952
+ },
+ {
+ "epoch": 21.670299727520437,
+ "grad_norm": 10.393583297729492,
+ "learning_rate": 1.822681032469316e-05,
+ "loss": 0.7128,
+ "step": 7953
+ },
+ {
+ "epoch": 21.673024523160763,
+ "grad_norm": 7.5954694747924805,
+ "learning_rate": 1.8226308591610772e-05,
+ "loss": 0.6598,
+ "step": 7954
+ },
+ {
+ "epoch": 21.67574931880109,
+ "grad_norm": 7.7545623779296875,
+ "learning_rate": 1.8225806794462156e-05,
+ "loss": 0.8911,
+ "step": 7955
+ },
+ {
+ "epoch": 21.678474114441418,
+ "grad_norm": 15.038293838500977,
+ "learning_rate": 1.8225304933251226e-05,
+ "loss": 0.743,
+ "step": 7956
+ },
+ {
+ "epoch": 21.681198910081743,
+ "grad_norm": 8.431268692016602,
+ "learning_rate": 1.8224803007981883e-05,
+ "loss": 0.6809,
+ "step": 7957
+ },
+ {
+ "epoch": 21.68392370572207,
+ "grad_norm": 8.869983673095703,
+ "learning_rate": 1.8224301018658042e-05,
+ "loss": 0.5802,
+ "step": 7958
+ },
+ {
+ "epoch": 21.6866485013624,
+ "grad_norm": 7.820289611816406,
+ "learning_rate": 1.8223798965283606e-05,
+ "loss": 0.8416,
+ "step": 7959
+ },
+ {
+ "epoch": 21.689373297002724,
+ "grad_norm": 9.78795051574707,
+ "learning_rate": 1.8223296847862492e-05,
+ "loss": 0.8647,
+ "step": 7960
+ },
+ {
+ "epoch": 21.69209809264305,
+ "grad_norm": 9.411185264587402,
+ "learning_rate": 1.8222794666398602e-05,
+ "loss": 0.7452,
+ "step": 7961
+ },
+ {
+ "epoch": 21.69482288828338,
+ "grad_norm": 8.101469039916992,
+ "learning_rate": 1.8222292420895857e-05,
+ "loss": 0.7953,
+ "step": 7962
+ },
+ {
+ "epoch": 21.697547683923705,
+ "grad_norm": 8.729936599731445,
+ "learning_rate": 1.8221790111358156e-05,
+ "loss": 0.7415,
+ "step": 7963
+ },
+ {
+ "epoch": 21.70027247956403,
+ "grad_norm": 6.6953511238098145,
+ "learning_rate": 1.8221287737789423e-05,
+ "loss": 0.7032,
+ "step": 7964
+ },
+ {
+ "epoch": 21.70299727520436,
+ "grad_norm": 6.772510051727295,
+ "learning_rate": 1.8220785300193565e-05,
+ "loss": 0.7838,
+ "step": 7965
+ },
+ {
+ "epoch": 21.705722070844686,
+ "grad_norm": 8.998079299926758,
+ "learning_rate": 1.8220282798574497e-05,
+ "loss": 0.8809,
+ "step": 7966
+ },
+ {
+ "epoch": 21.708446866485012,
+ "grad_norm": 10.296906471252441,
+ "learning_rate": 1.821978023293613e-05,
+ "loss": 0.6854,
+ "step": 7967
+ },
+ {
+ "epoch": 21.71117166212534,
+ "grad_norm": 7.554832458496094,
+ "learning_rate": 1.8219277603282378e-05,
+ "loss": 0.9015,
+ "step": 7968
+ },
+ {
+ "epoch": 21.713896457765667,
+ "grad_norm": 8.607104301452637,
+ "learning_rate": 1.8218774909617157e-05,
+ "loss": 0.947,
+ "step": 7969
+ },
+ {
+ "epoch": 21.716621253405993,
+ "grad_norm": 8.692824363708496,
+ "learning_rate": 1.8218272151944383e-05,
+ "loss": 0.8123,
+ "step": 7970
+ },
+ {
+ "epoch": 21.719346049046322,
+ "grad_norm": 5.778202056884766,
+ "learning_rate": 1.821776933026797e-05,
+ "loss": 0.7533,
+ "step": 7971
+ },
+ {
+ "epoch": 21.722070844686648,
+ "grad_norm": 40.46097183227539,
+ "learning_rate": 1.8217266444591835e-05,
+ "loss": 0.6561,
+ "step": 7972
+ },
+ {
+ "epoch": 21.724795640326974,
+ "grad_norm": 9.413145065307617,
+ "learning_rate": 1.8216763494919888e-05,
+ "loss": 0.8752,
+ "step": 7973
+ },
+ {
+ "epoch": 21.727520435967303,
+ "grad_norm": 9.560535430908203,
+ "learning_rate": 1.8216260481256058e-05,
+ "loss": 0.7362,
+ "step": 7974
+ },
+ {
+ "epoch": 21.73024523160763,
+ "grad_norm": 8.597753524780273,
+ "learning_rate": 1.8215757403604252e-05,
+ "loss": 0.7456,
+ "step": 7975
+ },
+ {
+ "epoch": 21.732970027247955,
+ "grad_norm": 8.375833511352539,
+ "learning_rate": 1.821525426196839e-05,
+ "loss": 0.8604,
+ "step": 7976
+ },
+ {
+ "epoch": 21.735694822888284,
+ "grad_norm": 8.554570198059082,
+ "learning_rate": 1.8214751056352397e-05,
+ "loss": 0.652,
+ "step": 7977
+ },
+ {
+ "epoch": 21.73841961852861,
+ "grad_norm": 9.537891387939453,
+ "learning_rate": 1.8214247786760184e-05,
+ "loss": 0.7294,
+ "step": 7978
+ },
+ {
+ "epoch": 21.741144414168936,
+ "grad_norm": 14.614935874938965,
+ "learning_rate": 1.8213744453195676e-05,
+ "loss": 0.9902,
+ "step": 7979
+ },
+ {
+ "epoch": 21.743869209809265,
+ "grad_norm": 9.442888259887695,
+ "learning_rate": 1.8213241055662786e-05,
+ "loss": 0.7906,
+ "step": 7980
+ },
+ {
+ "epoch": 21.74659400544959,
+ "grad_norm": 8.972207069396973,
+ "learning_rate": 1.8212737594165444e-05,
+ "loss": 0.7928,
+ "step": 7981
+ },
+ {
+ "epoch": 21.749318801089917,
+ "grad_norm": 11.947616577148438,
+ "learning_rate": 1.8212234068707563e-05,
+ "loss": 0.8579,
+ "step": 7982
+ },
+ {
+ "epoch": 21.752043596730246,
+ "grad_norm": 8.358003616333008,
+ "learning_rate": 1.8211730479293067e-05,
+ "loss": 0.712,
+ "step": 7983
+ },
+ {
+ "epoch": 21.754768392370572,
+ "grad_norm": 7.6386613845825195,
+ "learning_rate": 1.8211226825925883e-05,
+ "loss": 0.6794,
+ "step": 7984
+ },
+ {
+ "epoch": 21.757493188010898,
+ "grad_norm": 12.572188377380371,
+ "learning_rate": 1.8210723108609923e-05,
+ "loss": 0.7697,
+ "step": 7985
+ },
+ {
+ "epoch": 21.760217983651227,
+ "grad_norm": 10.8894624710083,
+ "learning_rate": 1.8210219327349122e-05,
+ "loss": 0.787,
+ "step": 7986
+ },
+ {
+ "epoch": 21.762942779291553,
+ "grad_norm": 8.683341026306152,
+ "learning_rate": 1.8209715482147393e-05,
+ "loss": 0.619,
+ "step": 7987
+ },
+ {
+ "epoch": 21.76566757493188,
+ "grad_norm": 9.78201961517334,
+ "learning_rate": 1.8209211573008663e-05,
+ "loss": 0.9135,
+ "step": 7988
+ },
+ {
+ "epoch": 21.768392370572208,
+ "grad_norm": 8.886528968811035,
+ "learning_rate": 1.8208707599936858e-05,
+ "loss": 0.8416,
+ "step": 7989
+ },
+ {
+ "epoch": 21.771117166212534,
+ "grad_norm": 8.137007713317871,
+ "learning_rate": 1.8208203562935902e-05,
+ "loss": 0.7484,
+ "step": 7990
+ },
+ {
+ "epoch": 21.77384196185286,
+ "grad_norm": 8.364813804626465,
+ "learning_rate": 1.8207699462009722e-05,
+ "loss": 0.6542,
+ "step": 7991
+ },
+ {
+ "epoch": 21.77656675749319,
+ "grad_norm": 8.100030899047852,
+ "learning_rate": 1.8207195297162245e-05,
+ "loss": 0.6743,
+ "step": 7992
+ },
+ {
+ "epoch": 21.779291553133515,
+ "grad_norm": 7.499617576599121,
+ "learning_rate": 1.820669106839739e-05,
+ "loss": 0.7401,
+ "step": 7993
+ },
+ {
+ "epoch": 21.78201634877384,
+ "grad_norm": 9.239191055297852,
+ "learning_rate": 1.8206186775719096e-05,
+ "loss": 0.7218,
+ "step": 7994
+ },
+ {
+ "epoch": 21.78474114441417,
+ "grad_norm": 8.191755294799805,
+ "learning_rate": 1.8205682419131277e-05,
+ "loss": 0.7122,
+ "step": 7995
+ },
+ {
+ "epoch": 21.787465940054496,
+ "grad_norm": 17.269739151000977,
+ "learning_rate": 1.8205177998637872e-05,
+ "loss": 0.8901,
+ "step": 7996
+ },
+ {
+ "epoch": 21.79019073569482,
+ "grad_norm": 10.68104076385498,
+ "learning_rate": 1.8204673514242804e-05,
+ "loss": 0.8568,
+ "step": 7997
+ },
+ {
+ "epoch": 21.79291553133515,
+ "grad_norm": 10.695720672607422,
+ "learning_rate": 1.820416896595e-05,
+ "loss": 0.8121,
+ "step": 7998
+ },
+ {
+ "epoch": 21.795640326975477,
+ "grad_norm": 9.297723770141602,
+ "learning_rate": 1.8203664353763393e-05,
+ "loss": 0.6395,
+ "step": 7999
+ },
+ {
+ "epoch": 21.798365122615802,
+ "grad_norm": 8.26783561706543,
+ "learning_rate": 1.8203159677686914e-05,
+ "loss": 0.6795,
+ "step": 8000
+ },
+ {
+ "epoch": 21.80108991825613,
+ "grad_norm": 8.635510444641113,
+ "learning_rate": 1.820265493772449e-05,
+ "loss": 0.5949,
+ "step": 8001
+ },
+ {
+ "epoch": 21.803814713896458,
+ "grad_norm": 9.092911720275879,
+ "learning_rate": 1.8202150133880052e-05,
+ "loss": 0.7261,
+ "step": 8002
+ },
+ {
+ "epoch": 21.806539509536783,
+ "grad_norm": 8.284882545471191,
+ "learning_rate": 1.8201645266157534e-05,
+ "loss": 0.7927,
+ "step": 8003
+ },
+ {
+ "epoch": 21.809264305177113,
+ "grad_norm": 7.807535171508789,
+ "learning_rate": 1.8201140334560867e-05,
+ "loss": 0.7951,
+ "step": 8004
+ },
+ {
+ "epoch": 21.81198910081744,
+ "grad_norm": 12.532002449035645,
+ "learning_rate": 1.8200635339093983e-05,
+ "loss": 0.7982,
+ "step": 8005
+ },
+ {
+ "epoch": 21.814713896457764,
+ "grad_norm": 8.454265594482422,
+ "learning_rate": 1.8200130279760814e-05,
+ "loss": 0.7979,
+ "step": 8006
+ },
+ {
+ "epoch": 21.817438692098094,
+ "grad_norm": 9.2294340133667,
+ "learning_rate": 1.8199625156565295e-05,
+ "loss": 0.8566,
+ "step": 8007
+ },
+ {
+ "epoch": 21.82016348773842,
+ "grad_norm": 9.567198753356934,
+ "learning_rate": 1.8199119969511362e-05,
+ "loss": 0.6354,
+ "step": 8008
+ },
+ {
+ "epoch": 21.822888283378745,
+ "grad_norm": 9.14952564239502,
+ "learning_rate": 1.8198614718602943e-05,
+ "loss": 0.7948,
+ "step": 8009
+ },
+ {
+ "epoch": 21.825613079019075,
+ "grad_norm": 17.607019424438477,
+ "learning_rate": 1.8198109403843977e-05,
+ "loss": 0.7565,
+ "step": 8010
+ },
+ {
+ "epoch": 21.8283378746594,
+ "grad_norm": 14.952523231506348,
+ "learning_rate": 1.8197604025238398e-05,
+ "loss": 0.8657,
+ "step": 8011
+ },
+ {
+ "epoch": 21.831062670299726,
+ "grad_norm": 13.148463249206543,
+ "learning_rate": 1.8197098582790144e-05,
+ "loss": 0.7017,
+ "step": 8012
+ },
+ {
+ "epoch": 21.833787465940055,
+ "grad_norm": 8.732821464538574,
+ "learning_rate": 1.819659307650315e-05,
+ "loss": 0.8524,
+ "step": 8013
+ },
+ {
+ "epoch": 21.83651226158038,
+ "grad_norm": 14.557068824768066,
+ "learning_rate": 1.8196087506381356e-05,
+ "loss": 0.8275,
+ "step": 8014
+ },
+ {
+ "epoch": 21.839237057220707,
+ "grad_norm": 10.754493713378906,
+ "learning_rate": 1.8195581872428693e-05,
+ "loss": 0.7708,
+ "step": 8015
+ },
+ {
+ "epoch": 21.841961852861036,
+ "grad_norm": 9.273686408996582,
+ "learning_rate": 1.81950761746491e-05,
+ "loss": 0.7947,
+ "step": 8016
+ },
+ {
+ "epoch": 21.844686648501362,
+ "grad_norm": 10.021817207336426,
+ "learning_rate": 1.819457041304652e-05,
+ "loss": 0.7877,
+ "step": 8017
+ },
+ {
+ "epoch": 21.847411444141688,
+ "grad_norm": 7.916262149810791,
+ "learning_rate": 1.819406458762489e-05,
+ "loss": 0.7999,
+ "step": 8018
+ },
+ {
+ "epoch": 21.850136239782017,
+ "grad_norm": 10.504857063293457,
+ "learning_rate": 1.8193558698388148e-05,
+ "loss": 0.7526,
+ "step": 8019
+ },
+ {
+ "epoch": 21.852861035422343,
+ "grad_norm": 7.127544403076172,
+ "learning_rate": 1.819305274534023e-05,
+ "loss": 0.7443,
+ "step": 8020
+ },
+ {
+ "epoch": 21.85558583106267,
+ "grad_norm": 9.729533195495605,
+ "learning_rate": 1.8192546728485087e-05,
+ "loss": 0.7009,
+ "step": 8021
+ },
+ {
+ "epoch": 21.858310626703,
+ "grad_norm": 11.557148933410645,
+ "learning_rate": 1.8192040647826652e-05,
+ "loss": 0.9875,
+ "step": 8022
+ },
+ {
+ "epoch": 21.861035422343324,
+ "grad_norm": 9.22014331817627,
+ "learning_rate": 1.819153450336887e-05,
+ "loss": 0.6754,
+ "step": 8023
+ },
+ {
+ "epoch": 21.86376021798365,
+ "grad_norm": 9.431036949157715,
+ "learning_rate": 1.819102829511568e-05,
+ "loss": 0.6737,
+ "step": 8024
+ },
+ {
+ "epoch": 21.86648501362398,
+ "grad_norm": 8.149208068847656,
+ "learning_rate": 1.819052202307102e-05,
+ "loss": 0.7744,
+ "step": 8025
+ },
+ {
+ "epoch": 21.869209809264305,
+ "grad_norm": 7.808688163757324,
+ "learning_rate": 1.8190015687238848e-05,
+ "loss": 0.8295,
+ "step": 8026
+ },
+ {
+ "epoch": 21.87193460490463,
+ "grad_norm": 8.341070175170898,
+ "learning_rate": 1.818950928762309e-05,
+ "loss": 0.7428,
+ "step": 8027
+ },
+ {
+ "epoch": 21.87465940054496,
+ "grad_norm": 10.882519721984863,
+ "learning_rate": 1.81890028242277e-05,
+ "loss": 0.7593,
+ "step": 8028
+ },
+ {
+ "epoch": 21.877384196185286,
+ "grad_norm": 11.259774208068848,
+ "learning_rate": 1.8188496297056616e-05,
+ "loss": 0.7113,
+ "step": 8029
+ },
+ {
+ "epoch": 21.88010899182561,
+ "grad_norm": 10.727615356445312,
+ "learning_rate": 1.818798970611379e-05,
+ "loss": 0.9111,
+ "step": 8030
+ },
+ {
+ "epoch": 21.88283378746594,
+ "grad_norm": 16.16585350036621,
+ "learning_rate": 1.8187483051403162e-05,
+ "loss": 0.9004,
+ "step": 8031
+ },
+ {
+ "epoch": 21.885558583106267,
+ "grad_norm": 9.897339820861816,
+ "learning_rate": 1.818697633292868e-05,
+ "loss": 0.7002,
+ "step": 8032
+ },
+ {
+ "epoch": 21.888283378746593,
+ "grad_norm": 7.668357849121094,
+ "learning_rate": 1.818646955069429e-05,
+ "loss": 0.8422,
+ "step": 8033
+ },
+ {
+ "epoch": 21.891008174386922,
+ "grad_norm": 9.614480018615723,
+ "learning_rate": 1.8185962704703942e-05,
+ "loss": 0.6727,
+ "step": 8034
+ },
+ {
+ "epoch": 21.893732970027248,
+ "grad_norm": 7.975518226623535,
+ "learning_rate": 1.8185455794961574e-05,
+ "loss": 0.8705,
+ "step": 8035
+ },
+ {
+ "epoch": 21.896457765667574,
+ "grad_norm": 8.036733627319336,
+ "learning_rate": 1.8184948821471144e-05,
+ "loss": 0.7402,
+ "step": 8036
+ },
+ {
+ "epoch": 21.899182561307903,
+ "grad_norm": 10.84546947479248,
+ "learning_rate": 1.8184441784236595e-05,
+ "loss": 0.8982,
+ "step": 8037
+ },
+ {
+ "epoch": 21.90190735694823,
+ "grad_norm": 10.531929016113281,
+ "learning_rate": 1.8183934683261875e-05,
+ "loss": 0.8087,
+ "step": 8038
+ },
+ {
+ "epoch": 21.904632152588555,
+ "grad_norm": 7.393584728240967,
+ "learning_rate": 1.8183427518550934e-05,
+ "loss": 0.7101,
+ "step": 8039
+ },
+ {
+ "epoch": 21.907356948228884,
+ "grad_norm": 7.93975305557251,
+ "learning_rate": 1.8182920290107727e-05,
+ "loss": 0.8103,
+ "step": 8040
+ },
+ {
+ "epoch": 21.91008174386921,
+ "grad_norm": 7.738041400909424,
+ "learning_rate": 1.8182412997936197e-05,
+ "loss": 0.9581,
+ "step": 8041
+ },
+ {
+ "epoch": 21.912806539509535,
+ "grad_norm": 10.444761276245117,
+ "learning_rate": 1.8181905642040298e-05,
+ "loss": 0.7683,
+ "step": 8042
+ },
+ {
+ "epoch": 21.915531335149865,
+ "grad_norm": 9.234233856201172,
+ "learning_rate": 1.8181398222423984e-05,
+ "loss": 0.7468,
+ "step": 8043
+ },
+ {
+ "epoch": 21.91825613079019,
+ "grad_norm": 9.53412914276123,
+ "learning_rate": 1.8180890739091205e-05,
+ "loss": 0.6504,
+ "step": 8044
+ },
+ {
+ "epoch": 21.920980926430516,
+ "grad_norm": 9.891529083251953,
+ "learning_rate": 1.8180383192045906e-05,
+ "loss": 0.7048,
+ "step": 8045
+ },
+ {
+ "epoch": 21.923705722070846,
+ "grad_norm": 10.515586853027344,
+ "learning_rate": 1.817987558129205e-05,
+ "loss": 0.8552,
+ "step": 8046
+ },
+ {
+ "epoch": 21.92643051771117,
+ "grad_norm": 11.16555404663086,
+ "learning_rate": 1.8179367906833586e-05,
+ "loss": 0.7252,
+ "step": 8047
+ },
+ {
+ "epoch": 21.929155313351497,
+ "grad_norm": 9.70915412902832,
+ "learning_rate": 1.817886016867447e-05,
+ "loss": 0.6676,
+ "step": 8048
+ },
+ {
+ "epoch": 21.931880108991827,
+ "grad_norm": 27.498109817504883,
+ "learning_rate": 1.817835236681865e-05,
+ "loss": 0.7378,
+ "step": 8049
+ },
+ {
+ "epoch": 21.934604904632153,
+ "grad_norm": 14.925739288330078,
+ "learning_rate": 1.8177844501270088e-05,
+ "loss": 0.8044,
+ "step": 8050
+ },
+ {
+ "epoch": 21.93732970027248,
+ "grad_norm": 8.186935424804688,
+ "learning_rate": 1.817733657203273e-05,
+ "loss": 0.8361,
+ "step": 8051
+ },
+ {
+ "epoch": 21.940054495912808,
+ "grad_norm": 7.971308708190918,
+ "learning_rate": 1.817682857911055e-05,
+ "loss": 0.7766,
+ "step": 8052
+ },
+ {
+ "epoch": 21.942779291553133,
+ "grad_norm": 8.413043975830078,
+ "learning_rate": 1.8176320522507485e-05,
+ "loss": 0.7009,
+ "step": 8053
+ },
+ {
+ "epoch": 21.94550408719346,
+ "grad_norm": 7.476767063140869,
+ "learning_rate": 1.81758124022275e-05,
+ "loss": 0.6925,
+ "step": 8054
+ },
+ {
+ "epoch": 21.94822888283379,
+ "grad_norm": 8.602943420410156,
+ "learning_rate": 1.817530421827455e-05,
+ "loss": 0.8936,
+ "step": 8055
+ },
+ {
+ "epoch": 21.950953678474114,
+ "grad_norm": 12.193194389343262,
+ "learning_rate": 1.8174795970652592e-05,
+ "loss": 0.8,
+ "step": 8056
+ },
+ {
+ "epoch": 21.95367847411444,
+ "grad_norm": 9.034198760986328,
+ "learning_rate": 1.817428765936559e-05,
+ "loss": 0.8422,
+ "step": 8057
+ },
+ {
+ "epoch": 21.95640326975477,
+ "grad_norm": 34.969703674316406,
+ "learning_rate": 1.8173779284417497e-05,
+ "loss": 0.9277,
+ "step": 8058
+ },
+ {
+ "epoch": 21.959128065395095,
+ "grad_norm": 10.297454833984375,
+ "learning_rate": 1.8173270845812273e-05,
+ "loss": 0.746,
+ "step": 8059
+ },
+ {
+ "epoch": 21.96185286103542,
+ "grad_norm": 9.3963041305542,
+ "learning_rate": 1.8172762343553883e-05,
+ "loss": 0.8197,
+ "step": 8060
+ },
+ {
+ "epoch": 21.96457765667575,
+ "grad_norm": 8.728163719177246,
+ "learning_rate": 1.817225377764628e-05,
+ "loss": 0.7479,
+ "step": 8061
+ },
+ {
+ "epoch": 21.967302452316076,
+ "grad_norm": 9.23142147064209,
+ "learning_rate": 1.8171745148093425e-05,
+ "loss": 0.703,
+ "step": 8062
+ },
+ {
+ "epoch": 21.970027247956402,
+ "grad_norm": 24.890634536743164,
+ "learning_rate": 1.8171236454899283e-05,
+ "loss": 0.8262,
+ "step": 8063
+ },
+ {
+ "epoch": 21.97275204359673,
+ "grad_norm": 8.38480281829834,
+ "learning_rate": 1.8170727698067817e-05,
+ "loss": 0.8821,
+ "step": 8064
+ },
+ {
+ "epoch": 21.975476839237057,
+ "grad_norm": 10.035608291625977,
+ "learning_rate": 1.8170218877602987e-05,
+ "loss": 0.8413,
+ "step": 8065
+ },
+ {
+ "epoch": 21.978201634877383,
+ "grad_norm": 9.714282989501953,
+ "learning_rate": 1.816970999350875e-05,
+ "loss": 0.7596,
+ "step": 8066
+ },
+ {
+ "epoch": 21.980926430517712,
+ "grad_norm": 8.85979175567627,
+ "learning_rate": 1.816920104578908e-05,
+ "loss": 0.7859,
+ "step": 8067
+ },
+ {
+ "epoch": 21.983651226158038,
+ "grad_norm": 8.130599975585938,
+ "learning_rate": 1.816869203444793e-05,
+ "loss": 0.8478,
+ "step": 8068
+ },
+ {
+ "epoch": 21.986376021798364,
+ "grad_norm": 9.997649192810059,
+ "learning_rate": 1.8168182959489277e-05,
+ "loss": 0.7366,
+ "step": 8069
+ },
+ {
+ "epoch": 21.989100817438693,
+ "grad_norm": 7.8750505447387695,
+ "learning_rate": 1.8167673820917073e-05,
+ "loss": 0.7366,
+ "step": 8070
+ },
+ {
+ "epoch": 21.99182561307902,
+ "grad_norm": 8.245959281921387,
+ "learning_rate": 1.816716461873529e-05,
+ "loss": 0.8219,
+ "step": 8071
+ },
+ {
+ "epoch": 21.994550408719345,
+ "grad_norm": 9.712108612060547,
+ "learning_rate": 1.816665535294789e-05,
+ "loss": 0.7715,
+ "step": 8072
+ },
+ {
+ "epoch": 21.997275204359674,
+ "grad_norm": 11.4086332321167,
+ "learning_rate": 1.816614602355884e-05,
+ "loss": 0.8273,
+ "step": 8073
+ },
+ {
+ "epoch": 22.0,
+ "grad_norm": 8.965995788574219,
+ "learning_rate": 1.816563663057211e-05,
+ "loss": 0.6558,
+ "step": 8074
+ },
+ {
+ "epoch": 22.002724795640326,
+ "grad_norm": 10.172837257385254,
+ "learning_rate": 1.8165127173991667e-05,
+ "loss": 0.6926,
+ "step": 8075
+ },
+ {
+ "epoch": 22.005449591280655,
+ "grad_norm": 8.559929847717285,
+ "learning_rate": 1.816461765382147e-05,
+ "loss": 0.7812,
+ "step": 8076
+ },
+ {
+ "epoch": 22.00817438692098,
+ "grad_norm": 7.295583724975586,
+ "learning_rate": 1.8164108070065498e-05,
+ "loss": 0.494,
+ "step": 8077
+ },
+ {
+ "epoch": 22.010899182561307,
+ "grad_norm": 8.792229652404785,
+ "learning_rate": 1.8163598422727714e-05,
+ "loss": 0.7005,
+ "step": 8078
+ },
+ {
+ "epoch": 22.013623978201636,
+ "grad_norm": 7.681225776672363,
+ "learning_rate": 1.816308871181209e-05,
+ "loss": 0.5142,
+ "step": 8079
+ },
+ {
+ "epoch": 22.016348773841962,
+ "grad_norm": 7.9823198318481445,
+ "learning_rate": 1.816257893732259e-05,
+ "loss": 0.7559,
+ "step": 8080
+ },
+ {
+ "epoch": 22.019073569482288,
+ "grad_norm": 8.489956855773926,
+ "learning_rate": 1.816206909926319e-05,
+ "loss": 0.5811,
+ "step": 8081
+ },
+ {
+ "epoch": 22.021798365122617,
+ "grad_norm": 8.067201614379883,
+ "learning_rate": 1.816155919763786e-05,
+ "loss": 0.8422,
+ "step": 8082
+ },
+ {
+ "epoch": 22.024523160762943,
+ "grad_norm": 15.2614107131958,
+ "learning_rate": 1.8161049232450566e-05,
+ "loss": 0.7727,
+ "step": 8083
+ },
+ {
+ "epoch": 22.02724795640327,
+ "grad_norm": 9.465600967407227,
+ "learning_rate": 1.8160539203705285e-05,
+ "loss": 0.6544,
+ "step": 8084
+ },
+ {
+ "epoch": 22.029972752043598,
+ "grad_norm": 24.28710174560547,
+ "learning_rate": 1.8160029111405986e-05,
+ "loss": 0.78,
+ "step": 8085
+ },
+ {
+ "epoch": 22.032697547683924,
+ "grad_norm": 9.697113990783691,
+ "learning_rate": 1.815951895555665e-05,
+ "loss": 0.6359,
+ "step": 8086
+ },
+ {
+ "epoch": 22.03542234332425,
+ "grad_norm": 8.137419700622559,
+ "learning_rate": 1.8159008736161236e-05,
+ "loss": 0.6996,
+ "step": 8087
+ },
+ {
+ "epoch": 22.03814713896458,
+ "grad_norm": 8.577265739440918,
+ "learning_rate": 1.815849845322373e-05,
+ "loss": 0.6985,
+ "step": 8088
+ },
+ {
+ "epoch": 22.040871934604905,
+ "grad_norm": 10.814737319946289,
+ "learning_rate": 1.815798810674809e-05,
+ "loss": 0.5823,
+ "step": 8089
+ },
+ {
+ "epoch": 22.04359673024523,
+ "grad_norm": 9.610568046569824,
+ "learning_rate": 1.8157477696738312e-05,
+ "loss": 0.8083,
+ "step": 8090
+ },
+ {
+ "epoch": 22.04632152588556,
+ "grad_norm": 10.783349990844727,
+ "learning_rate": 1.8156967223198358e-05,
+ "loss": 0.7408,
+ "step": 8091
+ },
+ {
+ "epoch": 22.049046321525886,
+ "grad_norm": 8.860383987426758,
+ "learning_rate": 1.81564566861322e-05,
+ "loss": 0.6569,
+ "step": 8092
+ },
+ {
+ "epoch": 22.05177111716621,
+ "grad_norm": 10.234100341796875,
+ "learning_rate": 1.8155946085543825e-05,
+ "loss": 0.6267,
+ "step": 8093
+ },
+ {
+ "epoch": 22.05449591280654,
+ "grad_norm": 9.198258399963379,
+ "learning_rate": 1.8155435421437202e-05,
+ "loss": 0.7501,
+ "step": 8094
+ },
+ {
+ "epoch": 22.057220708446867,
+ "grad_norm": 8.372624397277832,
+ "learning_rate": 1.8154924693816312e-05,
+ "loss": 0.783,
+ "step": 8095
+ },
+ {
+ "epoch": 22.059945504087192,
+ "grad_norm": 10.100859642028809,
+ "learning_rate": 1.8154413902685132e-05,
+ "loss": 0.6799,
+ "step": 8096
+ },
+ {
+ "epoch": 22.06267029972752,
+ "grad_norm": 8.656736373901367,
+ "learning_rate": 1.8153903048047636e-05,
+ "loss": 0.5563,
+ "step": 8097
+ },
+ {
+ "epoch": 22.065395095367847,
+ "grad_norm": 7.222809314727783,
+ "learning_rate": 1.815339212990781e-05,
+ "loss": 0.6029,
+ "step": 8098
+ },
+ {
+ "epoch": 22.068119891008173,
+ "grad_norm": 8.096519470214844,
+ "learning_rate": 1.8152881148269626e-05,
+ "loss": 0.7532,
+ "step": 8099
+ },
+ {
+ "epoch": 22.070844686648503,
+ "grad_norm": 8.562289237976074,
+ "learning_rate": 1.8152370103137063e-05,
+ "loss": 0.6422,
+ "step": 8100
+ },
+ {
+ "epoch": 22.07356948228883,
+ "grad_norm": 7.9341654777526855,
+ "learning_rate": 1.815185899451411e-05,
+ "loss": 0.876,
+ "step": 8101
+ },
+ {
+ "epoch": 22.076294277929154,
+ "grad_norm": 7.58868408203125,
+ "learning_rate": 1.8151347822404735e-05,
+ "loss": 0.6191,
+ "step": 8102
+ },
+ {
+ "epoch": 22.079019073569484,
+ "grad_norm": 10.293460845947266,
+ "learning_rate": 1.8150836586812927e-05,
+ "loss": 0.6768,
+ "step": 8103
+ },
+ {
+ "epoch": 22.08174386920981,
+ "grad_norm": 7.736724376678467,
+ "learning_rate": 1.815032528774267e-05,
+ "loss": 0.9154,
+ "step": 8104
+ },
+ {
+ "epoch": 22.084468664850135,
+ "grad_norm": 8.748819351196289,
+ "learning_rate": 1.814981392519794e-05,
+ "loss": 0.6484,
+ "step": 8105
+ },
+ {
+ "epoch": 22.087193460490465,
+ "grad_norm": 8.212860107421875,
+ "learning_rate": 1.814930249918272e-05,
+ "loss": 0.6599,
+ "step": 8106
+ },
+ {
+ "epoch": 22.08991825613079,
+ "grad_norm": 8.72126579284668,
+ "learning_rate": 1.8148791009700994e-05,
+ "loss": 0.6707,
+ "step": 8107
+ },
+ {
+ "epoch": 22.092643051771116,
+ "grad_norm": 8.394826889038086,
+ "learning_rate": 1.814827945675675e-05,
+ "loss": 0.6061,
+ "step": 8108
+ },
+ {
+ "epoch": 22.095367847411445,
+ "grad_norm": 7.980009078979492,
+ "learning_rate": 1.8147767840353966e-05,
+ "loss": 0.7402,
+ "step": 8109
+ },
+ {
+ "epoch": 22.09809264305177,
+ "grad_norm": 9.812178611755371,
+ "learning_rate": 1.8147256160496627e-05,
+ "loss": 0.7423,
+ "step": 8110
+ },
+ {
+ "epoch": 22.100817438692097,
+ "grad_norm": 8.119328498840332,
+ "learning_rate": 1.814674441718872e-05,
+ "loss": 0.5847,
+ "step": 8111
+ },
+ {
+ "epoch": 22.103542234332426,
+ "grad_norm": 9.668068885803223,
+ "learning_rate": 1.814623261043423e-05,
+ "loss": 0.717,
+ "step": 8112
+ },
+ {
+ "epoch": 22.106267029972752,
+ "grad_norm": 9.752023696899414,
+ "learning_rate": 1.8145720740237142e-05,
+ "loss": 0.6893,
+ "step": 8113
+ },
+ {
+ "epoch": 22.108991825613078,
+ "grad_norm": 9.450759887695312,
+ "learning_rate": 1.814520880660144e-05,
+ "loss": 0.7324,
+ "step": 8114
+ },
+ {
+ "epoch": 22.111716621253407,
+ "grad_norm": 10.053879737854004,
+ "learning_rate": 1.8144696809531117e-05,
+ "loss": 0.6709,
+ "step": 8115
+ },
+ {
+ "epoch": 22.114441416893733,
+ "grad_norm": 11.055795669555664,
+ "learning_rate": 1.814418474903016e-05,
+ "loss": 0.6781,
+ "step": 8116
+ },
+ {
+ "epoch": 22.11716621253406,
+ "grad_norm": 9.688031196594238,
+ "learning_rate": 1.814367262510255e-05,
+ "loss": 0.7238,
+ "step": 8117
+ },
+ {
+ "epoch": 22.11989100817439,
+ "grad_norm": 9.846515655517578,
+ "learning_rate": 1.8143160437752282e-05,
+ "loss": 0.661,
+ "step": 8118
+ },
+ {
+ "epoch": 22.122615803814714,
+ "grad_norm": 8.671991348266602,
+ "learning_rate": 1.8142648186983342e-05,
+ "loss": 0.6635,
+ "step": 8119
+ },
+ {
+ "epoch": 22.12534059945504,
+ "grad_norm": 7.699706554412842,
+ "learning_rate": 1.814213587279972e-05,
+ "loss": 0.4941,
+ "step": 8120
+ },
+ {
+ "epoch": 22.12806539509537,
+ "grad_norm": 10.536995887756348,
+ "learning_rate": 1.8141623495205407e-05,
+ "loss": 0.6252,
+ "step": 8121
+ },
+ {
+ "epoch": 22.130790190735695,
+ "grad_norm": 9.968353271484375,
+ "learning_rate": 1.814111105420439e-05,
+ "loss": 0.7587,
+ "step": 8122
+ },
+ {
+ "epoch": 22.13351498637602,
+ "grad_norm": 15.113749504089355,
+ "learning_rate": 1.8140598549800665e-05,
+ "loss": 0.7292,
+ "step": 8123
+ },
+ {
+ "epoch": 22.13623978201635,
+ "grad_norm": 10.22586727142334,
+ "learning_rate": 1.8140085981998217e-05,
+ "loss": 0.9756,
+ "step": 8124
+ },
+ {
+ "epoch": 22.138964577656676,
+ "grad_norm": 13.87658405303955,
+ "learning_rate": 1.8139573350801044e-05,
+ "loss": 0.6628,
+ "step": 8125
+ },
+ {
+ "epoch": 22.141689373297,
+ "grad_norm": 18.155254364013672,
+ "learning_rate": 1.8139060656213136e-05,
+ "loss": 0.7733,
+ "step": 8126
+ },
+ {
+ "epoch": 22.14441416893733,
+ "grad_norm": 7.1122636795043945,
+ "learning_rate": 1.8138547898238482e-05,
+ "loss": 0.7997,
+ "step": 8127
+ },
+ {
+ "epoch": 22.147138964577657,
+ "grad_norm": 7.740839004516602,
+ "learning_rate": 1.813803507688108e-05,
+ "loss": 0.688,
+ "step": 8128
+ },
+ {
+ "epoch": 22.149863760217983,
+ "grad_norm": 7.7154974937438965,
+ "learning_rate": 1.813752219214493e-05,
+ "loss": 0.5564,
+ "step": 8129
+ },
+ {
+ "epoch": 22.152588555858312,
+ "grad_norm": 15.014013290405273,
+ "learning_rate": 1.813700924403401e-05,
+ "loss": 0.8921,
+ "step": 8130
+ },
+ {
+ "epoch": 22.155313351498638,
+ "grad_norm": 6.617035388946533,
+ "learning_rate": 1.8136496232552327e-05,
+ "loss": 0.4835,
+ "step": 8131
+ },
+ {
+ "epoch": 22.158038147138964,
+ "grad_norm": 9.0719633102417,
+ "learning_rate": 1.8135983157703875e-05,
+ "loss": 0.5991,
+ "step": 8132
+ },
+ {
+ "epoch": 22.160762942779293,
+ "grad_norm": 8.152012825012207,
+ "learning_rate": 1.8135470019492645e-05,
+ "loss": 0.5002,
+ "step": 8133
+ },
+ {
+ "epoch": 22.16348773841962,
+ "grad_norm": 8.208850860595703,
+ "learning_rate": 1.813495681792264e-05,
+ "loss": 0.5294,
+ "step": 8134
+ },
+ {
+ "epoch": 22.166212534059945,
+ "grad_norm": 10.276405334472656,
+ "learning_rate": 1.8134443552997848e-05,
+ "loss": 0.5847,
+ "step": 8135
+ },
+ {
+ "epoch": 22.168937329700274,
+ "grad_norm": 9.390474319458008,
+ "learning_rate": 1.8133930224722274e-05,
+ "loss": 0.7382,
+ "step": 8136
+ },
+ {
+ "epoch": 22.1716621253406,
+ "grad_norm": 10.195333480834961,
+ "learning_rate": 1.813341683309991e-05,
+ "loss": 0.6446,
+ "step": 8137
+ },
+ {
+ "epoch": 22.174386920980925,
+ "grad_norm": 10.102724075317383,
+ "learning_rate": 1.8132903378134764e-05,
+ "loss": 0.693,
+ "step": 8138
+ },
+ {
+ "epoch": 22.177111716621255,
+ "grad_norm": 11.12580394744873,
+ "learning_rate": 1.8132389859830825e-05,
+ "loss": 0.7888,
+ "step": 8139
+ },
+ {
+ "epoch": 22.17983651226158,
+ "grad_norm": 8.86587142944336,
+ "learning_rate": 1.8131876278192097e-05,
+ "loss": 0.6686,
+ "step": 8140
+ },
+ {
+ "epoch": 22.182561307901906,
+ "grad_norm": 9.61230754852295,
+ "learning_rate": 1.8131362633222577e-05,
+ "loss": 0.7871,
+ "step": 8141
+ },
+ {
+ "epoch": 22.185286103542236,
+ "grad_norm": 8.075401306152344,
+ "learning_rate": 1.8130848924926264e-05,
+ "loss": 0.7047,
+ "step": 8142
+ },
+ {
+ "epoch": 22.18801089918256,
+ "grad_norm": 13.674467086791992,
+ "learning_rate": 1.8130335153307167e-05,
+ "loss": 0.6346,
+ "step": 8143
+ },
+ {
+ "epoch": 22.190735694822887,
+ "grad_norm": 7.627383708953857,
+ "learning_rate": 1.8129821318369278e-05,
+ "loss": 0.5735,
+ "step": 8144
+ },
+ {
+ "epoch": 22.193460490463217,
+ "grad_norm": 9.116448402404785,
+ "learning_rate": 1.81293074201166e-05,
+ "loss": 0.6015,
+ "step": 8145
+ },
+ {
+ "epoch": 22.196185286103542,
+ "grad_norm": 10.330015182495117,
+ "learning_rate": 1.812879345855314e-05,
+ "loss": 0.6343,
+ "step": 8146
+ },
+ {
+ "epoch": 22.19891008174387,
+ "grad_norm": 12.202704429626465,
+ "learning_rate": 1.8128279433682898e-05,
+ "loss": 0.6803,
+ "step": 8147
+ },
+ {
+ "epoch": 22.201634877384198,
+ "grad_norm": 9.495345115661621,
+ "learning_rate": 1.812776534550988e-05,
+ "loss": 0.7317,
+ "step": 8148
+ },
+ {
+ "epoch": 22.204359673024523,
+ "grad_norm": 10.337039947509766,
+ "learning_rate": 1.812725119403808e-05,
+ "loss": 0.7294,
+ "step": 8149
+ },
+ {
+ "epoch": 22.20708446866485,
+ "grad_norm": 9.894977569580078,
+ "learning_rate": 1.8126736979271516e-05,
+ "loss": 0.7222,
+ "step": 8150
+ },
+ {
+ "epoch": 22.20980926430518,
+ "grad_norm": 8.29999828338623,
+ "learning_rate": 1.8126222701214185e-05,
+ "loss": 0.7822,
+ "step": 8151
+ },
+ {
+ "epoch": 22.212534059945504,
+ "grad_norm": 8.871851921081543,
+ "learning_rate": 1.812570835987009e-05,
+ "loss": 0.7723,
+ "step": 8152
+ },
+ {
+ "epoch": 22.21525885558583,
+ "grad_norm": 10.580748558044434,
+ "learning_rate": 1.8125193955243244e-05,
+ "loss": 0.8129,
+ "step": 8153
+ },
+ {
+ "epoch": 22.21798365122616,
+ "grad_norm": 11.675036430358887,
+ "learning_rate": 1.8124679487337647e-05,
+ "loss": 0.782,
+ "step": 8154
+ },
+ {
+ "epoch": 22.220708446866485,
+ "grad_norm": 8.933625221252441,
+ "learning_rate": 1.8124164956157306e-05,
+ "loss": 0.5898,
+ "step": 8155
+ },
+ {
+ "epoch": 22.22343324250681,
+ "grad_norm": 7.400137901306152,
+ "learning_rate": 1.8123650361706234e-05,
+ "loss": 0.5396,
+ "step": 8156
+ },
+ {
+ "epoch": 22.22615803814714,
+ "grad_norm": 9.74735164642334,
+ "learning_rate": 1.812313570398843e-05,
+ "loss": 0.8325,
+ "step": 8157
+ },
+ {
+ "epoch": 22.228882833787466,
+ "grad_norm": 7.880486011505127,
+ "learning_rate": 1.8122620983007908e-05,
+ "loss": 0.6642,
+ "step": 8158
+ },
+ {
+ "epoch": 22.231607629427792,
+ "grad_norm": 12.720961570739746,
+ "learning_rate": 1.8122106198768675e-05,
+ "loss": 0.6642,
+ "step": 8159
+ },
+ {
+ "epoch": 22.23433242506812,
+ "grad_norm": 16.37128448486328,
+ "learning_rate": 1.8121591351274743e-05,
+ "loss": 0.6898,
+ "step": 8160
+ },
+ {
+ "epoch": 22.237057220708447,
+ "grad_norm": 7.74159574508667,
+ "learning_rate": 1.8121076440530116e-05,
+ "loss": 0.7014,
+ "step": 8161
+ },
+ {
+ "epoch": 22.239782016348773,
+ "grad_norm": 10.525813102722168,
+ "learning_rate": 1.8120561466538806e-05,
+ "loss": 0.6607,
+ "step": 8162
+ },
+ {
+ "epoch": 22.242506811989102,
+ "grad_norm": 8.556599617004395,
+ "learning_rate": 1.8120046429304828e-05,
+ "loss": 0.6026,
+ "step": 8163
+ },
+ {
+ "epoch": 22.245231607629428,
+ "grad_norm": 10.699475288391113,
+ "learning_rate": 1.8119531328832186e-05,
+ "loss": 0.7379,
+ "step": 8164
+ },
+ {
+ "epoch": 22.247956403269754,
+ "grad_norm": 10.441765785217285,
+ "learning_rate": 1.81190161651249e-05,
+ "loss": 0.6156,
+ "step": 8165
+ },
+ {
+ "epoch": 22.250681198910083,
+ "grad_norm": 7.536591529846191,
+ "learning_rate": 1.811850093818697e-05,
+ "loss": 0.5994,
+ "step": 8166
+ },
+ {
+ "epoch": 22.25340599455041,
+ "grad_norm": 7.260444164276123,
+ "learning_rate": 1.811798564802242e-05,
+ "loss": 0.7764,
+ "step": 8167
+ },
+ {
+ "epoch": 22.256130790190735,
+ "grad_norm": 8.492497444152832,
+ "learning_rate": 1.8117470294635263e-05,
+ "loss": 0.6183,
+ "step": 8168
+ },
+ {
+ "epoch": 22.258855585831064,
+ "grad_norm": 8.711894035339355,
+ "learning_rate": 1.8116954878029505e-05,
+ "loss": 0.748,
+ "step": 8169
+ },
+ {
+ "epoch": 22.26158038147139,
+ "grad_norm": 12.734328269958496,
+ "learning_rate": 1.8116439398209164e-05,
+ "loss": 0.6395,
+ "step": 8170
+ },
+ {
+ "epoch": 22.264305177111716,
+ "grad_norm": 8.598809242248535,
+ "learning_rate": 1.8115923855178253e-05,
+ "loss": 0.5896,
+ "step": 8171
+ },
+ {
+ "epoch": 22.267029972752045,
+ "grad_norm": 7.421351432800293,
+ "learning_rate": 1.8115408248940792e-05,
+ "loss": 0.5556,
+ "step": 8172
+ },
+ {
+ "epoch": 22.26975476839237,
+ "grad_norm": 14.382796287536621,
+ "learning_rate": 1.8114892579500792e-05,
+ "loss": 0.7145,
+ "step": 8173
+ },
+ {
+ "epoch": 22.272479564032697,
+ "grad_norm": 7.493317127227783,
+ "learning_rate": 1.811437684686227e-05,
+ "loss": 0.6122,
+ "step": 8174
+ },
+ {
+ "epoch": 22.275204359673026,
+ "grad_norm": 10.393016815185547,
+ "learning_rate": 1.8113861051029235e-05,
+ "loss": 0.7552,
+ "step": 8175
+ },
+ {
+ "epoch": 22.277929155313352,
+ "grad_norm": 8.7063570022583,
+ "learning_rate": 1.8113345192005718e-05,
+ "loss": 0.6884,
+ "step": 8176
+ },
+ {
+ "epoch": 22.280653950953678,
+ "grad_norm": 8.036070823669434,
+ "learning_rate": 1.8112829269795728e-05,
+ "loss": 0.6925,
+ "step": 8177
+ },
+ {
+ "epoch": 22.283378746594007,
+ "grad_norm": 8.267637252807617,
+ "learning_rate": 1.8112313284403287e-05,
+ "loss": 0.6825,
+ "step": 8178
+ },
+ {
+ "epoch": 22.286103542234333,
+ "grad_norm": 8.847068786621094,
+ "learning_rate": 1.8111797235832407e-05,
+ "loss": 0.584,
+ "step": 8179
+ },
+ {
+ "epoch": 22.28882833787466,
+ "grad_norm": 8.622603416442871,
+ "learning_rate": 1.8111281124087113e-05,
+ "loss": 0.9071,
+ "step": 8180
+ },
+ {
+ "epoch": 22.291553133514988,
+ "grad_norm": 9.915871620178223,
+ "learning_rate": 1.8110764949171423e-05,
+ "loss": 0.7716,
+ "step": 8181
+ },
+ {
+ "epoch": 22.294277929155314,
+ "grad_norm": 10.577964782714844,
+ "learning_rate": 1.811024871108936e-05,
+ "loss": 0.6343,
+ "step": 8182
+ },
+ {
+ "epoch": 22.29700272479564,
+ "grad_norm": 7.768617153167725,
+ "learning_rate": 1.8109732409844936e-05,
+ "loss": 0.787,
+ "step": 8183
+ },
+ {
+ "epoch": 22.29972752043597,
+ "grad_norm": 7.035017967224121,
+ "learning_rate": 1.810921604544218e-05,
+ "loss": 0.6422,
+ "step": 8184
+ },
+ {
+ "epoch": 22.302452316076295,
+ "grad_norm": 8.015909194946289,
+ "learning_rate": 1.810869961788511e-05,
+ "loss": 0.6508,
+ "step": 8185
+ },
+ {
+ "epoch": 22.30517711171662,
+ "grad_norm": 8.814335823059082,
+ "learning_rate": 1.810818312717775e-05,
+ "loss": 0.637,
+ "step": 8186
+ },
+ {
+ "epoch": 22.30790190735695,
+ "grad_norm": 14.538896560668945,
+ "learning_rate": 1.8107666573324113e-05,
+ "loss": 0.9564,
+ "step": 8187
+ },
+ {
+ "epoch": 22.310626702997276,
+ "grad_norm": 7.954617023468018,
+ "learning_rate": 1.810714995632824e-05,
+ "loss": 0.7405,
+ "step": 8188
+ },
+ {
+ "epoch": 22.3133514986376,
+ "grad_norm": 6.726071834564209,
+ "learning_rate": 1.8106633276194138e-05,
+ "loss": 0.5693,
+ "step": 8189
+ },
+ {
+ "epoch": 22.31607629427793,
+ "grad_norm": 7.355459690093994,
+ "learning_rate": 1.8106116532925835e-05,
+ "loss": 0.7271,
+ "step": 8190
+ },
+ {
+ "epoch": 22.318801089918257,
+ "grad_norm": 6.360330581665039,
+ "learning_rate": 1.8105599726527364e-05,
+ "loss": 0.7659,
+ "step": 8191
+ },
+ {
+ "epoch": 22.321525885558582,
+ "grad_norm": 10.908573150634766,
+ "learning_rate": 1.810508285700274e-05,
+ "loss": 0.6515,
+ "step": 8192
+ },
+ {
+ "epoch": 22.32425068119891,
+ "grad_norm": 9.36457347869873,
+ "learning_rate": 1.8104565924355987e-05,
+ "loss": 0.6348,
+ "step": 8193
+ },
+ {
+ "epoch": 22.326975476839237,
+ "grad_norm": 8.57176685333252,
+ "learning_rate": 1.810404892859114e-05,
+ "loss": 0.7372,
+ "step": 8194
+ },
+ {
+ "epoch": 22.329700272479563,
+ "grad_norm": 8.153583526611328,
+ "learning_rate": 1.8103531869712222e-05,
+ "loss": 0.6459,
+ "step": 8195
+ },
+ {
+ "epoch": 22.332425068119893,
+ "grad_norm": 8.096521377563477,
+ "learning_rate": 1.8103014747723258e-05,
+ "loss": 0.7163,
+ "step": 8196
+ },
+ {
+ "epoch": 22.33514986376022,
+ "grad_norm": 8.034278869628906,
+ "learning_rate": 1.8102497562628272e-05,
+ "loss": 0.7621,
+ "step": 8197
+ },
+ {
+ "epoch": 22.337874659400544,
+ "grad_norm": 10.737513542175293,
+ "learning_rate": 1.81019803144313e-05,
+ "loss": 0.7793,
+ "step": 8198
+ },
+ {
+ "epoch": 22.340599455040874,
+ "grad_norm": 9.598867416381836,
+ "learning_rate": 1.8101463003136365e-05,
+ "loss": 0.6896,
+ "step": 8199
+ },
+ {
+ "epoch": 22.3433242506812,
+ "grad_norm": 8.55178451538086,
+ "learning_rate": 1.81009456287475e-05,
+ "loss": 0.6556,
+ "step": 8200
+ },
+ {
+ "epoch": 22.346049046321525,
+ "grad_norm": 9.146363258361816,
+ "learning_rate": 1.8100428191268724e-05,
+ "loss": 0.6005,
+ "step": 8201
+ },
+ {
+ "epoch": 22.348773841961854,
+ "grad_norm": 7.098503112792969,
+ "learning_rate": 1.809991069070408e-05,
+ "loss": 0.8154,
+ "step": 8202
+ },
+ {
+ "epoch": 22.35149863760218,
+ "grad_norm": 14.414313316345215,
+ "learning_rate": 1.809939312705759e-05,
+ "loss": 0.6385,
+ "step": 8203
+ },
+ {
+ "epoch": 22.354223433242506,
+ "grad_norm": 8.21053409576416,
+ "learning_rate": 1.8098875500333287e-05,
+ "loss": 0.8989,
+ "step": 8204
+ },
+ {
+ "epoch": 22.356948228882835,
+ "grad_norm": 7.663893222808838,
+ "learning_rate": 1.8098357810535204e-05,
+ "loss": 0.6729,
+ "step": 8205
+ },
+ {
+ "epoch": 22.35967302452316,
+ "grad_norm": 7.619863033294678,
+ "learning_rate": 1.8097840057667366e-05,
+ "loss": 0.6927,
+ "step": 8206
+ },
+ {
+ "epoch": 22.362397820163487,
+ "grad_norm": 9.250384330749512,
+ "learning_rate": 1.8097322241733815e-05,
+ "loss": 0.5206,
+ "step": 8207
+ },
+ {
+ "epoch": 22.365122615803816,
+ "grad_norm": 7.354512691497803,
+ "learning_rate": 1.8096804362738577e-05,
+ "loss": 0.8595,
+ "step": 8208
+ },
+ {
+ "epoch": 22.367847411444142,
+ "grad_norm": 7.876550674438477,
+ "learning_rate": 1.809628642068569e-05,
+ "loss": 0.7395,
+ "step": 8209
+ },
+ {
+ "epoch": 22.370572207084468,
+ "grad_norm": 9.378175735473633,
+ "learning_rate": 1.809576841557918e-05,
+ "loss": 0.6779,
+ "step": 8210
+ },
+ {
+ "epoch": 22.373297002724797,
+ "grad_norm": 8.54090404510498,
+ "learning_rate": 1.809525034742309e-05,
+ "loss": 0.8472,
+ "step": 8211
+ },
+ {
+ "epoch": 22.376021798365123,
+ "grad_norm": 9.159504890441895,
+ "learning_rate": 1.809473221622145e-05,
+ "loss": 0.7279,
+ "step": 8212
+ },
+ {
+ "epoch": 22.37874659400545,
+ "grad_norm": 7.7075300216674805,
+ "learning_rate": 1.8094214021978295e-05,
+ "loss": 0.598,
+ "step": 8213
+ },
+ {
+ "epoch": 22.381471389645778,
+ "grad_norm": 12.308601379394531,
+ "learning_rate": 1.8093695764697664e-05,
+ "loss": 0.6523,
+ "step": 8214
+ },
+ {
+ "epoch": 22.384196185286104,
+ "grad_norm": 7.844625949859619,
+ "learning_rate": 1.8093177444383586e-05,
+ "loss": 0.9073,
+ "step": 8215
+ },
+ {
+ "epoch": 22.38692098092643,
+ "grad_norm": 7.515353679656982,
+ "learning_rate": 1.809265906104011e-05,
+ "loss": 0.8254,
+ "step": 8216
+ },
+ {
+ "epoch": 22.38964577656676,
+ "grad_norm": 8.23155403137207,
+ "learning_rate": 1.809214061467126e-05,
+ "loss": 0.5969,
+ "step": 8217
+ },
+ {
+ "epoch": 22.392370572207085,
+ "grad_norm": 8.199894905090332,
+ "learning_rate": 1.809162210528108e-05,
+ "loss": 0.7928,
+ "step": 8218
+ },
+ {
+ "epoch": 22.39509536784741,
+ "grad_norm": 7.663973808288574,
+ "learning_rate": 1.809110353287361e-05,
+ "loss": 0.7141,
+ "step": 8219
+ },
+ {
+ "epoch": 22.39782016348774,
+ "grad_norm": 10.365224838256836,
+ "learning_rate": 1.8090584897452884e-05,
+ "loss": 0.6886,
+ "step": 8220
+ },
+ {
+ "epoch": 22.400544959128066,
+ "grad_norm": 12.609064102172852,
+ "learning_rate": 1.8090066199022946e-05,
+ "loss": 0.7184,
+ "step": 8221
+ },
+ {
+ "epoch": 22.40326975476839,
+ "grad_norm": 7.5562615394592285,
+ "learning_rate": 1.8089547437587828e-05,
+ "loss": 0.6334,
+ "step": 8222
+ },
+ {
+ "epoch": 22.40599455040872,
+ "grad_norm": 7.856863021850586,
+ "learning_rate": 1.8089028613151578e-05,
+ "loss": 0.5431,
+ "step": 8223
+ },
+ {
+ "epoch": 22.408719346049047,
+ "grad_norm": 9.362018585205078,
+ "learning_rate": 1.808850972571823e-05,
+ "loss": 0.6707,
+ "step": 8224
+ },
+ {
+ "epoch": 22.411444141689373,
+ "grad_norm": 7.5704731941223145,
+ "learning_rate": 1.8087990775291835e-05,
+ "loss": 0.8016,
+ "step": 8225
+ },
+ {
+ "epoch": 22.414168937329702,
+ "grad_norm": 14.33726978302002,
+ "learning_rate": 1.8087471761876425e-05,
+ "loss": 0.9342,
+ "step": 8226
+ },
+ {
+ "epoch": 22.416893732970028,
+ "grad_norm": 9.47899341583252,
+ "learning_rate": 1.8086952685476046e-05,
+ "loss": 0.6818,
+ "step": 8227
+ },
+ {
+ "epoch": 22.419618528610354,
+ "grad_norm": 8.469098091125488,
+ "learning_rate": 1.808643354609474e-05,
+ "loss": 0.5687,
+ "step": 8228
+ },
+ {
+ "epoch": 22.422343324250683,
+ "grad_norm": 7.910406589508057,
+ "learning_rate": 1.8085914343736545e-05,
+ "loss": 0.696,
+ "step": 8229
+ },
+ {
+ "epoch": 22.42506811989101,
+ "grad_norm": 8.005192756652832,
+ "learning_rate": 1.8085395078405514e-05,
+ "loss": 0.6208,
+ "step": 8230
+ },
+ {
+ "epoch": 22.427792915531334,
+ "grad_norm": 13.900349617004395,
+ "learning_rate": 1.8084875750105685e-05,
+ "loss": 0.6278,
+ "step": 8231
+ },
+ {
+ "epoch": 22.430517711171664,
+ "grad_norm": 8.031730651855469,
+ "learning_rate": 1.8084356358841106e-05,
+ "loss": 0.6943,
+ "step": 8232
+ },
+ {
+ "epoch": 22.43324250681199,
+ "grad_norm": 8.470152854919434,
+ "learning_rate": 1.8083836904615815e-05,
+ "loss": 0.5541,
+ "step": 8233
+ },
+ {
+ "epoch": 22.435967302452315,
+ "grad_norm": 9.42927074432373,
+ "learning_rate": 1.8083317387433866e-05,
+ "loss": 0.5667,
+ "step": 8234
+ },
+ {
+ "epoch": 22.438692098092645,
+ "grad_norm": 10.382102966308594,
+ "learning_rate": 1.80827978072993e-05,
+ "loss": 0.7693,
+ "step": 8235
+ },
+ {
+ "epoch": 22.44141689373297,
+ "grad_norm": 9.156529426574707,
+ "learning_rate": 1.8082278164216166e-05,
+ "loss": 0.875,
+ "step": 8236
+ },
+ {
+ "epoch": 22.444141689373296,
+ "grad_norm": 9.471755027770996,
+ "learning_rate": 1.808175845818851e-05,
+ "loss": 0.8351,
+ "step": 8237
+ },
+ {
+ "epoch": 22.446866485013626,
+ "grad_norm": 10.10020637512207,
+ "learning_rate": 1.808123868922038e-05,
+ "loss": 0.6541,
+ "step": 8238
+ },
+ {
+ "epoch": 22.44959128065395,
+ "grad_norm": 8.335165977478027,
+ "learning_rate": 1.808071885731582e-05,
+ "loss": 0.7588,
+ "step": 8239
+ },
+ {
+ "epoch": 22.452316076294277,
+ "grad_norm": 7.9259161949157715,
+ "learning_rate": 1.8080198962478884e-05,
+ "loss": 0.6415,
+ "step": 8240
+ },
+ {
+ "epoch": 22.455040871934607,
+ "grad_norm": 20.179035186767578,
+ "learning_rate": 1.8079679004713618e-05,
+ "loss": 0.6896,
+ "step": 8241
+ },
+ {
+ "epoch": 22.457765667574932,
+ "grad_norm": 10.354724884033203,
+ "learning_rate": 1.8079158984024073e-05,
+ "loss": 0.7043,
+ "step": 8242
+ },
+ {
+ "epoch": 22.460490463215258,
+ "grad_norm": 8.078150749206543,
+ "learning_rate": 1.8078638900414292e-05,
+ "loss": 0.8281,
+ "step": 8243
+ },
+ {
+ "epoch": 22.463215258855588,
+ "grad_norm": 10.773573875427246,
+ "learning_rate": 1.8078118753888337e-05,
+ "loss": 0.679,
+ "step": 8244
+ },
+ {
+ "epoch": 22.465940054495913,
+ "grad_norm": 6.376916885375977,
+ "learning_rate": 1.8077598544450253e-05,
+ "loss": 0.5781,
+ "step": 8245
+ },
+ {
+ "epoch": 22.46866485013624,
+ "grad_norm": 7.432671546936035,
+ "learning_rate": 1.8077078272104093e-05,
+ "loss": 0.7159,
+ "step": 8246
+ },
+ {
+ "epoch": 22.47138964577657,
+ "grad_norm": 8.190813064575195,
+ "learning_rate": 1.8076557936853905e-05,
+ "loss": 0.6945,
+ "step": 8247
+ },
+ {
+ "epoch": 22.474114441416894,
+ "grad_norm": 7.159677982330322,
+ "learning_rate": 1.807603753870374e-05,
+ "loss": 0.5876,
+ "step": 8248
+ },
+ {
+ "epoch": 22.47683923705722,
+ "grad_norm": 22.71761131286621,
+ "learning_rate": 1.807551707765766e-05,
+ "loss": 0.7416,
+ "step": 8249
+ },
+ {
+ "epoch": 22.479564032697546,
+ "grad_norm": 9.451669692993164,
+ "learning_rate": 1.807499655371971e-05,
+ "loss": 0.6469,
+ "step": 8250
+ },
+ {
+ "epoch": 22.482288828337875,
+ "grad_norm": 8.264025688171387,
+ "learning_rate": 1.807447596689395e-05,
+ "loss": 0.587,
+ "step": 8251
+ },
+ {
+ "epoch": 22.4850136239782,
+ "grad_norm": 8.693696022033691,
+ "learning_rate": 1.807395531718443e-05,
+ "loss": 0.5808,
+ "step": 8252
+ },
+ {
+ "epoch": 22.48773841961853,
+ "grad_norm": 8.700834274291992,
+ "learning_rate": 1.8073434604595203e-05,
+ "loss": 0.7067,
+ "step": 8253
+ },
+ {
+ "epoch": 22.490463215258856,
+ "grad_norm": 7.785550117492676,
+ "learning_rate": 1.8072913829130326e-05,
+ "loss": 0.7192,
+ "step": 8254
+ },
+ {
+ "epoch": 22.493188010899182,
+ "grad_norm": 8.362305641174316,
+ "learning_rate": 1.8072392990793864e-05,
+ "loss": 0.589,
+ "step": 8255
+ },
+ {
+ "epoch": 22.495912806539508,
+ "grad_norm": 8.484654426574707,
+ "learning_rate": 1.8071872089589857e-05,
+ "loss": 0.5781,
+ "step": 8256
+ },
+ {
+ "epoch": 22.498637602179837,
+ "grad_norm": 10.331132888793945,
+ "learning_rate": 1.8071351125522372e-05,
+ "loss": 0.6402,
+ "step": 8257
+ },
+ {
+ "epoch": 22.501362397820163,
+ "grad_norm": 8.756699562072754,
+ "learning_rate": 1.8070830098595467e-05,
+ "loss": 0.5598,
+ "step": 8258
+ },
+ {
+ "epoch": 22.504087193460492,
+ "grad_norm": 34.18621826171875,
+ "learning_rate": 1.8070309008813195e-05,
+ "loss": 0.8003,
+ "step": 8259
+ },
+ {
+ "epoch": 22.506811989100818,
+ "grad_norm": 8.338065147399902,
+ "learning_rate": 1.8069787856179618e-05,
+ "loss": 0.7378,
+ "step": 8260
+ },
+ {
+ "epoch": 22.509536784741144,
+ "grad_norm": 8.108210563659668,
+ "learning_rate": 1.806926664069879e-05,
+ "loss": 0.6598,
+ "step": 8261
+ },
+ {
+ "epoch": 22.51226158038147,
+ "grad_norm": 8.238025665283203,
+ "learning_rate": 1.8068745362374774e-05,
+ "loss": 0.6777,
+ "step": 8262
+ },
+ {
+ "epoch": 22.5149863760218,
+ "grad_norm": 9.277074813842773,
+ "learning_rate": 1.806822402121163e-05,
+ "loss": 0.7857,
+ "step": 8263
+ },
+ {
+ "epoch": 22.517711171662125,
+ "grad_norm": 8.868127822875977,
+ "learning_rate": 1.8067702617213415e-05,
+ "loss": 0.6467,
+ "step": 8264
+ },
+ {
+ "epoch": 22.520435967302454,
+ "grad_norm": 8.341856956481934,
+ "learning_rate": 1.8067181150384195e-05,
+ "loss": 0.7299,
+ "step": 8265
+ },
+ {
+ "epoch": 22.52316076294278,
+ "grad_norm": 9.665529251098633,
+ "learning_rate": 1.8066659620728023e-05,
+ "loss": 0.7332,
+ "step": 8266
+ },
+ {
+ "epoch": 22.525885558583106,
+ "grad_norm": 9.782292366027832,
+ "learning_rate": 1.806613802824897e-05,
+ "loss": 0.6966,
+ "step": 8267
+ },
+ {
+ "epoch": 22.52861035422343,
+ "grad_norm": 8.606857299804688,
+ "learning_rate": 1.8065616372951093e-05,
+ "loss": 0.722,
+ "step": 8268
+ },
+ {
+ "epoch": 22.53133514986376,
+ "grad_norm": 11.900496482849121,
+ "learning_rate": 1.8065094654838452e-05,
+ "loss": 0.8167,
+ "step": 8269
+ },
+ {
+ "epoch": 22.534059945504087,
+ "grad_norm": 8.272493362426758,
+ "learning_rate": 1.8064572873915117e-05,
+ "loss": 0.5896,
+ "step": 8270
+ },
+ {
+ "epoch": 22.536784741144416,
+ "grad_norm": 8.059184074401855,
+ "learning_rate": 1.8064051030185145e-05,
+ "loss": 1.0009,
+ "step": 8271
+ },
+ {
+ "epoch": 22.539509536784742,
+ "grad_norm": 8.604249000549316,
+ "learning_rate": 1.8063529123652604e-05,
+ "loss": 0.662,
+ "step": 8272
+ },
+ {
+ "epoch": 22.542234332425068,
+ "grad_norm": 7.399803638458252,
+ "learning_rate": 1.8063007154321558e-05,
+ "loss": 0.6537,
+ "step": 8273
+ },
+ {
+ "epoch": 22.544959128065393,
+ "grad_norm": 8.598675727844238,
+ "learning_rate": 1.8062485122196074e-05,
+ "loss": 0.7892,
+ "step": 8274
+ },
+ {
+ "epoch": 22.547683923705723,
+ "grad_norm": 7.8193583488464355,
+ "learning_rate": 1.806196302728021e-05,
+ "loss": 0.8136,
+ "step": 8275
+ },
+ {
+ "epoch": 22.55040871934605,
+ "grad_norm": 9.113085746765137,
+ "learning_rate": 1.8061440869578043e-05,
+ "loss": 0.699,
+ "step": 8276
+ },
+ {
+ "epoch": 22.553133514986374,
+ "grad_norm": 8.494874954223633,
+ "learning_rate": 1.8060918649093634e-05,
+ "loss": 0.6088,
+ "step": 8277
+ },
+ {
+ "epoch": 22.555858310626704,
+ "grad_norm": 8.600625038146973,
+ "learning_rate": 1.8060396365831046e-05,
+ "loss": 0.6802,
+ "step": 8278
+ },
+ {
+ "epoch": 22.55858310626703,
+ "grad_norm": 8.80474853515625,
+ "learning_rate": 1.8059874019794352e-05,
+ "loss": 0.6677,
+ "step": 8279
+ },
+ {
+ "epoch": 22.561307901907355,
+ "grad_norm": 8.594862937927246,
+ "learning_rate": 1.8059351610987617e-05,
+ "loss": 0.8966,
+ "step": 8280
+ },
+ {
+ "epoch": 22.564032697547685,
+ "grad_norm": 9.526464462280273,
+ "learning_rate": 1.8058829139414915e-05,
+ "loss": 0.6548,
+ "step": 8281
+ },
+ {
+ "epoch": 22.56675749318801,
+ "grad_norm": 8.03078842163086,
+ "learning_rate": 1.805830660508031e-05,
+ "loss": 0.7498,
+ "step": 8282
+ },
+ {
+ "epoch": 22.569482288828336,
+ "grad_norm": 9.00503921508789,
+ "learning_rate": 1.805778400798787e-05,
+ "loss": 0.7373,
+ "step": 8283
+ },
+ {
+ "epoch": 22.572207084468666,
+ "grad_norm": 11.846492767333984,
+ "learning_rate": 1.805726134814167e-05,
+ "loss": 0.8224,
+ "step": 8284
+ },
+ {
+ "epoch": 22.57493188010899,
+ "grad_norm": 8.72476577758789,
+ "learning_rate": 1.8056738625545778e-05,
+ "loss": 0.6932,
+ "step": 8285
+ },
+ {
+ "epoch": 22.577656675749317,
+ "grad_norm": 6.827003479003906,
+ "learning_rate": 1.8056215840204262e-05,
+ "loss": 0.6933,
+ "step": 8286
+ },
+ {
+ "epoch": 22.580381471389646,
+ "grad_norm": 7.064388275146484,
+ "learning_rate": 1.80556929921212e-05,
+ "loss": 0.6964,
+ "step": 8287
+ },
+ {
+ "epoch": 22.583106267029972,
+ "grad_norm": 7.903183460235596,
+ "learning_rate": 1.8055170081300656e-05,
+ "loss": 0.5508,
+ "step": 8288
+ },
+ {
+ "epoch": 22.585831062670298,
+ "grad_norm": 9.286689758300781,
+ "learning_rate": 1.805464710774671e-05,
+ "loss": 0.8115,
+ "step": 8289
+ },
+ {
+ "epoch": 22.588555858310627,
+ "grad_norm": 12.02190113067627,
+ "learning_rate": 1.805412407146343e-05,
+ "loss": 0.7172,
+ "step": 8290
+ },
+ {
+ "epoch": 22.591280653950953,
+ "grad_norm": 6.979458332061768,
+ "learning_rate": 1.805360097245489e-05,
+ "loss": 0.6827,
+ "step": 8291
+ },
+ {
+ "epoch": 22.59400544959128,
+ "grad_norm": 8.05056381225586,
+ "learning_rate": 1.8053077810725167e-05,
+ "loss": 0.7211,
+ "step": 8292
+ },
+ {
+ "epoch": 22.59673024523161,
+ "grad_norm": 42.04249954223633,
+ "learning_rate": 1.8052554586278335e-05,
+ "loss": 0.6968,
+ "step": 8293
+ },
+ {
+ "epoch": 22.599455040871934,
+ "grad_norm": 9.809717178344727,
+ "learning_rate": 1.8052031299118465e-05,
+ "loss": 0.6751,
+ "step": 8294
+ },
+ {
+ "epoch": 22.60217983651226,
+ "grad_norm": 10.563461303710938,
+ "learning_rate": 1.805150794924963e-05,
+ "loss": 0.8352,
+ "step": 8295
+ },
+ {
+ "epoch": 22.60490463215259,
+ "grad_norm": 10.033594131469727,
+ "learning_rate": 1.8050984536675918e-05,
+ "loss": 0.7987,
+ "step": 8296
+ },
+ {
+ "epoch": 22.607629427792915,
+ "grad_norm": 8.315168380737305,
+ "learning_rate": 1.8050461061401394e-05,
+ "loss": 0.7013,
+ "step": 8297
+ },
+ {
+ "epoch": 22.61035422343324,
+ "grad_norm": 12.972036361694336,
+ "learning_rate": 1.8049937523430138e-05,
+ "loss": 0.7091,
+ "step": 8298
+ },
+ {
+ "epoch": 22.61307901907357,
+ "grad_norm": 9.643797874450684,
+ "learning_rate": 1.8049413922766227e-05,
+ "loss": 0.7911,
+ "step": 8299
+ },
+ {
+ "epoch": 22.615803814713896,
+ "grad_norm": 9.095795631408691,
+ "learning_rate": 1.804889025941374e-05,
+ "loss": 0.6661,
+ "step": 8300
+ },
+ {
+ "epoch": 22.618528610354222,
+ "grad_norm": 9.258108139038086,
+ "learning_rate": 1.8048366533376754e-05,
+ "loss": 0.6235,
+ "step": 8301
+ },
+ {
+ "epoch": 22.62125340599455,
+ "grad_norm": 9.524581909179688,
+ "learning_rate": 1.804784274465935e-05,
+ "loss": 0.8983,
+ "step": 8302
+ },
+ {
+ "epoch": 22.623978201634877,
+ "grad_norm": 10.910232543945312,
+ "learning_rate": 1.8047318893265606e-05,
+ "loss": 0.6393,
+ "step": 8303
+ },
+ {
+ "epoch": 22.626702997275203,
+ "grad_norm": 11.33791732788086,
+ "learning_rate": 1.80467949791996e-05,
+ "loss": 0.7798,
+ "step": 8304
+ },
+ {
+ "epoch": 22.629427792915532,
+ "grad_norm": 8.183943748474121,
+ "learning_rate": 1.8046271002465416e-05,
+ "loss": 0.7988,
+ "step": 8305
+ },
+ {
+ "epoch": 22.632152588555858,
+ "grad_norm": 9.401528358459473,
+ "learning_rate": 1.804574696306713e-05,
+ "loss": 0.7225,
+ "step": 8306
+ },
+ {
+ "epoch": 22.634877384196184,
+ "grad_norm": 9.101771354675293,
+ "learning_rate": 1.8045222861008826e-05,
+ "loss": 0.584,
+ "step": 8307
+ },
+ {
+ "epoch": 22.637602179836513,
+ "grad_norm": 8.446800231933594,
+ "learning_rate": 1.8044698696294586e-05,
+ "loss": 0.6541,
+ "step": 8308
+ },
+ {
+ "epoch": 22.64032697547684,
+ "grad_norm": 10.920446395874023,
+ "learning_rate": 1.804417446892849e-05,
+ "loss": 0.6578,
+ "step": 8309
+ },
+ {
+ "epoch": 22.643051771117165,
+ "grad_norm": 9.614753723144531,
+ "learning_rate": 1.8043650178914624e-05,
+ "loss": 0.7683,
+ "step": 8310
+ },
+ {
+ "epoch": 22.645776566757494,
+ "grad_norm": 9.82983684539795,
+ "learning_rate": 1.8043125826257067e-05,
+ "loss": 0.7668,
+ "step": 8311
+ },
+ {
+ "epoch": 22.64850136239782,
+ "grad_norm": 8.423670768737793,
+ "learning_rate": 1.8042601410959907e-05,
+ "loss": 0.8746,
+ "step": 8312
+ },
+ {
+ "epoch": 22.651226158038146,
+ "grad_norm": 8.503253936767578,
+ "learning_rate": 1.8042076933027228e-05,
+ "loss": 0.6849,
+ "step": 8313
+ },
+ {
+ "epoch": 22.653950953678475,
+ "grad_norm": 9.42237377166748,
+ "learning_rate": 1.804155239246311e-05,
+ "loss": 0.701,
+ "step": 8314
+ },
+ {
+ "epoch": 22.6566757493188,
+ "grad_norm": 10.920177459716797,
+ "learning_rate": 1.8041027789271642e-05,
+ "loss": 0.6328,
+ "step": 8315
+ },
+ {
+ "epoch": 22.659400544959126,
+ "grad_norm": 7.157051086425781,
+ "learning_rate": 1.8040503123456905e-05,
+ "loss": 0.88,
+ "step": 8316
+ },
+ {
+ "epoch": 22.662125340599456,
+ "grad_norm": 7.44293737411499,
+ "learning_rate": 1.8039978395022993e-05,
+ "loss": 0.7865,
+ "step": 8317
+ },
+ {
+ "epoch": 22.66485013623978,
+ "grad_norm": 10.239413261413574,
+ "learning_rate": 1.8039453603973984e-05,
+ "loss": 0.7601,
+ "step": 8318
+ },
+ {
+ "epoch": 22.667574931880107,
+ "grad_norm": 9.254770278930664,
+ "learning_rate": 1.803892875031397e-05,
+ "loss": 0.7531,
+ "step": 8319
+ },
+ {
+ "epoch": 22.670299727520437,
+ "grad_norm": 8.593079566955566,
+ "learning_rate": 1.803840383404704e-05,
+ "loss": 0.7659,
+ "step": 8320
+ },
+ {
+ "epoch": 22.673024523160763,
+ "grad_norm": 8.502016067504883,
+ "learning_rate": 1.8037878855177276e-05,
+ "loss": 0.9703,
+ "step": 8321
+ },
+ {
+ "epoch": 22.67574931880109,
+ "grad_norm": 9.36688232421875,
+ "learning_rate": 1.8037353813708773e-05,
+ "loss": 0.8094,
+ "step": 8322
+ },
+ {
+ "epoch": 22.678474114441418,
+ "grad_norm": 9.845867156982422,
+ "learning_rate": 1.8036828709645616e-05,
+ "loss": 0.6603,
+ "step": 8323
+ },
+ {
+ "epoch": 22.681198910081743,
+ "grad_norm": 7.752012252807617,
+ "learning_rate": 1.8036303542991898e-05,
+ "loss": 0.689,
+ "step": 8324
+ },
+ {
+ "epoch": 22.68392370572207,
+ "grad_norm": 8.684884071350098,
+ "learning_rate": 1.8035778313751704e-05,
+ "loss": 0.7348,
+ "step": 8325
+ },
+ {
+ "epoch": 22.6866485013624,
+ "grad_norm": 14.845547676086426,
+ "learning_rate": 1.803525302192913e-05,
+ "loss": 0.7791,
+ "step": 8326
+ },
+ {
+ "epoch": 22.689373297002724,
+ "grad_norm": 10.740171432495117,
+ "learning_rate": 1.803472766752826e-05,
+ "loss": 0.7183,
+ "step": 8327
+ },
+ {
+ "epoch": 22.69209809264305,
+ "grad_norm": 9.001082420349121,
+ "learning_rate": 1.8034202250553193e-05,
+ "loss": 0.7847,
+ "step": 8328
+ },
+ {
+ "epoch": 22.69482288828338,
+ "grad_norm": 8.427489280700684,
+ "learning_rate": 1.8033676771008014e-05,
+ "loss": 0.7919,
+ "step": 8329
+ },
+ {
+ "epoch": 22.697547683923705,
+ "grad_norm": 9.384603500366211,
+ "learning_rate": 1.803315122889682e-05,
+ "loss": 0.5674,
+ "step": 8330
+ },
+ {
+ "epoch": 22.70027247956403,
+ "grad_norm": 7.615623950958252,
+ "learning_rate": 1.8032625624223708e-05,
+ "loss": 0.7269,
+ "step": 8331
+ },
+ {
+ "epoch": 22.70299727520436,
+ "grad_norm": 7.652527809143066,
+ "learning_rate": 1.803209995699276e-05,
+ "loss": 0.5839,
+ "step": 8332
+ },
+ {
+ "epoch": 22.705722070844686,
+ "grad_norm": 8.273387908935547,
+ "learning_rate": 1.8031574227208078e-05,
+ "loss": 0.611,
+ "step": 8333
+ },
+ {
+ "epoch": 22.708446866485012,
+ "grad_norm": 9.620495796203613,
+ "learning_rate": 1.8031048434873754e-05,
+ "loss": 0.8767,
+ "step": 8334
+ },
+ {
+ "epoch": 22.71117166212534,
+ "grad_norm": 10.494977951049805,
+ "learning_rate": 1.8030522579993884e-05,
+ "loss": 0.6519,
+ "step": 8335
+ },
+ {
+ "epoch": 22.713896457765667,
+ "grad_norm": 9.045083999633789,
+ "learning_rate": 1.802999666257256e-05,
+ "loss": 0.6703,
+ "step": 8336
+ },
+ {
+ "epoch": 22.716621253405993,
+ "grad_norm": 7.966055393218994,
+ "learning_rate": 1.8029470682613886e-05,
+ "loss": 0.8085,
+ "step": 8337
+ },
+ {
+ "epoch": 22.719346049046322,
+ "grad_norm": 9.901015281677246,
+ "learning_rate": 1.8028944640121948e-05,
+ "loss": 0.7672,
+ "step": 8338
+ },
+ {
+ "epoch": 22.722070844686648,
+ "grad_norm": 11.238534927368164,
+ "learning_rate": 1.8028418535100848e-05,
+ "loss": 0.6296,
+ "step": 8339
+ },
+ {
+ "epoch": 22.724795640326974,
+ "grad_norm": 9.268028259277344,
+ "learning_rate": 1.8027892367554686e-05,
+ "loss": 0.6449,
+ "step": 8340
+ },
+ {
+ "epoch": 22.727520435967303,
+ "grad_norm": 10.056122779846191,
+ "learning_rate": 1.8027366137487555e-05,
+ "loss": 0.7068,
+ "step": 8341
+ },
+ {
+ "epoch": 22.73024523160763,
+ "grad_norm": 8.317461967468262,
+ "learning_rate": 1.8026839844903552e-05,
+ "loss": 0.6533,
+ "step": 8342
+ },
+ {
+ "epoch": 22.732970027247955,
+ "grad_norm": 18.117374420166016,
+ "learning_rate": 1.8026313489806783e-05,
+ "loss": 0.6644,
+ "step": 8343
+ },
+ {
+ "epoch": 22.735694822888284,
+ "grad_norm": 11.009692192077637,
+ "learning_rate": 1.802578707220134e-05,
+ "loss": 0.6713,
+ "step": 8344
+ },
+ {
+ "epoch": 22.73841961852861,
+ "grad_norm": 7.9983367919921875,
+ "learning_rate": 1.8025260592091326e-05,
+ "loss": 0.8015,
+ "step": 8345
+ },
+ {
+ "epoch": 22.741144414168936,
+ "grad_norm": 8.074543952941895,
+ "learning_rate": 1.8024734049480843e-05,
+ "loss": 0.7056,
+ "step": 8346
+ },
+ {
+ "epoch": 22.743869209809265,
+ "grad_norm": 12.755304336547852,
+ "learning_rate": 1.8024207444373988e-05,
+ "loss": 0.7308,
+ "step": 8347
+ },
+ {
+ "epoch": 22.74659400544959,
+ "grad_norm": 8.259418487548828,
+ "learning_rate": 1.802368077677486e-05,
+ "loss": 0.6225,
+ "step": 8348
+ },
+ {
+ "epoch": 22.749318801089917,
+ "grad_norm": 10.191117286682129,
+ "learning_rate": 1.802315404668757e-05,
+ "loss": 0.7797,
+ "step": 8349
+ },
+ {
+ "epoch": 22.752043596730246,
+ "grad_norm": 7.531361103057861,
+ "learning_rate": 1.802262725411621e-05,
+ "loss": 0.7404,
+ "step": 8350
+ },
+ {
+ "epoch": 22.754768392370572,
+ "grad_norm": 8.780338287353516,
+ "learning_rate": 1.802210039906489e-05,
+ "loss": 0.7735,
+ "step": 8351
+ },
+ {
+ "epoch": 22.757493188010898,
+ "grad_norm": 10.208608627319336,
+ "learning_rate": 1.8021573481537712e-05,
+ "loss": 0.8137,
+ "step": 8352
+ },
+ {
+ "epoch": 22.760217983651227,
+ "grad_norm": 11.209440231323242,
+ "learning_rate": 1.8021046501538774e-05,
+ "loss": 0.6912,
+ "step": 8353
+ },
+ {
+ "epoch": 22.762942779291553,
+ "grad_norm": 10.841713905334473,
+ "learning_rate": 1.8020519459072186e-05,
+ "loss": 0.7172,
+ "step": 8354
+ },
+ {
+ "epoch": 22.76566757493188,
+ "grad_norm": 7.741214752197266,
+ "learning_rate": 1.801999235414205e-05,
+ "loss": 0.8362,
+ "step": 8355
+ },
+ {
+ "epoch": 22.768392370572208,
+ "grad_norm": 8.230745315551758,
+ "learning_rate": 1.801946518675247e-05,
+ "loss": 0.7798,
+ "step": 8356
+ },
+ {
+ "epoch": 22.771117166212534,
+ "grad_norm": 9.219021797180176,
+ "learning_rate": 1.8018937956907556e-05,
+ "loss": 0.7969,
+ "step": 8357
+ },
+ {
+ "epoch": 22.77384196185286,
+ "grad_norm": 7.021849632263184,
+ "learning_rate": 1.8018410664611413e-05,
+ "loss": 0.8274,
+ "step": 8358
+ },
+ {
+ "epoch": 22.77656675749319,
+ "grad_norm": 8.705036163330078,
+ "learning_rate": 1.801788330986814e-05,
+ "loss": 0.7939,
+ "step": 8359
+ },
+ {
+ "epoch": 22.779291553133515,
+ "grad_norm": 8.407700538635254,
+ "learning_rate": 1.8017355892681855e-05,
+ "loss": 0.6484,
+ "step": 8360
+ },
+ {
+ "epoch": 22.78201634877384,
+ "grad_norm": 10.441157341003418,
+ "learning_rate": 1.8016828413056657e-05,
+ "loss": 0.6018,
+ "step": 8361
+ },
+ {
+ "epoch": 22.78474114441417,
+ "grad_norm": 15.836782455444336,
+ "learning_rate": 1.8016300870996657e-05,
+ "loss": 0.7433,
+ "step": 8362
+ },
+ {
+ "epoch": 22.787465940054496,
+ "grad_norm": 7.165671348571777,
+ "learning_rate": 1.8015773266505968e-05,
+ "loss": 0.6499,
+ "step": 8363
+ },
+ {
+ "epoch": 22.79019073569482,
+ "grad_norm": 7.884844779968262,
+ "learning_rate": 1.801524559958869e-05,
+ "loss": 0.7734,
+ "step": 8364
+ },
+ {
+ "epoch": 22.79291553133515,
+ "grad_norm": 8.301671028137207,
+ "learning_rate": 1.801471787024894e-05,
+ "loss": 0.7458,
+ "step": 8365
+ },
+ {
+ "epoch": 22.795640326975477,
+ "grad_norm": 8.874147415161133,
+ "learning_rate": 1.8014190078490827e-05,
+ "loss": 0.818,
+ "step": 8366
+ },
+ {
+ "epoch": 22.798365122615802,
+ "grad_norm": 8.567561149597168,
+ "learning_rate": 1.8013662224318454e-05,
+ "loss": 0.6621,
+ "step": 8367
+ },
+ {
+ "epoch": 22.80108991825613,
+ "grad_norm": 8.372900009155273,
+ "learning_rate": 1.801313430773594e-05,
+ "loss": 0.7499,
+ "step": 8368
+ },
+ {
+ "epoch": 22.803814713896458,
+ "grad_norm": 10.487556457519531,
+ "learning_rate": 1.8012606328747396e-05,
+ "loss": 0.7626,
+ "step": 8369
+ },
+ {
+ "epoch": 22.806539509536783,
+ "grad_norm": 8.268380165100098,
+ "learning_rate": 1.801207828735693e-05,
+ "loss": 0.6166,
+ "step": 8370
+ },
+ {
+ "epoch": 22.809264305177113,
+ "grad_norm": 9.076476097106934,
+ "learning_rate": 1.801155018356866e-05,
+ "loss": 0.9066,
+ "step": 8371
+ },
+ {
+ "epoch": 22.81198910081744,
+ "grad_norm": 7.709597110748291,
+ "learning_rate": 1.801102201738669e-05,
+ "loss": 0.7554,
+ "step": 8372
+ },
+ {
+ "epoch": 22.814713896457764,
+ "grad_norm": 7.452513694763184,
+ "learning_rate": 1.801049378881514e-05,
+ "loss": 0.8503,
+ "step": 8373
+ },
+ {
+ "epoch": 22.817438692098094,
+ "grad_norm": 12.326823234558105,
+ "learning_rate": 1.8009965497858122e-05,
+ "loss": 0.8734,
+ "step": 8374
+ },
+ {
+ "epoch": 22.82016348773842,
+ "grad_norm": 8.573702812194824,
+ "learning_rate": 1.8009437144519754e-05,
+ "loss": 0.7109,
+ "step": 8375
+ },
+ {
+ "epoch": 22.822888283378745,
+ "grad_norm": 9.0914306640625,
+ "learning_rate": 1.800890872880414e-05,
+ "loss": 0.7036,
+ "step": 8376
+ },
+ {
+ "epoch": 22.825613079019075,
+ "grad_norm": 7.493348121643066,
+ "learning_rate": 1.8008380250715407e-05,
+ "loss": 0.7402,
+ "step": 8377
+ },
+ {
+ "epoch": 22.8283378746594,
+ "grad_norm": 7.073947906494141,
+ "learning_rate": 1.8007851710257665e-05,
+ "loss": 0.7428,
+ "step": 8378
+ },
+ {
+ "epoch": 22.831062670299726,
+ "grad_norm": 7.560627460479736,
+ "learning_rate": 1.8007323107435036e-05,
+ "loss": 0.7723,
+ "step": 8379
+ },
+ {
+ "epoch": 22.833787465940055,
+ "grad_norm": 11.093255043029785,
+ "learning_rate": 1.8006794442251628e-05,
+ "loss": 0.6369,
+ "step": 8380
+ },
+ {
+ "epoch": 22.83651226158038,
+ "grad_norm": 10.050905227661133,
+ "learning_rate": 1.8006265714711563e-05,
+ "loss": 0.7341,
+ "step": 8381
+ },
+ {
+ "epoch": 22.839237057220707,
+ "grad_norm": 6.6332011222839355,
+ "learning_rate": 1.800573692481896e-05,
+ "loss": 0.6653,
+ "step": 8382
+ },
+ {
+ "epoch": 22.841961852861036,
+ "grad_norm": 10.797080993652344,
+ "learning_rate": 1.8005208072577934e-05,
+ "loss": 0.7542,
+ "step": 8383
+ },
+ {
+ "epoch": 22.844686648501362,
+ "grad_norm": 7.66061544418335,
+ "learning_rate": 1.8004679157992603e-05,
+ "loss": 0.6463,
+ "step": 8384
+ },
+ {
+ "epoch": 22.847411444141688,
+ "grad_norm": 9.29662036895752,
+ "learning_rate": 1.8004150181067092e-05,
+ "loss": 0.6167,
+ "step": 8385
+ },
+ {
+ "epoch": 22.850136239782017,
+ "grad_norm": 8.294990539550781,
+ "learning_rate": 1.8003621141805515e-05,
+ "loss": 0.8214,
+ "step": 8386
+ },
+ {
+ "epoch": 22.852861035422343,
+ "grad_norm": 9.719687461853027,
+ "learning_rate": 1.8003092040211997e-05,
+ "loss": 0.7599,
+ "step": 8387
+ },
+ {
+ "epoch": 22.85558583106267,
+ "grad_norm": 6.939882755279541,
+ "learning_rate": 1.8002562876290653e-05,
+ "loss": 0.6698,
+ "step": 8388
+ },
+ {
+ "epoch": 22.858310626703,
+ "grad_norm": 7.773337364196777,
+ "learning_rate": 1.8002033650045608e-05,
+ "loss": 0.7798,
+ "step": 8389
+ },
+ {
+ "epoch": 22.861035422343324,
+ "grad_norm": 5.989284992218018,
+ "learning_rate": 1.800150436148098e-05,
+ "loss": 0.8341,
+ "step": 8390
+ },
+ {
+ "epoch": 22.86376021798365,
+ "grad_norm": 8.706110000610352,
+ "learning_rate": 1.8000975010600896e-05,
+ "loss": 0.6805,
+ "step": 8391
+ },
+ {
+ "epoch": 22.86648501362398,
+ "grad_norm": 8.234627723693848,
+ "learning_rate": 1.8000445597409476e-05,
+ "loss": 0.7802,
+ "step": 8392
+ },
+ {
+ "epoch": 22.869209809264305,
+ "grad_norm": 8.230191230773926,
+ "learning_rate": 1.7999916121910844e-05,
+ "loss": 0.9098,
+ "step": 8393
+ },
+ {
+ "epoch": 22.87193460490463,
+ "grad_norm": 9.947519302368164,
+ "learning_rate": 1.799938658410912e-05,
+ "loss": 0.6981,
+ "step": 8394
+ },
+ {
+ "epoch": 22.87465940054496,
+ "grad_norm": 8.276824951171875,
+ "learning_rate": 1.7998856984008435e-05,
+ "loss": 0.625,
+ "step": 8395
+ },
+ {
+ "epoch": 22.877384196185286,
+ "grad_norm": 9.143417358398438,
+ "learning_rate": 1.799832732161291e-05,
+ "loss": 0.7893,
+ "step": 8396
+ },
+ {
+ "epoch": 22.88010899182561,
+ "grad_norm": 8.269719123840332,
+ "learning_rate": 1.7997797596926663e-05,
+ "loss": 0.6224,
+ "step": 8397
+ },
+ {
+ "epoch": 22.88283378746594,
+ "grad_norm": 12.5256929397583,
+ "learning_rate": 1.799726780995383e-05,
+ "loss": 0.705,
+ "step": 8398
+ },
+ {
+ "epoch": 22.885558583106267,
+ "grad_norm": 7.561325550079346,
+ "learning_rate": 1.799673796069853e-05,
+ "loss": 0.6573,
+ "step": 8399
+ },
+ {
+ "epoch": 22.888283378746593,
+ "grad_norm": 8.696834564208984,
+ "learning_rate": 1.7996208049164893e-05,
+ "loss": 0.8337,
+ "step": 8400
+ },
+ {
+ "epoch": 22.891008174386922,
+ "grad_norm": 12.15063190460205,
+ "learning_rate": 1.7995678075357046e-05,
+ "loss": 0.9536,
+ "step": 8401
+ },
+ {
+ "epoch": 22.893732970027248,
+ "grad_norm": 11.010416030883789,
+ "learning_rate": 1.7995148039279114e-05,
+ "loss": 0.6628,
+ "step": 8402
+ },
+ {
+ "epoch": 22.896457765667574,
+ "grad_norm": 27.363561630249023,
+ "learning_rate": 1.799461794093523e-05,
+ "loss": 0.7762,
+ "step": 8403
+ },
+ {
+ "epoch": 22.899182561307903,
+ "grad_norm": 9.95945930480957,
+ "learning_rate": 1.7994087780329515e-05,
+ "loss": 0.7667,
+ "step": 8404
+ },
+ {
+ "epoch": 22.90190735694823,
+ "grad_norm": 9.571027755737305,
+ "learning_rate": 1.79935575574661e-05,
+ "loss": 0.6774,
+ "step": 8405
+ },
+ {
+ "epoch": 22.904632152588555,
+ "grad_norm": 6.8465681076049805,
+ "learning_rate": 1.7993027272349122e-05,
+ "loss": 0.7532,
+ "step": 8406
+ },
+ {
+ "epoch": 22.907356948228884,
+ "grad_norm": 7.76675271987915,
+ "learning_rate": 1.79924969249827e-05,
+ "loss": 0.6217,
+ "step": 8407
+ },
+ {
+ "epoch": 22.91008174386921,
+ "grad_norm": 7.14346170425415,
+ "learning_rate": 1.799196651537097e-05,
+ "loss": 0.8032,
+ "step": 8408
+ },
+ {
+ "epoch": 22.912806539509535,
+ "grad_norm": 8.59581470489502,
+ "learning_rate": 1.7991436043518063e-05,
+ "loss": 0.7368,
+ "step": 8409
+ },
+ {
+ "epoch": 22.915531335149865,
+ "grad_norm": 9.888229370117188,
+ "learning_rate": 1.7990905509428113e-05,
+ "loss": 0.8506,
+ "step": 8410
+ },
+ {
+ "epoch": 22.91825613079019,
+ "grad_norm": 8.427626609802246,
+ "learning_rate": 1.7990374913105243e-05,
+ "loss": 0.7975,
+ "step": 8411
+ },
+ {
+ "epoch": 22.920980926430516,
+ "grad_norm": 7.949625015258789,
+ "learning_rate": 1.798984425455359e-05,
+ "loss": 0.7159,
+ "step": 8412
+ },
+ {
+ "epoch": 22.923705722070846,
+ "grad_norm": 12.150747299194336,
+ "learning_rate": 1.798931353377729e-05,
+ "loss": 0.6206,
+ "step": 8413
+ },
+ {
+ "epoch": 22.92643051771117,
+ "grad_norm": 11.340509414672852,
+ "learning_rate": 1.7988782750780474e-05,
+ "loss": 0.8069,
+ "step": 8414
+ },
+ {
+ "epoch": 22.929155313351497,
+ "grad_norm": 8.656377792358398,
+ "learning_rate": 1.7988251905567272e-05,
+ "loss": 0.6528,
+ "step": 8415
+ },
+ {
+ "epoch": 22.931880108991827,
+ "grad_norm": 8.10794448852539,
+ "learning_rate": 1.798772099814182e-05,
+ "loss": 0.5533,
+ "step": 8416
+ },
+ {
+ "epoch": 22.934604904632153,
+ "grad_norm": 6.618900299072266,
+ "learning_rate": 1.7987190028508258e-05,
+ "loss": 0.7542,
+ "step": 8417
+ },
+ {
+ "epoch": 22.93732970027248,
+ "grad_norm": 10.989508628845215,
+ "learning_rate": 1.7986658996670716e-05,
+ "loss": 0.6791,
+ "step": 8418
+ },
+ {
+ "epoch": 22.940054495912808,
+ "grad_norm": 7.508787155151367,
+ "learning_rate": 1.798612790263333e-05,
+ "loss": 0.7457,
+ "step": 8419
+ },
+ {
+ "epoch": 22.942779291553133,
+ "grad_norm": 11.940625190734863,
+ "learning_rate": 1.7985596746400234e-05,
+ "loss": 0.7559,
+ "step": 8420
+ },
+ {
+ "epoch": 22.94550408719346,
+ "grad_norm": 9.415892601013184,
+ "learning_rate": 1.7985065527975574e-05,
+ "loss": 0.86,
+ "step": 8421
+ },
+ {
+ "epoch": 22.94822888283379,
+ "grad_norm": 9.412283897399902,
+ "learning_rate": 1.798453424736348e-05,
+ "loss": 0.707,
+ "step": 8422
+ },
+ {
+ "epoch": 22.950953678474114,
+ "grad_norm": 7.368431568145752,
+ "learning_rate": 1.7984002904568085e-05,
+ "loss": 0.5997,
+ "step": 8423
+ },
+ {
+ "epoch": 22.95367847411444,
+ "grad_norm": 8.547812461853027,
+ "learning_rate": 1.7983471499593536e-05,
+ "loss": 0.758,
+ "step": 8424
+ },
+ {
+ "epoch": 22.95640326975477,
+ "grad_norm": 8.5846586227417,
+ "learning_rate": 1.7982940032443967e-05,
+ "loss": 0.7478,
+ "step": 8425
+ },
+ {
+ "epoch": 22.959128065395095,
+ "grad_norm": 15.388944625854492,
+ "learning_rate": 1.7982408503123518e-05,
+ "loss": 0.7078,
+ "step": 8426
+ },
+ {
+ "epoch": 22.96185286103542,
+ "grad_norm": 7.916131496429443,
+ "learning_rate": 1.7981876911636325e-05,
+ "loss": 0.6588,
+ "step": 8427
+ },
+ {
+ "epoch": 22.96457765667575,
+ "grad_norm": 8.411246299743652,
+ "learning_rate": 1.7981345257986537e-05,
+ "loss": 0.7148,
+ "step": 8428
+ },
+ {
+ "epoch": 22.967302452316076,
+ "grad_norm": 8.674823760986328,
+ "learning_rate": 1.798081354217829e-05,
+ "loss": 0.7478,
+ "step": 8429
+ },
+ {
+ "epoch": 22.970027247956402,
+ "grad_norm": 8.647583961486816,
+ "learning_rate": 1.7980281764215716e-05,
+ "loss": 0.7847,
+ "step": 8430
+ },
+ {
+ "epoch": 22.97275204359673,
+ "grad_norm": 12.102951049804688,
+ "learning_rate": 1.797974992410297e-05,
+ "loss": 0.9033,
+ "step": 8431
+ },
+ {
+ "epoch": 22.975476839237057,
+ "grad_norm": 8.523092269897461,
+ "learning_rate": 1.797921802184419e-05,
+ "loss": 0.6737,
+ "step": 8432
+ },
+ {
+ "epoch": 22.978201634877383,
+ "grad_norm": 9.005290031433105,
+ "learning_rate": 1.7978686057443514e-05,
+ "loss": 0.7683,
+ "step": 8433
+ },
+ {
+ "epoch": 22.980926430517712,
+ "grad_norm": 14.410584449768066,
+ "learning_rate": 1.797815403090509e-05,
+ "loss": 0.6978,
+ "step": 8434
+ },
+ {
+ "epoch": 22.983651226158038,
+ "grad_norm": 8.908540725708008,
+ "learning_rate": 1.7977621942233057e-05,
+ "loss": 0.8822,
+ "step": 8435
+ },
+ {
+ "epoch": 22.986376021798364,
+ "grad_norm": 9.658884048461914,
+ "learning_rate": 1.797708979143156e-05,
+ "loss": 0.9028,
+ "step": 8436
+ },
+ {
+ "epoch": 22.989100817438693,
+ "grad_norm": 9.560940742492676,
+ "learning_rate": 1.797655757850475e-05,
+ "loss": 0.733,
+ "step": 8437
+ },
+ {
+ "epoch": 22.99182561307902,
+ "grad_norm": 8.36474609375,
+ "learning_rate": 1.797602530345676e-05,
+ "loss": 0.6675,
+ "step": 8438
+ },
+ {
+ "epoch": 22.994550408719345,
+ "grad_norm": 7.720761299133301,
+ "learning_rate": 1.7975492966291743e-05,
+ "loss": 0.7605,
+ "step": 8439
+ },
+ {
+ "epoch": 22.997275204359674,
+ "grad_norm": 10.557333946228027,
+ "learning_rate": 1.7974960567013844e-05,
+ "loss": 0.8137,
+ "step": 8440
+ },
+ {
+ "epoch": 23.0,
+ "grad_norm": 7.309525966644287,
+ "learning_rate": 1.797442810562721e-05,
+ "loss": 0.5304,
+ "step": 8441
+ },
+ {
+ "epoch": 23.002724795640326,
+ "grad_norm": 7.120656967163086,
+ "learning_rate": 1.7973895582135984e-05,
+ "loss": 0.6416,
+ "step": 8442
+ },
+ {
+ "epoch": 23.005449591280655,
+ "grad_norm": 7.714159965515137,
+ "learning_rate": 1.7973362996544318e-05,
+ "loss": 0.5383,
+ "step": 8443
+ },
+ {
+ "epoch": 23.00817438692098,
+ "grad_norm": 7.924902439117432,
+ "learning_rate": 1.7972830348856358e-05,
+ "loss": 0.6489,
+ "step": 8444
+ },
+ {
+ "epoch": 23.010899182561307,
+ "grad_norm": 8.31507682800293,
+ "learning_rate": 1.797229763907625e-05,
+ "loss": 0.6921,
+ "step": 8445
+ },
+ {
+ "epoch": 23.013623978201636,
+ "grad_norm": 6.668956756591797,
+ "learning_rate": 1.797176486720815e-05,
+ "loss": 0.6844,
+ "step": 8446
+ },
+ {
+ "epoch": 23.016348773841962,
+ "grad_norm": 7.660555362701416,
+ "learning_rate": 1.7971232033256197e-05,
+ "loss": 0.4926,
+ "step": 8447
+ },
+ {
+ "epoch": 23.019073569482288,
+ "grad_norm": 6.523613929748535,
+ "learning_rate": 1.7970699137224543e-05,
+ "loss": 0.6993,
+ "step": 8448
+ },
+ {
+ "epoch": 23.021798365122617,
+ "grad_norm": 9.737499237060547,
+ "learning_rate": 1.7970166179117344e-05,
+ "loss": 0.7983,
+ "step": 8449
+ },
+ {
+ "epoch": 23.024523160762943,
+ "grad_norm": 7.278012275695801,
+ "learning_rate": 1.7969633158938745e-05,
+ "loss": 0.6957,
+ "step": 8450
+ },
+ {
+ "epoch": 23.02724795640327,
+ "grad_norm": 10.634453773498535,
+ "learning_rate": 1.79691000766929e-05,
+ "loss": 0.6973,
+ "step": 8451
+ },
+ {
+ "epoch": 23.029972752043598,
+ "grad_norm": 8.478558540344238,
+ "learning_rate": 1.7968566932383968e-05,
+ "loss": 0.671,
+ "step": 8452
+ },
+ {
+ "epoch": 23.032697547683924,
+ "grad_norm": 10.252836227416992,
+ "learning_rate": 1.7968033726016085e-05,
+ "loss": 0.619,
+ "step": 8453
+ },
+ {
+ "epoch": 23.03542234332425,
+ "grad_norm": 7.047082424163818,
+ "learning_rate": 1.7967500457593412e-05,
+ "loss": 0.6472,
+ "step": 8454
+ },
+ {
+ "epoch": 23.03814713896458,
+ "grad_norm": 8.522323608398438,
+ "learning_rate": 1.79669671271201e-05,
+ "loss": 0.6464,
+ "step": 8455
+ },
+ {
+ "epoch": 23.040871934604905,
+ "grad_norm": 7.537111759185791,
+ "learning_rate": 1.796643373460031e-05,
+ "loss": 0.6147,
+ "step": 8456
+ },
+ {
+ "epoch": 23.04359673024523,
+ "grad_norm": 7.55095911026001,
+ "learning_rate": 1.796590028003819e-05,
+ "loss": 0.6521,
+ "step": 8457
+ },
+ {
+ "epoch": 23.04632152588556,
+ "grad_norm": 7.395035743713379,
+ "learning_rate": 1.7965366763437893e-05,
+ "loss": 0.6871,
+ "step": 8458
+ },
+ {
+ "epoch": 23.049046321525886,
+ "grad_norm": 8.479537010192871,
+ "learning_rate": 1.7964833184803576e-05,
+ "loss": 0.6937,
+ "step": 8459
+ },
+ {
+ "epoch": 23.05177111716621,
+ "grad_norm": 6.660445690155029,
+ "learning_rate": 1.7964299544139394e-05,
+ "loss": 0.5733,
+ "step": 8460
+ },
+ {
+ "epoch": 23.05449591280654,
+ "grad_norm": 8.537720680236816,
+ "learning_rate": 1.7963765841449506e-05,
+ "loss": 0.6393,
+ "step": 8461
+ },
+ {
+ "epoch": 23.057220708446867,
+ "grad_norm": 9.241690635681152,
+ "learning_rate": 1.7963232076738063e-05,
+ "loss": 0.6331,
+ "step": 8462
+ },
+ {
+ "epoch": 23.059945504087192,
+ "grad_norm": 35.25710678100586,
+ "learning_rate": 1.7962698250009226e-05,
+ "loss": 0.646,
+ "step": 8463
+ },
+ {
+ "epoch": 23.06267029972752,
+ "grad_norm": 7.614792823791504,
+ "learning_rate": 1.7962164361267152e-05,
+ "loss": 0.5204,
+ "step": 8464
+ },
+ {
+ "epoch": 23.065395095367847,
+ "grad_norm": 7.552260398864746,
+ "learning_rate": 1.7961630410515998e-05,
+ "loss": 0.5472,
+ "step": 8465
+ },
+ {
+ "epoch": 23.068119891008173,
+ "grad_norm": 10.231441497802734,
+ "learning_rate": 1.7961096397759922e-05,
+ "loss": 0.592,
+ "step": 8466
+ },
+ {
+ "epoch": 23.070844686648503,
+ "grad_norm": 7.6383843421936035,
+ "learning_rate": 1.7960562323003087e-05,
+ "loss": 0.5792,
+ "step": 8467
+ },
+ {
+ "epoch": 23.07356948228883,
+ "grad_norm": 9.595244407653809,
+ "learning_rate": 1.7960028186249644e-05,
+ "loss": 0.693,
+ "step": 8468
+ },
+ {
+ "epoch": 23.076294277929154,
+ "grad_norm": 9.348398208618164,
+ "learning_rate": 1.7959493987503757e-05,
+ "loss": 0.6698,
+ "step": 8469
+ },
+ {
+ "epoch": 23.079019073569484,
+ "grad_norm": 8.854413032531738,
+ "learning_rate": 1.795895972676959e-05,
+ "loss": 0.6348,
+ "step": 8470
+ },
+ {
+ "epoch": 23.08174386920981,
+ "grad_norm": 8.519789695739746,
+ "learning_rate": 1.79584254040513e-05,
+ "loss": 0.5905,
+ "step": 8471
+ },
+ {
+ "epoch": 23.084468664850135,
+ "grad_norm": 8.251155853271484,
+ "learning_rate": 1.7957891019353048e-05,
+ "loss": 0.6971,
+ "step": 8472
+ },
+ {
+ "epoch": 23.087193460490465,
+ "grad_norm": 9.817055702209473,
+ "learning_rate": 1.7957356572678998e-05,
+ "loss": 0.5431,
+ "step": 8473
+ },
+ {
+ "epoch": 23.08991825613079,
+ "grad_norm": 9.670547485351562,
+ "learning_rate": 1.7956822064033313e-05,
+ "loss": 0.6669,
+ "step": 8474
+ },
+ {
+ "epoch": 23.092643051771116,
+ "grad_norm": 9.475438117980957,
+ "learning_rate": 1.7956287493420152e-05,
+ "loss": 0.7317,
+ "step": 8475
+ },
+ {
+ "epoch": 23.095367847411445,
+ "grad_norm": 8.039822578430176,
+ "learning_rate": 1.7955752860843678e-05,
+ "loss": 0.6687,
+ "step": 8476
+ },
+ {
+ "epoch": 23.09809264305177,
+ "grad_norm": 7.249072074890137,
+ "learning_rate": 1.795521816630806e-05,
+ "loss": 0.646,
+ "step": 8477
+ },
+ {
+ "epoch": 23.100817438692097,
+ "grad_norm": 7.711321830749512,
+ "learning_rate": 1.7954683409817457e-05,
+ "loss": 0.5933,
+ "step": 8478
+ },
+ {
+ "epoch": 23.103542234332426,
+ "grad_norm": 7.8946380615234375,
+ "learning_rate": 1.7954148591376038e-05,
+ "loss": 0.6982,
+ "step": 8479
+ },
+ {
+ "epoch": 23.106267029972752,
+ "grad_norm": 7.7069597244262695,
+ "learning_rate": 1.7953613710987966e-05,
+ "loss": 0.5725,
+ "step": 8480
+ },
+ {
+ "epoch": 23.108991825613078,
+ "grad_norm": 8.600133895874023,
+ "learning_rate": 1.7953078768657404e-05,
+ "loss": 0.6288,
+ "step": 8481
+ },
+ {
+ "epoch": 23.111716621253407,
+ "grad_norm": 7.790313720703125,
+ "learning_rate": 1.795254376438852e-05,
+ "loss": 0.6152,
+ "step": 8482
+ },
+ {
+ "epoch": 23.114441416893733,
+ "grad_norm": 9.687016487121582,
+ "learning_rate": 1.7952008698185483e-05,
+ "loss": 0.6984,
+ "step": 8483
+ },
+ {
+ "epoch": 23.11716621253406,
+ "grad_norm": 8.021065711975098,
+ "learning_rate": 1.7951473570052457e-05,
+ "loss": 0.6957,
+ "step": 8484
+ },
+ {
+ "epoch": 23.11989100817439,
+ "grad_norm": 47.138607025146484,
+ "learning_rate": 1.795093837999361e-05,
+ "loss": 0.5585,
+ "step": 8485
+ },
+ {
+ "epoch": 23.122615803814714,
+ "grad_norm": 8.166311264038086,
+ "learning_rate": 1.795040312801311e-05,
+ "loss": 0.5601,
+ "step": 8486
+ },
+ {
+ "epoch": 23.12534059945504,
+ "grad_norm": 8.451225280761719,
+ "learning_rate": 1.794986781411513e-05,
+ "loss": 0.677,
+ "step": 8487
+ },
+ {
+ "epoch": 23.12806539509537,
+ "grad_norm": 9.893058776855469,
+ "learning_rate": 1.7949332438303834e-05,
+ "loss": 0.6196,
+ "step": 8488
+ },
+ {
+ "epoch": 23.130790190735695,
+ "grad_norm": 7.625050067901611,
+ "learning_rate": 1.7948797000583394e-05,
+ "loss": 0.6169,
+ "step": 8489
+ },
+ {
+ "epoch": 23.13351498637602,
+ "grad_norm": 9.372100830078125,
+ "learning_rate": 1.7948261500957974e-05,
+ "loss": 0.6243,
+ "step": 8490
+ },
+ {
+ "epoch": 23.13623978201635,
+ "grad_norm": 10.169224739074707,
+ "learning_rate": 1.7947725939431756e-05,
+ "loss": 0.7031,
+ "step": 8491
+ },
+ {
+ "epoch": 23.138964577656676,
+ "grad_norm": 8.801020622253418,
+ "learning_rate": 1.7947190316008896e-05,
+ "loss": 0.6228,
+ "step": 8492
+ },
+ {
+ "epoch": 23.141689373297,
+ "grad_norm": 12.136094093322754,
+ "learning_rate": 1.7946654630693583e-05,
+ "loss": 0.7136,
+ "step": 8493
+ },
+ {
+ "epoch": 23.14441416893733,
+ "grad_norm": 7.939266204833984,
+ "learning_rate": 1.7946118883489974e-05,
+ "loss": 0.7758,
+ "step": 8494
+ },
+ {
+ "epoch": 23.147138964577657,
+ "grad_norm": 7.835748195648193,
+ "learning_rate": 1.7945583074402246e-05,
+ "loss": 0.6205,
+ "step": 8495
+ },
+ {
+ "epoch": 23.149863760217983,
+ "grad_norm": 10.074135780334473,
+ "learning_rate": 1.7945047203434573e-05,
+ "loss": 0.6698,
+ "step": 8496
+ },
+ {
+ "epoch": 23.152588555858312,
+ "grad_norm": 9.422436714172363,
+ "learning_rate": 1.794451127059113e-05,
+ "loss": 0.79,
+ "step": 8497
+ },
+ {
+ "epoch": 23.155313351498638,
+ "grad_norm": 8.241384506225586,
+ "learning_rate": 1.7943975275876088e-05,
+ "loss": 0.636,
+ "step": 8498
+ },
+ {
+ "epoch": 23.158038147138964,
+ "grad_norm": 8.339426040649414,
+ "learning_rate": 1.7943439219293623e-05,
+ "loss": 0.692,
+ "step": 8499
+ },
+ {
+ "epoch": 23.160762942779293,
+ "grad_norm": 8.311019897460938,
+ "learning_rate": 1.794290310084791e-05,
+ "loss": 0.5696,
+ "step": 8500
+ },
+ {
+ "epoch": 23.16348773841962,
+ "grad_norm": 8.582189559936523,
+ "learning_rate": 1.794236692054312e-05,
+ "loss": 0.5953,
+ "step": 8501
+ },
+ {
+ "epoch": 23.166212534059945,
+ "grad_norm": 7.771618366241455,
+ "learning_rate": 1.7941830678383433e-05,
+ "loss": 0.8604,
+ "step": 8502
+ },
+ {
+ "epoch": 23.168937329700274,
+ "grad_norm": 10.156007766723633,
+ "learning_rate": 1.794129437437303e-05,
+ "loss": 0.6352,
+ "step": 8503
+ },
+ {
+ "epoch": 23.1716621253406,
+ "grad_norm": 10.292689323425293,
+ "learning_rate": 1.7940758008516074e-05,
+ "loss": 0.721,
+ "step": 8504
+ },
+ {
+ "epoch": 23.174386920980925,
+ "grad_norm": 8.468525886535645,
+ "learning_rate": 1.7940221580816755e-05,
+ "loss": 0.5929,
+ "step": 8505
+ },
+ {
+ "epoch": 23.177111716621255,
+ "grad_norm": 8.367538452148438,
+ "learning_rate": 1.7939685091279244e-05,
+ "loss": 0.6339,
+ "step": 8506
+ },
+ {
+ "epoch": 23.17983651226158,
+ "grad_norm": 9.837169647216797,
+ "learning_rate": 1.7939148539907722e-05,
+ "loss": 0.6194,
+ "step": 8507
+ },
+ {
+ "epoch": 23.182561307901906,
+ "grad_norm": 7.640585422515869,
+ "learning_rate": 1.7938611926706365e-05,
+ "loss": 0.5526,
+ "step": 8508
+ },
+ {
+ "epoch": 23.185286103542236,
+ "grad_norm": 7.256917476654053,
+ "learning_rate": 1.7938075251679356e-05,
+ "loss": 0.6492,
+ "step": 8509
+ },
+ {
+ "epoch": 23.18801089918256,
+ "grad_norm": 6.757735252380371,
+ "learning_rate": 1.793753851483087e-05,
+ "loss": 0.5229,
+ "step": 8510
+ },
+ {
+ "epoch": 23.190735694822887,
+ "grad_norm": 10.572715759277344,
+ "learning_rate": 1.793700171616509e-05,
+ "loss": 0.7336,
+ "step": 8511
+ },
+ {
+ "epoch": 23.193460490463217,
+ "grad_norm": 8.248072624206543,
+ "learning_rate": 1.7936464855686197e-05,
+ "loss": 0.6858,
+ "step": 8512
+ },
+ {
+ "epoch": 23.196185286103542,
+ "grad_norm": 8.662367820739746,
+ "learning_rate": 1.7935927933398374e-05,
+ "loss": 0.6094,
+ "step": 8513
+ },
+ {
+ "epoch": 23.19891008174387,
+ "grad_norm": 6.991458415985107,
+ "learning_rate": 1.7935390949305796e-05,
+ "loss": 0.789,
+ "step": 8514
+ },
+ {
+ "epoch": 23.201634877384198,
+ "grad_norm": 8.048157691955566,
+ "learning_rate": 1.7934853903412648e-05,
+ "loss": 0.66,
+ "step": 8515
+ },
+ {
+ "epoch": 23.204359673024523,
+ "grad_norm": 11.361948013305664,
+ "learning_rate": 1.7934316795723116e-05,
+ "loss": 0.675,
+ "step": 8516
+ },
+ {
+ "epoch": 23.20708446866485,
+ "grad_norm": 19.493915557861328,
+ "learning_rate": 1.793377962624138e-05,
+ "loss": 0.6782,
+ "step": 8517
+ },
+ {
+ "epoch": 23.20980926430518,
+ "grad_norm": 7.957698822021484,
+ "learning_rate": 1.793324239497162e-05,
+ "loss": 0.5366,
+ "step": 8518
+ },
+ {
+ "epoch": 23.212534059945504,
+ "grad_norm": 7.149418354034424,
+ "learning_rate": 1.7932705101918025e-05,
+ "loss": 0.7745,
+ "step": 8519
+ },
+ {
+ "epoch": 23.21525885558583,
+ "grad_norm": 9.753764152526855,
+ "learning_rate": 1.793216774708478e-05,
+ "loss": 0.5413,
+ "step": 8520
+ },
+ {
+ "epoch": 23.21798365122616,
+ "grad_norm": 8.978517532348633,
+ "learning_rate": 1.7931630330476066e-05,
+ "loss": 0.7794,
+ "step": 8521
+ },
+ {
+ "epoch": 23.220708446866485,
+ "grad_norm": 10.788363456726074,
+ "learning_rate": 1.793109285209607e-05,
+ "loss": 0.6026,
+ "step": 8522
+ },
+ {
+ "epoch": 23.22343324250681,
+ "grad_norm": 8.073689460754395,
+ "learning_rate": 1.793055531194898e-05,
+ "loss": 0.6669,
+ "step": 8523
+ },
+ {
+ "epoch": 23.22615803814714,
+ "grad_norm": 7.393884181976318,
+ "learning_rate": 1.793001771003898e-05,
+ "loss": 0.6308,
+ "step": 8524
+ },
+ {
+ "epoch": 23.228882833787466,
+ "grad_norm": 9.178787231445312,
+ "learning_rate": 1.7929480046370257e-05,
+ "loss": 0.7239,
+ "step": 8525
+ },
+ {
+ "epoch": 23.231607629427792,
+ "grad_norm": 8.557303428649902,
+ "learning_rate": 1.7928942320947e-05,
+ "loss": 0.8069,
+ "step": 8526
+ },
+ {
+ "epoch": 23.23433242506812,
+ "grad_norm": 7.862518310546875,
+ "learning_rate": 1.7928404533773394e-05,
+ "loss": 0.6935,
+ "step": 8527
+ },
+ {
+ "epoch": 23.237057220708447,
+ "grad_norm": 7.550032138824463,
+ "learning_rate": 1.7927866684853628e-05,
+ "loss": 0.5632,
+ "step": 8528
+ },
+ {
+ "epoch": 23.239782016348773,
+ "grad_norm": 10.641572952270508,
+ "learning_rate": 1.792732877419189e-05,
+ "loss": 0.6713,
+ "step": 8529
+ },
+ {
+ "epoch": 23.242506811989102,
+ "grad_norm": 11.035921096801758,
+ "learning_rate": 1.7926790801792374e-05,
+ "loss": 0.7606,
+ "step": 8530
+ },
+ {
+ "epoch": 23.245231607629428,
+ "grad_norm": 10.768778800964355,
+ "learning_rate": 1.7926252767659265e-05,
+ "loss": 0.6884,
+ "step": 8531
+ },
+ {
+ "epoch": 23.247956403269754,
+ "grad_norm": 8.348357200622559,
+ "learning_rate": 1.7925714671796754e-05,
+ "loss": 0.5798,
+ "step": 8532
+ },
+ {
+ "epoch": 23.250681198910083,
+ "grad_norm": 8.501439094543457,
+ "learning_rate": 1.7925176514209033e-05,
+ "loss": 0.721,
+ "step": 8533
+ },
+ {
+ "epoch": 23.25340599455041,
+ "grad_norm": 8.829363822937012,
+ "learning_rate": 1.7924638294900292e-05,
+ "loss": 0.7488,
+ "step": 8534
+ },
+ {
+ "epoch": 23.256130790190735,
+ "grad_norm": 7.027775287628174,
+ "learning_rate": 1.7924100013874725e-05,
+ "loss": 0.7323,
+ "step": 8535
+ },
+ {
+ "epoch": 23.258855585831064,
+ "grad_norm": 7.892490863800049,
+ "learning_rate": 1.792356167113652e-05,
+ "loss": 0.5483,
+ "step": 8536
+ },
+ {
+ "epoch": 23.26158038147139,
+ "grad_norm": 7.996335983276367,
+ "learning_rate": 1.792302326668987e-05,
+ "loss": 0.5439,
+ "step": 8537
+ },
+ {
+ "epoch": 23.264305177111716,
+ "grad_norm": 11.164660453796387,
+ "learning_rate": 1.7922484800538973e-05,
+ "loss": 0.5655,
+ "step": 8538
+ },
+ {
+ "epoch": 23.267029972752045,
+ "grad_norm": 7.229864120483398,
+ "learning_rate": 1.7921946272688018e-05,
+ "loss": 0.6787,
+ "step": 8539
+ },
+ {
+ "epoch": 23.26975476839237,
+ "grad_norm": 9.329996109008789,
+ "learning_rate": 1.79214076831412e-05,
+ "loss": 0.6082,
+ "step": 8540
+ },
+ {
+ "epoch": 23.272479564032697,
+ "grad_norm": 7.63694429397583,
+ "learning_rate": 1.7920869031902715e-05,
+ "loss": 0.6626,
+ "step": 8541
+ },
+ {
+ "epoch": 23.275204359673026,
+ "grad_norm": 8.810453414916992,
+ "learning_rate": 1.792033031897676e-05,
+ "loss": 0.5375,
+ "step": 8542
+ },
+ {
+ "epoch": 23.277929155313352,
+ "grad_norm": 8.408686637878418,
+ "learning_rate": 1.791979154436752e-05,
+ "loss": 0.74,
+ "step": 8543
+ },
+ {
+ "epoch": 23.280653950953678,
+ "grad_norm": 8.32150650024414,
+ "learning_rate": 1.7919252708079203e-05,
+ "loss": 0.6957,
+ "step": 8544
+ },
+ {
+ "epoch": 23.283378746594007,
+ "grad_norm": 7.6873040199279785,
+ "learning_rate": 1.7918713810116e-05,
+ "loss": 0.6849,
+ "step": 8545
+ },
+ {
+ "epoch": 23.286103542234333,
+ "grad_norm": 15.796939849853516,
+ "learning_rate": 1.791817485048211e-05,
+ "loss": 0.6536,
+ "step": 8546
+ },
+ {
+ "epoch": 23.28882833787466,
+ "grad_norm": 10.190418243408203,
+ "learning_rate": 1.7917635829181726e-05,
+ "loss": 0.6182,
+ "step": 8547
+ },
+ {
+ "epoch": 23.291553133514988,
+ "grad_norm": 9.241643905639648,
+ "learning_rate": 1.7917096746219053e-05,
+ "loss": 0.607,
+ "step": 8548
+ },
+ {
+ "epoch": 23.294277929155314,
+ "grad_norm": 7.768148422241211,
+ "learning_rate": 1.7916557601598283e-05,
+ "loss": 0.679,
+ "step": 8549
+ },
+ {
+ "epoch": 23.29700272479564,
+ "grad_norm": 9.539830207824707,
+ "learning_rate": 1.7916018395323614e-05,
+ "loss": 0.5195,
+ "step": 8550
+ },
+ {
+ "epoch": 23.29972752043597,
+ "grad_norm": 7.210759162902832,
+ "learning_rate": 1.7915479127399255e-05,
+ "loss": 0.6689,
+ "step": 8551
+ },
+ {
+ "epoch": 23.302452316076295,
+ "grad_norm": 10.108943939208984,
+ "learning_rate": 1.7914939797829393e-05,
+ "loss": 0.8805,
+ "step": 8552
+ },
+ {
+ "epoch": 23.30517711171662,
+ "grad_norm": 8.475149154663086,
+ "learning_rate": 1.791440040661824e-05,
+ "loss": 0.6523,
+ "step": 8553
+ },
+ {
+ "epoch": 23.30790190735695,
+ "grad_norm": 7.329076766967773,
+ "learning_rate": 1.7913860953769987e-05,
+ "loss": 0.5496,
+ "step": 8554
+ },
+ {
+ "epoch": 23.310626702997276,
+ "grad_norm": 7.7415876388549805,
+ "learning_rate": 1.791332143928884e-05,
+ "loss": 0.6384,
+ "step": 8555
+ },
+ {
+ "epoch": 23.3133514986376,
+ "grad_norm": 9.320038795471191,
+ "learning_rate": 1.7912781863179005e-05,
+ "loss": 0.6972,
+ "step": 8556
+ },
+ {
+ "epoch": 23.31607629427793,
+ "grad_norm": 9.999711990356445,
+ "learning_rate": 1.7912242225444676e-05,
+ "loss": 0.7368,
+ "step": 8557
+ },
+ {
+ "epoch": 23.318801089918257,
+ "grad_norm": 10.375534057617188,
+ "learning_rate": 1.791170252609006e-05,
+ "loss": 0.681,
+ "step": 8558
+ },
+ {
+ "epoch": 23.321525885558582,
+ "grad_norm": 9.925941467285156,
+ "learning_rate": 1.7911162765119357e-05,
+ "loss": 0.6501,
+ "step": 8559
+ },
+ {
+ "epoch": 23.32425068119891,
+ "grad_norm": 9.065058708190918,
+ "learning_rate": 1.7910622942536777e-05,
+ "loss": 0.7489,
+ "step": 8560
+ },
+ {
+ "epoch": 23.326975476839237,
+ "grad_norm": 8.21484088897705,
+ "learning_rate": 1.7910083058346516e-05,
+ "loss": 0.8214,
+ "step": 8561
+ },
+ {
+ "epoch": 23.329700272479563,
+ "grad_norm": 7.954100608825684,
+ "learning_rate": 1.790954311255279e-05,
+ "loss": 0.5521,
+ "step": 8562
+ },
+ {
+ "epoch": 23.332425068119893,
+ "grad_norm": 8.682811737060547,
+ "learning_rate": 1.790900310515979e-05,
+ "loss": 0.691,
+ "step": 8563
+ },
+ {
+ "epoch": 23.33514986376022,
+ "grad_norm": 8.368846893310547,
+ "learning_rate": 1.790846303617173e-05,
+ "loss": 0.7624,
+ "step": 8564
+ },
+ {
+ "epoch": 23.337874659400544,
+ "grad_norm": 7.999691963195801,
+ "learning_rate": 1.7907922905592813e-05,
+ "loss": 0.6859,
+ "step": 8565
+ },
+ {
+ "epoch": 23.340599455040874,
+ "grad_norm": 7.746175289154053,
+ "learning_rate": 1.790738271342725e-05,
+ "loss": 0.6075,
+ "step": 8566
+ },
+ {
+ "epoch": 23.3433242506812,
+ "grad_norm": 7.714305400848389,
+ "learning_rate": 1.7906842459679242e-05,
+ "loss": 0.7225,
+ "step": 8567
+ },
+ {
+ "epoch": 23.346049046321525,
+ "grad_norm": 7.813354969024658,
+ "learning_rate": 1.7906302144353002e-05,
+ "loss": 0.6647,
+ "step": 8568
+ },
+ {
+ "epoch": 23.348773841961854,
+ "grad_norm": 23.70584487915039,
+ "learning_rate": 1.7905761767452735e-05,
+ "loss": 0.6464,
+ "step": 8569
+ },
+ {
+ "epoch": 23.35149863760218,
+ "grad_norm": 11.611759185791016,
+ "learning_rate": 1.7905221328982647e-05,
+ "loss": 0.7893,
+ "step": 8570
+ },
+ {
+ "epoch": 23.354223433242506,
+ "grad_norm": 7.760707378387451,
+ "learning_rate": 1.790468082894695e-05,
+ "loss": 0.7317,
+ "step": 8571
+ },
+ {
+ "epoch": 23.356948228882835,
+ "grad_norm": 8.688565254211426,
+ "learning_rate": 1.7904140267349856e-05,
+ "loss": 0.5536,
+ "step": 8572
+ },
+ {
+ "epoch": 23.35967302452316,
+ "grad_norm": 6.916512489318848,
+ "learning_rate": 1.7903599644195573e-05,
+ "loss": 0.6938,
+ "step": 8573
+ },
+ {
+ "epoch": 23.362397820163487,
+ "grad_norm": 9.440940856933594,
+ "learning_rate": 1.7903058959488307e-05,
+ "loss": 0.6481,
+ "step": 8574
+ },
+ {
+ "epoch": 23.365122615803816,
+ "grad_norm": 9.571310997009277,
+ "learning_rate": 1.7902518213232273e-05,
+ "loss": 0.718,
+ "step": 8575
+ },
+ {
+ "epoch": 23.367847411444142,
+ "grad_norm": 8.1104736328125,
+ "learning_rate": 1.7901977405431683e-05,
+ "loss": 0.7656,
+ "step": 8576
+ },
+ {
+ "epoch": 23.370572207084468,
+ "grad_norm": 8.448812484741211,
+ "learning_rate": 1.7901436536090747e-05,
+ "loss": 0.7043,
+ "step": 8577
+ },
+ {
+ "epoch": 23.373297002724797,
+ "grad_norm": 8.477097511291504,
+ "learning_rate": 1.7900895605213673e-05,
+ "loss": 0.6609,
+ "step": 8578
+ },
+ {
+ "epoch": 23.376021798365123,
+ "grad_norm": 8.596450805664062,
+ "learning_rate": 1.7900354612804685e-05,
+ "loss": 0.7032,
+ "step": 8579
+ },
+ {
+ "epoch": 23.37874659400545,
+ "grad_norm": 8.790950775146484,
+ "learning_rate": 1.7899813558867985e-05,
+ "loss": 0.7711,
+ "step": 8580
+ },
+ {
+ "epoch": 23.381471389645778,
+ "grad_norm": 8.57071590423584,
+ "learning_rate": 1.7899272443407792e-05,
+ "loss": 0.6788,
+ "step": 8581
+ },
+ {
+ "epoch": 23.384196185286104,
+ "grad_norm": 8.83356761932373,
+ "learning_rate": 1.789873126642832e-05,
+ "loss": 0.8002,
+ "step": 8582
+ },
+ {
+ "epoch": 23.38692098092643,
+ "grad_norm": 7.473575115203857,
+ "learning_rate": 1.7898190027933785e-05,
+ "loss": 0.5423,
+ "step": 8583
+ },
+ {
+ "epoch": 23.38964577656676,
+ "grad_norm": 9.0474853515625,
+ "learning_rate": 1.78976487279284e-05,
+ "loss": 0.62,
+ "step": 8584
+ },
+ {
+ "epoch": 23.392370572207085,
+ "grad_norm": 7.830740928649902,
+ "learning_rate": 1.7897107366416378e-05,
+ "loss": 0.7531,
+ "step": 8585
+ },
+ {
+ "epoch": 23.39509536784741,
+ "grad_norm": 7.8416290283203125,
+ "learning_rate": 1.789656594340194e-05,
+ "loss": 0.6802,
+ "step": 8586
+ },
+ {
+ "epoch": 23.39782016348774,
+ "grad_norm": 8.996277809143066,
+ "learning_rate": 1.78960244588893e-05,
+ "loss": 0.5889,
+ "step": 8587
+ },
+ {
+ "epoch": 23.400544959128066,
+ "grad_norm": 8.558965682983398,
+ "learning_rate": 1.7895482912882673e-05,
+ "loss": 0.6445,
+ "step": 8588
+ },
+ {
+ "epoch": 23.40326975476839,
+ "grad_norm": 7.307924747467041,
+ "learning_rate": 1.7894941305386283e-05,
+ "loss": 0.7791,
+ "step": 8589
+ },
+ {
+ "epoch": 23.40599455040872,
+ "grad_norm": 10.23050594329834,
+ "learning_rate": 1.7894399636404344e-05,
+ "loss": 0.6134,
+ "step": 8590
+ },
+ {
+ "epoch": 23.408719346049047,
+ "grad_norm": 8.079825401306152,
+ "learning_rate": 1.7893857905941074e-05,
+ "loss": 0.7001,
+ "step": 8591
+ },
+ {
+ "epoch": 23.411444141689373,
+ "grad_norm": 9.503316879272461,
+ "learning_rate": 1.789331611400069e-05,
+ "loss": 0.7207,
+ "step": 8592
+ },
+ {
+ "epoch": 23.414168937329702,
+ "grad_norm": 7.8776021003723145,
+ "learning_rate": 1.789277426058742e-05,
+ "loss": 0.5166,
+ "step": 8593
+ },
+ {
+ "epoch": 23.416893732970028,
+ "grad_norm": 40.536216735839844,
+ "learning_rate": 1.7892232345705475e-05,
+ "loss": 0.7108,
+ "step": 8594
+ },
+ {
+ "epoch": 23.419618528610354,
+ "grad_norm": 7.9806718826293945,
+ "learning_rate": 1.7891690369359077e-05,
+ "loss": 0.6958,
+ "step": 8595
+ },
+ {
+ "epoch": 23.422343324250683,
+ "grad_norm": 8.904545783996582,
+ "learning_rate": 1.789114833155245e-05,
+ "loss": 0.8054,
+ "step": 8596
+ },
+ {
+ "epoch": 23.42506811989101,
+ "grad_norm": 9.127898216247559,
+ "learning_rate": 1.7890606232289815e-05,
+ "loss": 0.7883,
+ "step": 8597
+ },
+ {
+ "epoch": 23.427792915531334,
+ "grad_norm": 9.511321067810059,
+ "learning_rate": 1.789006407157539e-05,
+ "loss": 0.7177,
+ "step": 8598
+ },
+ {
+ "epoch": 23.430517711171664,
+ "grad_norm": 8.270140647888184,
+ "learning_rate": 1.78895218494134e-05,
+ "loss": 0.5883,
+ "step": 8599
+ },
+ {
+ "epoch": 23.43324250681199,
+ "grad_norm": 7.842483043670654,
+ "learning_rate": 1.788897956580807e-05,
+ "loss": 0.6144,
+ "step": 8600
+ },
+ {
+ "epoch": 23.435967302452315,
+ "grad_norm": 9.526908874511719,
+ "learning_rate": 1.7888437220763618e-05,
+ "loss": 0.7385,
+ "step": 8601
+ },
+ {
+ "epoch": 23.438692098092645,
+ "grad_norm": 8.789389610290527,
+ "learning_rate": 1.7887894814284274e-05,
+ "loss": 0.5989,
+ "step": 8602
+ },
+ {
+ "epoch": 23.44141689373297,
+ "grad_norm": 9.479100227355957,
+ "learning_rate": 1.7887352346374255e-05,
+ "loss": 0.6363,
+ "step": 8603
+ },
+ {
+ "epoch": 23.444141689373296,
+ "grad_norm": 8.337409019470215,
+ "learning_rate": 1.7886809817037797e-05,
+ "loss": 0.7091,
+ "step": 8604
+ },
+ {
+ "epoch": 23.446866485013626,
+ "grad_norm": 7.94667911529541,
+ "learning_rate": 1.7886267226279114e-05,
+ "loss": 0.714,
+ "step": 8605
+ },
+ {
+ "epoch": 23.44959128065395,
+ "grad_norm": 9.154091835021973,
+ "learning_rate": 1.788572457410243e-05,
+ "loss": 0.6265,
+ "step": 8606
+ },
+ {
+ "epoch": 23.452316076294277,
+ "grad_norm": 9.223176956176758,
+ "learning_rate": 1.7885181860511983e-05,
+ "loss": 0.702,
+ "step": 8607
+ },
+ {
+ "epoch": 23.455040871934607,
+ "grad_norm": 7.356810092926025,
+ "learning_rate": 1.7884639085511996e-05,
+ "loss": 0.6519,
+ "step": 8608
+ },
+ {
+ "epoch": 23.457765667574932,
+ "grad_norm": 8.943059921264648,
+ "learning_rate": 1.7884096249106687e-05,
+ "loss": 0.667,
+ "step": 8609
+ },
+ {
+ "epoch": 23.460490463215258,
+ "grad_norm": 9.221323013305664,
+ "learning_rate": 1.7883553351300292e-05,
+ "loss": 0.7407,
+ "step": 8610
+ },
+ {
+ "epoch": 23.463215258855588,
+ "grad_norm": 7.710006237030029,
+ "learning_rate": 1.788301039209704e-05,
+ "loss": 0.6475,
+ "step": 8611
+ },
+ {
+ "epoch": 23.465940054495913,
+ "grad_norm": 8.61248779296875,
+ "learning_rate": 1.7882467371501156e-05,
+ "loss": 0.6575,
+ "step": 8612
+ },
+ {
+ "epoch": 23.46866485013624,
+ "grad_norm": 7.137813568115234,
+ "learning_rate": 1.788192428951687e-05,
+ "loss": 0.6826,
+ "step": 8613
+ },
+ {
+ "epoch": 23.47138964577657,
+ "grad_norm": 7.6610212326049805,
+ "learning_rate": 1.788138114614841e-05,
+ "loss": 0.7191,
+ "step": 8614
+ },
+ {
+ "epoch": 23.474114441416894,
+ "grad_norm": 9.8787841796875,
+ "learning_rate": 1.7880837941400005e-05,
+ "loss": 0.7482,
+ "step": 8615
+ },
+ {
+ "epoch": 23.47683923705722,
+ "grad_norm": 6.708698749542236,
+ "learning_rate": 1.788029467527589e-05,
+ "loss": 0.7267,
+ "step": 8616
+ },
+ {
+ "epoch": 23.479564032697546,
+ "grad_norm": 6.205842971801758,
+ "learning_rate": 1.7879751347780297e-05,
+ "loss": 0.5804,
+ "step": 8617
+ },
+ {
+ "epoch": 23.482288828337875,
+ "grad_norm": 7.933350563049316,
+ "learning_rate": 1.7879207958917447e-05,
+ "loss": 0.5801,
+ "step": 8618
+ },
+ {
+ "epoch": 23.4850136239782,
+ "grad_norm": 9.49789047241211,
+ "learning_rate": 1.7878664508691586e-05,
+ "loss": 0.5733,
+ "step": 8619
+ },
+ {
+ "epoch": 23.48773841961853,
+ "grad_norm": 7.27047061920166,
+ "learning_rate": 1.7878120997106937e-05,
+ "loss": 0.546,
+ "step": 8620
+ },
+ {
+ "epoch": 23.490463215258856,
+ "grad_norm": 9.08828067779541,
+ "learning_rate": 1.7877577424167734e-05,
+ "loss": 0.5861,
+ "step": 8621
+ },
+ {
+ "epoch": 23.493188010899182,
+ "grad_norm": 7.885524272918701,
+ "learning_rate": 1.7877033789878212e-05,
+ "loss": 0.8145,
+ "step": 8622
+ },
+ {
+ "epoch": 23.495912806539508,
+ "grad_norm": 7.435037136077881,
+ "learning_rate": 1.7876490094242604e-05,
+ "loss": 0.7148,
+ "step": 8623
+ },
+ {
+ "epoch": 23.498637602179837,
+ "grad_norm": 7.90762996673584,
+ "learning_rate": 1.7875946337265143e-05,
+ "loss": 0.6532,
+ "step": 8624
+ },
+ {
+ "epoch": 23.501362397820163,
+ "grad_norm": 7.87869930267334,
+ "learning_rate": 1.787540251895007e-05,
+ "loss": 0.7826,
+ "step": 8625
+ },
+ {
+ "epoch": 23.504087193460492,
+ "grad_norm": 6.55080509185791,
+ "learning_rate": 1.7874858639301616e-05,
+ "loss": 0.6455,
+ "step": 8626
+ },
+ {
+ "epoch": 23.506811989100818,
+ "grad_norm": 8.975728034973145,
+ "learning_rate": 1.7874314698324012e-05,
+ "loss": 0.72,
+ "step": 8627
+ },
+ {
+ "epoch": 23.509536784741144,
+ "grad_norm": 10.967278480529785,
+ "learning_rate": 1.78737706960215e-05,
+ "loss": 0.7908,
+ "step": 8628
+ },
+ {
+ "epoch": 23.51226158038147,
+ "grad_norm": 8.755050659179688,
+ "learning_rate": 1.7873226632398317e-05,
+ "loss": 0.814,
+ "step": 8629
+ },
+ {
+ "epoch": 23.5149863760218,
+ "grad_norm": 8.059727668762207,
+ "learning_rate": 1.7872682507458696e-05,
+ "loss": 0.7316,
+ "step": 8630
+ },
+ {
+ "epoch": 23.517711171662125,
+ "grad_norm": 12.241052627563477,
+ "learning_rate": 1.7872138321206876e-05,
+ "loss": 0.6984,
+ "step": 8631
+ },
+ {
+ "epoch": 23.520435967302454,
+ "grad_norm": 9.974397659301758,
+ "learning_rate": 1.78715940736471e-05,
+ "loss": 0.6152,
+ "step": 8632
+ },
+ {
+ "epoch": 23.52316076294278,
+ "grad_norm": 8.978565216064453,
+ "learning_rate": 1.7871049764783598e-05,
+ "loss": 0.6549,
+ "step": 8633
+ },
+ {
+ "epoch": 23.525885558583106,
+ "grad_norm": 10.687780380249023,
+ "learning_rate": 1.7870505394620617e-05,
+ "loss": 0.6996,
+ "step": 8634
+ },
+ {
+ "epoch": 23.52861035422343,
+ "grad_norm": 7.585939884185791,
+ "learning_rate": 1.7869960963162395e-05,
+ "loss": 0.5245,
+ "step": 8635
+ },
+ {
+ "epoch": 23.53133514986376,
+ "grad_norm": 8.184713363647461,
+ "learning_rate": 1.7869416470413167e-05,
+ "loss": 0.6719,
+ "step": 8636
+ },
+ {
+ "epoch": 23.534059945504087,
+ "grad_norm": 9.080817222595215,
+ "learning_rate": 1.7868871916377178e-05,
+ "loss": 0.7789,
+ "step": 8637
+ },
+ {
+ "epoch": 23.536784741144416,
+ "grad_norm": 6.877401351928711,
+ "learning_rate": 1.7868327301058668e-05,
+ "loss": 0.5884,
+ "step": 8638
+ },
+ {
+ "epoch": 23.539509536784742,
+ "grad_norm": 7.515068531036377,
+ "learning_rate": 1.7867782624461877e-05,
+ "loss": 0.5229,
+ "step": 8639
+ },
+ {
+ "epoch": 23.542234332425068,
+ "grad_norm": 7.122920513153076,
+ "learning_rate": 1.786723788659105e-05,
+ "loss": 0.7167,
+ "step": 8640
+ },
+ {
+ "epoch": 23.544959128065393,
+ "grad_norm": 8.047174453735352,
+ "learning_rate": 1.7866693087450426e-05,
+ "loss": 0.6377,
+ "step": 8641
+ },
+ {
+ "epoch": 23.547683923705723,
+ "grad_norm": 7.259688377380371,
+ "learning_rate": 1.786614822704425e-05,
+ "loss": 0.6741,
+ "step": 8642
+ },
+ {
+ "epoch": 23.55040871934605,
+ "grad_norm": 7.659267425537109,
+ "learning_rate": 1.7865603305376765e-05,
+ "loss": 0.7208,
+ "step": 8643
+ },
+ {
+ "epoch": 23.553133514986374,
+ "grad_norm": 6.8070173263549805,
+ "learning_rate": 1.7865058322452214e-05,
+ "loss": 0.6266,
+ "step": 8644
+ },
+ {
+ "epoch": 23.555858310626704,
+ "grad_norm": 7.469305515289307,
+ "learning_rate": 1.7864513278274843e-05,
+ "loss": 0.7759,
+ "step": 8645
+ },
+ {
+ "epoch": 23.55858310626703,
+ "grad_norm": 8.908949851989746,
+ "learning_rate": 1.7863968172848897e-05,
+ "loss": 0.5837,
+ "step": 8646
+ },
+ {
+ "epoch": 23.561307901907355,
+ "grad_norm": 7.560341835021973,
+ "learning_rate": 1.7863423006178616e-05,
+ "loss": 0.6711,
+ "step": 8647
+ },
+ {
+ "epoch": 23.564032697547685,
+ "grad_norm": 7.590961933135986,
+ "learning_rate": 1.786287777826825e-05,
+ "loss": 0.6345,
+ "step": 8648
+ },
+ {
+ "epoch": 23.56675749318801,
+ "grad_norm": 8.51723861694336,
+ "learning_rate": 1.786233248912205e-05,
+ "loss": 0.5675,
+ "step": 8649
+ },
+ {
+ "epoch": 23.569482288828336,
+ "grad_norm": 8.561624526977539,
+ "learning_rate": 1.7861787138744254e-05,
+ "loss": 0.7284,
+ "step": 8650
+ },
+ {
+ "epoch": 23.572207084468666,
+ "grad_norm": 8.869158744812012,
+ "learning_rate": 1.7861241727139113e-05,
+ "loss": 0.812,
+ "step": 8651
+ },
+ {
+ "epoch": 23.57493188010899,
+ "grad_norm": 10.612920761108398,
+ "learning_rate": 1.7860696254310874e-05,
+ "loss": 0.6151,
+ "step": 8652
+ },
+ {
+ "epoch": 23.577656675749317,
+ "grad_norm": 8.31689453125,
+ "learning_rate": 1.7860150720263786e-05,
+ "loss": 0.601,
+ "step": 8653
+ },
+ {
+ "epoch": 23.580381471389646,
+ "grad_norm": 8.467896461486816,
+ "learning_rate": 1.7859605125002098e-05,
+ "loss": 0.5558,
+ "step": 8654
+ },
+ {
+ "epoch": 23.583106267029972,
+ "grad_norm": 7.422057628631592,
+ "learning_rate": 1.7859059468530055e-05,
+ "loss": 0.5573,
+ "step": 8655
+ },
+ {
+ "epoch": 23.585831062670298,
+ "grad_norm": 13.866622924804688,
+ "learning_rate": 1.7858513750851913e-05,
+ "loss": 0.8096,
+ "step": 8656
+ },
+ {
+ "epoch": 23.588555858310627,
+ "grad_norm": 8.810937881469727,
+ "learning_rate": 1.785796797197192e-05,
+ "loss": 0.6388,
+ "step": 8657
+ },
+ {
+ "epoch": 23.591280653950953,
+ "grad_norm": 6.7735090255737305,
+ "learning_rate": 1.7857422131894322e-05,
+ "loss": 0.7238,
+ "step": 8658
+ },
+ {
+ "epoch": 23.59400544959128,
+ "grad_norm": 8.533026695251465,
+ "learning_rate": 1.7856876230623374e-05,
+ "loss": 0.6313,
+ "step": 8659
+ },
+ {
+ "epoch": 23.59673024523161,
+ "grad_norm": 7.0363922119140625,
+ "learning_rate": 1.785633026816333e-05,
+ "loss": 0.5979,
+ "step": 8660
+ },
+ {
+ "epoch": 23.599455040871934,
+ "grad_norm": 8.589900970458984,
+ "learning_rate": 1.7855784244518434e-05,
+ "loss": 0.5581,
+ "step": 8661
+ },
+ {
+ "epoch": 23.60217983651226,
+ "grad_norm": 7.23314905166626,
+ "learning_rate": 1.7855238159692943e-05,
+ "loss": 0.5594,
+ "step": 8662
+ },
+ {
+ "epoch": 23.60490463215259,
+ "grad_norm": 6.846451282501221,
+ "learning_rate": 1.7854692013691114e-05,
+ "loss": 0.6437,
+ "step": 8663
+ },
+ {
+ "epoch": 23.607629427792915,
+ "grad_norm": 15.448397636413574,
+ "learning_rate": 1.7854145806517195e-05,
+ "loss": 0.6333,
+ "step": 8664
+ },
+ {
+ "epoch": 23.61035422343324,
+ "grad_norm": 9.071206092834473,
+ "learning_rate": 1.7853599538175443e-05,
+ "loss": 0.6938,
+ "step": 8665
+ },
+ {
+ "epoch": 23.61307901907357,
+ "grad_norm": 9.376893997192383,
+ "learning_rate": 1.785305320867011e-05,
+ "loss": 0.6271,
+ "step": 8666
+ },
+ {
+ "epoch": 23.615803814713896,
+ "grad_norm": 7.037196159362793,
+ "learning_rate": 1.785250681800545e-05,
+ "loss": 0.5181,
+ "step": 8667
+ },
+ {
+ "epoch": 23.618528610354222,
+ "grad_norm": 7.3704376220703125,
+ "learning_rate": 1.7851960366185718e-05,
+ "loss": 0.6652,
+ "step": 8668
+ },
+ {
+ "epoch": 23.62125340599455,
+ "grad_norm": 8.9699125289917,
+ "learning_rate": 1.7851413853215175e-05,
+ "loss": 0.7029,
+ "step": 8669
+ },
+ {
+ "epoch": 23.623978201634877,
+ "grad_norm": 9.074806213378906,
+ "learning_rate": 1.785086727909807e-05,
+ "loss": 0.733,
+ "step": 8670
+ },
+ {
+ "epoch": 23.626702997275203,
+ "grad_norm": 7.657893657684326,
+ "learning_rate": 1.7850320643838666e-05,
+ "loss": 0.597,
+ "step": 8671
+ },
+ {
+ "epoch": 23.629427792915532,
+ "grad_norm": 7.139098167419434,
+ "learning_rate": 1.7849773947441215e-05,
+ "loss": 0.6231,
+ "step": 8672
+ },
+ {
+ "epoch": 23.632152588555858,
+ "grad_norm": 8.690154075622559,
+ "learning_rate": 1.784922718990998e-05,
+ "loss": 0.6373,
+ "step": 8673
+ },
+ {
+ "epoch": 23.634877384196184,
+ "grad_norm": 7.496939182281494,
+ "learning_rate": 1.7848680371249214e-05,
+ "loss": 0.6178,
+ "step": 8674
+ },
+ {
+ "epoch": 23.637602179836513,
+ "grad_norm": 10.386566162109375,
+ "learning_rate": 1.7848133491463176e-05,
+ "loss": 0.7594,
+ "step": 8675
+ },
+ {
+ "epoch": 23.64032697547684,
+ "grad_norm": 7.76467752456665,
+ "learning_rate": 1.7847586550556132e-05,
+ "loss": 0.6033,
+ "step": 8676
+ },
+ {
+ "epoch": 23.643051771117165,
+ "grad_norm": 7.715465068817139,
+ "learning_rate": 1.7847039548532333e-05,
+ "loss": 0.7561,
+ "step": 8677
+ },
+ {
+ "epoch": 23.645776566757494,
+ "grad_norm": 8.637248039245605,
+ "learning_rate": 1.7846492485396046e-05,
+ "loss": 0.6965,
+ "step": 8678
+ },
+ {
+ "epoch": 23.64850136239782,
+ "grad_norm": 8.032029151916504,
+ "learning_rate": 1.7845945361151526e-05,
+ "loss": 0.7462,
+ "step": 8679
+ },
+ {
+ "epoch": 23.651226158038146,
+ "grad_norm": 8.577354431152344,
+ "learning_rate": 1.7845398175803035e-05,
+ "loss": 0.792,
+ "step": 8680
+ },
+ {
+ "epoch": 23.653950953678475,
+ "grad_norm": 8.476625442504883,
+ "learning_rate": 1.7844850929354835e-05,
+ "loss": 0.7145,
+ "step": 8681
+ },
+ {
+ "epoch": 23.6566757493188,
+ "grad_norm": 9.123308181762695,
+ "learning_rate": 1.784430362181119e-05,
+ "loss": 0.7391,
+ "step": 8682
+ },
+ {
+ "epoch": 23.659400544959126,
+ "grad_norm": 8.435811996459961,
+ "learning_rate": 1.7843756253176362e-05,
+ "loss": 0.6026,
+ "step": 8683
+ },
+ {
+ "epoch": 23.662125340599456,
+ "grad_norm": 9.569748878479004,
+ "learning_rate": 1.784320882345461e-05,
+ "loss": 0.7577,
+ "step": 8684
+ },
+ {
+ "epoch": 23.66485013623978,
+ "grad_norm": 7.912408828735352,
+ "learning_rate": 1.7842661332650202e-05,
+ "loss": 0.8336,
+ "step": 8685
+ },
+ {
+ "epoch": 23.667574931880107,
+ "grad_norm": 8.150311470031738,
+ "learning_rate": 1.78421137807674e-05,
+ "loss": 0.5372,
+ "step": 8686
+ },
+ {
+ "epoch": 23.670299727520437,
+ "grad_norm": 6.968649864196777,
+ "learning_rate": 1.7841566167810467e-05,
+ "loss": 0.521,
+ "step": 8687
+ },
+ {
+ "epoch": 23.673024523160763,
+ "grad_norm": 6.817625045776367,
+ "learning_rate": 1.784101849378367e-05,
+ "loss": 0.6313,
+ "step": 8688
+ },
+ {
+ "epoch": 23.67574931880109,
+ "grad_norm": 7.390740871429443,
+ "learning_rate": 1.7840470758691274e-05,
+ "loss": 0.6503,
+ "step": 8689
+ },
+ {
+ "epoch": 23.678474114441418,
+ "grad_norm": 8.48143482208252,
+ "learning_rate": 1.7839922962537543e-05,
+ "loss": 0.6953,
+ "step": 8690
+ },
+ {
+ "epoch": 23.681198910081743,
+ "grad_norm": 9.579242706298828,
+ "learning_rate": 1.7839375105326743e-05,
+ "loss": 0.8687,
+ "step": 8691
+ },
+ {
+ "epoch": 23.68392370572207,
+ "grad_norm": 7.510007381439209,
+ "learning_rate": 1.7838827187063144e-05,
+ "loss": 0.6313,
+ "step": 8692
+ },
+ {
+ "epoch": 23.6866485013624,
+ "grad_norm": 8.059843063354492,
+ "learning_rate": 1.7838279207751013e-05,
+ "loss": 0.5894,
+ "step": 8693
+ },
+ {
+ "epoch": 23.689373297002724,
+ "grad_norm": 7.011054992675781,
+ "learning_rate": 1.7837731167394614e-05,
+ "loss": 0.7607,
+ "step": 8694
+ },
+ {
+ "epoch": 23.69209809264305,
+ "grad_norm": 9.017129898071289,
+ "learning_rate": 1.7837183065998215e-05,
+ "loss": 0.6663,
+ "step": 8695
+ },
+ {
+ "epoch": 23.69482288828338,
+ "grad_norm": 8.130972862243652,
+ "learning_rate": 1.783663490356609e-05,
+ "loss": 1.0414,
+ "step": 8696
+ },
+ {
+ "epoch": 23.697547683923705,
+ "grad_norm": 10.18790340423584,
+ "learning_rate": 1.78360866801025e-05,
+ "loss": 0.787,
+ "step": 8697
+ },
+ {
+ "epoch": 23.70027247956403,
+ "grad_norm": 8.673542976379395,
+ "learning_rate": 1.783553839561172e-05,
+ "loss": 0.5428,
+ "step": 8698
+ },
+ {
+ "epoch": 23.70299727520436,
+ "grad_norm": 8.38430118560791,
+ "learning_rate": 1.7834990050098025e-05,
+ "loss": 0.8124,
+ "step": 8699
+ },
+ {
+ "epoch": 23.705722070844686,
+ "grad_norm": 8.579794883728027,
+ "learning_rate": 1.7834441643565674e-05,
+ "loss": 0.5999,
+ "step": 8700
+ },
+ {
+ "epoch": 23.708446866485012,
+ "grad_norm": 8.432461738586426,
+ "learning_rate": 1.7833893176018945e-05,
+ "loss": 0.7352,
+ "step": 8701
+ },
+ {
+ "epoch": 23.71117166212534,
+ "grad_norm": 10.682052612304688,
+ "learning_rate": 1.7833344647462106e-05,
+ "loss": 0.6133,
+ "step": 8702
+ },
+ {
+ "epoch": 23.713896457765667,
+ "grad_norm": 8.271554946899414,
+ "learning_rate": 1.7832796057899434e-05,
+ "loss": 0.6321,
+ "step": 8703
+ },
+ {
+ "epoch": 23.716621253405993,
+ "grad_norm": 7.847799301147461,
+ "learning_rate": 1.7832247407335197e-05,
+ "loss": 0.6888,
+ "step": 8704
+ },
+ {
+ "epoch": 23.719346049046322,
+ "grad_norm": 7.223616600036621,
+ "learning_rate": 1.783169869577367e-05,
+ "loss": 0.6458,
+ "step": 8705
+ },
+ {
+ "epoch": 23.722070844686648,
+ "grad_norm": 7.0132904052734375,
+ "learning_rate": 1.7831149923219126e-05,
+ "loss": 0.7334,
+ "step": 8706
+ },
+ {
+ "epoch": 23.724795640326974,
+ "grad_norm": 8.604496002197266,
+ "learning_rate": 1.783060108967584e-05,
+ "loss": 0.6483,
+ "step": 8707
+ },
+ {
+ "epoch": 23.727520435967303,
+ "grad_norm": 6.9799652099609375,
+ "learning_rate": 1.7830052195148083e-05,
+ "loss": 0.7627,
+ "step": 8708
+ },
+ {
+ "epoch": 23.73024523160763,
+ "grad_norm": 6.896748065948486,
+ "learning_rate": 1.782950323964013e-05,
+ "loss": 0.5499,
+ "step": 8709
+ },
+ {
+ "epoch": 23.732970027247955,
+ "grad_norm": 9.566889762878418,
+ "learning_rate": 1.7828954223156257e-05,
+ "loss": 0.6467,
+ "step": 8710
+ },
+ {
+ "epoch": 23.735694822888284,
+ "grad_norm": 7.210999965667725,
+ "learning_rate": 1.7828405145700743e-05,
+ "loss": 0.6013,
+ "step": 8711
+ },
+ {
+ "epoch": 23.73841961852861,
+ "grad_norm": 10.314238548278809,
+ "learning_rate": 1.7827856007277865e-05,
+ "loss": 0.6503,
+ "step": 8712
+ },
+ {
+ "epoch": 23.741144414168936,
+ "grad_norm": 9.22961711883545,
+ "learning_rate": 1.782730680789189e-05,
+ "loss": 0.7363,
+ "step": 8713
+ },
+ {
+ "epoch": 23.743869209809265,
+ "grad_norm": 9.406926155090332,
+ "learning_rate": 1.78267575475471e-05,
+ "loss": 0.6622,
+ "step": 8714
+ },
+ {
+ "epoch": 23.74659400544959,
+ "grad_norm": 8.926714897155762,
+ "learning_rate": 1.7826208226247783e-05,
+ "loss": 0.6537,
+ "step": 8715
+ },
+ {
+ "epoch": 23.749318801089917,
+ "grad_norm": 9.726031303405762,
+ "learning_rate": 1.78256588439982e-05,
+ "loss": 0.567,
+ "step": 8716
+ },
+ {
+ "epoch": 23.752043596730246,
+ "grad_norm": 8.517714500427246,
+ "learning_rate": 1.7825109400802643e-05,
+ "loss": 0.77,
+ "step": 8717
+ },
+ {
+ "epoch": 23.754768392370572,
+ "grad_norm": 7.61201286315918,
+ "learning_rate": 1.7824559896665385e-05,
+ "loss": 0.6111,
+ "step": 8718
+ },
+ {
+ "epoch": 23.757493188010898,
+ "grad_norm": 8.55817985534668,
+ "learning_rate": 1.7824010331590703e-05,
+ "loss": 0.5581,
+ "step": 8719
+ },
+ {
+ "epoch": 23.760217983651227,
+ "grad_norm": 8.823881149291992,
+ "learning_rate": 1.7823460705582884e-05,
+ "loss": 0.6625,
+ "step": 8720
+ },
+ {
+ "epoch": 23.762942779291553,
+ "grad_norm": 7.473922252655029,
+ "learning_rate": 1.7822911018646202e-05,
+ "loss": 0.5093,
+ "step": 8721
+ },
+ {
+ "epoch": 23.76566757493188,
+ "grad_norm": 7.682458877563477,
+ "learning_rate": 1.782236127078494e-05,
+ "loss": 0.6854,
+ "step": 8722
+ },
+ {
+ "epoch": 23.768392370572208,
+ "grad_norm": 8.417536735534668,
+ "learning_rate": 1.7821811462003387e-05,
+ "loss": 0.6559,
+ "step": 8723
+ },
+ {
+ "epoch": 23.771117166212534,
+ "grad_norm": 8.51427173614502,
+ "learning_rate": 1.782126159230581e-05,
+ "loss": 0.6233,
+ "step": 8724
+ },
+ {
+ "epoch": 23.77384196185286,
+ "grad_norm": 8.760787963867188,
+ "learning_rate": 1.7820711661696504e-05,
+ "loss": 0.7046,
+ "step": 8725
+ },
+ {
+ "epoch": 23.77656675749319,
+ "grad_norm": 8.030685424804688,
+ "learning_rate": 1.7820161670179748e-05,
+ "loss": 0.6956,
+ "step": 8726
+ },
+ {
+ "epoch": 23.779291553133515,
+ "grad_norm": 8.65029239654541,
+ "learning_rate": 1.7819611617759826e-05,
+ "loss": 0.631,
+ "step": 8727
+ },
+ {
+ "epoch": 23.78201634877384,
+ "grad_norm": 7.661012649536133,
+ "learning_rate": 1.7819061504441016e-05,
+ "loss": 0.6351,
+ "step": 8728
+ },
+ {
+ "epoch": 23.78474114441417,
+ "grad_norm": 7.802098751068115,
+ "learning_rate": 1.7818511330227604e-05,
+ "loss": 0.7091,
+ "step": 8729
+ },
+ {
+ "epoch": 23.787465940054496,
+ "grad_norm": 8.589938163757324,
+ "learning_rate": 1.7817961095123885e-05,
+ "loss": 0.7041,
+ "step": 8730
+ },
+ {
+ "epoch": 23.79019073569482,
+ "grad_norm": 8.099030494689941,
+ "learning_rate": 1.7817410799134133e-05,
+ "loss": 0.8079,
+ "step": 8731
+ },
+ {
+ "epoch": 23.79291553133515,
+ "grad_norm": 10.787029266357422,
+ "learning_rate": 1.7816860442262637e-05,
+ "loss": 0.6957,
+ "step": 8732
+ },
+ {
+ "epoch": 23.795640326975477,
+ "grad_norm": 9.628156661987305,
+ "learning_rate": 1.781631002451368e-05,
+ "loss": 0.6896,
+ "step": 8733
+ },
+ {
+ "epoch": 23.798365122615802,
+ "grad_norm": 8.368080139160156,
+ "learning_rate": 1.7815759545891556e-05,
+ "loss": 0.6821,
+ "step": 8734
+ },
+ {
+ "epoch": 23.80108991825613,
+ "grad_norm": 7.77903938293457,
+ "learning_rate": 1.781520900640055e-05,
+ "loss": 0.5994,
+ "step": 8735
+ },
+ {
+ "epoch": 23.803814713896458,
+ "grad_norm": 8.866826057434082,
+ "learning_rate": 1.7814658406044948e-05,
+ "loss": 0.7404,
+ "step": 8736
+ },
+ {
+ "epoch": 23.806539509536783,
+ "grad_norm": 9.506380081176758,
+ "learning_rate": 1.7814107744829036e-05,
+ "loss": 0.7247,
+ "step": 8737
+ },
+ {
+ "epoch": 23.809264305177113,
+ "grad_norm": 13.592761993408203,
+ "learning_rate": 1.7813557022757103e-05,
+ "loss": 0.7326,
+ "step": 8738
+ },
+ {
+ "epoch": 23.81198910081744,
+ "grad_norm": 9.544055938720703,
+ "learning_rate": 1.781300623983344e-05,
+ "loss": 0.5842,
+ "step": 8739
+ },
+ {
+ "epoch": 23.814713896457764,
+ "grad_norm": 7.893803596496582,
+ "learning_rate": 1.7812455396062336e-05,
+ "loss": 0.6718,
+ "step": 8740
+ },
+ {
+ "epoch": 23.817438692098094,
+ "grad_norm": 8.230522155761719,
+ "learning_rate": 1.781190449144808e-05,
+ "loss": 0.6367,
+ "step": 8741
+ },
+ {
+ "epoch": 23.82016348773842,
+ "grad_norm": 8.57618522644043,
+ "learning_rate": 1.7811353525994967e-05,
+ "loss": 0.6167,
+ "step": 8742
+ },
+ {
+ "epoch": 23.822888283378745,
+ "grad_norm": 9.646374702453613,
+ "learning_rate": 1.781080249970728e-05,
+ "loss": 0.7092,
+ "step": 8743
+ },
+ {
+ "epoch": 23.825613079019075,
+ "grad_norm": 8.21642017364502,
+ "learning_rate": 1.7810251412589315e-05,
+ "loss": 0.6303,
+ "step": 8744
+ },
+ {
+ "epoch": 23.8283378746594,
+ "grad_norm": 8.2904052734375,
+ "learning_rate": 1.7809700264645365e-05,
+ "loss": 0.7354,
+ "step": 8745
+ },
+ {
+ "epoch": 23.831062670299726,
+ "grad_norm": 8.364733695983887,
+ "learning_rate": 1.780914905587972e-05,
+ "loss": 0.7319,
+ "step": 8746
+ },
+ {
+ "epoch": 23.833787465940055,
+ "grad_norm": 8.430075645446777,
+ "learning_rate": 1.7808597786296673e-05,
+ "loss": 0.596,
+ "step": 8747
+ },
+ {
+ "epoch": 23.83651226158038,
+ "grad_norm": 8.242403030395508,
+ "learning_rate": 1.7808046455900517e-05,
+ "loss": 0.696,
+ "step": 8748
+ },
+ {
+ "epoch": 23.839237057220707,
+ "grad_norm": 8.332865715026855,
+ "learning_rate": 1.780749506469555e-05,
+ "loss": 0.7371,
+ "step": 8749
+ },
+ {
+ "epoch": 23.841961852861036,
+ "grad_norm": 7.8866400718688965,
+ "learning_rate": 1.7806943612686058e-05,
+ "loss": 0.6669,
+ "step": 8750
+ },
+ {
+ "epoch": 23.844686648501362,
+ "grad_norm": 6.825740337371826,
+ "learning_rate": 1.7806392099876343e-05,
+ "loss": 0.6196,
+ "step": 8751
+ },
+ {
+ "epoch": 23.847411444141688,
+ "grad_norm": 13.025237083435059,
+ "learning_rate": 1.78058405262707e-05,
+ "loss": 0.7921,
+ "step": 8752
+ },
+ {
+ "epoch": 23.850136239782017,
+ "grad_norm": 6.44904088973999,
+ "learning_rate": 1.780528889187342e-05,
+ "loss": 0.7094,
+ "step": 8753
+ },
+ {
+ "epoch": 23.852861035422343,
+ "grad_norm": 8.157832145690918,
+ "learning_rate": 1.78047371966888e-05,
+ "loss": 0.6033,
+ "step": 8754
+ },
+ {
+ "epoch": 23.85558583106267,
+ "grad_norm": 9.57671070098877,
+ "learning_rate": 1.7804185440721136e-05,
+ "loss": 0.5122,
+ "step": 8755
+ },
+ {
+ "epoch": 23.858310626703,
+ "grad_norm": 9.046643257141113,
+ "learning_rate": 1.7803633623974732e-05,
+ "loss": 0.6341,
+ "step": 8756
+ },
+ {
+ "epoch": 23.861035422343324,
+ "grad_norm": 8.198485374450684,
+ "learning_rate": 1.7803081746453877e-05,
+ "loss": 0.5378,
+ "step": 8757
+ },
+ {
+ "epoch": 23.86376021798365,
+ "grad_norm": 7.1689043045043945,
+ "learning_rate": 1.7802529808162877e-05,
+ "loss": 0.6439,
+ "step": 8758
+ },
+ {
+ "epoch": 23.86648501362398,
+ "grad_norm": 7.593871116638184,
+ "learning_rate": 1.7801977809106024e-05,
+ "loss": 0.787,
+ "step": 8759
+ },
+ {
+ "epoch": 23.869209809264305,
+ "grad_norm": 8.279637336730957,
+ "learning_rate": 1.7801425749287616e-05,
+ "loss": 0.7444,
+ "step": 8760
+ },
+ {
+ "epoch": 23.87193460490463,
+ "grad_norm": 10.108986854553223,
+ "learning_rate": 1.7800873628711957e-05,
+ "loss": 0.7656,
+ "step": 8761
+ },
+ {
+ "epoch": 23.87465940054496,
+ "grad_norm": 14.299032211303711,
+ "learning_rate": 1.7800321447383345e-05,
+ "loss": 0.9197,
+ "step": 8762
+ },
+ {
+ "epoch": 23.877384196185286,
+ "grad_norm": 6.564296722412109,
+ "learning_rate": 1.7799769205306082e-05,
+ "loss": 0.7238,
+ "step": 8763
+ },
+ {
+ "epoch": 23.88010899182561,
+ "grad_norm": 8.50287914276123,
+ "learning_rate": 1.7799216902484465e-05,
+ "loss": 0.5895,
+ "step": 8764
+ },
+ {
+ "epoch": 23.88283378746594,
+ "grad_norm": 7.999722480773926,
+ "learning_rate": 1.77986645389228e-05,
+ "loss": 0.5835,
+ "step": 8765
+ },
+ {
+ "epoch": 23.885558583106267,
+ "grad_norm": 7.00806188583374,
+ "learning_rate": 1.7798112114625385e-05,
+ "loss": 0.8248,
+ "step": 8766
+ },
+ {
+ "epoch": 23.888283378746593,
+ "grad_norm": 8.394281387329102,
+ "learning_rate": 1.7797559629596525e-05,
+ "loss": 0.6644,
+ "step": 8767
+ },
+ {
+ "epoch": 23.891008174386922,
+ "grad_norm": 7.199811935424805,
+ "learning_rate": 1.7797007083840522e-05,
+ "loss": 0.7495,
+ "step": 8768
+ },
+ {
+ "epoch": 23.893732970027248,
+ "grad_norm": 8.760477066040039,
+ "learning_rate": 1.7796454477361676e-05,
+ "loss": 0.7896,
+ "step": 8769
+ },
+ {
+ "epoch": 23.896457765667574,
+ "grad_norm": 7.498642444610596,
+ "learning_rate": 1.7795901810164296e-05,
+ "loss": 0.6012,
+ "step": 8770
+ },
+ {
+ "epoch": 23.899182561307903,
+ "grad_norm": 7.29533052444458,
+ "learning_rate": 1.7795349082252686e-05,
+ "loss": 0.6757,
+ "step": 8771
+ },
+ {
+ "epoch": 23.90190735694823,
+ "grad_norm": 11.376025199890137,
+ "learning_rate": 1.7794796293631144e-05,
+ "loss": 0.7375,
+ "step": 8772
+ },
+ {
+ "epoch": 23.904632152588555,
+ "grad_norm": 9.86885929107666,
+ "learning_rate": 1.779424344430398e-05,
+ "loss": 0.653,
+ "step": 8773
+ },
+ {
+ "epoch": 23.907356948228884,
+ "grad_norm": 7.98117733001709,
+ "learning_rate": 1.77936905342755e-05,
+ "loss": 0.6324,
+ "step": 8774
+ },
+ {
+ "epoch": 23.91008174386921,
+ "grad_norm": 9.175762176513672,
+ "learning_rate": 1.7793137563550006e-05,
+ "loss": 0.6484,
+ "step": 8775
+ },
+ {
+ "epoch": 23.912806539509535,
+ "grad_norm": 9.684450149536133,
+ "learning_rate": 1.7792584532131813e-05,
+ "loss": 0.6616,
+ "step": 8776
+ },
+ {
+ "epoch": 23.915531335149865,
+ "grad_norm": 9.040603637695312,
+ "learning_rate": 1.779203144002522e-05,
+ "loss": 0.7095,
+ "step": 8777
+ },
+ {
+ "epoch": 23.91825613079019,
+ "grad_norm": 8.966569900512695,
+ "learning_rate": 1.7791478287234534e-05,
+ "loss": 0.6418,
+ "step": 8778
+ },
+ {
+ "epoch": 23.920980926430516,
+ "grad_norm": 9.191880226135254,
+ "learning_rate": 1.779092507376407e-05,
+ "loss": 0.7317,
+ "step": 8779
+ },
+ {
+ "epoch": 23.923705722070846,
+ "grad_norm": 6.665855407714844,
+ "learning_rate": 1.779037179961813e-05,
+ "loss": 0.678,
+ "step": 8780
+ },
+ {
+ "epoch": 23.92643051771117,
+ "grad_norm": 10.758771896362305,
+ "learning_rate": 1.7789818464801025e-05,
+ "loss": 0.7538,
+ "step": 8781
+ },
+ {
+ "epoch": 23.929155313351497,
+ "grad_norm": 8.288837432861328,
+ "learning_rate": 1.7789265069317067e-05,
+ "loss": 0.649,
+ "step": 8782
+ },
+ {
+ "epoch": 23.931880108991827,
+ "grad_norm": 8.446208000183105,
+ "learning_rate": 1.778871161317056e-05,
+ "loss": 0.6255,
+ "step": 8783
+ },
+ {
+ "epoch": 23.934604904632153,
+ "grad_norm": 10.18574047088623,
+ "learning_rate": 1.778815809636582e-05,
+ "loss": 0.6509,
+ "step": 8784
+ },
+ {
+ "epoch": 23.93732970027248,
+ "grad_norm": 7.808631420135498,
+ "learning_rate": 1.7787604518907152e-05,
+ "loss": 0.8768,
+ "step": 8785
+ },
+ {
+ "epoch": 23.940054495912808,
+ "grad_norm": 8.451011657714844,
+ "learning_rate": 1.7787050880798877e-05,
+ "loss": 0.6985,
+ "step": 8786
+ },
+ {
+ "epoch": 23.942779291553133,
+ "grad_norm": 10.8347749710083,
+ "learning_rate": 1.7786497182045295e-05,
+ "loss": 0.7277,
+ "step": 8787
+ },
+ {
+ "epoch": 23.94550408719346,
+ "grad_norm": 8.061737060546875,
+ "learning_rate": 1.7785943422650724e-05,
+ "loss": 0.5524,
+ "step": 8788
+ },
+ {
+ "epoch": 23.94822888283379,
+ "grad_norm": 10.186460494995117,
+ "learning_rate": 1.7785389602619477e-05,
+ "loss": 0.6448,
+ "step": 8789
+ },
+ {
+ "epoch": 23.950953678474114,
+ "grad_norm": 9.940427780151367,
+ "learning_rate": 1.7784835721955866e-05,
+ "loss": 0.6981,
+ "step": 8790
+ },
+ {
+ "epoch": 23.95367847411444,
+ "grad_norm": 8.110967636108398,
+ "learning_rate": 1.778428178066421e-05,
+ "loss": 0.7357,
+ "step": 8791
+ },
+ {
+ "epoch": 23.95640326975477,
+ "grad_norm": 8.784134864807129,
+ "learning_rate": 1.778372777874881e-05,
+ "loss": 0.6589,
+ "step": 8792
+ },
+ {
+ "epoch": 23.959128065395095,
+ "grad_norm": 8.895995140075684,
+ "learning_rate": 1.7783173716213996e-05,
+ "loss": 0.6352,
+ "step": 8793
+ },
+ {
+ "epoch": 23.96185286103542,
+ "grad_norm": 8.353736877441406,
+ "learning_rate": 1.778261959306407e-05,
+ "loss": 0.7448,
+ "step": 8794
+ },
+ {
+ "epoch": 23.96457765667575,
+ "grad_norm": 7.859174728393555,
+ "learning_rate": 1.7782065409303354e-05,
+ "loss": 0.6858,
+ "step": 8795
+ },
+ {
+ "epoch": 23.967302452316076,
+ "grad_norm": 6.824813365936279,
+ "learning_rate": 1.7781511164936166e-05,
+ "loss": 0.5969,
+ "step": 8796
+ },
+ {
+ "epoch": 23.970027247956402,
+ "grad_norm": 7.503294467926025,
+ "learning_rate": 1.7780956859966816e-05,
+ "loss": 0.5964,
+ "step": 8797
+ },
+ {
+ "epoch": 23.97275204359673,
+ "grad_norm": 16.265262603759766,
+ "learning_rate": 1.7780402494399625e-05,
+ "loss": 0.6479,
+ "step": 8798
+ },
+ {
+ "epoch": 23.975476839237057,
+ "grad_norm": 10.838225364685059,
+ "learning_rate": 1.777984806823891e-05,
+ "loss": 0.9917,
+ "step": 8799
+ },
+ {
+ "epoch": 23.978201634877383,
+ "grad_norm": 8.561009407043457,
+ "learning_rate": 1.777929358148899e-05,
+ "loss": 0.5197,
+ "step": 8800
+ },
+ {
+ "epoch": 23.980926430517712,
+ "grad_norm": 7.6468000411987305,
+ "learning_rate": 1.777873903415418e-05,
+ "loss": 0.6396,
+ "step": 8801
+ },
+ {
+ "epoch": 23.983651226158038,
+ "grad_norm": 8.598393440246582,
+ "learning_rate": 1.7778184426238805e-05,
+ "loss": 0.7515,
+ "step": 8802
+ },
+ {
+ "epoch": 23.986376021798364,
+ "grad_norm": 8.6475248336792,
+ "learning_rate": 1.7777629757747177e-05,
+ "loss": 0.7531,
+ "step": 8803
+ },
+ {
+ "epoch": 23.989100817438693,
+ "grad_norm": 9.719010353088379,
+ "learning_rate": 1.7777075028683617e-05,
+ "loss": 0.5279,
+ "step": 8804
+ },
+ {
+ "epoch": 23.99182561307902,
+ "grad_norm": 6.662492275238037,
+ "learning_rate": 1.7776520239052447e-05,
+ "loss": 0.6635,
+ "step": 8805
+ },
+ {
+ "epoch": 23.994550408719345,
+ "grad_norm": 9.058082580566406,
+ "learning_rate": 1.777596538885799e-05,
+ "loss": 0.7446,
+ "step": 8806
+ },
+ {
+ "epoch": 23.997275204359674,
+ "grad_norm": 11.454946517944336,
+ "learning_rate": 1.7775410478104566e-05,
+ "loss": 0.7344,
+ "step": 8807
+ },
+ {
+ "epoch": 24.0,
+ "grad_norm": 7.274345397949219,
+ "learning_rate": 1.7774855506796497e-05,
+ "loss": 0.6438,
+ "step": 8808
+ },
+ {
+ "epoch": 24.002724795640326,
+ "grad_norm": 9.180956840515137,
+ "learning_rate": 1.77743004749381e-05,
+ "loss": 0.7663,
+ "step": 8809
+ },
+ {
+ "epoch": 24.005449591280655,
+ "grad_norm": 9.361931800842285,
+ "learning_rate": 1.77737453825337e-05,
+ "loss": 0.5725,
+ "step": 8810
+ },
+ {
+ "epoch": 24.00817438692098,
+ "grad_norm": 13.765742301940918,
+ "learning_rate": 1.7773190229587624e-05,
+ "loss": 0.6661,
+ "step": 8811
+ },
+ {
+ "epoch": 24.010899182561307,
+ "grad_norm": 7.7954325675964355,
+ "learning_rate": 1.777263501610419e-05,
+ "loss": 0.5587,
+ "step": 8812
+ },
+ {
+ "epoch": 24.013623978201636,
+ "grad_norm": 9.439408302307129,
+ "learning_rate": 1.7772079742087728e-05,
+ "loss": 0.5846,
+ "step": 8813
+ },
+ {
+ "epoch": 24.016348773841962,
+ "grad_norm": 8.322379112243652,
+ "learning_rate": 1.7771524407542557e-05,
+ "loss": 0.4714,
+ "step": 8814
+ },
+ {
+ "epoch": 24.019073569482288,
+ "grad_norm": 9.102412223815918,
+ "learning_rate": 1.7770969012473002e-05,
+ "loss": 0.5491,
+ "step": 8815
+ },
+ {
+ "epoch": 24.021798365122617,
+ "grad_norm": 7.189291954040527,
+ "learning_rate": 1.777041355688339e-05,
+ "loss": 0.5874,
+ "step": 8816
+ },
+ {
+ "epoch": 24.024523160762943,
+ "grad_norm": 8.017959594726562,
+ "learning_rate": 1.7769858040778052e-05,
+ "loss": 0.5565,
+ "step": 8817
+ },
+ {
+ "epoch": 24.02724795640327,
+ "grad_norm": 7.578139305114746,
+ "learning_rate": 1.7769302464161307e-05,
+ "loss": 0.606,
+ "step": 8818
+ },
+ {
+ "epoch": 24.029972752043598,
+ "grad_norm": 8.187880516052246,
+ "learning_rate": 1.7768746827037485e-05,
+ "loss": 0.8091,
+ "step": 8819
+ },
+ {
+ "epoch": 24.032697547683924,
+ "grad_norm": 11.661108016967773,
+ "learning_rate": 1.7768191129410913e-05,
+ "loss": 0.5452,
+ "step": 8820
+ },
+ {
+ "epoch": 24.03542234332425,
+ "grad_norm": 7.239599227905273,
+ "learning_rate": 1.776763537128592e-05,
+ "loss": 0.7075,
+ "step": 8821
+ },
+ {
+ "epoch": 24.03814713896458,
+ "grad_norm": 6.680261135101318,
+ "learning_rate": 1.7767079552666827e-05,
+ "loss": 0.641,
+ "step": 8822
+ },
+ {
+ "epoch": 24.040871934604905,
+ "grad_norm": 6.787194728851318,
+ "learning_rate": 1.7766523673557973e-05,
+ "loss": 0.5983,
+ "step": 8823
+ },
+ {
+ "epoch": 24.04359673024523,
+ "grad_norm": 7.517077445983887,
+ "learning_rate": 1.7765967733963683e-05,
+ "loss": 0.7063,
+ "step": 8824
+ },
+ {
+ "epoch": 24.04632152588556,
+ "grad_norm": 7.721282482147217,
+ "learning_rate": 1.7765411733888286e-05,
+ "loss": 0.5142,
+ "step": 8825
+ },
+ {
+ "epoch": 24.049046321525886,
+ "grad_norm": 7.770618438720703,
+ "learning_rate": 1.776485567333611e-05,
+ "loss": 0.7643,
+ "step": 8826
+ },
+ {
+ "epoch": 24.05177111716621,
+ "grad_norm": 10.189929008483887,
+ "learning_rate": 1.776429955231149e-05,
+ "loss": 0.5923,
+ "step": 8827
+ },
+ {
+ "epoch": 24.05449591280654,
+ "grad_norm": 9.526094436645508,
+ "learning_rate": 1.7763743370818754e-05,
+ "loss": 0.5329,
+ "step": 8828
+ },
+ {
+ "epoch": 24.057220708446867,
+ "grad_norm": 7.70242166519165,
+ "learning_rate": 1.7763187128862237e-05,
+ "loss": 0.5778,
+ "step": 8829
+ },
+ {
+ "epoch": 24.059945504087192,
+ "grad_norm": 6.777331829071045,
+ "learning_rate": 1.7762630826446266e-05,
+ "loss": 0.5876,
+ "step": 8830
+ },
+ {
+ "epoch": 24.06267029972752,
+ "grad_norm": 6.557994842529297,
+ "learning_rate": 1.7762074463575175e-05,
+ "loss": 0.5725,
+ "step": 8831
+ },
+ {
+ "epoch": 24.065395095367847,
+ "grad_norm": 8.306127548217773,
+ "learning_rate": 1.77615180402533e-05,
+ "loss": 0.5729,
+ "step": 8832
+ },
+ {
+ "epoch": 24.068119891008173,
+ "grad_norm": 11.447331428527832,
+ "learning_rate": 1.776096155648497e-05,
+ "loss": 0.5963,
+ "step": 8833
+ },
+ {
+ "epoch": 24.070844686648503,
+ "grad_norm": 9.204768180847168,
+ "learning_rate": 1.7760405012274524e-05,
+ "loss": 0.7494,
+ "step": 8834
+ },
+ {
+ "epoch": 24.07356948228883,
+ "grad_norm": 7.9457197189331055,
+ "learning_rate": 1.775984840762629e-05,
+ "loss": 0.6118,
+ "step": 8835
+ },
+ {
+ "epoch": 24.076294277929154,
+ "grad_norm": 8.53819465637207,
+ "learning_rate": 1.775929174254461e-05,
+ "loss": 0.5968,
+ "step": 8836
+ },
+ {
+ "epoch": 24.079019073569484,
+ "grad_norm": 9.084603309631348,
+ "learning_rate": 1.7758735017033815e-05,
+ "loss": 0.5464,
+ "step": 8837
+ },
+ {
+ "epoch": 24.08174386920981,
+ "grad_norm": 8.14167594909668,
+ "learning_rate": 1.775817823109824e-05,
+ "loss": 0.5959,
+ "step": 8838
+ },
+ {
+ "epoch": 24.084468664850135,
+ "grad_norm": 8.741009712219238,
+ "learning_rate": 1.7757621384742224e-05,
+ "loss": 0.6049,
+ "step": 8839
+ },
+ {
+ "epoch": 24.087193460490465,
+ "grad_norm": 8.19509220123291,
+ "learning_rate": 1.7757064477970102e-05,
+ "loss": 0.6028,
+ "step": 8840
+ },
+ {
+ "epoch": 24.08991825613079,
+ "grad_norm": 7.75546932220459,
+ "learning_rate": 1.775650751078621e-05,
+ "loss": 0.6354,
+ "step": 8841
+ },
+ {
+ "epoch": 24.092643051771116,
+ "grad_norm": 6.951767444610596,
+ "learning_rate": 1.775595048319489e-05,
+ "loss": 0.4155,
+ "step": 8842
+ },
+ {
+ "epoch": 24.095367847411445,
+ "grad_norm": 7.5613837242126465,
+ "learning_rate": 1.7755393395200474e-05,
+ "loss": 0.5192,
+ "step": 8843
+ },
+ {
+ "epoch": 24.09809264305177,
+ "grad_norm": 7.482040882110596,
+ "learning_rate": 1.7754836246807308e-05,
+ "loss": 0.5631,
+ "step": 8844
+ },
+ {
+ "epoch": 24.100817438692097,
+ "grad_norm": 6.91545295715332,
+ "learning_rate": 1.775427903801972e-05,
+ "loss": 0.774,
+ "step": 8845
+ },
+ {
+ "epoch": 24.103542234332426,
+ "grad_norm": 6.406805515289307,
+ "learning_rate": 1.7753721768842062e-05,
+ "loss": 0.6931,
+ "step": 8846
+ },
+ {
+ "epoch": 24.106267029972752,
+ "grad_norm": 7.519858360290527,
+ "learning_rate": 1.775316443927867e-05,
+ "loss": 0.6432,
+ "step": 8847
+ },
+ {
+ "epoch": 24.108991825613078,
+ "grad_norm": 7.980284690856934,
+ "learning_rate": 1.7752607049333878e-05,
+ "loss": 0.6577,
+ "step": 8848
+ },
+ {
+ "epoch": 24.111716621253407,
+ "grad_norm": 6.317418575286865,
+ "learning_rate": 1.7752049599012037e-05,
+ "loss": 0.6211,
+ "step": 8849
+ },
+ {
+ "epoch": 24.114441416893733,
+ "grad_norm": 7.740270614624023,
+ "learning_rate": 1.775149208831748e-05,
+ "loss": 0.6008,
+ "step": 8850
+ },
+ {
+ "epoch": 24.11716621253406,
+ "grad_norm": 9.802743911743164,
+ "learning_rate": 1.775093451725455e-05,
+ "loss": 0.4851,
+ "step": 8851
+ },
+ {
+ "epoch": 24.11989100817439,
+ "grad_norm": 9.85669231414795,
+ "learning_rate": 1.775037688582759e-05,
+ "loss": 0.5617,
+ "step": 8852
+ },
+ {
+ "epoch": 24.122615803814714,
+ "grad_norm": 13.62320613861084,
+ "learning_rate": 1.7749819194040953e-05,
+ "loss": 0.6625,
+ "step": 8853
+ },
+ {
+ "epoch": 24.12534059945504,
+ "grad_norm": 8.604169845581055,
+ "learning_rate": 1.774926144189897e-05,
+ "loss": 0.5516,
+ "step": 8854
+ },
+ {
+ "epoch": 24.12806539509537,
+ "grad_norm": 7.5963945388793945,
+ "learning_rate": 1.7748703629405985e-05,
+ "loss": 0.6075,
+ "step": 8855
+ },
+ {
+ "epoch": 24.130790190735695,
+ "grad_norm": 10.069814682006836,
+ "learning_rate": 1.7748145756566346e-05,
+ "loss": 0.6424,
+ "step": 8856
+ },
+ {
+ "epoch": 24.13351498637602,
+ "grad_norm": 9.934816360473633,
+ "learning_rate": 1.7747587823384398e-05,
+ "loss": 0.6561,
+ "step": 8857
+ },
+ {
+ "epoch": 24.13623978201635,
+ "grad_norm": 7.163966178894043,
+ "learning_rate": 1.7747029829864485e-05,
+ "loss": 0.5048,
+ "step": 8858
+ },
+ {
+ "epoch": 24.138964577656676,
+ "grad_norm": 6.831045627593994,
+ "learning_rate": 1.7746471776010953e-05,
+ "loss": 0.5886,
+ "step": 8859
+ },
+ {
+ "epoch": 24.141689373297,
+ "grad_norm": 8.305370330810547,
+ "learning_rate": 1.7745913661828148e-05,
+ "loss": 0.6605,
+ "step": 8860
+ },
+ {
+ "epoch": 24.14441416893733,
+ "grad_norm": 7.8919677734375,
+ "learning_rate": 1.7745355487320418e-05,
+ "loss": 0.5443,
+ "step": 8861
+ },
+ {
+ "epoch": 24.147138964577657,
+ "grad_norm": 8.134822845458984,
+ "learning_rate": 1.774479725249211e-05,
+ "loss": 0.4431,
+ "step": 8862
+ },
+ {
+ "epoch": 24.149863760217983,
+ "grad_norm": 6.560815334320068,
+ "learning_rate": 1.774423895734757e-05,
+ "loss": 0.465,
+ "step": 8863
+ },
+ {
+ "epoch": 24.152588555858312,
+ "grad_norm": 6.805933475494385,
+ "learning_rate": 1.7743680601891146e-05,
+ "loss": 0.5242,
+ "step": 8864
+ },
+ {
+ "epoch": 24.155313351498638,
+ "grad_norm": 12.554423332214355,
+ "learning_rate": 1.7743122186127186e-05,
+ "loss": 0.5912,
+ "step": 8865
+ },
+ {
+ "epoch": 24.158038147138964,
+ "grad_norm": 9.693236351013184,
+ "learning_rate": 1.7742563710060036e-05,
+ "loss": 0.7233,
+ "step": 8866
+ },
+ {
+ "epoch": 24.160762942779293,
+ "grad_norm": 7.917965888977051,
+ "learning_rate": 1.774200517369405e-05,
+ "loss": 0.5757,
+ "step": 8867
+ },
+ {
+ "epoch": 24.16348773841962,
+ "grad_norm": 7.072247505187988,
+ "learning_rate": 1.7741446577033584e-05,
+ "loss": 0.6943,
+ "step": 8868
+ },
+ {
+ "epoch": 24.166212534059945,
+ "grad_norm": 7.145406723022461,
+ "learning_rate": 1.7740887920082975e-05,
+ "loss": 0.5609,
+ "step": 8869
+ },
+ {
+ "epoch": 24.168937329700274,
+ "grad_norm": 7.124011993408203,
+ "learning_rate": 1.774032920284658e-05,
+ "loss": 0.5221,
+ "step": 8870
+ },
+ {
+ "epoch": 24.1716621253406,
+ "grad_norm": 13.629548072814941,
+ "learning_rate": 1.7739770425328755e-05,
+ "loss": 0.5374,
+ "step": 8871
+ },
+ {
+ "epoch": 24.174386920980925,
+ "grad_norm": 8.548341751098633,
+ "learning_rate": 1.773921158753384e-05,
+ "loss": 0.5474,
+ "step": 8872
+ },
+ {
+ "epoch": 24.177111716621255,
+ "grad_norm": 7.261266708374023,
+ "learning_rate": 1.77386526894662e-05,
+ "loss": 0.4607,
+ "step": 8873
+ },
+ {
+ "epoch": 24.17983651226158,
+ "grad_norm": 8.976286888122559,
+ "learning_rate": 1.773809373113018e-05,
+ "loss": 0.6172,
+ "step": 8874
+ },
+ {
+ "epoch": 24.182561307901906,
+ "grad_norm": 8.677587509155273,
+ "learning_rate": 1.7737534712530133e-05,
+ "loss": 0.5142,
+ "step": 8875
+ },
+ {
+ "epoch": 24.185286103542236,
+ "grad_norm": 6.425335884094238,
+ "learning_rate": 1.7736975633670418e-05,
+ "loss": 0.6136,
+ "step": 8876
+ },
+ {
+ "epoch": 24.18801089918256,
+ "grad_norm": 14.822269439697266,
+ "learning_rate": 1.7736416494555384e-05,
+ "loss": 0.6446,
+ "step": 8877
+ },
+ {
+ "epoch": 24.190735694822887,
+ "grad_norm": 7.213735580444336,
+ "learning_rate": 1.773585729518939e-05,
+ "loss": 0.5947,
+ "step": 8878
+ },
+ {
+ "epoch": 24.193460490463217,
+ "grad_norm": 21.222930908203125,
+ "learning_rate": 1.7735298035576784e-05,
+ "loss": 0.5765,
+ "step": 8879
+ },
+ {
+ "epoch": 24.196185286103542,
+ "grad_norm": 9.02164077758789,
+ "learning_rate": 1.7734738715721928e-05,
+ "loss": 0.5336,
+ "step": 8880
+ },
+ {
+ "epoch": 24.19891008174387,
+ "grad_norm": 8.176846504211426,
+ "learning_rate": 1.7734179335629175e-05,
+ "loss": 0.7168,
+ "step": 8881
+ },
+ {
+ "epoch": 24.201634877384198,
+ "grad_norm": 7.966734409332275,
+ "learning_rate": 1.7733619895302886e-05,
+ "loss": 0.5344,
+ "step": 8882
+ },
+ {
+ "epoch": 24.204359673024523,
+ "grad_norm": 7.438953876495361,
+ "learning_rate": 1.773306039474741e-05,
+ "loss": 0.5792,
+ "step": 8883
+ },
+ {
+ "epoch": 24.20708446866485,
+ "grad_norm": 8.2271146774292,
+ "learning_rate": 1.7732500833967112e-05,
+ "loss": 0.5456,
+ "step": 8884
+ },
+ {
+ "epoch": 24.20980926430518,
+ "grad_norm": 9.87670612335205,
+ "learning_rate": 1.773194121296634e-05,
+ "loss": 0.5912,
+ "step": 8885
+ },
+ {
+ "epoch": 24.212534059945504,
+ "grad_norm": 6.806392192840576,
+ "learning_rate": 1.7731381531749465e-05,
+ "loss": 0.5977,
+ "step": 8886
+ },
+ {
+ "epoch": 24.21525885558583,
+ "grad_norm": 9.069767951965332,
+ "learning_rate": 1.7730821790320836e-05,
+ "loss": 0.7052,
+ "step": 8887
+ },
+ {
+ "epoch": 24.21798365122616,
+ "grad_norm": 7.941775798797607,
+ "learning_rate": 1.7730261988684817e-05,
+ "loss": 0.4982,
+ "step": 8888
+ },
+ {
+ "epoch": 24.220708446866485,
+ "grad_norm": 8.840487480163574,
+ "learning_rate": 1.772970212684577e-05,
+ "loss": 0.5079,
+ "step": 8889
+ },
+ {
+ "epoch": 24.22343324250681,
+ "grad_norm": 6.968510627746582,
+ "learning_rate": 1.7729142204808044e-05,
+ "loss": 0.8477,
+ "step": 8890
+ },
+ {
+ "epoch": 24.22615803814714,
+ "grad_norm": 8.35019588470459,
+ "learning_rate": 1.7728582222576012e-05,
+ "loss": 0.733,
+ "step": 8891
+ },
+ {
+ "epoch": 24.228882833787466,
+ "grad_norm": 20.245084762573242,
+ "learning_rate": 1.7728022180154032e-05,
+ "loss": 0.648,
+ "step": 8892
+ },
+ {
+ "epoch": 24.231607629427792,
+ "grad_norm": 6.931366443634033,
+ "learning_rate": 1.772746207754646e-05,
+ "loss": 0.5787,
+ "step": 8893
+ },
+ {
+ "epoch": 24.23433242506812,
+ "grad_norm": 8.669196128845215,
+ "learning_rate": 1.7726901914757664e-05,
+ "loss": 0.6771,
+ "step": 8894
+ },
+ {
+ "epoch": 24.237057220708447,
+ "grad_norm": 8.523401260375977,
+ "learning_rate": 1.7726341691792007e-05,
+ "loss": 0.6283,
+ "step": 8895
+ },
+ {
+ "epoch": 24.239782016348773,
+ "grad_norm": 8.485087394714355,
+ "learning_rate": 1.7725781408653844e-05,
+ "loss": 0.4896,
+ "step": 8896
+ },
+ {
+ "epoch": 24.242506811989102,
+ "grad_norm": 9.202347755432129,
+ "learning_rate": 1.772522106534755e-05,
+ "loss": 0.6118,
+ "step": 8897
+ },
+ {
+ "epoch": 24.245231607629428,
+ "grad_norm": 8.783988952636719,
+ "learning_rate": 1.7724660661877478e-05,
+ "loss": 0.5195,
+ "step": 8898
+ },
+ {
+ "epoch": 24.247956403269754,
+ "grad_norm": 8.67990493774414,
+ "learning_rate": 1.7724100198248e-05,
+ "loss": 0.6837,
+ "step": 8899
+ },
+ {
+ "epoch": 24.250681198910083,
+ "grad_norm": 6.818397521972656,
+ "learning_rate": 1.7723539674463473e-05,
+ "loss": 0.7156,
+ "step": 8900
+ },
+ {
+ "epoch": 24.25340599455041,
+ "grad_norm": 11.372779846191406,
+ "learning_rate": 1.7722979090528275e-05,
+ "loss": 0.8043,
+ "step": 8901
+ },
+ {
+ "epoch": 24.256130790190735,
+ "grad_norm": 7.923463821411133,
+ "learning_rate": 1.7722418446446764e-05,
+ "loss": 0.7062,
+ "step": 8902
+ },
+ {
+ "epoch": 24.258855585831064,
+ "grad_norm": 9.79150104522705,
+ "learning_rate": 1.7721857742223302e-05,
+ "loss": 0.5948,
+ "step": 8903
+ },
+ {
+ "epoch": 24.26158038147139,
+ "grad_norm": 8.668356895446777,
+ "learning_rate": 1.7721296977862263e-05,
+ "loss": 0.7242,
+ "step": 8904
+ },
+ {
+ "epoch": 24.264305177111716,
+ "grad_norm": 7.8720574378967285,
+ "learning_rate": 1.772073615336801e-05,
+ "loss": 0.6948,
+ "step": 8905
+ },
+ {
+ "epoch": 24.267029972752045,
+ "grad_norm": 13.879902839660645,
+ "learning_rate": 1.7720175268744914e-05,
+ "loss": 0.6692,
+ "step": 8906
+ },
+ {
+ "epoch": 24.26975476839237,
+ "grad_norm": 8.270305633544922,
+ "learning_rate": 1.771961432399734e-05,
+ "loss": 0.5986,
+ "step": 8907
+ },
+ {
+ "epoch": 24.272479564032697,
+ "grad_norm": 7.922856330871582,
+ "learning_rate": 1.771905331912966e-05,
+ "loss": 0.5305,
+ "step": 8908
+ },
+ {
+ "epoch": 24.275204359673026,
+ "grad_norm": 8.344463348388672,
+ "learning_rate": 1.771849225414624e-05,
+ "loss": 0.6023,
+ "step": 8909
+ },
+ {
+ "epoch": 24.277929155313352,
+ "grad_norm": 12.2206392288208,
+ "learning_rate": 1.7717931129051453e-05,
+ "loss": 0.6153,
+ "step": 8910
+ },
+ {
+ "epoch": 24.280653950953678,
+ "grad_norm": 8.765689849853516,
+ "learning_rate": 1.7717369943849666e-05,
+ "loss": 0.6091,
+ "step": 8911
+ },
+ {
+ "epoch": 24.283378746594007,
+ "grad_norm": 8.562520027160645,
+ "learning_rate": 1.771680869854525e-05,
+ "loss": 0.7114,
+ "step": 8912
+ },
+ {
+ "epoch": 24.286103542234333,
+ "grad_norm": 7.536573886871338,
+ "learning_rate": 1.7716247393142574e-05,
+ "loss": 0.8361,
+ "step": 8913
+ },
+ {
+ "epoch": 24.28882833787466,
+ "grad_norm": 9.855628967285156,
+ "learning_rate": 1.7715686027646012e-05,
+ "loss": 0.7352,
+ "step": 8914
+ },
+ {
+ "epoch": 24.291553133514988,
+ "grad_norm": 8.171891212463379,
+ "learning_rate": 1.7715124602059938e-05,
+ "loss": 0.5229,
+ "step": 8915
+ },
+ {
+ "epoch": 24.294277929155314,
+ "grad_norm": 8.117642402648926,
+ "learning_rate": 1.7714563116388717e-05,
+ "loss": 0.5455,
+ "step": 8916
+ },
+ {
+ "epoch": 24.29700272479564,
+ "grad_norm": 8.047110557556152,
+ "learning_rate": 1.771400157063673e-05,
+ "loss": 0.6682,
+ "step": 8917
+ },
+ {
+ "epoch": 24.29972752043597,
+ "grad_norm": 6.081267356872559,
+ "learning_rate": 1.771343996480835e-05,
+ "loss": 0.4733,
+ "step": 8918
+ },
+ {
+ "epoch": 24.302452316076295,
+ "grad_norm": 7.226494312286377,
+ "learning_rate": 1.7712878298907947e-05,
+ "loss": 0.6339,
+ "step": 8919
+ },
+ {
+ "epoch": 24.30517711171662,
+ "grad_norm": 7.701619625091553,
+ "learning_rate": 1.7712316572939893e-05,
+ "loss": 0.682,
+ "step": 8920
+ },
+ {
+ "epoch": 24.30790190735695,
+ "grad_norm": 12.228361129760742,
+ "learning_rate": 1.7711754786908566e-05,
+ "loss": 0.7488,
+ "step": 8921
+ },
+ {
+ "epoch": 24.310626702997276,
+ "grad_norm": 7.400647163391113,
+ "learning_rate": 1.771119294081834e-05,
+ "loss": 0.5571,
+ "step": 8922
+ },
+ {
+ "epoch": 24.3133514986376,
+ "grad_norm": 8.388209342956543,
+ "learning_rate": 1.7710631034673596e-05,
+ "loss": 0.6585,
+ "step": 8923
+ },
+ {
+ "epoch": 24.31607629427793,
+ "grad_norm": 11.702413558959961,
+ "learning_rate": 1.77100690684787e-05,
+ "loss": 0.6978,
+ "step": 8924
+ },
+ {
+ "epoch": 24.318801089918257,
+ "grad_norm": 8.448484420776367,
+ "learning_rate": 1.770950704223804e-05,
+ "loss": 0.6179,
+ "step": 8925
+ },
+ {
+ "epoch": 24.321525885558582,
+ "grad_norm": 13.490495681762695,
+ "learning_rate": 1.7708944955955983e-05,
+ "loss": 0.5149,
+ "step": 8926
+ },
+ {
+ "epoch": 24.32425068119891,
+ "grad_norm": 7.025055885314941,
+ "learning_rate": 1.7708382809636916e-05,
+ "loss": 0.6355,
+ "step": 8927
+ },
+ {
+ "epoch": 24.326975476839237,
+ "grad_norm": 9.349492073059082,
+ "learning_rate": 1.7707820603285205e-05,
+ "loss": 0.6227,
+ "step": 8928
+ },
+ {
+ "epoch": 24.329700272479563,
+ "grad_norm": 7.702953338623047,
+ "learning_rate": 1.770725833690524e-05,
+ "loss": 0.587,
+ "step": 8929
+ },
+ {
+ "epoch": 24.332425068119893,
+ "grad_norm": 8.693236351013184,
+ "learning_rate": 1.7706696010501393e-05,
+ "loss": 0.6459,
+ "step": 8930
+ },
+ {
+ "epoch": 24.33514986376022,
+ "grad_norm": 7.2914042472839355,
+ "learning_rate": 1.7706133624078046e-05,
+ "loss": 0.6217,
+ "step": 8931
+ },
+ {
+ "epoch": 24.337874659400544,
+ "grad_norm": 8.049612045288086,
+ "learning_rate": 1.7705571177639576e-05,
+ "loss": 0.5838,
+ "step": 8932
+ },
+ {
+ "epoch": 24.340599455040874,
+ "grad_norm": 6.403984069824219,
+ "learning_rate": 1.770500867119037e-05,
+ "loss": 0.636,
+ "step": 8933
+ },
+ {
+ "epoch": 24.3433242506812,
+ "grad_norm": 8.680638313293457,
+ "learning_rate": 1.7704446104734803e-05,
+ "loss": 0.6687,
+ "step": 8934
+ },
+ {
+ "epoch": 24.346049046321525,
+ "grad_norm": 10.090593338012695,
+ "learning_rate": 1.7703883478277254e-05,
+ "loss": 0.5801,
+ "step": 8935
+ },
+ {
+ "epoch": 24.348773841961854,
+ "grad_norm": 7.0510573387146,
+ "learning_rate": 1.7703320791822115e-05,
+ "loss": 0.5844,
+ "step": 8936
+ },
+ {
+ "epoch": 24.35149863760218,
+ "grad_norm": 7.9243292808532715,
+ "learning_rate": 1.7702758045373757e-05,
+ "loss": 0.56,
+ "step": 8937
+ },
+ {
+ "epoch": 24.354223433242506,
+ "grad_norm": 8.23276138305664,
+ "learning_rate": 1.7702195238936567e-05,
+ "loss": 0.5253,
+ "step": 8938
+ },
+ {
+ "epoch": 24.356948228882835,
+ "grad_norm": 7.644566059112549,
+ "learning_rate": 1.7701632372514934e-05,
+ "loss": 0.5872,
+ "step": 8939
+ },
+ {
+ "epoch": 24.35967302452316,
+ "grad_norm": 7.820858001708984,
+ "learning_rate": 1.770106944611323e-05,
+ "loss": 0.5786,
+ "step": 8940
+ },
+ {
+ "epoch": 24.362397820163487,
+ "grad_norm": 8.273859977722168,
+ "learning_rate": 1.7700506459735844e-05,
+ "loss": 0.6094,
+ "step": 8941
+ },
+ {
+ "epoch": 24.365122615803816,
+ "grad_norm": 8.284680366516113,
+ "learning_rate": 1.7699943413387166e-05,
+ "loss": 0.6714,
+ "step": 8942
+ },
+ {
+ "epoch": 24.367847411444142,
+ "grad_norm": 7.8198981285095215,
+ "learning_rate": 1.7699380307071575e-05,
+ "loss": 0.6301,
+ "step": 8943
+ },
+ {
+ "epoch": 24.370572207084468,
+ "grad_norm": 10.067788124084473,
+ "learning_rate": 1.7698817140793458e-05,
+ "loss": 0.5275,
+ "step": 8944
+ },
+ {
+ "epoch": 24.373297002724797,
+ "grad_norm": 6.036175727844238,
+ "learning_rate": 1.76982539145572e-05,
+ "loss": 0.774,
+ "step": 8945
+ },
+ {
+ "epoch": 24.376021798365123,
+ "grad_norm": 8.07691478729248,
+ "learning_rate": 1.7697690628367188e-05,
+ "loss": 0.6495,
+ "step": 8946
+ },
+ {
+ "epoch": 24.37874659400545,
+ "grad_norm": 7.238626480102539,
+ "learning_rate": 1.769712728222781e-05,
+ "loss": 0.6085,
+ "step": 8947
+ },
+ {
+ "epoch": 24.381471389645778,
+ "grad_norm": 7.894228935241699,
+ "learning_rate": 1.7696563876143455e-05,
+ "loss": 0.7269,
+ "step": 8948
+ },
+ {
+ "epoch": 24.384196185286104,
+ "grad_norm": 8.925589561462402,
+ "learning_rate": 1.7696000410118504e-05,
+ "loss": 0.5912,
+ "step": 8949
+ },
+ {
+ "epoch": 24.38692098092643,
+ "grad_norm": 8.214383125305176,
+ "learning_rate": 1.7695436884157353e-05,
+ "loss": 0.6021,
+ "step": 8950
+ },
+ {
+ "epoch": 24.38964577656676,
+ "grad_norm": 7.753206253051758,
+ "learning_rate": 1.7694873298264385e-05,
+ "loss": 0.6138,
+ "step": 8951
+ },
+ {
+ "epoch": 24.392370572207085,
+ "grad_norm": 7.649204254150391,
+ "learning_rate": 1.769430965244399e-05,
+ "loss": 0.6303,
+ "step": 8952
+ },
+ {
+ "epoch": 24.39509536784741,
+ "grad_norm": 7.90365743637085,
+ "learning_rate": 1.7693745946700566e-05,
+ "loss": 0.632,
+ "step": 8953
+ },
+ {
+ "epoch": 24.39782016348774,
+ "grad_norm": 8.675521850585938,
+ "learning_rate": 1.769318218103849e-05,
+ "loss": 0.6139,
+ "step": 8954
+ },
+ {
+ "epoch": 24.400544959128066,
+ "grad_norm": 9.54442310333252,
+ "learning_rate": 1.7692618355462157e-05,
+ "loss": 0.5366,
+ "step": 8955
+ },
+ {
+ "epoch": 24.40326975476839,
+ "grad_norm": 7.759203910827637,
+ "learning_rate": 1.7692054469975964e-05,
+ "loss": 0.4946,
+ "step": 8956
+ },
+ {
+ "epoch": 24.40599455040872,
+ "grad_norm": 26.981840133666992,
+ "learning_rate": 1.7691490524584297e-05,
+ "loss": 0.7293,
+ "step": 8957
+ },
+ {
+ "epoch": 24.408719346049047,
+ "grad_norm": 9.283357620239258,
+ "learning_rate": 1.7690926519291548e-05,
+ "loss": 0.7754,
+ "step": 8958
+ },
+ {
+ "epoch": 24.411444141689373,
+ "grad_norm": 7.14051628112793,
+ "learning_rate": 1.7690362454102114e-05,
+ "loss": 0.5724,
+ "step": 8959
+ },
+ {
+ "epoch": 24.414168937329702,
+ "grad_norm": 8.556551933288574,
+ "learning_rate": 1.7689798329020386e-05,
+ "loss": 0.5964,
+ "step": 8960
+ },
+ {
+ "epoch": 24.416893732970028,
+ "grad_norm": 7.010879993438721,
+ "learning_rate": 1.768923414405075e-05,
+ "loss": 0.54,
+ "step": 8961
+ },
+ {
+ "epoch": 24.419618528610354,
+ "grad_norm": 7.770777225494385,
+ "learning_rate": 1.768866989919761e-05,
+ "loss": 0.5397,
+ "step": 8962
+ },
+ {
+ "epoch": 24.422343324250683,
+ "grad_norm": 8.03707504272461,
+ "learning_rate": 1.7688105594465356e-05,
+ "loss": 0.6537,
+ "step": 8963
+ },
+ {
+ "epoch": 24.42506811989101,
+ "grad_norm": 8.599611282348633,
+ "learning_rate": 1.768754122985838e-05,
+ "loss": 0.6307,
+ "step": 8964
+ },
+ {
+ "epoch": 24.427792915531334,
+ "grad_norm": 8.289087295532227,
+ "learning_rate": 1.7686976805381084e-05,
+ "loss": 0.6356,
+ "step": 8965
+ },
+ {
+ "epoch": 24.430517711171664,
+ "grad_norm": 7.699691295623779,
+ "learning_rate": 1.7686412321037857e-05,
+ "loss": 0.5087,
+ "step": 8966
+ },
+ {
+ "epoch": 24.43324250681199,
+ "grad_norm": 6.849878311157227,
+ "learning_rate": 1.76858477768331e-05,
+ "loss": 0.5422,
+ "step": 8967
+ },
+ {
+ "epoch": 24.435967302452315,
+ "grad_norm": 7.258474826812744,
+ "learning_rate": 1.768528317277121e-05,
+ "loss": 0.4946,
+ "step": 8968
+ },
+ {
+ "epoch": 24.438692098092645,
+ "grad_norm": 13.755452156066895,
+ "learning_rate": 1.768471850885658e-05,
+ "loss": 0.538,
+ "step": 8969
+ },
+ {
+ "epoch": 24.44141689373297,
+ "grad_norm": 6.409572124481201,
+ "learning_rate": 1.768415378509361e-05,
+ "loss": 0.6858,
+ "step": 8970
+ },
+ {
+ "epoch": 24.444141689373296,
+ "grad_norm": 7.1457014083862305,
+ "learning_rate": 1.7683589001486696e-05,
+ "loss": 0.7271,
+ "step": 8971
+ },
+ {
+ "epoch": 24.446866485013626,
+ "grad_norm": 7.805093765258789,
+ "learning_rate": 1.768302415804024e-05,
+ "loss": 0.6566,
+ "step": 8972
+ },
+ {
+ "epoch": 24.44959128065395,
+ "grad_norm": 9.943085670471191,
+ "learning_rate": 1.768245925475864e-05,
+ "loss": 0.6541,
+ "step": 8973
+ },
+ {
+ "epoch": 24.452316076294277,
+ "grad_norm": 9.868901252746582,
+ "learning_rate": 1.7681894291646293e-05,
+ "loss": 0.4976,
+ "step": 8974
+ },
+ {
+ "epoch": 24.455040871934607,
+ "grad_norm": 9.336941719055176,
+ "learning_rate": 1.7681329268707598e-05,
+ "loss": 0.5962,
+ "step": 8975
+ },
+ {
+ "epoch": 24.457765667574932,
+ "grad_norm": 9.290519714355469,
+ "learning_rate": 1.768076418594696e-05,
+ "loss": 0.6821,
+ "step": 8976
+ },
+ {
+ "epoch": 24.460490463215258,
+ "grad_norm": 8.6582612991333,
+ "learning_rate": 1.768019904336878e-05,
+ "loss": 0.6085,
+ "step": 8977
+ },
+ {
+ "epoch": 24.463215258855588,
+ "grad_norm": 7.847634315490723,
+ "learning_rate": 1.7679633840977454e-05,
+ "loss": 0.5726,
+ "step": 8978
+ },
+ {
+ "epoch": 24.465940054495913,
+ "grad_norm": 8.564176559448242,
+ "learning_rate": 1.7679068578777387e-05,
+ "loss": 0.6907,
+ "step": 8979
+ },
+ {
+ "epoch": 24.46866485013624,
+ "grad_norm": 8.275485038757324,
+ "learning_rate": 1.7678503256772985e-05,
+ "loss": 0.6737,
+ "step": 8980
+ },
+ {
+ "epoch": 24.47138964577657,
+ "grad_norm": 9.92436408996582,
+ "learning_rate": 1.7677937874968646e-05,
+ "loss": 0.5356,
+ "step": 8981
+ },
+ {
+ "epoch": 24.474114441416894,
+ "grad_norm": 7.590448379516602,
+ "learning_rate": 1.767737243336877e-05,
+ "loss": 0.6865,
+ "step": 8982
+ },
+ {
+ "epoch": 24.47683923705722,
+ "grad_norm": 8.421040534973145,
+ "learning_rate": 1.7676806931977765e-05,
+ "loss": 0.5803,
+ "step": 8983
+ },
+ {
+ "epoch": 24.479564032697546,
+ "grad_norm": 9.572787284851074,
+ "learning_rate": 1.7676241370800037e-05,
+ "loss": 0.6669,
+ "step": 8984
+ },
+ {
+ "epoch": 24.482288828337875,
+ "grad_norm": 7.989253520965576,
+ "learning_rate": 1.7675675749839988e-05,
+ "loss": 0.5555,
+ "step": 8985
+ },
+ {
+ "epoch": 24.4850136239782,
+ "grad_norm": 7.294342517852783,
+ "learning_rate": 1.7675110069102022e-05,
+ "loss": 0.601,
+ "step": 8986
+ },
+ {
+ "epoch": 24.48773841961853,
+ "grad_norm": 8.045269012451172,
+ "learning_rate": 1.7674544328590547e-05,
+ "loss": 0.5715,
+ "step": 8987
+ },
+ {
+ "epoch": 24.490463215258856,
+ "grad_norm": 7.78092622756958,
+ "learning_rate": 1.7673978528309964e-05,
+ "loss": 0.6519,
+ "step": 8988
+ },
+ {
+ "epoch": 24.493188010899182,
+ "grad_norm": 8.891827583312988,
+ "learning_rate": 1.7673412668264687e-05,
+ "loss": 0.7516,
+ "step": 8989
+ },
+ {
+ "epoch": 24.495912806539508,
+ "grad_norm": 7.932019233703613,
+ "learning_rate": 1.767284674845912e-05,
+ "loss": 0.6261,
+ "step": 8990
+ },
+ {
+ "epoch": 24.498637602179837,
+ "grad_norm": 8.965381622314453,
+ "learning_rate": 1.767228076889767e-05,
+ "loss": 0.6057,
+ "step": 8991
+ },
+ {
+ "epoch": 24.501362397820163,
+ "grad_norm": 7.663259983062744,
+ "learning_rate": 1.767171472958474e-05,
+ "loss": 0.6209,
+ "step": 8992
+ },
+ {
+ "epoch": 24.504087193460492,
+ "grad_norm": 10.831971168518066,
+ "learning_rate": 1.7671148630524745e-05,
+ "loss": 0.5768,
+ "step": 8993
+ },
+ {
+ "epoch": 24.506811989100818,
+ "grad_norm": 7.278465747833252,
+ "learning_rate": 1.767058247172209e-05,
+ "loss": 0.6361,
+ "step": 8994
+ },
+ {
+ "epoch": 24.509536784741144,
+ "grad_norm": 10.330945014953613,
+ "learning_rate": 1.767001625318119e-05,
+ "loss": 0.655,
+ "step": 8995
+ },
+ {
+ "epoch": 24.51226158038147,
+ "grad_norm": 8.391157150268555,
+ "learning_rate": 1.7669449974906446e-05,
+ "loss": 0.6749,
+ "step": 8996
+ },
+ {
+ "epoch": 24.5149863760218,
+ "grad_norm": 6.680755615234375,
+ "learning_rate": 1.766888363690227e-05,
+ "loss": 0.6873,
+ "step": 8997
+ },
+ {
+ "epoch": 24.517711171662125,
+ "grad_norm": 9.297725677490234,
+ "learning_rate": 1.766831723917308e-05,
+ "loss": 0.6774,
+ "step": 8998
+ },
+ {
+ "epoch": 24.520435967302454,
+ "grad_norm": 7.953189849853516,
+ "learning_rate": 1.7667750781723282e-05,
+ "loss": 0.6069,
+ "step": 8999
+ },
+ {
+ "epoch": 24.52316076294278,
+ "grad_norm": 7.478446006774902,
+ "learning_rate": 1.7667184264557286e-05,
+ "loss": 0.6924,
+ "step": 9000
+ },
+ {
+ "epoch": 24.525885558583106,
+ "grad_norm": 7.651972770690918,
+ "learning_rate": 1.7666617687679505e-05,
+ "loss": 0.5371,
+ "step": 9001
+ },
+ {
+ "epoch": 24.52861035422343,
+ "grad_norm": 7.096588611602783,
+ "learning_rate": 1.766605105109435e-05,
+ "loss": 0.6324,
+ "step": 9002
+ },
+ {
+ "epoch": 24.53133514986376,
+ "grad_norm": 9.0821533203125,
+ "learning_rate": 1.7665484354806244e-05,
+ "loss": 0.7375,
+ "step": 9003
+ },
+ {
+ "epoch": 24.534059945504087,
+ "grad_norm": 6.819845676422119,
+ "learning_rate": 1.766491759881959e-05,
+ "loss": 0.5464,
+ "step": 9004
+ },
+ {
+ "epoch": 24.536784741144416,
+ "grad_norm": 8.515116691589355,
+ "learning_rate": 1.76643507831388e-05,
+ "loss": 0.5974,
+ "step": 9005
+ },
+ {
+ "epoch": 24.539509536784742,
+ "grad_norm": 9.178707122802734,
+ "learning_rate": 1.7663783907768298e-05,
+ "loss": 0.775,
+ "step": 9006
+ },
+ {
+ "epoch": 24.542234332425068,
+ "grad_norm": 7.338752269744873,
+ "learning_rate": 1.766321697271249e-05,
+ "loss": 0.6062,
+ "step": 9007
+ },
+ {
+ "epoch": 24.544959128065393,
+ "grad_norm": 8.074347496032715,
+ "learning_rate": 1.7662649977975794e-05,
+ "loss": 0.5342,
+ "step": 9008
+ },
+ {
+ "epoch": 24.547683923705723,
+ "grad_norm": 9.013470649719238,
+ "learning_rate": 1.766208292356263e-05,
+ "loss": 0.5968,
+ "step": 9009
+ },
+ {
+ "epoch": 24.55040871934605,
+ "grad_norm": 8.02351188659668,
+ "learning_rate": 1.766151580947741e-05,
+ "loss": 0.6957,
+ "step": 9010
+ },
+ {
+ "epoch": 24.553133514986374,
+ "grad_norm": 7.712599277496338,
+ "learning_rate": 1.766094863572455e-05,
+ "loss": 0.6971,
+ "step": 9011
+ },
+ {
+ "epoch": 24.555858310626704,
+ "grad_norm": 9.144669532775879,
+ "learning_rate": 1.7660381402308465e-05,
+ "loss": 0.678,
+ "step": 9012
+ },
+ {
+ "epoch": 24.55858310626703,
+ "grad_norm": 9.957167625427246,
+ "learning_rate": 1.765981410923358e-05,
+ "loss": 0.6351,
+ "step": 9013
+ },
+ {
+ "epoch": 24.561307901907355,
+ "grad_norm": 8.49111270904541,
+ "learning_rate": 1.7659246756504313e-05,
+ "loss": 0.577,
+ "step": 9014
+ },
+ {
+ "epoch": 24.564032697547685,
+ "grad_norm": 8.66234302520752,
+ "learning_rate": 1.7658679344125075e-05,
+ "loss": 0.5004,
+ "step": 9015
+ },
+ {
+ "epoch": 24.56675749318801,
+ "grad_norm": 10.30588436126709,
+ "learning_rate": 1.7658111872100287e-05,
+ "loss": 0.4411,
+ "step": 9016
+ },
+ {
+ "epoch": 24.569482288828336,
+ "grad_norm": 8.420388221740723,
+ "learning_rate": 1.7657544340434375e-05,
+ "loss": 0.6025,
+ "step": 9017
+ },
+ {
+ "epoch": 24.572207084468666,
+ "grad_norm": 8.328437805175781,
+ "learning_rate": 1.7656976749131753e-05,
+ "loss": 0.5613,
+ "step": 9018
+ },
+ {
+ "epoch": 24.57493188010899,
+ "grad_norm": 7.625326633453369,
+ "learning_rate": 1.765640909819684e-05,
+ "loss": 0.55,
+ "step": 9019
+ },
+ {
+ "epoch": 24.577656675749317,
+ "grad_norm": 10.811392784118652,
+ "learning_rate": 1.7655841387634057e-05,
+ "loss": 0.9567,
+ "step": 9020
+ },
+ {
+ "epoch": 24.580381471389646,
+ "grad_norm": 22.325044631958008,
+ "learning_rate": 1.765527361744783e-05,
+ "loss": 0.8193,
+ "step": 9021
+ },
+ {
+ "epoch": 24.583106267029972,
+ "grad_norm": 9.547529220581055,
+ "learning_rate": 1.765470578764258e-05,
+ "loss": 0.6692,
+ "step": 9022
+ },
+ {
+ "epoch": 24.585831062670298,
+ "grad_norm": 9.6989107131958,
+ "learning_rate": 1.7654137898222728e-05,
+ "loss": 0.7803,
+ "step": 9023
+ },
+ {
+ "epoch": 24.588555858310627,
+ "grad_norm": 10.85034465789795,
+ "learning_rate": 1.7653569949192698e-05,
+ "loss": 0.4957,
+ "step": 9024
+ },
+ {
+ "epoch": 24.591280653950953,
+ "grad_norm": 10.391765594482422,
+ "learning_rate": 1.765300194055691e-05,
+ "loss": 0.6892,
+ "step": 9025
+ },
+ {
+ "epoch": 24.59400544959128,
+ "grad_norm": 7.947431564331055,
+ "learning_rate": 1.7652433872319785e-05,
+ "loss": 0.6081,
+ "step": 9026
+ },
+ {
+ "epoch": 24.59673024523161,
+ "grad_norm": 7.657660961151123,
+ "learning_rate": 1.7651865744485755e-05,
+ "loss": 0.608,
+ "step": 9027
+ },
+ {
+ "epoch": 24.599455040871934,
+ "grad_norm": 12.64451789855957,
+ "learning_rate": 1.765129755705924e-05,
+ "loss": 0.6497,
+ "step": 9028
+ },
+ {
+ "epoch": 24.60217983651226,
+ "grad_norm": 7.720130443572998,
+ "learning_rate": 1.7650729310044667e-05,
+ "loss": 0.6349,
+ "step": 9029
+ },
+ {
+ "epoch": 24.60490463215259,
+ "grad_norm": 6.875460147857666,
+ "learning_rate": 1.765016100344646e-05,
+ "loss": 0.6453,
+ "step": 9030
+ },
+ {
+ "epoch": 24.607629427792915,
+ "grad_norm": 9.920437812805176,
+ "learning_rate": 1.7649592637269045e-05,
+ "loss": 0.6627,
+ "step": 9031
+ },
+ {
+ "epoch": 24.61035422343324,
+ "grad_norm": 7.393453598022461,
+ "learning_rate": 1.7649024211516848e-05,
+ "loss": 0.534,
+ "step": 9032
+ },
+ {
+ "epoch": 24.61307901907357,
+ "grad_norm": 8.168704986572266,
+ "learning_rate": 1.76484557261943e-05,
+ "loss": 0.5313,
+ "step": 9033
+ },
+ {
+ "epoch": 24.615803814713896,
+ "grad_norm": 8.419522285461426,
+ "learning_rate": 1.7647887181305822e-05,
+ "loss": 0.7209,
+ "step": 9034
+ },
+ {
+ "epoch": 24.618528610354222,
+ "grad_norm": 8.104192733764648,
+ "learning_rate": 1.7647318576855843e-05,
+ "loss": 0.6615,
+ "step": 9035
+ },
+ {
+ "epoch": 24.62125340599455,
+ "grad_norm": 7.3158488273620605,
+ "learning_rate": 1.7646749912848795e-05,
+ "loss": 0.6165,
+ "step": 9036
+ },
+ {
+ "epoch": 24.623978201634877,
+ "grad_norm": 8.528558731079102,
+ "learning_rate": 1.7646181189289108e-05,
+ "loss": 0.6068,
+ "step": 9037
+ },
+ {
+ "epoch": 24.626702997275203,
+ "grad_norm": 11.592710494995117,
+ "learning_rate": 1.7645612406181204e-05,
+ "loss": 0.6259,
+ "step": 9038
+ },
+ {
+ "epoch": 24.629427792915532,
+ "grad_norm": 7.119830131530762,
+ "learning_rate": 1.7645043563529518e-05,
+ "loss": 0.5124,
+ "step": 9039
+ },
+ {
+ "epoch": 24.632152588555858,
+ "grad_norm": 9.007055282592773,
+ "learning_rate": 1.764447466133848e-05,
+ "loss": 0.7422,
+ "step": 9040
+ },
+ {
+ "epoch": 24.634877384196184,
+ "grad_norm": 7.347967624664307,
+ "learning_rate": 1.7643905699612513e-05,
+ "loss": 0.5612,
+ "step": 9041
+ },
+ {
+ "epoch": 24.637602179836513,
+ "grad_norm": 8.965445518493652,
+ "learning_rate": 1.7643336678356063e-05,
+ "loss": 0.7264,
+ "step": 9042
+ },
+ {
+ "epoch": 24.64032697547684,
+ "grad_norm": 10.226734161376953,
+ "learning_rate": 1.7642767597573548e-05,
+ "loss": 0.6119,
+ "step": 9043
+ },
+ {
+ "epoch": 24.643051771117165,
+ "grad_norm": 7.831031799316406,
+ "learning_rate": 1.7642198457269405e-05,
+ "loss": 0.5123,
+ "step": 9044
+ },
+ {
+ "epoch": 24.645776566757494,
+ "grad_norm": 7.503066062927246,
+ "learning_rate": 1.7641629257448068e-05,
+ "loss": 0.5405,
+ "step": 9045
+ },
+ {
+ "epoch": 24.64850136239782,
+ "grad_norm": 15.644835472106934,
+ "learning_rate": 1.7641059998113966e-05,
+ "loss": 0.6517,
+ "step": 9046
+ },
+ {
+ "epoch": 24.651226158038146,
+ "grad_norm": 8.321699142456055,
+ "learning_rate": 1.7640490679271537e-05,
+ "loss": 0.7328,
+ "step": 9047
+ },
+ {
+ "epoch": 24.653950953678475,
+ "grad_norm": 11.984652519226074,
+ "learning_rate": 1.7639921300925213e-05,
+ "loss": 0.6308,
+ "step": 9048
+ },
+ {
+ "epoch": 24.6566757493188,
+ "grad_norm": 7.8258748054504395,
+ "learning_rate": 1.7639351863079426e-05,
+ "loss": 0.6423,
+ "step": 9049
+ },
+ {
+ "epoch": 24.659400544959126,
+ "grad_norm": 6.94466495513916,
+ "learning_rate": 1.7638782365738613e-05,
+ "loss": 0.6277,
+ "step": 9050
+ },
+ {
+ "epoch": 24.662125340599456,
+ "grad_norm": 6.627162456512451,
+ "learning_rate": 1.763821280890721e-05,
+ "loss": 0.7846,
+ "step": 9051
+ },
+ {
+ "epoch": 24.66485013623978,
+ "grad_norm": 10.093145370483398,
+ "learning_rate": 1.763764319258965e-05,
+ "loss": 0.6024,
+ "step": 9052
+ },
+ {
+ "epoch": 24.667574931880107,
+ "grad_norm": 10.328065872192383,
+ "learning_rate": 1.7637073516790373e-05,
+ "loss": 0.6041,
+ "step": 9053
+ },
+ {
+ "epoch": 24.670299727520437,
+ "grad_norm": 8.410794258117676,
+ "learning_rate": 1.7636503781513808e-05,
+ "loss": 0.7278,
+ "step": 9054
+ },
+ {
+ "epoch": 24.673024523160763,
+ "grad_norm": 7.4909348487854,
+ "learning_rate": 1.7635933986764403e-05,
+ "loss": 0.575,
+ "step": 9055
+ },
+ {
+ "epoch": 24.67574931880109,
+ "grad_norm": 10.587180137634277,
+ "learning_rate": 1.7635364132546587e-05,
+ "loss": 0.4573,
+ "step": 9056
+ },
+ {
+ "epoch": 24.678474114441418,
+ "grad_norm": 10.027560234069824,
+ "learning_rate": 1.7634794218864802e-05,
+ "loss": 0.7155,
+ "step": 9057
+ },
+ {
+ "epoch": 24.681198910081743,
+ "grad_norm": 8.658035278320312,
+ "learning_rate": 1.7634224245723482e-05,
+ "loss": 0.6944,
+ "step": 9058
+ },
+ {
+ "epoch": 24.68392370572207,
+ "grad_norm": 7.574838161468506,
+ "learning_rate": 1.7633654213127074e-05,
+ "loss": 0.5848,
+ "step": 9059
+ },
+ {
+ "epoch": 24.6866485013624,
+ "grad_norm": 15.168315887451172,
+ "learning_rate": 1.763308412108001e-05,
+ "loss": 0.8035,
+ "step": 9060
+ },
+ {
+ "epoch": 24.689373297002724,
+ "grad_norm": 13.63664722442627,
+ "learning_rate": 1.7632513969586736e-05,
+ "loss": 0.5897,
+ "step": 9061
+ },
+ {
+ "epoch": 24.69209809264305,
+ "grad_norm": 8.766971588134766,
+ "learning_rate": 1.7631943758651687e-05,
+ "loss": 0.5793,
+ "step": 9062
+ },
+ {
+ "epoch": 24.69482288828338,
+ "grad_norm": 8.28712272644043,
+ "learning_rate": 1.7631373488279303e-05,
+ "loss": 0.749,
+ "step": 9063
+ },
+ {
+ "epoch": 24.697547683923705,
+ "grad_norm": 7.610118865966797,
+ "learning_rate": 1.763080315847403e-05,
+ "loss": 0.6459,
+ "step": 9064
+ },
+ {
+ "epoch": 24.70027247956403,
+ "grad_norm": 11.615033149719238,
+ "learning_rate": 1.7630232769240307e-05,
+ "loss": 0.5387,
+ "step": 9065
+ },
+ {
+ "epoch": 24.70299727520436,
+ "grad_norm": 8.760119438171387,
+ "learning_rate": 1.7629662320582578e-05,
+ "loss": 0.7877,
+ "step": 9066
+ },
+ {
+ "epoch": 24.705722070844686,
+ "grad_norm": 7.303828239440918,
+ "learning_rate": 1.7629091812505285e-05,
+ "loss": 0.7491,
+ "step": 9067
+ },
+ {
+ "epoch": 24.708446866485012,
+ "grad_norm": 9.286757469177246,
+ "learning_rate": 1.762852124501287e-05,
+ "loss": 0.7002,
+ "step": 9068
+ },
+ {
+ "epoch": 24.71117166212534,
+ "grad_norm": 7.101996898651123,
+ "learning_rate": 1.7627950618109775e-05,
+ "loss": 0.6022,
+ "step": 9069
+ },
+ {
+ "epoch": 24.713896457765667,
+ "grad_norm": 8.550169944763184,
+ "learning_rate": 1.7627379931800446e-05,
+ "loss": 0.6114,
+ "step": 9070
+ },
+ {
+ "epoch": 24.716621253405993,
+ "grad_norm": 9.084425926208496,
+ "learning_rate": 1.762680918608933e-05,
+ "loss": 0.6962,
+ "step": 9071
+ },
+ {
+ "epoch": 24.719346049046322,
+ "grad_norm": 8.570323944091797,
+ "learning_rate": 1.7626238380980866e-05,
+ "loss": 0.7131,
+ "step": 9072
+ },
+ {
+ "epoch": 24.722070844686648,
+ "grad_norm": 8.048595428466797,
+ "learning_rate": 1.7625667516479508e-05,
+ "loss": 0.7187,
+ "step": 9073
+ },
+ {
+ "epoch": 24.724795640326974,
+ "grad_norm": 8.957825660705566,
+ "learning_rate": 1.7625096592589692e-05,
+ "loss": 0.7624,
+ "step": 9074
+ },
+ {
+ "epoch": 24.727520435967303,
+ "grad_norm": 9.336494445800781,
+ "learning_rate": 1.7624525609315873e-05,
+ "loss": 0.6737,
+ "step": 9075
+ },
+ {
+ "epoch": 24.73024523160763,
+ "grad_norm": 14.707310676574707,
+ "learning_rate": 1.762395456666249e-05,
+ "loss": 0.6622,
+ "step": 9076
+ },
+ {
+ "epoch": 24.732970027247955,
+ "grad_norm": 8.099577903747559,
+ "learning_rate": 1.7623383464633996e-05,
+ "loss": 0.6689,
+ "step": 9077
+ },
+ {
+ "epoch": 24.735694822888284,
+ "grad_norm": 7.692896366119385,
+ "learning_rate": 1.7622812303234837e-05,
+ "loss": 0.7451,
+ "step": 9078
+ },
+ {
+ "epoch": 24.73841961852861,
+ "grad_norm": 7.110904216766357,
+ "learning_rate": 1.7622241082469463e-05,
+ "loss": 0.8058,
+ "step": 9079
+ },
+ {
+ "epoch": 24.741144414168936,
+ "grad_norm": 9.915729522705078,
+ "learning_rate": 1.762166980234232e-05,
+ "loss": 0.6854,
+ "step": 9080
+ },
+ {
+ "epoch": 24.743869209809265,
+ "grad_norm": 6.910274982452393,
+ "learning_rate": 1.762109846285786e-05,
+ "loss": 0.7994,
+ "step": 9081
+ },
+ {
+ "epoch": 24.74659400544959,
+ "grad_norm": 8.334527969360352,
+ "learning_rate": 1.7620527064020524e-05,
+ "loss": 0.6736,
+ "step": 9082
+ },
+ {
+ "epoch": 24.749318801089917,
+ "grad_norm": 7.239718437194824,
+ "learning_rate": 1.761995560583477e-05,
+ "loss": 0.6385,
+ "step": 9083
+ },
+ {
+ "epoch": 24.752043596730246,
+ "grad_norm": 9.957289695739746,
+ "learning_rate": 1.761938408830505e-05,
+ "loss": 0.6938,
+ "step": 9084
+ },
+ {
+ "epoch": 24.754768392370572,
+ "grad_norm": 8.416315078735352,
+ "learning_rate": 1.761881251143581e-05,
+ "loss": 0.7626,
+ "step": 9085
+ },
+ {
+ "epoch": 24.757493188010898,
+ "grad_norm": 7.973998069763184,
+ "learning_rate": 1.7618240875231504e-05,
+ "loss": 0.6124,
+ "step": 9086
+ },
+ {
+ "epoch": 24.760217983651227,
+ "grad_norm": 12.216193199157715,
+ "learning_rate": 1.7617669179696584e-05,
+ "loss": 0.6934,
+ "step": 9087
+ },
+ {
+ "epoch": 24.762942779291553,
+ "grad_norm": 8.15843391418457,
+ "learning_rate": 1.76170974248355e-05,
+ "loss": 0.5637,
+ "step": 9088
+ },
+ {
+ "epoch": 24.76566757493188,
+ "grad_norm": 9.592131614685059,
+ "learning_rate": 1.761652561065271e-05,
+ "loss": 0.5842,
+ "step": 9089
+ },
+ {
+ "epoch": 24.768392370572208,
+ "grad_norm": 8.345134735107422,
+ "learning_rate": 1.7615953737152662e-05,
+ "loss": 0.6991,
+ "step": 9090
+ },
+ {
+ "epoch": 24.771117166212534,
+ "grad_norm": 8.831202507019043,
+ "learning_rate": 1.7615381804339812e-05,
+ "loss": 0.5632,
+ "step": 9091
+ },
+ {
+ "epoch": 24.77384196185286,
+ "grad_norm": 6.586507320404053,
+ "learning_rate": 1.761480981221861e-05,
+ "loss": 0.712,
+ "step": 9092
+ },
+ {
+ "epoch": 24.77656675749319,
+ "grad_norm": 7.661722660064697,
+ "learning_rate": 1.7614237760793517e-05,
+ "loss": 0.6247,
+ "step": 9093
+ },
+ {
+ "epoch": 24.779291553133515,
+ "grad_norm": 11.912310600280762,
+ "learning_rate": 1.7613665650068986e-05,
+ "loss": 0.7829,
+ "step": 9094
+ },
+ {
+ "epoch": 24.78201634877384,
+ "grad_norm": 9.052411079406738,
+ "learning_rate": 1.7613093480049472e-05,
+ "loss": 0.6127,
+ "step": 9095
+ },
+ {
+ "epoch": 24.78474114441417,
+ "grad_norm": 8.426584243774414,
+ "learning_rate": 1.7612521250739427e-05,
+ "loss": 0.4929,
+ "step": 9096
+ },
+ {
+ "epoch": 24.787465940054496,
+ "grad_norm": 8.199124336242676,
+ "learning_rate": 1.7611948962143317e-05,
+ "loss": 0.6892,
+ "step": 9097
+ },
+ {
+ "epoch": 24.79019073569482,
+ "grad_norm": 9.086944580078125,
+ "learning_rate": 1.7611376614265586e-05,
+ "loss": 0.656,
+ "step": 9098
+ },
+ {
+ "epoch": 24.79291553133515,
+ "grad_norm": 11.262910842895508,
+ "learning_rate": 1.7610804207110708e-05,
+ "loss": 0.721,
+ "step": 9099
+ },
+ {
+ "epoch": 24.795640326975477,
+ "grad_norm": 7.025333404541016,
+ "learning_rate": 1.7610231740683127e-05,
+ "loss": 0.7167,
+ "step": 9100
+ },
+ {
+ "epoch": 24.798365122615802,
+ "grad_norm": 7.94744348526001,
+ "learning_rate": 1.7609659214987306e-05,
+ "loss": 0.6428,
+ "step": 9101
+ },
+ {
+ "epoch": 24.80108991825613,
+ "grad_norm": 7.263674736022949,
+ "learning_rate": 1.7609086630027703e-05,
+ "loss": 0.619,
+ "step": 9102
+ },
+ {
+ "epoch": 24.803814713896458,
+ "grad_norm": 6.2140793800354,
+ "learning_rate": 1.760851398580878e-05,
+ "loss": 0.6459,
+ "step": 9103
+ },
+ {
+ "epoch": 24.806539509536783,
+ "grad_norm": 8.475105285644531,
+ "learning_rate": 1.7607941282334994e-05,
+ "loss": 0.6431,
+ "step": 9104
+ },
+ {
+ "epoch": 24.809264305177113,
+ "grad_norm": 9.592691421508789,
+ "learning_rate": 1.760736851961081e-05,
+ "loss": 0.7227,
+ "step": 9105
+ },
+ {
+ "epoch": 24.81198910081744,
+ "grad_norm": 9.697248458862305,
+ "learning_rate": 1.760679569764068e-05,
+ "loss": 0.7128,
+ "step": 9106
+ },
+ {
+ "epoch": 24.814713896457764,
+ "grad_norm": 7.512829303741455,
+ "learning_rate": 1.7606222816429072e-05,
+ "loss": 0.5385,
+ "step": 9107
+ },
+ {
+ "epoch": 24.817438692098094,
+ "grad_norm": 7.659682273864746,
+ "learning_rate": 1.7605649875980444e-05,
+ "loss": 0.6131,
+ "step": 9108
+ },
+ {
+ "epoch": 24.82016348773842,
+ "grad_norm": 9.706716537475586,
+ "learning_rate": 1.760507687629926e-05,
+ "loss": 0.6518,
+ "step": 9109
+ },
+ {
+ "epoch": 24.822888283378745,
+ "grad_norm": 7.4076948165893555,
+ "learning_rate": 1.7604503817389984e-05,
+ "loss": 0.6416,
+ "step": 9110
+ },
+ {
+ "epoch": 24.825613079019075,
+ "grad_norm": 7.795478820800781,
+ "learning_rate": 1.7603930699257077e-05,
+ "loss": 0.6566,
+ "step": 9111
+ },
+ {
+ "epoch": 24.8283378746594,
+ "grad_norm": 8.182226181030273,
+ "learning_rate": 1.7603357521905002e-05,
+ "loss": 0.7444,
+ "step": 9112
+ },
+ {
+ "epoch": 24.831062670299726,
+ "grad_norm": 8.728377342224121,
+ "learning_rate": 1.760278428533822e-05,
+ "loss": 0.6691,
+ "step": 9113
+ },
+ {
+ "epoch": 24.833787465940055,
+ "grad_norm": 13.578832626342773,
+ "learning_rate": 1.7602210989561202e-05,
+ "loss": 0.6788,
+ "step": 9114
+ },
+ {
+ "epoch": 24.83651226158038,
+ "grad_norm": 9.919561386108398,
+ "learning_rate": 1.760163763457841e-05,
+ "loss": 0.6063,
+ "step": 9115
+ },
+ {
+ "epoch": 24.839237057220707,
+ "grad_norm": 7.077985763549805,
+ "learning_rate": 1.7601064220394305e-05,
+ "loss": 0.5043,
+ "step": 9116
+ },
+ {
+ "epoch": 24.841961852861036,
+ "grad_norm": 9.012791633605957,
+ "learning_rate": 1.760049074701336e-05,
+ "loss": 0.4412,
+ "step": 9117
+ },
+ {
+ "epoch": 24.844686648501362,
+ "grad_norm": 7.965156555175781,
+ "learning_rate": 1.7599917214440035e-05,
+ "loss": 0.6007,
+ "step": 9118
+ },
+ {
+ "epoch": 24.847411444141688,
+ "grad_norm": 8.324759483337402,
+ "learning_rate": 1.7599343622678802e-05,
+ "loss": 0.5599,
+ "step": 9119
+ },
+ {
+ "epoch": 24.850136239782017,
+ "grad_norm": 8.590094566345215,
+ "learning_rate": 1.7598769971734127e-05,
+ "loss": 0.7472,
+ "step": 9120
+ },
+ {
+ "epoch": 24.852861035422343,
+ "grad_norm": 8.1151762008667,
+ "learning_rate": 1.7598196261610476e-05,
+ "loss": 0.5726,
+ "step": 9121
+ },
+ {
+ "epoch": 24.85558583106267,
+ "grad_norm": 7.521329402923584,
+ "learning_rate": 1.7597622492312313e-05,
+ "loss": 0.5908,
+ "step": 9122
+ },
+ {
+ "epoch": 24.858310626703,
+ "grad_norm": 9.701559066772461,
+ "learning_rate": 1.759704866384411e-05,
+ "loss": 0.5087,
+ "step": 9123
+ },
+ {
+ "epoch": 24.861035422343324,
+ "grad_norm": 8.193989753723145,
+ "learning_rate": 1.759647477621034e-05,
+ "loss": 0.5861,
+ "step": 9124
+ },
+ {
+ "epoch": 24.86376021798365,
+ "grad_norm": 9.653748512268066,
+ "learning_rate": 1.759590082941547e-05,
+ "loss": 0.767,
+ "step": 9125
+ },
+ {
+ "epoch": 24.86648501362398,
+ "grad_norm": 7.191437244415283,
+ "learning_rate": 1.7595326823463963e-05,
+ "loss": 0.5499,
+ "step": 9126
+ },
+ {
+ "epoch": 24.869209809264305,
+ "grad_norm": 7.461208820343018,
+ "learning_rate": 1.75947527583603e-05,
+ "loss": 0.4998,
+ "step": 9127
+ },
+ {
+ "epoch": 24.87193460490463,
+ "grad_norm": 8.673975944519043,
+ "learning_rate": 1.7594178634108944e-05,
+ "loss": 0.6719,
+ "step": 9128
+ },
+ {
+ "epoch": 24.87465940054496,
+ "grad_norm": 8.278363227844238,
+ "learning_rate": 1.759360445071437e-05,
+ "loss": 0.6855,
+ "step": 9129
+ },
+ {
+ "epoch": 24.877384196185286,
+ "grad_norm": 7.993578910827637,
+ "learning_rate": 1.7593030208181052e-05,
+ "loss": 0.6843,
+ "step": 9130
+ },
+ {
+ "epoch": 24.88010899182561,
+ "grad_norm": 8.322216033935547,
+ "learning_rate": 1.7592455906513456e-05,
+ "loss": 0.7618,
+ "step": 9131
+ },
+ {
+ "epoch": 24.88283378746594,
+ "grad_norm": 10.070342063903809,
+ "learning_rate": 1.7591881545716058e-05,
+ "loss": 0.6232,
+ "step": 9132
+ },
+ {
+ "epoch": 24.885558583106267,
+ "grad_norm": 9.82460880279541,
+ "learning_rate": 1.7591307125793332e-05,
+ "loss": 0.587,
+ "step": 9133
+ },
+ {
+ "epoch": 24.888283378746593,
+ "grad_norm": 7.020534038543701,
+ "learning_rate": 1.759073264674975e-05,
+ "loss": 0.7737,
+ "step": 9134
+ },
+ {
+ "epoch": 24.891008174386922,
+ "grad_norm": 7.385281085968018,
+ "learning_rate": 1.7590158108589785e-05,
+ "loss": 0.6512,
+ "step": 9135
+ },
+ {
+ "epoch": 24.893732970027248,
+ "grad_norm": 7.650609493255615,
+ "learning_rate": 1.7589583511317915e-05,
+ "loss": 0.6586,
+ "step": 9136
+ },
+ {
+ "epoch": 24.896457765667574,
+ "grad_norm": 6.550846099853516,
+ "learning_rate": 1.7589008854938613e-05,
+ "loss": 0.5401,
+ "step": 9137
+ },
+ {
+ "epoch": 24.899182561307903,
+ "grad_norm": 7.285351753234863,
+ "learning_rate": 1.7588434139456354e-05,
+ "loss": 0.6038,
+ "step": 9138
+ },
+ {
+ "epoch": 24.90190735694823,
+ "grad_norm": 7.743149280548096,
+ "learning_rate": 1.7587859364875613e-05,
+ "loss": 0.7252,
+ "step": 9139
+ },
+ {
+ "epoch": 24.904632152588555,
+ "grad_norm": 7.218400478363037,
+ "learning_rate": 1.7587284531200866e-05,
+ "loss": 0.4827,
+ "step": 9140
+ },
+ {
+ "epoch": 24.907356948228884,
+ "grad_norm": 6.358419418334961,
+ "learning_rate": 1.7586709638436593e-05,
+ "loss": 0.6794,
+ "step": 9141
+ },
+ {
+ "epoch": 24.91008174386921,
+ "grad_norm": 7.754582405090332,
+ "learning_rate": 1.758613468658727e-05,
+ "loss": 0.5704,
+ "step": 9142
+ },
+ {
+ "epoch": 24.912806539509535,
+ "grad_norm": 8.69373893737793,
+ "learning_rate": 1.7585559675657377e-05,
+ "loss": 0.7025,
+ "step": 9143
+ },
+ {
+ "epoch": 24.915531335149865,
+ "grad_norm": 8.12856674194336,
+ "learning_rate": 1.7584984605651385e-05,
+ "loss": 0.5807,
+ "step": 9144
+ },
+ {
+ "epoch": 24.91825613079019,
+ "grad_norm": 6.606778621673584,
+ "learning_rate": 1.758440947657378e-05,
+ "loss": 0.6108,
+ "step": 9145
+ },
+ {
+ "epoch": 24.920980926430516,
+ "grad_norm": 8.338944435119629,
+ "learning_rate": 1.7583834288429032e-05,
+ "loss": 0.7186,
+ "step": 9146
+ },
+ {
+ "epoch": 24.923705722070846,
+ "grad_norm": 8.624048233032227,
+ "learning_rate": 1.7583259041221634e-05,
+ "loss": 0.5325,
+ "step": 9147
+ },
+ {
+ "epoch": 24.92643051771117,
+ "grad_norm": 8.943880081176758,
+ "learning_rate": 1.7582683734956055e-05,
+ "loss": 0.6185,
+ "step": 9148
+ },
+ {
+ "epoch": 24.929155313351497,
+ "grad_norm": 8.175042152404785,
+ "learning_rate": 1.758210836963678e-05,
+ "loss": 0.7002,
+ "step": 9149
+ },
+ {
+ "epoch": 24.931880108991827,
+ "grad_norm": 8.36201286315918,
+ "learning_rate": 1.758153294526829e-05,
+ "loss": 0.5826,
+ "step": 9150
+ },
+ {
+ "epoch": 24.934604904632153,
+ "grad_norm": 9.481425285339355,
+ "learning_rate": 1.7580957461855064e-05,
+ "loss": 0.7182,
+ "step": 9151
+ },
+ {
+ "epoch": 24.93732970027248,
+ "grad_norm": 8.212348937988281,
+ "learning_rate": 1.7580381919401586e-05,
+ "loss": 0.6982,
+ "step": 9152
+ },
+ {
+ "epoch": 24.940054495912808,
+ "grad_norm": 7.990788459777832,
+ "learning_rate": 1.7579806317912336e-05,
+ "loss": 0.5393,
+ "step": 9153
+ },
+ {
+ "epoch": 24.942779291553133,
+ "grad_norm": 9.8809175491333,
+ "learning_rate": 1.7579230657391803e-05,
+ "loss": 0.5881,
+ "step": 9154
+ },
+ {
+ "epoch": 24.94550408719346,
+ "grad_norm": 10.29200553894043,
+ "learning_rate": 1.757865493784446e-05,
+ "loss": 0.6382,
+ "step": 9155
+ },
+ {
+ "epoch": 24.94822888283379,
+ "grad_norm": 7.920681953430176,
+ "learning_rate": 1.7578079159274798e-05,
+ "loss": 0.7075,
+ "step": 9156
+ },
+ {
+ "epoch": 24.950953678474114,
+ "grad_norm": 9.220345497131348,
+ "learning_rate": 1.75775033216873e-05,
+ "loss": 0.6733,
+ "step": 9157
+ },
+ {
+ "epoch": 24.95367847411444,
+ "grad_norm": 7.205484867095947,
+ "learning_rate": 1.757692742508645e-05,
+ "loss": 0.5162,
+ "step": 9158
+ },
+ {
+ "epoch": 24.95640326975477,
+ "grad_norm": 7.997858047485352,
+ "learning_rate": 1.7576351469476735e-05,
+ "loss": 0.6132,
+ "step": 9159
+ },
+ {
+ "epoch": 24.959128065395095,
+ "grad_norm": 8.290677070617676,
+ "learning_rate": 1.7575775454862636e-05,
+ "loss": 0.6284,
+ "step": 9160
+ },
+ {
+ "epoch": 24.96185286103542,
+ "grad_norm": 8.271625518798828,
+ "learning_rate": 1.7575199381248643e-05,
+ "loss": 0.6142,
+ "step": 9161
+ },
+ {
+ "epoch": 24.96457765667575,
+ "grad_norm": 7.2044572830200195,
+ "learning_rate": 1.757462324863924e-05,
+ "loss": 0.5352,
+ "step": 9162
+ },
+ {
+ "epoch": 24.967302452316076,
+ "grad_norm": 7.704048156738281,
+ "learning_rate": 1.7574047057038914e-05,
+ "loss": 0.6229,
+ "step": 9163
+ },
+ {
+ "epoch": 24.970027247956402,
+ "grad_norm": 8.477546691894531,
+ "learning_rate": 1.7573470806452156e-05,
+ "loss": 0.6918,
+ "step": 9164
+ },
+ {
+ "epoch": 24.97275204359673,
+ "grad_norm": 9.030668258666992,
+ "learning_rate": 1.7572894496883448e-05,
+ "loss": 0.6869,
+ "step": 9165
+ },
+ {
+ "epoch": 24.975476839237057,
+ "grad_norm": 7.245536804199219,
+ "learning_rate": 1.7572318128337286e-05,
+ "loss": 0.5255,
+ "step": 9166
+ },
+ {
+ "epoch": 24.978201634877383,
+ "grad_norm": 8.229454040527344,
+ "learning_rate": 1.757174170081815e-05,
+ "loss": 0.6912,
+ "step": 9167
+ },
+ {
+ "epoch": 24.980926430517712,
+ "grad_norm": 10.456474304199219,
+ "learning_rate": 1.7571165214330533e-05,
+ "loss": 0.5757,
+ "step": 9168
+ },
+ {
+ "epoch": 24.983651226158038,
+ "grad_norm": 13.14166259765625,
+ "learning_rate": 1.7570588668878925e-05,
+ "loss": 0.8313,
+ "step": 9169
+ },
+ {
+ "epoch": 24.986376021798364,
+ "grad_norm": 9.433475494384766,
+ "learning_rate": 1.757001206446782e-05,
+ "loss": 0.6941,
+ "step": 9170
+ },
+ {
+ "epoch": 24.989100817438693,
+ "grad_norm": 8.512743949890137,
+ "learning_rate": 1.7569435401101702e-05,
+ "loss": 0.6174,
+ "step": 9171
+ },
+ {
+ "epoch": 24.99182561307902,
+ "grad_norm": 8.018141746520996,
+ "learning_rate": 1.7568858678785067e-05,
+ "loss": 0.6895,
+ "step": 9172
+ },
+ {
+ "epoch": 24.994550408719345,
+ "grad_norm": 7.822866439819336,
+ "learning_rate": 1.75682818975224e-05,
+ "loss": 0.7471,
+ "step": 9173
+ },
+ {
+ "epoch": 24.997275204359674,
+ "grad_norm": 8.118390083312988,
+ "learning_rate": 1.75677050573182e-05,
+ "loss": 0.5596,
+ "step": 9174
+ },
+ {
+ "epoch": 25.0,
+ "grad_norm": 7.722609043121338,
+ "learning_rate": 1.7567128158176955e-05,
+ "loss": 0.7333,
+ "step": 9175
+ },
+ {
+ "epoch": 25.002724795640326,
+ "grad_norm": 7.151113510131836,
+ "learning_rate": 1.756655120010316e-05,
+ "loss": 0.6569,
+ "step": 9176
+ },
+ {
+ "epoch": 25.005449591280655,
+ "grad_norm": 7.189694404602051,
+ "learning_rate": 1.756597418310131e-05,
+ "loss": 0.4894,
+ "step": 9177
+ },
+ {
+ "epoch": 25.00817438692098,
+ "grad_norm": 7.096490859985352,
+ "learning_rate": 1.7565397107175893e-05,
+ "loss": 0.6046,
+ "step": 9178
+ },
+ {
+ "epoch": 25.010899182561307,
+ "grad_norm": 8.53683853149414,
+ "learning_rate": 1.7564819972331408e-05,
+ "loss": 0.593,
+ "step": 9179
+ },
+ {
+ "epoch": 25.013623978201636,
+ "grad_norm": 7.668188571929932,
+ "learning_rate": 1.7564242778572348e-05,
+ "loss": 0.6535,
+ "step": 9180
+ },
+ {
+ "epoch": 25.016348773841962,
+ "grad_norm": 7.663745403289795,
+ "learning_rate": 1.756366552590321e-05,
+ "loss": 0.4633,
+ "step": 9181
+ },
+ {
+ "epoch": 25.019073569482288,
+ "grad_norm": 6.856311321258545,
+ "learning_rate": 1.756308821432849e-05,
+ "loss": 0.5386,
+ "step": 9182
+ },
+ {
+ "epoch": 25.021798365122617,
+ "grad_norm": 8.927593231201172,
+ "learning_rate": 1.7562510843852678e-05,
+ "loss": 0.5468,
+ "step": 9183
+ },
+ {
+ "epoch": 25.024523160762943,
+ "grad_norm": 7.710852146148682,
+ "learning_rate": 1.7561933414480278e-05,
+ "loss": 0.5551,
+ "step": 9184
+ },
+ {
+ "epoch": 25.02724795640327,
+ "grad_norm": 7.814901828765869,
+ "learning_rate": 1.7561355926215784e-05,
+ "loss": 0.5698,
+ "step": 9185
+ },
+ {
+ "epoch": 25.029972752043598,
+ "grad_norm": 7.54987907409668,
+ "learning_rate": 1.7560778379063693e-05,
+ "loss": 0.5743,
+ "step": 9186
+ },
+ {
+ "epoch": 25.032697547683924,
+ "grad_norm": 8.966099739074707,
+ "learning_rate": 1.75602007730285e-05,
+ "loss": 0.6206,
+ "step": 9187
+ },
+ {
+ "epoch": 25.03542234332425,
+ "grad_norm": 9.749812126159668,
+ "learning_rate": 1.7559623108114713e-05,
+ "loss": 0.5268,
+ "step": 9188
+ },
+ {
+ "epoch": 25.03814713896458,
+ "grad_norm": 7.751905918121338,
+ "learning_rate": 1.755904538432682e-05,
+ "loss": 0.7687,
+ "step": 9189
+ },
+ {
+ "epoch": 25.040871934604905,
+ "grad_norm": 6.137204170227051,
+ "learning_rate": 1.7558467601669326e-05,
+ "loss": 0.6042,
+ "step": 9190
+ },
+ {
+ "epoch": 25.04359673024523,
+ "grad_norm": 9.052706718444824,
+ "learning_rate": 1.755788976014673e-05,
+ "loss": 0.6306,
+ "step": 9191
+ },
+ {
+ "epoch": 25.04632152588556,
+ "grad_norm": 7.87229585647583,
+ "learning_rate": 1.755731185976353e-05,
+ "loss": 0.4666,
+ "step": 9192
+ },
+ {
+ "epoch": 25.049046321525886,
+ "grad_norm": 12.386114120483398,
+ "learning_rate": 1.755673390052423e-05,
+ "loss": 0.4894,
+ "step": 9193
+ },
+ {
+ "epoch": 25.05177111716621,
+ "grad_norm": 7.40094518661499,
+ "learning_rate": 1.755615588243333e-05,
+ "loss": 0.4758,
+ "step": 9194
+ },
+ {
+ "epoch": 25.05449591280654,
+ "grad_norm": 9.998497009277344,
+ "learning_rate": 1.755557780549533e-05,
+ "loss": 0.5323,
+ "step": 9195
+ },
+ {
+ "epoch": 25.057220708446867,
+ "grad_norm": 7.588438034057617,
+ "learning_rate": 1.7554999669714736e-05,
+ "loss": 0.6864,
+ "step": 9196
+ },
+ {
+ "epoch": 25.059945504087192,
+ "grad_norm": 7.710918426513672,
+ "learning_rate": 1.7554421475096047e-05,
+ "loss": 0.5907,
+ "step": 9197
+ },
+ {
+ "epoch": 25.06267029972752,
+ "grad_norm": 7.103505611419678,
+ "learning_rate": 1.7553843221643764e-05,
+ "loss": 0.5072,
+ "step": 9198
+ },
+ {
+ "epoch": 25.065395095367847,
+ "grad_norm": 7.364475727081299,
+ "learning_rate": 1.7553264909362397e-05,
+ "loss": 0.6147,
+ "step": 9199
+ },
+ {
+ "epoch": 25.068119891008173,
+ "grad_norm": 6.914089679718018,
+ "learning_rate": 1.755268653825644e-05,
+ "loss": 0.7128,
+ "step": 9200
+ },
+ {
+ "epoch": 25.070844686648503,
+ "grad_norm": 6.164554595947266,
+ "learning_rate": 1.7552108108330407e-05,
+ "loss": 0.5146,
+ "step": 9201
+ },
+ {
+ "epoch": 25.07356948228883,
+ "grad_norm": 7.43580961227417,
+ "learning_rate": 1.75515296195888e-05,
+ "loss": 0.4504,
+ "step": 9202
+ },
+ {
+ "epoch": 25.076294277929154,
+ "grad_norm": 6.554437637329102,
+ "learning_rate": 1.755095107203612e-05,
+ "loss": 0.6844,
+ "step": 9203
+ },
+ {
+ "epoch": 25.079019073569484,
+ "grad_norm": 8.390671730041504,
+ "learning_rate": 1.755037246567688e-05,
+ "loss": 0.6544,
+ "step": 9204
+ },
+ {
+ "epoch": 25.08174386920981,
+ "grad_norm": 9.178902626037598,
+ "learning_rate": 1.754979380051558e-05,
+ "loss": 0.5558,
+ "step": 9205
+ },
+ {
+ "epoch": 25.084468664850135,
+ "grad_norm": 6.180863380432129,
+ "learning_rate": 1.754921507655673e-05,
+ "loss": 0.6732,
+ "step": 9206
+ },
+ {
+ "epoch": 25.087193460490465,
+ "grad_norm": 6.8885674476623535,
+ "learning_rate": 1.7548636293804838e-05,
+ "loss": 0.7445,
+ "step": 9207
+ },
+ {
+ "epoch": 25.08991825613079,
+ "grad_norm": 9.175154685974121,
+ "learning_rate": 1.7548057452264404e-05,
+ "loss": 0.6847,
+ "step": 9208
+ },
+ {
+ "epoch": 25.092643051771116,
+ "grad_norm": 7.723278999328613,
+ "learning_rate": 1.7547478551939944e-05,
+ "loss": 0.5176,
+ "step": 9209
+ },
+ {
+ "epoch": 25.095367847411445,
+ "grad_norm": 9.161273956298828,
+ "learning_rate": 1.7546899592835968e-05,
+ "loss": 0.5295,
+ "step": 9210
+ },
+ {
+ "epoch": 25.09809264305177,
+ "grad_norm": 7.03291654586792,
+ "learning_rate": 1.7546320574956976e-05,
+ "loss": 0.5646,
+ "step": 9211
+ },
+ {
+ "epoch": 25.100817438692097,
+ "grad_norm": 7.496363162994385,
+ "learning_rate": 1.7545741498307483e-05,
+ "loss": 0.5092,
+ "step": 9212
+ },
+ {
+ "epoch": 25.103542234332426,
+ "grad_norm": 9.686806678771973,
+ "learning_rate": 1.7545162362891997e-05,
+ "loss": 0.4745,
+ "step": 9213
+ },
+ {
+ "epoch": 25.106267029972752,
+ "grad_norm": 8.231841087341309,
+ "learning_rate": 1.754458316871503e-05,
+ "loss": 0.5324,
+ "step": 9214
+ },
+ {
+ "epoch": 25.108991825613078,
+ "grad_norm": 8.02005386352539,
+ "learning_rate": 1.7544003915781097e-05,
+ "loss": 0.6253,
+ "step": 9215
+ },
+ {
+ "epoch": 25.111716621253407,
+ "grad_norm": 6.017721652984619,
+ "learning_rate": 1.7543424604094697e-05,
+ "loss": 0.5031,
+ "step": 9216
+ },
+ {
+ "epoch": 25.114441416893733,
+ "grad_norm": 8.045443534851074,
+ "learning_rate": 1.754284523366035e-05,
+ "loss": 0.6282,
+ "step": 9217
+ },
+ {
+ "epoch": 25.11716621253406,
+ "grad_norm": 6.175623893737793,
+ "learning_rate": 1.7542265804482573e-05,
+ "loss": 0.6051,
+ "step": 9218
+ },
+ {
+ "epoch": 25.11989100817439,
+ "grad_norm": 7.03268575668335,
+ "learning_rate": 1.754168631656587e-05,
+ "loss": 0.5444,
+ "step": 9219
+ },
+ {
+ "epoch": 25.122615803814714,
+ "grad_norm": 9.013124465942383,
+ "learning_rate": 1.754110676991475e-05,
+ "loss": 0.5907,
+ "step": 9220
+ },
+ {
+ "epoch": 25.12534059945504,
+ "grad_norm": 7.212218284606934,
+ "learning_rate": 1.7540527164533744e-05,
+ "loss": 0.6246,
+ "step": 9221
+ },
+ {
+ "epoch": 25.12806539509537,
+ "grad_norm": 7.503476142883301,
+ "learning_rate": 1.7539947500427346e-05,
+ "loss": 0.5248,
+ "step": 9222
+ },
+ {
+ "epoch": 25.130790190735695,
+ "grad_norm": 7.938776969909668,
+ "learning_rate": 1.7539367777600088e-05,
+ "loss": 0.5154,
+ "step": 9223
+ },
+ {
+ "epoch": 25.13351498637602,
+ "grad_norm": 7.27805757522583,
+ "learning_rate": 1.753878799605647e-05,
+ "loss": 0.6232,
+ "step": 9224
+ },
+ {
+ "epoch": 25.13623978201635,
+ "grad_norm": 7.290003776550293,
+ "learning_rate": 1.7538208155801014e-05,
+ "loss": 0.5217,
+ "step": 9225
+ },
+ {
+ "epoch": 25.138964577656676,
+ "grad_norm": 7.449812412261963,
+ "learning_rate": 1.7537628256838238e-05,
+ "loss": 0.5759,
+ "step": 9226
+ },
+ {
+ "epoch": 25.141689373297,
+ "grad_norm": 9.210305213928223,
+ "learning_rate": 1.7537048299172657e-05,
+ "loss": 0.541,
+ "step": 9227
+ },
+ {
+ "epoch": 25.14441416893733,
+ "grad_norm": 8.278675079345703,
+ "learning_rate": 1.7536468282808787e-05,
+ "loss": 0.5414,
+ "step": 9228
+ },
+ {
+ "epoch": 25.147138964577657,
+ "grad_norm": 8.17081356048584,
+ "learning_rate": 1.753588820775114e-05,
+ "loss": 0.6001,
+ "step": 9229
+ },
+ {
+ "epoch": 25.149863760217983,
+ "grad_norm": 7.017838478088379,
+ "learning_rate": 1.7535308074004242e-05,
+ "loss": 0.5342,
+ "step": 9230
+ },
+ {
+ "epoch": 25.152588555858312,
+ "grad_norm": 7.229761600494385,
+ "learning_rate": 1.7534727881572603e-05,
+ "loss": 0.5457,
+ "step": 9231
+ },
+ {
+ "epoch": 25.155313351498638,
+ "grad_norm": 7.093820095062256,
+ "learning_rate": 1.753414763046075e-05,
+ "loss": 0.5176,
+ "step": 9232
+ },
+ {
+ "epoch": 25.158038147138964,
+ "grad_norm": 7.416743755340576,
+ "learning_rate": 1.7533567320673197e-05,
+ "loss": 0.5902,
+ "step": 9233
+ },
+ {
+ "epoch": 25.160762942779293,
+ "grad_norm": 7.925085544586182,
+ "learning_rate": 1.7532986952214458e-05,
+ "loss": 0.5453,
+ "step": 9234
+ },
+ {
+ "epoch": 25.16348773841962,
+ "grad_norm": 7.787499904632568,
+ "learning_rate": 1.7532406525089065e-05,
+ "loss": 0.4775,
+ "step": 9235
+ },
+ {
+ "epoch": 25.166212534059945,
+ "grad_norm": 8.381814956665039,
+ "learning_rate": 1.7531826039301534e-05,
+ "loss": 0.6014,
+ "step": 9236
+ },
+ {
+ "epoch": 25.168937329700274,
+ "grad_norm": 10.34481430053711,
+ "learning_rate": 1.7531245494856383e-05,
+ "loss": 0.6141,
+ "step": 9237
+ },
+ {
+ "epoch": 25.1716621253406,
+ "grad_norm": 6.762233734130859,
+ "learning_rate": 1.753066489175813e-05,
+ "loss": 0.6984,
+ "step": 9238
+ },
+ {
+ "epoch": 25.174386920980925,
+ "grad_norm": 8.525280952453613,
+ "learning_rate": 1.7530084230011305e-05,
+ "loss": 0.5868,
+ "step": 9239
+ },
+ {
+ "epoch": 25.177111716621255,
+ "grad_norm": 8.026586532592773,
+ "learning_rate": 1.7529503509620426e-05,
+ "loss": 0.4789,
+ "step": 9240
+ },
+ {
+ "epoch": 25.17983651226158,
+ "grad_norm": 7.491539478302002,
+ "learning_rate": 1.7528922730590014e-05,
+ "loss": 0.5432,
+ "step": 9241
+ },
+ {
+ "epoch": 25.182561307901906,
+ "grad_norm": 7.025993824005127,
+ "learning_rate": 1.7528341892924598e-05,
+ "loss": 0.53,
+ "step": 9242
+ },
+ {
+ "epoch": 25.185286103542236,
+ "grad_norm": 8.817523956298828,
+ "learning_rate": 1.7527760996628695e-05,
+ "loss": 0.677,
+ "step": 9243
+ },
+ {
+ "epoch": 25.18801089918256,
+ "grad_norm": 7.676280975341797,
+ "learning_rate": 1.7527180041706834e-05,
+ "loss": 0.5723,
+ "step": 9244
+ },
+ {
+ "epoch": 25.190735694822887,
+ "grad_norm": 7.347946643829346,
+ "learning_rate": 1.7526599028163534e-05,
+ "loss": 0.6664,
+ "step": 9245
+ },
+ {
+ "epoch": 25.193460490463217,
+ "grad_norm": 8.0401029586792,
+ "learning_rate": 1.7526017956003324e-05,
+ "loss": 0.5846,
+ "step": 9246
+ },
+ {
+ "epoch": 25.196185286103542,
+ "grad_norm": 6.611307144165039,
+ "learning_rate": 1.7525436825230728e-05,
+ "loss": 0.3984,
+ "step": 9247
+ },
+ {
+ "epoch": 25.19891008174387,
+ "grad_norm": 8.031599998474121,
+ "learning_rate": 1.7524855635850272e-05,
+ "loss": 0.5362,
+ "step": 9248
+ },
+ {
+ "epoch": 25.201634877384198,
+ "grad_norm": 7.952152252197266,
+ "learning_rate": 1.7524274387866483e-05,
+ "loss": 0.625,
+ "step": 9249
+ },
+ {
+ "epoch": 25.204359673024523,
+ "grad_norm": 9.92528247833252,
+ "learning_rate": 1.752369308128389e-05,
+ "loss": 0.446,
+ "step": 9250
+ },
+ {
+ "epoch": 25.20708446866485,
+ "grad_norm": 8.438230514526367,
+ "learning_rate": 1.7523111716107016e-05,
+ "loss": 0.5319,
+ "step": 9251
+ },
+ {
+ "epoch": 25.20980926430518,
+ "grad_norm": 6.178292274475098,
+ "learning_rate": 1.7522530292340387e-05,
+ "loss": 0.5495,
+ "step": 9252
+ },
+ {
+ "epoch": 25.212534059945504,
+ "grad_norm": 7.064868450164795,
+ "learning_rate": 1.7521948809988538e-05,
+ "loss": 0.6548,
+ "step": 9253
+ },
+ {
+ "epoch": 25.21525885558583,
+ "grad_norm": 9.970439910888672,
+ "learning_rate": 1.752136726905599e-05,
+ "loss": 0.6219,
+ "step": 9254
+ },
+ {
+ "epoch": 25.21798365122616,
+ "grad_norm": 6.916043758392334,
+ "learning_rate": 1.752078566954728e-05,
+ "loss": 0.5088,
+ "step": 9255
+ },
+ {
+ "epoch": 25.220708446866485,
+ "grad_norm": 7.9270195960998535,
+ "learning_rate": 1.752020401146693e-05,
+ "loss": 0.6082,
+ "step": 9256
+ },
+ {
+ "epoch": 25.22343324250681,
+ "grad_norm": 7.422311305999756,
+ "learning_rate": 1.7519622294819474e-05,
+ "loss": 0.509,
+ "step": 9257
+ },
+ {
+ "epoch": 25.22615803814714,
+ "grad_norm": 8.811856269836426,
+ "learning_rate": 1.7519040519609443e-05,
+ "loss": 0.6207,
+ "step": 9258
+ },
+ {
+ "epoch": 25.228882833787466,
+ "grad_norm": 12.191774368286133,
+ "learning_rate": 1.751845868584136e-05,
+ "loss": 0.4642,
+ "step": 9259
+ },
+ {
+ "epoch": 25.231607629427792,
+ "grad_norm": 6.951323986053467,
+ "learning_rate": 1.7517876793519772e-05,
+ "loss": 0.7046,
+ "step": 9260
+ },
+ {
+ "epoch": 25.23433242506812,
+ "grad_norm": 9.310023307800293,
+ "learning_rate": 1.75172948426492e-05,
+ "loss": 0.531,
+ "step": 9261
+ },
+ {
+ "epoch": 25.237057220708447,
+ "grad_norm": 11.55679988861084,
+ "learning_rate": 1.751671283323417e-05,
+ "loss": 0.5942,
+ "step": 9262
+ },
+ {
+ "epoch": 25.239782016348773,
+ "grad_norm": 6.232604026794434,
+ "learning_rate": 1.751613076527923e-05,
+ "loss": 0.6099,
+ "step": 9263
+ },
+ {
+ "epoch": 25.242506811989102,
+ "grad_norm": 10.137306213378906,
+ "learning_rate": 1.7515548638788904e-05,
+ "loss": 0.6305,
+ "step": 9264
+ },
+ {
+ "epoch": 25.245231607629428,
+ "grad_norm": 7.340976238250732,
+ "learning_rate": 1.7514966453767725e-05,
+ "loss": 0.5643,
+ "step": 9265
+ },
+ {
+ "epoch": 25.247956403269754,
+ "grad_norm": 6.675346851348877,
+ "learning_rate": 1.751438421022023e-05,
+ "loss": 0.6963,
+ "step": 9266
+ },
+ {
+ "epoch": 25.250681198910083,
+ "grad_norm": 9.164529800415039,
+ "learning_rate": 1.7513801908150953e-05,
+ "loss": 0.634,
+ "step": 9267
+ },
+ {
+ "epoch": 25.25340599455041,
+ "grad_norm": 7.60259485244751,
+ "learning_rate": 1.7513219547564427e-05,
+ "loss": 0.4993,
+ "step": 9268
+ },
+ {
+ "epoch": 25.256130790190735,
+ "grad_norm": 7.457983016967773,
+ "learning_rate": 1.7512637128465195e-05,
+ "loss": 0.5522,
+ "step": 9269
+ },
+ {
+ "epoch": 25.258855585831064,
+ "grad_norm": 7.982919216156006,
+ "learning_rate": 1.751205465085778e-05,
+ "loss": 0.5412,
+ "step": 9270
+ },
+ {
+ "epoch": 25.26158038147139,
+ "grad_norm": 6.639307022094727,
+ "learning_rate": 1.7511472114746727e-05,
+ "loss": 0.6172,
+ "step": 9271
+ },
+ {
+ "epoch": 25.264305177111716,
+ "grad_norm": 9.026050567626953,
+ "learning_rate": 1.7510889520136572e-05,
+ "loss": 0.516,
+ "step": 9272
+ },
+ {
+ "epoch": 25.267029972752045,
+ "grad_norm": 11.0486478805542,
+ "learning_rate": 1.751030686703185e-05,
+ "loss": 0.5549,
+ "step": 9273
+ },
+ {
+ "epoch": 25.26975476839237,
+ "grad_norm": 6.79197359085083,
+ "learning_rate": 1.7509724155437104e-05,
+ "loss": 0.5136,
+ "step": 9274
+ },
+ {
+ "epoch": 25.272479564032697,
+ "grad_norm": 9.363343238830566,
+ "learning_rate": 1.750914138535686e-05,
+ "loss": 0.4385,
+ "step": 9275
+ },
+ {
+ "epoch": 25.275204359673026,
+ "grad_norm": 8.308867454528809,
+ "learning_rate": 1.750855855679567e-05,
+ "loss": 0.5222,
+ "step": 9276
+ },
+ {
+ "epoch": 25.277929155313352,
+ "grad_norm": 7.330071926116943,
+ "learning_rate": 1.750797566975807e-05,
+ "loss": 0.5204,
+ "step": 9277
+ },
+ {
+ "epoch": 25.280653950953678,
+ "grad_norm": 7.579598426818848,
+ "learning_rate": 1.7507392724248592e-05,
+ "loss": 0.5756,
+ "step": 9278
+ },
+ {
+ "epoch": 25.283378746594007,
+ "grad_norm": 7.826560020446777,
+ "learning_rate": 1.750680972027178e-05,
+ "loss": 0.5952,
+ "step": 9279
+ },
+ {
+ "epoch": 25.286103542234333,
+ "grad_norm": 7.135838031768799,
+ "learning_rate": 1.750622665783218e-05,
+ "loss": 0.6481,
+ "step": 9280
+ },
+ {
+ "epoch": 25.28882833787466,
+ "grad_norm": 14.81757640838623,
+ "learning_rate": 1.7505643536934326e-05,
+ "loss": 0.7836,
+ "step": 9281
+ },
+ {
+ "epoch": 25.291553133514988,
+ "grad_norm": 7.334166526794434,
+ "learning_rate": 1.750506035758276e-05,
+ "loss": 0.546,
+ "step": 9282
+ },
+ {
+ "epoch": 25.294277929155314,
+ "grad_norm": 7.982358455657959,
+ "learning_rate": 1.750447711978203e-05,
+ "loss": 0.5037,
+ "step": 9283
+ },
+ {
+ "epoch": 25.29700272479564,
+ "grad_norm": 9.636107444763184,
+ "learning_rate": 1.7503893823536675e-05,
+ "loss": 0.5786,
+ "step": 9284
+ },
+ {
+ "epoch": 25.29972752043597,
+ "grad_norm": 8.395858764648438,
+ "learning_rate": 1.7503310468851232e-05,
+ "loss": 0.5997,
+ "step": 9285
+ },
+ {
+ "epoch": 25.302452316076295,
+ "grad_norm": 9.377330780029297,
+ "learning_rate": 1.750272705573025e-05,
+ "loss": 0.4741,
+ "step": 9286
+ },
+ {
+ "epoch": 25.30517711171662,
+ "grad_norm": 7.8394951820373535,
+ "learning_rate": 1.750214358417827e-05,
+ "loss": 0.5222,
+ "step": 9287
+ },
+ {
+ "epoch": 25.30790190735695,
+ "grad_norm": 10.575955390930176,
+ "learning_rate": 1.750156005419984e-05,
+ "loss": 0.6584,
+ "step": 9288
+ },
+ {
+ "epoch": 25.310626702997276,
+ "grad_norm": 8.982266426086426,
+ "learning_rate": 1.7500976465799496e-05,
+ "loss": 0.8733,
+ "step": 9289
+ },
+ {
+ "epoch": 25.3133514986376,
+ "grad_norm": 10.613094329833984,
+ "learning_rate": 1.7500392818981792e-05,
+ "loss": 0.5869,
+ "step": 9290
+ },
+ {
+ "epoch": 25.31607629427793,
+ "grad_norm": 7.434613227844238,
+ "learning_rate": 1.749980911375127e-05,
+ "loss": 0.5545,
+ "step": 9291
+ },
+ {
+ "epoch": 25.318801089918257,
+ "grad_norm": 6.9735565185546875,
+ "learning_rate": 1.7499225350112475e-05,
+ "loss": 0.5378,
+ "step": 9292
+ },
+ {
+ "epoch": 25.321525885558582,
+ "grad_norm": 8.49386215209961,
+ "learning_rate": 1.7498641528069956e-05,
+ "loss": 0.5077,
+ "step": 9293
+ },
+ {
+ "epoch": 25.32425068119891,
+ "grad_norm": 9.577007293701172,
+ "learning_rate": 1.749805764762826e-05,
+ "loss": 0.6476,
+ "step": 9294
+ },
+ {
+ "epoch": 25.326975476839237,
+ "grad_norm": 7.3503265380859375,
+ "learning_rate": 1.749747370879193e-05,
+ "loss": 0.5378,
+ "step": 9295
+ },
+ {
+ "epoch": 25.329700272479563,
+ "grad_norm": 7.510955810546875,
+ "learning_rate": 1.7496889711565516e-05,
+ "loss": 0.6151,
+ "step": 9296
+ },
+ {
+ "epoch": 25.332425068119893,
+ "grad_norm": 8.559822082519531,
+ "learning_rate": 1.7496305655953567e-05,
+ "loss": 0.4661,
+ "step": 9297
+ },
+ {
+ "epoch": 25.33514986376022,
+ "grad_norm": 7.167689800262451,
+ "learning_rate": 1.749572154196063e-05,
+ "loss": 0.5245,
+ "step": 9298
+ },
+ {
+ "epoch": 25.337874659400544,
+ "grad_norm": 8.277609825134277,
+ "learning_rate": 1.749513736959126e-05,
+ "loss": 0.7338,
+ "step": 9299
+ },
+ {
+ "epoch": 25.340599455040874,
+ "grad_norm": 7.558475971221924,
+ "learning_rate": 1.7494553138849993e-05,
+ "loss": 0.5319,
+ "step": 9300
+ },
+ {
+ "epoch": 25.3433242506812,
+ "grad_norm": 12.541115760803223,
+ "learning_rate": 1.749396884974139e-05,
+ "loss": 0.6882,
+ "step": 9301
+ },
+ {
+ "epoch": 25.346049046321525,
+ "grad_norm": 9.739608764648438,
+ "learning_rate": 1.7493384502270003e-05,
+ "loss": 0.6673,
+ "step": 9302
+ },
+ {
+ "epoch": 25.348773841961854,
+ "grad_norm": 8.39655590057373,
+ "learning_rate": 1.7492800096440376e-05,
+ "loss": 0.482,
+ "step": 9303
+ },
+ {
+ "epoch": 25.35149863760218,
+ "grad_norm": 11.642461776733398,
+ "learning_rate": 1.749221563225706e-05,
+ "loss": 0.5998,
+ "step": 9304
+ },
+ {
+ "epoch": 25.354223433242506,
+ "grad_norm": 9.626822471618652,
+ "learning_rate": 1.7491631109724613e-05,
+ "loss": 0.7056,
+ "step": 9305
+ },
+ {
+ "epoch": 25.356948228882835,
+ "grad_norm": 7.723657131195068,
+ "learning_rate": 1.7491046528847584e-05,
+ "loss": 0.5672,
+ "step": 9306
+ },
+ {
+ "epoch": 25.35967302452316,
+ "grad_norm": 8.35869026184082,
+ "learning_rate": 1.7490461889630523e-05,
+ "loss": 0.5688,
+ "step": 9307
+ },
+ {
+ "epoch": 25.362397820163487,
+ "grad_norm": 7.555449485778809,
+ "learning_rate": 1.748987719207799e-05,
+ "loss": 0.5198,
+ "step": 9308
+ },
+ {
+ "epoch": 25.365122615803816,
+ "grad_norm": 8.054333686828613,
+ "learning_rate": 1.748929243619453e-05,
+ "loss": 0.6856,
+ "step": 9309
+ },
+ {
+ "epoch": 25.367847411444142,
+ "grad_norm": 9.204339027404785,
+ "learning_rate": 1.7488707621984702e-05,
+ "loss": 0.5024,
+ "step": 9310
+ },
+ {
+ "epoch": 25.370572207084468,
+ "grad_norm": 7.36260461807251,
+ "learning_rate": 1.7488122749453067e-05,
+ "loss": 0.6157,
+ "step": 9311
+ },
+ {
+ "epoch": 25.373297002724797,
+ "grad_norm": 7.929131031036377,
+ "learning_rate": 1.7487537818604166e-05,
+ "loss": 0.6201,
+ "step": 9312
+ },
+ {
+ "epoch": 25.376021798365123,
+ "grad_norm": 6.746554374694824,
+ "learning_rate": 1.7486952829442562e-05,
+ "loss": 0.5786,
+ "step": 9313
+ },
+ {
+ "epoch": 25.37874659400545,
+ "grad_norm": 8.873085021972656,
+ "learning_rate": 1.7486367781972813e-05,
+ "loss": 0.6929,
+ "step": 9314
+ },
+ {
+ "epoch": 25.381471389645778,
+ "grad_norm": 8.892407417297363,
+ "learning_rate": 1.7485782676199475e-05,
+ "loss": 0.5998,
+ "step": 9315
+ },
+ {
+ "epoch": 25.384196185286104,
+ "grad_norm": 11.712400436401367,
+ "learning_rate": 1.7485197512127096e-05,
+ "loss": 0.4626,
+ "step": 9316
+ },
+ {
+ "epoch": 25.38692098092643,
+ "grad_norm": 8.752985000610352,
+ "learning_rate": 1.7484612289760242e-05,
+ "loss": 0.5222,
+ "step": 9317
+ },
+ {
+ "epoch": 25.38964577656676,
+ "grad_norm": 7.0970377922058105,
+ "learning_rate": 1.748402700910347e-05,
+ "loss": 0.6296,
+ "step": 9318
+ },
+ {
+ "epoch": 25.392370572207085,
+ "grad_norm": 8.385693550109863,
+ "learning_rate": 1.7483441670161336e-05,
+ "loss": 0.538,
+ "step": 9319
+ },
+ {
+ "epoch": 25.39509536784741,
+ "grad_norm": 8.93567943572998,
+ "learning_rate": 1.7482856272938398e-05,
+ "loss": 0.5391,
+ "step": 9320
+ },
+ {
+ "epoch": 25.39782016348774,
+ "grad_norm": 7.765710830688477,
+ "learning_rate": 1.7482270817439217e-05,
+ "loss": 0.7386,
+ "step": 9321
+ },
+ {
+ "epoch": 25.400544959128066,
+ "grad_norm": 9.23783016204834,
+ "learning_rate": 1.7481685303668353e-05,
+ "loss": 0.5933,
+ "step": 9322
+ },
+ {
+ "epoch": 25.40326975476839,
+ "grad_norm": 8.068859100341797,
+ "learning_rate": 1.7481099731630365e-05,
+ "loss": 0.5716,
+ "step": 9323
+ },
+ {
+ "epoch": 25.40599455040872,
+ "grad_norm": 6.749257564544678,
+ "learning_rate": 1.7480514101329808e-05,
+ "loss": 0.5922,
+ "step": 9324
+ },
+ {
+ "epoch": 25.408719346049047,
+ "grad_norm": 17.23390007019043,
+ "learning_rate": 1.7479928412771253e-05,
+ "loss": 0.5787,
+ "step": 9325
+ },
+ {
+ "epoch": 25.411444141689373,
+ "grad_norm": 7.998206615447998,
+ "learning_rate": 1.7479342665959254e-05,
+ "loss": 0.5224,
+ "step": 9326
+ },
+ {
+ "epoch": 25.414168937329702,
+ "grad_norm": 8.28626823425293,
+ "learning_rate": 1.7478756860898378e-05,
+ "loss": 0.6528,
+ "step": 9327
+ },
+ {
+ "epoch": 25.416893732970028,
+ "grad_norm": 8.12370491027832,
+ "learning_rate": 1.747817099759318e-05,
+ "loss": 0.5311,
+ "step": 9328
+ },
+ {
+ "epoch": 25.419618528610354,
+ "grad_norm": 9.191961288452148,
+ "learning_rate": 1.747758507604823e-05,
+ "loss": 0.6464,
+ "step": 9329
+ },
+ {
+ "epoch": 25.422343324250683,
+ "grad_norm": 7.370696544647217,
+ "learning_rate": 1.7476999096268086e-05,
+ "loss": 0.3813,
+ "step": 9330
+ },
+ {
+ "epoch": 25.42506811989101,
+ "grad_norm": 7.346981048583984,
+ "learning_rate": 1.7476413058257313e-05,
+ "loss": 0.6216,
+ "step": 9331
+ },
+ {
+ "epoch": 25.427792915531334,
+ "grad_norm": 7.545352458953857,
+ "learning_rate": 1.7475826962020476e-05,
+ "loss": 0.642,
+ "step": 9332
+ },
+ {
+ "epoch": 25.430517711171664,
+ "grad_norm": 9.863822937011719,
+ "learning_rate": 1.747524080756214e-05,
+ "loss": 0.7235,
+ "step": 9333
+ },
+ {
+ "epoch": 25.43324250681199,
+ "grad_norm": 8.380276679992676,
+ "learning_rate": 1.7474654594886873e-05,
+ "loss": 0.4589,
+ "step": 9334
+ },
+ {
+ "epoch": 25.435967302452315,
+ "grad_norm": 8.475086212158203,
+ "learning_rate": 1.7474068323999232e-05,
+ "loss": 0.4783,
+ "step": 9335
+ },
+ {
+ "epoch": 25.438692098092645,
+ "grad_norm": 7.905653953552246,
+ "learning_rate": 1.7473481994903788e-05,
+ "loss": 0.52,
+ "step": 9336
+ },
+ {
+ "epoch": 25.44141689373297,
+ "grad_norm": 8.372299194335938,
+ "learning_rate": 1.747289560760511e-05,
+ "loss": 0.5763,
+ "step": 9337
+ },
+ {
+ "epoch": 25.444141689373296,
+ "grad_norm": 8.619787216186523,
+ "learning_rate": 1.7472309162107757e-05,
+ "loss": 0.5384,
+ "step": 9338
+ },
+ {
+ "epoch": 25.446866485013626,
+ "grad_norm": 9.927772521972656,
+ "learning_rate": 1.7471722658416302e-05,
+ "loss": 0.4372,
+ "step": 9339
+ },
+ {
+ "epoch": 25.44959128065395,
+ "grad_norm": 9.848402976989746,
+ "learning_rate": 1.7471136096535316e-05,
+ "loss": 0.7333,
+ "step": 9340
+ },
+ {
+ "epoch": 25.452316076294277,
+ "grad_norm": 9.86668872833252,
+ "learning_rate": 1.7470549476469357e-05,
+ "loss": 0.6058,
+ "step": 9341
+ },
+ {
+ "epoch": 25.455040871934607,
+ "grad_norm": 8.02867603302002,
+ "learning_rate": 1.7469962798223e-05,
+ "loss": 0.6613,
+ "step": 9342
+ },
+ {
+ "epoch": 25.457765667574932,
+ "grad_norm": 9.436712265014648,
+ "learning_rate": 1.7469376061800815e-05,
+ "loss": 0.5602,
+ "step": 9343
+ },
+ {
+ "epoch": 25.460490463215258,
+ "grad_norm": 8.04949951171875,
+ "learning_rate": 1.746878926720737e-05,
+ "loss": 0.6345,
+ "step": 9344
+ },
+ {
+ "epoch": 25.463215258855588,
+ "grad_norm": 7.776516437530518,
+ "learning_rate": 1.746820241444723e-05,
+ "loss": 0.566,
+ "step": 9345
+ },
+ {
+ "epoch": 25.465940054495913,
+ "grad_norm": 9.003487586975098,
+ "learning_rate": 1.7467615503524973e-05,
+ "loss": 0.6335,
+ "step": 9346
+ },
+ {
+ "epoch": 25.46866485013624,
+ "grad_norm": 7.916099548339844,
+ "learning_rate": 1.7467028534445166e-05,
+ "loss": 0.5493,
+ "step": 9347
+ },
+ {
+ "epoch": 25.47138964577657,
+ "grad_norm": 7.610687255859375,
+ "learning_rate": 1.7466441507212383e-05,
+ "loss": 0.4928,
+ "step": 9348
+ },
+ {
+ "epoch": 25.474114441416894,
+ "grad_norm": 7.990988731384277,
+ "learning_rate": 1.7465854421831192e-05,
+ "loss": 0.5379,
+ "step": 9349
+ },
+ {
+ "epoch": 25.47683923705722,
+ "grad_norm": 6.85425329208374,
+ "learning_rate": 1.746526727830617e-05,
+ "loss": 0.5766,
+ "step": 9350
+ },
+ {
+ "epoch": 25.479564032697546,
+ "grad_norm": 7.345608234405518,
+ "learning_rate": 1.7464680076641883e-05,
+ "loss": 0.6484,
+ "step": 9351
+ },
+ {
+ "epoch": 25.482288828337875,
+ "grad_norm": 6.640669345855713,
+ "learning_rate": 1.746409281684291e-05,
+ "loss": 0.5922,
+ "step": 9352
+ },
+ {
+ "epoch": 25.4850136239782,
+ "grad_norm": 7.6144633293151855,
+ "learning_rate": 1.746350549891382e-05,
+ "loss": 0.4883,
+ "step": 9353
+ },
+ {
+ "epoch": 25.48773841961853,
+ "grad_norm": 8.312814712524414,
+ "learning_rate": 1.7462918122859193e-05,
+ "loss": 0.5203,
+ "step": 9354
+ },
+ {
+ "epoch": 25.490463215258856,
+ "grad_norm": 8.035418510437012,
+ "learning_rate": 1.7462330688683596e-05,
+ "loss": 0.7047,
+ "step": 9355
+ },
+ {
+ "epoch": 25.493188010899182,
+ "grad_norm": 6.685522556304932,
+ "learning_rate": 1.7461743196391613e-05,
+ "loss": 0.8011,
+ "step": 9356
+ },
+ {
+ "epoch": 25.495912806539508,
+ "grad_norm": 7.33150577545166,
+ "learning_rate": 1.746115564598781e-05,
+ "loss": 0.5392,
+ "step": 9357
+ },
+ {
+ "epoch": 25.498637602179837,
+ "grad_norm": 7.050995349884033,
+ "learning_rate": 1.746056803747677e-05,
+ "loss": 0.5724,
+ "step": 9358
+ },
+ {
+ "epoch": 25.501362397820163,
+ "grad_norm": 7.876449108123779,
+ "learning_rate": 1.7459980370863063e-05,
+ "loss": 0.6718,
+ "step": 9359
+ },
+ {
+ "epoch": 25.504087193460492,
+ "grad_norm": 6.868752479553223,
+ "learning_rate": 1.7459392646151266e-05,
+ "loss": 0.5359,
+ "step": 9360
+ },
+ {
+ "epoch": 25.506811989100818,
+ "grad_norm": 7.423297882080078,
+ "learning_rate": 1.7458804863345966e-05,
+ "loss": 0.5386,
+ "step": 9361
+ },
+ {
+ "epoch": 25.509536784741144,
+ "grad_norm": 8.611160278320312,
+ "learning_rate": 1.745821702245173e-05,
+ "loss": 0.4833,
+ "step": 9362
+ },
+ {
+ "epoch": 25.51226158038147,
+ "grad_norm": 7.3242998123168945,
+ "learning_rate": 1.7457629123473144e-05,
+ "loss": 0.5158,
+ "step": 9363
+ },
+ {
+ "epoch": 25.5149863760218,
+ "grad_norm": 8.992837905883789,
+ "learning_rate": 1.745704116641478e-05,
+ "loss": 0.6549,
+ "step": 9364
+ },
+ {
+ "epoch": 25.517711171662125,
+ "grad_norm": 7.9097208976745605,
+ "learning_rate": 1.7456453151281215e-05,
+ "loss": 0.4332,
+ "step": 9365
+ },
+ {
+ "epoch": 25.520435967302454,
+ "grad_norm": 8.41103458404541,
+ "learning_rate": 1.7455865078077038e-05,
+ "loss": 0.6543,
+ "step": 9366
+ },
+ {
+ "epoch": 25.52316076294278,
+ "grad_norm": 7.673321723937988,
+ "learning_rate": 1.745527694680682e-05,
+ "loss": 0.6619,
+ "step": 9367
+ },
+ {
+ "epoch": 25.525885558583106,
+ "grad_norm": 6.998402118682861,
+ "learning_rate": 1.745468875747515e-05,
+ "loss": 0.5494,
+ "step": 9368
+ },
+ {
+ "epoch": 25.52861035422343,
+ "grad_norm": 6.4210686683654785,
+ "learning_rate": 1.74541005100866e-05,
+ "loss": 0.5988,
+ "step": 9369
+ },
+ {
+ "epoch": 25.53133514986376,
+ "grad_norm": 7.388408184051514,
+ "learning_rate": 1.7453512204645756e-05,
+ "loss": 0.6859,
+ "step": 9370
+ },
+ {
+ "epoch": 25.534059945504087,
+ "grad_norm": 7.578431606292725,
+ "learning_rate": 1.7452923841157198e-05,
+ "loss": 0.4578,
+ "step": 9371
+ },
+ {
+ "epoch": 25.536784741144416,
+ "grad_norm": 7.251674175262451,
+ "learning_rate": 1.7452335419625514e-05,
+ "loss": 0.631,
+ "step": 9372
+ },
+ {
+ "epoch": 25.539509536784742,
+ "grad_norm": 9.027373313903809,
+ "learning_rate": 1.7451746940055278e-05,
+ "loss": 0.5519,
+ "step": 9373
+ },
+ {
+ "epoch": 25.542234332425068,
+ "grad_norm": 8.505552291870117,
+ "learning_rate": 1.7451158402451078e-05,
+ "loss": 0.5848,
+ "step": 9374
+ },
+ {
+ "epoch": 25.544959128065393,
+ "grad_norm": 7.444201469421387,
+ "learning_rate": 1.7450569806817494e-05,
+ "loss": 0.5968,
+ "step": 9375
+ },
+ {
+ "epoch": 25.547683923705723,
+ "grad_norm": 7.371540546417236,
+ "learning_rate": 1.744998115315911e-05,
+ "loss": 0.658,
+ "step": 9376
+ },
+ {
+ "epoch": 25.55040871934605,
+ "grad_norm": 8.483649253845215,
+ "learning_rate": 1.744939244148052e-05,
+ "loss": 0.5031,
+ "step": 9377
+ },
+ {
+ "epoch": 25.553133514986374,
+ "grad_norm": 25.00672149658203,
+ "learning_rate": 1.7448803671786292e-05,
+ "loss": 0.6876,
+ "step": 9378
+ },
+ {
+ "epoch": 25.555858310626704,
+ "grad_norm": 7.475778102874756,
+ "learning_rate": 1.7448214844081026e-05,
+ "loss": 0.6038,
+ "step": 9379
+ },
+ {
+ "epoch": 25.55858310626703,
+ "grad_norm": 8.381858825683594,
+ "learning_rate": 1.7447625958369303e-05,
+ "loss": 0.6476,
+ "step": 9380
+ },
+ {
+ "epoch": 25.561307901907355,
+ "grad_norm": 8.840806007385254,
+ "learning_rate": 1.744703701465571e-05,
+ "loss": 0.5338,
+ "step": 9381
+ },
+ {
+ "epoch": 25.564032697547685,
+ "grad_norm": 7.5802764892578125,
+ "learning_rate": 1.744644801294483e-05,
+ "loss": 0.6526,
+ "step": 9382
+ },
+ {
+ "epoch": 25.56675749318801,
+ "grad_norm": 8.006721496582031,
+ "learning_rate": 1.744585895324125e-05,
+ "loss": 0.4777,
+ "step": 9383
+ },
+ {
+ "epoch": 25.569482288828336,
+ "grad_norm": 8.405454635620117,
+ "learning_rate": 1.7445269835549565e-05,
+ "loss": 0.7128,
+ "step": 9384
+ },
+ {
+ "epoch": 25.572207084468666,
+ "grad_norm": 12.386618614196777,
+ "learning_rate": 1.7444680659874354e-05,
+ "loss": 0.5532,
+ "step": 9385
+ },
+ {
+ "epoch": 25.57493188010899,
+ "grad_norm": 8.866639137268066,
+ "learning_rate": 1.744409142622021e-05,
+ "loss": 0.5941,
+ "step": 9386
+ },
+ {
+ "epoch": 25.577656675749317,
+ "grad_norm": 10.208216667175293,
+ "learning_rate": 1.7443502134591725e-05,
+ "loss": 0.4695,
+ "step": 9387
+ },
+ {
+ "epoch": 25.580381471389646,
+ "grad_norm": 8.157602310180664,
+ "learning_rate": 1.744291278499348e-05,
+ "loss": 0.5888,
+ "step": 9388
+ },
+ {
+ "epoch": 25.583106267029972,
+ "grad_norm": 15.60487174987793,
+ "learning_rate": 1.744232337743008e-05,
+ "loss": 0.6458,
+ "step": 9389
+ },
+ {
+ "epoch": 25.585831062670298,
+ "grad_norm": 9.842437744140625,
+ "learning_rate": 1.7441733911906092e-05,
+ "loss": 0.5865,
+ "step": 9390
+ },
+ {
+ "epoch": 25.588555858310627,
+ "grad_norm": 11.806042671203613,
+ "learning_rate": 1.7441144388426126e-05,
+ "loss": 0.5978,
+ "step": 9391
+ },
+ {
+ "epoch": 25.591280653950953,
+ "grad_norm": 7.766541004180908,
+ "learning_rate": 1.7440554806994768e-05,
+ "loss": 0.5707,
+ "step": 9392
+ },
+ {
+ "epoch": 25.59400544959128,
+ "grad_norm": 9.12265682220459,
+ "learning_rate": 1.743996516761661e-05,
+ "loss": 0.5485,
+ "step": 9393
+ },
+ {
+ "epoch": 25.59673024523161,
+ "grad_norm": 8.803854942321777,
+ "learning_rate": 1.743937547029624e-05,
+ "loss": 0.7141,
+ "step": 9394
+ },
+ {
+ "epoch": 25.599455040871934,
+ "grad_norm": 9.123351097106934,
+ "learning_rate": 1.7438785715038253e-05,
+ "loss": 0.5258,
+ "step": 9395
+ },
+ {
+ "epoch": 25.60217983651226,
+ "grad_norm": 10.303979873657227,
+ "learning_rate": 1.7438195901847243e-05,
+ "loss": 0.6413,
+ "step": 9396
+ },
+ {
+ "epoch": 25.60490463215259,
+ "grad_norm": 8.321008682250977,
+ "learning_rate": 1.7437606030727804e-05,
+ "loss": 0.6555,
+ "step": 9397
+ },
+ {
+ "epoch": 25.607629427792915,
+ "grad_norm": 7.6452789306640625,
+ "learning_rate": 1.7437016101684526e-05,
+ "loss": 0.5445,
+ "step": 9398
+ },
+ {
+ "epoch": 25.61035422343324,
+ "grad_norm": 8.129426002502441,
+ "learning_rate": 1.7436426114722006e-05,
+ "loss": 0.5661,
+ "step": 9399
+ },
+ {
+ "epoch": 25.61307901907357,
+ "grad_norm": 8.526227951049805,
+ "learning_rate": 1.7435836069844838e-05,
+ "loss": 0.5932,
+ "step": 9400
+ },
+ {
+ "epoch": 25.615803814713896,
+ "grad_norm": 8.07772159576416,
+ "learning_rate": 1.7435245967057623e-05,
+ "loss": 0.7504,
+ "step": 9401
+ },
+ {
+ "epoch": 25.618528610354222,
+ "grad_norm": 8.812663078308105,
+ "learning_rate": 1.7434655806364945e-05,
+ "loss": 0.5126,
+ "step": 9402
+ },
+ {
+ "epoch": 25.62125340599455,
+ "grad_norm": 8.795720100402832,
+ "learning_rate": 1.7434065587771413e-05,
+ "loss": 0.7559,
+ "step": 9403
+ },
+ {
+ "epoch": 25.623978201634877,
+ "grad_norm": 8.46756362915039,
+ "learning_rate": 1.7433475311281616e-05,
+ "loss": 0.6748,
+ "step": 9404
+ },
+ {
+ "epoch": 25.626702997275203,
+ "grad_norm": 8.732349395751953,
+ "learning_rate": 1.7432884976900147e-05,
+ "loss": 0.5325,
+ "step": 9405
+ },
+ {
+ "epoch": 25.629427792915532,
+ "grad_norm": 9.263157844543457,
+ "learning_rate": 1.7432294584631616e-05,
+ "loss": 0.6005,
+ "step": 9406
+ },
+ {
+ "epoch": 25.632152588555858,
+ "grad_norm": 10.506868362426758,
+ "learning_rate": 1.7431704134480608e-05,
+ "loss": 0.6466,
+ "step": 9407
+ },
+ {
+ "epoch": 25.634877384196184,
+ "grad_norm": 7.771955966949463,
+ "learning_rate": 1.7431113626451733e-05,
+ "loss": 0.4752,
+ "step": 9408
+ },
+ {
+ "epoch": 25.637602179836513,
+ "grad_norm": 8.836752891540527,
+ "learning_rate": 1.7430523060549586e-05,
+ "loss": 0.5073,
+ "step": 9409
+ },
+ {
+ "epoch": 25.64032697547684,
+ "grad_norm": 8.095437049865723,
+ "learning_rate": 1.7429932436778755e-05,
+ "loss": 0.656,
+ "step": 9410
+ },
+ {
+ "epoch": 25.643051771117165,
+ "grad_norm": 7.719583988189697,
+ "learning_rate": 1.7429341755143857e-05,
+ "loss": 0.4961,
+ "step": 9411
+ },
+ {
+ "epoch": 25.645776566757494,
+ "grad_norm": 6.682363510131836,
+ "learning_rate": 1.7428751015649483e-05,
+ "loss": 0.7285,
+ "step": 9412
+ },
+ {
+ "epoch": 25.64850136239782,
+ "grad_norm": 7.992876052856445,
+ "learning_rate": 1.7428160218300236e-05,
+ "loss": 0.584,
+ "step": 9413
+ },
+ {
+ "epoch": 25.651226158038146,
+ "grad_norm": 7.828421115875244,
+ "learning_rate": 1.7427569363100714e-05,
+ "loss": 0.5701,
+ "step": 9414
+ },
+ {
+ "epoch": 25.653950953678475,
+ "grad_norm": 7.200517654418945,
+ "learning_rate": 1.742697845005552e-05,
+ "loss": 0.6543,
+ "step": 9415
+ },
+ {
+ "epoch": 25.6566757493188,
+ "grad_norm": 9.306139945983887,
+ "learning_rate": 1.7426387479169256e-05,
+ "loss": 0.5515,
+ "step": 9416
+ },
+ {
+ "epoch": 25.659400544959126,
+ "grad_norm": 6.922572612762451,
+ "learning_rate": 1.7425796450446532e-05,
+ "loss": 0.5296,
+ "step": 9417
+ },
+ {
+ "epoch": 25.662125340599456,
+ "grad_norm": 6.6560444831848145,
+ "learning_rate": 1.7425205363891938e-05,
+ "loss": 0.6051,
+ "step": 9418
+ },
+ {
+ "epoch": 25.66485013623978,
+ "grad_norm": 8.202136993408203,
+ "learning_rate": 1.7424614219510087e-05,
+ "loss": 0.8121,
+ "step": 9419
+ },
+ {
+ "epoch": 25.667574931880107,
+ "grad_norm": 7.640063285827637,
+ "learning_rate": 1.742402301730558e-05,
+ "loss": 0.6223,
+ "step": 9420
+ },
+ {
+ "epoch": 25.670299727520437,
+ "grad_norm": 7.376254081726074,
+ "learning_rate": 1.7423431757283018e-05,
+ "loss": 0.5077,
+ "step": 9421
+ },
+ {
+ "epoch": 25.673024523160763,
+ "grad_norm": 8.305665016174316,
+ "learning_rate": 1.742284043944701e-05,
+ "loss": 0.5715,
+ "step": 9422
+ },
+ {
+ "epoch": 25.67574931880109,
+ "grad_norm": 6.209292411804199,
+ "learning_rate": 1.742224906380216e-05,
+ "loss": 0.4484,
+ "step": 9423
+ },
+ {
+ "epoch": 25.678474114441418,
+ "grad_norm": 8.914823532104492,
+ "learning_rate": 1.7421657630353068e-05,
+ "loss": 0.6091,
+ "step": 9424
+ },
+ {
+ "epoch": 25.681198910081743,
+ "grad_norm": 7.535190105438232,
+ "learning_rate": 1.742106613910435e-05,
+ "loss": 0.5803,
+ "step": 9425
+ },
+ {
+ "epoch": 25.68392370572207,
+ "grad_norm": 7.564618110656738,
+ "learning_rate": 1.7420474590060606e-05,
+ "loss": 0.4732,
+ "step": 9426
+ },
+ {
+ "epoch": 25.6866485013624,
+ "grad_norm": 7.2093963623046875,
+ "learning_rate": 1.7419882983226446e-05,
+ "loss": 0.6475,
+ "step": 9427
+ },
+ {
+ "epoch": 25.689373297002724,
+ "grad_norm": 8.094961166381836,
+ "learning_rate": 1.7419291318606476e-05,
+ "loss": 0.6348,
+ "step": 9428
+ },
+ {
+ "epoch": 25.69209809264305,
+ "grad_norm": 11.35478687286377,
+ "learning_rate": 1.7418699596205303e-05,
+ "loss": 0.5717,
+ "step": 9429
+ },
+ {
+ "epoch": 25.69482288828338,
+ "grad_norm": 7.570865631103516,
+ "learning_rate": 1.7418107816027538e-05,
+ "loss": 0.5313,
+ "step": 9430
+ },
+ {
+ "epoch": 25.697547683923705,
+ "grad_norm": 7.583775043487549,
+ "learning_rate": 1.741751597807779e-05,
+ "loss": 0.5817,
+ "step": 9431
+ },
+ {
+ "epoch": 25.70027247956403,
+ "grad_norm": 7.399974346160889,
+ "learning_rate": 1.741692408236066e-05,
+ "loss": 0.4835,
+ "step": 9432
+ },
+ {
+ "epoch": 25.70299727520436,
+ "grad_norm": 7.177084922790527,
+ "learning_rate": 1.7416332128880768e-05,
+ "loss": 0.5538,
+ "step": 9433
+ },
+ {
+ "epoch": 25.705722070844686,
+ "grad_norm": 6.838465213775635,
+ "learning_rate": 1.7415740117642718e-05,
+ "loss": 0.551,
+ "step": 9434
+ },
+ {
+ "epoch": 25.708446866485012,
+ "grad_norm": 7.103573799133301,
+ "learning_rate": 1.7415148048651126e-05,
+ "loss": 0.504,
+ "step": 9435
+ },
+ {
+ "epoch": 25.71117166212534,
+ "grad_norm": 7.283553600311279,
+ "learning_rate": 1.7414555921910597e-05,
+ "loss": 0.7719,
+ "step": 9436
+ },
+ {
+ "epoch": 25.713896457765667,
+ "grad_norm": 7.7645087242126465,
+ "learning_rate": 1.7413963737425747e-05,
+ "loss": 0.5516,
+ "step": 9437
+ },
+ {
+ "epoch": 25.716621253405993,
+ "grad_norm": 8.091785430908203,
+ "learning_rate": 1.7413371495201183e-05,
+ "loss": 0.5369,
+ "step": 9438
+ },
+ {
+ "epoch": 25.719346049046322,
+ "grad_norm": 6.979974269866943,
+ "learning_rate": 1.7412779195241524e-05,
+ "loss": 0.9425,
+ "step": 9439
+ },
+ {
+ "epoch": 25.722070844686648,
+ "grad_norm": 9.18759536743164,
+ "learning_rate": 1.741218683755138e-05,
+ "loss": 0.5754,
+ "step": 9440
+ },
+ {
+ "epoch": 25.724795640326974,
+ "grad_norm": 7.882137775421143,
+ "learning_rate": 1.7411594422135357e-05,
+ "loss": 0.5159,
+ "step": 9441
+ },
+ {
+ "epoch": 25.727520435967303,
+ "grad_norm": 7.561557769775391,
+ "learning_rate": 1.741100194899808e-05,
+ "loss": 0.6474,
+ "step": 9442
+ },
+ {
+ "epoch": 25.73024523160763,
+ "grad_norm": 17.012176513671875,
+ "learning_rate": 1.741040941814416e-05,
+ "loss": 0.6215,
+ "step": 9443
+ },
+ {
+ "epoch": 25.732970027247955,
+ "grad_norm": 7.687644004821777,
+ "learning_rate": 1.7409816829578205e-05,
+ "loss": 0.6672,
+ "step": 9444
+ },
+ {
+ "epoch": 25.735694822888284,
+ "grad_norm": 6.788773059844971,
+ "learning_rate": 1.7409224183304836e-05,
+ "loss": 0.5242,
+ "step": 9445
+ },
+ {
+ "epoch": 25.73841961852861,
+ "grad_norm": 8.36744213104248,
+ "learning_rate": 1.740863147932867e-05,
+ "loss": 0.4936,
+ "step": 9446
+ },
+ {
+ "epoch": 25.741144414168936,
+ "grad_norm": 7.843606948852539,
+ "learning_rate": 1.740803871765432e-05,
+ "loss": 0.6784,
+ "step": 9447
+ },
+ {
+ "epoch": 25.743869209809265,
+ "grad_norm": 8.095901489257812,
+ "learning_rate": 1.7407445898286405e-05,
+ "loss": 0.5069,
+ "step": 9448
+ },
+ {
+ "epoch": 25.74659400544959,
+ "grad_norm": 8.641240119934082,
+ "learning_rate": 1.7406853021229535e-05,
+ "loss": 0.7564,
+ "step": 9449
+ },
+ {
+ "epoch": 25.749318801089917,
+ "grad_norm": 7.994680881500244,
+ "learning_rate": 1.7406260086488336e-05,
+ "loss": 0.5792,
+ "step": 9450
+ },
+ {
+ "epoch": 25.752043596730246,
+ "grad_norm": 7.075345993041992,
+ "learning_rate": 1.740566709406742e-05,
+ "loss": 0.6983,
+ "step": 9451
+ },
+ {
+ "epoch": 25.754768392370572,
+ "grad_norm": 7.390691757202148,
+ "learning_rate": 1.7405074043971407e-05,
+ "loss": 0.7299,
+ "step": 9452
+ },
+ {
+ "epoch": 25.757493188010898,
+ "grad_norm": 9.825465202331543,
+ "learning_rate": 1.7404480936204914e-05,
+ "loss": 0.7331,
+ "step": 9453
+ },
+ {
+ "epoch": 25.760217983651227,
+ "grad_norm": 8.008077621459961,
+ "learning_rate": 1.7403887770772564e-05,
+ "loss": 0.5295,
+ "step": 9454
+ },
+ {
+ "epoch": 25.762942779291553,
+ "grad_norm": 8.09028148651123,
+ "learning_rate": 1.7403294547678975e-05,
+ "loss": 0.6837,
+ "step": 9455
+ },
+ {
+ "epoch": 25.76566757493188,
+ "grad_norm": 7.616891384124756,
+ "learning_rate": 1.7402701266928767e-05,
+ "loss": 0.5135,
+ "step": 9456
+ },
+ {
+ "epoch": 25.768392370572208,
+ "grad_norm": 14.6254243850708,
+ "learning_rate": 1.7402107928526556e-05,
+ "loss": 0.5233,
+ "step": 9457
+ },
+ {
+ "epoch": 25.771117166212534,
+ "grad_norm": 7.203038692474365,
+ "learning_rate": 1.740151453247697e-05,
+ "loss": 0.4981,
+ "step": 9458
+ },
+ {
+ "epoch": 25.77384196185286,
+ "grad_norm": 8.74550724029541,
+ "learning_rate": 1.7400921078784624e-05,
+ "loss": 0.6011,
+ "step": 9459
+ },
+ {
+ "epoch": 25.77656675749319,
+ "grad_norm": 7.549883842468262,
+ "learning_rate": 1.7400327567454145e-05,
+ "loss": 0.4445,
+ "step": 9460
+ },
+ {
+ "epoch": 25.779291553133515,
+ "grad_norm": 7.61672306060791,
+ "learning_rate": 1.7399733998490152e-05,
+ "loss": 0.6873,
+ "step": 9461
+ },
+ {
+ "epoch": 25.78201634877384,
+ "grad_norm": 7.361455917358398,
+ "learning_rate": 1.739914037189727e-05,
+ "loss": 0.6927,
+ "step": 9462
+ },
+ {
+ "epoch": 25.78474114441417,
+ "grad_norm": 5.834643840789795,
+ "learning_rate": 1.739854668768012e-05,
+ "loss": 0.7412,
+ "step": 9463
+ },
+ {
+ "epoch": 25.787465940054496,
+ "grad_norm": 8.191956520080566,
+ "learning_rate": 1.7397952945843325e-05,
+ "loss": 0.6303,
+ "step": 9464
+ },
+ {
+ "epoch": 25.79019073569482,
+ "grad_norm": 11.40386962890625,
+ "learning_rate": 1.7397359146391513e-05,
+ "loss": 0.7029,
+ "step": 9465
+ },
+ {
+ "epoch": 25.79291553133515,
+ "grad_norm": 8.3353910446167,
+ "learning_rate": 1.7396765289329308e-05,
+ "loss": 0.5961,
+ "step": 9466
+ },
+ {
+ "epoch": 25.795640326975477,
+ "grad_norm": 8.796889305114746,
+ "learning_rate": 1.739617137466133e-05,
+ "loss": 0.6309,
+ "step": 9467
+ },
+ {
+ "epoch": 25.798365122615802,
+ "grad_norm": 7.54941987991333,
+ "learning_rate": 1.7395577402392208e-05,
+ "loss": 0.6583,
+ "step": 9468
+ },
+ {
+ "epoch": 25.80108991825613,
+ "grad_norm": 6.982385635375977,
+ "learning_rate": 1.739498337252657e-05,
+ "loss": 0.6166,
+ "step": 9469
+ },
+ {
+ "epoch": 25.803814713896458,
+ "grad_norm": 7.676999568939209,
+ "learning_rate": 1.7394389285069034e-05,
+ "loss": 0.7845,
+ "step": 9470
+ },
+ {
+ "epoch": 25.806539509536783,
+ "grad_norm": 7.578592777252197,
+ "learning_rate": 1.7393795140024235e-05,
+ "loss": 0.8047,
+ "step": 9471
+ },
+ {
+ "epoch": 25.809264305177113,
+ "grad_norm": 9.978384017944336,
+ "learning_rate": 1.7393200937396795e-05,
+ "loss": 0.5497,
+ "step": 9472
+ },
+ {
+ "epoch": 25.81198910081744,
+ "grad_norm": 13.144746780395508,
+ "learning_rate": 1.7392606677191345e-05,
+ "loss": 0.629,
+ "step": 9473
+ },
+ {
+ "epoch": 25.814713896457764,
+ "grad_norm": 8.699050903320312,
+ "learning_rate": 1.7392012359412517e-05,
+ "loss": 0.4867,
+ "step": 9474
+ },
+ {
+ "epoch": 25.817438692098094,
+ "grad_norm": 11.404301643371582,
+ "learning_rate": 1.7391417984064932e-05,
+ "loss": 0.7406,
+ "step": 9475
+ },
+ {
+ "epoch": 25.82016348773842,
+ "grad_norm": 7.311351776123047,
+ "learning_rate": 1.7390823551153218e-05,
+ "loss": 0.5009,
+ "step": 9476
+ },
+ {
+ "epoch": 25.822888283378745,
+ "grad_norm": 9.406844139099121,
+ "learning_rate": 1.739022906068201e-05,
+ "loss": 0.6615,
+ "step": 9477
+ },
+ {
+ "epoch": 25.825613079019075,
+ "grad_norm": 8.44792366027832,
+ "learning_rate": 1.738963451265594e-05,
+ "loss": 0.6606,
+ "step": 9478
+ },
+ {
+ "epoch": 25.8283378746594,
+ "grad_norm": 9.070053100585938,
+ "learning_rate": 1.738903990707963e-05,
+ "loss": 0.5695,
+ "step": 9479
+ },
+ {
+ "epoch": 25.831062670299726,
+ "grad_norm": 8.260103225708008,
+ "learning_rate": 1.7388445243957717e-05,
+ "loss": 0.5321,
+ "step": 9480
+ },
+ {
+ "epoch": 25.833787465940055,
+ "grad_norm": 8.975306510925293,
+ "learning_rate": 1.7387850523294827e-05,
+ "loss": 0.5169,
+ "step": 9481
+ },
+ {
+ "epoch": 25.83651226158038,
+ "grad_norm": 8.646730422973633,
+ "learning_rate": 1.7387255745095597e-05,
+ "loss": 0.4396,
+ "step": 9482
+ },
+ {
+ "epoch": 25.839237057220707,
+ "grad_norm": 8.46390151977539,
+ "learning_rate": 1.738666090936466e-05,
+ "loss": 0.6315,
+ "step": 9483
+ },
+ {
+ "epoch": 25.841961852861036,
+ "grad_norm": 7.23923397064209,
+ "learning_rate": 1.738606601610664e-05,
+ "loss": 0.563,
+ "step": 9484
+ },
+ {
+ "epoch": 25.844686648501362,
+ "grad_norm": 8.615715980529785,
+ "learning_rate": 1.738547106532618e-05,
+ "loss": 0.4901,
+ "step": 9485
+ },
+ {
+ "epoch": 25.847411444141688,
+ "grad_norm": 9.231773376464844,
+ "learning_rate": 1.7384876057027907e-05,
+ "loss": 0.5825,
+ "step": 9486
+ },
+ {
+ "epoch": 25.850136239782017,
+ "grad_norm": 8.428955078125,
+ "learning_rate": 1.7384280991216455e-05,
+ "loss": 0.5003,
+ "step": 9487
+ },
+ {
+ "epoch": 25.852861035422343,
+ "grad_norm": 9.66771125793457,
+ "learning_rate": 1.7383685867896463e-05,
+ "loss": 0.7293,
+ "step": 9488
+ },
+ {
+ "epoch": 25.85558583106267,
+ "grad_norm": 8.030937194824219,
+ "learning_rate": 1.7383090687072563e-05,
+ "loss": 0.4869,
+ "step": 9489
+ },
+ {
+ "epoch": 25.858310626703,
+ "grad_norm": 7.184062957763672,
+ "learning_rate": 1.738249544874939e-05,
+ "loss": 0.6099,
+ "step": 9490
+ },
+ {
+ "epoch": 25.861035422343324,
+ "grad_norm": 7.648211479187012,
+ "learning_rate": 1.7381900152931582e-05,
+ "loss": 0.7165,
+ "step": 9491
+ },
+ {
+ "epoch": 25.86376021798365,
+ "grad_norm": 7.263122081756592,
+ "learning_rate": 1.738130479962377e-05,
+ "loss": 0.4726,
+ "step": 9492
+ },
+ {
+ "epoch": 25.86648501362398,
+ "grad_norm": 9.472850799560547,
+ "learning_rate": 1.7380709388830595e-05,
+ "loss": 0.6682,
+ "step": 9493
+ },
+ {
+ "epoch": 25.869209809264305,
+ "grad_norm": 10.854084968566895,
+ "learning_rate": 1.738011392055669e-05,
+ "loss": 0.5417,
+ "step": 9494
+ },
+ {
+ "epoch": 25.87193460490463,
+ "grad_norm": 7.673418998718262,
+ "learning_rate": 1.7379518394806703e-05,
+ "loss": 0.5994,
+ "step": 9495
+ },
+ {
+ "epoch": 25.87465940054496,
+ "grad_norm": 8.981013298034668,
+ "learning_rate": 1.7378922811585256e-05,
+ "loss": 0.8358,
+ "step": 9496
+ },
+ {
+ "epoch": 25.877384196185286,
+ "grad_norm": 7.159624099731445,
+ "learning_rate": 1.7378327170897e-05,
+ "loss": 0.6071,
+ "step": 9497
+ },
+ {
+ "epoch": 25.88010899182561,
+ "grad_norm": 7.000638008117676,
+ "learning_rate": 1.737773147274657e-05,
+ "loss": 0.4789,
+ "step": 9498
+ },
+ {
+ "epoch": 25.88283378746594,
+ "grad_norm": 8.612425804138184,
+ "learning_rate": 1.73771357171386e-05,
+ "loss": 0.8832,
+ "step": 9499
+ },
+ {
+ "epoch": 25.885558583106267,
+ "grad_norm": 30.55554962158203,
+ "learning_rate": 1.7376539904077742e-05,
+ "loss": 0.6271,
+ "step": 9500
+ },
+ {
+ "epoch": 25.888283378746593,
+ "grad_norm": 7.560913562774658,
+ "learning_rate": 1.7375944033568625e-05,
+ "loss": 0.6835,
+ "step": 9501
+ },
+ {
+ "epoch": 25.891008174386922,
+ "grad_norm": 7.5395097732543945,
+ "learning_rate": 1.737534810561589e-05,
+ "loss": 0.6556,
+ "step": 9502
+ },
+ {
+ "epoch": 25.893732970027248,
+ "grad_norm": 9.153618812561035,
+ "learning_rate": 1.7374752120224184e-05,
+ "loss": 0.7285,
+ "step": 9503
+ },
+ {
+ "epoch": 25.896457765667574,
+ "grad_norm": 9.776400566101074,
+ "learning_rate": 1.7374156077398144e-05,
+ "loss": 0.705,
+ "step": 9504
+ },
+ {
+ "epoch": 25.899182561307903,
+ "grad_norm": 7.857279300689697,
+ "learning_rate": 1.7373559977142416e-05,
+ "loss": 0.5347,
+ "step": 9505
+ },
+ {
+ "epoch": 25.90190735694823,
+ "grad_norm": 7.109128475189209,
+ "learning_rate": 1.7372963819461642e-05,
+ "loss": 0.6846,
+ "step": 9506
+ },
+ {
+ "epoch": 25.904632152588555,
+ "grad_norm": 7.639939785003662,
+ "learning_rate": 1.737236760436046e-05,
+ "loss": 0.6296,
+ "step": 9507
+ },
+ {
+ "epoch": 25.907356948228884,
+ "grad_norm": 7.69437837600708,
+ "learning_rate": 1.7371771331843517e-05,
+ "loss": 0.5632,
+ "step": 9508
+ },
+ {
+ "epoch": 25.91008174386921,
+ "grad_norm": 8.280343055725098,
+ "learning_rate": 1.7371175001915455e-05,
+ "loss": 0.6794,
+ "step": 9509
+ },
+ {
+ "epoch": 25.912806539509535,
+ "grad_norm": 10.756189346313477,
+ "learning_rate": 1.7370578614580922e-05,
+ "loss": 0.6239,
+ "step": 9510
+ },
+ {
+ "epoch": 25.915531335149865,
+ "grad_norm": 9.908435821533203,
+ "learning_rate": 1.736998216984456e-05,
+ "loss": 0.6348,
+ "step": 9511
+ },
+ {
+ "epoch": 25.91825613079019,
+ "grad_norm": 8.193130493164062,
+ "learning_rate": 1.7369385667711013e-05,
+ "loss": 0.6911,
+ "step": 9512
+ },
+ {
+ "epoch": 25.920980926430516,
+ "grad_norm": 9.463773727416992,
+ "learning_rate": 1.7368789108184927e-05,
+ "loss": 0.5245,
+ "step": 9513
+ },
+ {
+ "epoch": 25.923705722070846,
+ "grad_norm": 8.20947265625,
+ "learning_rate": 1.7368192491270946e-05,
+ "loss": 0.5592,
+ "step": 9514
+ },
+ {
+ "epoch": 25.92643051771117,
+ "grad_norm": 8.28555679321289,
+ "learning_rate": 1.7367595816973722e-05,
+ "loss": 0.6529,
+ "step": 9515
+ },
+ {
+ "epoch": 25.929155313351497,
+ "grad_norm": 7.5748491287231445,
+ "learning_rate": 1.73669990852979e-05,
+ "loss": 0.5446,
+ "step": 9516
+ },
+ {
+ "epoch": 25.931880108991827,
+ "grad_norm": 7.565945148468018,
+ "learning_rate": 1.7366402296248126e-05,
+ "loss": 0.6647,
+ "step": 9517
+ },
+ {
+ "epoch": 25.934604904632153,
+ "grad_norm": 7.207835674285889,
+ "learning_rate": 1.7365805449829047e-05,
+ "loss": 0.7472,
+ "step": 9518
+ },
+ {
+ "epoch": 25.93732970027248,
+ "grad_norm": 9.150147438049316,
+ "learning_rate": 1.7365208546045315e-05,
+ "loss": 0.5984,
+ "step": 9519
+ },
+ {
+ "epoch": 25.940054495912808,
+ "grad_norm": 7.448739528656006,
+ "learning_rate": 1.736461158490157e-05,
+ "loss": 0.5756,
+ "step": 9520
+ },
+ {
+ "epoch": 25.942779291553133,
+ "grad_norm": 9.423181533813477,
+ "learning_rate": 1.7364014566402472e-05,
+ "loss": 0.6123,
+ "step": 9521
+ },
+ {
+ "epoch": 25.94550408719346,
+ "grad_norm": 7.365279197692871,
+ "learning_rate": 1.7363417490552664e-05,
+ "loss": 0.4821,
+ "step": 9522
+ },
+ {
+ "epoch": 25.94822888283379,
+ "grad_norm": 7.734255313873291,
+ "learning_rate": 1.7362820357356794e-05,
+ "loss": 0.5531,
+ "step": 9523
+ },
+ {
+ "epoch": 25.950953678474114,
+ "grad_norm": 6.780492305755615,
+ "learning_rate": 1.736222316681952e-05,
+ "loss": 0.6304,
+ "step": 9524
+ },
+ {
+ "epoch": 25.95367847411444,
+ "grad_norm": 17.256683349609375,
+ "learning_rate": 1.736162591894549e-05,
+ "loss": 0.6966,
+ "step": 9525
+ },
+ {
+ "epoch": 25.95640326975477,
+ "grad_norm": 11.581868171691895,
+ "learning_rate": 1.7361028613739354e-05,
+ "loss": 0.6542,
+ "step": 9526
+ },
+ {
+ "epoch": 25.959128065395095,
+ "grad_norm": 8.833714485168457,
+ "learning_rate": 1.7360431251205763e-05,
+ "loss": 0.6693,
+ "step": 9527
+ },
+ {
+ "epoch": 25.96185286103542,
+ "grad_norm": 7.809795379638672,
+ "learning_rate": 1.735983383134937e-05,
+ "loss": 0.7259,
+ "step": 9528
+ },
+ {
+ "epoch": 25.96457765667575,
+ "grad_norm": 7.3385820388793945,
+ "learning_rate": 1.7359236354174826e-05,
+ "loss": 0.6353,
+ "step": 9529
+ },
+ {
+ "epoch": 25.967302452316076,
+ "grad_norm": 7.326361179351807,
+ "learning_rate": 1.7358638819686787e-05,
+ "loss": 0.5353,
+ "step": 9530
+ },
+ {
+ "epoch": 25.970027247956402,
+ "grad_norm": 6.983292579650879,
+ "learning_rate": 1.735804122788991e-05,
+ "loss": 0.6599,
+ "step": 9531
+ },
+ {
+ "epoch": 25.97275204359673,
+ "grad_norm": 7.214084625244141,
+ "learning_rate": 1.735744357878884e-05,
+ "loss": 0.6243,
+ "step": 9532
+ },
+ {
+ "epoch": 25.975476839237057,
+ "grad_norm": 7.334532737731934,
+ "learning_rate": 1.7356845872388238e-05,
+ "loss": 0.8033,
+ "step": 9533
+ },
+ {
+ "epoch": 25.978201634877383,
+ "grad_norm": 9.344524383544922,
+ "learning_rate": 1.7356248108692758e-05,
+ "loss": 0.5524,
+ "step": 9534
+ },
+ {
+ "epoch": 25.980926430517712,
+ "grad_norm": 7.228560924530029,
+ "learning_rate": 1.735565028770705e-05,
+ "loss": 0.6976,
+ "step": 9535
+ },
+ {
+ "epoch": 25.983651226158038,
+ "grad_norm": 11.06403636932373,
+ "learning_rate": 1.735505240943578e-05,
+ "loss": 0.6921,
+ "step": 9536
+ },
+ {
+ "epoch": 25.986376021798364,
+ "grad_norm": 8.322148323059082,
+ "learning_rate": 1.7354454473883596e-05,
+ "loss": 0.5891,
+ "step": 9537
+ },
+ {
+ "epoch": 25.989100817438693,
+ "grad_norm": 10.034852981567383,
+ "learning_rate": 1.7353856481055157e-05,
+ "loss": 0.7438,
+ "step": 9538
+ },
+ {
+ "epoch": 25.99182561307902,
+ "grad_norm": 11.697212219238281,
+ "learning_rate": 1.735325843095512e-05,
+ "loss": 0.4705,
+ "step": 9539
+ },
+ {
+ "epoch": 25.994550408719345,
+ "grad_norm": 8.835293769836426,
+ "learning_rate": 1.7352660323588146e-05,
+ "loss": 0.7668,
+ "step": 9540
+ },
+ {
+ "epoch": 25.997275204359674,
+ "grad_norm": 7.350338935852051,
+ "learning_rate": 1.7352062158958887e-05,
+ "loss": 0.5106,
+ "step": 9541
+ },
+ {
+ "epoch": 26.0,
+ "grad_norm": 8.838607788085938,
+ "learning_rate": 1.7351463937072008e-05,
+ "loss": 0.6144,
+ "step": 9542
+ },
+ {
+ "epoch": 26.002724795640326,
+ "grad_norm": 7.957286357879639,
+ "learning_rate": 1.735086565793216e-05,
+ "loss": 0.5024,
+ "step": 9543
+ },
+ {
+ "epoch": 26.005449591280655,
+ "grad_norm": 6.296217918395996,
+ "learning_rate": 1.735026732154401e-05,
+ "loss": 0.6693,
+ "step": 9544
+ },
+ {
+ "epoch": 26.00817438692098,
+ "grad_norm": 7.643580436706543,
+ "learning_rate": 1.734966892791221e-05,
+ "loss": 0.4755,
+ "step": 9545
+ },
+ {
+ "epoch": 26.010899182561307,
+ "grad_norm": 9.448199272155762,
+ "learning_rate": 1.734907047704143e-05,
+ "loss": 0.6694,
+ "step": 9546
+ },
+ {
+ "epoch": 26.013623978201636,
+ "grad_norm": 6.621395111083984,
+ "learning_rate": 1.7348471968936325e-05,
+ "loss": 0.5294,
+ "step": 9547
+ },
+ {
+ "epoch": 26.016348773841962,
+ "grad_norm": 10.18807601928711,
+ "learning_rate": 1.7347873403601557e-05,
+ "loss": 0.5653,
+ "step": 9548
+ },
+ {
+ "epoch": 26.019073569482288,
+ "grad_norm": 6.76434850692749,
+ "learning_rate": 1.7347274781041784e-05,
+ "loss": 0.4984,
+ "step": 9549
+ },
+ {
+ "epoch": 26.021798365122617,
+ "grad_norm": 6.526801109313965,
+ "learning_rate": 1.7346676101261676e-05,
+ "loss": 0.4005,
+ "step": 9550
+ },
+ {
+ "epoch": 26.024523160762943,
+ "grad_norm": 8.109182357788086,
+ "learning_rate": 1.734607736426589e-05,
+ "loss": 0.5455,
+ "step": 9551
+ },
+ {
+ "epoch": 26.02724795640327,
+ "grad_norm": 7.0792012214660645,
+ "learning_rate": 1.7345478570059084e-05,
+ "loss": 0.5917,
+ "step": 9552
+ },
+ {
+ "epoch": 26.029972752043598,
+ "grad_norm": 8.693367958068848,
+ "learning_rate": 1.7344879718645934e-05,
+ "loss": 0.4088,
+ "step": 9553
+ },
+ {
+ "epoch": 26.032697547683924,
+ "grad_norm": 7.457730293273926,
+ "learning_rate": 1.7344280810031097e-05,
+ "loss": 0.6736,
+ "step": 9554
+ },
+ {
+ "epoch": 26.03542234332425,
+ "grad_norm": 6.975096702575684,
+ "learning_rate": 1.7343681844219232e-05,
+ "loss": 0.6584,
+ "step": 9555
+ },
+ {
+ "epoch": 26.03814713896458,
+ "grad_norm": 7.109955310821533,
+ "learning_rate": 1.7343082821215015e-05,
+ "loss": 0.5279,
+ "step": 9556
+ },
+ {
+ "epoch": 26.040871934604905,
+ "grad_norm": 9.716678619384766,
+ "learning_rate": 1.73424837410231e-05,
+ "loss": 0.4881,
+ "step": 9557
+ },
+ {
+ "epoch": 26.04359673024523,
+ "grad_norm": 7.266867160797119,
+ "learning_rate": 1.7341884603648164e-05,
+ "loss": 0.5488,
+ "step": 9558
+ },
+ {
+ "epoch": 26.04632152588556,
+ "grad_norm": 7.502307891845703,
+ "learning_rate": 1.7341285409094862e-05,
+ "loss": 0.6344,
+ "step": 9559
+ },
+ {
+ "epoch": 26.049046321525886,
+ "grad_norm": 9.43380355834961,
+ "learning_rate": 1.7340686157367866e-05,
+ "loss": 0.4438,
+ "step": 9560
+ },
+ {
+ "epoch": 26.05177111716621,
+ "grad_norm": 8.707967758178711,
+ "learning_rate": 1.7340086848471848e-05,
+ "loss": 0.5626,
+ "step": 9561
+ },
+ {
+ "epoch": 26.05449591280654,
+ "grad_norm": 20.586732864379883,
+ "learning_rate": 1.7339487482411464e-05,
+ "loss": 0.6022,
+ "step": 9562
+ },
+ {
+ "epoch": 26.057220708446867,
+ "grad_norm": 7.162247657775879,
+ "learning_rate": 1.733888805919139e-05,
+ "loss": 0.6588,
+ "step": 9563
+ },
+ {
+ "epoch": 26.059945504087192,
+ "grad_norm": 7.609987258911133,
+ "learning_rate": 1.7338288578816292e-05,
+ "loss": 0.6384,
+ "step": 9564
+ },
+ {
+ "epoch": 26.06267029972752,
+ "grad_norm": 8.76731014251709,
+ "learning_rate": 1.733768904129084e-05,
+ "loss": 0.5563,
+ "step": 9565
+ },
+ {
+ "epoch": 26.065395095367847,
+ "grad_norm": 13.402876853942871,
+ "learning_rate": 1.7337089446619697e-05,
+ "loss": 0.5977,
+ "step": 9566
+ },
+ {
+ "epoch": 26.068119891008173,
+ "grad_norm": 8.927674293518066,
+ "learning_rate": 1.733648979480754e-05,
+ "loss": 0.5298,
+ "step": 9567
+ },
+ {
+ "epoch": 26.070844686648503,
+ "grad_norm": 7.532134532928467,
+ "learning_rate": 1.733589008585904e-05,
+ "loss": 0.5392,
+ "step": 9568
+ },
+ {
+ "epoch": 26.07356948228883,
+ "grad_norm": 9.537463188171387,
+ "learning_rate": 1.733529031977886e-05,
+ "loss": 0.3874,
+ "step": 9569
+ },
+ {
+ "epoch": 26.076294277929154,
+ "grad_norm": 7.319093704223633,
+ "learning_rate": 1.7334690496571677e-05,
+ "loss": 0.4325,
+ "step": 9570
+ },
+ {
+ "epoch": 26.079019073569484,
+ "grad_norm": 10.53061580657959,
+ "learning_rate": 1.733409061624216e-05,
+ "loss": 0.5564,
+ "step": 9571
+ },
+ {
+ "epoch": 26.08174386920981,
+ "grad_norm": 7.40098237991333,
+ "learning_rate": 1.733349067879498e-05,
+ "loss": 0.6164,
+ "step": 9572
+ },
+ {
+ "epoch": 26.084468664850135,
+ "grad_norm": 6.9981865882873535,
+ "learning_rate": 1.7332890684234815e-05,
+ "loss": 0.5289,
+ "step": 9573
+ },
+ {
+ "epoch": 26.087193460490465,
+ "grad_norm": 7.324646949768066,
+ "learning_rate": 1.7332290632566325e-05,
+ "loss": 0.4944,
+ "step": 9574
+ },
+ {
+ "epoch": 26.08991825613079,
+ "grad_norm": 7.746469497680664,
+ "learning_rate": 1.73316905237942e-05,
+ "loss": 0.497,
+ "step": 9575
+ },
+ {
+ "epoch": 26.092643051771116,
+ "grad_norm": 6.78636360168457,
+ "learning_rate": 1.7331090357923103e-05,
+ "loss": 0.4863,
+ "step": 9576
+ },
+ {
+ "epoch": 26.095367847411445,
+ "grad_norm": 7.395721435546875,
+ "learning_rate": 1.7330490134957707e-05,
+ "loss": 0.4698,
+ "step": 9577
+ },
+ {
+ "epoch": 26.09809264305177,
+ "grad_norm": 8.91894817352295,
+ "learning_rate": 1.732988985490269e-05,
+ "loss": 0.5521,
+ "step": 9578
+ },
+ {
+ "epoch": 26.100817438692097,
+ "grad_norm": 8.462091445922852,
+ "learning_rate": 1.7329289517762733e-05,
+ "loss": 0.5223,
+ "step": 9579
+ },
+ {
+ "epoch": 26.103542234332426,
+ "grad_norm": 7.259838581085205,
+ "learning_rate": 1.73286891235425e-05,
+ "loss": 0.4938,
+ "step": 9580
+ },
+ {
+ "epoch": 26.106267029972752,
+ "grad_norm": 9.486263275146484,
+ "learning_rate": 1.7328088672246674e-05,
+ "loss": 0.4198,
+ "step": 9581
+ },
+ {
+ "epoch": 26.108991825613078,
+ "grad_norm": 7.32037353515625,
+ "learning_rate": 1.7327488163879923e-05,
+ "loss": 0.5327,
+ "step": 9582
+ },
+ {
+ "epoch": 26.111716621253407,
+ "grad_norm": 14.064255714416504,
+ "learning_rate": 1.7326887598446937e-05,
+ "loss": 0.5925,
+ "step": 9583
+ },
+ {
+ "epoch": 26.114441416893733,
+ "grad_norm": 7.668673515319824,
+ "learning_rate": 1.7326286975952387e-05,
+ "loss": 0.4813,
+ "step": 9584
+ },
+ {
+ "epoch": 26.11716621253406,
+ "grad_norm": 7.011399269104004,
+ "learning_rate": 1.7325686296400946e-05,
+ "loss": 0.5601,
+ "step": 9585
+ },
+ {
+ "epoch": 26.11989100817439,
+ "grad_norm": 9.075329780578613,
+ "learning_rate": 1.7325085559797295e-05,
+ "loss": 0.5008,
+ "step": 9586
+ },
+ {
+ "epoch": 26.122615803814714,
+ "grad_norm": 9.160786628723145,
+ "learning_rate": 1.7324484766146118e-05,
+ "loss": 0.6431,
+ "step": 9587
+ },
+ {
+ "epoch": 26.12534059945504,
+ "grad_norm": 6.6641130447387695,
+ "learning_rate": 1.7323883915452087e-05,
+ "loss": 0.5106,
+ "step": 9588
+ },
+ {
+ "epoch": 26.12806539509537,
+ "grad_norm": 8.302316665649414,
+ "learning_rate": 1.7323283007719883e-05,
+ "loss": 0.5582,
+ "step": 9589
+ },
+ {
+ "epoch": 26.130790190735695,
+ "grad_norm": 8.207863807678223,
+ "learning_rate": 1.7322682042954186e-05,
+ "loss": 0.5475,
+ "step": 9590
+ },
+ {
+ "epoch": 26.13351498637602,
+ "grad_norm": 8.551682472229004,
+ "learning_rate": 1.732208102115968e-05,
+ "loss": 0.7343,
+ "step": 9591
+ },
+ {
+ "epoch": 26.13623978201635,
+ "grad_norm": 17.928634643554688,
+ "learning_rate": 1.732147994234104e-05,
+ "loss": 0.4928,
+ "step": 9592
+ },
+ {
+ "epoch": 26.138964577656676,
+ "grad_norm": 8.315779685974121,
+ "learning_rate": 1.732087880650295e-05,
+ "loss": 0.4801,
+ "step": 9593
+ },
+ {
+ "epoch": 26.141689373297,
+ "grad_norm": 8.798788070678711,
+ "learning_rate": 1.7320277613650093e-05,
+ "loss": 0.5987,
+ "step": 9594
+ },
+ {
+ "epoch": 26.14441416893733,
+ "grad_norm": 7.271299839019775,
+ "learning_rate": 1.7319676363787146e-05,
+ "loss": 0.626,
+ "step": 9595
+ },
+ {
+ "epoch": 26.147138964577657,
+ "grad_norm": 7.583462715148926,
+ "learning_rate": 1.7319075056918798e-05,
+ "loss": 0.4981,
+ "step": 9596
+ },
+ {
+ "epoch": 26.149863760217983,
+ "grad_norm": 11.364434242248535,
+ "learning_rate": 1.731847369304973e-05,
+ "loss": 0.4866,
+ "step": 9597
+ },
+ {
+ "epoch": 26.152588555858312,
+ "grad_norm": 8.130598068237305,
+ "learning_rate": 1.7317872272184624e-05,
+ "loss": 0.5431,
+ "step": 9598
+ },
+ {
+ "epoch": 26.155313351498638,
+ "grad_norm": 10.138801574707031,
+ "learning_rate": 1.7317270794328164e-05,
+ "loss": 0.4934,
+ "step": 9599
+ },
+ {
+ "epoch": 26.158038147138964,
+ "grad_norm": 7.542050361633301,
+ "learning_rate": 1.731666925948503e-05,
+ "loss": 0.6616,
+ "step": 9600
+ },
+ {
+ "epoch": 26.160762942779293,
+ "grad_norm": 9.432887077331543,
+ "learning_rate": 1.731606766765992e-05,
+ "loss": 0.5143,
+ "step": 9601
+ },
+ {
+ "epoch": 26.16348773841962,
+ "grad_norm": 10.398560523986816,
+ "learning_rate": 1.7315466018857505e-05,
+ "loss": 0.5665,
+ "step": 9602
+ },
+ {
+ "epoch": 26.166212534059945,
+ "grad_norm": 17.910289764404297,
+ "learning_rate": 1.7314864313082477e-05,
+ "loss": 0.5927,
+ "step": 9603
+ },
+ {
+ "epoch": 26.168937329700274,
+ "grad_norm": 7.854093551635742,
+ "learning_rate": 1.731426255033952e-05,
+ "loss": 0.5396,
+ "step": 9604
+ },
+ {
+ "epoch": 26.1716621253406,
+ "grad_norm": 6.922926902770996,
+ "learning_rate": 1.7313660730633324e-05,
+ "loss": 0.4514,
+ "step": 9605
+ },
+ {
+ "epoch": 26.174386920980925,
+ "grad_norm": 7.1274542808532715,
+ "learning_rate": 1.7313058853968572e-05,
+ "loss": 0.6428,
+ "step": 9606
+ },
+ {
+ "epoch": 26.177111716621255,
+ "grad_norm": 9.016749382019043,
+ "learning_rate": 1.731245692034995e-05,
+ "loss": 0.4739,
+ "step": 9607
+ },
+ {
+ "epoch": 26.17983651226158,
+ "grad_norm": 7.756386756896973,
+ "learning_rate": 1.7311854929782154e-05,
+ "loss": 0.5453,
+ "step": 9608
+ },
+ {
+ "epoch": 26.182561307901906,
+ "grad_norm": 27.780536651611328,
+ "learning_rate": 1.7311252882269864e-05,
+ "loss": 0.5505,
+ "step": 9609
+ },
+ {
+ "epoch": 26.185286103542236,
+ "grad_norm": 9.53674602508545,
+ "learning_rate": 1.7310650777817775e-05,
+ "loss": 0.6656,
+ "step": 9610
+ },
+ {
+ "epoch": 26.18801089918256,
+ "grad_norm": 7.744842052459717,
+ "learning_rate": 1.7310048616430572e-05,
+ "loss": 0.6854,
+ "step": 9611
+ },
+ {
+ "epoch": 26.190735694822887,
+ "grad_norm": 7.945459842681885,
+ "learning_rate": 1.7309446398112942e-05,
+ "loss": 0.5873,
+ "step": 9612
+ },
+ {
+ "epoch": 26.193460490463217,
+ "grad_norm": 8.727627754211426,
+ "learning_rate": 1.7308844122869583e-05,
+ "loss": 0.7332,
+ "step": 9613
+ },
+ {
+ "epoch": 26.196185286103542,
+ "grad_norm": 7.102766513824463,
+ "learning_rate": 1.7308241790705182e-05,
+ "loss": 0.7229,
+ "step": 9614
+ },
+ {
+ "epoch": 26.19891008174387,
+ "grad_norm": 7.141162395477295,
+ "learning_rate": 1.7307639401624426e-05,
+ "loss": 0.4993,
+ "step": 9615
+ },
+ {
+ "epoch": 26.201634877384198,
+ "grad_norm": 7.5889201164245605,
+ "learning_rate": 1.730703695563201e-05,
+ "loss": 0.4652,
+ "step": 9616
+ },
+ {
+ "epoch": 26.204359673024523,
+ "grad_norm": 6.298281669616699,
+ "learning_rate": 1.7306434452732626e-05,
+ "loss": 0.8528,
+ "step": 9617
+ },
+ {
+ "epoch": 26.20708446866485,
+ "grad_norm": 8.14534854888916,
+ "learning_rate": 1.7305831892930967e-05,
+ "loss": 0.4977,
+ "step": 9618
+ },
+ {
+ "epoch": 26.20980926430518,
+ "grad_norm": 8.6360502243042,
+ "learning_rate": 1.7305229276231723e-05,
+ "loss": 0.5149,
+ "step": 9619
+ },
+ {
+ "epoch": 26.212534059945504,
+ "grad_norm": 6.499998092651367,
+ "learning_rate": 1.7304626602639586e-05,
+ "loss": 0.6614,
+ "step": 9620
+ },
+ {
+ "epoch": 26.21525885558583,
+ "grad_norm": 7.012277603149414,
+ "learning_rate": 1.7304023872159253e-05,
+ "loss": 0.4642,
+ "step": 9621
+ },
+ {
+ "epoch": 26.21798365122616,
+ "grad_norm": 8.445688247680664,
+ "learning_rate": 1.7303421084795423e-05,
+ "loss": 0.5104,
+ "step": 9622
+ },
+ {
+ "epoch": 26.220708446866485,
+ "grad_norm": 8.20719051361084,
+ "learning_rate": 1.7302818240552775e-05,
+ "loss": 0.5985,
+ "step": 9623
+ },
+ {
+ "epoch": 26.22343324250681,
+ "grad_norm": 7.609731197357178,
+ "learning_rate": 1.7302215339436022e-05,
+ "loss": 0.4766,
+ "step": 9624
+ },
+ {
+ "epoch": 26.22615803814714,
+ "grad_norm": 7.7689995765686035,
+ "learning_rate": 1.7301612381449846e-05,
+ "loss": 0.4874,
+ "step": 9625
+ },
+ {
+ "epoch": 26.228882833787466,
+ "grad_norm": 7.080004692077637,
+ "learning_rate": 1.730100936659895e-05,
+ "loss": 0.7334,
+ "step": 9626
+ },
+ {
+ "epoch": 26.231607629427792,
+ "grad_norm": 6.169990539550781,
+ "learning_rate": 1.7300406294888027e-05,
+ "loss": 0.6745,
+ "step": 9627
+ },
+ {
+ "epoch": 26.23433242506812,
+ "grad_norm": 9.814729690551758,
+ "learning_rate": 1.7299803166321778e-05,
+ "loss": 0.7088,
+ "step": 9628
+ },
+ {
+ "epoch": 26.237057220708447,
+ "grad_norm": 7.300668716430664,
+ "learning_rate": 1.729919998090489e-05,
+ "loss": 0.5634,
+ "step": 9629
+ },
+ {
+ "epoch": 26.239782016348773,
+ "grad_norm": 8.827960014343262,
+ "learning_rate": 1.7298596738642074e-05,
+ "loss": 0.5107,
+ "step": 9630
+ },
+ {
+ "epoch": 26.242506811989102,
+ "grad_norm": 8.249507904052734,
+ "learning_rate": 1.7297993439538017e-05,
+ "loss": 0.4824,
+ "step": 9631
+ },
+ {
+ "epoch": 26.245231607629428,
+ "grad_norm": 9.042924880981445,
+ "learning_rate": 1.7297390083597426e-05,
+ "loss": 0.5739,
+ "step": 9632
+ },
+ {
+ "epoch": 26.247956403269754,
+ "grad_norm": 7.981200218200684,
+ "learning_rate": 1.7296786670824993e-05,
+ "loss": 0.6775,
+ "step": 9633
+ },
+ {
+ "epoch": 26.250681198910083,
+ "grad_norm": 8.520824432373047,
+ "learning_rate": 1.7296183201225422e-05,
+ "loss": 0.5093,
+ "step": 9634
+ },
+ {
+ "epoch": 26.25340599455041,
+ "grad_norm": 6.9999589920043945,
+ "learning_rate": 1.729557967480341e-05,
+ "loss": 0.4789,
+ "step": 9635
+ },
+ {
+ "epoch": 26.256130790190735,
+ "grad_norm": 8.646928787231445,
+ "learning_rate": 1.7294976091563663e-05,
+ "loss": 0.5217,
+ "step": 9636
+ },
+ {
+ "epoch": 26.258855585831064,
+ "grad_norm": 7.401947498321533,
+ "learning_rate": 1.729437245151087e-05,
+ "loss": 0.4224,
+ "step": 9637
+ },
+ {
+ "epoch": 26.26158038147139,
+ "grad_norm": 22.106281280517578,
+ "learning_rate": 1.7293768754649743e-05,
+ "loss": 0.4922,
+ "step": 9638
+ },
+ {
+ "epoch": 26.264305177111716,
+ "grad_norm": 8.012722969055176,
+ "learning_rate": 1.7293165000984977e-05,
+ "loss": 0.6678,
+ "step": 9639
+ },
+ {
+ "epoch": 26.267029972752045,
+ "grad_norm": 7.759902000427246,
+ "learning_rate": 1.729256119052128e-05,
+ "loss": 0.5939,
+ "step": 9640
+ },
+ {
+ "epoch": 26.26975476839237,
+ "grad_norm": 20.350008010864258,
+ "learning_rate": 1.729195732326335e-05,
+ "loss": 0.5517,
+ "step": 9641
+ },
+ {
+ "epoch": 26.272479564032697,
+ "grad_norm": 7.252711296081543,
+ "learning_rate": 1.729135339921589e-05,
+ "loss": 0.6181,
+ "step": 9642
+ },
+ {
+ "epoch": 26.275204359673026,
+ "grad_norm": 7.245285511016846,
+ "learning_rate": 1.7290749418383604e-05,
+ "loss": 0.5903,
+ "step": 9643
+ },
+ {
+ "epoch": 26.277929155313352,
+ "grad_norm": 7.566021919250488,
+ "learning_rate": 1.72901453807712e-05,
+ "loss": 0.5847,
+ "step": 9644
+ },
+ {
+ "epoch": 26.280653950953678,
+ "grad_norm": 7.564478397369385,
+ "learning_rate": 1.7289541286383374e-05,
+ "loss": 0.609,
+ "step": 9645
+ },
+ {
+ "epoch": 26.283378746594007,
+ "grad_norm": 14.416666984558105,
+ "learning_rate": 1.7288937135224833e-05,
+ "loss": 0.4868,
+ "step": 9646
+ },
+ {
+ "epoch": 26.286103542234333,
+ "grad_norm": 9.122889518737793,
+ "learning_rate": 1.7288332927300292e-05,
+ "loss": 0.5007,
+ "step": 9647
+ },
+ {
+ "epoch": 26.28882833787466,
+ "grad_norm": 7.749236583709717,
+ "learning_rate": 1.7287728662614444e-05,
+ "loss": 0.6157,
+ "step": 9648
+ },
+ {
+ "epoch": 26.291553133514988,
+ "grad_norm": 11.464571952819824,
+ "learning_rate": 1.7287124341171998e-05,
+ "loss": 0.4988,
+ "step": 9649
+ },
+ {
+ "epoch": 26.294277929155314,
+ "grad_norm": 7.148604393005371,
+ "learning_rate": 1.7286519962977663e-05,
+ "loss": 0.5306,
+ "step": 9650
+ },
+ {
+ "epoch": 26.29700272479564,
+ "grad_norm": 7.657546043395996,
+ "learning_rate": 1.728591552803615e-05,
+ "loss": 0.5533,
+ "step": 9651
+ },
+ {
+ "epoch": 26.29972752043597,
+ "grad_norm": 8.062553405761719,
+ "learning_rate": 1.7285311036352156e-05,
+ "loss": 0.6571,
+ "step": 9652
+ },
+ {
+ "epoch": 26.302452316076295,
+ "grad_norm": 7.646594524383545,
+ "learning_rate": 1.7284706487930396e-05,
+ "loss": 0.7164,
+ "step": 9653
+ },
+ {
+ "epoch": 26.30517711171662,
+ "grad_norm": 8.308866500854492,
+ "learning_rate": 1.7284101882775575e-05,
+ "loss": 0.6648,
+ "step": 9654
+ },
+ {
+ "epoch": 26.30790190735695,
+ "grad_norm": 8.04058837890625,
+ "learning_rate": 1.7283497220892406e-05,
+ "loss": 0.4776,
+ "step": 9655
+ },
+ {
+ "epoch": 26.310626702997276,
+ "grad_norm": 8.126984596252441,
+ "learning_rate": 1.728289250228559e-05,
+ "loss": 0.5143,
+ "step": 9656
+ },
+ {
+ "epoch": 26.3133514986376,
+ "grad_norm": 6.92857027053833,
+ "learning_rate": 1.7282287726959847e-05,
+ "loss": 0.6617,
+ "step": 9657
+ },
+ {
+ "epoch": 26.31607629427793,
+ "grad_norm": 7.771056652069092,
+ "learning_rate": 1.728168289491988e-05,
+ "loss": 0.5382,
+ "step": 9658
+ },
+ {
+ "epoch": 26.318801089918257,
+ "grad_norm": 7.239190101623535,
+ "learning_rate": 1.72810780061704e-05,
+ "loss": 0.4505,
+ "step": 9659
+ },
+ {
+ "epoch": 26.321525885558582,
+ "grad_norm": 8.406765937805176,
+ "learning_rate": 1.728047306071612e-05,
+ "loss": 0.6041,
+ "step": 9660
+ },
+ {
+ "epoch": 26.32425068119891,
+ "grad_norm": 9.182141304016113,
+ "learning_rate": 1.727986805856175e-05,
+ "loss": 0.4531,
+ "step": 9661
+ },
+ {
+ "epoch": 26.326975476839237,
+ "grad_norm": 7.7115631103515625,
+ "learning_rate": 1.7279262999712e-05,
+ "loss": 0.4387,
+ "step": 9662
+ },
+ {
+ "epoch": 26.329700272479563,
+ "grad_norm": 8.787193298339844,
+ "learning_rate": 1.7278657884171585e-05,
+ "loss": 0.6171,
+ "step": 9663
+ },
+ {
+ "epoch": 26.332425068119893,
+ "grad_norm": 8.689203262329102,
+ "learning_rate": 1.7278052711945218e-05,
+ "loss": 0.5219,
+ "step": 9664
+ },
+ {
+ "epoch": 26.33514986376022,
+ "grad_norm": 6.698019027709961,
+ "learning_rate": 1.7277447483037608e-05,
+ "loss": 0.5166,
+ "step": 9665
+ },
+ {
+ "epoch": 26.337874659400544,
+ "grad_norm": 8.592679977416992,
+ "learning_rate": 1.7276842197453475e-05,
+ "loss": 0.5221,
+ "step": 9666
+ },
+ {
+ "epoch": 26.340599455040874,
+ "grad_norm": 9.411178588867188,
+ "learning_rate": 1.7276236855197526e-05,
+ "loss": 0.6801,
+ "step": 9667
+ },
+ {
+ "epoch": 26.3433242506812,
+ "grad_norm": 9.463963508605957,
+ "learning_rate": 1.7275631456274476e-05,
+ "loss": 0.5466,
+ "step": 9668
+ },
+ {
+ "epoch": 26.346049046321525,
+ "grad_norm": 7.92461633682251,
+ "learning_rate": 1.727502600068905e-05,
+ "loss": 0.5344,
+ "step": 9669
+ },
+ {
+ "epoch": 26.348773841961854,
+ "grad_norm": 6.824985504150391,
+ "learning_rate": 1.727442048844595e-05,
+ "loss": 0.755,
+ "step": 9670
+ },
+ {
+ "epoch": 26.35149863760218,
+ "grad_norm": 8.3933744430542,
+ "learning_rate": 1.72738149195499e-05,
+ "loss": 0.7602,
+ "step": 9671
+ },
+ {
+ "epoch": 26.354223433242506,
+ "grad_norm": 9.247557640075684,
+ "learning_rate": 1.727320929400561e-05,
+ "loss": 0.5687,
+ "step": 9672
+ },
+ {
+ "epoch": 26.356948228882835,
+ "grad_norm": 8.802834510803223,
+ "learning_rate": 1.7272603611817803e-05,
+ "loss": 0.5789,
+ "step": 9673
+ },
+ {
+ "epoch": 26.35967302452316,
+ "grad_norm": 24.909435272216797,
+ "learning_rate": 1.7271997872991192e-05,
+ "loss": 0.5758,
+ "step": 9674
+ },
+ {
+ "epoch": 26.362397820163487,
+ "grad_norm": 7.1943817138671875,
+ "learning_rate": 1.7271392077530498e-05,
+ "loss": 0.6175,
+ "step": 9675
+ },
+ {
+ "epoch": 26.365122615803816,
+ "grad_norm": 9.605677604675293,
+ "learning_rate": 1.7270786225440434e-05,
+ "loss": 0.4918,
+ "step": 9676
+ },
+ {
+ "epoch": 26.367847411444142,
+ "grad_norm": 8.220892906188965,
+ "learning_rate": 1.727018031672572e-05,
+ "loss": 0.6282,
+ "step": 9677
+ },
+ {
+ "epoch": 26.370572207084468,
+ "grad_norm": 10.437742233276367,
+ "learning_rate": 1.726957435139108e-05,
+ "loss": 0.5023,
+ "step": 9678
+ },
+ {
+ "epoch": 26.373297002724797,
+ "grad_norm": 17.860620498657227,
+ "learning_rate": 1.7268968329441226e-05,
+ "loss": 0.5096,
+ "step": 9679
+ },
+ {
+ "epoch": 26.376021798365123,
+ "grad_norm": 7.564548015594482,
+ "learning_rate": 1.7268362250880878e-05,
+ "loss": 0.6897,
+ "step": 9680
+ },
+ {
+ "epoch": 26.37874659400545,
+ "grad_norm": 8.498891830444336,
+ "learning_rate": 1.726775611571476e-05,
+ "loss": 0.5014,
+ "step": 9681
+ },
+ {
+ "epoch": 26.381471389645778,
+ "grad_norm": 8.183478355407715,
+ "learning_rate": 1.7267149923947598e-05,
+ "loss": 0.5712,
+ "step": 9682
+ },
+ {
+ "epoch": 26.384196185286104,
+ "grad_norm": 8.678196907043457,
+ "learning_rate": 1.72665436755841e-05,
+ "loss": 0.5667,
+ "step": 9683
+ },
+ {
+ "epoch": 26.38692098092643,
+ "grad_norm": 8.562444686889648,
+ "learning_rate": 1.7265937370628995e-05,
+ "loss": 0.5267,
+ "step": 9684
+ },
+ {
+ "epoch": 26.38964577656676,
+ "grad_norm": 6.696924686431885,
+ "learning_rate": 1.7265331009087004e-05,
+ "loss": 0.5307,
+ "step": 9685
+ },
+ {
+ "epoch": 26.392370572207085,
+ "grad_norm": 6.626930236816406,
+ "learning_rate": 1.7264724590962846e-05,
+ "loss": 0.4725,
+ "step": 9686
+ },
+ {
+ "epoch": 26.39509536784741,
+ "grad_norm": 9.666239738464355,
+ "learning_rate": 1.726411811626125e-05,
+ "loss": 0.561,
+ "step": 9687
+ },
+ {
+ "epoch": 26.39782016348774,
+ "grad_norm": 8.817061424255371,
+ "learning_rate": 1.7263511584986935e-05,
+ "loss": 0.6234,
+ "step": 9688
+ },
+ {
+ "epoch": 26.400544959128066,
+ "grad_norm": 9.749441146850586,
+ "learning_rate": 1.7262904997144626e-05,
+ "loss": 0.5256,
+ "step": 9689
+ },
+ {
+ "epoch": 26.40326975476839,
+ "grad_norm": 11.836180686950684,
+ "learning_rate": 1.7262298352739048e-05,
+ "loss": 0.5289,
+ "step": 9690
+ },
+ {
+ "epoch": 26.40599455040872,
+ "grad_norm": 8.412851333618164,
+ "learning_rate": 1.7261691651774922e-05,
+ "loss": 0.6529,
+ "step": 9691
+ },
+ {
+ "epoch": 26.408719346049047,
+ "grad_norm": 8.265201568603516,
+ "learning_rate": 1.7261084894256975e-05,
+ "loss": 0.6555,
+ "step": 9692
+ },
+ {
+ "epoch": 26.411444141689373,
+ "grad_norm": 7.24312686920166,
+ "learning_rate": 1.7260478080189932e-05,
+ "loss": 0.6314,
+ "step": 9693
+ },
+ {
+ "epoch": 26.414168937329702,
+ "grad_norm": 8.179997444152832,
+ "learning_rate": 1.725987120957852e-05,
+ "loss": 0.711,
+ "step": 9694
+ },
+ {
+ "epoch": 26.416893732970028,
+ "grad_norm": 7.774048328399658,
+ "learning_rate": 1.7259264282427467e-05,
+ "loss": 0.5784,
+ "step": 9695
+ },
+ {
+ "epoch": 26.419618528610354,
+ "grad_norm": 9.335322380065918,
+ "learning_rate": 1.7258657298741494e-05,
+ "loss": 0.4728,
+ "step": 9696
+ },
+ {
+ "epoch": 26.422343324250683,
+ "grad_norm": 8.457154273986816,
+ "learning_rate": 1.7258050258525335e-05,
+ "loss": 0.5094,
+ "step": 9697
+ },
+ {
+ "epoch": 26.42506811989101,
+ "grad_norm": 8.617023468017578,
+ "learning_rate": 1.7257443161783712e-05,
+ "loss": 0.4645,
+ "step": 9698
+ },
+ {
+ "epoch": 26.427792915531334,
+ "grad_norm": 19.97624969482422,
+ "learning_rate": 1.7256836008521354e-05,
+ "loss": 0.666,
+ "step": 9699
+ },
+ {
+ "epoch": 26.430517711171664,
+ "grad_norm": 8.577537536621094,
+ "learning_rate": 1.725622879874299e-05,
+ "loss": 0.4655,
+ "step": 9700
+ },
+ {
+ "epoch": 26.43324250681199,
+ "grad_norm": 8.199747085571289,
+ "learning_rate": 1.7255621532453356e-05,
+ "loss": 0.591,
+ "step": 9701
+ },
+ {
+ "epoch": 26.435967302452315,
+ "grad_norm": 8.759621620178223,
+ "learning_rate": 1.725501420965717e-05,
+ "loss": 0.4586,
+ "step": 9702
+ },
+ {
+ "epoch": 26.438692098092645,
+ "grad_norm": 7.397414684295654,
+ "learning_rate": 1.7254406830359166e-05,
+ "loss": 0.5256,
+ "step": 9703
+ },
+ {
+ "epoch": 26.44141689373297,
+ "grad_norm": 10.123652458190918,
+ "learning_rate": 1.725379939456408e-05,
+ "loss": 0.4986,
+ "step": 9704
+ },
+ {
+ "epoch": 26.444141689373296,
+ "grad_norm": 7.325468063354492,
+ "learning_rate": 1.7253191902276634e-05,
+ "loss": 0.5513,
+ "step": 9705
+ },
+ {
+ "epoch": 26.446866485013626,
+ "grad_norm": 11.196511268615723,
+ "learning_rate": 1.725258435350156e-05,
+ "loss": 0.6641,
+ "step": 9706
+ },
+ {
+ "epoch": 26.44959128065395,
+ "grad_norm": 15.448986053466797,
+ "learning_rate": 1.7251976748243597e-05,
+ "loss": 0.6542,
+ "step": 9707
+ },
+ {
+ "epoch": 26.452316076294277,
+ "grad_norm": 8.92198657989502,
+ "learning_rate": 1.7251369086507472e-05,
+ "loss": 0.6694,
+ "step": 9708
+ },
+ {
+ "epoch": 26.455040871934607,
+ "grad_norm": 22.12588882446289,
+ "learning_rate": 1.725076136829792e-05,
+ "loss": 0.6179,
+ "step": 9709
+ },
+ {
+ "epoch": 26.457765667574932,
+ "grad_norm": 9.834114074707031,
+ "learning_rate": 1.725015359361967e-05,
+ "loss": 0.7356,
+ "step": 9710
+ },
+ {
+ "epoch": 26.460490463215258,
+ "grad_norm": 8.150346755981445,
+ "learning_rate": 1.7249545762477454e-05,
+ "loss": 0.5803,
+ "step": 9711
+ },
+ {
+ "epoch": 26.463215258855588,
+ "grad_norm": 10.009634971618652,
+ "learning_rate": 1.7248937874876013e-05,
+ "loss": 0.5165,
+ "step": 9712
+ },
+ {
+ "epoch": 26.465940054495913,
+ "grad_norm": 9.49602222442627,
+ "learning_rate": 1.7248329930820076e-05,
+ "loss": 0.4071,
+ "step": 9713
+ },
+ {
+ "epoch": 26.46866485013624,
+ "grad_norm": 8.119736671447754,
+ "learning_rate": 1.7247721930314377e-05,
+ "loss": 0.5149,
+ "step": 9714
+ },
+ {
+ "epoch": 26.47138964577657,
+ "grad_norm": 9.511920928955078,
+ "learning_rate": 1.7247113873363656e-05,
+ "loss": 0.5853,
+ "step": 9715
+ },
+ {
+ "epoch": 26.474114441416894,
+ "grad_norm": 8.866805076599121,
+ "learning_rate": 1.7246505759972643e-05,
+ "loss": 0.559,
+ "step": 9716
+ },
+ {
+ "epoch": 26.47683923705722,
+ "grad_norm": 27.62454605102539,
+ "learning_rate": 1.7245897590146078e-05,
+ "loss": 0.6063,
+ "step": 9717
+ },
+ {
+ "epoch": 26.479564032697546,
+ "grad_norm": 12.811103820800781,
+ "learning_rate": 1.7245289363888694e-05,
+ "loss": 0.5844,
+ "step": 9718
+ },
+ {
+ "epoch": 26.482288828337875,
+ "grad_norm": 7.823066711425781,
+ "learning_rate": 1.7244681081205227e-05,
+ "loss": 0.4919,
+ "step": 9719
+ },
+ {
+ "epoch": 26.4850136239782,
+ "grad_norm": 5.938113689422607,
+ "learning_rate": 1.7244072742100422e-05,
+ "loss": 0.4162,
+ "step": 9720
+ },
+ {
+ "epoch": 26.48773841961853,
+ "grad_norm": 8.288970947265625,
+ "learning_rate": 1.724346434657901e-05,
+ "loss": 0.6464,
+ "step": 9721
+ },
+ {
+ "epoch": 26.490463215258856,
+ "grad_norm": 15.540919303894043,
+ "learning_rate": 1.724285589464573e-05,
+ "loss": 0.4741,
+ "step": 9722
+ },
+ {
+ "epoch": 26.493188010899182,
+ "grad_norm": 9.762518882751465,
+ "learning_rate": 1.7242247386305324e-05,
+ "loss": 0.5653,
+ "step": 9723
+ },
+ {
+ "epoch": 26.495912806539508,
+ "grad_norm": 9.49687385559082,
+ "learning_rate": 1.7241638821562526e-05,
+ "loss": 0.4958,
+ "step": 9724
+ },
+ {
+ "epoch": 26.498637602179837,
+ "grad_norm": 8.982109069824219,
+ "learning_rate": 1.7241030200422078e-05,
+ "loss": 0.5706,
+ "step": 9725
+ },
+ {
+ "epoch": 26.501362397820163,
+ "grad_norm": 22.22509002685547,
+ "learning_rate": 1.724042152288872e-05,
+ "loss": 0.541,
+ "step": 9726
+ },
+ {
+ "epoch": 26.504087193460492,
+ "grad_norm": 9.978806495666504,
+ "learning_rate": 1.7239812788967195e-05,
+ "loss": 0.5566,
+ "step": 9727
+ },
+ {
+ "epoch": 26.506811989100818,
+ "grad_norm": 9.385416030883789,
+ "learning_rate": 1.7239203998662234e-05,
+ "loss": 0.5651,
+ "step": 9728
+ },
+ {
+ "epoch": 26.509536784741144,
+ "grad_norm": 10.099444389343262,
+ "learning_rate": 1.7238595151978593e-05,
+ "loss": 0.526,
+ "step": 9729
+ },
+ {
+ "epoch": 26.51226158038147,
+ "grad_norm": 7.989203929901123,
+ "learning_rate": 1.7237986248921003e-05,
+ "loss": 0.5272,
+ "step": 9730
+ },
+ {
+ "epoch": 26.5149863760218,
+ "grad_norm": 7.509270668029785,
+ "learning_rate": 1.7237377289494207e-05,
+ "loss": 0.6298,
+ "step": 9731
+ },
+ {
+ "epoch": 26.517711171662125,
+ "grad_norm": 10.203505516052246,
+ "learning_rate": 1.7236768273702952e-05,
+ "loss": 0.505,
+ "step": 9732
+ },
+ {
+ "epoch": 26.520435967302454,
+ "grad_norm": 8.250483512878418,
+ "learning_rate": 1.7236159201551978e-05,
+ "loss": 0.5259,
+ "step": 9733
+ },
+ {
+ "epoch": 26.52316076294278,
+ "grad_norm": 8.439765930175781,
+ "learning_rate": 1.723555007304603e-05,
+ "loss": 0.5204,
+ "step": 9734
+ },
+ {
+ "epoch": 26.525885558583106,
+ "grad_norm": 7.641886234283447,
+ "learning_rate": 1.7234940888189847e-05,
+ "loss": 0.4673,
+ "step": 9735
+ },
+ {
+ "epoch": 26.52861035422343,
+ "grad_norm": 10.620079040527344,
+ "learning_rate": 1.7234331646988183e-05,
+ "loss": 0.5453,
+ "step": 9736
+ },
+ {
+ "epoch": 26.53133514986376,
+ "grad_norm": 7.982536315917969,
+ "learning_rate": 1.7233722349445774e-05,
+ "loss": 0.5303,
+ "step": 9737
+ },
+ {
+ "epoch": 26.534059945504087,
+ "grad_norm": 10.731901168823242,
+ "learning_rate": 1.7233112995567366e-05,
+ "loss": 0.5692,
+ "step": 9738
+ },
+ {
+ "epoch": 26.536784741144416,
+ "grad_norm": 8.416155815124512,
+ "learning_rate": 1.723250358535771e-05,
+ "loss": 0.557,
+ "step": 9739
+ },
+ {
+ "epoch": 26.539509536784742,
+ "grad_norm": 8.52946662902832,
+ "learning_rate": 1.723189411882155e-05,
+ "loss": 0.6161,
+ "step": 9740
+ },
+ {
+ "epoch": 26.542234332425068,
+ "grad_norm": 6.650148391723633,
+ "learning_rate": 1.723128459596363e-05,
+ "loss": 0.5844,
+ "step": 9741
+ },
+ {
+ "epoch": 26.544959128065393,
+ "grad_norm": 8.657482147216797,
+ "learning_rate": 1.7230675016788697e-05,
+ "loss": 0.5673,
+ "step": 9742
+ },
+ {
+ "epoch": 26.547683923705723,
+ "grad_norm": 9.079556465148926,
+ "learning_rate": 1.72300653813015e-05,
+ "loss": 0.5774,
+ "step": 9743
+ },
+ {
+ "epoch": 26.55040871934605,
+ "grad_norm": 7.331713676452637,
+ "learning_rate": 1.7229455689506786e-05,
+ "loss": 0.6069,
+ "step": 9744
+ },
+ {
+ "epoch": 26.553133514986374,
+ "grad_norm": 8.788839340209961,
+ "learning_rate": 1.7228845941409304e-05,
+ "loss": 0.6886,
+ "step": 9745
+ },
+ {
+ "epoch": 26.555858310626704,
+ "grad_norm": 16.687707901000977,
+ "learning_rate": 1.7228236137013804e-05,
+ "loss": 0.5566,
+ "step": 9746
+ },
+ {
+ "epoch": 26.55858310626703,
+ "grad_norm": 10.596636772155762,
+ "learning_rate": 1.7227626276325033e-05,
+ "loss": 0.4482,
+ "step": 9747
+ },
+ {
+ "epoch": 26.561307901907355,
+ "grad_norm": 6.884238243103027,
+ "learning_rate": 1.722701635934774e-05,
+ "loss": 0.5292,
+ "step": 9748
+ },
+ {
+ "epoch": 26.564032697547685,
+ "grad_norm": 19.73212242126465,
+ "learning_rate": 1.7226406386086675e-05,
+ "loss": 0.6209,
+ "step": 9749
+ },
+ {
+ "epoch": 26.56675749318801,
+ "grad_norm": 10.994420051574707,
+ "learning_rate": 1.7225796356546592e-05,
+ "loss": 0.7026,
+ "step": 9750
+ },
+ {
+ "epoch": 26.569482288828336,
+ "grad_norm": 10.321929931640625,
+ "learning_rate": 1.7225186270732242e-05,
+ "loss": 0.6399,
+ "step": 9751
+ },
+ {
+ "epoch": 26.572207084468666,
+ "grad_norm": 9.506365776062012,
+ "learning_rate": 1.722457612864837e-05,
+ "loss": 0.5134,
+ "step": 9752
+ },
+ {
+ "epoch": 26.57493188010899,
+ "grad_norm": 7.55317497253418,
+ "learning_rate": 1.7223965930299732e-05,
+ "loss": 0.542,
+ "step": 9753
+ },
+ {
+ "epoch": 26.577656675749317,
+ "grad_norm": 7.067741394042969,
+ "learning_rate": 1.722335567569108e-05,
+ "loss": 0.76,
+ "step": 9754
+ },
+ {
+ "epoch": 26.580381471389646,
+ "grad_norm": 8.14130687713623,
+ "learning_rate": 1.7222745364827167e-05,
+ "loss": 0.4661,
+ "step": 9755
+ },
+ {
+ "epoch": 26.583106267029972,
+ "grad_norm": 8.30457592010498,
+ "learning_rate": 1.7222134997712748e-05,
+ "loss": 0.7259,
+ "step": 9756
+ },
+ {
+ "epoch": 26.585831062670298,
+ "grad_norm": 8.38310718536377,
+ "learning_rate": 1.722152457435257e-05,
+ "loss": 0.6436,
+ "step": 9757
+ },
+ {
+ "epoch": 26.588555858310627,
+ "grad_norm": 10.805953025817871,
+ "learning_rate": 1.722091409475139e-05,
+ "loss": 0.733,
+ "step": 9758
+ },
+ {
+ "epoch": 26.591280653950953,
+ "grad_norm": 8.848837852478027,
+ "learning_rate": 1.722030355891397e-05,
+ "loss": 0.5511,
+ "step": 9759
+ },
+ {
+ "epoch": 26.59400544959128,
+ "grad_norm": 54.405826568603516,
+ "learning_rate": 1.721969296684505e-05,
+ "loss": 0.4696,
+ "step": 9760
+ },
+ {
+ "epoch": 26.59673024523161,
+ "grad_norm": 13.935903549194336,
+ "learning_rate": 1.72190823185494e-05,
+ "loss": 0.5378,
+ "step": 9761
+ },
+ {
+ "epoch": 26.599455040871934,
+ "grad_norm": 7.5879435539245605,
+ "learning_rate": 1.721847161403177e-05,
+ "loss": 0.7851,
+ "step": 9762
+ },
+ {
+ "epoch": 26.60217983651226,
+ "grad_norm": 8.205209732055664,
+ "learning_rate": 1.721786085329691e-05,
+ "loss": 0.4768,
+ "step": 9763
+ },
+ {
+ "epoch": 26.60490463215259,
+ "grad_norm": 8.208876609802246,
+ "learning_rate": 1.7217250036349584e-05,
+ "loss": 0.5588,
+ "step": 9764
+ },
+ {
+ "epoch": 26.607629427792915,
+ "grad_norm": 17.013639450073242,
+ "learning_rate": 1.721663916319455e-05,
+ "loss": 0.527,
+ "step": 9765
+ },
+ {
+ "epoch": 26.61035422343324,
+ "grad_norm": 17.2004337310791,
+ "learning_rate": 1.721602823383656e-05,
+ "loss": 0.5312,
+ "step": 9766
+ },
+ {
+ "epoch": 26.61307901907357,
+ "grad_norm": 25.651762008666992,
+ "learning_rate": 1.7215417248280374e-05,
+ "loss": 0.7311,
+ "step": 9767
+ },
+ {
+ "epoch": 26.615803814713896,
+ "grad_norm": 27.533079147338867,
+ "learning_rate": 1.721480620653075e-05,
+ "loss": 0.6274,
+ "step": 9768
+ },
+ {
+ "epoch": 26.618528610354222,
+ "grad_norm": 10.6248197555542,
+ "learning_rate": 1.7214195108592448e-05,
+ "loss": 0.6133,
+ "step": 9769
+ },
+ {
+ "epoch": 26.62125340599455,
+ "grad_norm": 10.059863090515137,
+ "learning_rate": 1.7213583954470228e-05,
+ "loss": 0.7231,
+ "step": 9770
+ },
+ {
+ "epoch": 26.623978201634877,
+ "grad_norm": 8.468740463256836,
+ "learning_rate": 1.721297274416885e-05,
+ "loss": 0.5704,
+ "step": 9771
+ },
+ {
+ "epoch": 26.626702997275203,
+ "grad_norm": 9.464869499206543,
+ "learning_rate": 1.7212361477693068e-05,
+ "loss": 0.5226,
+ "step": 9772
+ },
+ {
+ "epoch": 26.629427792915532,
+ "grad_norm": 10.510021209716797,
+ "learning_rate": 1.721175015504765e-05,
+ "loss": 0.5062,
+ "step": 9773
+ },
+ {
+ "epoch": 26.632152588555858,
+ "grad_norm": 8.539653778076172,
+ "learning_rate": 1.721113877623735e-05,
+ "loss": 0.5445,
+ "step": 9774
+ },
+ {
+ "epoch": 26.634877384196184,
+ "grad_norm": 11.123778343200684,
+ "learning_rate": 1.7210527341266936e-05,
+ "loss": 0.6424,
+ "step": 9775
+ },
+ {
+ "epoch": 26.637602179836513,
+ "grad_norm": 10.299055099487305,
+ "learning_rate": 1.720991585014117e-05,
+ "loss": 0.5608,
+ "step": 9776
+ },
+ {
+ "epoch": 26.64032697547684,
+ "grad_norm": 8.966005325317383,
+ "learning_rate": 1.7209304302864808e-05,
+ "loss": 0.543,
+ "step": 9777
+ },
+ {
+ "epoch": 26.643051771117165,
+ "grad_norm": 8.661131858825684,
+ "learning_rate": 1.7208692699442618e-05,
+ "loss": 0.4578,
+ "step": 9778
+ },
+ {
+ "epoch": 26.645776566757494,
+ "grad_norm": 8.650118827819824,
+ "learning_rate": 1.7208081039879355e-05,
+ "loss": 0.5977,
+ "step": 9779
+ },
+ {
+ "epoch": 26.64850136239782,
+ "grad_norm": 9.450804710388184,
+ "learning_rate": 1.7207469324179796e-05,
+ "loss": 0.6046,
+ "step": 9780
+ },
+ {
+ "epoch": 26.651226158038146,
+ "grad_norm": 7.290467739105225,
+ "learning_rate": 1.7206857552348696e-05,
+ "loss": 0.636,
+ "step": 9781
+ },
+ {
+ "epoch": 26.653950953678475,
+ "grad_norm": 8.39273452758789,
+ "learning_rate": 1.720624572439082e-05,
+ "loss": 0.553,
+ "step": 9782
+ },
+ {
+ "epoch": 26.6566757493188,
+ "grad_norm": 10.417442321777344,
+ "learning_rate": 1.7205633840310935e-05,
+ "loss": 0.6809,
+ "step": 9783
+ },
+ {
+ "epoch": 26.659400544959126,
+ "grad_norm": 9.35910701751709,
+ "learning_rate": 1.7205021900113808e-05,
+ "loss": 0.5734,
+ "step": 9784
+ },
+ {
+ "epoch": 26.662125340599456,
+ "grad_norm": 8.904742240905762,
+ "learning_rate": 1.72044099038042e-05,
+ "loss": 0.6603,
+ "step": 9785
+ },
+ {
+ "epoch": 26.66485013623978,
+ "grad_norm": 8.284513473510742,
+ "learning_rate": 1.7203797851386878e-05,
+ "loss": 0.5482,
+ "step": 9786
+ },
+ {
+ "epoch": 26.667574931880107,
+ "grad_norm": 7.7133870124816895,
+ "learning_rate": 1.720318574286661e-05,
+ "loss": 0.4943,
+ "step": 9787
+ },
+ {
+ "epoch": 26.670299727520437,
+ "grad_norm": 7.952728271484375,
+ "learning_rate": 1.7202573578248166e-05,
+ "loss": 0.5464,
+ "step": 9788
+ },
+ {
+ "epoch": 26.673024523160763,
+ "grad_norm": 10.20577621459961,
+ "learning_rate": 1.7201961357536313e-05,
+ "loss": 0.5574,
+ "step": 9789
+ },
+ {
+ "epoch": 26.67574931880109,
+ "grad_norm": 8.854503631591797,
+ "learning_rate": 1.720134908073581e-05,
+ "loss": 0.557,
+ "step": 9790
+ },
+ {
+ "epoch": 26.678474114441418,
+ "grad_norm": 7.459747314453125,
+ "learning_rate": 1.720073674785144e-05,
+ "loss": 0.4844,
+ "step": 9791
+ },
+ {
+ "epoch": 26.681198910081743,
+ "grad_norm": 7.778055667877197,
+ "learning_rate": 1.720012435888796e-05,
+ "loss": 0.5489,
+ "step": 9792
+ },
+ {
+ "epoch": 26.68392370572207,
+ "grad_norm": 7.30932092666626,
+ "learning_rate": 1.7199511913850142e-05,
+ "loss": 0.5255,
+ "step": 9793
+ },
+ {
+ "epoch": 26.6866485013624,
+ "grad_norm": 9.2329740524292,
+ "learning_rate": 1.7198899412742756e-05,
+ "loss": 0.6163,
+ "step": 9794
+ },
+ {
+ "epoch": 26.689373297002724,
+ "grad_norm": 9.634840965270996,
+ "learning_rate": 1.7198286855570575e-05,
+ "loss": 0.6769,
+ "step": 9795
+ },
+ {
+ "epoch": 26.69209809264305,
+ "grad_norm": 9.673457145690918,
+ "learning_rate": 1.719767424233837e-05,
+ "loss": 0.6982,
+ "step": 9796
+ },
+ {
+ "epoch": 26.69482288828338,
+ "grad_norm": 12.041887283325195,
+ "learning_rate": 1.719706157305091e-05,
+ "loss": 0.6368,
+ "step": 9797
+ },
+ {
+ "epoch": 26.697547683923705,
+ "grad_norm": 7.8084821701049805,
+ "learning_rate": 1.719644884771296e-05,
+ "loss": 0.4594,
+ "step": 9798
+ },
+ {
+ "epoch": 26.70027247956403,
+ "grad_norm": 7.280473232269287,
+ "learning_rate": 1.7195836066329304e-05,
+ "loss": 0.6399,
+ "step": 9799
+ },
+ {
+ "epoch": 26.70299727520436,
+ "grad_norm": 8.602075576782227,
+ "learning_rate": 1.7195223228904705e-05,
+ "loss": 0.5395,
+ "step": 9800
+ },
+ {
+ "epoch": 26.705722070844686,
+ "grad_norm": 7.182285785675049,
+ "learning_rate": 1.719461033544394e-05,
+ "loss": 0.4574,
+ "step": 9801
+ },
+ {
+ "epoch": 26.708446866485012,
+ "grad_norm": 13.214006423950195,
+ "learning_rate": 1.719399738595178e-05,
+ "loss": 0.6719,
+ "step": 9802
+ },
+ {
+ "epoch": 26.71117166212534,
+ "grad_norm": 6.748271942138672,
+ "learning_rate": 1.7193384380433e-05,
+ "loss": 0.5078,
+ "step": 9803
+ },
+ {
+ "epoch": 26.713896457765667,
+ "grad_norm": 8.99386978149414,
+ "learning_rate": 1.7192771318892377e-05,
+ "loss": 0.548,
+ "step": 9804
+ },
+ {
+ "epoch": 26.716621253405993,
+ "grad_norm": 7.487708568572998,
+ "learning_rate": 1.719215820133468e-05,
+ "loss": 0.4866,
+ "step": 9805
+ },
+ {
+ "epoch": 26.719346049046322,
+ "grad_norm": 8.8655366897583,
+ "learning_rate": 1.7191545027764686e-05,
+ "loss": 0.5208,
+ "step": 9806
+ },
+ {
+ "epoch": 26.722070844686648,
+ "grad_norm": 8.175238609313965,
+ "learning_rate": 1.7190931798187173e-05,
+ "loss": 0.6731,
+ "step": 9807
+ },
+ {
+ "epoch": 26.724795640326974,
+ "grad_norm": 10.522286415100098,
+ "learning_rate": 1.719031851260691e-05,
+ "loss": 0.5506,
+ "step": 9808
+ },
+ {
+ "epoch": 26.727520435967303,
+ "grad_norm": 9.17513370513916,
+ "learning_rate": 1.7189705171028684e-05,
+ "loss": 0.4948,
+ "step": 9809
+ },
+ {
+ "epoch": 26.73024523160763,
+ "grad_norm": 7.262209415435791,
+ "learning_rate": 1.7189091773457263e-05,
+ "loss": 0.5682,
+ "step": 9810
+ },
+ {
+ "epoch": 26.732970027247955,
+ "grad_norm": 7.6149373054504395,
+ "learning_rate": 1.7188478319897425e-05,
+ "loss": 0.6615,
+ "step": 9811
+ },
+ {
+ "epoch": 26.735694822888284,
+ "grad_norm": 7.136045455932617,
+ "learning_rate": 1.718786481035395e-05,
+ "loss": 0.5837,
+ "step": 9812
+ },
+ {
+ "epoch": 26.73841961852861,
+ "grad_norm": 8.332613945007324,
+ "learning_rate": 1.7187251244831617e-05,
+ "loss": 0.5957,
+ "step": 9813
+ },
+ {
+ "epoch": 26.741144414168936,
+ "grad_norm": 7.949191093444824,
+ "learning_rate": 1.7186637623335202e-05,
+ "loss": 0.5762,
+ "step": 9814
+ },
+ {
+ "epoch": 26.743869209809265,
+ "grad_norm": 8.355345726013184,
+ "learning_rate": 1.7186023945869482e-05,
+ "loss": 0.6154,
+ "step": 9815
+ },
+ {
+ "epoch": 26.74659400544959,
+ "grad_norm": 7.350244998931885,
+ "learning_rate": 1.718541021243924e-05,
+ "loss": 0.5094,
+ "step": 9816
+ },
+ {
+ "epoch": 26.749318801089917,
+ "grad_norm": 7.143017768859863,
+ "learning_rate": 1.7184796423049258e-05,
+ "loss": 0.5666,
+ "step": 9817
+ },
+ {
+ "epoch": 26.752043596730246,
+ "grad_norm": 7.0420451164245605,
+ "learning_rate": 1.7184182577704308e-05,
+ "loss": 0.7675,
+ "step": 9818
+ },
+ {
+ "epoch": 26.754768392370572,
+ "grad_norm": 7.085203647613525,
+ "learning_rate": 1.7183568676409177e-05,
+ "loss": 0.5901,
+ "step": 9819
+ },
+ {
+ "epoch": 26.757493188010898,
+ "grad_norm": 17.482250213623047,
+ "learning_rate": 1.7182954719168644e-05,
+ "loss": 0.5327,
+ "step": 9820
+ },
+ {
+ "epoch": 26.760217983651227,
+ "grad_norm": 8.615785598754883,
+ "learning_rate": 1.7182340705987493e-05,
+ "loss": 0.6075,
+ "step": 9821
+ },
+ {
+ "epoch": 26.762942779291553,
+ "grad_norm": 11.417250633239746,
+ "learning_rate": 1.7181726636870503e-05,
+ "loss": 0.6096,
+ "step": 9822
+ },
+ {
+ "epoch": 26.76566757493188,
+ "grad_norm": 7.919449806213379,
+ "learning_rate": 1.7181112511822454e-05,
+ "loss": 0.5388,
+ "step": 9823
+ },
+ {
+ "epoch": 26.768392370572208,
+ "grad_norm": 7.389474868774414,
+ "learning_rate": 1.7180498330848136e-05,
+ "loss": 0.7375,
+ "step": 9824
+ },
+ {
+ "epoch": 26.771117166212534,
+ "grad_norm": 8.586124420166016,
+ "learning_rate": 1.7179884093952323e-05,
+ "loss": 0.5284,
+ "step": 9825
+ },
+ {
+ "epoch": 26.77384196185286,
+ "grad_norm": 8.27129077911377,
+ "learning_rate": 1.717926980113981e-05,
+ "loss": 0.5146,
+ "step": 9826
+ },
+ {
+ "epoch": 26.77656675749319,
+ "grad_norm": 6.685294151306152,
+ "learning_rate": 1.717865545241537e-05,
+ "loss": 0.5565,
+ "step": 9827
+ },
+ {
+ "epoch": 26.779291553133515,
+ "grad_norm": 9.088601112365723,
+ "learning_rate": 1.7178041047783794e-05,
+ "loss": 0.5798,
+ "step": 9828
+ },
+ {
+ "epoch": 26.78201634877384,
+ "grad_norm": 8.028997421264648,
+ "learning_rate": 1.7177426587249867e-05,
+ "loss": 0.4793,
+ "step": 9829
+ },
+ {
+ "epoch": 26.78474114441417,
+ "grad_norm": 8.733445167541504,
+ "learning_rate": 1.717681207081837e-05,
+ "loss": 0.4783,
+ "step": 9830
+ },
+ {
+ "epoch": 26.787465940054496,
+ "grad_norm": 6.7583088874816895,
+ "learning_rate": 1.717619749849409e-05,
+ "loss": 0.5808,
+ "step": 9831
+ },
+ {
+ "epoch": 26.79019073569482,
+ "grad_norm": 7.639645576477051,
+ "learning_rate": 1.717558287028182e-05,
+ "loss": 0.6336,
+ "step": 9832
+ },
+ {
+ "epoch": 26.79291553133515,
+ "grad_norm": 6.987443447113037,
+ "learning_rate": 1.717496818618634e-05,
+ "loss": 0.5704,
+ "step": 9833
+ },
+ {
+ "epoch": 26.795640326975477,
+ "grad_norm": 7.344447135925293,
+ "learning_rate": 1.7174353446212438e-05,
+ "loss": 0.4557,
+ "step": 9834
+ },
+ {
+ "epoch": 26.798365122615802,
+ "grad_norm": 7.086408615112305,
+ "learning_rate": 1.71737386503649e-05,
+ "loss": 0.5657,
+ "step": 9835
+ },
+ {
+ "epoch": 26.80108991825613,
+ "grad_norm": 7.556144714355469,
+ "learning_rate": 1.7173123798648517e-05,
+ "loss": 0.6652,
+ "step": 9836
+ },
+ {
+ "epoch": 26.803814713896458,
+ "grad_norm": 15.217717170715332,
+ "learning_rate": 1.717250889106808e-05,
+ "loss": 0.5214,
+ "step": 9837
+ },
+ {
+ "epoch": 26.806539509536783,
+ "grad_norm": 9.909323692321777,
+ "learning_rate": 1.7171893927628374e-05,
+ "loss": 0.6533,
+ "step": 9838
+ },
+ {
+ "epoch": 26.809264305177113,
+ "grad_norm": 9.069902420043945,
+ "learning_rate": 1.7171278908334188e-05,
+ "loss": 0.6884,
+ "step": 9839
+ },
+ {
+ "epoch": 26.81198910081744,
+ "grad_norm": 8.221458435058594,
+ "learning_rate": 1.717066383319031e-05,
+ "loss": 0.6047,
+ "step": 9840
+ },
+ {
+ "epoch": 26.814713896457764,
+ "grad_norm": 7.048707962036133,
+ "learning_rate": 1.7170048702201536e-05,
+ "loss": 0.6982,
+ "step": 9841
+ },
+ {
+ "epoch": 26.817438692098094,
+ "grad_norm": 8.236212730407715,
+ "learning_rate": 1.7169433515372652e-05,
+ "loss": 0.6212,
+ "step": 9842
+ },
+ {
+ "epoch": 26.82016348773842,
+ "grad_norm": 13.191624641418457,
+ "learning_rate": 1.716881827270845e-05,
+ "loss": 0.5137,
+ "step": 9843
+ },
+ {
+ "epoch": 26.822888283378745,
+ "grad_norm": 6.405436038970947,
+ "learning_rate": 1.7168202974213723e-05,
+ "loss": 0.5905,
+ "step": 9844
+ },
+ {
+ "epoch": 26.825613079019075,
+ "grad_norm": 8.298712730407715,
+ "learning_rate": 1.7167587619893266e-05,
+ "loss": 0.5558,
+ "step": 9845
+ },
+ {
+ "epoch": 26.8283378746594,
+ "grad_norm": 8.389778137207031,
+ "learning_rate": 1.7166972209751863e-05,
+ "loss": 0.6276,
+ "step": 9846
+ },
+ {
+ "epoch": 26.831062670299726,
+ "grad_norm": 8.159259796142578,
+ "learning_rate": 1.716635674379431e-05,
+ "loss": 0.6414,
+ "step": 9847
+ },
+ {
+ "epoch": 26.833787465940055,
+ "grad_norm": 9.523921012878418,
+ "learning_rate": 1.7165741222025404e-05,
+ "loss": 0.5206,
+ "step": 9848
+ },
+ {
+ "epoch": 26.83651226158038,
+ "grad_norm": 8.652966499328613,
+ "learning_rate": 1.7165125644449935e-05,
+ "loss": 0.5121,
+ "step": 9849
+ },
+ {
+ "epoch": 26.839237057220707,
+ "grad_norm": 8.350944519042969,
+ "learning_rate": 1.7164510011072698e-05,
+ "loss": 0.4707,
+ "step": 9850
+ },
+ {
+ "epoch": 26.841961852861036,
+ "grad_norm": 7.804934024810791,
+ "learning_rate": 1.7163894321898484e-05,
+ "loss": 0.501,
+ "step": 9851
+ },
+ {
+ "epoch": 26.844686648501362,
+ "grad_norm": 7.301161766052246,
+ "learning_rate": 1.7163278576932096e-05,
+ "loss": 0.5817,
+ "step": 9852
+ },
+ {
+ "epoch": 26.847411444141688,
+ "grad_norm": 9.36557674407959,
+ "learning_rate": 1.7162662776178326e-05,
+ "loss": 0.4836,
+ "step": 9853
+ },
+ {
+ "epoch": 26.850136239782017,
+ "grad_norm": 7.538303375244141,
+ "learning_rate": 1.7162046919641965e-05,
+ "loss": 0.5938,
+ "step": 9854
+ },
+ {
+ "epoch": 26.852861035422343,
+ "grad_norm": 7.781804084777832,
+ "learning_rate": 1.7161431007327817e-05,
+ "loss": 0.4291,
+ "step": 9855
+ },
+ {
+ "epoch": 26.85558583106267,
+ "grad_norm": 9.716976165771484,
+ "learning_rate": 1.7160815039240673e-05,
+ "loss": 0.5191,
+ "step": 9856
+ },
+ {
+ "epoch": 26.858310626703,
+ "grad_norm": 8.597269058227539,
+ "learning_rate": 1.716019901538533e-05,
+ "loss": 0.6948,
+ "step": 9857
+ },
+ {
+ "epoch": 26.861035422343324,
+ "grad_norm": 36.90464782714844,
+ "learning_rate": 1.715958293576659e-05,
+ "loss": 0.6644,
+ "step": 9858
+ },
+ {
+ "epoch": 26.86376021798365,
+ "grad_norm": 8.590659141540527,
+ "learning_rate": 1.7158966800389248e-05,
+ "loss": 0.6661,
+ "step": 9859
+ },
+ {
+ "epoch": 26.86648501362398,
+ "grad_norm": 7.516275405883789,
+ "learning_rate": 1.7158350609258102e-05,
+ "loss": 0.5664,
+ "step": 9860
+ },
+ {
+ "epoch": 26.869209809264305,
+ "grad_norm": 8.420100212097168,
+ "learning_rate": 1.7157734362377954e-05,
+ "loss": 0.6704,
+ "step": 9861
+ },
+ {
+ "epoch": 26.87193460490463,
+ "grad_norm": 10.217272758483887,
+ "learning_rate": 1.71571180597536e-05,
+ "loss": 0.6155,
+ "step": 9862
+ },
+ {
+ "epoch": 26.87465940054496,
+ "grad_norm": 8.462159156799316,
+ "learning_rate": 1.715650170138984e-05,
+ "loss": 0.574,
+ "step": 9863
+ },
+ {
+ "epoch": 26.877384196185286,
+ "grad_norm": 8.050196647644043,
+ "learning_rate": 1.7155885287291477e-05,
+ "loss": 0.5557,
+ "step": 9864
+ },
+ {
+ "epoch": 26.88010899182561,
+ "grad_norm": 8.381481170654297,
+ "learning_rate": 1.715526881746331e-05,
+ "loss": 0.5322,
+ "step": 9865
+ },
+ {
+ "epoch": 26.88283378746594,
+ "grad_norm": 7.986210823059082,
+ "learning_rate": 1.7154652291910134e-05,
+ "loss": 0.5847,
+ "step": 9866
+ },
+ {
+ "epoch": 26.885558583106267,
+ "grad_norm": 8.827322006225586,
+ "learning_rate": 1.7154035710636764e-05,
+ "loss": 0.4438,
+ "step": 9867
+ },
+ {
+ "epoch": 26.888283378746593,
+ "grad_norm": 7.283189296722412,
+ "learning_rate": 1.715341907364799e-05,
+ "loss": 0.5301,
+ "step": 9868
+ },
+ {
+ "epoch": 26.891008174386922,
+ "grad_norm": 8.739351272583008,
+ "learning_rate": 1.7152802380948618e-05,
+ "loss": 0.5347,
+ "step": 9869
+ },
+ {
+ "epoch": 26.893732970027248,
+ "grad_norm": 8.528818130493164,
+ "learning_rate": 1.7152185632543453e-05,
+ "loss": 0.5613,
+ "step": 9870
+ },
+ {
+ "epoch": 26.896457765667574,
+ "grad_norm": 8.095894813537598,
+ "learning_rate": 1.7151568828437294e-05,
+ "loss": 0.5068,
+ "step": 9871
+ },
+ {
+ "epoch": 26.899182561307903,
+ "grad_norm": 6.297325611114502,
+ "learning_rate": 1.7150951968634947e-05,
+ "loss": 0.5719,
+ "step": 9872
+ },
+ {
+ "epoch": 26.90190735694823,
+ "grad_norm": 15.39514446258545,
+ "learning_rate": 1.715033505314122e-05,
+ "loss": 0.5058,
+ "step": 9873
+ },
+ {
+ "epoch": 26.904632152588555,
+ "grad_norm": 9.491486549377441,
+ "learning_rate": 1.7149718081960912e-05,
+ "loss": 0.6662,
+ "step": 9874
+ },
+ {
+ "epoch": 26.907356948228884,
+ "grad_norm": 9.023232460021973,
+ "learning_rate": 1.714910105509883e-05,
+ "loss": 0.566,
+ "step": 9875
+ },
+ {
+ "epoch": 26.91008174386921,
+ "grad_norm": 10.471985816955566,
+ "learning_rate": 1.7148483972559778e-05,
+ "loss": 0.5975,
+ "step": 9876
+ },
+ {
+ "epoch": 26.912806539509535,
+ "grad_norm": 7.666295528411865,
+ "learning_rate": 1.7147866834348567e-05,
+ "loss": 0.7562,
+ "step": 9877
+ },
+ {
+ "epoch": 26.915531335149865,
+ "grad_norm": 6.589531898498535,
+ "learning_rate": 1.7147249640469995e-05,
+ "loss": 0.6293,
+ "step": 9878
+ },
+ {
+ "epoch": 26.91825613079019,
+ "grad_norm": 15.742155075073242,
+ "learning_rate": 1.7146632390928874e-05,
+ "loss": 0.5092,
+ "step": 9879
+ },
+ {
+ "epoch": 26.920980926430516,
+ "grad_norm": 7.420589447021484,
+ "learning_rate": 1.7146015085730006e-05,
+ "loss": 0.5157,
+ "step": 9880
+ },
+ {
+ "epoch": 26.923705722070846,
+ "grad_norm": 7.282872676849365,
+ "learning_rate": 1.7145397724878208e-05,
+ "loss": 0.584,
+ "step": 9881
+ },
+ {
+ "epoch": 26.92643051771117,
+ "grad_norm": 6.97989559173584,
+ "learning_rate": 1.7144780308378283e-05,
+ "loss": 0.452,
+ "step": 9882
+ },
+ {
+ "epoch": 26.929155313351497,
+ "grad_norm": 7.551604747772217,
+ "learning_rate": 1.7144162836235036e-05,
+ "loss": 0.5566,
+ "step": 9883
+ },
+ {
+ "epoch": 26.931880108991827,
+ "grad_norm": 8.512497901916504,
+ "learning_rate": 1.7143545308453274e-05,
+ "loss": 0.6614,
+ "step": 9884
+ },
+ {
+ "epoch": 26.934604904632153,
+ "grad_norm": 8.548844337463379,
+ "learning_rate": 1.714292772503782e-05,
+ "loss": 0.6156,
+ "step": 9885
+ },
+ {
+ "epoch": 26.93732970027248,
+ "grad_norm": 8.930683135986328,
+ "learning_rate": 1.714231008599347e-05,
+ "loss": 0.6012,
+ "step": 9886
+ },
+ {
+ "epoch": 26.940054495912808,
+ "grad_norm": 8.837637901306152,
+ "learning_rate": 1.7141692391325038e-05,
+ "loss": 0.6991,
+ "step": 9887
+ },
+ {
+ "epoch": 26.942779291553133,
+ "grad_norm": 7.4434332847595215,
+ "learning_rate": 1.714107464103734e-05,
+ "loss": 0.6538,
+ "step": 9888
+ },
+ {
+ "epoch": 26.94550408719346,
+ "grad_norm": 6.97316837310791,
+ "learning_rate": 1.714045683513518e-05,
+ "loss": 0.5726,
+ "step": 9889
+ },
+ {
+ "epoch": 26.94822888283379,
+ "grad_norm": 7.7166008949279785,
+ "learning_rate": 1.7139838973623372e-05,
+ "loss": 0.5148,
+ "step": 9890
+ },
+ {
+ "epoch": 26.950953678474114,
+ "grad_norm": 10.185364723205566,
+ "learning_rate": 1.7139221056506728e-05,
+ "loss": 0.6141,
+ "step": 9891
+ },
+ {
+ "epoch": 26.95367847411444,
+ "grad_norm": 7.110172271728516,
+ "learning_rate": 1.7138603083790058e-05,
+ "loss": 0.4905,
+ "step": 9892
+ },
+ {
+ "epoch": 26.95640326975477,
+ "grad_norm": 21.275188446044922,
+ "learning_rate": 1.713798505547818e-05,
+ "loss": 0.5323,
+ "step": 9893
+ },
+ {
+ "epoch": 26.959128065395095,
+ "grad_norm": 14.872252464294434,
+ "learning_rate": 1.7137366971575905e-05,
+ "loss": 0.5959,
+ "step": 9894
+ },
+ {
+ "epoch": 26.96185286103542,
+ "grad_norm": 6.733795166015625,
+ "learning_rate": 1.7136748832088043e-05,
+ "loss": 0.4517,
+ "step": 9895
+ },
+ {
+ "epoch": 26.96457765667575,
+ "grad_norm": 8.441132545471191,
+ "learning_rate": 1.713613063701941e-05,
+ "loss": 0.6322,
+ "step": 9896
+ },
+ {
+ "epoch": 26.967302452316076,
+ "grad_norm": 10.844657897949219,
+ "learning_rate": 1.7135512386374823e-05,
+ "loss": 0.7972,
+ "step": 9897
+ },
+ {
+ "epoch": 26.970027247956402,
+ "grad_norm": 8.176034927368164,
+ "learning_rate": 1.7134894080159096e-05,
+ "loss": 0.7691,
+ "step": 9898
+ },
+ {
+ "epoch": 26.97275204359673,
+ "grad_norm": 9.46308708190918,
+ "learning_rate": 1.7134275718377043e-05,
+ "loss": 0.575,
+ "step": 9899
+ },
+ {
+ "epoch": 26.975476839237057,
+ "grad_norm": 8.104681015014648,
+ "learning_rate": 1.713365730103348e-05,
+ "loss": 0.6555,
+ "step": 9900
+ },
+ {
+ "epoch": 26.978201634877383,
+ "grad_norm": 8.981183052062988,
+ "learning_rate": 1.7133038828133224e-05,
+ "loss": 0.5291,
+ "step": 9901
+ },
+ {
+ "epoch": 26.980926430517712,
+ "grad_norm": 10.914739608764648,
+ "learning_rate": 1.713242029968109e-05,
+ "loss": 0.7823,
+ "step": 9902
+ },
+ {
+ "epoch": 26.983651226158038,
+ "grad_norm": 9.093073844909668,
+ "learning_rate": 1.71318017156819e-05,
+ "loss": 0.4865,
+ "step": 9903
+ },
+ {
+ "epoch": 26.986376021798364,
+ "grad_norm": 7.77921724319458,
+ "learning_rate": 1.7131183076140462e-05,
+ "loss": 0.6554,
+ "step": 9904
+ },
+ {
+ "epoch": 26.989100817438693,
+ "grad_norm": 8.578624725341797,
+ "learning_rate": 1.7130564381061603e-05,
+ "loss": 0.511,
+ "step": 9905
+ },
+ {
+ "epoch": 26.99182561307902,
+ "grad_norm": 9.18174934387207,
+ "learning_rate": 1.7129945630450136e-05,
+ "loss": 0.5055,
+ "step": 9906
+ },
+ {
+ "epoch": 26.994550408719345,
+ "grad_norm": 6.425988674163818,
+ "learning_rate": 1.7129326824310882e-05,
+ "loss": 0.7188,
+ "step": 9907
+ },
+ {
+ "epoch": 26.997275204359674,
+ "grad_norm": 8.770267486572266,
+ "learning_rate": 1.7128707962648662e-05,
+ "loss": 0.4218,
+ "step": 9908
+ },
+ {
+ "epoch": 27.0,
+ "grad_norm": 10.719183921813965,
+ "learning_rate": 1.7128089045468294e-05,
+ "loss": 0.53,
+ "step": 9909
+ },
+ {
+ "epoch": 27.002724795640326,
+ "grad_norm": 7.504054069519043,
+ "learning_rate": 1.71274700727746e-05,
+ "loss": 0.6198,
+ "step": 9910
+ },
+ {
+ "epoch": 27.005449591280655,
+ "grad_norm": 10.078618049621582,
+ "learning_rate": 1.7126851044572395e-05,
+ "loss": 0.655,
+ "step": 9911
+ },
+ {
+ "epoch": 27.00817438692098,
+ "grad_norm": 9.173070907592773,
+ "learning_rate": 1.7126231960866505e-05,
+ "loss": 0.5139,
+ "step": 9912
+ },
+ {
+ "epoch": 27.010899182561307,
+ "grad_norm": 7.0432820320129395,
+ "learning_rate": 1.7125612821661746e-05,
+ "loss": 0.4684,
+ "step": 9913
+ },
+ {
+ "epoch": 27.013623978201636,
+ "grad_norm": 7.106161117553711,
+ "learning_rate": 1.7124993626962946e-05,
+ "loss": 0.5553,
+ "step": 9914
+ },
+ {
+ "epoch": 27.016348773841962,
+ "grad_norm": 5.988898277282715,
+ "learning_rate": 1.7124374376774926e-05,
+ "loss": 0.6425,
+ "step": 9915
+ },
+ {
+ "epoch": 27.019073569482288,
+ "grad_norm": 16.35003089904785,
+ "learning_rate": 1.712375507110251e-05,
+ "loss": 0.6501,
+ "step": 9916
+ },
+ {
+ "epoch": 27.021798365122617,
+ "grad_norm": 9.020776748657227,
+ "learning_rate": 1.7123135709950515e-05,
+ "loss": 0.566,
+ "step": 9917
+ },
+ {
+ "epoch": 27.024523160762943,
+ "grad_norm": 6.925570964813232,
+ "learning_rate": 1.7122516293323767e-05,
+ "loss": 0.4954,
+ "step": 9918
+ },
+ {
+ "epoch": 27.02724795640327,
+ "grad_norm": 7.659992694854736,
+ "learning_rate": 1.7121896821227094e-05,
+ "loss": 0.4759,
+ "step": 9919
+ },
+ {
+ "epoch": 27.029972752043598,
+ "grad_norm": 12.315473556518555,
+ "learning_rate": 1.712127729366532e-05,
+ "loss": 0.5403,
+ "step": 9920
+ },
+ {
+ "epoch": 27.032697547683924,
+ "grad_norm": 7.5261383056640625,
+ "learning_rate": 1.7120657710643264e-05,
+ "loss": 0.6048,
+ "step": 9921
+ },
+ {
+ "epoch": 27.03542234332425,
+ "grad_norm": 7.493836402893066,
+ "learning_rate": 1.7120038072165756e-05,
+ "loss": 0.5029,
+ "step": 9922
+ },
+ {
+ "epoch": 27.03814713896458,
+ "grad_norm": 7.221220970153809,
+ "learning_rate": 1.7119418378237623e-05,
+ "loss": 0.6017,
+ "step": 9923
+ },
+ {
+ "epoch": 27.040871934604905,
+ "grad_norm": 7.582027435302734,
+ "learning_rate": 1.7118798628863685e-05,
+ "loss": 0.6014,
+ "step": 9924
+ },
+ {
+ "epoch": 27.04359673024523,
+ "grad_norm": 10.846917152404785,
+ "learning_rate": 1.7118178824048774e-05,
+ "loss": 0.5579,
+ "step": 9925
+ },
+ {
+ "epoch": 27.04632152588556,
+ "grad_norm": 7.30008602142334,
+ "learning_rate": 1.7117558963797715e-05,
+ "loss": 0.5022,
+ "step": 9926
+ },
+ {
+ "epoch": 27.049046321525886,
+ "grad_norm": 6.973043441772461,
+ "learning_rate": 1.7116939048115336e-05,
+ "loss": 0.4575,
+ "step": 9927
+ },
+ {
+ "epoch": 27.05177111716621,
+ "grad_norm": 7.097996711730957,
+ "learning_rate": 1.711631907700647e-05,
+ "loss": 0.4754,
+ "step": 9928
+ },
+ {
+ "epoch": 27.05449591280654,
+ "grad_norm": 9.277467727661133,
+ "learning_rate": 1.711569905047593e-05,
+ "loss": 0.676,
+ "step": 9929
+ },
+ {
+ "epoch": 27.057220708446867,
+ "grad_norm": 7.5056610107421875,
+ "learning_rate": 1.7115078968528563e-05,
+ "loss": 0.6619,
+ "step": 9930
+ },
+ {
+ "epoch": 27.059945504087192,
+ "grad_norm": 8.805801391601562,
+ "learning_rate": 1.7114458831169184e-05,
+ "loss": 0.5337,
+ "step": 9931
+ },
+ {
+ "epoch": 27.06267029972752,
+ "grad_norm": 7.667728424072266,
+ "learning_rate": 1.7113838638402633e-05,
+ "loss": 0.4593,
+ "step": 9932
+ },
+ {
+ "epoch": 27.065395095367847,
+ "grad_norm": 12.151493072509766,
+ "learning_rate": 1.7113218390233734e-05,
+ "loss": 0.6071,
+ "step": 9933
+ },
+ {
+ "epoch": 27.068119891008173,
+ "grad_norm": 7.711685657501221,
+ "learning_rate": 1.711259808666732e-05,
+ "loss": 0.5402,
+ "step": 9934
+ },
+ {
+ "epoch": 27.070844686648503,
+ "grad_norm": 10.571061134338379,
+ "learning_rate": 1.711197772770822e-05,
+ "loss": 0.3903,
+ "step": 9935
+ },
+ {
+ "epoch": 27.07356948228883,
+ "grad_norm": 7.110350608825684,
+ "learning_rate": 1.7111357313361264e-05,
+ "loss": 0.4113,
+ "step": 9936
+ },
+ {
+ "epoch": 27.076294277929154,
+ "grad_norm": 15.685750007629395,
+ "learning_rate": 1.7110736843631294e-05,
+ "loss": 0.6638,
+ "step": 9937
+ },
+ {
+ "epoch": 27.079019073569484,
+ "grad_norm": 6.967113971710205,
+ "learning_rate": 1.7110116318523126e-05,
+ "loss": 0.5338,
+ "step": 9938
+ },
+ {
+ "epoch": 27.08174386920981,
+ "grad_norm": 9.692916870117188,
+ "learning_rate": 1.7109495738041605e-05,
+ "loss": 0.5378,
+ "step": 9939
+ },
+ {
+ "epoch": 27.084468664850135,
+ "grad_norm": 6.948312282562256,
+ "learning_rate": 1.7108875102191557e-05,
+ "loss": 0.4175,
+ "step": 9940
+ },
+ {
+ "epoch": 27.087193460490465,
+ "grad_norm": 7.597878456115723,
+ "learning_rate": 1.7108254410977822e-05,
+ "loss": 0.4593,
+ "step": 9941
+ },
+ {
+ "epoch": 27.08991825613079,
+ "grad_norm": 7.904601097106934,
+ "learning_rate": 1.710763366440523e-05,
+ "loss": 0.4382,
+ "step": 9942
+ },
+ {
+ "epoch": 27.092643051771116,
+ "grad_norm": 9.962733268737793,
+ "learning_rate": 1.7107012862478614e-05,
+ "loss": 0.4148,
+ "step": 9943
+ },
+ {
+ "epoch": 27.095367847411445,
+ "grad_norm": 9.055351257324219,
+ "learning_rate": 1.710639200520281e-05,
+ "loss": 0.4607,
+ "step": 9944
+ },
+ {
+ "epoch": 27.09809264305177,
+ "grad_norm": 7.320572376251221,
+ "learning_rate": 1.7105771092582655e-05,
+ "loss": 0.5253,
+ "step": 9945
+ },
+ {
+ "epoch": 27.100817438692097,
+ "grad_norm": 7.846962928771973,
+ "learning_rate": 1.7105150124622985e-05,
+ "loss": 0.6495,
+ "step": 9946
+ },
+ {
+ "epoch": 27.103542234332426,
+ "grad_norm": 7.681886672973633,
+ "learning_rate": 1.7104529101328632e-05,
+ "loss": 0.573,
+ "step": 9947
+ },
+ {
+ "epoch": 27.106267029972752,
+ "grad_norm": 11.92682933807373,
+ "learning_rate": 1.7103908022704436e-05,
+ "loss": 0.4685,
+ "step": 9948
+ },
+ {
+ "epoch": 27.108991825613078,
+ "grad_norm": 8.032818794250488,
+ "learning_rate": 1.7103286888755237e-05,
+ "loss": 0.5396,
+ "step": 9949
+ },
+ {
+ "epoch": 27.111716621253407,
+ "grad_norm": 6.875002384185791,
+ "learning_rate": 1.710266569948586e-05,
+ "loss": 0.591,
+ "step": 9950
+ },
+ {
+ "epoch": 27.114441416893733,
+ "grad_norm": 10.565400123596191,
+ "learning_rate": 1.7102044454901155e-05,
+ "loss": 0.5151,
+ "step": 9951
+ },
+ {
+ "epoch": 27.11716621253406,
+ "grad_norm": 7.093526363372803,
+ "learning_rate": 1.7101423155005957e-05,
+ "loss": 0.5104,
+ "step": 9952
+ },
+ {
+ "epoch": 27.11989100817439,
+ "grad_norm": 7.847536563873291,
+ "learning_rate": 1.7100801799805104e-05,
+ "loss": 0.5755,
+ "step": 9953
+ },
+ {
+ "epoch": 27.122615803814714,
+ "grad_norm": 9.526288986206055,
+ "learning_rate": 1.7100180389303435e-05,
+ "loss": 0.4774,
+ "step": 9954
+ },
+ {
+ "epoch": 27.12534059945504,
+ "grad_norm": 7.164559364318848,
+ "learning_rate": 1.7099558923505792e-05,
+ "loss": 0.5342,
+ "step": 9955
+ },
+ {
+ "epoch": 27.12806539509537,
+ "grad_norm": 6.162780284881592,
+ "learning_rate": 1.709893740241701e-05,
+ "loss": 0.3869,
+ "step": 9956
+ },
+ {
+ "epoch": 27.130790190735695,
+ "grad_norm": 7.655863285064697,
+ "learning_rate": 1.7098315826041932e-05,
+ "loss": 0.4987,
+ "step": 9957
+ },
+ {
+ "epoch": 27.13351498637602,
+ "grad_norm": 7.7024359703063965,
+ "learning_rate": 1.7097694194385395e-05,
+ "loss": 0.6907,
+ "step": 9958
+ },
+ {
+ "epoch": 27.13623978201635,
+ "grad_norm": 6.282317638397217,
+ "learning_rate": 1.709707250745225e-05,
+ "loss": 0.4347,
+ "step": 9959
+ },
+ {
+ "epoch": 27.138964577656676,
+ "grad_norm": 8.424469947814941,
+ "learning_rate": 1.7096450765247333e-05,
+ "loss": 0.5565,
+ "step": 9960
+ },
+ {
+ "epoch": 27.141689373297,
+ "grad_norm": 7.163951873779297,
+ "learning_rate": 1.7095828967775485e-05,
+ "loss": 0.461,
+ "step": 9961
+ },
+ {
+ "epoch": 27.14441416893733,
+ "grad_norm": 19.0053768157959,
+ "learning_rate": 1.7095207115041546e-05,
+ "loss": 0.5612,
+ "step": 9962
+ },
+ {
+ "epoch": 27.147138964577657,
+ "grad_norm": 10.031600952148438,
+ "learning_rate": 1.7094585207050363e-05,
+ "loss": 0.6506,
+ "step": 9963
+ },
+ {
+ "epoch": 27.149863760217983,
+ "grad_norm": 6.632686614990234,
+ "learning_rate": 1.709396324380678e-05,
+ "loss": 0.4497,
+ "step": 9964
+ },
+ {
+ "epoch": 27.152588555858312,
+ "grad_norm": 6.571283340454102,
+ "learning_rate": 1.709334122531564e-05,
+ "loss": 0.6563,
+ "step": 9965
+ },
+ {
+ "epoch": 27.155313351498638,
+ "grad_norm": 10.044163703918457,
+ "learning_rate": 1.7092719151581786e-05,
+ "loss": 0.5818,
+ "step": 9966
+ },
+ {
+ "epoch": 27.158038147138964,
+ "grad_norm": 7.754175186157227,
+ "learning_rate": 1.7092097022610064e-05,
+ "loss": 0.4387,
+ "step": 9967
+ },
+ {
+ "epoch": 27.160762942779293,
+ "grad_norm": 8.865942001342773,
+ "learning_rate": 1.709147483840532e-05,
+ "loss": 0.5388,
+ "step": 9968
+ },
+ {
+ "epoch": 27.16348773841962,
+ "grad_norm": 8.810154914855957,
+ "learning_rate": 1.7090852598972398e-05,
+ "loss": 0.4935,
+ "step": 9969
+ },
+ {
+ "epoch": 27.166212534059945,
+ "grad_norm": 7.3079681396484375,
+ "learning_rate": 1.7090230304316142e-05,
+ "loss": 0.5281,
+ "step": 9970
+ },
+ {
+ "epoch": 27.168937329700274,
+ "grad_norm": 9.283902168273926,
+ "learning_rate": 1.7089607954441403e-05,
+ "loss": 0.5385,
+ "step": 9971
+ },
+ {
+ "epoch": 27.1716621253406,
+ "grad_norm": 8.04033374786377,
+ "learning_rate": 1.7088985549353024e-05,
+ "loss": 0.3656,
+ "step": 9972
+ },
+ {
+ "epoch": 27.174386920980925,
+ "grad_norm": 12.064838409423828,
+ "learning_rate": 1.7088363089055854e-05,
+ "loss": 0.488,
+ "step": 9973
+ },
+ {
+ "epoch": 27.177111716621255,
+ "grad_norm": 6.4653544425964355,
+ "learning_rate": 1.708774057355474e-05,
+ "loss": 0.6996,
+ "step": 9974
+ },
+ {
+ "epoch": 27.17983651226158,
+ "grad_norm": 7.534409046173096,
+ "learning_rate": 1.708711800285453e-05,
+ "loss": 0.5007,
+ "step": 9975
+ },
+ {
+ "epoch": 27.182561307901906,
+ "grad_norm": 7.947213172912598,
+ "learning_rate": 1.7086495376960073e-05,
+ "loss": 0.543,
+ "step": 9976
+ },
+ {
+ "epoch": 27.185286103542236,
+ "grad_norm": 8.628761291503906,
+ "learning_rate": 1.708587269587622e-05,
+ "loss": 0.4768,
+ "step": 9977
+ },
+ {
+ "epoch": 27.18801089918256,
+ "grad_norm": 8.160655975341797,
+ "learning_rate": 1.7085249959607818e-05,
+ "loss": 0.6144,
+ "step": 9978
+ },
+ {
+ "epoch": 27.190735694822887,
+ "grad_norm": 6.389145851135254,
+ "learning_rate": 1.7084627168159716e-05,
+ "loss": 0.7598,
+ "step": 9979
+ },
+ {
+ "epoch": 27.193460490463217,
+ "grad_norm": 7.102512836456299,
+ "learning_rate": 1.708400432153677e-05,
+ "loss": 0.4783,
+ "step": 9980
+ },
+ {
+ "epoch": 27.196185286103542,
+ "grad_norm": 6.776620864868164,
+ "learning_rate": 1.7083381419743817e-05,
+ "loss": 0.5002,
+ "step": 9981
+ },
+ {
+ "epoch": 27.19891008174387,
+ "grad_norm": 6.986589431762695,
+ "learning_rate": 1.7082758462785728e-05,
+ "loss": 0.5826,
+ "step": 9982
+ },
+ {
+ "epoch": 27.201634877384198,
+ "grad_norm": 6.739128589630127,
+ "learning_rate": 1.7082135450667335e-05,
+ "loss": 0.5797,
+ "step": 9983
+ },
+ {
+ "epoch": 27.204359673024523,
+ "grad_norm": 10.087153434753418,
+ "learning_rate": 1.7081512383393507e-05,
+ "loss": 0.4793,
+ "step": 9984
+ },
+ {
+ "epoch": 27.20708446866485,
+ "grad_norm": 7.079504489898682,
+ "learning_rate": 1.7080889260969083e-05,
+ "loss": 0.644,
+ "step": 9985
+ },
+ {
+ "epoch": 27.20980926430518,
+ "grad_norm": 7.418025493621826,
+ "learning_rate": 1.708026608339892e-05,
+ "loss": 0.4905,
+ "step": 9986
+ },
+ {
+ "epoch": 27.212534059945504,
+ "grad_norm": 7.351944446563721,
+ "learning_rate": 1.7079642850687877e-05,
+ "loss": 0.5712,
+ "step": 9987
+ },
+ {
+ "epoch": 27.21525885558583,
+ "grad_norm": 7.845609664916992,
+ "learning_rate": 1.7079019562840805e-05,
+ "loss": 0.7001,
+ "step": 9988
+ },
+ {
+ "epoch": 27.21798365122616,
+ "grad_norm": 9.999709129333496,
+ "learning_rate": 1.7078396219862555e-05,
+ "loss": 0.6672,
+ "step": 9989
+ },
+ {
+ "epoch": 27.220708446866485,
+ "grad_norm": 8.453604698181152,
+ "learning_rate": 1.707777282175798e-05,
+ "loss": 0.5795,
+ "step": 9990
+ },
+ {
+ "epoch": 27.22343324250681,
+ "grad_norm": 8.12509536743164,
+ "learning_rate": 1.707714936853194e-05,
+ "loss": 0.4963,
+ "step": 9991
+ },
+ {
+ "epoch": 27.22615803814714,
+ "grad_norm": 8.132515907287598,
+ "learning_rate": 1.7076525860189287e-05,
+ "loss": 0.642,
+ "step": 9992
+ },
+ {
+ "epoch": 27.228882833787466,
+ "grad_norm": 7.824767589569092,
+ "learning_rate": 1.707590229673488e-05,
+ "loss": 0.3948,
+ "step": 9993
+ },
+ {
+ "epoch": 27.231607629427792,
+ "grad_norm": 6.789891242980957,
+ "learning_rate": 1.7075278678173574e-05,
+ "loss": 0.4338,
+ "step": 9994
+ },
+ {
+ "epoch": 27.23433242506812,
+ "grad_norm": 7.379485130310059,
+ "learning_rate": 1.7074655004510225e-05,
+ "loss": 0.4098,
+ "step": 9995
+ },
+ {
+ "epoch": 27.237057220708447,
+ "grad_norm": 6.867528915405273,
+ "learning_rate": 1.7074031275749686e-05,
+ "loss": 0.575,
+ "step": 9996
+ },
+ {
+ "epoch": 27.239782016348773,
+ "grad_norm": 6.640412330627441,
+ "learning_rate": 1.7073407491896824e-05,
+ "loss": 0.5046,
+ "step": 9997
+ },
+ {
+ "epoch": 27.242506811989102,
+ "grad_norm": 7.1053786277771,
+ "learning_rate": 1.7072783652956493e-05,
+ "loss": 0.5579,
+ "step": 9998
+ },
+ {
+ "epoch": 27.245231607629428,
+ "grad_norm": 9.06983757019043,
+ "learning_rate": 1.707215975893355e-05,
+ "loss": 0.5596,
+ "step": 9999
+ },
+ {
+ "epoch": 27.247956403269754,
+ "grad_norm": 7.0437912940979,
+ "learning_rate": 1.7071535809832852e-05,
+ "loss": 0.6115,
+ "step": 10000
+ },
+ {
+ "epoch": 27.250681198910083,
+ "grad_norm": 9.336917877197266,
+ "learning_rate": 1.707091180565926e-05,
+ "loss": 0.4551,
+ "step": 10001
+ },
+ {
+ "epoch": 27.25340599455041,
+ "grad_norm": 7.803974151611328,
+ "learning_rate": 1.7070287746417636e-05,
+ "loss": 0.4794,
+ "step": 10002
+ },
+ {
+ "epoch": 27.256130790190735,
+ "grad_norm": 10.840062141418457,
+ "learning_rate": 1.706966363211284e-05,
+ "loss": 0.5307,
+ "step": 10003
+ },
+ {
+ "epoch": 27.258855585831064,
+ "grad_norm": 7.2597336769104,
+ "learning_rate": 1.7069039462749734e-05,
+ "loss": 0.6178,
+ "step": 10004
+ },
+ {
+ "epoch": 27.26158038147139,
+ "grad_norm": 7.98543119430542,
+ "learning_rate": 1.706841523833317e-05,
+ "loss": 0.5807,
+ "step": 10005
+ },
+ {
+ "epoch": 27.264305177111716,
+ "grad_norm": 9.968547821044922,
+ "learning_rate": 1.7067790958868017e-05,
+ "loss": 0.6636,
+ "step": 10006
+ },
+ {
+ "epoch": 27.267029972752045,
+ "grad_norm": 9.231914520263672,
+ "learning_rate": 1.7067166624359138e-05,
+ "loss": 0.47,
+ "step": 10007
+ },
+ {
+ "epoch": 27.26975476839237,
+ "grad_norm": 8.400660514831543,
+ "learning_rate": 1.706654223481139e-05,
+ "loss": 0.5679,
+ "step": 10008
+ },
+ {
+ "epoch": 27.272479564032697,
+ "grad_norm": 8.488985061645508,
+ "learning_rate": 1.706591779022964e-05,
+ "loss": 0.5359,
+ "step": 10009
+ },
+ {
+ "epoch": 27.275204359673026,
+ "grad_norm": 6.763240337371826,
+ "learning_rate": 1.706529329061875e-05,
+ "loss": 0.5494,
+ "step": 10010
+ },
+ {
+ "epoch": 27.277929155313352,
+ "grad_norm": 7.996668815612793,
+ "learning_rate": 1.706466873598358e-05,
+ "loss": 0.4254,
+ "step": 10011
+ },
+ {
+ "epoch": 27.280653950953678,
+ "grad_norm": 8.270384788513184,
+ "learning_rate": 1.7064044126329e-05,
+ "loss": 0.4733,
+ "step": 10012
+ },
+ {
+ "epoch": 27.283378746594007,
+ "grad_norm": 7.509069442749023,
+ "learning_rate": 1.706341946165987e-05,
+ "loss": 0.5413,
+ "step": 10013
+ },
+ {
+ "epoch": 27.286103542234333,
+ "grad_norm": 9.132331848144531,
+ "learning_rate": 1.706279474198106e-05,
+ "loss": 0.4437,
+ "step": 10014
+ },
+ {
+ "epoch": 27.28882833787466,
+ "grad_norm": 6.917953014373779,
+ "learning_rate": 1.7062169967297432e-05,
+ "loss": 0.4746,
+ "step": 10015
+ },
+ {
+ "epoch": 27.291553133514988,
+ "grad_norm": 7.6658477783203125,
+ "learning_rate": 1.7061545137613847e-05,
+ "loss": 0.7435,
+ "step": 10016
+ },
+ {
+ "epoch": 27.294277929155314,
+ "grad_norm": 7.395020961761475,
+ "learning_rate": 1.706092025293518e-05,
+ "loss": 0.4034,
+ "step": 10017
+ },
+ {
+ "epoch": 27.29700272479564,
+ "grad_norm": 6.857711315155029,
+ "learning_rate": 1.7060295313266292e-05,
+ "loss": 0.4524,
+ "step": 10018
+ },
+ {
+ "epoch": 27.29972752043597,
+ "grad_norm": 8.136479377746582,
+ "learning_rate": 1.7059670318612053e-05,
+ "loss": 0.3506,
+ "step": 10019
+ },
+ {
+ "epoch": 27.302452316076295,
+ "grad_norm": 8.787403106689453,
+ "learning_rate": 1.7059045268977325e-05,
+ "loss": 0.4917,
+ "step": 10020
+ },
+ {
+ "epoch": 27.30517711171662,
+ "grad_norm": 6.448479175567627,
+ "learning_rate": 1.705842016436698e-05,
+ "loss": 0.5216,
+ "step": 10021
+ },
+ {
+ "epoch": 27.30790190735695,
+ "grad_norm": 6.3374481201171875,
+ "learning_rate": 1.705779500478589e-05,
+ "loss": 0.5302,
+ "step": 10022
+ },
+ {
+ "epoch": 27.310626702997276,
+ "grad_norm": 7.888910293579102,
+ "learning_rate": 1.7057169790238916e-05,
+ "loss": 0.5046,
+ "step": 10023
+ },
+ {
+ "epoch": 27.3133514986376,
+ "grad_norm": 8.027619361877441,
+ "learning_rate": 1.705654452073093e-05,
+ "loss": 0.6215,
+ "step": 10024
+ },
+ {
+ "epoch": 27.31607629427793,
+ "grad_norm": 8.172956466674805,
+ "learning_rate": 1.7055919196266806e-05,
+ "loss": 0.5985,
+ "step": 10025
+ },
+ {
+ "epoch": 27.318801089918257,
+ "grad_norm": 7.377542972564697,
+ "learning_rate": 1.705529381685141e-05,
+ "loss": 0.5151,
+ "step": 10026
+ },
+ {
+ "epoch": 27.321525885558582,
+ "grad_norm": 7.448740005493164,
+ "learning_rate": 1.705466838248961e-05,
+ "loss": 0.5624,
+ "step": 10027
+ },
+ {
+ "epoch": 27.32425068119891,
+ "grad_norm": 7.380115032196045,
+ "learning_rate": 1.705404289318628e-05,
+ "loss": 0.5007,
+ "step": 10028
+ },
+ {
+ "epoch": 27.326975476839237,
+ "grad_norm": 7.7183518409729,
+ "learning_rate": 1.7053417348946293e-05,
+ "loss": 0.5818,
+ "step": 10029
+ },
+ {
+ "epoch": 27.329700272479563,
+ "grad_norm": 7.5660719871521,
+ "learning_rate": 1.705279174977452e-05,
+ "loss": 0.5103,
+ "step": 10030
+ },
+ {
+ "epoch": 27.332425068119893,
+ "grad_norm": 12.974373817443848,
+ "learning_rate": 1.7052166095675827e-05,
+ "loss": 0.645,
+ "step": 10031
+ },
+ {
+ "epoch": 27.33514986376022,
+ "grad_norm": 7.177042484283447,
+ "learning_rate": 1.7051540386655094e-05,
+ "loss": 0.4811,
+ "step": 10032
+ },
+ {
+ "epoch": 27.337874659400544,
+ "grad_norm": 9.889019012451172,
+ "learning_rate": 1.705091462271719e-05,
+ "loss": 0.7004,
+ "step": 10033
+ },
+ {
+ "epoch": 27.340599455040874,
+ "grad_norm": 7.093506813049316,
+ "learning_rate": 1.7050288803866992e-05,
+ "loss": 0.6276,
+ "step": 10034
+ },
+ {
+ "epoch": 27.3433242506812,
+ "grad_norm": 9.160090446472168,
+ "learning_rate": 1.7049662930109373e-05,
+ "loss": 0.6492,
+ "step": 10035
+ },
+ {
+ "epoch": 27.346049046321525,
+ "grad_norm": 8.586556434631348,
+ "learning_rate": 1.7049037001449202e-05,
+ "loss": 0.5503,
+ "step": 10036
+ },
+ {
+ "epoch": 27.348773841961854,
+ "grad_norm": 7.525806903839111,
+ "learning_rate": 1.704841101789136e-05,
+ "loss": 0.4617,
+ "step": 10037
+ },
+ {
+ "epoch": 27.35149863760218,
+ "grad_norm": 6.517123699188232,
+ "learning_rate": 1.704778497944072e-05,
+ "loss": 0.4512,
+ "step": 10038
+ },
+ {
+ "epoch": 27.354223433242506,
+ "grad_norm": 8.63493824005127,
+ "learning_rate": 1.704715888610216e-05,
+ "loss": 0.5289,
+ "step": 10039
+ },
+ {
+ "epoch": 27.356948228882835,
+ "grad_norm": 7.07725191116333,
+ "learning_rate": 1.704653273788055e-05,
+ "loss": 0.7155,
+ "step": 10040
+ },
+ {
+ "epoch": 27.35967302452316,
+ "grad_norm": 7.394663333892822,
+ "learning_rate": 1.704590653478077e-05,
+ "loss": 0.5936,
+ "step": 10041
+ },
+ {
+ "epoch": 27.362397820163487,
+ "grad_norm": 7.452281951904297,
+ "learning_rate": 1.7045280276807697e-05,
+ "loss": 0.6404,
+ "step": 10042
+ },
+ {
+ "epoch": 27.365122615803816,
+ "grad_norm": 8.40842056274414,
+ "learning_rate": 1.7044653963966206e-05,
+ "loss": 0.7006,
+ "step": 10043
+ },
+ {
+ "epoch": 27.367847411444142,
+ "grad_norm": 7.894318580627441,
+ "learning_rate": 1.7044027596261178e-05,
+ "loss": 0.5676,
+ "step": 10044
+ },
+ {
+ "epoch": 27.370572207084468,
+ "grad_norm": 8.687544822692871,
+ "learning_rate": 1.704340117369749e-05,
+ "loss": 0.4442,
+ "step": 10045
+ },
+ {
+ "epoch": 27.373297002724797,
+ "grad_norm": 6.665185928344727,
+ "learning_rate": 1.7042774696280023e-05,
+ "loss": 0.7184,
+ "step": 10046
+ },
+ {
+ "epoch": 27.376021798365123,
+ "grad_norm": 6.788980960845947,
+ "learning_rate": 1.704214816401365e-05,
+ "loss": 0.6483,
+ "step": 10047
+ },
+ {
+ "epoch": 27.37874659400545,
+ "grad_norm": 8.649880409240723,
+ "learning_rate": 1.7041521576903254e-05,
+ "loss": 0.4934,
+ "step": 10048
+ },
+ {
+ "epoch": 27.381471389645778,
+ "grad_norm": 6.84049654006958,
+ "learning_rate": 1.7040894934953715e-05,
+ "loss": 0.5432,
+ "step": 10049
+ },
+ {
+ "epoch": 27.384196185286104,
+ "grad_norm": 7.426638126373291,
+ "learning_rate": 1.7040268238169916e-05,
+ "loss": 0.4585,
+ "step": 10050
+ },
+ {
+ "epoch": 27.38692098092643,
+ "grad_norm": 7.961089611053467,
+ "learning_rate": 1.7039641486556732e-05,
+ "loss": 0.5002,
+ "step": 10051
+ },
+ {
+ "epoch": 27.38964577656676,
+ "grad_norm": 8.751544952392578,
+ "learning_rate": 1.7039014680119046e-05,
+ "loss": 0.6028,
+ "step": 10052
+ },
+ {
+ "epoch": 27.392370572207085,
+ "grad_norm": 7.071634292602539,
+ "learning_rate": 1.703838781886174e-05,
+ "loss": 0.485,
+ "step": 10053
+ },
+ {
+ "epoch": 27.39509536784741,
+ "grad_norm": 7.8563456535339355,
+ "learning_rate": 1.7037760902789696e-05,
+ "loss": 0.6389,
+ "step": 10054
+ },
+ {
+ "epoch": 27.39782016348774,
+ "grad_norm": 7.355616569519043,
+ "learning_rate": 1.7037133931907797e-05,
+ "loss": 0.4425,
+ "step": 10055
+ },
+ {
+ "epoch": 27.400544959128066,
+ "grad_norm": 8.382254600524902,
+ "learning_rate": 1.7036506906220928e-05,
+ "loss": 0.4914,
+ "step": 10056
+ },
+ {
+ "epoch": 27.40326975476839,
+ "grad_norm": 7.880213260650635,
+ "learning_rate": 1.7035879825733965e-05,
+ "loss": 0.5283,
+ "step": 10057
+ },
+ {
+ "epoch": 27.40599455040872,
+ "grad_norm": 7.893124103546143,
+ "learning_rate": 1.70352526904518e-05,
+ "loss": 0.5607,
+ "step": 10058
+ },
+ {
+ "epoch": 27.408719346049047,
+ "grad_norm": 8.816205024719238,
+ "learning_rate": 1.7034625500379312e-05,
+ "loss": 0.4796,
+ "step": 10059
+ },
+ {
+ "epoch": 27.411444141689373,
+ "grad_norm": 6.785427093505859,
+ "learning_rate": 1.7033998255521388e-05,
+ "loss": 0.7288,
+ "step": 10060
+ },
+ {
+ "epoch": 27.414168937329702,
+ "grad_norm": 8.814774513244629,
+ "learning_rate": 1.703337095588291e-05,
+ "loss": 0.4966,
+ "step": 10061
+ },
+ {
+ "epoch": 27.416893732970028,
+ "grad_norm": 9.867323875427246,
+ "learning_rate": 1.703274360146877e-05,
+ "loss": 0.5505,
+ "step": 10062
+ },
+ {
+ "epoch": 27.419618528610354,
+ "grad_norm": 12.343128204345703,
+ "learning_rate": 1.7032116192283844e-05,
+ "loss": 0.5804,
+ "step": 10063
+ },
+ {
+ "epoch": 27.422343324250683,
+ "grad_norm": 7.334210395812988,
+ "learning_rate": 1.7031488728333025e-05,
+ "loss": 0.4539,
+ "step": 10064
+ },
+ {
+ "epoch": 27.42506811989101,
+ "grad_norm": 7.609729766845703,
+ "learning_rate": 1.70308612096212e-05,
+ "loss": 0.5215,
+ "step": 10065
+ },
+ {
+ "epoch": 27.427792915531334,
+ "grad_norm": 7.235856533050537,
+ "learning_rate": 1.703023363615325e-05,
+ "loss": 0.6719,
+ "step": 10066
+ },
+ {
+ "epoch": 27.430517711171664,
+ "grad_norm": 10.903604507446289,
+ "learning_rate": 1.7029606007934073e-05,
+ "loss": 0.4841,
+ "step": 10067
+ },
+ {
+ "epoch": 27.43324250681199,
+ "grad_norm": 6.353349685668945,
+ "learning_rate": 1.7028978324968543e-05,
+ "loss": 0.616,
+ "step": 10068
+ },
+ {
+ "epoch": 27.435967302452315,
+ "grad_norm": 9.866066932678223,
+ "learning_rate": 1.702835058726156e-05,
+ "loss": 0.5229,
+ "step": 10069
+ },
+ {
+ "epoch": 27.438692098092645,
+ "grad_norm": 7.57305383682251,
+ "learning_rate": 1.7027722794818008e-05,
+ "loss": 0.3775,
+ "step": 10070
+ },
+ {
+ "epoch": 27.44141689373297,
+ "grad_norm": 22.632381439208984,
+ "learning_rate": 1.702709494764278e-05,
+ "loss": 0.4514,
+ "step": 10071
+ },
+ {
+ "epoch": 27.444141689373296,
+ "grad_norm": 7.173084735870361,
+ "learning_rate": 1.7026467045740762e-05,
+ "loss": 0.5573,
+ "step": 10072
+ },
+ {
+ "epoch": 27.446866485013626,
+ "grad_norm": 8.10495376586914,
+ "learning_rate": 1.7025839089116843e-05,
+ "loss": 0.4835,
+ "step": 10073
+ },
+ {
+ "epoch": 27.44959128065395,
+ "grad_norm": 7.458191394805908,
+ "learning_rate": 1.7025211077775915e-05,
+ "loss": 0.4229,
+ "step": 10074
+ },
+ {
+ "epoch": 27.452316076294277,
+ "grad_norm": 7.296041011810303,
+ "learning_rate": 1.702458301172287e-05,
+ "loss": 0.5245,
+ "step": 10075
+ },
+ {
+ "epoch": 27.455040871934607,
+ "grad_norm": 8.165763854980469,
+ "learning_rate": 1.70239548909626e-05,
+ "loss": 0.3905,
+ "step": 10076
+ },
+ {
+ "epoch": 27.457765667574932,
+ "grad_norm": 10.956998825073242,
+ "learning_rate": 1.7023326715499994e-05,
+ "loss": 0.555,
+ "step": 10077
+ },
+ {
+ "epoch": 27.460490463215258,
+ "grad_norm": 7.5906805992126465,
+ "learning_rate": 1.7022698485339945e-05,
+ "loss": 0.6392,
+ "step": 10078
+ },
+ {
+ "epoch": 27.463215258855588,
+ "grad_norm": 5.883872032165527,
+ "learning_rate": 1.7022070200487344e-05,
+ "loss": 0.4222,
+ "step": 10079
+ },
+ {
+ "epoch": 27.465940054495913,
+ "grad_norm": 7.269608974456787,
+ "learning_rate": 1.702144186094709e-05,
+ "loss": 0.4908,
+ "step": 10080
+ },
+ {
+ "epoch": 27.46866485013624,
+ "grad_norm": 6.971725940704346,
+ "learning_rate": 1.7020813466724072e-05,
+ "loss": 0.4449,
+ "step": 10081
+ },
+ {
+ "epoch": 27.47138964577657,
+ "grad_norm": 7.517458915710449,
+ "learning_rate": 1.7020185017823185e-05,
+ "loss": 0.459,
+ "step": 10082
+ },
+ {
+ "epoch": 27.474114441416894,
+ "grad_norm": 8.003358840942383,
+ "learning_rate": 1.7019556514249323e-05,
+ "loss": 0.5072,
+ "step": 10083
+ },
+ {
+ "epoch": 27.47683923705722,
+ "grad_norm": 7.887994766235352,
+ "learning_rate": 1.701892795600738e-05,
+ "loss": 0.4629,
+ "step": 10084
+ },
+ {
+ "epoch": 27.479564032697546,
+ "grad_norm": 7.413704872131348,
+ "learning_rate": 1.7018299343102252e-05,
+ "loss": 0.4489,
+ "step": 10085
+ },
+ {
+ "epoch": 27.482288828337875,
+ "grad_norm": 8.17776107788086,
+ "learning_rate": 1.7017670675538834e-05,
+ "loss": 0.5391,
+ "step": 10086
+ },
+ {
+ "epoch": 27.4850136239782,
+ "grad_norm": 8.881941795349121,
+ "learning_rate": 1.7017041953322025e-05,
+ "loss": 0.4822,
+ "step": 10087
+ },
+ {
+ "epoch": 27.48773841961853,
+ "grad_norm": 8.7860107421875,
+ "learning_rate": 1.7016413176456717e-05,
+ "loss": 0.6063,
+ "step": 10088
+ },
+ {
+ "epoch": 27.490463215258856,
+ "grad_norm": 8.136934280395508,
+ "learning_rate": 1.701578434494781e-05,
+ "loss": 0.5015,
+ "step": 10089
+ },
+ {
+ "epoch": 27.493188010899182,
+ "grad_norm": 7.738018989562988,
+ "learning_rate": 1.70151554588002e-05,
+ "loss": 0.5712,
+ "step": 10090
+ },
+ {
+ "epoch": 27.495912806539508,
+ "grad_norm": 8.951044082641602,
+ "learning_rate": 1.7014526518018787e-05,
+ "loss": 0.4677,
+ "step": 10091
+ },
+ {
+ "epoch": 27.498637602179837,
+ "grad_norm": 8.95796012878418,
+ "learning_rate": 1.7013897522608464e-05,
+ "loss": 0.4974,
+ "step": 10092
+ },
+ {
+ "epoch": 27.501362397820163,
+ "grad_norm": 6.817696571350098,
+ "learning_rate": 1.7013268472574133e-05,
+ "loss": 0.586,
+ "step": 10093
+ },
+ {
+ "epoch": 27.504087193460492,
+ "grad_norm": 9.146210670471191,
+ "learning_rate": 1.7012639367920694e-05,
+ "loss": 0.5119,
+ "step": 10094
+ },
+ {
+ "epoch": 27.506811989100818,
+ "grad_norm": 8.180194854736328,
+ "learning_rate": 1.7012010208653044e-05,
+ "loss": 0.5262,
+ "step": 10095
+ },
+ {
+ "epoch": 27.509536784741144,
+ "grad_norm": 7.886168956756592,
+ "learning_rate": 1.7011380994776086e-05,
+ "loss": 0.55,
+ "step": 10096
+ },
+ {
+ "epoch": 27.51226158038147,
+ "grad_norm": 7.781095027923584,
+ "learning_rate": 1.701075172629472e-05,
+ "loss": 0.4719,
+ "step": 10097
+ },
+ {
+ "epoch": 27.5149863760218,
+ "grad_norm": 9.938278198242188,
+ "learning_rate": 1.701012240321384e-05,
+ "loss": 0.4791,
+ "step": 10098
+ },
+ {
+ "epoch": 27.517711171662125,
+ "grad_norm": 8.60433578491211,
+ "learning_rate": 1.7009493025538356e-05,
+ "loss": 0.5984,
+ "step": 10099
+ },
+ {
+ "epoch": 27.520435967302454,
+ "grad_norm": 7.6925740242004395,
+ "learning_rate": 1.7008863593273167e-05,
+ "loss": 0.4728,
+ "step": 10100
+ },
+ {
+ "epoch": 27.52316076294278,
+ "grad_norm": 10.18087387084961,
+ "learning_rate": 1.7008234106423175e-05,
+ "loss": 0.5426,
+ "step": 10101
+ },
+ {
+ "epoch": 27.525885558583106,
+ "grad_norm": 8.223434448242188,
+ "learning_rate": 1.7007604564993277e-05,
+ "loss": 0.4843,
+ "step": 10102
+ },
+ {
+ "epoch": 27.52861035422343,
+ "grad_norm": 7.773364067077637,
+ "learning_rate": 1.7006974968988382e-05,
+ "loss": 0.5776,
+ "step": 10103
+ },
+ {
+ "epoch": 27.53133514986376,
+ "grad_norm": 7.327798366546631,
+ "learning_rate": 1.700634531841339e-05,
+ "loss": 0.5204,
+ "step": 10104
+ },
+ {
+ "epoch": 27.534059945504087,
+ "grad_norm": 7.9707512855529785,
+ "learning_rate": 1.7005715613273206e-05,
+ "loss": 0.3813,
+ "step": 10105
+ },
+ {
+ "epoch": 27.536784741144416,
+ "grad_norm": 8.973421096801758,
+ "learning_rate": 1.7005085853572736e-05,
+ "loss": 0.5999,
+ "step": 10106
+ },
+ {
+ "epoch": 27.539509536784742,
+ "grad_norm": 6.864203453063965,
+ "learning_rate": 1.7004456039316883e-05,
+ "loss": 0.4249,
+ "step": 10107
+ },
+ {
+ "epoch": 27.542234332425068,
+ "grad_norm": 8.282187461853027,
+ "learning_rate": 1.700382617051055e-05,
+ "loss": 0.6014,
+ "step": 10108
+ },
+ {
+ "epoch": 27.544959128065393,
+ "grad_norm": 12.412527084350586,
+ "learning_rate": 1.700319624715865e-05,
+ "loss": 0.4525,
+ "step": 10109
+ },
+ {
+ "epoch": 27.547683923705723,
+ "grad_norm": 9.558048248291016,
+ "learning_rate": 1.7002566269266078e-05,
+ "loss": 0.3632,
+ "step": 10110
+ },
+ {
+ "epoch": 27.55040871934605,
+ "grad_norm": 9.724501609802246,
+ "learning_rate": 1.7001936236837743e-05,
+ "loss": 0.6462,
+ "step": 10111
+ },
+ {
+ "epoch": 27.553133514986374,
+ "grad_norm": 8.310857772827148,
+ "learning_rate": 1.700130614987856e-05,
+ "loss": 0.5931,
+ "step": 10112
+ },
+ {
+ "epoch": 27.555858310626704,
+ "grad_norm": 14.585291862487793,
+ "learning_rate": 1.700067600839342e-05,
+ "loss": 0.4228,
+ "step": 10113
+ },
+ {
+ "epoch": 27.55858310626703,
+ "grad_norm": 7.609127044677734,
+ "learning_rate": 1.7000045812387253e-05,
+ "loss": 0.4537,
+ "step": 10114
+ },
+ {
+ "epoch": 27.561307901907355,
+ "grad_norm": 8.360729217529297,
+ "learning_rate": 1.6999415561864946e-05,
+ "loss": 0.5504,
+ "step": 10115
+ },
+ {
+ "epoch": 27.564032697547685,
+ "grad_norm": 10.392511367797852,
+ "learning_rate": 1.699878525683142e-05,
+ "loss": 0.6907,
+ "step": 10116
+ },
+ {
+ "epoch": 27.56675749318801,
+ "grad_norm": 9.930464744567871,
+ "learning_rate": 1.699815489729158e-05,
+ "loss": 0.5182,
+ "step": 10117
+ },
+ {
+ "epoch": 27.569482288828336,
+ "grad_norm": 8.100626945495605,
+ "learning_rate": 1.699752448325033e-05,
+ "loss": 0.4962,
+ "step": 10118
+ },
+ {
+ "epoch": 27.572207084468666,
+ "grad_norm": 9.099678039550781,
+ "learning_rate": 1.699689401471259e-05,
+ "loss": 0.5587,
+ "step": 10119
+ },
+ {
+ "epoch": 27.57493188010899,
+ "grad_norm": 8.464005470275879,
+ "learning_rate": 1.6996263491683263e-05,
+ "loss": 0.5463,
+ "step": 10120
+ },
+ {
+ "epoch": 27.577656675749317,
+ "grad_norm": 7.654876232147217,
+ "learning_rate": 1.699563291416726e-05,
+ "loss": 0.495,
+ "step": 10121
+ },
+ {
+ "epoch": 27.580381471389646,
+ "grad_norm": 8.215298652648926,
+ "learning_rate": 1.699500228216949e-05,
+ "loss": 0.5095,
+ "step": 10122
+ },
+ {
+ "epoch": 27.583106267029972,
+ "grad_norm": 8.29395580291748,
+ "learning_rate": 1.6994371595694875e-05,
+ "loss": 0.5142,
+ "step": 10123
+ },
+ {
+ "epoch": 27.585831062670298,
+ "grad_norm": 7.2489190101623535,
+ "learning_rate": 1.6993740854748315e-05,
+ "loss": 0.576,
+ "step": 10124
+ },
+ {
+ "epoch": 27.588555858310627,
+ "grad_norm": 8.529529571533203,
+ "learning_rate": 1.6993110059334725e-05,
+ "loss": 0.4901,
+ "step": 10125
+ },
+ {
+ "epoch": 27.591280653950953,
+ "grad_norm": 9.240521430969238,
+ "learning_rate": 1.699247920945902e-05,
+ "loss": 0.7894,
+ "step": 10126
+ },
+ {
+ "epoch": 27.59400544959128,
+ "grad_norm": 8.59414005279541,
+ "learning_rate": 1.6991848305126113e-05,
+ "loss": 0.3962,
+ "step": 10127
+ },
+ {
+ "epoch": 27.59673024523161,
+ "grad_norm": 7.808393478393555,
+ "learning_rate": 1.6991217346340917e-05,
+ "loss": 0.4674,
+ "step": 10128
+ },
+ {
+ "epoch": 27.599455040871934,
+ "grad_norm": 9.266545295715332,
+ "learning_rate": 1.6990586333108342e-05,
+ "loss": 0.4837,
+ "step": 10129
+ },
+ {
+ "epoch": 27.60217983651226,
+ "grad_norm": 10.481103897094727,
+ "learning_rate": 1.698995526543331e-05,
+ "loss": 0.5045,
+ "step": 10130
+ },
+ {
+ "epoch": 27.60490463215259,
+ "grad_norm": 8.234030723571777,
+ "learning_rate": 1.698932414332073e-05,
+ "loss": 0.6446,
+ "step": 10131
+ },
+ {
+ "epoch": 27.607629427792915,
+ "grad_norm": 8.013397216796875,
+ "learning_rate": 1.6988692966775515e-05,
+ "loss": 0.5372,
+ "step": 10132
+ },
+ {
+ "epoch": 27.61035422343324,
+ "grad_norm": 11.488170623779297,
+ "learning_rate": 1.6988061735802587e-05,
+ "loss": 0.5749,
+ "step": 10133
+ },
+ {
+ "epoch": 27.61307901907357,
+ "grad_norm": 8.59324836730957,
+ "learning_rate": 1.6987430450406857e-05,
+ "loss": 0.4888,
+ "step": 10134
+ },
+ {
+ "epoch": 27.615803814713896,
+ "grad_norm": 6.613129138946533,
+ "learning_rate": 1.698679911059325e-05,
+ "loss": 0.6968,
+ "step": 10135
+ },
+ {
+ "epoch": 27.618528610354222,
+ "grad_norm": 8.80296802520752,
+ "learning_rate": 1.698616771636667e-05,
+ "loss": 0.4436,
+ "step": 10136
+ },
+ {
+ "epoch": 27.62125340599455,
+ "grad_norm": 9.776527404785156,
+ "learning_rate": 1.698553626773204e-05,
+ "loss": 0.5546,
+ "step": 10137
+ },
+ {
+ "epoch": 27.623978201634877,
+ "grad_norm": 9.341790199279785,
+ "learning_rate": 1.6984904764694282e-05,
+ "loss": 0.548,
+ "step": 10138
+ },
+ {
+ "epoch": 27.626702997275203,
+ "grad_norm": 8.773140907287598,
+ "learning_rate": 1.6984273207258312e-05,
+ "loss": 0.5074,
+ "step": 10139
+ },
+ {
+ "epoch": 27.629427792915532,
+ "grad_norm": 7.1406025886535645,
+ "learning_rate": 1.698364159542904e-05,
+ "loss": 0.4796,
+ "step": 10140
+ },
+ {
+ "epoch": 27.632152588555858,
+ "grad_norm": 8.004528999328613,
+ "learning_rate": 1.6983009929211397e-05,
+ "loss": 0.4002,
+ "step": 10141
+ },
+ {
+ "epoch": 27.634877384196184,
+ "grad_norm": 14.518450736999512,
+ "learning_rate": 1.6982378208610298e-05,
+ "loss": 0.4852,
+ "step": 10142
+ },
+ {
+ "epoch": 27.637602179836513,
+ "grad_norm": 12.912113189697266,
+ "learning_rate": 1.698174643363066e-05,
+ "loss": 0.5564,
+ "step": 10143
+ },
+ {
+ "epoch": 27.64032697547684,
+ "grad_norm": 7.492455005645752,
+ "learning_rate": 1.698111460427741e-05,
+ "loss": 0.4921,
+ "step": 10144
+ },
+ {
+ "epoch": 27.643051771117165,
+ "grad_norm": 8.511575698852539,
+ "learning_rate": 1.6980482720555457e-05,
+ "loss": 0.562,
+ "step": 10145
+ },
+ {
+ "epoch": 27.645776566757494,
+ "grad_norm": 8.994081497192383,
+ "learning_rate": 1.6979850782469734e-05,
+ "loss": 0.3861,
+ "step": 10146
+ },
+ {
+ "epoch": 27.64850136239782,
+ "grad_norm": 10.454629898071289,
+ "learning_rate": 1.6979218790025157e-05,
+ "loss": 0.5139,
+ "step": 10147
+ },
+ {
+ "epoch": 27.651226158038146,
+ "grad_norm": 6.342076778411865,
+ "learning_rate": 1.6978586743226646e-05,
+ "loss": 0.4712,
+ "step": 10148
+ },
+ {
+ "epoch": 27.653950953678475,
+ "grad_norm": 7.370853900909424,
+ "learning_rate": 1.697795464207913e-05,
+ "loss": 0.4252,
+ "step": 10149
+ },
+ {
+ "epoch": 27.6566757493188,
+ "grad_norm": 7.944183349609375,
+ "learning_rate": 1.6977322486587527e-05,
+ "loss": 0.48,
+ "step": 10150
+ },
+ {
+ "epoch": 27.659400544959126,
+ "grad_norm": 9.738842964172363,
+ "learning_rate": 1.697669027675676e-05,
+ "loss": 0.5269,
+ "step": 10151
+ },
+ {
+ "epoch": 27.662125340599456,
+ "grad_norm": 10.647909164428711,
+ "learning_rate": 1.6976058012591755e-05,
+ "loss": 0.5145,
+ "step": 10152
+ },
+ {
+ "epoch": 27.66485013623978,
+ "grad_norm": 7.026835918426514,
+ "learning_rate": 1.697542569409743e-05,
+ "loss": 0.5372,
+ "step": 10153
+ },
+ {
+ "epoch": 27.667574931880107,
+ "grad_norm": 7.8032684326171875,
+ "learning_rate": 1.697479332127872e-05,
+ "loss": 0.722,
+ "step": 10154
+ },
+ {
+ "epoch": 27.670299727520437,
+ "grad_norm": 7.139540672302246,
+ "learning_rate": 1.697416089414054e-05,
+ "loss": 0.5872,
+ "step": 10155
+ },
+ {
+ "epoch": 27.673024523160763,
+ "grad_norm": 8.369836807250977,
+ "learning_rate": 1.6973528412687824e-05,
+ "loss": 0.6517,
+ "step": 10156
+ },
+ {
+ "epoch": 27.67574931880109,
+ "grad_norm": 8.08837604522705,
+ "learning_rate": 1.697289587692549e-05,
+ "loss": 0.5886,
+ "step": 10157
+ },
+ {
+ "epoch": 27.678474114441418,
+ "grad_norm": 11.793229103088379,
+ "learning_rate": 1.6972263286858467e-05,
+ "loss": 0.4599,
+ "step": 10158
+ },
+ {
+ "epoch": 27.681198910081743,
+ "grad_norm": 7.740310192108154,
+ "learning_rate": 1.6971630642491683e-05,
+ "loss": 0.4795,
+ "step": 10159
+ },
+ {
+ "epoch": 27.68392370572207,
+ "grad_norm": 17.676279067993164,
+ "learning_rate": 1.6970997943830062e-05,
+ "loss": 0.422,
+ "step": 10160
+ },
+ {
+ "epoch": 27.6866485013624,
+ "grad_norm": 7.5012617111206055,
+ "learning_rate": 1.6970365190878536e-05,
+ "loss": 0.5285,
+ "step": 10161
+ },
+ {
+ "epoch": 27.689373297002724,
+ "grad_norm": 8.547582626342773,
+ "learning_rate": 1.696973238364203e-05,
+ "loss": 0.4307,
+ "step": 10162
+ },
+ {
+ "epoch": 27.69209809264305,
+ "grad_norm": 9.068389892578125,
+ "learning_rate": 1.6969099522125475e-05,
+ "loss": 0.6285,
+ "step": 10163
+ },
+ {
+ "epoch": 27.69482288828338,
+ "grad_norm": 9.725485801696777,
+ "learning_rate": 1.6968466606333792e-05,
+ "loss": 0.5322,
+ "step": 10164
+ },
+ {
+ "epoch": 27.697547683923705,
+ "grad_norm": 8.065115928649902,
+ "learning_rate": 1.6967833636271916e-05,
+ "loss": 0.5037,
+ "step": 10165
+ },
+ {
+ "epoch": 27.70027247956403,
+ "grad_norm": 7.664557456970215,
+ "learning_rate": 1.6967200611944776e-05,
+ "loss": 0.4163,
+ "step": 10166
+ },
+ {
+ "epoch": 27.70299727520436,
+ "grad_norm": 8.630768775939941,
+ "learning_rate": 1.69665675333573e-05,
+ "loss": 0.5409,
+ "step": 10167
+ },
+ {
+ "epoch": 27.705722070844686,
+ "grad_norm": 7.188152313232422,
+ "learning_rate": 1.696593440051443e-05,
+ "loss": 0.5503,
+ "step": 10168
+ },
+ {
+ "epoch": 27.708446866485012,
+ "grad_norm": 10.388522148132324,
+ "learning_rate": 1.6965301213421075e-05,
+ "loss": 0.6546,
+ "step": 10169
+ },
+ {
+ "epoch": 27.71117166212534,
+ "grad_norm": 9.461798667907715,
+ "learning_rate": 1.6964667972082187e-05,
+ "loss": 0.5003,
+ "step": 10170
+ },
+ {
+ "epoch": 27.713896457765667,
+ "grad_norm": 10.95566463470459,
+ "learning_rate": 1.6964034676502686e-05,
+ "loss": 0.5399,
+ "step": 10171
+ },
+ {
+ "epoch": 27.716621253405993,
+ "grad_norm": 14.988588333129883,
+ "learning_rate": 1.6963401326687506e-05,
+ "loss": 0.5426,
+ "step": 10172
+ },
+ {
+ "epoch": 27.719346049046322,
+ "grad_norm": 7.101005554199219,
+ "learning_rate": 1.696276792264158e-05,
+ "loss": 0.476,
+ "step": 10173
+ },
+ {
+ "epoch": 27.722070844686648,
+ "grad_norm": 8.343110084533691,
+ "learning_rate": 1.6962134464369846e-05,
+ "loss": 0.5077,
+ "step": 10174
+ },
+ {
+ "epoch": 27.724795640326974,
+ "grad_norm": 12.384000778198242,
+ "learning_rate": 1.696150095187723e-05,
+ "loss": 0.5668,
+ "step": 10175
+ },
+ {
+ "epoch": 27.727520435967303,
+ "grad_norm": 7.71723747253418,
+ "learning_rate": 1.6960867385168668e-05,
+ "loss": 0.4366,
+ "step": 10176
+ },
+ {
+ "epoch": 27.73024523160763,
+ "grad_norm": 7.035843372344971,
+ "learning_rate": 1.6960233764249095e-05,
+ "loss": 0.6004,
+ "step": 10177
+ },
+ {
+ "epoch": 27.732970027247955,
+ "grad_norm": 8.7925386428833,
+ "learning_rate": 1.6959600089123447e-05,
+ "loss": 0.5704,
+ "step": 10178
+ },
+ {
+ "epoch": 27.735694822888284,
+ "grad_norm": 7.859381198883057,
+ "learning_rate": 1.6958966359796657e-05,
+ "loss": 0.4832,
+ "step": 10179
+ },
+ {
+ "epoch": 27.73841961852861,
+ "grad_norm": 7.379161834716797,
+ "learning_rate": 1.695833257627366e-05,
+ "loss": 0.6636,
+ "step": 10180
+ },
+ {
+ "epoch": 27.741144414168936,
+ "grad_norm": 7.621696949005127,
+ "learning_rate": 1.695769873855939e-05,
+ "loss": 0.4753,
+ "step": 10181
+ },
+ {
+ "epoch": 27.743869209809265,
+ "grad_norm": 7.432315349578857,
+ "learning_rate": 1.695706484665879e-05,
+ "loss": 0.6271,
+ "step": 10182
+ },
+ {
+ "epoch": 27.74659400544959,
+ "grad_norm": 8.763675689697266,
+ "learning_rate": 1.695643090057679e-05,
+ "loss": 0.5212,
+ "step": 10183
+ },
+ {
+ "epoch": 27.749318801089917,
+ "grad_norm": 8.227683067321777,
+ "learning_rate": 1.6955796900318337e-05,
+ "loss": 0.5168,
+ "step": 10184
+ },
+ {
+ "epoch": 27.752043596730246,
+ "grad_norm": 8.002479553222656,
+ "learning_rate": 1.6955162845888354e-05,
+ "loss": 0.5506,
+ "step": 10185
+ },
+ {
+ "epoch": 27.754768392370572,
+ "grad_norm": 7.464667320251465,
+ "learning_rate": 1.6954528737291787e-05,
+ "loss": 0.3843,
+ "step": 10186
+ },
+ {
+ "epoch": 27.757493188010898,
+ "grad_norm": 8.782455444335938,
+ "learning_rate": 1.695389457453358e-05,
+ "loss": 0.4337,
+ "step": 10187
+ },
+ {
+ "epoch": 27.760217983651227,
+ "grad_norm": 6.0465922355651855,
+ "learning_rate": 1.6953260357618662e-05,
+ "loss": 0.3922,
+ "step": 10188
+ },
+ {
+ "epoch": 27.762942779291553,
+ "grad_norm": 9.327617645263672,
+ "learning_rate": 1.6952626086551977e-05,
+ "loss": 0.49,
+ "step": 10189
+ },
+ {
+ "epoch": 27.76566757493188,
+ "grad_norm": 8.79337215423584,
+ "learning_rate": 1.6951991761338463e-05,
+ "loss": 0.6237,
+ "step": 10190
+ },
+ {
+ "epoch": 27.768392370572208,
+ "grad_norm": 8.579442977905273,
+ "learning_rate": 1.695135738198306e-05,
+ "loss": 0.5703,
+ "step": 10191
+ },
+ {
+ "epoch": 27.771117166212534,
+ "grad_norm": 8.197420120239258,
+ "learning_rate": 1.6950722948490713e-05,
+ "loss": 0.5209,
+ "step": 10192
+ },
+ {
+ "epoch": 27.77384196185286,
+ "grad_norm": 8.335177421569824,
+ "learning_rate": 1.6950088460866357e-05,
+ "loss": 0.5037,
+ "step": 10193
+ },
+ {
+ "epoch": 27.77656675749319,
+ "grad_norm": 7.469491958618164,
+ "learning_rate": 1.694945391911493e-05,
+ "loss": 0.4836,
+ "step": 10194
+ },
+ {
+ "epoch": 27.779291553133515,
+ "grad_norm": 8.92253303527832,
+ "learning_rate": 1.694881932324139e-05,
+ "loss": 0.4843,
+ "step": 10195
+ },
+ {
+ "epoch": 27.78201634877384,
+ "grad_norm": 8.606045722961426,
+ "learning_rate": 1.6948184673250665e-05,
+ "loss": 0.5375,
+ "step": 10196
+ },
+ {
+ "epoch": 27.78474114441417,
+ "grad_norm": 7.045773506164551,
+ "learning_rate": 1.69475499691477e-05,
+ "loss": 0.4955,
+ "step": 10197
+ },
+ {
+ "epoch": 27.787465940054496,
+ "grad_norm": 8.528428077697754,
+ "learning_rate": 1.694691521093744e-05,
+ "loss": 0.4139,
+ "step": 10198
+ },
+ {
+ "epoch": 27.79019073569482,
+ "grad_norm": 11.833290100097656,
+ "learning_rate": 1.6946280398624828e-05,
+ "loss": 0.5298,
+ "step": 10199
+ },
+ {
+ "epoch": 27.79291553133515,
+ "grad_norm": 7.898739337921143,
+ "learning_rate": 1.6945645532214805e-05,
+ "loss": 0.6686,
+ "step": 10200
+ },
+ {
+ "epoch": 27.795640326975477,
+ "grad_norm": 8.228962898254395,
+ "learning_rate": 1.694501061171232e-05,
+ "loss": 0.493,
+ "step": 10201
+ },
+ {
+ "epoch": 27.798365122615802,
+ "grad_norm": 10.405641555786133,
+ "learning_rate": 1.6944375637122318e-05,
+ "loss": 0.5291,
+ "step": 10202
+ },
+ {
+ "epoch": 27.80108991825613,
+ "grad_norm": 8.502785682678223,
+ "learning_rate": 1.694374060844974e-05,
+ "loss": 0.5408,
+ "step": 10203
+ },
+ {
+ "epoch": 27.803814713896458,
+ "grad_norm": 8.7985200881958,
+ "learning_rate": 1.6943105525699534e-05,
+ "loss": 0.6182,
+ "step": 10204
+ },
+ {
+ "epoch": 27.806539509536783,
+ "grad_norm": 8.150802612304688,
+ "learning_rate": 1.6942470388876645e-05,
+ "loss": 0.692,
+ "step": 10205
+ },
+ {
+ "epoch": 27.809264305177113,
+ "grad_norm": 6.949302673339844,
+ "learning_rate": 1.6941835197986023e-05,
+ "loss": 0.564,
+ "step": 10206
+ },
+ {
+ "epoch": 27.81198910081744,
+ "grad_norm": 11.274639129638672,
+ "learning_rate": 1.694119995303261e-05,
+ "loss": 0.5856,
+ "step": 10207
+ },
+ {
+ "epoch": 27.814713896457764,
+ "grad_norm": 7.7016072273254395,
+ "learning_rate": 1.6940564654021355e-05,
+ "loss": 0.5806,
+ "step": 10208
+ },
+ {
+ "epoch": 27.817438692098094,
+ "grad_norm": 8.560013771057129,
+ "learning_rate": 1.6939929300957206e-05,
+ "loss": 0.6448,
+ "step": 10209
+ },
+ {
+ "epoch": 27.82016348773842,
+ "grad_norm": 6.942630290985107,
+ "learning_rate": 1.693929389384511e-05,
+ "loss": 0.4706,
+ "step": 10210
+ },
+ {
+ "epoch": 27.822888283378745,
+ "grad_norm": 6.969632148742676,
+ "learning_rate": 1.6938658432690016e-05,
+ "loss": 0.4278,
+ "step": 10211
+ },
+ {
+ "epoch": 27.825613079019075,
+ "grad_norm": 7.503054618835449,
+ "learning_rate": 1.6938022917496876e-05,
+ "loss": 0.4682,
+ "step": 10212
+ },
+ {
+ "epoch": 27.8283378746594,
+ "grad_norm": 8.342432975769043,
+ "learning_rate": 1.6937387348270636e-05,
+ "loss": 0.4071,
+ "step": 10213
+ },
+ {
+ "epoch": 27.831062670299726,
+ "grad_norm": 7.85593318939209,
+ "learning_rate": 1.6936751725016248e-05,
+ "loss": 0.6279,
+ "step": 10214
+ },
+ {
+ "epoch": 27.833787465940055,
+ "grad_norm": 6.302553653717041,
+ "learning_rate": 1.6936116047738657e-05,
+ "loss": 0.5239,
+ "step": 10215
+ },
+ {
+ "epoch": 27.83651226158038,
+ "grad_norm": 8.658904075622559,
+ "learning_rate": 1.6935480316442818e-05,
+ "loss": 0.5029,
+ "step": 10216
+ },
+ {
+ "epoch": 27.839237057220707,
+ "grad_norm": 7.880286693572998,
+ "learning_rate": 1.6934844531133686e-05,
+ "loss": 0.509,
+ "step": 10217
+ },
+ {
+ "epoch": 27.841961852861036,
+ "grad_norm": 6.384045124053955,
+ "learning_rate": 1.6934208691816203e-05,
+ "loss": 0.4031,
+ "step": 10218
+ },
+ {
+ "epoch": 27.844686648501362,
+ "grad_norm": 7.981046199798584,
+ "learning_rate": 1.6933572798495327e-05,
+ "loss": 0.4557,
+ "step": 10219
+ },
+ {
+ "epoch": 27.847411444141688,
+ "grad_norm": 7.138590335845947,
+ "learning_rate": 1.6932936851176013e-05,
+ "loss": 0.6566,
+ "step": 10220
+ },
+ {
+ "epoch": 27.850136239782017,
+ "grad_norm": 6.986456871032715,
+ "learning_rate": 1.6932300849863207e-05,
+ "loss": 0.4547,
+ "step": 10221
+ },
+ {
+ "epoch": 27.852861035422343,
+ "grad_norm": 7.824373245239258,
+ "learning_rate": 1.6931664794561862e-05,
+ "loss": 0.5171,
+ "step": 10222
+ },
+ {
+ "epoch": 27.85558583106267,
+ "grad_norm": 8.812350273132324,
+ "learning_rate": 1.693102868527694e-05,
+ "loss": 0.6844,
+ "step": 10223
+ },
+ {
+ "epoch": 27.858310626703,
+ "grad_norm": 6.86625862121582,
+ "learning_rate": 1.693039252201339e-05,
+ "loss": 0.3973,
+ "step": 10224
+ },
+ {
+ "epoch": 27.861035422343324,
+ "grad_norm": 10.785688400268555,
+ "learning_rate": 1.692975630477616e-05,
+ "loss": 0.7382,
+ "step": 10225
+ },
+ {
+ "epoch": 27.86376021798365,
+ "grad_norm": 42.3944091796875,
+ "learning_rate": 1.6929120033570218e-05,
+ "loss": 0.5722,
+ "step": 10226
+ },
+ {
+ "epoch": 27.86648501362398,
+ "grad_norm": 7.785507678985596,
+ "learning_rate": 1.6928483708400504e-05,
+ "loss": 0.4921,
+ "step": 10227
+ },
+ {
+ "epoch": 27.869209809264305,
+ "grad_norm": 6.294122695922852,
+ "learning_rate": 1.692784732927199e-05,
+ "loss": 0.4783,
+ "step": 10228
+ },
+ {
+ "epoch": 27.87193460490463,
+ "grad_norm": 7.572083950042725,
+ "learning_rate": 1.692721089618962e-05,
+ "loss": 0.4753,
+ "step": 10229
+ },
+ {
+ "epoch": 27.87465940054496,
+ "grad_norm": 10.167337417602539,
+ "learning_rate": 1.6926574409158354e-05,
+ "loss": 0.5658,
+ "step": 10230
+ },
+ {
+ "epoch": 27.877384196185286,
+ "grad_norm": 7.328114986419678,
+ "learning_rate": 1.692593786818315e-05,
+ "loss": 0.5149,
+ "step": 10231
+ },
+ {
+ "epoch": 27.88010899182561,
+ "grad_norm": 7.156718730926514,
+ "learning_rate": 1.6925301273268965e-05,
+ "loss": 0.5066,
+ "step": 10232
+ },
+ {
+ "epoch": 27.88283378746594,
+ "grad_norm": 11.570022583007812,
+ "learning_rate": 1.6924664624420758e-05,
+ "loss": 0.5504,
+ "step": 10233
+ },
+ {
+ "epoch": 27.885558583106267,
+ "grad_norm": 7.075197219848633,
+ "learning_rate": 1.6924027921643485e-05,
+ "loss": 0.4808,
+ "step": 10234
+ },
+ {
+ "epoch": 27.888283378746593,
+ "grad_norm": 8.273008346557617,
+ "learning_rate": 1.6923391164942106e-05,
+ "loss": 0.703,
+ "step": 10235
+ },
+ {
+ "epoch": 27.891008174386922,
+ "grad_norm": 6.79816198348999,
+ "learning_rate": 1.6922754354321577e-05,
+ "loss": 0.713,
+ "step": 10236
+ },
+ {
+ "epoch": 27.893732970027248,
+ "grad_norm": 7.069867134094238,
+ "learning_rate": 1.6922117489786863e-05,
+ "loss": 0.6285,
+ "step": 10237
+ },
+ {
+ "epoch": 27.896457765667574,
+ "grad_norm": 6.594805717468262,
+ "learning_rate": 1.6921480571342916e-05,
+ "loss": 0.5786,
+ "step": 10238
+ },
+ {
+ "epoch": 27.899182561307903,
+ "grad_norm": 8.521928787231445,
+ "learning_rate": 1.6920843598994707e-05,
+ "loss": 0.4567,
+ "step": 10239
+ },
+ {
+ "epoch": 27.90190735694823,
+ "grad_norm": 9.371071815490723,
+ "learning_rate": 1.6920206572747186e-05,
+ "loss": 0.4895,
+ "step": 10240
+ },
+ {
+ "epoch": 27.904632152588555,
+ "grad_norm": 7.50525426864624,
+ "learning_rate": 1.691956949260532e-05,
+ "loss": 0.4757,
+ "step": 10241
+ },
+ {
+ "epoch": 27.907356948228884,
+ "grad_norm": 9.543774604797363,
+ "learning_rate": 1.691893235857407e-05,
+ "loss": 0.4894,
+ "step": 10242
+ },
+ {
+ "epoch": 27.91008174386921,
+ "grad_norm": 7.727305889129639,
+ "learning_rate": 1.69182951706584e-05,
+ "loss": 0.6274,
+ "step": 10243
+ },
+ {
+ "epoch": 27.912806539509535,
+ "grad_norm": 8.318642616271973,
+ "learning_rate": 1.6917657928863267e-05,
+ "loss": 0.4711,
+ "step": 10244
+ },
+ {
+ "epoch": 27.915531335149865,
+ "grad_norm": 7.303012847900391,
+ "learning_rate": 1.691702063319364e-05,
+ "loss": 0.5171,
+ "step": 10245
+ },
+ {
+ "epoch": 27.91825613079019,
+ "grad_norm": 7.7373247146606445,
+ "learning_rate": 1.6916383283654478e-05,
+ "loss": 0.6812,
+ "step": 10246
+ },
+ {
+ "epoch": 27.920980926430516,
+ "grad_norm": 8.06027889251709,
+ "learning_rate": 1.691574588025074e-05,
+ "loss": 0.6066,
+ "step": 10247
+ },
+ {
+ "epoch": 27.923705722070846,
+ "grad_norm": 8.682061195373535,
+ "learning_rate": 1.6915108422987402e-05,
+ "loss": 0.5661,
+ "step": 10248
+ },
+ {
+ "epoch": 27.92643051771117,
+ "grad_norm": 6.264842510223389,
+ "learning_rate": 1.691447091186942e-05,
+ "loss": 0.5078,
+ "step": 10249
+ },
+ {
+ "epoch": 27.929155313351497,
+ "grad_norm": 8.2464017868042,
+ "learning_rate": 1.6913833346901758e-05,
+ "loss": 0.615,
+ "step": 10250
+ },
+ {
+ "epoch": 27.931880108991827,
+ "grad_norm": 14.93500804901123,
+ "learning_rate": 1.6913195728089388e-05,
+ "loss": 0.55,
+ "step": 10251
+ },
+ {
+ "epoch": 27.934604904632153,
+ "grad_norm": 8.586822509765625,
+ "learning_rate": 1.6912558055437273e-05,
+ "loss": 0.4811,
+ "step": 10252
+ },
+ {
+ "epoch": 27.93732970027248,
+ "grad_norm": 6.676853656768799,
+ "learning_rate": 1.6911920328950376e-05,
+ "loss": 0.547,
+ "step": 10253
+ },
+ {
+ "epoch": 27.940054495912808,
+ "grad_norm": 10.004607200622559,
+ "learning_rate": 1.6911282548633664e-05,
+ "loss": 0.751,
+ "step": 10254
+ },
+ {
+ "epoch": 27.942779291553133,
+ "grad_norm": 9.108039855957031,
+ "learning_rate": 1.691064471449211e-05,
+ "loss": 0.4478,
+ "step": 10255
+ },
+ {
+ "epoch": 27.94550408719346,
+ "grad_norm": 7.818694114685059,
+ "learning_rate": 1.691000682653068e-05,
+ "loss": 0.5316,
+ "step": 10256
+ },
+ {
+ "epoch": 27.94822888283379,
+ "grad_norm": 6.828567028045654,
+ "learning_rate": 1.690936888475433e-05,
+ "loss": 0.4294,
+ "step": 10257
+ },
+ {
+ "epoch": 27.950953678474114,
+ "grad_norm": 9.278924942016602,
+ "learning_rate": 1.6908730889168047e-05,
+ "loss": 0.4493,
+ "step": 10258
+ },
+ {
+ "epoch": 27.95367847411444,
+ "grad_norm": 8.610934257507324,
+ "learning_rate": 1.690809283977678e-05,
+ "loss": 0.62,
+ "step": 10259
+ },
+ {
+ "epoch": 27.95640326975477,
+ "grad_norm": 7.227691650390625,
+ "learning_rate": 1.6907454736585517e-05,
+ "loss": 0.5197,
+ "step": 10260
+ },
+ {
+ "epoch": 27.959128065395095,
+ "grad_norm": 6.648590087890625,
+ "learning_rate": 1.6906816579599217e-05,
+ "loss": 0.5727,
+ "step": 10261
+ },
+ {
+ "epoch": 27.96185286103542,
+ "grad_norm": 6.574821949005127,
+ "learning_rate": 1.690617836882285e-05,
+ "loss": 0.4755,
+ "step": 10262
+ },
+ {
+ "epoch": 27.96457765667575,
+ "grad_norm": 7.378173351287842,
+ "learning_rate": 1.690554010426139e-05,
+ "loss": 0.5754,
+ "step": 10263
+ },
+ {
+ "epoch": 27.967302452316076,
+ "grad_norm": 10.361187934875488,
+ "learning_rate": 1.6904901785919806e-05,
+ "loss": 0.6264,
+ "step": 10264
+ },
+ {
+ "epoch": 27.970027247956402,
+ "grad_norm": 7.284205436706543,
+ "learning_rate": 1.6904263413803068e-05,
+ "loss": 0.446,
+ "step": 10265
+ },
+ {
+ "epoch": 27.97275204359673,
+ "grad_norm": 7.510517597198486,
+ "learning_rate": 1.6903624987916147e-05,
+ "loss": 0.5075,
+ "step": 10266
+ },
+ {
+ "epoch": 27.975476839237057,
+ "grad_norm": 8.687686920166016,
+ "learning_rate": 1.690298650826402e-05,
+ "loss": 0.5695,
+ "step": 10267
+ },
+ {
+ "epoch": 27.978201634877383,
+ "grad_norm": 7.612741470336914,
+ "learning_rate": 1.6902347974851653e-05,
+ "loss": 0.4938,
+ "step": 10268
+ },
+ {
+ "epoch": 27.980926430517712,
+ "grad_norm": 8.871014595031738,
+ "learning_rate": 1.6901709387684025e-05,
+ "loss": 0.5045,
+ "step": 10269
+ },
+ {
+ "epoch": 27.983651226158038,
+ "grad_norm": 7.562943458557129,
+ "learning_rate": 1.6901070746766108e-05,
+ "loss": 0.5377,
+ "step": 10270
+ },
+ {
+ "epoch": 27.986376021798364,
+ "grad_norm": 9.494495391845703,
+ "learning_rate": 1.690043205210287e-05,
+ "loss": 0.5172,
+ "step": 10271
+ },
+ {
+ "epoch": 27.989100817438693,
+ "grad_norm": 8.3716459274292,
+ "learning_rate": 1.689979330369929e-05,
+ "loss": 0.5178,
+ "step": 10272
+ },
+ {
+ "epoch": 27.99182561307902,
+ "grad_norm": 9.27304744720459,
+ "learning_rate": 1.6899154501560344e-05,
+ "loss": 0.4353,
+ "step": 10273
+ },
+ {
+ "epoch": 27.994550408719345,
+ "grad_norm": 7.550212383270264,
+ "learning_rate": 1.6898515645691002e-05,
+ "loss": 0.4103,
+ "step": 10274
+ },
+ {
+ "epoch": 27.997275204359674,
+ "grad_norm": 8.311297416687012,
+ "learning_rate": 1.6897876736096247e-05,
+ "loss": 0.4959,
+ "step": 10275
+ },
+ {
+ "epoch": 28.0,
+ "grad_norm": 6.824106216430664,
+ "learning_rate": 1.6897237772781046e-05,
+ "loss": 0.6491,
+ "step": 10276
+ },
+ {
+ "epoch": 28.002724795640326,
+ "grad_norm": 7.665373802185059,
+ "learning_rate": 1.6896598755750376e-05,
+ "loss": 0.606,
+ "step": 10277
+ },
+ {
+ "epoch": 28.005449591280655,
+ "grad_norm": 6.007593631744385,
+ "learning_rate": 1.689595968500922e-05,
+ "loss": 0.4334,
+ "step": 10278
+ },
+ {
+ "epoch": 28.00817438692098,
+ "grad_norm": 7.365853309631348,
+ "learning_rate": 1.6895320560562554e-05,
+ "loss": 0.4828,
+ "step": 10279
+ },
+ {
+ "epoch": 28.010899182561307,
+ "grad_norm": 8.586054801940918,
+ "learning_rate": 1.6894681382415353e-05,
+ "loss": 0.532,
+ "step": 10280
+ },
+ {
+ "epoch": 28.013623978201636,
+ "grad_norm": 9.997074127197266,
+ "learning_rate": 1.6894042150572594e-05,
+ "loss": 0.4187,
+ "step": 10281
+ },
+ {
+ "epoch": 28.016348773841962,
+ "grad_norm": 8.226503372192383,
+ "learning_rate": 1.6893402865039257e-05,
+ "loss": 0.4926,
+ "step": 10282
+ },
+ {
+ "epoch": 28.019073569482288,
+ "grad_norm": 7.064162731170654,
+ "learning_rate": 1.689276352582032e-05,
+ "loss": 0.5343,
+ "step": 10283
+ },
+ {
+ "epoch": 28.021798365122617,
+ "grad_norm": 18.196016311645508,
+ "learning_rate": 1.6892124132920763e-05,
+ "loss": 0.4216,
+ "step": 10284
+ },
+ {
+ "epoch": 28.024523160762943,
+ "grad_norm": 6.422055721282959,
+ "learning_rate": 1.6891484686345565e-05,
+ "loss": 0.5878,
+ "step": 10285
+ },
+ {
+ "epoch": 28.02724795640327,
+ "grad_norm": 6.667153835296631,
+ "learning_rate": 1.6890845186099705e-05,
+ "loss": 0.6854,
+ "step": 10286
+ },
+ {
+ "epoch": 28.029972752043598,
+ "grad_norm": 5.945711135864258,
+ "learning_rate": 1.6890205632188166e-05,
+ "loss": 0.396,
+ "step": 10287
+ },
+ {
+ "epoch": 28.032697547683924,
+ "grad_norm": 8.55396556854248,
+ "learning_rate": 1.6889566024615928e-05,
+ "loss": 0.4163,
+ "step": 10288
+ },
+ {
+ "epoch": 28.03542234332425,
+ "grad_norm": 6.2634406089782715,
+ "learning_rate": 1.688892636338797e-05,
+ "loss": 0.3436,
+ "step": 10289
+ },
+ {
+ "epoch": 28.03814713896458,
+ "grad_norm": 8.88974666595459,
+ "learning_rate": 1.6888286648509272e-05,
+ "loss": 0.4431,
+ "step": 10290
+ },
+ {
+ "epoch": 28.040871934604905,
+ "grad_norm": 6.603543758392334,
+ "learning_rate": 1.6887646879984826e-05,
+ "loss": 0.4554,
+ "step": 10291
+ },
+ {
+ "epoch": 28.04359673024523,
+ "grad_norm": 7.227399826049805,
+ "learning_rate": 1.6887007057819606e-05,
+ "loss": 0.5347,
+ "step": 10292
+ },
+ {
+ "epoch": 28.04632152588556,
+ "grad_norm": 7.476388931274414,
+ "learning_rate": 1.6886367182018593e-05,
+ "loss": 0.5303,
+ "step": 10293
+ },
+ {
+ "epoch": 28.049046321525886,
+ "grad_norm": 8.124524116516113,
+ "learning_rate": 1.6885727252586774e-05,
+ "loss": 0.479,
+ "step": 10294
+ },
+ {
+ "epoch": 28.05177111716621,
+ "grad_norm": 7.9931640625,
+ "learning_rate": 1.6885087269529136e-05,
+ "loss": 0.7098,
+ "step": 10295
+ },
+ {
+ "epoch": 28.05449591280654,
+ "grad_norm": 6.5644636154174805,
+ "learning_rate": 1.6884447232850657e-05,
+ "loss": 0.5326,
+ "step": 10296
+ },
+ {
+ "epoch": 28.057220708446867,
+ "grad_norm": 7.5684285163879395,
+ "learning_rate": 1.688380714255633e-05,
+ "loss": 0.6125,
+ "step": 10297
+ },
+ {
+ "epoch": 28.059945504087192,
+ "grad_norm": 7.379377841949463,
+ "learning_rate": 1.688316699865113e-05,
+ "loss": 0.4286,
+ "step": 10298
+ },
+ {
+ "epoch": 28.06267029972752,
+ "grad_norm": 8.864320755004883,
+ "learning_rate": 1.6882526801140046e-05,
+ "loss": 0.5087,
+ "step": 10299
+ },
+ {
+ "epoch": 28.065395095367847,
+ "grad_norm": 8.201573371887207,
+ "learning_rate": 1.6881886550028068e-05,
+ "loss": 0.372,
+ "step": 10300
+ },
+ {
+ "epoch": 28.068119891008173,
+ "grad_norm": 6.924935817718506,
+ "learning_rate": 1.688124624532018e-05,
+ "loss": 0.3792,
+ "step": 10301
+ },
+ {
+ "epoch": 28.070844686648503,
+ "grad_norm": 17.250703811645508,
+ "learning_rate": 1.6880605887021362e-05,
+ "loss": 0.4113,
+ "step": 10302
+ },
+ {
+ "epoch": 28.07356948228883,
+ "grad_norm": 7.773608207702637,
+ "learning_rate": 1.687996547513661e-05,
+ "loss": 0.5192,
+ "step": 10303
+ },
+ {
+ "epoch": 28.076294277929154,
+ "grad_norm": 11.720868110656738,
+ "learning_rate": 1.6879325009670912e-05,
+ "loss": 0.5282,
+ "step": 10304
+ },
+ {
+ "epoch": 28.079019073569484,
+ "grad_norm": 8.303223609924316,
+ "learning_rate": 1.6878684490629247e-05,
+ "loss": 0.4907,
+ "step": 10305
+ },
+ {
+ "epoch": 28.08174386920981,
+ "grad_norm": 5.874635219573975,
+ "learning_rate": 1.687804391801661e-05,
+ "loss": 0.5293,
+ "step": 10306
+ },
+ {
+ "epoch": 28.084468664850135,
+ "grad_norm": 6.997998237609863,
+ "learning_rate": 1.687740329183799e-05,
+ "loss": 0.3651,
+ "step": 10307
+ },
+ {
+ "epoch": 28.087193460490465,
+ "grad_norm": 11.347203254699707,
+ "learning_rate": 1.687676261209837e-05,
+ "loss": 0.4861,
+ "step": 10308
+ },
+ {
+ "epoch": 28.08991825613079,
+ "grad_norm": 9.801603317260742,
+ "learning_rate": 1.6876121878802748e-05,
+ "loss": 0.5014,
+ "step": 10309
+ },
+ {
+ "epoch": 28.092643051771116,
+ "grad_norm": 7.367988586425781,
+ "learning_rate": 1.687548109195611e-05,
+ "loss": 0.5709,
+ "step": 10310
+ },
+ {
+ "epoch": 28.095367847411445,
+ "grad_norm": 8.178997993469238,
+ "learning_rate": 1.6874840251563448e-05,
+ "loss": 0.5577,
+ "step": 10311
+ },
+ {
+ "epoch": 28.09809264305177,
+ "grad_norm": 10.153870582580566,
+ "learning_rate": 1.6874199357629747e-05,
+ "loss": 0.5374,
+ "step": 10312
+ },
+ {
+ "epoch": 28.100817438692097,
+ "grad_norm": 7.0586066246032715,
+ "learning_rate": 1.6873558410160006e-05,
+ "loss": 0.373,
+ "step": 10313
+ },
+ {
+ "epoch": 28.103542234332426,
+ "grad_norm": 6.657742977142334,
+ "learning_rate": 1.6872917409159213e-05,
+ "loss": 0.3198,
+ "step": 10314
+ },
+ {
+ "epoch": 28.106267029972752,
+ "grad_norm": 8.027143478393555,
+ "learning_rate": 1.6872276354632358e-05,
+ "loss": 0.5042,
+ "step": 10315
+ },
+ {
+ "epoch": 28.108991825613078,
+ "grad_norm": 6.80226993560791,
+ "learning_rate": 1.687163524658444e-05,
+ "loss": 0.4276,
+ "step": 10316
+ },
+ {
+ "epoch": 28.111716621253407,
+ "grad_norm": 7.309327602386475,
+ "learning_rate": 1.6870994085020446e-05,
+ "loss": 0.4528,
+ "step": 10317
+ },
+ {
+ "epoch": 28.114441416893733,
+ "grad_norm": 9.73857593536377,
+ "learning_rate": 1.687035286994537e-05,
+ "loss": 0.483,
+ "step": 10318
+ },
+ {
+ "epoch": 28.11716621253406,
+ "grad_norm": 7.97163200378418,
+ "learning_rate": 1.6869711601364206e-05,
+ "loss": 0.4059,
+ "step": 10319
+ },
+ {
+ "epoch": 28.11989100817439,
+ "grad_norm": 6.555824279785156,
+ "learning_rate": 1.686907027928195e-05,
+ "loss": 0.4689,
+ "step": 10320
+ },
+ {
+ "epoch": 28.122615803814714,
+ "grad_norm": 7.380853652954102,
+ "learning_rate": 1.6868428903703598e-05,
+ "loss": 0.4585,
+ "step": 10321
+ },
+ {
+ "epoch": 28.12534059945504,
+ "grad_norm": 7.245654106140137,
+ "learning_rate": 1.6867787474634142e-05,
+ "loss": 0.5209,
+ "step": 10322
+ },
+ {
+ "epoch": 28.12806539509537,
+ "grad_norm": 7.773459434509277,
+ "learning_rate": 1.6867145992078577e-05,
+ "loss": 0.5188,
+ "step": 10323
+ },
+ {
+ "epoch": 28.130790190735695,
+ "grad_norm": 7.523104667663574,
+ "learning_rate": 1.68665044560419e-05,
+ "loss": 0.3985,
+ "step": 10324
+ },
+ {
+ "epoch": 28.13351498637602,
+ "grad_norm": 7.532975673675537,
+ "learning_rate": 1.686586286652911e-05,
+ "loss": 0.4188,
+ "step": 10325
+ },
+ {
+ "epoch": 28.13623978201635,
+ "grad_norm": 8.93874740600586,
+ "learning_rate": 1.6865221223545198e-05,
+ "loss": 0.4528,
+ "step": 10326
+ },
+ {
+ "epoch": 28.138964577656676,
+ "grad_norm": 7.237036228179932,
+ "learning_rate": 1.6864579527095163e-05,
+ "loss": 0.491,
+ "step": 10327
+ },
+ {
+ "epoch": 28.141689373297,
+ "grad_norm": 7.244105339050293,
+ "learning_rate": 1.6863937777184006e-05,
+ "loss": 0.4947,
+ "step": 10328
+ },
+ {
+ "epoch": 28.14441416893733,
+ "grad_norm": 13.066157341003418,
+ "learning_rate": 1.686329597381672e-05,
+ "loss": 0.5469,
+ "step": 10329
+ },
+ {
+ "epoch": 28.147138964577657,
+ "grad_norm": 6.924302577972412,
+ "learning_rate": 1.686265411699831e-05,
+ "loss": 0.4539,
+ "step": 10330
+ },
+ {
+ "epoch": 28.149863760217983,
+ "grad_norm": 7.257571697235107,
+ "learning_rate": 1.6862012206733768e-05,
+ "loss": 0.6908,
+ "step": 10331
+ },
+ {
+ "epoch": 28.152588555858312,
+ "grad_norm": 10.561065673828125,
+ "learning_rate": 1.6861370243028097e-05,
+ "loss": 0.6219,
+ "step": 10332
+ },
+ {
+ "epoch": 28.155313351498638,
+ "grad_norm": 8.823827743530273,
+ "learning_rate": 1.6860728225886295e-05,
+ "loss": 0.4505,
+ "step": 10333
+ },
+ {
+ "epoch": 28.158038147138964,
+ "grad_norm": 6.851810932159424,
+ "learning_rate": 1.6860086155313364e-05,
+ "loss": 0.5002,
+ "step": 10334
+ },
+ {
+ "epoch": 28.160762942779293,
+ "grad_norm": 8.059377670288086,
+ "learning_rate": 1.6859444031314297e-05,
+ "loss": 0.4726,
+ "step": 10335
+ },
+ {
+ "epoch": 28.16348773841962,
+ "grad_norm": 9.536529541015625,
+ "learning_rate": 1.6858801853894105e-05,
+ "loss": 0.3778,
+ "step": 10336
+ },
+ {
+ "epoch": 28.166212534059945,
+ "grad_norm": 6.575474739074707,
+ "learning_rate": 1.6858159623057787e-05,
+ "loss": 0.4834,
+ "step": 10337
+ },
+ {
+ "epoch": 28.168937329700274,
+ "grad_norm": 13.317432403564453,
+ "learning_rate": 1.685751733881034e-05,
+ "loss": 0.4341,
+ "step": 10338
+ },
+ {
+ "epoch": 28.1716621253406,
+ "grad_norm": 8.081430435180664,
+ "learning_rate": 1.685687500115677e-05,
+ "loss": 0.6339,
+ "step": 10339
+ },
+ {
+ "epoch": 28.174386920980925,
+ "grad_norm": 8.51950454711914,
+ "learning_rate": 1.6856232610102074e-05,
+ "loss": 0.5239,
+ "step": 10340
+ },
+ {
+ "epoch": 28.177111716621255,
+ "grad_norm": 9.547775268554688,
+ "learning_rate": 1.6855590165651263e-05,
+ "loss": 0.6049,
+ "step": 10341
+ },
+ {
+ "epoch": 28.17983651226158,
+ "grad_norm": 7.281281471252441,
+ "learning_rate": 1.6854947667809333e-05,
+ "loss": 0.4608,
+ "step": 10342
+ },
+ {
+ "epoch": 28.182561307901906,
+ "grad_norm": 8.876697540283203,
+ "learning_rate": 1.6854305116581294e-05,
+ "loss": 0.5292,
+ "step": 10343
+ },
+ {
+ "epoch": 28.185286103542236,
+ "grad_norm": 7.376714706420898,
+ "learning_rate": 1.685366251197215e-05,
+ "loss": 0.5331,
+ "step": 10344
+ },
+ {
+ "epoch": 28.18801089918256,
+ "grad_norm": 6.850920677185059,
+ "learning_rate": 1.68530198539869e-05,
+ "loss": 0.4112,
+ "step": 10345
+ },
+ {
+ "epoch": 28.190735694822887,
+ "grad_norm": 8.650160789489746,
+ "learning_rate": 1.685237714263055e-05,
+ "loss": 0.7314,
+ "step": 10346
+ },
+ {
+ "epoch": 28.193460490463217,
+ "grad_norm": 14.532156944274902,
+ "learning_rate": 1.6851734377908106e-05,
+ "loss": 0.4206,
+ "step": 10347
+ },
+ {
+ "epoch": 28.196185286103542,
+ "grad_norm": 8.100082397460938,
+ "learning_rate": 1.685109155982458e-05,
+ "loss": 0.5037,
+ "step": 10348
+ },
+ {
+ "epoch": 28.19891008174387,
+ "grad_norm": 6.799877166748047,
+ "learning_rate": 1.6850448688384972e-05,
+ "loss": 0.4937,
+ "step": 10349
+ },
+ {
+ "epoch": 28.201634877384198,
+ "grad_norm": 7.809359550476074,
+ "learning_rate": 1.6849805763594293e-05,
+ "loss": 0.5504,
+ "step": 10350
+ },
+ {
+ "epoch": 28.204359673024523,
+ "grad_norm": 6.646524429321289,
+ "learning_rate": 1.684916278545754e-05,
+ "loss": 0.3853,
+ "step": 10351
+ },
+ {
+ "epoch": 28.20708446866485,
+ "grad_norm": 10.917232513427734,
+ "learning_rate": 1.6848519753979732e-05,
+ "loss": 0.3925,
+ "step": 10352
+ },
+ {
+ "epoch": 28.20980926430518,
+ "grad_norm": 6.854604721069336,
+ "learning_rate": 1.6847876669165874e-05,
+ "loss": 0.56,
+ "step": 10353
+ },
+ {
+ "epoch": 28.212534059945504,
+ "grad_norm": 8.6856689453125,
+ "learning_rate": 1.684723353102097e-05,
+ "loss": 0.5193,
+ "step": 10354
+ },
+ {
+ "epoch": 28.21525885558583,
+ "grad_norm": 7.57242488861084,
+ "learning_rate": 1.684659033955003e-05,
+ "loss": 0.5102,
+ "step": 10355
+ },
+ {
+ "epoch": 28.21798365122616,
+ "grad_norm": 7.709518909454346,
+ "learning_rate": 1.684594709475807e-05,
+ "loss": 0.5396,
+ "step": 10356
+ },
+ {
+ "epoch": 28.220708446866485,
+ "grad_norm": 8.30573558807373,
+ "learning_rate": 1.6845303796650094e-05,
+ "loss": 0.3871,
+ "step": 10357
+ },
+ {
+ "epoch": 28.22343324250681,
+ "grad_norm": 9.018017768859863,
+ "learning_rate": 1.684466044523111e-05,
+ "loss": 0.4784,
+ "step": 10358
+ },
+ {
+ "epoch": 28.22615803814714,
+ "grad_norm": 8.360239028930664,
+ "learning_rate": 1.6844017040506132e-05,
+ "loss": 0.5625,
+ "step": 10359
+ },
+ {
+ "epoch": 28.228882833787466,
+ "grad_norm": 7.19600772857666,
+ "learning_rate": 1.6843373582480168e-05,
+ "loss": 0.3723,
+ "step": 10360
+ },
+ {
+ "epoch": 28.231607629427792,
+ "grad_norm": 26.532180786132812,
+ "learning_rate": 1.684273007115823e-05,
+ "loss": 0.4842,
+ "step": 10361
+ },
+ {
+ "epoch": 28.23433242506812,
+ "grad_norm": 7.297877788543701,
+ "learning_rate": 1.6842086506545334e-05,
+ "loss": 0.3293,
+ "step": 10362
+ },
+ {
+ "epoch": 28.237057220708447,
+ "grad_norm": 10.168774604797363,
+ "learning_rate": 1.6841442888646483e-05,
+ "loss": 0.4346,
+ "step": 10363
+ },
+ {
+ "epoch": 28.239782016348773,
+ "grad_norm": 9.161511421203613,
+ "learning_rate": 1.68407992174667e-05,
+ "loss": 0.527,
+ "step": 10364
+ },
+ {
+ "epoch": 28.242506811989102,
+ "grad_norm": 8.480376243591309,
+ "learning_rate": 1.684015549301099e-05,
+ "loss": 0.4944,
+ "step": 10365
+ },
+ {
+ "epoch": 28.245231607629428,
+ "grad_norm": 8.92908763885498,
+ "learning_rate": 1.6839511715284372e-05,
+ "loss": 0.5138,
+ "step": 10366
+ },
+ {
+ "epoch": 28.247956403269754,
+ "grad_norm": 8.959177017211914,
+ "learning_rate": 1.6838867884291855e-05,
+ "loss": 0.4398,
+ "step": 10367
+ },
+ {
+ "epoch": 28.250681198910083,
+ "grad_norm": 14.875165939331055,
+ "learning_rate": 1.6838224000038455e-05,
+ "loss": 0.5484,
+ "step": 10368
+ },
+ {
+ "epoch": 28.25340599455041,
+ "grad_norm": 7.646803855895996,
+ "learning_rate": 1.683758006252919e-05,
+ "loss": 0.6553,
+ "step": 10369
+ },
+ {
+ "epoch": 28.256130790190735,
+ "grad_norm": 7.4817705154418945,
+ "learning_rate": 1.6836936071769064e-05,
+ "loss": 0.5055,
+ "step": 10370
+ },
+ {
+ "epoch": 28.258855585831064,
+ "grad_norm": 10.627854347229004,
+ "learning_rate": 1.6836292027763102e-05,
+ "loss": 0.453,
+ "step": 10371
+ },
+ {
+ "epoch": 28.26158038147139,
+ "grad_norm": 8.66915512084961,
+ "learning_rate": 1.6835647930516322e-05,
+ "loss": 0.5134,
+ "step": 10372
+ },
+ {
+ "epoch": 28.264305177111716,
+ "grad_norm": 6.920253753662109,
+ "learning_rate": 1.6835003780033738e-05,
+ "loss": 0.5014,
+ "step": 10373
+ },
+ {
+ "epoch": 28.267029972752045,
+ "grad_norm": 8.081284523010254,
+ "learning_rate": 1.6834359576320357e-05,
+ "loss": 0.41,
+ "step": 10374
+ },
+ {
+ "epoch": 28.26975476839237,
+ "grad_norm": 7.855467796325684,
+ "learning_rate": 1.683371531938121e-05,
+ "loss": 0.5132,
+ "step": 10375
+ },
+ {
+ "epoch": 28.272479564032697,
+ "grad_norm": 13.5990629196167,
+ "learning_rate": 1.6833071009221306e-05,
+ "loss": 0.551,
+ "step": 10376
+ },
+ {
+ "epoch": 28.275204359673026,
+ "grad_norm": 11.321314811706543,
+ "learning_rate": 1.683242664584566e-05,
+ "loss": 0.5769,
+ "step": 10377
+ },
+ {
+ "epoch": 28.277929155313352,
+ "grad_norm": 11.942986488342285,
+ "learning_rate": 1.68317822292593e-05,
+ "loss": 0.4187,
+ "step": 10378
+ },
+ {
+ "epoch": 28.280653950953678,
+ "grad_norm": 8.610215187072754,
+ "learning_rate": 1.683113775946724e-05,
+ "loss": 0.6056,
+ "step": 10379
+ },
+ {
+ "epoch": 28.283378746594007,
+ "grad_norm": 8.839770317077637,
+ "learning_rate": 1.6830493236474497e-05,
+ "loss": 0.3628,
+ "step": 10380
+ },
+ {
+ "epoch": 28.286103542234333,
+ "grad_norm": 7.970127105712891,
+ "learning_rate": 1.6829848660286093e-05,
+ "loss": 0.6532,
+ "step": 10381
+ },
+ {
+ "epoch": 28.28882833787466,
+ "grad_norm": 6.654072284698486,
+ "learning_rate": 1.6829204030907045e-05,
+ "loss": 0.5068,
+ "step": 10382
+ },
+ {
+ "epoch": 28.291553133514988,
+ "grad_norm": 9.671961784362793,
+ "learning_rate": 1.6828559348342382e-05,
+ "loss": 0.4399,
+ "step": 10383
+ },
+ {
+ "epoch": 28.294277929155314,
+ "grad_norm": 9.164841651916504,
+ "learning_rate": 1.6827914612597115e-05,
+ "loss": 0.3484,
+ "step": 10384
+ },
+ {
+ "epoch": 28.29700272479564,
+ "grad_norm": 8.438698768615723,
+ "learning_rate": 1.682726982367627e-05,
+ "loss": 0.4659,
+ "step": 10385
+ },
+ {
+ "epoch": 28.29972752043597,
+ "grad_norm": 7.779649257659912,
+ "learning_rate": 1.6826624981584868e-05,
+ "loss": 0.663,
+ "step": 10386
+ },
+ {
+ "epoch": 28.302452316076295,
+ "grad_norm": 7.599969387054443,
+ "learning_rate": 1.6825980086327927e-05,
+ "loss": 0.4323,
+ "step": 10387
+ },
+ {
+ "epoch": 28.30517711171662,
+ "grad_norm": 7.940140724182129,
+ "learning_rate": 1.6825335137910474e-05,
+ "loss": 0.3535,
+ "step": 10388
+ },
+ {
+ "epoch": 28.30790190735695,
+ "grad_norm": 6.6571807861328125,
+ "learning_rate": 1.6824690136337533e-05,
+ "loss": 0.5281,
+ "step": 10389
+ },
+ {
+ "epoch": 28.310626702997276,
+ "grad_norm": 14.657061576843262,
+ "learning_rate": 1.682404508161412e-05,
+ "loss": 0.6565,
+ "step": 10390
+ },
+ {
+ "epoch": 28.3133514986376,
+ "grad_norm": 7.262669563293457,
+ "learning_rate": 1.682339997374527e-05,
+ "loss": 0.5697,
+ "step": 10391
+ },
+ {
+ "epoch": 28.31607629427793,
+ "grad_norm": 7.552542209625244,
+ "learning_rate": 1.6822754812735995e-05,
+ "loss": 0.4747,
+ "step": 10392
+ },
+ {
+ "epoch": 28.318801089918257,
+ "grad_norm": 9.409974098205566,
+ "learning_rate": 1.6822109598591327e-05,
+ "loss": 0.4474,
+ "step": 10393
+ },
+ {
+ "epoch": 28.321525885558582,
+ "grad_norm": 7.490232467651367,
+ "learning_rate": 1.682146433131629e-05,
+ "loss": 0.4171,
+ "step": 10394
+ },
+ {
+ "epoch": 28.32425068119891,
+ "grad_norm": 10.111641883850098,
+ "learning_rate": 1.682081901091591e-05,
+ "loss": 0.4914,
+ "step": 10395
+ },
+ {
+ "epoch": 28.326975476839237,
+ "grad_norm": 8.32813835144043,
+ "learning_rate": 1.6820173637395208e-05,
+ "loss": 0.5367,
+ "step": 10396
+ },
+ {
+ "epoch": 28.329700272479563,
+ "grad_norm": 6.854457378387451,
+ "learning_rate": 1.6819528210759216e-05,
+ "loss": 0.4817,
+ "step": 10397
+ },
+ {
+ "epoch": 28.332425068119893,
+ "grad_norm": 7.725712299346924,
+ "learning_rate": 1.6818882731012954e-05,
+ "loss": 0.6059,
+ "step": 10398
+ },
+ {
+ "epoch": 28.33514986376022,
+ "grad_norm": 6.47776460647583,
+ "learning_rate": 1.6818237198161456e-05,
+ "loss": 0.6245,
+ "step": 10399
+ },
+ {
+ "epoch": 28.337874659400544,
+ "grad_norm": 7.381679534912109,
+ "learning_rate": 1.6817591612209744e-05,
+ "loss": 0.4849,
+ "step": 10400
+ },
+ {
+ "epoch": 28.340599455040874,
+ "grad_norm": 7.378352642059326,
+ "learning_rate": 1.681694597316285e-05,
+ "loss": 0.4969,
+ "step": 10401
+ },
+ {
+ "epoch": 28.3433242506812,
+ "grad_norm": 6.980203628540039,
+ "learning_rate": 1.6816300281025796e-05,
+ "loss": 0.5902,
+ "step": 10402
+ },
+ {
+ "epoch": 28.346049046321525,
+ "grad_norm": 9.453960418701172,
+ "learning_rate": 1.681565453580362e-05,
+ "loss": 0.5278,
+ "step": 10403
+ },
+ {
+ "epoch": 28.348773841961854,
+ "grad_norm": 7.603379726409912,
+ "learning_rate": 1.681500873750134e-05,
+ "loss": 0.5557,
+ "step": 10404
+ },
+ {
+ "epoch": 28.35149863760218,
+ "grad_norm": 7.9871039390563965,
+ "learning_rate": 1.6814362886123994e-05,
+ "loss": 0.4535,
+ "step": 10405
+ },
+ {
+ "epoch": 28.354223433242506,
+ "grad_norm": 8.485020637512207,
+ "learning_rate": 1.6813716981676612e-05,
+ "loss": 0.5384,
+ "step": 10406
+ },
+ {
+ "epoch": 28.356948228882835,
+ "grad_norm": 7.360891819000244,
+ "learning_rate": 1.681307102416422e-05,
+ "loss": 0.4211,
+ "step": 10407
+ },
+ {
+ "epoch": 28.35967302452316,
+ "grad_norm": 8.2415771484375,
+ "learning_rate": 1.681242501359185e-05,
+ "loss": 0.4482,
+ "step": 10408
+ },
+ {
+ "epoch": 28.362397820163487,
+ "grad_norm": 7.84987735748291,
+ "learning_rate": 1.681177894996453e-05,
+ "loss": 0.5217,
+ "step": 10409
+ },
+ {
+ "epoch": 28.365122615803816,
+ "grad_norm": 11.041234970092773,
+ "learning_rate": 1.6811132833287296e-05,
+ "loss": 0.5422,
+ "step": 10410
+ },
+ {
+ "epoch": 28.367847411444142,
+ "grad_norm": 9.216878890991211,
+ "learning_rate": 1.6810486663565183e-05,
+ "loss": 0.4366,
+ "step": 10411
+ },
+ {
+ "epoch": 28.370572207084468,
+ "grad_norm": 8.009267807006836,
+ "learning_rate": 1.680984044080322e-05,
+ "loss": 0.6246,
+ "step": 10412
+ },
+ {
+ "epoch": 28.373297002724797,
+ "grad_norm": 8.616374969482422,
+ "learning_rate": 1.680919416500643e-05,
+ "loss": 0.4103,
+ "step": 10413
+ },
+ {
+ "epoch": 28.376021798365123,
+ "grad_norm": 8.781277656555176,
+ "learning_rate": 1.6808547836179862e-05,
+ "loss": 0.5015,
+ "step": 10414
+ },
+ {
+ "epoch": 28.37874659400545,
+ "grad_norm": 7.765417098999023,
+ "learning_rate": 1.680790145432854e-05,
+ "loss": 0.5505,
+ "step": 10415
+ },
+ {
+ "epoch": 28.381471389645778,
+ "grad_norm": 6.382985591888428,
+ "learning_rate": 1.6807255019457503e-05,
+ "loss": 0.3701,
+ "step": 10416
+ },
+ {
+ "epoch": 28.384196185286104,
+ "grad_norm": 8.345076560974121,
+ "learning_rate": 1.680660853157178e-05,
+ "loss": 0.5445,
+ "step": 10417
+ },
+ {
+ "epoch": 28.38692098092643,
+ "grad_norm": 6.24092960357666,
+ "learning_rate": 1.680596199067641e-05,
+ "loss": 0.5378,
+ "step": 10418
+ },
+ {
+ "epoch": 28.38964577656676,
+ "grad_norm": 8.847549438476562,
+ "learning_rate": 1.6805315396776427e-05,
+ "loss": 0.5143,
+ "step": 10419
+ },
+ {
+ "epoch": 28.392370572207085,
+ "grad_norm": 8.919387817382812,
+ "learning_rate": 1.6804668749876867e-05,
+ "loss": 0.5549,
+ "step": 10420
+ },
+ {
+ "epoch": 28.39509536784741,
+ "grad_norm": 8.392271995544434,
+ "learning_rate": 1.6804022049982768e-05,
+ "loss": 0.5368,
+ "step": 10421
+ },
+ {
+ "epoch": 28.39782016348774,
+ "grad_norm": 8.466325759887695,
+ "learning_rate": 1.6803375297099162e-05,
+ "loss": 0.4869,
+ "step": 10422
+ },
+ {
+ "epoch": 28.400544959128066,
+ "grad_norm": 7.85569953918457,
+ "learning_rate": 1.6802728491231083e-05,
+ "loss": 0.407,
+ "step": 10423
+ },
+ {
+ "epoch": 28.40326975476839,
+ "grad_norm": 9.220958709716797,
+ "learning_rate": 1.680208163238358e-05,
+ "loss": 0.4977,
+ "step": 10424
+ },
+ {
+ "epoch": 28.40599455040872,
+ "grad_norm": 7.3440141677856445,
+ "learning_rate": 1.6801434720561683e-05,
+ "loss": 0.576,
+ "step": 10425
+ },
+ {
+ "epoch": 28.408719346049047,
+ "grad_norm": 6.604451656341553,
+ "learning_rate": 1.680078775577043e-05,
+ "loss": 0.481,
+ "step": 10426
+ },
+ {
+ "epoch": 28.411444141689373,
+ "grad_norm": 6.42094612121582,
+ "learning_rate": 1.680014073801486e-05,
+ "loss": 0.4882,
+ "step": 10427
+ },
+ {
+ "epoch": 28.414168937329702,
+ "grad_norm": 8.168827056884766,
+ "learning_rate": 1.6799493667300018e-05,
+ "loss": 0.4686,
+ "step": 10428
+ },
+ {
+ "epoch": 28.416893732970028,
+ "grad_norm": 7.647387504577637,
+ "learning_rate": 1.6798846543630934e-05,
+ "loss": 0.47,
+ "step": 10429
+ },
+ {
+ "epoch": 28.419618528610354,
+ "grad_norm": 8.366386413574219,
+ "learning_rate": 1.6798199367012652e-05,
+ "loss": 0.4745,
+ "step": 10430
+ },
+ {
+ "epoch": 28.422343324250683,
+ "grad_norm": 8.590060234069824,
+ "learning_rate": 1.6797552137450214e-05,
+ "loss": 0.514,
+ "step": 10431
+ },
+ {
+ "epoch": 28.42506811989101,
+ "grad_norm": 6.036066055297852,
+ "learning_rate": 1.6796904854948656e-05,
+ "loss": 0.4146,
+ "step": 10432
+ },
+ {
+ "epoch": 28.427792915531334,
+ "grad_norm": 8.050939559936523,
+ "learning_rate": 1.6796257519513024e-05,
+ "loss": 0.457,
+ "step": 10433
+ },
+ {
+ "epoch": 28.430517711171664,
+ "grad_norm": 11.273110389709473,
+ "learning_rate": 1.6795610131148357e-05,
+ "loss": 0.663,
+ "step": 10434
+ },
+ {
+ "epoch": 28.43324250681199,
+ "grad_norm": 7.349226951599121,
+ "learning_rate": 1.6794962689859696e-05,
+ "loss": 0.5003,
+ "step": 10435
+ },
+ {
+ "epoch": 28.435967302452315,
+ "grad_norm": 7.010150909423828,
+ "learning_rate": 1.6794315195652085e-05,
+ "loss": 0.4498,
+ "step": 10436
+ },
+ {
+ "epoch": 28.438692098092645,
+ "grad_norm": 8.3838529586792,
+ "learning_rate": 1.6793667648530567e-05,
+ "loss": 0.5936,
+ "step": 10437
+ },
+ {
+ "epoch": 28.44141689373297,
+ "grad_norm": 25.742835998535156,
+ "learning_rate": 1.6793020048500183e-05,
+ "loss": 0.4208,
+ "step": 10438
+ },
+ {
+ "epoch": 28.444141689373296,
+ "grad_norm": 7.778672218322754,
+ "learning_rate": 1.6792372395565978e-05,
+ "loss": 0.7396,
+ "step": 10439
+ },
+ {
+ "epoch": 28.446866485013626,
+ "grad_norm": 7.268556594848633,
+ "learning_rate": 1.6791724689732992e-05,
+ "loss": 0.6994,
+ "step": 10440
+ },
+ {
+ "epoch": 28.44959128065395,
+ "grad_norm": 8.157234191894531,
+ "learning_rate": 1.6791076931006276e-05,
+ "loss": 0.4328,
+ "step": 10441
+ },
+ {
+ "epoch": 28.452316076294277,
+ "grad_norm": 7.949583530426025,
+ "learning_rate": 1.679042911939087e-05,
+ "loss": 0.3544,
+ "step": 10442
+ },
+ {
+ "epoch": 28.455040871934607,
+ "grad_norm": 6.344139575958252,
+ "learning_rate": 1.6789781254891822e-05,
+ "loss": 0.4261,
+ "step": 10443
+ },
+ {
+ "epoch": 28.457765667574932,
+ "grad_norm": 13.322134017944336,
+ "learning_rate": 1.6789133337514178e-05,
+ "loss": 0.562,
+ "step": 10444
+ },
+ {
+ "epoch": 28.460490463215258,
+ "grad_norm": 7.682892322540283,
+ "learning_rate": 1.6788485367262975e-05,
+ "loss": 0.6436,
+ "step": 10445
+ },
+ {
+ "epoch": 28.463215258855588,
+ "grad_norm": 10.428749084472656,
+ "learning_rate": 1.6787837344143273e-05,
+ "loss": 0.6119,
+ "step": 10446
+ },
+ {
+ "epoch": 28.465940054495913,
+ "grad_norm": 11.043083190917969,
+ "learning_rate": 1.678718926816011e-05,
+ "loss": 0.5913,
+ "step": 10447
+ },
+ {
+ "epoch": 28.46866485013624,
+ "grad_norm": 8.230341911315918,
+ "learning_rate": 1.6786541139318537e-05,
+ "loss": 0.4512,
+ "step": 10448
+ },
+ {
+ "epoch": 28.47138964577657,
+ "grad_norm": 7.745244026184082,
+ "learning_rate": 1.6785892957623598e-05,
+ "loss": 0.5378,
+ "step": 10449
+ },
+ {
+ "epoch": 28.474114441416894,
+ "grad_norm": 18.82840347290039,
+ "learning_rate": 1.678524472308034e-05,
+ "loss": 0.4413,
+ "step": 10450
+ },
+ {
+ "epoch": 28.47683923705722,
+ "grad_norm": 6.365556240081787,
+ "learning_rate": 1.678459643569382e-05,
+ "loss": 0.5273,
+ "step": 10451
+ },
+ {
+ "epoch": 28.479564032697546,
+ "grad_norm": 5.9933037757873535,
+ "learning_rate": 1.6783948095469082e-05,
+ "loss": 0.3474,
+ "step": 10452
+ },
+ {
+ "epoch": 28.482288828337875,
+ "grad_norm": 9.864625930786133,
+ "learning_rate": 1.678329970241117e-05,
+ "loss": 0.4769,
+ "step": 10453
+ },
+ {
+ "epoch": 28.4850136239782,
+ "grad_norm": 7.456377029418945,
+ "learning_rate": 1.678265125652514e-05,
+ "loss": 0.5831,
+ "step": 10454
+ },
+ {
+ "epoch": 28.48773841961853,
+ "grad_norm": 8.414080619812012,
+ "learning_rate": 1.6782002757816043e-05,
+ "loss": 0.5112,
+ "step": 10455
+ },
+ {
+ "epoch": 28.490463215258856,
+ "grad_norm": 14.215851783752441,
+ "learning_rate": 1.6781354206288924e-05,
+ "loss": 0.5678,
+ "step": 10456
+ },
+ {
+ "epoch": 28.493188010899182,
+ "grad_norm": 8.581607818603516,
+ "learning_rate": 1.6780705601948833e-05,
+ "loss": 0.4189,
+ "step": 10457
+ },
+ {
+ "epoch": 28.495912806539508,
+ "grad_norm": 10.440707206726074,
+ "learning_rate": 1.6780056944800833e-05,
+ "loss": 0.4722,
+ "step": 10458
+ },
+ {
+ "epoch": 28.498637602179837,
+ "grad_norm": 8.628376960754395,
+ "learning_rate": 1.6779408234849964e-05,
+ "loss": 0.4987,
+ "step": 10459
+ },
+ {
+ "epoch": 28.501362397820163,
+ "grad_norm": 9.071776390075684,
+ "learning_rate": 1.677875947210128e-05,
+ "loss": 0.5309,
+ "step": 10460
+ },
+ {
+ "epoch": 28.504087193460492,
+ "grad_norm": 52.496681213378906,
+ "learning_rate": 1.6778110656559837e-05,
+ "loss": 0.4279,
+ "step": 10461
+ },
+ {
+ "epoch": 28.506811989100818,
+ "grad_norm": 9.852365493774414,
+ "learning_rate": 1.677746178823069e-05,
+ "loss": 0.5231,
+ "step": 10462
+ },
+ {
+ "epoch": 28.509536784741144,
+ "grad_norm": 7.248706340789795,
+ "learning_rate": 1.6776812867118885e-05,
+ "loss": 0.5611,
+ "step": 10463
+ },
+ {
+ "epoch": 28.51226158038147,
+ "grad_norm": 12.963179588317871,
+ "learning_rate": 1.6776163893229476e-05,
+ "loss": 0.4556,
+ "step": 10464
+ },
+ {
+ "epoch": 28.5149863760218,
+ "grad_norm": 8.917076110839844,
+ "learning_rate": 1.6775514866567527e-05,
+ "loss": 0.6695,
+ "step": 10465
+ },
+ {
+ "epoch": 28.517711171662125,
+ "grad_norm": 10.566930770874023,
+ "learning_rate": 1.677486578713808e-05,
+ "loss": 0.4056,
+ "step": 10466
+ },
+ {
+ "epoch": 28.520435967302454,
+ "grad_norm": 9.388032913208008,
+ "learning_rate": 1.6774216654946203e-05,
+ "loss": 0.4838,
+ "step": 10467
+ },
+ {
+ "epoch": 28.52316076294278,
+ "grad_norm": 16.75680160522461,
+ "learning_rate": 1.677356746999694e-05,
+ "loss": 0.5612,
+ "step": 10468
+ },
+ {
+ "epoch": 28.525885558583106,
+ "grad_norm": 8.811739921569824,
+ "learning_rate": 1.6772918232295353e-05,
+ "loss": 0.4979,
+ "step": 10469
+ },
+ {
+ "epoch": 28.52861035422343,
+ "grad_norm": 13.264880180358887,
+ "learning_rate": 1.6772268941846496e-05,
+ "loss": 0.4393,
+ "step": 10470
+ },
+ {
+ "epoch": 28.53133514986376,
+ "grad_norm": 7.859387397766113,
+ "learning_rate": 1.6771619598655432e-05,
+ "loss": 0.4305,
+ "step": 10471
+ },
+ {
+ "epoch": 28.534059945504087,
+ "grad_norm": 7.618261814117432,
+ "learning_rate": 1.6770970202727206e-05,
+ "loss": 0.6329,
+ "step": 10472
+ },
+ {
+ "epoch": 28.536784741144416,
+ "grad_norm": 9.38042163848877,
+ "learning_rate": 1.6770320754066886e-05,
+ "loss": 0.6401,
+ "step": 10473
+ },
+ {
+ "epoch": 28.539509536784742,
+ "grad_norm": 9.186793327331543,
+ "learning_rate": 1.676967125267952e-05,
+ "loss": 0.4864,
+ "step": 10474
+ },
+ {
+ "epoch": 28.542234332425068,
+ "grad_norm": 8.843674659729004,
+ "learning_rate": 1.6769021698570178e-05,
+ "loss": 0.5904,
+ "step": 10475
+ },
+ {
+ "epoch": 28.544959128065393,
+ "grad_norm": 8.38227367401123,
+ "learning_rate": 1.676837209174391e-05,
+ "loss": 0.4263,
+ "step": 10476
+ },
+ {
+ "epoch": 28.547683923705723,
+ "grad_norm": 7.939977169036865,
+ "learning_rate": 1.676772243220578e-05,
+ "loss": 0.5242,
+ "step": 10477
+ },
+ {
+ "epoch": 28.55040871934605,
+ "grad_norm": 15.47470760345459,
+ "learning_rate": 1.6767072719960845e-05,
+ "loss": 0.5037,
+ "step": 10478
+ },
+ {
+ "epoch": 28.553133514986374,
+ "grad_norm": 9.203507423400879,
+ "learning_rate": 1.6766422955014164e-05,
+ "loss": 0.467,
+ "step": 10479
+ },
+ {
+ "epoch": 28.555858310626704,
+ "grad_norm": 7.513101577758789,
+ "learning_rate": 1.67657731373708e-05,
+ "loss": 0.6239,
+ "step": 10480
+ },
+ {
+ "epoch": 28.55858310626703,
+ "grad_norm": 12.132689476013184,
+ "learning_rate": 1.6765123267035813e-05,
+ "loss": 0.6172,
+ "step": 10481
+ },
+ {
+ "epoch": 28.561307901907355,
+ "grad_norm": 8.619035720825195,
+ "learning_rate": 1.6764473344014264e-05,
+ "loss": 0.4727,
+ "step": 10482
+ },
+ {
+ "epoch": 28.564032697547685,
+ "grad_norm": 7.933316230773926,
+ "learning_rate": 1.6763823368311213e-05,
+ "loss": 0.4595,
+ "step": 10483
+ },
+ {
+ "epoch": 28.56675749318801,
+ "grad_norm": 9.0542573928833,
+ "learning_rate": 1.6763173339931718e-05,
+ "loss": 0.3766,
+ "step": 10484
+ },
+ {
+ "epoch": 28.569482288828336,
+ "grad_norm": 12.085680961608887,
+ "learning_rate": 1.6762523258880855e-05,
+ "loss": 0.4951,
+ "step": 10485
+ },
+ {
+ "epoch": 28.572207084468666,
+ "grad_norm": 8.230812072753906,
+ "learning_rate": 1.6761873125163676e-05,
+ "loss": 0.4879,
+ "step": 10486
+ },
+ {
+ "epoch": 28.57493188010899,
+ "grad_norm": 13.951199531555176,
+ "learning_rate": 1.6761222938785245e-05,
+ "loss": 0.3983,
+ "step": 10487
+ },
+ {
+ "epoch": 28.577656675749317,
+ "grad_norm": 8.826639175415039,
+ "learning_rate": 1.676057269975063e-05,
+ "loss": 0.5461,
+ "step": 10488
+ },
+ {
+ "epoch": 28.580381471389646,
+ "grad_norm": 10.449169158935547,
+ "learning_rate": 1.675992240806489e-05,
+ "loss": 0.4296,
+ "step": 10489
+ },
+ {
+ "epoch": 28.583106267029972,
+ "grad_norm": 6.757328510284424,
+ "learning_rate": 1.6759272063733094e-05,
+ "loss": 0.549,
+ "step": 10490
+ },
+ {
+ "epoch": 28.585831062670298,
+ "grad_norm": 9.143452644348145,
+ "learning_rate": 1.6758621666760304e-05,
+ "loss": 0.4813,
+ "step": 10491
+ },
+ {
+ "epoch": 28.588555858310627,
+ "grad_norm": 36.08699417114258,
+ "learning_rate": 1.675797121715159e-05,
+ "loss": 0.4719,
+ "step": 10492
+ },
+ {
+ "epoch": 28.591280653950953,
+ "grad_norm": 12.879393577575684,
+ "learning_rate": 1.6757320714912007e-05,
+ "loss": 0.4965,
+ "step": 10493
+ },
+ {
+ "epoch": 28.59400544959128,
+ "grad_norm": 8.112102508544922,
+ "learning_rate": 1.6756670160046628e-05,
+ "loss": 0.4584,
+ "step": 10494
+ },
+ {
+ "epoch": 28.59673024523161,
+ "grad_norm": 6.9734392166137695,
+ "learning_rate": 1.6756019552560522e-05,
+ "loss": 0.5682,
+ "step": 10495
+ },
+ {
+ "epoch": 28.599455040871934,
+ "grad_norm": 7.311095714569092,
+ "learning_rate": 1.6755368892458753e-05,
+ "loss": 0.5016,
+ "step": 10496
+ },
+ {
+ "epoch": 28.60217983651226,
+ "grad_norm": 8.643707275390625,
+ "learning_rate": 1.675471817974639e-05,
+ "loss": 0.6283,
+ "step": 10497
+ },
+ {
+ "epoch": 28.60490463215259,
+ "grad_norm": 7.092410564422607,
+ "learning_rate": 1.6754067414428497e-05,
+ "loss": 0.6003,
+ "step": 10498
+ },
+ {
+ "epoch": 28.607629427792915,
+ "grad_norm": 9.788068771362305,
+ "learning_rate": 1.6753416596510144e-05,
+ "loss": 0.45,
+ "step": 10499
+ },
+ {
+ "epoch": 28.61035422343324,
+ "grad_norm": 9.50992488861084,
+ "learning_rate": 1.6752765725996402e-05,
+ "loss": 0.5356,
+ "step": 10500
+ },
+ {
+ "epoch": 28.61307901907357,
+ "grad_norm": 7.4705281257629395,
+ "learning_rate": 1.6752114802892332e-05,
+ "loss": 0.5111,
+ "step": 10501
+ },
+ {
+ "epoch": 28.615803814713896,
+ "grad_norm": 12.41318416595459,
+ "learning_rate": 1.6751463827203018e-05,
+ "loss": 0.4525,
+ "step": 10502
+ },
+ {
+ "epoch": 28.618528610354222,
+ "grad_norm": 10.357723236083984,
+ "learning_rate": 1.6750812798933512e-05,
+ "loss": 0.6619,
+ "step": 10503
+ },
+ {
+ "epoch": 28.62125340599455,
+ "grad_norm": 8.30016803741455,
+ "learning_rate": 1.6750161718088902e-05,
+ "loss": 0.4381,
+ "step": 10504
+ },
+ {
+ "epoch": 28.623978201634877,
+ "grad_norm": 9.020997047424316,
+ "learning_rate": 1.6749510584674243e-05,
+ "loss": 0.4266,
+ "step": 10505
+ },
+ {
+ "epoch": 28.626702997275203,
+ "grad_norm": 7.495340347290039,
+ "learning_rate": 1.6748859398694616e-05,
+ "loss": 0.3745,
+ "step": 10506
+ },
+ {
+ "epoch": 28.629427792915532,
+ "grad_norm": 11.160477638244629,
+ "learning_rate": 1.674820816015509e-05,
+ "loss": 0.4176,
+ "step": 10507
+ },
+ {
+ "epoch": 28.632152588555858,
+ "grad_norm": 9.42709732055664,
+ "learning_rate": 1.6747556869060735e-05,
+ "loss": 0.5268,
+ "step": 10508
+ },
+ {
+ "epoch": 28.634877384196184,
+ "grad_norm": 7.919163227081299,
+ "learning_rate": 1.6746905525416625e-05,
+ "loss": 0.39,
+ "step": 10509
+ },
+ {
+ "epoch": 28.637602179836513,
+ "grad_norm": 10.078733444213867,
+ "learning_rate": 1.674625412922783e-05,
+ "loss": 0.5568,
+ "step": 10510
+ },
+ {
+ "epoch": 28.64032697547684,
+ "grad_norm": 9.338096618652344,
+ "learning_rate": 1.6745602680499426e-05,
+ "loss": 0.5707,
+ "step": 10511
+ },
+ {
+ "epoch": 28.643051771117165,
+ "grad_norm": 8.589585304260254,
+ "learning_rate": 1.6744951179236487e-05,
+ "loss": 0.5765,
+ "step": 10512
+ },
+ {
+ "epoch": 28.645776566757494,
+ "grad_norm": 8.227743148803711,
+ "learning_rate": 1.6744299625444082e-05,
+ "loss": 0.4916,
+ "step": 10513
+ },
+ {
+ "epoch": 28.64850136239782,
+ "grad_norm": 12.171733856201172,
+ "learning_rate": 1.674364801912729e-05,
+ "loss": 0.5273,
+ "step": 10514
+ },
+ {
+ "epoch": 28.651226158038146,
+ "grad_norm": 8.201462745666504,
+ "learning_rate": 1.6742996360291184e-05,
+ "loss": 0.5538,
+ "step": 10515
+ },
+ {
+ "epoch": 28.653950953678475,
+ "grad_norm": 7.957534313201904,
+ "learning_rate": 1.674234464894084e-05,
+ "loss": 0.4372,
+ "step": 10516
+ },
+ {
+ "epoch": 28.6566757493188,
+ "grad_norm": 11.711692810058594,
+ "learning_rate": 1.6741692885081333e-05,
+ "loss": 0.535,
+ "step": 10517
+ },
+ {
+ "epoch": 28.659400544959126,
+ "grad_norm": 7.344912052154541,
+ "learning_rate": 1.6741041068717737e-05,
+ "loss": 0.578,
+ "step": 10518
+ },
+ {
+ "epoch": 28.662125340599456,
+ "grad_norm": 17.266468048095703,
+ "learning_rate": 1.674038919985513e-05,
+ "loss": 0.4063,
+ "step": 10519
+ },
+ {
+ "epoch": 28.66485013623978,
+ "grad_norm": 7.3692626953125,
+ "learning_rate": 1.6739737278498595e-05,
+ "loss": 0.5085,
+ "step": 10520
+ },
+ {
+ "epoch": 28.667574931880107,
+ "grad_norm": 8.309320449829102,
+ "learning_rate": 1.6739085304653197e-05,
+ "loss": 0.4993,
+ "step": 10521
+ },
+ {
+ "epoch": 28.670299727520437,
+ "grad_norm": 9.00151538848877,
+ "learning_rate": 1.673843327832402e-05,
+ "loss": 0.5508,
+ "step": 10522
+ },
+ {
+ "epoch": 28.673024523160763,
+ "grad_norm": 7.283410549163818,
+ "learning_rate": 1.6737781199516143e-05,
+ "loss": 0.481,
+ "step": 10523
+ },
+ {
+ "epoch": 28.67574931880109,
+ "grad_norm": 9.720575332641602,
+ "learning_rate": 1.6737129068234642e-05,
+ "loss": 0.5471,
+ "step": 10524
+ },
+ {
+ "epoch": 28.678474114441418,
+ "grad_norm": 7.802993297576904,
+ "learning_rate": 1.67364768844846e-05,
+ "loss": 0.6346,
+ "step": 10525
+ },
+ {
+ "epoch": 28.681198910081743,
+ "grad_norm": 9.069677352905273,
+ "learning_rate": 1.6735824648271085e-05,
+ "loss": 0.442,
+ "step": 10526
+ },
+ {
+ "epoch": 28.68392370572207,
+ "grad_norm": 12.54915714263916,
+ "learning_rate": 1.6735172359599193e-05,
+ "loss": 0.7076,
+ "step": 10527
+ },
+ {
+ "epoch": 28.6866485013624,
+ "grad_norm": 7.4631853103637695,
+ "learning_rate": 1.673452001847399e-05,
+ "loss": 0.5363,
+ "step": 10528
+ },
+ {
+ "epoch": 28.689373297002724,
+ "grad_norm": 7.945371627807617,
+ "learning_rate": 1.6733867624900565e-05,
+ "loss": 0.5799,
+ "step": 10529
+ },
+ {
+ "epoch": 28.69209809264305,
+ "grad_norm": 8.726821899414062,
+ "learning_rate": 1.6733215178883996e-05,
+ "loss": 0.4099,
+ "step": 10530
+ },
+ {
+ "epoch": 28.69482288828338,
+ "grad_norm": 7.770522594451904,
+ "learning_rate": 1.6732562680429358e-05,
+ "loss": 0.4289,
+ "step": 10531
+ },
+ {
+ "epoch": 28.697547683923705,
+ "grad_norm": 7.258590221405029,
+ "learning_rate": 1.6731910129541745e-05,
+ "loss": 0.5604,
+ "step": 10532
+ },
+ {
+ "epoch": 28.70027247956403,
+ "grad_norm": 7.198451995849609,
+ "learning_rate": 1.673125752622623e-05,
+ "loss": 0.5089,
+ "step": 10533
+ },
+ {
+ "epoch": 28.70299727520436,
+ "grad_norm": 7.6721882820129395,
+ "learning_rate": 1.67306048704879e-05,
+ "loss": 0.4549,
+ "step": 10534
+ },
+ {
+ "epoch": 28.705722070844686,
+ "grad_norm": 9.911489486694336,
+ "learning_rate": 1.672995216233183e-05,
+ "loss": 0.5649,
+ "step": 10535
+ },
+ {
+ "epoch": 28.708446866485012,
+ "grad_norm": 8.163591384887695,
+ "learning_rate": 1.6729299401763116e-05,
+ "loss": 0.4192,
+ "step": 10536
+ },
+ {
+ "epoch": 28.71117166212534,
+ "grad_norm": 8.404854774475098,
+ "learning_rate": 1.672864658878683e-05,
+ "loss": 0.4542,
+ "step": 10537
+ },
+ {
+ "epoch": 28.713896457765667,
+ "grad_norm": 8.87028694152832,
+ "learning_rate": 1.6727993723408066e-05,
+ "loss": 0.4514,
+ "step": 10538
+ },
+ {
+ "epoch": 28.716621253405993,
+ "grad_norm": 10.431681632995605,
+ "learning_rate": 1.67273408056319e-05,
+ "loss": 0.4138,
+ "step": 10539
+ },
+ {
+ "epoch": 28.719346049046322,
+ "grad_norm": 8.951879501342773,
+ "learning_rate": 1.672668783546342e-05,
+ "loss": 0.5924,
+ "step": 10540
+ },
+ {
+ "epoch": 28.722070844686648,
+ "grad_norm": 14.982688903808594,
+ "learning_rate": 1.6726034812907713e-05,
+ "loss": 0.4955,
+ "step": 10541
+ },
+ {
+ "epoch": 28.724795640326974,
+ "grad_norm": 12.39867115020752,
+ "learning_rate": 1.672538173796986e-05,
+ "loss": 0.5046,
+ "step": 10542
+ },
+ {
+ "epoch": 28.727520435967303,
+ "grad_norm": 8.843228340148926,
+ "learning_rate": 1.6724728610654955e-05,
+ "loss": 0.4193,
+ "step": 10543
+ },
+ {
+ "epoch": 28.73024523160763,
+ "grad_norm": 8.99812126159668,
+ "learning_rate": 1.672407543096808e-05,
+ "loss": 0.4847,
+ "step": 10544
+ },
+ {
+ "epoch": 28.732970027247955,
+ "grad_norm": 7.509914398193359,
+ "learning_rate": 1.6723422198914317e-05,
+ "loss": 0.448,
+ "step": 10545
+ },
+ {
+ "epoch": 28.735694822888284,
+ "grad_norm": 7.077925682067871,
+ "learning_rate": 1.6722768914498763e-05,
+ "loss": 0.3459,
+ "step": 10546
+ },
+ {
+ "epoch": 28.73841961852861,
+ "grad_norm": 13.859886169433594,
+ "learning_rate": 1.6722115577726497e-05,
+ "loss": 0.6188,
+ "step": 10547
+ },
+ {
+ "epoch": 28.741144414168936,
+ "grad_norm": 8.113566398620605,
+ "learning_rate": 1.6721462188602618e-05,
+ "loss": 0.4128,
+ "step": 10548
+ },
+ {
+ "epoch": 28.743869209809265,
+ "grad_norm": 7.334417819976807,
+ "learning_rate": 1.6720808747132204e-05,
+ "loss": 0.3771,
+ "step": 10549
+ },
+ {
+ "epoch": 28.74659400544959,
+ "grad_norm": 7.81968879699707,
+ "learning_rate": 1.6720155253320348e-05,
+ "loss": 0.4758,
+ "step": 10550
+ },
+ {
+ "epoch": 28.749318801089917,
+ "grad_norm": 7.863037586212158,
+ "learning_rate": 1.6719501707172135e-05,
+ "loss": 0.3486,
+ "step": 10551
+ },
+ {
+ "epoch": 28.752043596730246,
+ "grad_norm": 7.974241256713867,
+ "learning_rate": 1.6718848108692665e-05,
+ "loss": 0.5805,
+ "step": 10552
+ },
+ {
+ "epoch": 28.754768392370572,
+ "grad_norm": 14.860568046569824,
+ "learning_rate": 1.671819445788702e-05,
+ "loss": 0.562,
+ "step": 10553
+ },
+ {
+ "epoch": 28.757493188010898,
+ "grad_norm": 7.626082420349121,
+ "learning_rate": 1.671754075476029e-05,
+ "loss": 0.6777,
+ "step": 10554
+ },
+ {
+ "epoch": 28.760217983651227,
+ "grad_norm": 8.53664779663086,
+ "learning_rate": 1.6716886999317573e-05,
+ "loss": 0.4551,
+ "step": 10555
+ },
+ {
+ "epoch": 28.762942779291553,
+ "grad_norm": 8.117570877075195,
+ "learning_rate": 1.6716233191563956e-05,
+ "loss": 0.4374,
+ "step": 10556
+ },
+ {
+ "epoch": 28.76566757493188,
+ "grad_norm": 9.303681373596191,
+ "learning_rate": 1.671557933150453e-05,
+ "loss": 0.5538,
+ "step": 10557
+ },
+ {
+ "epoch": 28.768392370572208,
+ "grad_norm": 10.377424240112305,
+ "learning_rate": 1.6714925419144384e-05,
+ "loss": 0.5431,
+ "step": 10558
+ },
+ {
+ "epoch": 28.771117166212534,
+ "grad_norm": 10.983673095703125,
+ "learning_rate": 1.671427145448862e-05,
+ "loss": 0.4244,
+ "step": 10559
+ },
+ {
+ "epoch": 28.77384196185286,
+ "grad_norm": 8.11573314666748,
+ "learning_rate": 1.6713617437542328e-05,
+ "loss": 0.3999,
+ "step": 10560
+ },
+ {
+ "epoch": 28.77656675749319,
+ "grad_norm": 18.627511978149414,
+ "learning_rate": 1.6712963368310596e-05,
+ "loss": 0.6816,
+ "step": 10561
+ },
+ {
+ "epoch": 28.779291553133515,
+ "grad_norm": 7.47135591506958,
+ "learning_rate": 1.671230924679852e-05,
+ "loss": 0.6332,
+ "step": 10562
+ },
+ {
+ "epoch": 28.78201634877384,
+ "grad_norm": 8.145977973937988,
+ "learning_rate": 1.6711655073011196e-05,
+ "loss": 0.5015,
+ "step": 10563
+ },
+ {
+ "epoch": 28.78474114441417,
+ "grad_norm": 7.705799102783203,
+ "learning_rate": 1.6711000846953722e-05,
+ "loss": 0.5104,
+ "step": 10564
+ },
+ {
+ "epoch": 28.787465940054496,
+ "grad_norm": 6.46087121963501,
+ "learning_rate": 1.671034656863119e-05,
+ "loss": 0.6451,
+ "step": 10565
+ },
+ {
+ "epoch": 28.79019073569482,
+ "grad_norm": 7.06374454498291,
+ "learning_rate": 1.6709692238048688e-05,
+ "loss": 0.4239,
+ "step": 10566
+ },
+ {
+ "epoch": 28.79291553133515,
+ "grad_norm": 20.436994552612305,
+ "learning_rate": 1.670903785521132e-05,
+ "loss": 0.5519,
+ "step": 10567
+ },
+ {
+ "epoch": 28.795640326975477,
+ "grad_norm": 8.40551471710205,
+ "learning_rate": 1.670838342012419e-05,
+ "loss": 0.4232,
+ "step": 10568
+ },
+ {
+ "epoch": 28.798365122615802,
+ "grad_norm": 7.828116416931152,
+ "learning_rate": 1.6707728932792376e-05,
+ "loss": 0.5026,
+ "step": 10569
+ },
+ {
+ "epoch": 28.80108991825613,
+ "grad_norm": 8.556410789489746,
+ "learning_rate": 1.670707439322099e-05,
+ "loss": 0.499,
+ "step": 10570
+ },
+ {
+ "epoch": 28.803814713896458,
+ "grad_norm": 7.418813228607178,
+ "learning_rate": 1.6706419801415122e-05,
+ "loss": 0.5561,
+ "step": 10571
+ },
+ {
+ "epoch": 28.806539509536783,
+ "grad_norm": 9.093198776245117,
+ "learning_rate": 1.6705765157379876e-05,
+ "loss": 0.4318,
+ "step": 10572
+ },
+ {
+ "epoch": 28.809264305177113,
+ "grad_norm": 6.8813252449035645,
+ "learning_rate": 1.6705110461120343e-05,
+ "loss": 0.5348,
+ "step": 10573
+ },
+ {
+ "epoch": 28.81198910081744,
+ "grad_norm": 9.664884567260742,
+ "learning_rate": 1.670445571264163e-05,
+ "loss": 0.5199,
+ "step": 10574
+ },
+ {
+ "epoch": 28.814713896457764,
+ "grad_norm": 6.698128700256348,
+ "learning_rate": 1.6703800911948825e-05,
+ "loss": 0.5584,
+ "step": 10575
+ },
+ {
+ "epoch": 28.817438692098094,
+ "grad_norm": 8.184273719787598,
+ "learning_rate": 1.6703146059047038e-05,
+ "loss": 0.5055,
+ "step": 10576
+ },
+ {
+ "epoch": 28.82016348773842,
+ "grad_norm": 10.05097484588623,
+ "learning_rate": 1.6702491153941367e-05,
+ "loss": 0.5341,
+ "step": 10577
+ },
+ {
+ "epoch": 28.822888283378745,
+ "grad_norm": 7.727924346923828,
+ "learning_rate": 1.6701836196636908e-05,
+ "loss": 0.5427,
+ "step": 10578
+ },
+ {
+ "epoch": 28.825613079019075,
+ "grad_norm": 7.529411792755127,
+ "learning_rate": 1.6701181187138767e-05,
+ "loss": 0.5878,
+ "step": 10579
+ },
+ {
+ "epoch": 28.8283378746594,
+ "grad_norm": 7.188710689544678,
+ "learning_rate": 1.670052612545204e-05,
+ "loss": 0.4862,
+ "step": 10580
+ },
+ {
+ "epoch": 28.831062670299726,
+ "grad_norm": 12.786149978637695,
+ "learning_rate": 1.669987101158183e-05,
+ "loss": 0.5767,
+ "step": 10581
+ },
+ {
+ "epoch": 28.833787465940055,
+ "grad_norm": 10.405355453491211,
+ "learning_rate": 1.6699215845533244e-05,
+ "loss": 0.4841,
+ "step": 10582
+ },
+ {
+ "epoch": 28.83651226158038,
+ "grad_norm": 7.407323360443115,
+ "learning_rate": 1.6698560627311378e-05,
+ "loss": 0.4706,
+ "step": 10583
+ },
+ {
+ "epoch": 28.839237057220707,
+ "grad_norm": 8.080324172973633,
+ "learning_rate": 1.669790535692134e-05,
+ "loss": 0.5331,
+ "step": 10584
+ },
+ {
+ "epoch": 28.841961852861036,
+ "grad_norm": 11.468756675720215,
+ "learning_rate": 1.6697250034368226e-05,
+ "loss": 0.4819,
+ "step": 10585
+ },
+ {
+ "epoch": 28.844686648501362,
+ "grad_norm": 7.990210056304932,
+ "learning_rate": 1.669659465965715e-05,
+ "loss": 0.5371,
+ "step": 10586
+ },
+ {
+ "epoch": 28.847411444141688,
+ "grad_norm": 8.95950698852539,
+ "learning_rate": 1.6695939232793206e-05,
+ "loss": 0.5915,
+ "step": 10587
+ },
+ {
+ "epoch": 28.850136239782017,
+ "grad_norm": 8.210714340209961,
+ "learning_rate": 1.66952837537815e-05,
+ "loss": 0.5724,
+ "step": 10588
+ },
+ {
+ "epoch": 28.852861035422343,
+ "grad_norm": 10.971351623535156,
+ "learning_rate": 1.6694628222627148e-05,
+ "loss": 0.5953,
+ "step": 10589
+ },
+ {
+ "epoch": 28.85558583106267,
+ "grad_norm": 7.6229448318481445,
+ "learning_rate": 1.669397263933524e-05,
+ "loss": 0.5294,
+ "step": 10590
+ },
+ {
+ "epoch": 28.858310626703,
+ "grad_norm": 8.125885963439941,
+ "learning_rate": 1.6693317003910895e-05,
+ "loss": 0.635,
+ "step": 10591
+ },
+ {
+ "epoch": 28.861035422343324,
+ "grad_norm": 8.368759155273438,
+ "learning_rate": 1.6692661316359206e-05,
+ "loss": 0.5388,
+ "step": 10592
+ },
+ {
+ "epoch": 28.86376021798365,
+ "grad_norm": 8.914116859436035,
+ "learning_rate": 1.6692005576685288e-05,
+ "loss": 0.4432,
+ "step": 10593
+ },
+ {
+ "epoch": 28.86648501362398,
+ "grad_norm": 9.29539966583252,
+ "learning_rate": 1.669134978489425e-05,
+ "loss": 0.589,
+ "step": 10594
+ },
+ {
+ "epoch": 28.869209809264305,
+ "grad_norm": 11.241096496582031,
+ "learning_rate": 1.669069394099119e-05,
+ "loss": 0.5644,
+ "step": 10595
+ },
+ {
+ "epoch": 28.87193460490463,
+ "grad_norm": 7.38763427734375,
+ "learning_rate": 1.6690038044981222e-05,
+ "loss": 0.5002,
+ "step": 10596
+ },
+ {
+ "epoch": 28.87465940054496,
+ "grad_norm": 7.305187225341797,
+ "learning_rate": 1.6689382096869457e-05,
+ "loss": 0.4514,
+ "step": 10597
+ },
+ {
+ "epoch": 28.877384196185286,
+ "grad_norm": 9.493101119995117,
+ "learning_rate": 1.6688726096660994e-05,
+ "loss": 0.4852,
+ "step": 10598
+ },
+ {
+ "epoch": 28.88010899182561,
+ "grad_norm": 8.345754623413086,
+ "learning_rate": 1.668807004436095e-05,
+ "loss": 0.4807,
+ "step": 10599
+ },
+ {
+ "epoch": 28.88283378746594,
+ "grad_norm": 8.172216415405273,
+ "learning_rate": 1.668741393997443e-05,
+ "loss": 0.7126,
+ "step": 10600
+ },
+ {
+ "epoch": 28.885558583106267,
+ "grad_norm": 8.099128723144531,
+ "learning_rate": 1.668675778350655e-05,
+ "loss": 0.4258,
+ "step": 10601
+ },
+ {
+ "epoch": 28.888283378746593,
+ "grad_norm": 8.967839241027832,
+ "learning_rate": 1.6686101574962413e-05,
+ "loss": 0.4801,
+ "step": 10602
+ },
+ {
+ "epoch": 28.891008174386922,
+ "grad_norm": 8.110413551330566,
+ "learning_rate": 1.668544531434713e-05,
+ "loss": 0.5353,
+ "step": 10603
+ },
+ {
+ "epoch": 28.893732970027248,
+ "grad_norm": 8.122382164001465,
+ "learning_rate": 1.668478900166582e-05,
+ "loss": 0.597,
+ "step": 10604
+ },
+ {
+ "epoch": 28.896457765667574,
+ "grad_norm": 8.046221733093262,
+ "learning_rate": 1.668413263692358e-05,
+ "loss": 0.5664,
+ "step": 10605
+ },
+ {
+ "epoch": 28.899182561307903,
+ "grad_norm": 6.769096851348877,
+ "learning_rate": 1.6683476220125535e-05,
+ "loss": 0.4942,
+ "step": 10606
+ },
+ {
+ "epoch": 28.90190735694823,
+ "grad_norm": 7.824985504150391,
+ "learning_rate": 1.668281975127679e-05,
+ "loss": 0.5683,
+ "step": 10607
+ },
+ {
+ "epoch": 28.904632152588555,
+ "grad_norm": 9.089848518371582,
+ "learning_rate": 1.6682163230382465e-05,
+ "loss": 0.5217,
+ "step": 10608
+ },
+ {
+ "epoch": 28.907356948228884,
+ "grad_norm": 8.377856254577637,
+ "learning_rate": 1.6681506657447664e-05,
+ "loss": 0.4709,
+ "step": 10609
+ },
+ {
+ "epoch": 28.91008174386921,
+ "grad_norm": 7.7487382888793945,
+ "learning_rate": 1.6680850032477504e-05,
+ "loss": 0.4902,
+ "step": 10610
+ },
+ {
+ "epoch": 28.912806539509535,
+ "grad_norm": 6.764167308807373,
+ "learning_rate": 1.66801933554771e-05,
+ "loss": 0.4218,
+ "step": 10611
+ },
+ {
+ "epoch": 28.915531335149865,
+ "grad_norm": 7.561228275299072,
+ "learning_rate": 1.6679536626451565e-05,
+ "loss": 0.4656,
+ "step": 10612
+ },
+ {
+ "epoch": 28.91825613079019,
+ "grad_norm": 7.498943328857422,
+ "learning_rate": 1.6678879845406014e-05,
+ "loss": 0.5511,
+ "step": 10613
+ },
+ {
+ "epoch": 28.920980926430516,
+ "grad_norm": 7.2002153396606445,
+ "learning_rate": 1.667822301234556e-05,
+ "loss": 0.3559,
+ "step": 10614
+ },
+ {
+ "epoch": 28.923705722070846,
+ "grad_norm": 9.295483589172363,
+ "learning_rate": 1.667756612727532e-05,
+ "loss": 0.661,
+ "step": 10615
+ },
+ {
+ "epoch": 28.92643051771117,
+ "grad_norm": 9.446654319763184,
+ "learning_rate": 1.6676909190200416e-05,
+ "loss": 0.428,
+ "step": 10616
+ },
+ {
+ "epoch": 28.929155313351497,
+ "grad_norm": 8.02613353729248,
+ "learning_rate": 1.667625220112595e-05,
+ "loss": 0.5871,
+ "step": 10617
+ },
+ {
+ "epoch": 28.931880108991827,
+ "grad_norm": 7.79987096786499,
+ "learning_rate": 1.6675595160057053e-05,
+ "loss": 0.592,
+ "step": 10618
+ },
+ {
+ "epoch": 28.934604904632153,
+ "grad_norm": 7.361390590667725,
+ "learning_rate": 1.667493806699883e-05,
+ "loss": 0.6436,
+ "step": 10619
+ },
+ {
+ "epoch": 28.93732970027248,
+ "grad_norm": 8.387858390808105,
+ "learning_rate": 1.667428092195641e-05,
+ "loss": 0.4167,
+ "step": 10620
+ },
+ {
+ "epoch": 28.940054495912808,
+ "grad_norm": 8.999015808105469,
+ "learning_rate": 1.6673623724934898e-05,
+ "loss": 0.5012,
+ "step": 10621
+ },
+ {
+ "epoch": 28.942779291553133,
+ "grad_norm": 6.0761823654174805,
+ "learning_rate": 1.6672966475939426e-05,
+ "loss": 0.4583,
+ "step": 10622
+ },
+ {
+ "epoch": 28.94550408719346,
+ "grad_norm": 7.447052955627441,
+ "learning_rate": 1.66723091749751e-05,
+ "loss": 0.4194,
+ "step": 10623
+ },
+ {
+ "epoch": 28.94822888283379,
+ "grad_norm": 7.755176067352295,
+ "learning_rate": 1.6671651822047052e-05,
+ "loss": 0.3965,
+ "step": 10624
+ },
+ {
+ "epoch": 28.950953678474114,
+ "grad_norm": 8.58421516418457,
+ "learning_rate": 1.667099441716039e-05,
+ "loss": 0.5266,
+ "step": 10625
+ },
+ {
+ "epoch": 28.95367847411444,
+ "grad_norm": 6.611844062805176,
+ "learning_rate": 1.6670336960320237e-05,
+ "loss": 0.5188,
+ "step": 10626
+ },
+ {
+ "epoch": 28.95640326975477,
+ "grad_norm": 11.779068946838379,
+ "learning_rate": 1.6669679451531716e-05,
+ "loss": 0.4384,
+ "step": 10627
+ },
+ {
+ "epoch": 28.959128065395095,
+ "grad_norm": 7.734330654144287,
+ "learning_rate": 1.666902189079995e-05,
+ "loss": 0.5486,
+ "step": 10628
+ },
+ {
+ "epoch": 28.96185286103542,
+ "grad_norm": 7.206127166748047,
+ "learning_rate": 1.6668364278130047e-05,
+ "loss": 0.4609,
+ "step": 10629
+ },
+ {
+ "epoch": 28.96457765667575,
+ "grad_norm": 7.38665771484375,
+ "learning_rate": 1.6667706613527142e-05,
+ "loss": 0.5,
+ "step": 10630
+ },
+ {
+ "epoch": 28.967302452316076,
+ "grad_norm": 9.11385726928711,
+ "learning_rate": 1.6667048896996357e-05,
+ "loss": 0.4606,
+ "step": 10631
+ },
+ {
+ "epoch": 28.970027247956402,
+ "grad_norm": 7.674446105957031,
+ "learning_rate": 1.6666391128542802e-05,
+ "loss": 0.4459,
+ "step": 10632
+ },
+ {
+ "epoch": 28.97275204359673,
+ "grad_norm": 7.57926607131958,
+ "learning_rate": 1.6665733308171615e-05,
+ "loss": 0.596,
+ "step": 10633
+ },
+ {
+ "epoch": 28.975476839237057,
+ "grad_norm": 7.778857231140137,
+ "learning_rate": 1.6665075435887907e-05,
+ "loss": 0.6039,
+ "step": 10634
+ },
+ {
+ "epoch": 28.978201634877383,
+ "grad_norm": 9.085589408874512,
+ "learning_rate": 1.6664417511696807e-05,
+ "loss": 0.4991,
+ "step": 10635
+ },
+ {
+ "epoch": 28.980926430517712,
+ "grad_norm": 7.43651819229126,
+ "learning_rate": 1.6663759535603438e-05,
+ "loss": 0.4854,
+ "step": 10636
+ },
+ {
+ "epoch": 28.983651226158038,
+ "grad_norm": 7.128672122955322,
+ "learning_rate": 1.6663101507612926e-05,
+ "loss": 0.4504,
+ "step": 10637
+ },
+ {
+ "epoch": 28.986376021798364,
+ "grad_norm": 8.316488265991211,
+ "learning_rate": 1.666244342773039e-05,
+ "loss": 0.4891,
+ "step": 10638
+ },
+ {
+ "epoch": 28.989100817438693,
+ "grad_norm": 9.425989151000977,
+ "learning_rate": 1.666178529596096e-05,
+ "loss": 0.546,
+ "step": 10639
+ },
+ {
+ "epoch": 28.99182561307902,
+ "grad_norm": 7.048205852508545,
+ "learning_rate": 1.666112711230976e-05,
+ "loss": 0.4882,
+ "step": 10640
+ },
+ {
+ "epoch": 28.994550408719345,
+ "grad_norm": 7.403781890869141,
+ "learning_rate": 1.666046887678192e-05,
+ "loss": 0.6663,
+ "step": 10641
+ },
+ {
+ "epoch": 28.997275204359674,
+ "grad_norm": 6.79907751083374,
+ "learning_rate": 1.665981058938256e-05,
+ "loss": 0.6273,
+ "step": 10642
+ },
+ {
+ "epoch": 29.0,
+ "grad_norm": 6.791356563568115,
+ "learning_rate": 1.665915225011681e-05,
+ "loss": 0.5466,
+ "step": 10643
+ },
+ {
+ "epoch": 29.002724795640326,
+ "grad_norm": 6.716793537139893,
+ "learning_rate": 1.66584938589898e-05,
+ "loss": 0.5327,
+ "step": 10644
+ },
+ {
+ "epoch": 29.005449591280655,
+ "grad_norm": 6.785096168518066,
+ "learning_rate": 1.665783541600665e-05,
+ "loss": 0.3464,
+ "step": 10645
+ },
+ {
+ "epoch": 29.00817438692098,
+ "grad_norm": 7.015567302703857,
+ "learning_rate": 1.6657176921172492e-05,
+ "loss": 0.5493,
+ "step": 10646
+ },
+ {
+ "epoch": 29.010899182561307,
+ "grad_norm": 6.1250834465026855,
+ "learning_rate": 1.6656518374492458e-05,
+ "loss": 0.3676,
+ "step": 10647
+ },
+ {
+ "epoch": 29.013623978201636,
+ "grad_norm": 6.8189873695373535,
+ "learning_rate": 1.665585977597167e-05,
+ "loss": 0.4194,
+ "step": 10648
+ },
+ {
+ "epoch": 29.016348773841962,
+ "grad_norm": 6.028426170349121,
+ "learning_rate": 1.6655201125615263e-05,
+ "loss": 0.4869,
+ "step": 10649
+ },
+ {
+ "epoch": 29.019073569482288,
+ "grad_norm": 8.195756912231445,
+ "learning_rate": 1.665454242342836e-05,
+ "loss": 0.5178,
+ "step": 10650
+ },
+ {
+ "epoch": 29.021798365122617,
+ "grad_norm": 7.648116111755371,
+ "learning_rate": 1.6653883669416098e-05,
+ "loss": 0.5685,
+ "step": 10651
+ },
+ {
+ "epoch": 29.024523160762943,
+ "grad_norm": 6.029077529907227,
+ "learning_rate": 1.6653224863583602e-05,
+ "loss": 0.55,
+ "step": 10652
+ },
+ {
+ "epoch": 29.02724795640327,
+ "grad_norm": 6.578215599060059,
+ "learning_rate": 1.6652566005936004e-05,
+ "loss": 0.3692,
+ "step": 10653
+ },
+ {
+ "epoch": 29.029972752043598,
+ "grad_norm": 6.456214904785156,
+ "learning_rate": 1.6651907096478436e-05,
+ "loss": 0.359,
+ "step": 10654
+ },
+ {
+ "epoch": 29.032697547683924,
+ "grad_norm": 8.54837703704834,
+ "learning_rate": 1.6651248135216032e-05,
+ "loss": 0.4001,
+ "step": 10655
+ },
+ {
+ "epoch": 29.03542234332425,
+ "grad_norm": 8.930901527404785,
+ "learning_rate": 1.665058912215392e-05,
+ "loss": 0.4656,
+ "step": 10656
+ },
+ {
+ "epoch": 29.03814713896458,
+ "grad_norm": 7.996654987335205,
+ "learning_rate": 1.6649930057297235e-05,
+ "loss": 0.3322,
+ "step": 10657
+ },
+ {
+ "epoch": 29.040871934604905,
+ "grad_norm": 7.286412715911865,
+ "learning_rate": 1.664927094065111e-05,
+ "loss": 0.4208,
+ "step": 10658
+ },
+ {
+ "epoch": 29.04359673024523,
+ "grad_norm": 9.534561157226562,
+ "learning_rate": 1.6648611772220675e-05,
+ "loss": 0.4321,
+ "step": 10659
+ },
+ {
+ "epoch": 29.04632152588556,
+ "grad_norm": 7.3517985343933105,
+ "learning_rate": 1.664795255201107e-05,
+ "loss": 0.5556,
+ "step": 10660
+ },
+ {
+ "epoch": 29.049046321525886,
+ "grad_norm": 6.535494327545166,
+ "learning_rate": 1.664729328002742e-05,
+ "loss": 0.4312,
+ "step": 10661
+ },
+ {
+ "epoch": 29.05177111716621,
+ "grad_norm": 6.648280143737793,
+ "learning_rate": 1.6646633956274862e-05,
+ "loss": 0.7457,
+ "step": 10662
+ },
+ {
+ "epoch": 29.05449591280654,
+ "grad_norm": 7.089462757110596,
+ "learning_rate": 1.6645974580758533e-05,
+ "loss": 0.431,
+ "step": 10663
+ },
+ {
+ "epoch": 29.057220708446867,
+ "grad_norm": 7.128489971160889,
+ "learning_rate": 1.6645315153483572e-05,
+ "loss": 0.614,
+ "step": 10664
+ },
+ {
+ "epoch": 29.059945504087192,
+ "grad_norm": 7.6592183113098145,
+ "learning_rate": 1.6644655674455107e-05,
+ "loss": 0.3837,
+ "step": 10665
+ },
+ {
+ "epoch": 29.06267029972752,
+ "grad_norm": 7.780344009399414,
+ "learning_rate": 1.664399614367828e-05,
+ "loss": 0.5763,
+ "step": 10666
+ },
+ {
+ "epoch": 29.065395095367847,
+ "grad_norm": 8.125530242919922,
+ "learning_rate": 1.6643336561158222e-05,
+ "loss": 0.4218,
+ "step": 10667
+ },
+ {
+ "epoch": 29.068119891008173,
+ "grad_norm": 7.207923889160156,
+ "learning_rate": 1.6642676926900077e-05,
+ "loss": 0.5035,
+ "step": 10668
+ },
+ {
+ "epoch": 29.070844686648503,
+ "grad_norm": 8.001280784606934,
+ "learning_rate": 1.6642017240908975e-05,
+ "loss": 0.377,
+ "step": 10669
+ },
+ {
+ "epoch": 29.07356948228883,
+ "grad_norm": 6.393892765045166,
+ "learning_rate": 1.6641357503190055e-05,
+ "loss": 0.4096,
+ "step": 10670
+ },
+ {
+ "epoch": 29.076294277929154,
+ "grad_norm": 6.3388214111328125,
+ "learning_rate": 1.664069771374846e-05,
+ "loss": 0.4064,
+ "step": 10671
+ },
+ {
+ "epoch": 29.079019073569484,
+ "grad_norm": 5.872392177581787,
+ "learning_rate": 1.664003787258932e-05,
+ "loss": 0.3359,
+ "step": 10672
+ },
+ {
+ "epoch": 29.08174386920981,
+ "grad_norm": 7.228592872619629,
+ "learning_rate": 1.6639377979717784e-05,
+ "loss": 0.4145,
+ "step": 10673
+ },
+ {
+ "epoch": 29.084468664850135,
+ "grad_norm": 7.437412261962891,
+ "learning_rate": 1.6638718035138985e-05,
+ "loss": 0.4682,
+ "step": 10674
+ },
+ {
+ "epoch": 29.087193460490465,
+ "grad_norm": 7.387948989868164,
+ "learning_rate": 1.663805803885806e-05,
+ "loss": 0.469,
+ "step": 10675
+ },
+ {
+ "epoch": 29.08991825613079,
+ "grad_norm": 40.065284729003906,
+ "learning_rate": 1.6637397990880158e-05,
+ "loss": 0.3711,
+ "step": 10676
+ },
+ {
+ "epoch": 29.092643051771116,
+ "grad_norm": 7.11245059967041,
+ "learning_rate": 1.6636737891210412e-05,
+ "loss": 0.4128,
+ "step": 10677
+ },
+ {
+ "epoch": 29.095367847411445,
+ "grad_norm": 7.460601329803467,
+ "learning_rate": 1.663607773985396e-05,
+ "loss": 0.4702,
+ "step": 10678
+ },
+ {
+ "epoch": 29.09809264305177,
+ "grad_norm": 13.630023956298828,
+ "learning_rate": 1.6635417536815953e-05,
+ "loss": 0.626,
+ "step": 10679
+ },
+ {
+ "epoch": 29.100817438692097,
+ "grad_norm": 6.180692195892334,
+ "learning_rate": 1.663475728210153e-05,
+ "loss": 0.4881,
+ "step": 10680
+ },
+ {
+ "epoch": 29.103542234332426,
+ "grad_norm": 7.246993541717529,
+ "learning_rate": 1.6634096975715825e-05,
+ "loss": 0.4967,
+ "step": 10681
+ },
+ {
+ "epoch": 29.106267029972752,
+ "grad_norm": 7.189358711242676,
+ "learning_rate": 1.6633436617663988e-05,
+ "loss": 0.3922,
+ "step": 10682
+ },
+ {
+ "epoch": 29.108991825613078,
+ "grad_norm": 8.475040435791016,
+ "learning_rate": 1.6632776207951165e-05,
+ "loss": 0.4345,
+ "step": 10683
+ },
+ {
+ "epoch": 29.111716621253407,
+ "grad_norm": 6.120608329772949,
+ "learning_rate": 1.663211574658249e-05,
+ "loss": 0.3836,
+ "step": 10684
+ },
+ {
+ "epoch": 29.114441416893733,
+ "grad_norm": 7.1794281005859375,
+ "learning_rate": 1.6631455233563113e-05,
+ "loss": 0.4676,
+ "step": 10685
+ },
+ {
+ "epoch": 29.11716621253406,
+ "grad_norm": 7.182884693145752,
+ "learning_rate": 1.6630794668898175e-05,
+ "loss": 0.4496,
+ "step": 10686
+ },
+ {
+ "epoch": 29.11989100817439,
+ "grad_norm": 6.465396881103516,
+ "learning_rate": 1.6630134052592823e-05,
+ "loss": 0.4851,
+ "step": 10687
+ },
+ {
+ "epoch": 29.122615803814714,
+ "grad_norm": 6.79514741897583,
+ "learning_rate": 1.6629473384652197e-05,
+ "loss": 0.4568,
+ "step": 10688
+ },
+ {
+ "epoch": 29.12534059945504,
+ "grad_norm": 8.822425842285156,
+ "learning_rate": 1.6628812665081446e-05,
+ "loss": 0.4444,
+ "step": 10689
+ },
+ {
+ "epoch": 29.12806539509537,
+ "grad_norm": 9.892768859863281,
+ "learning_rate": 1.6628151893885715e-05,
+ "loss": 0.5513,
+ "step": 10690
+ },
+ {
+ "epoch": 29.130790190735695,
+ "grad_norm": 7.1043620109558105,
+ "learning_rate": 1.6627491071070152e-05,
+ "loss": 0.3967,
+ "step": 10691
+ },
+ {
+ "epoch": 29.13351498637602,
+ "grad_norm": 7.769501686096191,
+ "learning_rate": 1.66268301966399e-05,
+ "loss": 0.452,
+ "step": 10692
+ },
+ {
+ "epoch": 29.13623978201635,
+ "grad_norm": 9.14890193939209,
+ "learning_rate": 1.6626169270600113e-05,
+ "loss": 0.601,
+ "step": 10693
+ },
+ {
+ "epoch": 29.138964577656676,
+ "grad_norm": 6.528905391693115,
+ "learning_rate": 1.662550829295593e-05,
+ "loss": 0.3549,
+ "step": 10694
+ },
+ {
+ "epoch": 29.141689373297,
+ "grad_norm": 7.674026966094971,
+ "learning_rate": 1.66248472637125e-05,
+ "loss": 0.4982,
+ "step": 10695
+ },
+ {
+ "epoch": 29.14441416893733,
+ "grad_norm": 6.87601900100708,
+ "learning_rate": 1.6624186182874977e-05,
+ "loss": 0.3966,
+ "step": 10696
+ },
+ {
+ "epoch": 29.147138964577657,
+ "grad_norm": 7.0147552490234375,
+ "learning_rate": 1.66235250504485e-05,
+ "loss": 0.4487,
+ "step": 10697
+ },
+ {
+ "epoch": 29.149863760217983,
+ "grad_norm": 6.048093318939209,
+ "learning_rate": 1.6622863866438223e-05,
+ "loss": 0.4211,
+ "step": 10698
+ },
+ {
+ "epoch": 29.152588555858312,
+ "grad_norm": 6.146883010864258,
+ "learning_rate": 1.66222026308493e-05,
+ "loss": 0.4698,
+ "step": 10699
+ },
+ {
+ "epoch": 29.155313351498638,
+ "grad_norm": 8.4680814743042,
+ "learning_rate": 1.662154134368687e-05,
+ "loss": 0.339,
+ "step": 10700
+ },
+ {
+ "epoch": 29.158038147138964,
+ "grad_norm": 7.185520648956299,
+ "learning_rate": 1.6620880004956095e-05,
+ "loss": 0.3368,
+ "step": 10701
+ },
+ {
+ "epoch": 29.160762942779293,
+ "grad_norm": 7.100562572479248,
+ "learning_rate": 1.662021861466212e-05,
+ "loss": 0.5181,
+ "step": 10702
+ },
+ {
+ "epoch": 29.16348773841962,
+ "grad_norm": 8.350886344909668,
+ "learning_rate": 1.661955717281009e-05,
+ "loss": 0.5449,
+ "step": 10703
+ },
+ {
+ "epoch": 29.166212534059945,
+ "grad_norm": 8.237159729003906,
+ "learning_rate": 1.6618895679405165e-05,
+ "loss": 0.4541,
+ "step": 10704
+ },
+ {
+ "epoch": 29.168937329700274,
+ "grad_norm": 7.449276447296143,
+ "learning_rate": 1.6618234134452493e-05,
+ "loss": 0.3835,
+ "step": 10705
+ },
+ {
+ "epoch": 29.1716621253406,
+ "grad_norm": 7.251029014587402,
+ "learning_rate": 1.661757253795723e-05,
+ "loss": 0.5143,
+ "step": 10706
+ },
+ {
+ "epoch": 29.174386920980925,
+ "grad_norm": 6.984391212463379,
+ "learning_rate": 1.661691088992452e-05,
+ "loss": 0.4431,
+ "step": 10707
+ },
+ {
+ "epoch": 29.177111716621255,
+ "grad_norm": 8.196168899536133,
+ "learning_rate": 1.661624919035952e-05,
+ "loss": 0.4003,
+ "step": 10708
+ },
+ {
+ "epoch": 29.17983651226158,
+ "grad_norm": 7.046302318572998,
+ "learning_rate": 1.661558743926739e-05,
+ "loss": 0.4662,
+ "step": 10709
+ },
+ {
+ "epoch": 29.182561307901906,
+ "grad_norm": 7.18446683883667,
+ "learning_rate": 1.6614925636653274e-05,
+ "loss": 0.5267,
+ "step": 10710
+ },
+ {
+ "epoch": 29.185286103542236,
+ "grad_norm": 7.664499759674072,
+ "learning_rate": 1.6614263782522332e-05,
+ "loss": 0.4207,
+ "step": 10711
+ },
+ {
+ "epoch": 29.18801089918256,
+ "grad_norm": 5.894651412963867,
+ "learning_rate": 1.6613601876879714e-05,
+ "loss": 0.5299,
+ "step": 10712
+ },
+ {
+ "epoch": 29.190735694822887,
+ "grad_norm": 7.169234275817871,
+ "learning_rate": 1.6612939919730578e-05,
+ "loss": 0.4573,
+ "step": 10713
+ },
+ {
+ "epoch": 29.193460490463217,
+ "grad_norm": 10.233022689819336,
+ "learning_rate": 1.661227791108008e-05,
+ "loss": 0.4675,
+ "step": 10714
+ },
+ {
+ "epoch": 29.196185286103542,
+ "grad_norm": 6.739607810974121,
+ "learning_rate": 1.6611615850933374e-05,
+ "loss": 0.4117,
+ "step": 10715
+ },
+ {
+ "epoch": 29.19891008174387,
+ "grad_norm": 6.349090099334717,
+ "learning_rate": 1.6610953739295617e-05,
+ "loss": 0.4535,
+ "step": 10716
+ },
+ {
+ "epoch": 29.201634877384198,
+ "grad_norm": 7.4584479331970215,
+ "learning_rate": 1.6610291576171965e-05,
+ "loss": 0.4776,
+ "step": 10717
+ },
+ {
+ "epoch": 29.204359673024523,
+ "grad_norm": 7.474863529205322,
+ "learning_rate": 1.6609629361567578e-05,
+ "loss": 0.3361,
+ "step": 10718
+ },
+ {
+ "epoch": 29.20708446866485,
+ "grad_norm": 7.306474685668945,
+ "learning_rate": 1.6608967095487606e-05,
+ "loss": 0.5182,
+ "step": 10719
+ },
+ {
+ "epoch": 29.20980926430518,
+ "grad_norm": 6.636267185211182,
+ "learning_rate": 1.660830477793721e-05,
+ "loss": 0.5018,
+ "step": 10720
+ },
+ {
+ "epoch": 29.212534059945504,
+ "grad_norm": 8.042543411254883,
+ "learning_rate": 1.6607642408921552e-05,
+ "loss": 0.4495,
+ "step": 10721
+ },
+ {
+ "epoch": 29.21525885558583,
+ "grad_norm": 7.184332847595215,
+ "learning_rate": 1.6606979988445787e-05,
+ "loss": 0.3229,
+ "step": 10722
+ },
+ {
+ "epoch": 29.21798365122616,
+ "grad_norm": 6.720614433288574,
+ "learning_rate": 1.6606317516515074e-05,
+ "loss": 0.4746,
+ "step": 10723
+ },
+ {
+ "epoch": 29.220708446866485,
+ "grad_norm": 8.756359100341797,
+ "learning_rate": 1.660565499313457e-05,
+ "loss": 0.3661,
+ "step": 10724
+ },
+ {
+ "epoch": 29.22343324250681,
+ "grad_norm": 6.875161647796631,
+ "learning_rate": 1.6604992418309443e-05,
+ "loss": 0.3187,
+ "step": 10725
+ },
+ {
+ "epoch": 29.22615803814714,
+ "grad_norm": 8.915993690490723,
+ "learning_rate": 1.6604329792044845e-05,
+ "loss": 0.4139,
+ "step": 10726
+ },
+ {
+ "epoch": 29.228882833787466,
+ "grad_norm": 14.585935592651367,
+ "learning_rate": 1.660366711434594e-05,
+ "loss": 0.3608,
+ "step": 10727
+ },
+ {
+ "epoch": 29.231607629427792,
+ "grad_norm": 7.285501480102539,
+ "learning_rate": 1.6603004385217887e-05,
+ "loss": 0.3971,
+ "step": 10728
+ },
+ {
+ "epoch": 29.23433242506812,
+ "grad_norm": 7.343924045562744,
+ "learning_rate": 1.6602341604665848e-05,
+ "loss": 0.5458,
+ "step": 10729
+ },
+ {
+ "epoch": 29.237057220708447,
+ "grad_norm": 8.615266799926758,
+ "learning_rate": 1.6601678772694985e-05,
+ "loss": 0.5154,
+ "step": 10730
+ },
+ {
+ "epoch": 29.239782016348773,
+ "grad_norm": 8.476104736328125,
+ "learning_rate": 1.6601015889310462e-05,
+ "loss": 0.5087,
+ "step": 10731
+ },
+ {
+ "epoch": 29.242506811989102,
+ "grad_norm": 6.7297682762146,
+ "learning_rate": 1.6600352954517437e-05,
+ "loss": 0.444,
+ "step": 10732
+ },
+ {
+ "epoch": 29.245231607629428,
+ "grad_norm": 12.848528861999512,
+ "learning_rate": 1.659968996832108e-05,
+ "loss": 0.4996,
+ "step": 10733
+ },
+ {
+ "epoch": 29.247956403269754,
+ "grad_norm": 7.561726093292236,
+ "learning_rate": 1.6599026930726544e-05,
+ "loss": 0.3617,
+ "step": 10734
+ },
+ {
+ "epoch": 29.250681198910083,
+ "grad_norm": 6.653961658477783,
+ "learning_rate": 1.6598363841739004e-05,
+ "loss": 0.4031,
+ "step": 10735
+ },
+ {
+ "epoch": 29.25340599455041,
+ "grad_norm": 7.954012870788574,
+ "learning_rate": 1.6597700701363615e-05,
+ "loss": 0.4294,
+ "step": 10736
+ },
+ {
+ "epoch": 29.256130790190735,
+ "grad_norm": 7.65130090713501,
+ "learning_rate": 1.6597037509605546e-05,
+ "loss": 0.5634,
+ "step": 10737
+ },
+ {
+ "epoch": 29.258855585831064,
+ "grad_norm": 6.7763519287109375,
+ "learning_rate": 1.6596374266469963e-05,
+ "loss": 0.5255,
+ "step": 10738
+ },
+ {
+ "epoch": 29.26158038147139,
+ "grad_norm": 7.821353435516357,
+ "learning_rate": 1.6595710971962028e-05,
+ "loss": 0.5572,
+ "step": 10739
+ },
+ {
+ "epoch": 29.264305177111716,
+ "grad_norm": 6.62902307510376,
+ "learning_rate": 1.6595047626086908e-05,
+ "loss": 0.3801,
+ "step": 10740
+ },
+ {
+ "epoch": 29.267029972752045,
+ "grad_norm": 7.1971564292907715,
+ "learning_rate": 1.659438422884977e-05,
+ "loss": 0.5649,
+ "step": 10741
+ },
+ {
+ "epoch": 29.26975476839237,
+ "grad_norm": 19.59003257751465,
+ "learning_rate": 1.6593720780255778e-05,
+ "loss": 0.3581,
+ "step": 10742
+ },
+ {
+ "epoch": 29.272479564032697,
+ "grad_norm": 7.921016693115234,
+ "learning_rate": 1.6593057280310105e-05,
+ "loss": 0.3824,
+ "step": 10743
+ },
+ {
+ "epoch": 29.275204359673026,
+ "grad_norm": 7.749704837799072,
+ "learning_rate": 1.659239372901791e-05,
+ "loss": 0.3783,
+ "step": 10744
+ },
+ {
+ "epoch": 29.277929155313352,
+ "grad_norm": 7.899710655212402,
+ "learning_rate": 1.659173012638437e-05,
+ "loss": 0.475,
+ "step": 10745
+ },
+ {
+ "epoch": 29.280653950953678,
+ "grad_norm": 7.129073143005371,
+ "learning_rate": 1.6591066472414647e-05,
+ "loss": 0.5405,
+ "step": 10746
+ },
+ {
+ "epoch": 29.283378746594007,
+ "grad_norm": 6.995426654815674,
+ "learning_rate": 1.6590402767113903e-05,
+ "loss": 0.6329,
+ "step": 10747
+ },
+ {
+ "epoch": 29.286103542234333,
+ "grad_norm": 6.966623783111572,
+ "learning_rate": 1.6589739010487323e-05,
+ "loss": 0.5219,
+ "step": 10748
+ },
+ {
+ "epoch": 29.28882833787466,
+ "grad_norm": 6.712077617645264,
+ "learning_rate": 1.6589075202540064e-05,
+ "loss": 0.37,
+ "step": 10749
+ },
+ {
+ "epoch": 29.291553133514988,
+ "grad_norm": 8.465301513671875,
+ "learning_rate": 1.65884113432773e-05,
+ "loss": 0.5001,
+ "step": 10750
+ },
+ {
+ "epoch": 29.294277929155314,
+ "grad_norm": 9.476337432861328,
+ "learning_rate": 1.65877474327042e-05,
+ "loss": 0.5214,
+ "step": 10751
+ },
+ {
+ "epoch": 29.29700272479564,
+ "grad_norm": 26.010038375854492,
+ "learning_rate": 1.6587083470825933e-05,
+ "loss": 0.4188,
+ "step": 10752
+ },
+ {
+ "epoch": 29.29972752043597,
+ "grad_norm": 8.532973289489746,
+ "learning_rate": 1.6586419457647673e-05,
+ "loss": 0.485,
+ "step": 10753
+ },
+ {
+ "epoch": 29.302452316076295,
+ "grad_norm": 7.86745023727417,
+ "learning_rate": 1.658575539317459e-05,
+ "loss": 0.444,
+ "step": 10754
+ },
+ {
+ "epoch": 29.30517711171662,
+ "grad_norm": 7.497247695922852,
+ "learning_rate": 1.658509127741186e-05,
+ "loss": 0.4146,
+ "step": 10755
+ },
+ {
+ "epoch": 29.30790190735695,
+ "grad_norm": 6.255491733551025,
+ "learning_rate": 1.658442711036465e-05,
+ "loss": 0.439,
+ "step": 10756
+ },
+ {
+ "epoch": 29.310626702997276,
+ "grad_norm": 7.498615741729736,
+ "learning_rate": 1.658376289203813e-05,
+ "loss": 0.5736,
+ "step": 10757
+ },
+ {
+ "epoch": 29.3133514986376,
+ "grad_norm": 7.252074718475342,
+ "learning_rate": 1.6583098622437477e-05,
+ "loss": 0.5148,
+ "step": 10758
+ },
+ {
+ "epoch": 29.31607629427793,
+ "grad_norm": 6.788809776306152,
+ "learning_rate": 1.6582434301567865e-05,
+ "loss": 0.5305,
+ "step": 10759
+ },
+ {
+ "epoch": 29.318801089918257,
+ "grad_norm": 8.381567001342773,
+ "learning_rate": 1.6581769929434467e-05,
+ "loss": 0.4646,
+ "step": 10760
+ },
+ {
+ "epoch": 29.321525885558582,
+ "grad_norm": 8.161211967468262,
+ "learning_rate": 1.6581105506042456e-05,
+ "loss": 0.5881,
+ "step": 10761
+ },
+ {
+ "epoch": 29.32425068119891,
+ "grad_norm": 10.112963676452637,
+ "learning_rate": 1.6580441031397008e-05,
+ "loss": 0.4094,
+ "step": 10762
+ },
+ {
+ "epoch": 29.326975476839237,
+ "grad_norm": 8.371186256408691,
+ "learning_rate": 1.6579776505503294e-05,
+ "loss": 0.4287,
+ "step": 10763
+ },
+ {
+ "epoch": 29.329700272479563,
+ "grad_norm": 7.590577602386475,
+ "learning_rate": 1.65791119283665e-05,
+ "loss": 0.3506,
+ "step": 10764
+ },
+ {
+ "epoch": 29.332425068119893,
+ "grad_norm": 7.688154697418213,
+ "learning_rate": 1.6578447299991788e-05,
+ "loss": 0.4612,
+ "step": 10765
+ },
+ {
+ "epoch": 29.33514986376022,
+ "grad_norm": 6.572022914886475,
+ "learning_rate": 1.657778262038434e-05,
+ "loss": 0.4254,
+ "step": 10766
+ },
+ {
+ "epoch": 29.337874659400544,
+ "grad_norm": 8.043402671813965,
+ "learning_rate": 1.657711788954933e-05,
+ "loss": 0.4941,
+ "step": 10767
+ },
+ {
+ "epoch": 29.340599455040874,
+ "grad_norm": 7.502988815307617,
+ "learning_rate": 1.6576453107491945e-05,
+ "loss": 0.4216,
+ "step": 10768
+ },
+ {
+ "epoch": 29.3433242506812,
+ "grad_norm": 6.928520202636719,
+ "learning_rate": 1.6575788274217347e-05,
+ "loss": 0.3849,
+ "step": 10769
+ },
+ {
+ "epoch": 29.346049046321525,
+ "grad_norm": 8.919737815856934,
+ "learning_rate": 1.6575123389730728e-05,
+ "loss": 0.4212,
+ "step": 10770
+ },
+ {
+ "epoch": 29.348773841961854,
+ "grad_norm": 6.961564064025879,
+ "learning_rate": 1.6574458454037256e-05,
+ "loss": 0.4708,
+ "step": 10771
+ },
+ {
+ "epoch": 29.35149863760218,
+ "grad_norm": 7.387964725494385,
+ "learning_rate": 1.6573793467142114e-05,
+ "loss": 0.5485,
+ "step": 10772
+ },
+ {
+ "epoch": 29.354223433242506,
+ "grad_norm": 9.136253356933594,
+ "learning_rate": 1.657312842905048e-05,
+ "loss": 0.4797,
+ "step": 10773
+ },
+ {
+ "epoch": 29.356948228882835,
+ "grad_norm": 7.161242961883545,
+ "learning_rate": 1.6572463339767537e-05,
+ "loss": 0.3954,
+ "step": 10774
+ },
+ {
+ "epoch": 29.35967302452316,
+ "grad_norm": 7.878520488739014,
+ "learning_rate": 1.6571798199298457e-05,
+ "loss": 0.4626,
+ "step": 10775
+ },
+ {
+ "epoch": 29.362397820163487,
+ "grad_norm": 8.14638900756836,
+ "learning_rate": 1.6571133007648424e-05,
+ "loss": 0.5304,
+ "step": 10776
+ },
+ {
+ "epoch": 29.365122615803816,
+ "grad_norm": 8.658432006835938,
+ "learning_rate": 1.657046776482262e-05,
+ "loss": 0.5071,
+ "step": 10777
+ },
+ {
+ "epoch": 29.367847411444142,
+ "grad_norm": 8.138938903808594,
+ "learning_rate": 1.6569802470826226e-05,
+ "loss": 0.6318,
+ "step": 10778
+ },
+ {
+ "epoch": 29.370572207084468,
+ "grad_norm": 6.878420829772949,
+ "learning_rate": 1.6569137125664417e-05,
+ "loss": 0.5325,
+ "step": 10779
+ },
+ {
+ "epoch": 29.373297002724797,
+ "grad_norm": 8.385366439819336,
+ "learning_rate": 1.6568471729342384e-05,
+ "loss": 0.5004,
+ "step": 10780
+ },
+ {
+ "epoch": 29.376021798365123,
+ "grad_norm": 8.681464195251465,
+ "learning_rate": 1.6567806281865305e-05,
+ "loss": 0.5396,
+ "step": 10781
+ },
+ {
+ "epoch": 29.37874659400545,
+ "grad_norm": 6.902587413787842,
+ "learning_rate": 1.6567140783238358e-05,
+ "loss": 0.4479,
+ "step": 10782
+ },
+ {
+ "epoch": 29.381471389645778,
+ "grad_norm": 9.539426803588867,
+ "learning_rate": 1.6566475233466732e-05,
+ "loss": 0.5034,
+ "step": 10783
+ },
+ {
+ "epoch": 29.384196185286104,
+ "grad_norm": 7.421967029571533,
+ "learning_rate": 1.6565809632555607e-05,
+ "loss": 0.5312,
+ "step": 10784
+ },
+ {
+ "epoch": 29.38692098092643,
+ "grad_norm": 8.303641319274902,
+ "learning_rate": 1.656514398051017e-05,
+ "loss": 0.5323,
+ "step": 10785
+ },
+ {
+ "epoch": 29.38964577656676,
+ "grad_norm": 8.001503944396973,
+ "learning_rate": 1.65644782773356e-05,
+ "loss": 0.4594,
+ "step": 10786
+ },
+ {
+ "epoch": 29.392370572207085,
+ "grad_norm": 8.343440055847168,
+ "learning_rate": 1.6563812523037087e-05,
+ "loss": 0.4363,
+ "step": 10787
+ },
+ {
+ "epoch": 29.39509536784741,
+ "grad_norm": 7.275823593139648,
+ "learning_rate": 1.6563146717619814e-05,
+ "loss": 0.4149,
+ "step": 10788
+ },
+ {
+ "epoch": 29.39782016348774,
+ "grad_norm": 7.187505722045898,
+ "learning_rate": 1.6562480861088966e-05,
+ "loss": 0.5338,
+ "step": 10789
+ },
+ {
+ "epoch": 29.400544959128066,
+ "grad_norm": 7.029732704162598,
+ "learning_rate": 1.6561814953449728e-05,
+ "loss": 0.3399,
+ "step": 10790
+ },
+ {
+ "epoch": 29.40326975476839,
+ "grad_norm": 8.944703102111816,
+ "learning_rate": 1.6561148994707285e-05,
+ "loss": 0.451,
+ "step": 10791
+ },
+ {
+ "epoch": 29.40599455040872,
+ "grad_norm": 6.436709880828857,
+ "learning_rate": 1.6560482984866823e-05,
+ "loss": 0.5174,
+ "step": 10792
+ },
+ {
+ "epoch": 29.408719346049047,
+ "grad_norm": 6.83833646774292,
+ "learning_rate": 1.655981692393353e-05,
+ "loss": 0.4771,
+ "step": 10793
+ },
+ {
+ "epoch": 29.411444141689373,
+ "grad_norm": 6.635432243347168,
+ "learning_rate": 1.65591508119126e-05,
+ "loss": 0.6338,
+ "step": 10794
+ },
+ {
+ "epoch": 29.414168937329702,
+ "grad_norm": 7.787850856781006,
+ "learning_rate": 1.655848464880921e-05,
+ "loss": 0.4234,
+ "step": 10795
+ },
+ {
+ "epoch": 29.416893732970028,
+ "grad_norm": 6.895452499389648,
+ "learning_rate": 1.6557818434628555e-05,
+ "loss": 0.3962,
+ "step": 10796
+ },
+ {
+ "epoch": 29.419618528610354,
+ "grad_norm": 14.239097595214844,
+ "learning_rate": 1.655715216937582e-05,
+ "loss": 0.5432,
+ "step": 10797
+ },
+ {
+ "epoch": 29.422343324250683,
+ "grad_norm": 7.626240253448486,
+ "learning_rate": 1.6556485853056194e-05,
+ "loss": 0.5251,
+ "step": 10798
+ },
+ {
+ "epoch": 29.42506811989101,
+ "grad_norm": 7.327658653259277,
+ "learning_rate": 1.6555819485674865e-05,
+ "loss": 0.5409,
+ "step": 10799
+ },
+ {
+ "epoch": 29.427792915531334,
+ "grad_norm": 8.085366249084473,
+ "learning_rate": 1.655515306723703e-05,
+ "loss": 0.4064,
+ "step": 10800
+ },
+ {
+ "epoch": 29.430517711171664,
+ "grad_norm": 8.021275520324707,
+ "learning_rate": 1.655448659774787e-05,
+ "loss": 0.4655,
+ "step": 10801
+ },
+ {
+ "epoch": 29.43324250681199,
+ "grad_norm": 7.704780101776123,
+ "learning_rate": 1.6553820077212585e-05,
+ "loss": 0.4886,
+ "step": 10802
+ },
+ {
+ "epoch": 29.435967302452315,
+ "grad_norm": 8.516914367675781,
+ "learning_rate": 1.6553153505636356e-05,
+ "loss": 0.5174,
+ "step": 10803
+ },
+ {
+ "epoch": 29.438692098092645,
+ "grad_norm": 7.043200492858887,
+ "learning_rate": 1.6552486883024376e-05,
+ "loss": 0.3714,
+ "step": 10804
+ },
+ {
+ "epoch": 29.44141689373297,
+ "grad_norm": 7.265212535858154,
+ "learning_rate": 1.6551820209381843e-05,
+ "loss": 0.4593,
+ "step": 10805
+ },
+ {
+ "epoch": 29.444141689373296,
+ "grad_norm": 6.623559951782227,
+ "learning_rate": 1.6551153484713943e-05,
+ "loss": 0.5319,
+ "step": 10806
+ },
+ {
+ "epoch": 29.446866485013626,
+ "grad_norm": 7.270200252532959,
+ "learning_rate": 1.655048670902587e-05,
+ "loss": 0.371,
+ "step": 10807
+ },
+ {
+ "epoch": 29.44959128065395,
+ "grad_norm": 8.101445198059082,
+ "learning_rate": 1.654981988232282e-05,
+ "loss": 0.5175,
+ "step": 10808
+ },
+ {
+ "epoch": 29.452316076294277,
+ "grad_norm": 6.925370693206787,
+ "learning_rate": 1.6549153004609982e-05,
+ "loss": 0.4874,
+ "step": 10809
+ },
+ {
+ "epoch": 29.455040871934607,
+ "grad_norm": 7.511909008026123,
+ "learning_rate": 1.654848607589255e-05,
+ "loss": 0.6361,
+ "step": 10810
+ },
+ {
+ "epoch": 29.457765667574932,
+ "grad_norm": 10.822510719299316,
+ "learning_rate": 1.6547819096175722e-05,
+ "loss": 0.5509,
+ "step": 10811
+ },
+ {
+ "epoch": 29.460490463215258,
+ "grad_norm": 8.81610107421875,
+ "learning_rate": 1.6547152065464688e-05,
+ "loss": 0.4535,
+ "step": 10812
+ },
+ {
+ "epoch": 29.463215258855588,
+ "grad_norm": 6.656589031219482,
+ "learning_rate": 1.6546484983764646e-05,
+ "loss": 0.4775,
+ "step": 10813
+ },
+ {
+ "epoch": 29.465940054495913,
+ "grad_norm": 10.142149925231934,
+ "learning_rate": 1.6545817851080785e-05,
+ "loss": 0.5012,
+ "step": 10814
+ },
+ {
+ "epoch": 29.46866485013624,
+ "grad_norm": 9.494502067565918,
+ "learning_rate": 1.654515066741831e-05,
+ "loss": 0.3914,
+ "step": 10815
+ },
+ {
+ "epoch": 29.47138964577657,
+ "grad_norm": 6.635324954986572,
+ "learning_rate": 1.654448343278241e-05,
+ "loss": 0.5041,
+ "step": 10816
+ },
+ {
+ "epoch": 29.474114441416894,
+ "grad_norm": 5.768138408660889,
+ "learning_rate": 1.6543816147178283e-05,
+ "loss": 0.3553,
+ "step": 10817
+ },
+ {
+ "epoch": 29.47683923705722,
+ "grad_norm": 8.109676361083984,
+ "learning_rate": 1.654314881061113e-05,
+ "loss": 0.4941,
+ "step": 10818
+ },
+ {
+ "epoch": 29.479564032697546,
+ "grad_norm": 7.911977291107178,
+ "learning_rate": 1.6542481423086145e-05,
+ "loss": 0.4431,
+ "step": 10819
+ },
+ {
+ "epoch": 29.482288828337875,
+ "grad_norm": 5.9850311279296875,
+ "learning_rate": 1.654181398460852e-05,
+ "loss": 0.4828,
+ "step": 10820
+ },
+ {
+ "epoch": 29.4850136239782,
+ "grad_norm": 8.306781768798828,
+ "learning_rate": 1.6541146495183463e-05,
+ "loss": 0.5159,
+ "step": 10821
+ },
+ {
+ "epoch": 29.48773841961853,
+ "grad_norm": 9.13083267211914,
+ "learning_rate": 1.6540478954816164e-05,
+ "loss": 0.4634,
+ "step": 10822
+ },
+ {
+ "epoch": 29.490463215258856,
+ "grad_norm": 7.0769267082214355,
+ "learning_rate": 1.6539811363511827e-05,
+ "loss": 0.3601,
+ "step": 10823
+ },
+ {
+ "epoch": 29.493188010899182,
+ "grad_norm": 8.102646827697754,
+ "learning_rate": 1.653914372127565e-05,
+ "loss": 0.4487,
+ "step": 10824
+ },
+ {
+ "epoch": 29.495912806539508,
+ "grad_norm": 7.4217681884765625,
+ "learning_rate": 1.6538476028112832e-05,
+ "loss": 0.3892,
+ "step": 10825
+ },
+ {
+ "epoch": 29.498637602179837,
+ "grad_norm": 7.808663845062256,
+ "learning_rate": 1.653780828402857e-05,
+ "loss": 0.3923,
+ "step": 10826
+ },
+ {
+ "epoch": 29.501362397820163,
+ "grad_norm": 6.494418144226074,
+ "learning_rate": 1.6537140489028073e-05,
+ "loss": 0.5069,
+ "step": 10827
+ },
+ {
+ "epoch": 29.504087193460492,
+ "grad_norm": 7.85498571395874,
+ "learning_rate": 1.653647264311653e-05,
+ "loss": 0.5422,
+ "step": 10828
+ },
+ {
+ "epoch": 29.506811989100818,
+ "grad_norm": 8.364899635314941,
+ "learning_rate": 1.6535804746299154e-05,
+ "loss": 0.4385,
+ "step": 10829
+ },
+ {
+ "epoch": 29.509536784741144,
+ "grad_norm": 6.561302185058594,
+ "learning_rate": 1.653513679858114e-05,
+ "loss": 0.3771,
+ "step": 10830
+ },
+ {
+ "epoch": 29.51226158038147,
+ "grad_norm": 7.510750770568848,
+ "learning_rate": 1.6534468799967692e-05,
+ "loss": 0.7035,
+ "step": 10831
+ },
+ {
+ "epoch": 29.5149863760218,
+ "grad_norm": 7.323873519897461,
+ "learning_rate": 1.6533800750464006e-05,
+ "loss": 0.3801,
+ "step": 10832
+ },
+ {
+ "epoch": 29.517711171662125,
+ "grad_norm": 7.319087028503418,
+ "learning_rate": 1.6533132650075293e-05,
+ "loss": 0.4436,
+ "step": 10833
+ },
+ {
+ "epoch": 29.520435967302454,
+ "grad_norm": 7.902466297149658,
+ "learning_rate": 1.6532464498806755e-05,
+ "loss": 0.3191,
+ "step": 10834
+ },
+ {
+ "epoch": 29.52316076294278,
+ "grad_norm": 8.569283485412598,
+ "learning_rate": 1.6531796296663595e-05,
+ "loss": 0.3892,
+ "step": 10835
+ },
+ {
+ "epoch": 29.525885558583106,
+ "grad_norm": 9.558220863342285,
+ "learning_rate": 1.653112804365101e-05,
+ "loss": 0.4821,
+ "step": 10836
+ },
+ {
+ "epoch": 29.52861035422343,
+ "grad_norm": 8.228992462158203,
+ "learning_rate": 1.653045973977421e-05,
+ "loss": 0.4522,
+ "step": 10837
+ },
+ {
+ "epoch": 29.53133514986376,
+ "grad_norm": 7.123694896697998,
+ "learning_rate": 1.6529791385038404e-05,
+ "loss": 0.4266,
+ "step": 10838
+ },
+ {
+ "epoch": 29.534059945504087,
+ "grad_norm": 7.235476493835449,
+ "learning_rate": 1.6529122979448792e-05,
+ "loss": 0.5008,
+ "step": 10839
+ },
+ {
+ "epoch": 29.536784741144416,
+ "grad_norm": 7.183542251586914,
+ "learning_rate": 1.6528454523010583e-05,
+ "loss": 0.4805,
+ "step": 10840
+ },
+ {
+ "epoch": 29.539509536784742,
+ "grad_norm": 7.383785724639893,
+ "learning_rate": 1.6527786015728975e-05,
+ "loss": 0.5205,
+ "step": 10841
+ },
+ {
+ "epoch": 29.542234332425068,
+ "grad_norm": 9.598885536193848,
+ "learning_rate": 1.652711745760918e-05,
+ "loss": 0.4417,
+ "step": 10842
+ },
+ {
+ "epoch": 29.544959128065393,
+ "grad_norm": 9.335498809814453,
+ "learning_rate": 1.6526448848656407e-05,
+ "loss": 0.5446,
+ "step": 10843
+ },
+ {
+ "epoch": 29.547683923705723,
+ "grad_norm": 7.628083229064941,
+ "learning_rate": 1.652578018887586e-05,
+ "loss": 0.4476,
+ "step": 10844
+ },
+ {
+ "epoch": 29.55040871934605,
+ "grad_norm": 7.617641448974609,
+ "learning_rate": 1.6525111478272748e-05,
+ "loss": 0.4086,
+ "step": 10845
+ },
+ {
+ "epoch": 29.553133514986374,
+ "grad_norm": 7.333584785461426,
+ "learning_rate": 1.6524442716852273e-05,
+ "loss": 0.5005,
+ "step": 10846
+ },
+ {
+ "epoch": 29.555858310626704,
+ "grad_norm": 7.800898551940918,
+ "learning_rate": 1.6523773904619653e-05,
+ "loss": 0.4606,
+ "step": 10847
+ },
+ {
+ "epoch": 29.55858310626703,
+ "grad_norm": 7.886172294616699,
+ "learning_rate": 1.652310504158009e-05,
+ "loss": 0.4534,
+ "step": 10848
+ },
+ {
+ "epoch": 29.561307901907355,
+ "grad_norm": 9.152216911315918,
+ "learning_rate": 1.6522436127738797e-05,
+ "loss": 0.4162,
+ "step": 10849
+ },
+ {
+ "epoch": 29.564032697547685,
+ "grad_norm": 24.142454147338867,
+ "learning_rate": 1.652176716310098e-05,
+ "loss": 0.5763,
+ "step": 10850
+ },
+ {
+ "epoch": 29.56675749318801,
+ "grad_norm": 7.811501979827881,
+ "learning_rate": 1.6521098147671847e-05,
+ "loss": 0.4875,
+ "step": 10851
+ },
+ {
+ "epoch": 29.569482288828336,
+ "grad_norm": 8.617351531982422,
+ "learning_rate": 1.6520429081456615e-05,
+ "loss": 0.4185,
+ "step": 10852
+ },
+ {
+ "epoch": 29.572207084468666,
+ "grad_norm": 7.524698734283447,
+ "learning_rate": 1.6519759964460488e-05,
+ "loss": 0.6508,
+ "step": 10853
+ },
+ {
+ "epoch": 29.57493188010899,
+ "grad_norm": 8.168391227722168,
+ "learning_rate": 1.6519090796688685e-05,
+ "loss": 0.4301,
+ "step": 10854
+ },
+ {
+ "epoch": 29.577656675749317,
+ "grad_norm": 8.772461891174316,
+ "learning_rate": 1.651842157814641e-05,
+ "loss": 0.3873,
+ "step": 10855
+ },
+ {
+ "epoch": 29.580381471389646,
+ "grad_norm": 7.3811211585998535,
+ "learning_rate": 1.6517752308838877e-05,
+ "loss": 0.4337,
+ "step": 10856
+ },
+ {
+ "epoch": 29.583106267029972,
+ "grad_norm": 6.60532283782959,
+ "learning_rate": 1.65170829887713e-05,
+ "loss": 0.4587,
+ "step": 10857
+ },
+ {
+ "epoch": 29.585831062670298,
+ "grad_norm": 7.635605335235596,
+ "learning_rate": 1.651641361794889e-05,
+ "loss": 0.7336,
+ "step": 10858
+ },
+ {
+ "epoch": 29.588555858310627,
+ "grad_norm": 9.370646476745605,
+ "learning_rate": 1.6515744196376863e-05,
+ "loss": 0.5171,
+ "step": 10859
+ },
+ {
+ "epoch": 29.591280653950953,
+ "grad_norm": 9.356303215026855,
+ "learning_rate": 1.6515074724060425e-05,
+ "loss": 0.5969,
+ "step": 10860
+ },
+ {
+ "epoch": 29.59400544959128,
+ "grad_norm": 13.548718452453613,
+ "learning_rate": 1.6514405201004797e-05,
+ "loss": 0.4778,
+ "step": 10861
+ },
+ {
+ "epoch": 29.59673024523161,
+ "grad_norm": 7.7641472816467285,
+ "learning_rate": 1.6513735627215192e-05,
+ "loss": 0.4249,
+ "step": 10862
+ },
+ {
+ "epoch": 29.599455040871934,
+ "grad_norm": 9.723471641540527,
+ "learning_rate": 1.651306600269682e-05,
+ "loss": 0.4331,
+ "step": 10863
+ },
+ {
+ "epoch": 29.60217983651226,
+ "grad_norm": 6.466434478759766,
+ "learning_rate": 1.65123963274549e-05,
+ "loss": 0.4282,
+ "step": 10864
+ },
+ {
+ "epoch": 29.60490463215259,
+ "grad_norm": 18.430665969848633,
+ "learning_rate": 1.6511726601494655e-05,
+ "loss": 0.6192,
+ "step": 10865
+ },
+ {
+ "epoch": 29.607629427792915,
+ "grad_norm": 6.94656229019165,
+ "learning_rate": 1.6511056824821285e-05,
+ "loss": 0.385,
+ "step": 10866
+ },
+ {
+ "epoch": 29.61035422343324,
+ "grad_norm": 5.463720798492432,
+ "learning_rate": 1.6510386997440017e-05,
+ "loss": 0.6242,
+ "step": 10867
+ },
+ {
+ "epoch": 29.61307901907357,
+ "grad_norm": 7.205257892608643,
+ "learning_rate": 1.6509717119356065e-05,
+ "loss": 0.5305,
+ "step": 10868
+ },
+ {
+ "epoch": 29.615803814713896,
+ "grad_norm": 6.175645351409912,
+ "learning_rate": 1.6509047190574643e-05,
+ "loss": 0.4505,
+ "step": 10869
+ },
+ {
+ "epoch": 29.618528610354222,
+ "grad_norm": 6.795779228210449,
+ "learning_rate": 1.650837721110097e-05,
+ "loss": 0.5634,
+ "step": 10870
+ },
+ {
+ "epoch": 29.62125340599455,
+ "grad_norm": 6.857511520385742,
+ "learning_rate": 1.6507707180940268e-05,
+ "loss": 0.4543,
+ "step": 10871
+ },
+ {
+ "epoch": 29.623978201634877,
+ "grad_norm": 7.351967811584473,
+ "learning_rate": 1.650703710009775e-05,
+ "loss": 0.3824,
+ "step": 10872
+ },
+ {
+ "epoch": 29.626702997275203,
+ "grad_norm": 7.04655647277832,
+ "learning_rate": 1.6506366968578637e-05,
+ "loss": 0.4796,
+ "step": 10873
+ },
+ {
+ "epoch": 29.629427792915532,
+ "grad_norm": 7.237663745880127,
+ "learning_rate": 1.650569678638815e-05,
+ "loss": 0.6383,
+ "step": 10874
+ },
+ {
+ "epoch": 29.632152588555858,
+ "grad_norm": 6.777371406555176,
+ "learning_rate": 1.65050265535315e-05,
+ "loss": 0.5815,
+ "step": 10875
+ },
+ {
+ "epoch": 29.634877384196184,
+ "grad_norm": 6.713928699493408,
+ "learning_rate": 1.650435627001392e-05,
+ "loss": 0.4886,
+ "step": 10876
+ },
+ {
+ "epoch": 29.637602179836513,
+ "grad_norm": 7.542415142059326,
+ "learning_rate": 1.650368593584062e-05,
+ "loss": 0.4447,
+ "step": 10877
+ },
+ {
+ "epoch": 29.64032697547684,
+ "grad_norm": 6.431827068328857,
+ "learning_rate": 1.650301555101682e-05,
+ "loss": 0.4555,
+ "step": 10878
+ },
+ {
+ "epoch": 29.643051771117165,
+ "grad_norm": 7.300482273101807,
+ "learning_rate": 1.6502345115547745e-05,
+ "loss": 0.411,
+ "step": 10879
+ },
+ {
+ "epoch": 29.645776566757494,
+ "grad_norm": 9.059066772460938,
+ "learning_rate": 1.6501674629438617e-05,
+ "loss": 0.4895,
+ "step": 10880
+ },
+ {
+ "epoch": 29.64850136239782,
+ "grad_norm": 7.237509250640869,
+ "learning_rate": 1.6501004092694655e-05,
+ "loss": 0.3969,
+ "step": 10881
+ },
+ {
+ "epoch": 29.651226158038146,
+ "grad_norm": 7.097210884094238,
+ "learning_rate": 1.6500333505321085e-05,
+ "loss": 0.4492,
+ "step": 10882
+ },
+ {
+ "epoch": 29.653950953678475,
+ "grad_norm": 8.74032211303711,
+ "learning_rate": 1.6499662867323127e-05,
+ "loss": 0.4481,
+ "step": 10883
+ },
+ {
+ "epoch": 29.6566757493188,
+ "grad_norm": 7.301566123962402,
+ "learning_rate": 1.6498992178706002e-05,
+ "loss": 0.3846,
+ "step": 10884
+ },
+ {
+ "epoch": 29.659400544959126,
+ "grad_norm": 7.869488716125488,
+ "learning_rate": 1.6498321439474935e-05,
+ "loss": 0.5212,
+ "step": 10885
+ },
+ {
+ "epoch": 29.662125340599456,
+ "grad_norm": 9.363385200500488,
+ "learning_rate": 1.649765064963515e-05,
+ "loss": 0.4977,
+ "step": 10886
+ },
+ {
+ "epoch": 29.66485013623978,
+ "grad_norm": 6.198626518249512,
+ "learning_rate": 1.649697980919187e-05,
+ "loss": 0.5959,
+ "step": 10887
+ },
+ {
+ "epoch": 29.667574931880107,
+ "grad_norm": 6.578914642333984,
+ "learning_rate": 1.6496308918150323e-05,
+ "loss": 0.4032,
+ "step": 10888
+ },
+ {
+ "epoch": 29.670299727520437,
+ "grad_norm": 9.510456085205078,
+ "learning_rate": 1.649563797651573e-05,
+ "loss": 0.418,
+ "step": 10889
+ },
+ {
+ "epoch": 29.673024523160763,
+ "grad_norm": 6.486546039581299,
+ "learning_rate": 1.6494966984293316e-05,
+ "loss": 0.3596,
+ "step": 10890
+ },
+ {
+ "epoch": 29.67574931880109,
+ "grad_norm": 6.955389499664307,
+ "learning_rate": 1.6494295941488307e-05,
+ "loss": 0.4252,
+ "step": 10891
+ },
+ {
+ "epoch": 29.678474114441418,
+ "grad_norm": 6.365244388580322,
+ "learning_rate": 1.6493624848105934e-05,
+ "loss": 0.4741,
+ "step": 10892
+ },
+ {
+ "epoch": 29.681198910081743,
+ "grad_norm": 7.88081169128418,
+ "learning_rate": 1.649295370415142e-05,
+ "loss": 0.5278,
+ "step": 10893
+ },
+ {
+ "epoch": 29.68392370572207,
+ "grad_norm": 7.345284461975098,
+ "learning_rate": 1.649228250962999e-05,
+ "loss": 0.4361,
+ "step": 10894
+ },
+ {
+ "epoch": 29.6866485013624,
+ "grad_norm": 6.725378513336182,
+ "learning_rate": 1.6491611264546868e-05,
+ "loss": 0.5792,
+ "step": 10895
+ },
+ {
+ "epoch": 29.689373297002724,
+ "grad_norm": 8.338081359863281,
+ "learning_rate": 1.6490939968907295e-05,
+ "loss": 0.4827,
+ "step": 10896
+ },
+ {
+ "epoch": 29.69209809264305,
+ "grad_norm": 6.808753967285156,
+ "learning_rate": 1.6490268622716484e-05,
+ "loss": 0.4923,
+ "step": 10897
+ },
+ {
+ "epoch": 29.69482288828338,
+ "grad_norm": 11.013527870178223,
+ "learning_rate": 1.6489597225979673e-05,
+ "loss": 0.298,
+ "step": 10898
+ },
+ {
+ "epoch": 29.697547683923705,
+ "grad_norm": 8.209692001342773,
+ "learning_rate": 1.6488925778702084e-05,
+ "loss": 0.4075,
+ "step": 10899
+ },
+ {
+ "epoch": 29.70027247956403,
+ "grad_norm": 5.375641345977783,
+ "learning_rate": 1.6488254280888956e-05,
+ "loss": 0.5535,
+ "step": 10900
+ },
+ {
+ "epoch": 29.70299727520436,
+ "grad_norm": 9.399170875549316,
+ "learning_rate": 1.6487582732545506e-05,
+ "loss": 0.5728,
+ "step": 10901
+ },
+ {
+ "epoch": 29.705722070844686,
+ "grad_norm": 13.955491065979004,
+ "learning_rate": 1.6486911133676974e-05,
+ "loss": 0.4485,
+ "step": 10902
+ },
+ {
+ "epoch": 29.708446866485012,
+ "grad_norm": 7.763715744018555,
+ "learning_rate": 1.6486239484288585e-05,
+ "loss": 0.592,
+ "step": 10903
+ },
+ {
+ "epoch": 29.71117166212534,
+ "grad_norm": 10.498160362243652,
+ "learning_rate": 1.6485567784385574e-05,
+ "loss": 0.4219,
+ "step": 10904
+ },
+ {
+ "epoch": 29.713896457765667,
+ "grad_norm": 6.306120872497559,
+ "learning_rate": 1.6484896033973168e-05,
+ "loss": 0.485,
+ "step": 10905
+ },
+ {
+ "epoch": 29.716621253405993,
+ "grad_norm": 8.809769630432129,
+ "learning_rate": 1.6484224233056602e-05,
+ "loss": 0.4487,
+ "step": 10906
+ },
+ {
+ "epoch": 29.719346049046322,
+ "grad_norm": 10.231396675109863,
+ "learning_rate": 1.6483552381641107e-05,
+ "loss": 0.5508,
+ "step": 10907
+ },
+ {
+ "epoch": 29.722070844686648,
+ "grad_norm": 8.767487525939941,
+ "learning_rate": 1.6482880479731912e-05,
+ "loss": 0.5564,
+ "step": 10908
+ },
+ {
+ "epoch": 29.724795640326974,
+ "grad_norm": 7.6702375411987305,
+ "learning_rate": 1.6482208527334257e-05,
+ "loss": 0.667,
+ "step": 10909
+ },
+ {
+ "epoch": 29.727520435967303,
+ "grad_norm": 9.525460243225098,
+ "learning_rate": 1.6481536524453365e-05,
+ "loss": 0.4465,
+ "step": 10910
+ },
+ {
+ "epoch": 29.73024523160763,
+ "grad_norm": 6.9797163009643555,
+ "learning_rate": 1.648086447109448e-05,
+ "loss": 0.3654,
+ "step": 10911
+ },
+ {
+ "epoch": 29.732970027247955,
+ "grad_norm": 7.111659049987793,
+ "learning_rate": 1.6480192367262827e-05,
+ "loss": 0.4361,
+ "step": 10912
+ },
+ {
+ "epoch": 29.735694822888284,
+ "grad_norm": 9.03895378112793,
+ "learning_rate": 1.6479520212963644e-05,
+ "loss": 0.4158,
+ "step": 10913
+ },
+ {
+ "epoch": 29.73841961852861,
+ "grad_norm": 7.492087364196777,
+ "learning_rate": 1.647884800820217e-05,
+ "loss": 0.3877,
+ "step": 10914
+ },
+ {
+ "epoch": 29.741144414168936,
+ "grad_norm": 7.278896331787109,
+ "learning_rate": 1.6478175752983632e-05,
+ "loss": 0.4546,
+ "step": 10915
+ },
+ {
+ "epoch": 29.743869209809265,
+ "grad_norm": 8.521524429321289,
+ "learning_rate": 1.6477503447313276e-05,
+ "loss": 0.43,
+ "step": 10916
+ },
+ {
+ "epoch": 29.74659400544959,
+ "grad_norm": 7.021545886993408,
+ "learning_rate": 1.6476831091196327e-05,
+ "loss": 0.3748,
+ "step": 10917
+ },
+ {
+ "epoch": 29.749318801089917,
+ "grad_norm": 7.985683917999268,
+ "learning_rate": 1.6476158684638027e-05,
+ "loss": 0.6056,
+ "step": 10918
+ },
+ {
+ "epoch": 29.752043596730246,
+ "grad_norm": 8.665266036987305,
+ "learning_rate": 1.647548622764361e-05,
+ "loss": 0.477,
+ "step": 10919
+ },
+ {
+ "epoch": 29.754768392370572,
+ "grad_norm": 8.756564140319824,
+ "learning_rate": 1.6474813720218318e-05,
+ "loss": 0.542,
+ "step": 10920
+ },
+ {
+ "epoch": 29.757493188010898,
+ "grad_norm": 7.334249019622803,
+ "learning_rate": 1.6474141162367384e-05,
+ "loss": 0.4863,
+ "step": 10921
+ },
+ {
+ "epoch": 29.760217983651227,
+ "grad_norm": 8.4699125289917,
+ "learning_rate": 1.6473468554096045e-05,
+ "loss": 0.601,
+ "step": 10922
+ },
+ {
+ "epoch": 29.762942779291553,
+ "grad_norm": 7.529186725616455,
+ "learning_rate": 1.6472795895409542e-05,
+ "loss": 0.3366,
+ "step": 10923
+ },
+ {
+ "epoch": 29.76566757493188,
+ "grad_norm": 8.458430290222168,
+ "learning_rate": 1.6472123186313114e-05,
+ "loss": 0.5209,
+ "step": 10924
+ },
+ {
+ "epoch": 29.768392370572208,
+ "grad_norm": 8.96320915222168,
+ "learning_rate": 1.6471450426811997e-05,
+ "loss": 0.5283,
+ "step": 10925
+ },
+ {
+ "epoch": 29.771117166212534,
+ "grad_norm": 11.148738861083984,
+ "learning_rate": 1.6470777616911435e-05,
+ "loss": 0.4584,
+ "step": 10926
+ },
+ {
+ "epoch": 29.77384196185286,
+ "grad_norm": 8.912113189697266,
+ "learning_rate": 1.6470104756616664e-05,
+ "loss": 0.5006,
+ "step": 10927
+ },
+ {
+ "epoch": 29.77656675749319,
+ "grad_norm": 7.305341720581055,
+ "learning_rate": 1.6469431845932923e-05,
+ "loss": 0.5061,
+ "step": 10928
+ },
+ {
+ "epoch": 29.779291553133515,
+ "grad_norm": 6.873284339904785,
+ "learning_rate": 1.646875888486546e-05,
+ "loss": 0.3441,
+ "step": 10929
+ },
+ {
+ "epoch": 29.78201634877384,
+ "grad_norm": 5.6703290939331055,
+ "learning_rate": 1.6468085873419502e-05,
+ "loss": 0.6736,
+ "step": 10930
+ },
+ {
+ "epoch": 29.78474114441417,
+ "grad_norm": 7.85083532333374,
+ "learning_rate": 1.646741281160031e-05,
+ "loss": 0.3551,
+ "step": 10931
+ },
+ {
+ "epoch": 29.787465940054496,
+ "grad_norm": 6.734079360961914,
+ "learning_rate": 1.646673969941311e-05,
+ "loss": 0.3798,
+ "step": 10932
+ },
+ {
+ "epoch": 29.79019073569482,
+ "grad_norm": 6.857694149017334,
+ "learning_rate": 1.646606653686315e-05,
+ "loss": 0.5082,
+ "step": 10933
+ },
+ {
+ "epoch": 29.79291553133515,
+ "grad_norm": 17.572439193725586,
+ "learning_rate": 1.6465393323955673e-05,
+ "loss": 0.4622,
+ "step": 10934
+ },
+ {
+ "epoch": 29.795640326975477,
+ "grad_norm": 6.712080955505371,
+ "learning_rate": 1.6464720060695918e-05,
+ "loss": 0.4265,
+ "step": 10935
+ },
+ {
+ "epoch": 29.798365122615802,
+ "grad_norm": 9.340763092041016,
+ "learning_rate": 1.6464046747089134e-05,
+ "loss": 0.5399,
+ "step": 10936
+ },
+ {
+ "epoch": 29.80108991825613,
+ "grad_norm": 7.187861442565918,
+ "learning_rate": 1.6463373383140563e-05,
+ "loss": 0.4803,
+ "step": 10937
+ },
+ {
+ "epoch": 29.803814713896458,
+ "grad_norm": 7.087644577026367,
+ "learning_rate": 1.6462699968855446e-05,
+ "loss": 0.5294,
+ "step": 10938
+ },
+ {
+ "epoch": 29.806539509536783,
+ "grad_norm": 8.618359565734863,
+ "learning_rate": 1.6462026504239026e-05,
+ "loss": 0.5131,
+ "step": 10939
+ },
+ {
+ "epoch": 29.809264305177113,
+ "grad_norm": 9.606124877929688,
+ "learning_rate": 1.6461352989296556e-05,
+ "loss": 0.4279,
+ "step": 10940
+ },
+ {
+ "epoch": 29.81198910081744,
+ "grad_norm": 8.291728019714355,
+ "learning_rate": 1.6460679424033278e-05,
+ "loss": 0.3738,
+ "step": 10941
+ },
+ {
+ "epoch": 29.814713896457764,
+ "grad_norm": 8.681512832641602,
+ "learning_rate": 1.6460005808454434e-05,
+ "loss": 0.4538,
+ "step": 10942
+ },
+ {
+ "epoch": 29.817438692098094,
+ "grad_norm": 7.411059379577637,
+ "learning_rate": 1.6459332142565275e-05,
+ "loss": 0.4568,
+ "step": 10943
+ },
+ {
+ "epoch": 29.82016348773842,
+ "grad_norm": 11.733348846435547,
+ "learning_rate": 1.6458658426371043e-05,
+ "loss": 0.351,
+ "step": 10944
+ },
+ {
+ "epoch": 29.822888283378745,
+ "grad_norm": 8.563687324523926,
+ "learning_rate": 1.645798465987699e-05,
+ "loss": 0.6837,
+ "step": 10945
+ },
+ {
+ "epoch": 29.825613079019075,
+ "grad_norm": 6.435044765472412,
+ "learning_rate": 1.6457310843088355e-05,
+ "loss": 0.2955,
+ "step": 10946
+ },
+ {
+ "epoch": 29.8283378746594,
+ "grad_norm": 11.304015159606934,
+ "learning_rate": 1.6456636976010396e-05,
+ "loss": 0.3521,
+ "step": 10947
+ },
+ {
+ "epoch": 29.831062670299726,
+ "grad_norm": 8.280211448669434,
+ "learning_rate": 1.6455963058648353e-05,
+ "loss": 0.6414,
+ "step": 10948
+ },
+ {
+ "epoch": 29.833787465940055,
+ "grad_norm": 6.6961259841918945,
+ "learning_rate": 1.6455289091007478e-05,
+ "loss": 0.3734,
+ "step": 10949
+ },
+ {
+ "epoch": 29.83651226158038,
+ "grad_norm": 7.7939372062683105,
+ "learning_rate": 1.645461507309302e-05,
+ "loss": 0.4768,
+ "step": 10950
+ },
+ {
+ "epoch": 29.839237057220707,
+ "grad_norm": 8.741804122924805,
+ "learning_rate": 1.6453941004910227e-05,
+ "loss": 0.4564,
+ "step": 10951
+ },
+ {
+ "epoch": 29.841961852861036,
+ "grad_norm": 7.31764554977417,
+ "learning_rate": 1.645326688646435e-05,
+ "loss": 0.576,
+ "step": 10952
+ },
+ {
+ "epoch": 29.844686648501362,
+ "grad_norm": 6.965038776397705,
+ "learning_rate": 1.645259271776064e-05,
+ "loss": 0.5383,
+ "step": 10953
+ },
+ {
+ "epoch": 29.847411444141688,
+ "grad_norm": 10.115130424499512,
+ "learning_rate": 1.6451918498804343e-05,
+ "loss": 0.5702,
+ "step": 10954
+ },
+ {
+ "epoch": 29.850136239782017,
+ "grad_norm": 7.532892227172852,
+ "learning_rate": 1.645124422960071e-05,
+ "loss": 0.4471,
+ "step": 10955
+ },
+ {
+ "epoch": 29.852861035422343,
+ "grad_norm": 7.694735050201416,
+ "learning_rate": 1.6450569910154998e-05,
+ "loss": 0.4386,
+ "step": 10956
+ },
+ {
+ "epoch": 29.85558583106267,
+ "grad_norm": 7.561770439147949,
+ "learning_rate": 1.6449895540472455e-05,
+ "loss": 0.5721,
+ "step": 10957
+ },
+ {
+ "epoch": 29.858310626703,
+ "grad_norm": 7.428245544433594,
+ "learning_rate": 1.6449221120558334e-05,
+ "loss": 0.7021,
+ "step": 10958
+ },
+ {
+ "epoch": 29.861035422343324,
+ "grad_norm": 8.777802467346191,
+ "learning_rate": 1.6448546650417883e-05,
+ "loss": 0.3962,
+ "step": 10959
+ },
+ {
+ "epoch": 29.86376021798365,
+ "grad_norm": 6.817665100097656,
+ "learning_rate": 1.644787213005636e-05,
+ "loss": 0.6262,
+ "step": 10960
+ },
+ {
+ "epoch": 29.86648501362398,
+ "grad_norm": 7.662132263183594,
+ "learning_rate": 1.6447197559479017e-05,
+ "loss": 0.5568,
+ "step": 10961
+ },
+ {
+ "epoch": 29.869209809264305,
+ "grad_norm": 7.989658832550049,
+ "learning_rate": 1.6446522938691107e-05,
+ "loss": 0.5452,
+ "step": 10962
+ },
+ {
+ "epoch": 29.87193460490463,
+ "grad_norm": 5.7323126792907715,
+ "learning_rate": 1.6445848267697884e-05,
+ "loss": 0.5826,
+ "step": 10963
+ },
+ {
+ "epoch": 29.87465940054496,
+ "grad_norm": 6.911271095275879,
+ "learning_rate": 1.6445173546504603e-05,
+ "loss": 0.6467,
+ "step": 10964
+ },
+ {
+ "epoch": 29.877384196185286,
+ "grad_norm": 6.319054126739502,
+ "learning_rate": 1.6444498775116512e-05,
+ "loss": 0.4939,
+ "step": 10965
+ },
+ {
+ "epoch": 29.88010899182561,
+ "grad_norm": 8.498305320739746,
+ "learning_rate": 1.6443823953538876e-05,
+ "loss": 0.4156,
+ "step": 10966
+ },
+ {
+ "epoch": 29.88283378746594,
+ "grad_norm": 8.051203727722168,
+ "learning_rate": 1.644314908177695e-05,
+ "loss": 0.5158,
+ "step": 10967
+ },
+ {
+ "epoch": 29.885558583106267,
+ "grad_norm": 7.078332901000977,
+ "learning_rate": 1.6442474159835984e-05,
+ "loss": 0.5493,
+ "step": 10968
+ },
+ {
+ "epoch": 29.888283378746593,
+ "grad_norm": 8.033302307128906,
+ "learning_rate": 1.6441799187721237e-05,
+ "loss": 0.5834,
+ "step": 10969
+ },
+ {
+ "epoch": 29.891008174386922,
+ "grad_norm": 7.197174549102783,
+ "learning_rate": 1.6441124165437962e-05,
+ "loss": 0.3835,
+ "step": 10970
+ },
+ {
+ "epoch": 29.893732970027248,
+ "grad_norm": 7.283804416656494,
+ "learning_rate": 1.6440449092991424e-05,
+ "loss": 0.4468,
+ "step": 10971
+ },
+ {
+ "epoch": 29.896457765667574,
+ "grad_norm": 7.508810043334961,
+ "learning_rate": 1.643977397038687e-05,
+ "loss": 0.561,
+ "step": 10972
+ },
+ {
+ "epoch": 29.899182561307903,
+ "grad_norm": 6.808213710784912,
+ "learning_rate": 1.6439098797629565e-05,
+ "loss": 0.4292,
+ "step": 10973
+ },
+ {
+ "epoch": 29.90190735694823,
+ "grad_norm": 7.95700216293335,
+ "learning_rate": 1.6438423574724768e-05,
+ "loss": 0.5316,
+ "step": 10974
+ },
+ {
+ "epoch": 29.904632152588555,
+ "grad_norm": 7.048412799835205,
+ "learning_rate": 1.6437748301677738e-05,
+ "loss": 0.5133,
+ "step": 10975
+ },
+ {
+ "epoch": 29.907356948228884,
+ "grad_norm": 9.064624786376953,
+ "learning_rate": 1.643707297849373e-05,
+ "loss": 0.5742,
+ "step": 10976
+ },
+ {
+ "epoch": 29.91008174386921,
+ "grad_norm": 6.609524250030518,
+ "learning_rate": 1.6436397605178e-05,
+ "loss": 0.4809,
+ "step": 10977
+ },
+ {
+ "epoch": 29.912806539509535,
+ "grad_norm": 6.805055618286133,
+ "learning_rate": 1.6435722181735817e-05,
+ "loss": 0.499,
+ "step": 10978
+ },
+ {
+ "epoch": 29.915531335149865,
+ "grad_norm": 7.3713250160217285,
+ "learning_rate": 1.6435046708172436e-05,
+ "loss": 0.42,
+ "step": 10979
+ },
+ {
+ "epoch": 29.91825613079019,
+ "grad_norm": 10.440509796142578,
+ "learning_rate": 1.6434371184493117e-05,
+ "loss": 0.4354,
+ "step": 10980
+ },
+ {
+ "epoch": 29.920980926430516,
+ "grad_norm": 8.879534721374512,
+ "learning_rate": 1.6433695610703123e-05,
+ "loss": 0.4551,
+ "step": 10981
+ },
+ {
+ "epoch": 29.923705722070846,
+ "grad_norm": 6.668054103851318,
+ "learning_rate": 1.6433019986807714e-05,
+ "loss": 0.4812,
+ "step": 10982
+ },
+ {
+ "epoch": 29.92643051771117,
+ "grad_norm": 9.760262489318848,
+ "learning_rate": 1.6432344312812153e-05,
+ "loss": 0.4534,
+ "step": 10983
+ },
+ {
+ "epoch": 29.929155313351497,
+ "grad_norm": 6.852321147918701,
+ "learning_rate": 1.64316685887217e-05,
+ "loss": 0.3206,
+ "step": 10984
+ },
+ {
+ "epoch": 29.931880108991827,
+ "grad_norm": 17.207426071166992,
+ "learning_rate": 1.6430992814541625e-05,
+ "loss": 0.6734,
+ "step": 10985
+ },
+ {
+ "epoch": 29.934604904632153,
+ "grad_norm": 8.152406692504883,
+ "learning_rate": 1.643031699027718e-05,
+ "loss": 0.5496,
+ "step": 10986
+ },
+ {
+ "epoch": 29.93732970027248,
+ "grad_norm": 7.128805160522461,
+ "learning_rate": 1.6429641115933635e-05,
+ "loss": 0.5237,
+ "step": 10987
+ },
+ {
+ "epoch": 29.940054495912808,
+ "grad_norm": 6.745392322540283,
+ "learning_rate": 1.642896519151625e-05,
+ "loss": 0.3401,
+ "step": 10988
+ },
+ {
+ "epoch": 29.942779291553133,
+ "grad_norm": 6.946228981018066,
+ "learning_rate": 1.642828921703029e-05,
+ "loss": 0.3607,
+ "step": 10989
+ },
+ {
+ "epoch": 29.94550408719346,
+ "grad_norm": 10.81572437286377,
+ "learning_rate": 1.6427613192481025e-05,
+ "loss": 0.3947,
+ "step": 10990
+ },
+ {
+ "epoch": 29.94822888283379,
+ "grad_norm": 7.242533206939697,
+ "learning_rate": 1.6426937117873713e-05,
+ "loss": 0.3457,
+ "step": 10991
+ },
+ {
+ "epoch": 29.950953678474114,
+ "grad_norm": 6.762942314147949,
+ "learning_rate": 1.642626099321362e-05,
+ "loss": 0.358,
+ "step": 10992
+ },
+ {
+ "epoch": 29.95367847411444,
+ "grad_norm": 7.605253219604492,
+ "learning_rate": 1.6425584818506016e-05,
+ "loss": 0.4045,
+ "step": 10993
+ },
+ {
+ "epoch": 29.95640326975477,
+ "grad_norm": 8.510704040527344,
+ "learning_rate": 1.6424908593756162e-05,
+ "loss": 0.4006,
+ "step": 10994
+ },
+ {
+ "epoch": 29.959128065395095,
+ "grad_norm": 8.417881965637207,
+ "learning_rate": 1.6424232318969327e-05,
+ "loss": 0.4297,
+ "step": 10995
+ },
+ {
+ "epoch": 29.96185286103542,
+ "grad_norm": 6.6445536613464355,
+ "learning_rate": 1.6423555994150776e-05,
+ "loss": 0.4922,
+ "step": 10996
+ },
+ {
+ "epoch": 29.96457765667575,
+ "grad_norm": 13.118285179138184,
+ "learning_rate": 1.6422879619305782e-05,
+ "loss": 0.5127,
+ "step": 10997
+ },
+ {
+ "epoch": 29.967302452316076,
+ "grad_norm": 8.387615203857422,
+ "learning_rate": 1.6422203194439606e-05,
+ "loss": 0.3346,
+ "step": 10998
+ },
+ {
+ "epoch": 29.970027247956402,
+ "grad_norm": 8.093526840209961,
+ "learning_rate": 1.6421526719557514e-05,
+ "loss": 0.5449,
+ "step": 10999
+ },
+ {
+ "epoch": 29.97275204359673,
+ "grad_norm": 6.561741828918457,
+ "learning_rate": 1.6420850194664787e-05,
+ "loss": 0.4216,
+ "step": 11000
+ },
+ {
+ "epoch": 29.975476839237057,
+ "grad_norm": 6.173132419586182,
+ "learning_rate": 1.642017361976668e-05,
+ "loss": 0.4457,
+ "step": 11001
+ },
+ {
+ "epoch": 29.978201634877383,
+ "grad_norm": 7.232378005981445,
+ "learning_rate": 1.6419496994868467e-05,
+ "loss": 0.4089,
+ "step": 11002
+ },
+ {
+ "epoch": 29.980926430517712,
+ "grad_norm": 7.017350673675537,
+ "learning_rate": 1.6418820319975418e-05,
+ "loss": 0.4875,
+ "step": 11003
+ },
+ {
+ "epoch": 29.983651226158038,
+ "grad_norm": 7.370197296142578,
+ "learning_rate": 1.6418143595092805e-05,
+ "loss": 0.3418,
+ "step": 11004
+ },
+ {
+ "epoch": 29.986376021798364,
+ "grad_norm": 6.696606636047363,
+ "learning_rate": 1.6417466820225896e-05,
+ "loss": 0.5358,
+ "step": 11005
+ },
+ {
+ "epoch": 29.989100817438693,
+ "grad_norm": 11.178949356079102,
+ "learning_rate": 1.641678999537996e-05,
+ "loss": 0.4545,
+ "step": 11006
+ },
+ {
+ "epoch": 29.99182561307902,
+ "grad_norm": 8.079872131347656,
+ "learning_rate": 1.6416113120560275e-05,
+ "loss": 0.3928,
+ "step": 11007
+ },
+ {
+ "epoch": 29.994550408719345,
+ "grad_norm": 20.830598831176758,
+ "learning_rate": 1.64154361957721e-05,
+ "loss": 0.446,
+ "step": 11008
+ },
+ {
+ "epoch": 29.997275204359674,
+ "grad_norm": 8.717055320739746,
+ "learning_rate": 1.641475922102072e-05,
+ "loss": 0.4711,
+ "step": 11009
+ },
+ {
+ "epoch": 30.0,
+ "grad_norm": 7.055100917816162,
+ "learning_rate": 1.6414082196311402e-05,
+ "loss": 0.5015,
+ "step": 11010
+ },
+ {
+ "epoch": 30.002724795640326,
+ "grad_norm": 6.0088300704956055,
+ "learning_rate": 1.6413405121649416e-05,
+ "loss": 0.3615,
+ "step": 11011
+ },
+ {
+ "epoch": 30.005449591280655,
+ "grad_norm": 5.820860385894775,
+ "learning_rate": 1.6412727997040036e-05,
+ "loss": 0.3237,
+ "step": 11012
+ },
+ {
+ "epoch": 30.00817438692098,
+ "grad_norm": 6.502038955688477,
+ "learning_rate": 1.641205082248854e-05,
+ "loss": 0.5334,
+ "step": 11013
+ },
+ {
+ "epoch": 30.010899182561307,
+ "grad_norm": 7.3135151863098145,
+ "learning_rate": 1.64113735980002e-05,
+ "loss": 0.485,
+ "step": 11014
+ },
+ {
+ "epoch": 30.013623978201636,
+ "grad_norm": 6.81199836730957,
+ "learning_rate": 1.641069632358028e-05,
+ "loss": 0.438,
+ "step": 11015
+ },
+ {
+ "epoch": 30.016348773841962,
+ "grad_norm": 6.724306106567383,
+ "learning_rate": 1.641001899923407e-05,
+ "loss": 0.2847,
+ "step": 11016
+ },
+ {
+ "epoch": 30.019073569482288,
+ "grad_norm": 12.282051086425781,
+ "learning_rate": 1.640934162496684e-05,
+ "loss": 0.4241,
+ "step": 11017
+ },
+ {
+ "epoch": 30.021798365122617,
+ "grad_norm": 7.175605773925781,
+ "learning_rate": 1.640866420078386e-05,
+ "loss": 0.3946,
+ "step": 11018
+ },
+ {
+ "epoch": 30.024523160762943,
+ "grad_norm": 6.926136016845703,
+ "learning_rate": 1.640798672669041e-05,
+ "loss": 0.3102,
+ "step": 11019
+ },
+ {
+ "epoch": 30.02724795640327,
+ "grad_norm": 7.437623500823975,
+ "learning_rate": 1.6407309202691765e-05,
+ "loss": 0.463,
+ "step": 11020
+ },
+ {
+ "epoch": 30.029972752043598,
+ "grad_norm": 6.733150959014893,
+ "learning_rate": 1.6406631628793205e-05,
+ "loss": 0.3729,
+ "step": 11021
+ },
+ {
+ "epoch": 30.032697547683924,
+ "grad_norm": 5.76999044418335,
+ "learning_rate": 1.6405954005e-05,
+ "loss": 0.3857,
+ "step": 11022
+ },
+ {
+ "epoch": 30.03542234332425,
+ "grad_norm": 7.99325704574585,
+ "learning_rate": 1.6405276331317437e-05,
+ "loss": 0.452,
+ "step": 11023
+ },
+ {
+ "epoch": 30.03814713896458,
+ "grad_norm": 6.218040943145752,
+ "learning_rate": 1.6404598607750785e-05,
+ "loss": 0.3005,
+ "step": 11024
+ },
+ {
+ "epoch": 30.040871934604905,
+ "grad_norm": 6.658420085906982,
+ "learning_rate": 1.6403920834305324e-05,
+ "loss": 0.3451,
+ "step": 11025
+ },
+ {
+ "epoch": 30.04359673024523,
+ "grad_norm": 7.311766624450684,
+ "learning_rate": 1.6403243010986332e-05,
+ "loss": 0.3774,
+ "step": 11026
+ },
+ {
+ "epoch": 30.04632152588556,
+ "grad_norm": 8.474394798278809,
+ "learning_rate": 1.6402565137799096e-05,
+ "loss": 0.3843,
+ "step": 11027
+ },
+ {
+ "epoch": 30.049046321525886,
+ "grad_norm": 7.289997577667236,
+ "learning_rate": 1.6401887214748887e-05,
+ "loss": 0.4448,
+ "step": 11028
+ },
+ {
+ "epoch": 30.05177111716621,
+ "grad_norm": 6.859222412109375,
+ "learning_rate": 1.6401209241840984e-05,
+ "loss": 0.3199,
+ "step": 11029
+ },
+ {
+ "epoch": 30.05449591280654,
+ "grad_norm": 6.75163459777832,
+ "learning_rate": 1.640053121908067e-05,
+ "loss": 0.438,
+ "step": 11030
+ },
+ {
+ "epoch": 30.057220708446867,
+ "grad_norm": 6.317370891571045,
+ "learning_rate": 1.6399853146473223e-05,
+ "loss": 0.2949,
+ "step": 11031
+ },
+ {
+ "epoch": 30.059945504087192,
+ "grad_norm": 8.458065032958984,
+ "learning_rate": 1.6399175024023927e-05,
+ "loss": 0.4216,
+ "step": 11032
+ },
+ {
+ "epoch": 30.06267029972752,
+ "grad_norm": 6.969457626342773,
+ "learning_rate": 1.6398496851738064e-05,
+ "loss": 0.3399,
+ "step": 11033
+ },
+ {
+ "epoch": 30.065395095367847,
+ "grad_norm": 6.142038345336914,
+ "learning_rate": 1.639781862962091e-05,
+ "loss": 0.2935,
+ "step": 11034
+ },
+ {
+ "epoch": 30.068119891008173,
+ "grad_norm": 7.265402317047119,
+ "learning_rate": 1.6397140357677753e-05,
+ "loss": 0.5065,
+ "step": 11035
+ },
+ {
+ "epoch": 30.070844686648503,
+ "grad_norm": 8.197349548339844,
+ "learning_rate": 1.6396462035913872e-05,
+ "loss": 0.456,
+ "step": 11036
+ },
+ {
+ "epoch": 30.07356948228883,
+ "grad_norm": 7.076777458190918,
+ "learning_rate": 1.639578366433455e-05,
+ "loss": 0.5262,
+ "step": 11037
+ },
+ {
+ "epoch": 30.076294277929154,
+ "grad_norm": 5.244971752166748,
+ "learning_rate": 1.639510524294507e-05,
+ "loss": 0.3103,
+ "step": 11038
+ },
+ {
+ "epoch": 30.079019073569484,
+ "grad_norm": 6.139191150665283,
+ "learning_rate": 1.639442677175072e-05,
+ "loss": 0.3783,
+ "step": 11039
+ },
+ {
+ "epoch": 30.08174386920981,
+ "grad_norm": 6.427220821380615,
+ "learning_rate": 1.639374825075678e-05,
+ "loss": 0.5044,
+ "step": 11040
+ },
+ {
+ "epoch": 30.084468664850135,
+ "grad_norm": 8.533020973205566,
+ "learning_rate": 1.639306967996853e-05,
+ "loss": 0.5481,
+ "step": 11041
+ },
+ {
+ "epoch": 30.087193460490465,
+ "grad_norm": 6.449970722198486,
+ "learning_rate": 1.6392391059391258e-05,
+ "loss": 0.4382,
+ "step": 11042
+ },
+ {
+ "epoch": 30.08991825613079,
+ "grad_norm": 10.026012420654297,
+ "learning_rate": 1.6391712389030253e-05,
+ "loss": 0.4258,
+ "step": 11043
+ },
+ {
+ "epoch": 30.092643051771116,
+ "grad_norm": 6.1092610359191895,
+ "learning_rate": 1.63910336688908e-05,
+ "loss": 0.3223,
+ "step": 11044
+ },
+ {
+ "epoch": 30.095367847411445,
+ "grad_norm": 9.438382148742676,
+ "learning_rate": 1.639035489897818e-05,
+ "loss": 0.4528,
+ "step": 11045
+ },
+ {
+ "epoch": 30.09809264305177,
+ "grad_norm": 6.647580146789551,
+ "learning_rate": 1.6389676079297684e-05,
+ "loss": 0.3857,
+ "step": 11046
+ },
+ {
+ "epoch": 30.100817438692097,
+ "grad_norm": 5.792067050933838,
+ "learning_rate": 1.6388997209854595e-05,
+ "loss": 0.655,
+ "step": 11047
+ },
+ {
+ "epoch": 30.103542234332426,
+ "grad_norm": 6.984425067901611,
+ "learning_rate": 1.63883182906542e-05,
+ "loss": 0.396,
+ "step": 11048
+ },
+ {
+ "epoch": 30.106267029972752,
+ "grad_norm": 7.124753475189209,
+ "learning_rate": 1.6387639321701787e-05,
+ "loss": 0.4637,
+ "step": 11049
+ },
+ {
+ "epoch": 30.108991825613078,
+ "grad_norm": 9.646773338317871,
+ "learning_rate": 1.6386960303002647e-05,
+ "loss": 0.4193,
+ "step": 11050
+ },
+ {
+ "epoch": 30.111716621253407,
+ "grad_norm": 6.347529888153076,
+ "learning_rate": 1.6386281234562065e-05,
+ "loss": 0.3469,
+ "step": 11051
+ },
+ {
+ "epoch": 30.114441416893733,
+ "grad_norm": 6.188181400299072,
+ "learning_rate": 1.638560211638533e-05,
+ "loss": 0.3493,
+ "step": 11052
+ },
+ {
+ "epoch": 30.11716621253406,
+ "grad_norm": 5.9739251136779785,
+ "learning_rate": 1.638492294847773e-05,
+ "loss": 0.4186,
+ "step": 11053
+ },
+ {
+ "epoch": 30.11989100817439,
+ "grad_norm": 8.596823692321777,
+ "learning_rate": 1.6384243730844556e-05,
+ "loss": 0.5058,
+ "step": 11054
+ },
+ {
+ "epoch": 30.122615803814714,
+ "grad_norm": 7.194712162017822,
+ "learning_rate": 1.63835644634911e-05,
+ "loss": 0.3762,
+ "step": 11055
+ },
+ {
+ "epoch": 30.12534059945504,
+ "grad_norm": 8.324389457702637,
+ "learning_rate": 1.6382885146422646e-05,
+ "loss": 0.4172,
+ "step": 11056
+ },
+ {
+ "epoch": 30.12806539509537,
+ "grad_norm": 6.283515930175781,
+ "learning_rate": 1.6382205779644487e-05,
+ "loss": 0.4075,
+ "step": 11057
+ },
+ {
+ "epoch": 30.130790190735695,
+ "grad_norm": 7.6013312339782715,
+ "learning_rate": 1.638152636316192e-05,
+ "loss": 0.4424,
+ "step": 11058
+ },
+ {
+ "epoch": 30.13351498637602,
+ "grad_norm": 6.367516994476318,
+ "learning_rate": 1.638084689698023e-05,
+ "loss": 0.523,
+ "step": 11059
+ },
+ {
+ "epoch": 30.13623978201635,
+ "grad_norm": 7.755098342895508,
+ "learning_rate": 1.6380167381104706e-05,
+ "loss": 0.4693,
+ "step": 11060
+ },
+ {
+ "epoch": 30.138964577656676,
+ "grad_norm": 7.197167873382568,
+ "learning_rate": 1.6379487815540648e-05,
+ "loss": 0.3907,
+ "step": 11061
+ },
+ {
+ "epoch": 30.141689373297,
+ "grad_norm": 6.419443130493164,
+ "learning_rate": 1.6378808200293343e-05,
+ "loss": 0.5005,
+ "step": 11062
+ },
+ {
+ "epoch": 30.14441416893733,
+ "grad_norm": 6.293830871582031,
+ "learning_rate": 1.6378128535368084e-05,
+ "loss": 0.3582,
+ "step": 11063
+ },
+ {
+ "epoch": 30.147138964577657,
+ "grad_norm": 6.32768440246582,
+ "learning_rate": 1.6377448820770164e-05,
+ "loss": 0.3264,
+ "step": 11064
+ },
+ {
+ "epoch": 30.149863760217983,
+ "grad_norm": 7.156543254852295,
+ "learning_rate": 1.637676905650488e-05,
+ "loss": 0.3628,
+ "step": 11065
+ },
+ {
+ "epoch": 30.152588555858312,
+ "grad_norm": 6.288056373596191,
+ "learning_rate": 1.637608924257752e-05,
+ "loss": 0.5111,
+ "step": 11066
+ },
+ {
+ "epoch": 30.155313351498638,
+ "grad_norm": 6.886847496032715,
+ "learning_rate": 1.6375409378993387e-05,
+ "loss": 0.3865,
+ "step": 11067
+ },
+ {
+ "epoch": 30.158038147138964,
+ "grad_norm": 7.042550086975098,
+ "learning_rate": 1.637472946575777e-05,
+ "loss": 0.6097,
+ "step": 11068
+ },
+ {
+ "epoch": 30.160762942779293,
+ "grad_norm": 6.211397171020508,
+ "learning_rate": 1.6374049502875963e-05,
+ "loss": 0.493,
+ "step": 11069
+ },
+ {
+ "epoch": 30.16348773841962,
+ "grad_norm": 6.925831317901611,
+ "learning_rate": 1.6373369490353265e-05,
+ "loss": 0.564,
+ "step": 11070
+ },
+ {
+ "epoch": 30.166212534059945,
+ "grad_norm": 7.403109073638916,
+ "learning_rate": 1.637268942819497e-05,
+ "loss": 0.4129,
+ "step": 11071
+ },
+ {
+ "epoch": 30.168937329700274,
+ "grad_norm": 5.961977481842041,
+ "learning_rate": 1.6372009316406376e-05,
+ "loss": 0.4259,
+ "step": 11072
+ },
+ {
+ "epoch": 30.1716621253406,
+ "grad_norm": 5.775633335113525,
+ "learning_rate": 1.6371329154992775e-05,
+ "loss": 0.5584,
+ "step": 11073
+ },
+ {
+ "epoch": 30.174386920980925,
+ "grad_norm": 6.836814880371094,
+ "learning_rate": 1.6370648943959473e-05,
+ "loss": 0.3898,
+ "step": 11074
+ },
+ {
+ "epoch": 30.177111716621255,
+ "grad_norm": 7.935107707977295,
+ "learning_rate": 1.6369968683311758e-05,
+ "loss": 0.5857,
+ "step": 11075
+ },
+ {
+ "epoch": 30.17983651226158,
+ "grad_norm": 5.413071155548096,
+ "learning_rate": 1.6369288373054936e-05,
+ "loss": 0.6349,
+ "step": 11076
+ },
+ {
+ "epoch": 30.182561307901906,
+ "grad_norm": 5.701023101806641,
+ "learning_rate": 1.6368608013194296e-05,
+ "loss": 0.5304,
+ "step": 11077
+ },
+ {
+ "epoch": 30.185286103542236,
+ "grad_norm": 6.271266460418701,
+ "learning_rate": 1.6367927603735144e-05,
+ "loss": 0.4534,
+ "step": 11078
+ },
+ {
+ "epoch": 30.18801089918256,
+ "grad_norm": 5.906961441040039,
+ "learning_rate": 1.636724714468278e-05,
+ "loss": 0.3754,
+ "step": 11079
+ },
+ {
+ "epoch": 30.190735694822887,
+ "grad_norm": 6.097695827484131,
+ "learning_rate": 1.6366566636042495e-05,
+ "loss": 0.463,
+ "step": 11080
+ },
+ {
+ "epoch": 30.193460490463217,
+ "grad_norm": 5.9541335105896,
+ "learning_rate": 1.6365886077819597e-05,
+ "loss": 0.5026,
+ "step": 11081
+ },
+ {
+ "epoch": 30.196185286103542,
+ "grad_norm": 7.629851341247559,
+ "learning_rate": 1.6365205470019383e-05,
+ "loss": 0.5601,
+ "step": 11082
+ },
+ {
+ "epoch": 30.19891008174387,
+ "grad_norm": 6.487632751464844,
+ "learning_rate": 1.6364524812647155e-05,
+ "loss": 0.4403,
+ "step": 11083
+ },
+ {
+ "epoch": 30.201634877384198,
+ "grad_norm": 8.499356269836426,
+ "learning_rate": 1.636384410570821e-05,
+ "loss": 0.5285,
+ "step": 11084
+ },
+ {
+ "epoch": 30.204359673024523,
+ "grad_norm": 12.487041473388672,
+ "learning_rate": 1.636316334920785e-05,
+ "loss": 0.4891,
+ "step": 11085
+ },
+ {
+ "epoch": 30.20708446866485,
+ "grad_norm": 6.921417713165283,
+ "learning_rate": 1.6362482543151382e-05,
+ "loss": 0.4167,
+ "step": 11086
+ },
+ {
+ "epoch": 30.20980926430518,
+ "grad_norm": 7.392184257507324,
+ "learning_rate": 1.6361801687544103e-05,
+ "loss": 0.4371,
+ "step": 11087
+ },
+ {
+ "epoch": 30.212534059945504,
+ "grad_norm": 8.208747863769531,
+ "learning_rate": 1.636112078239132e-05,
+ "loss": 0.3515,
+ "step": 11088
+ },
+ {
+ "epoch": 30.21525885558583,
+ "grad_norm": 6.039959907531738,
+ "learning_rate": 1.636043982769833e-05,
+ "loss": 0.5775,
+ "step": 11089
+ },
+ {
+ "epoch": 30.21798365122616,
+ "grad_norm": 5.5182600021362305,
+ "learning_rate": 1.635975882347044e-05,
+ "loss": 0.4808,
+ "step": 11090
+ },
+ {
+ "epoch": 30.220708446866485,
+ "grad_norm": 8.186211585998535,
+ "learning_rate": 1.6359077769712955e-05,
+ "loss": 0.3456,
+ "step": 11091
+ },
+ {
+ "epoch": 30.22343324250681,
+ "grad_norm": 6.7575459480285645,
+ "learning_rate": 1.6358396666431176e-05,
+ "loss": 0.4275,
+ "step": 11092
+ },
+ {
+ "epoch": 30.22615803814714,
+ "grad_norm": 6.863185405731201,
+ "learning_rate": 1.6357715513630407e-05,
+ "loss": 0.3653,
+ "step": 11093
+ },
+ {
+ "epoch": 30.228882833787466,
+ "grad_norm": 7.599756717681885,
+ "learning_rate": 1.6357034311315954e-05,
+ "loss": 0.3335,
+ "step": 11094
+ },
+ {
+ "epoch": 30.231607629427792,
+ "grad_norm": 7.023427486419678,
+ "learning_rate": 1.635635305949312e-05,
+ "loss": 0.3951,
+ "step": 11095
+ },
+ {
+ "epoch": 30.23433242506812,
+ "grad_norm": 5.927885055541992,
+ "learning_rate": 1.6355671758167218e-05,
+ "loss": 0.3515,
+ "step": 11096
+ },
+ {
+ "epoch": 30.237057220708447,
+ "grad_norm": 6.024624347686768,
+ "learning_rate": 1.635499040734355e-05,
+ "loss": 0.3495,
+ "step": 11097
+ },
+ {
+ "epoch": 30.239782016348773,
+ "grad_norm": 6.806307315826416,
+ "learning_rate": 1.6354309007027417e-05,
+ "loss": 0.413,
+ "step": 11098
+ },
+ {
+ "epoch": 30.242506811989102,
+ "grad_norm": 6.517013072967529,
+ "learning_rate": 1.635362755722413e-05,
+ "loss": 0.4623,
+ "step": 11099
+ },
+ {
+ "epoch": 30.245231607629428,
+ "grad_norm": 6.914282321929932,
+ "learning_rate": 1.6352946057938998e-05,
+ "loss": 0.3395,
+ "step": 11100
+ },
+ {
+ "epoch": 30.247956403269754,
+ "grad_norm": 7.303252220153809,
+ "learning_rate": 1.635226450917733e-05,
+ "loss": 0.3323,
+ "step": 11101
+ },
+ {
+ "epoch": 30.250681198910083,
+ "grad_norm": 6.682431697845459,
+ "learning_rate": 1.635158291094442e-05,
+ "loss": 0.4211,
+ "step": 11102
+ },
+ {
+ "epoch": 30.25340599455041,
+ "grad_norm": 5.761322021484375,
+ "learning_rate": 1.6350901263245594e-05,
+ "loss": 0.3323,
+ "step": 11103
+ },
+ {
+ "epoch": 30.256130790190735,
+ "grad_norm": 6.29879093170166,
+ "learning_rate": 1.6350219566086156e-05,
+ "loss": 0.4701,
+ "step": 11104
+ },
+ {
+ "epoch": 30.258855585831064,
+ "grad_norm": 7.568106174468994,
+ "learning_rate": 1.6349537819471408e-05,
+ "loss": 0.4886,
+ "step": 11105
+ },
+ {
+ "epoch": 30.26158038147139,
+ "grad_norm": 6.222177028656006,
+ "learning_rate": 1.6348856023406666e-05,
+ "loss": 0.4187,
+ "step": 11106
+ },
+ {
+ "epoch": 30.264305177111716,
+ "grad_norm": 7.444094657897949,
+ "learning_rate": 1.6348174177897237e-05,
+ "loss": 0.4895,
+ "step": 11107
+ },
+ {
+ "epoch": 30.267029972752045,
+ "grad_norm": 7.142608165740967,
+ "learning_rate": 1.634749228294843e-05,
+ "loss": 0.5111,
+ "step": 11108
+ },
+ {
+ "epoch": 30.26975476839237,
+ "grad_norm": 9.366308212280273,
+ "learning_rate": 1.634681033856556e-05,
+ "loss": 0.4298,
+ "step": 11109
+ },
+ {
+ "epoch": 30.272479564032697,
+ "grad_norm": 6.9632720947265625,
+ "learning_rate": 1.6346128344753932e-05,
+ "loss": 0.4662,
+ "step": 11110
+ },
+ {
+ "epoch": 30.275204359673026,
+ "grad_norm": 6.712884902954102,
+ "learning_rate": 1.6345446301518864e-05,
+ "loss": 0.3194,
+ "step": 11111
+ },
+ {
+ "epoch": 30.277929155313352,
+ "grad_norm": 7.170973777770996,
+ "learning_rate": 1.634476420886566e-05,
+ "loss": 0.4743,
+ "step": 11112
+ },
+ {
+ "epoch": 30.280653950953678,
+ "grad_norm": 6.807126045227051,
+ "learning_rate": 1.634408206679964e-05,
+ "loss": 0.3461,
+ "step": 11113
+ },
+ {
+ "epoch": 30.283378746594007,
+ "grad_norm": 6.459092140197754,
+ "learning_rate": 1.6343399875326115e-05,
+ "loss": 0.4248,
+ "step": 11114
+ },
+ {
+ "epoch": 30.286103542234333,
+ "grad_norm": 6.9402289390563965,
+ "learning_rate": 1.6342717634450393e-05,
+ "loss": 0.4156,
+ "step": 11115
+ },
+ {
+ "epoch": 30.28882833787466,
+ "grad_norm": 7.605564594268799,
+ "learning_rate": 1.634203534417779e-05,
+ "loss": 0.5897,
+ "step": 11116
+ },
+ {
+ "epoch": 30.291553133514988,
+ "grad_norm": 8.335100173950195,
+ "learning_rate": 1.6341353004513622e-05,
+ "loss": 0.5774,
+ "step": 11117
+ },
+ {
+ "epoch": 30.294277929155314,
+ "grad_norm": 7.1958112716674805,
+ "learning_rate": 1.63406706154632e-05,
+ "loss": 0.5863,
+ "step": 11118
+ },
+ {
+ "epoch": 30.29700272479564,
+ "grad_norm": 6.38262939453125,
+ "learning_rate": 1.633998817703184e-05,
+ "loss": 0.392,
+ "step": 11119
+ },
+ {
+ "epoch": 30.29972752043597,
+ "grad_norm": 6.995018005371094,
+ "learning_rate": 1.6339305689224853e-05,
+ "loss": 0.4524,
+ "step": 11120
+ },
+ {
+ "epoch": 30.302452316076295,
+ "grad_norm": 6.139112949371338,
+ "learning_rate": 1.633862315204756e-05,
+ "loss": 0.4032,
+ "step": 11121
+ },
+ {
+ "epoch": 30.30517711171662,
+ "grad_norm": 7.4238362312316895,
+ "learning_rate": 1.6337940565505275e-05,
+ "loss": 0.4225,
+ "step": 11122
+ },
+ {
+ "epoch": 30.30790190735695,
+ "grad_norm": 6.557679176330566,
+ "learning_rate": 1.633725792960331e-05,
+ "loss": 0.4968,
+ "step": 11123
+ },
+ {
+ "epoch": 30.310626702997276,
+ "grad_norm": 7.154829978942871,
+ "learning_rate": 1.6336575244346983e-05,
+ "loss": 0.3633,
+ "step": 11124
+ },
+ {
+ "epoch": 30.3133514986376,
+ "grad_norm": 7.474669933319092,
+ "learning_rate": 1.6335892509741618e-05,
+ "loss": 0.4091,
+ "step": 11125
+ },
+ {
+ "epoch": 30.31607629427793,
+ "grad_norm": 9.34608268737793,
+ "learning_rate": 1.633520972579252e-05,
+ "loss": 0.4148,
+ "step": 11126
+ },
+ {
+ "epoch": 30.318801089918257,
+ "grad_norm": 6.975616931915283,
+ "learning_rate": 1.6334526892505015e-05,
+ "loss": 0.3524,
+ "step": 11127
+ },
+ {
+ "epoch": 30.321525885558582,
+ "grad_norm": 6.626901149749756,
+ "learning_rate": 1.633384400988442e-05,
+ "loss": 0.649,
+ "step": 11128
+ },
+ {
+ "epoch": 30.32425068119891,
+ "grad_norm": 9.110139846801758,
+ "learning_rate": 1.633316107793605e-05,
+ "loss": 0.4517,
+ "step": 11129
+ },
+ {
+ "epoch": 30.326975476839237,
+ "grad_norm": 7.414907932281494,
+ "learning_rate": 1.6332478096665222e-05,
+ "loss": 0.4903,
+ "step": 11130
+ },
+ {
+ "epoch": 30.329700272479563,
+ "grad_norm": 6.143207550048828,
+ "learning_rate": 1.6331795066077262e-05,
+ "loss": 0.2961,
+ "step": 11131
+ },
+ {
+ "epoch": 30.332425068119893,
+ "grad_norm": 7.663824081420898,
+ "learning_rate": 1.633111198617749e-05,
+ "loss": 0.3638,
+ "step": 11132
+ },
+ {
+ "epoch": 30.33514986376022,
+ "grad_norm": 6.809144020080566,
+ "learning_rate": 1.6330428856971217e-05,
+ "loss": 0.3295,
+ "step": 11133
+ },
+ {
+ "epoch": 30.337874659400544,
+ "grad_norm": 6.921654224395752,
+ "learning_rate": 1.6329745678463765e-05,
+ "loss": 0.4185,
+ "step": 11134
+ },
+ {
+ "epoch": 30.340599455040874,
+ "grad_norm": 6.478837013244629,
+ "learning_rate": 1.6329062450660463e-05,
+ "loss": 0.4489,
+ "step": 11135
+ },
+ {
+ "epoch": 30.3433242506812,
+ "grad_norm": 12.89828109741211,
+ "learning_rate": 1.6328379173566623e-05,
+ "loss": 0.4382,
+ "step": 11136
+ },
+ {
+ "epoch": 30.346049046321525,
+ "grad_norm": 9.292570114135742,
+ "learning_rate": 1.632769584718757e-05,
+ "loss": 0.4523,
+ "step": 11137
+ },
+ {
+ "epoch": 30.348773841961854,
+ "grad_norm": 6.0499267578125,
+ "learning_rate": 1.6327012471528626e-05,
+ "loss": 0.2988,
+ "step": 11138
+ },
+ {
+ "epoch": 30.35149863760218,
+ "grad_norm": 6.418890953063965,
+ "learning_rate": 1.6326329046595112e-05,
+ "loss": 0.4348,
+ "step": 11139
+ },
+ {
+ "epoch": 30.354223433242506,
+ "grad_norm": 7.002811431884766,
+ "learning_rate": 1.632564557239235e-05,
+ "loss": 0.3316,
+ "step": 11140
+ },
+ {
+ "epoch": 30.356948228882835,
+ "grad_norm": 8.295167922973633,
+ "learning_rate": 1.6324962048925666e-05,
+ "loss": 0.2808,
+ "step": 11141
+ },
+ {
+ "epoch": 30.35967302452316,
+ "grad_norm": 6.577081203460693,
+ "learning_rate": 1.632427847620038e-05,
+ "loss": 0.4397,
+ "step": 11142
+ },
+ {
+ "epoch": 30.362397820163487,
+ "grad_norm": 9.08464527130127,
+ "learning_rate": 1.632359485422182e-05,
+ "loss": 0.4562,
+ "step": 11143
+ },
+ {
+ "epoch": 30.365122615803816,
+ "grad_norm": 6.9909844398498535,
+ "learning_rate": 1.63229111829953e-05,
+ "loss": 0.4818,
+ "step": 11144
+ },
+ {
+ "epoch": 30.367847411444142,
+ "grad_norm": 9.277730941772461,
+ "learning_rate": 1.6322227462526157e-05,
+ "loss": 0.442,
+ "step": 11145
+ },
+ {
+ "epoch": 30.370572207084468,
+ "grad_norm": 7.0915985107421875,
+ "learning_rate": 1.6321543692819707e-05,
+ "loss": 0.3355,
+ "step": 11146
+ },
+ {
+ "epoch": 30.373297002724797,
+ "grad_norm": 6.999594211578369,
+ "learning_rate": 1.6320859873881282e-05,
+ "loss": 0.5162,
+ "step": 11147
+ },
+ {
+ "epoch": 30.376021798365123,
+ "grad_norm": 7.807701587677002,
+ "learning_rate": 1.63201760057162e-05,
+ "loss": 0.5061,
+ "step": 11148
+ },
+ {
+ "epoch": 30.37874659400545,
+ "grad_norm": 8.793044090270996,
+ "learning_rate": 1.6319492088329792e-05,
+ "loss": 0.5065,
+ "step": 11149
+ },
+ {
+ "epoch": 30.381471389645778,
+ "grad_norm": 8.298761367797852,
+ "learning_rate": 1.631880812172738e-05,
+ "loss": 0.3995,
+ "step": 11150
+ },
+ {
+ "epoch": 30.384196185286104,
+ "grad_norm": 8.38496208190918,
+ "learning_rate": 1.63181241059143e-05,
+ "loss": 0.3788,
+ "step": 11151
+ },
+ {
+ "epoch": 30.38692098092643,
+ "grad_norm": 6.298509120941162,
+ "learning_rate": 1.631744004089587e-05,
+ "loss": 0.3848,
+ "step": 11152
+ },
+ {
+ "epoch": 30.38964577656676,
+ "grad_norm": 7.297521591186523,
+ "learning_rate": 1.6316755926677415e-05,
+ "loss": 0.4926,
+ "step": 11153
+ },
+ {
+ "epoch": 30.392370572207085,
+ "grad_norm": 6.584827423095703,
+ "learning_rate": 1.6316071763264277e-05,
+ "loss": 0.5525,
+ "step": 11154
+ },
+ {
+ "epoch": 30.39509536784741,
+ "grad_norm": 6.54464864730835,
+ "learning_rate": 1.631538755066177e-05,
+ "loss": 0.5013,
+ "step": 11155
+ },
+ {
+ "epoch": 30.39782016348774,
+ "grad_norm": 8.183076858520508,
+ "learning_rate": 1.631470328887523e-05,
+ "loss": 0.4586,
+ "step": 11156
+ },
+ {
+ "epoch": 30.400544959128066,
+ "grad_norm": 6.126870632171631,
+ "learning_rate": 1.6314018977909982e-05,
+ "loss": 0.3919,
+ "step": 11157
+ },
+ {
+ "epoch": 30.40326975476839,
+ "grad_norm": 7.185279846191406,
+ "learning_rate": 1.631333461777136e-05,
+ "loss": 0.3845,
+ "step": 11158
+ },
+ {
+ "epoch": 30.40599455040872,
+ "grad_norm": 6.868136882781982,
+ "learning_rate": 1.631265020846469e-05,
+ "loss": 0.4161,
+ "step": 11159
+ },
+ {
+ "epoch": 30.408719346049047,
+ "grad_norm": 7.411529064178467,
+ "learning_rate": 1.63119657499953e-05,
+ "loss": 0.4904,
+ "step": 11160
+ },
+ {
+ "epoch": 30.411444141689373,
+ "grad_norm": 6.574433326721191,
+ "learning_rate": 1.631128124236853e-05,
+ "loss": 0.4001,
+ "step": 11161
+ },
+ {
+ "epoch": 30.414168937329702,
+ "grad_norm": 6.144572734832764,
+ "learning_rate": 1.6310596685589703e-05,
+ "loss": 0.4123,
+ "step": 11162
+ },
+ {
+ "epoch": 30.416893732970028,
+ "grad_norm": 6.900004863739014,
+ "learning_rate": 1.6309912079664147e-05,
+ "loss": 0.4342,
+ "step": 11163
+ },
+ {
+ "epoch": 30.419618528610354,
+ "grad_norm": 6.595589637756348,
+ "learning_rate": 1.6309227424597207e-05,
+ "loss": 0.4882,
+ "step": 11164
+ },
+ {
+ "epoch": 30.422343324250683,
+ "grad_norm": 7.083584308624268,
+ "learning_rate": 1.63085427203942e-05,
+ "loss": 0.4852,
+ "step": 11165
+ },
+ {
+ "epoch": 30.42506811989101,
+ "grad_norm": 7.238770484924316,
+ "learning_rate": 1.6307857967060466e-05,
+ "loss": 0.5204,
+ "step": 11166
+ },
+ {
+ "epoch": 30.427792915531334,
+ "grad_norm": 7.944159507751465,
+ "learning_rate": 1.630717316460134e-05,
+ "loss": 0.3906,
+ "step": 11167
+ },
+ {
+ "epoch": 30.430517711171664,
+ "grad_norm": 9.476786613464355,
+ "learning_rate": 1.630648831302215e-05,
+ "loss": 0.4355,
+ "step": 11168
+ },
+ {
+ "epoch": 30.43324250681199,
+ "grad_norm": 8.080235481262207,
+ "learning_rate": 1.6305803412328236e-05,
+ "loss": 0.4662,
+ "step": 11169
+ },
+ {
+ "epoch": 30.435967302452315,
+ "grad_norm": 8.67461109161377,
+ "learning_rate": 1.6305118462524926e-05,
+ "loss": 0.4588,
+ "step": 11170
+ },
+ {
+ "epoch": 30.438692098092645,
+ "grad_norm": 6.554092884063721,
+ "learning_rate": 1.6304433463617554e-05,
+ "loss": 0.3947,
+ "step": 11171
+ },
+ {
+ "epoch": 30.44141689373297,
+ "grad_norm": 6.492825984954834,
+ "learning_rate": 1.630374841561146e-05,
+ "loss": 0.5317,
+ "step": 11172
+ },
+ {
+ "epoch": 30.444141689373296,
+ "grad_norm": 6.715017795562744,
+ "learning_rate": 1.6303063318511973e-05,
+ "loss": 0.3394,
+ "step": 11173
+ },
+ {
+ "epoch": 30.446866485013626,
+ "grad_norm": 7.301937580108643,
+ "learning_rate": 1.6302378172324436e-05,
+ "loss": 0.4982,
+ "step": 11174
+ },
+ {
+ "epoch": 30.44959128065395,
+ "grad_norm": 6.503893852233887,
+ "learning_rate": 1.6301692977054177e-05,
+ "loss": 0.3516,
+ "step": 11175
+ },
+ {
+ "epoch": 30.452316076294277,
+ "grad_norm": 7.567931652069092,
+ "learning_rate": 1.630100773270654e-05,
+ "loss": 0.4438,
+ "step": 11176
+ },
+ {
+ "epoch": 30.455040871934607,
+ "grad_norm": 6.096273899078369,
+ "learning_rate": 1.6300322439286852e-05,
+ "loss": 0.4471,
+ "step": 11177
+ },
+ {
+ "epoch": 30.457765667574932,
+ "grad_norm": 7.5801472663879395,
+ "learning_rate": 1.629963709680046e-05,
+ "loss": 0.3835,
+ "step": 11178
+ },
+ {
+ "epoch": 30.460490463215258,
+ "grad_norm": 6.825669765472412,
+ "learning_rate": 1.6298951705252697e-05,
+ "loss": 0.4557,
+ "step": 11179
+ },
+ {
+ "epoch": 30.463215258855588,
+ "grad_norm": 6.852964401245117,
+ "learning_rate": 1.6298266264648898e-05,
+ "loss": 0.4685,
+ "step": 11180
+ },
+ {
+ "epoch": 30.465940054495913,
+ "grad_norm": 6.547214508056641,
+ "learning_rate": 1.6297580774994404e-05,
+ "loss": 0.5506,
+ "step": 11181
+ },
+ {
+ "epoch": 30.46866485013624,
+ "grad_norm": 6.798362731933594,
+ "learning_rate": 1.6296895236294558e-05,
+ "loss": 0.3712,
+ "step": 11182
+ },
+ {
+ "epoch": 30.47138964577657,
+ "grad_norm": 6.006402015686035,
+ "learning_rate": 1.629620964855469e-05,
+ "loss": 0.6051,
+ "step": 11183
+ },
+ {
+ "epoch": 30.474114441416894,
+ "grad_norm": 7.253655433654785,
+ "learning_rate": 1.6295524011780147e-05,
+ "loss": 0.5779,
+ "step": 11184
+ },
+ {
+ "epoch": 30.47683923705722,
+ "grad_norm": 13.01401424407959,
+ "learning_rate": 1.629483832597626e-05,
+ "loss": 0.3723,
+ "step": 11185
+ },
+ {
+ "epoch": 30.479564032697546,
+ "grad_norm": 7.651995658874512,
+ "learning_rate": 1.6294152591148386e-05,
+ "loss": 0.46,
+ "step": 11186
+ },
+ {
+ "epoch": 30.482288828337875,
+ "grad_norm": 8.617700576782227,
+ "learning_rate": 1.6293466807301843e-05,
+ "loss": 0.4051,
+ "step": 11187
+ },
+ {
+ "epoch": 30.4850136239782,
+ "grad_norm": 6.405218601226807,
+ "learning_rate": 1.629278097444199e-05,
+ "loss": 0.3129,
+ "step": 11188
+ },
+ {
+ "epoch": 30.48773841961853,
+ "grad_norm": 8.3556489944458,
+ "learning_rate": 1.6292095092574154e-05,
+ "loss": 0.4845,
+ "step": 11189
+ },
+ {
+ "epoch": 30.490463215258856,
+ "grad_norm": 11.176692008972168,
+ "learning_rate": 1.629140916170369e-05,
+ "loss": 0.5119,
+ "step": 11190
+ },
+ {
+ "epoch": 30.493188010899182,
+ "grad_norm": 7.346235275268555,
+ "learning_rate": 1.6290723181835933e-05,
+ "loss": 0.5363,
+ "step": 11191
+ },
+ {
+ "epoch": 30.495912806539508,
+ "grad_norm": 7.172322750091553,
+ "learning_rate": 1.6290037152976227e-05,
+ "loss": 0.4497,
+ "step": 11192
+ },
+ {
+ "epoch": 30.498637602179837,
+ "grad_norm": 6.90130615234375,
+ "learning_rate": 1.628935107512991e-05,
+ "loss": 0.4502,
+ "step": 11193
+ },
+ {
+ "epoch": 30.501362397820163,
+ "grad_norm": 8.490738868713379,
+ "learning_rate": 1.6288664948302333e-05,
+ "loss": 0.3503,
+ "step": 11194
+ },
+ {
+ "epoch": 30.504087193460492,
+ "grad_norm": 6.3047709465026855,
+ "learning_rate": 1.6287978772498836e-05,
+ "loss": 0.2864,
+ "step": 11195
+ },
+ {
+ "epoch": 30.506811989100818,
+ "grad_norm": 6.159095287322998,
+ "learning_rate": 1.628729254772476e-05,
+ "loss": 0.4874,
+ "step": 11196
+ },
+ {
+ "epoch": 30.509536784741144,
+ "grad_norm": 6.74845027923584,
+ "learning_rate": 1.6286606273985452e-05,
+ "loss": 0.3663,
+ "step": 11197
+ },
+ {
+ "epoch": 30.51226158038147,
+ "grad_norm": 7.2375383377075195,
+ "learning_rate": 1.628591995128626e-05,
+ "loss": 0.4338,
+ "step": 11198
+ },
+ {
+ "epoch": 30.5149863760218,
+ "grad_norm": 6.118013381958008,
+ "learning_rate": 1.6285233579632525e-05,
+ "loss": 0.5677,
+ "step": 11199
+ },
+ {
+ "epoch": 30.517711171662125,
+ "grad_norm": 7.088701248168945,
+ "learning_rate": 1.628454715902959e-05,
+ "loss": 0.4264,
+ "step": 11200
+ },
+ {
+ "epoch": 30.520435967302454,
+ "grad_norm": 8.072192192077637,
+ "learning_rate": 1.628386068948281e-05,
+ "loss": 0.4079,
+ "step": 11201
+ },
+ {
+ "epoch": 30.52316076294278,
+ "grad_norm": 6.230062007904053,
+ "learning_rate": 1.6283174170997516e-05,
+ "loss": 0.4247,
+ "step": 11202
+ },
+ {
+ "epoch": 30.525885558583106,
+ "grad_norm": 7.471052169799805,
+ "learning_rate": 1.6282487603579073e-05,
+ "loss": 0.4824,
+ "step": 11203
+ },
+ {
+ "epoch": 30.52861035422343,
+ "grad_norm": 8.514483451843262,
+ "learning_rate": 1.6281800987232815e-05,
+ "loss": 0.4504,
+ "step": 11204
+ },
+ {
+ "epoch": 30.53133514986376,
+ "grad_norm": 8.606267929077148,
+ "learning_rate": 1.628111432196409e-05,
+ "loss": 0.4247,
+ "step": 11205
+ },
+ {
+ "epoch": 30.534059945504087,
+ "grad_norm": 7.907001495361328,
+ "learning_rate": 1.628042760777825e-05,
+ "loss": 0.3819,
+ "step": 11206
+ },
+ {
+ "epoch": 30.536784741144416,
+ "grad_norm": 7.460330009460449,
+ "learning_rate": 1.6279740844680647e-05,
+ "loss": 0.4031,
+ "step": 11207
+ },
+ {
+ "epoch": 30.539509536784742,
+ "grad_norm": 6.786050319671631,
+ "learning_rate": 1.627905403267662e-05,
+ "loss": 0.3704,
+ "step": 11208
+ },
+ {
+ "epoch": 30.542234332425068,
+ "grad_norm": 7.479556560516357,
+ "learning_rate": 1.6278367171771522e-05,
+ "loss": 0.3909,
+ "step": 11209
+ },
+ {
+ "epoch": 30.544959128065393,
+ "grad_norm": 5.854247093200684,
+ "learning_rate": 1.6277680261970706e-05,
+ "loss": 0.4698,
+ "step": 11210
+ },
+ {
+ "epoch": 30.547683923705723,
+ "grad_norm": 8.77616024017334,
+ "learning_rate": 1.6276993303279514e-05,
+ "loss": 0.4579,
+ "step": 11211
+ },
+ {
+ "epoch": 30.55040871934605,
+ "grad_norm": 8.852252960205078,
+ "learning_rate": 1.6276306295703307e-05,
+ "loss": 0.4197,
+ "step": 11212
+ },
+ {
+ "epoch": 30.553133514986374,
+ "grad_norm": 7.174180507659912,
+ "learning_rate": 1.6275619239247423e-05,
+ "loss": 0.3899,
+ "step": 11213
+ },
+ {
+ "epoch": 30.555858310626704,
+ "grad_norm": 7.6936211585998535,
+ "learning_rate": 1.6274932133917217e-05,
+ "loss": 0.4662,
+ "step": 11214
+ },
+ {
+ "epoch": 30.55858310626703,
+ "grad_norm": 7.429311275482178,
+ "learning_rate": 1.6274244979718044e-05,
+ "loss": 0.429,
+ "step": 11215
+ },
+ {
+ "epoch": 30.561307901907355,
+ "grad_norm": 6.269425868988037,
+ "learning_rate": 1.627355777665525e-05,
+ "loss": 0.3629,
+ "step": 11216
+ },
+ {
+ "epoch": 30.564032697547685,
+ "grad_norm": 7.538383483886719,
+ "learning_rate": 1.6272870524734193e-05,
+ "loss": 0.3674,
+ "step": 11217
+ },
+ {
+ "epoch": 30.56675749318801,
+ "grad_norm": 7.07504940032959,
+ "learning_rate": 1.6272183223960224e-05,
+ "loss": 0.4295,
+ "step": 11218
+ },
+ {
+ "epoch": 30.569482288828336,
+ "grad_norm": 7.453427314758301,
+ "learning_rate": 1.6271495874338692e-05,
+ "loss": 0.391,
+ "step": 11219
+ },
+ {
+ "epoch": 30.572207084468666,
+ "grad_norm": 8.222543716430664,
+ "learning_rate": 1.6270808475874953e-05,
+ "loss": 0.475,
+ "step": 11220
+ },
+ {
+ "epoch": 30.57493188010899,
+ "grad_norm": 6.086309909820557,
+ "learning_rate": 1.6270121028574358e-05,
+ "loss": 0.5153,
+ "step": 11221
+ },
+ {
+ "epoch": 30.577656675749317,
+ "grad_norm": 6.072343349456787,
+ "learning_rate": 1.6269433532442262e-05,
+ "loss": 0.4074,
+ "step": 11222
+ },
+ {
+ "epoch": 30.580381471389646,
+ "grad_norm": 11.468491554260254,
+ "learning_rate": 1.626874598748402e-05,
+ "loss": 0.4034,
+ "step": 11223
+ },
+ {
+ "epoch": 30.583106267029972,
+ "grad_norm": 7.184165954589844,
+ "learning_rate": 1.6268058393704986e-05,
+ "loss": 0.2477,
+ "step": 11224
+ },
+ {
+ "epoch": 30.585831062670298,
+ "grad_norm": 7.140717029571533,
+ "learning_rate": 1.6267370751110516e-05,
+ "loss": 0.3927,
+ "step": 11225
+ },
+ {
+ "epoch": 30.588555858310627,
+ "grad_norm": 7.32138729095459,
+ "learning_rate": 1.626668305970596e-05,
+ "loss": 0.4031,
+ "step": 11226
+ },
+ {
+ "epoch": 30.591280653950953,
+ "grad_norm": 5.864624500274658,
+ "learning_rate": 1.626599531949668e-05,
+ "loss": 0.5443,
+ "step": 11227
+ },
+ {
+ "epoch": 30.59400544959128,
+ "grad_norm": 5.666828632354736,
+ "learning_rate": 1.626530753048803e-05,
+ "loss": 0.3853,
+ "step": 11228
+ },
+ {
+ "epoch": 30.59673024523161,
+ "grad_norm": 5.726497173309326,
+ "learning_rate": 1.626461969268537e-05,
+ "loss": 0.4012,
+ "step": 11229
+ },
+ {
+ "epoch": 30.599455040871934,
+ "grad_norm": 8.0853271484375,
+ "learning_rate": 1.6263931806094053e-05,
+ "loss": 0.4961,
+ "step": 11230
+ },
+ {
+ "epoch": 30.60217983651226,
+ "grad_norm": 10.106380462646484,
+ "learning_rate": 1.6263243870719436e-05,
+ "loss": 0.4315,
+ "step": 11231
+ },
+ {
+ "epoch": 30.60490463215259,
+ "grad_norm": 8.311697959899902,
+ "learning_rate": 1.6262555886566874e-05,
+ "loss": 0.3714,
+ "step": 11232
+ },
+ {
+ "epoch": 30.607629427792915,
+ "grad_norm": 7.060946941375732,
+ "learning_rate": 1.626186785364173e-05,
+ "loss": 0.4977,
+ "step": 11233
+ },
+ {
+ "epoch": 30.61035422343324,
+ "grad_norm": 7.943112373352051,
+ "learning_rate": 1.6261179771949364e-05,
+ "loss": 0.4243,
+ "step": 11234
+ },
+ {
+ "epoch": 30.61307901907357,
+ "grad_norm": 6.9223222732543945,
+ "learning_rate": 1.6260491641495127e-05,
+ "loss": 0.5494,
+ "step": 11235
+ },
+ {
+ "epoch": 30.615803814713896,
+ "grad_norm": 7.2110161781311035,
+ "learning_rate": 1.6259803462284383e-05,
+ "loss": 0.5115,
+ "step": 11236
+ },
+ {
+ "epoch": 30.618528610354222,
+ "grad_norm": 40.30569839477539,
+ "learning_rate": 1.6259115234322492e-05,
+ "loss": 0.3106,
+ "step": 11237
+ },
+ {
+ "epoch": 30.62125340599455,
+ "grad_norm": 6.456710338592529,
+ "learning_rate": 1.6258426957614814e-05,
+ "loss": 0.4498,
+ "step": 11238
+ },
+ {
+ "epoch": 30.623978201634877,
+ "grad_norm": 8.054564476013184,
+ "learning_rate": 1.625773863216671e-05,
+ "loss": 0.4762,
+ "step": 11239
+ },
+ {
+ "epoch": 30.626702997275203,
+ "grad_norm": 6.941972732543945,
+ "learning_rate": 1.6257050257983536e-05,
+ "loss": 0.4694,
+ "step": 11240
+ },
+ {
+ "epoch": 30.629427792915532,
+ "grad_norm": 8.115713119506836,
+ "learning_rate": 1.625636183507066e-05,
+ "loss": 0.5095,
+ "step": 11241
+ },
+ {
+ "epoch": 30.632152588555858,
+ "grad_norm": 13.512476921081543,
+ "learning_rate": 1.6255673363433432e-05,
+ "loss": 0.4984,
+ "step": 11242
+ },
+ {
+ "epoch": 30.634877384196184,
+ "grad_norm": 5.05262565612793,
+ "learning_rate": 1.6254984843077228e-05,
+ "loss": 0.4244,
+ "step": 11243
+ },
+ {
+ "epoch": 30.637602179836513,
+ "grad_norm": 6.971745491027832,
+ "learning_rate": 1.62542962740074e-05,
+ "loss": 0.4017,
+ "step": 11244
+ },
+ {
+ "epoch": 30.64032697547684,
+ "grad_norm": 7.403254985809326,
+ "learning_rate": 1.625360765622931e-05,
+ "loss": 0.6022,
+ "step": 11245
+ },
+ {
+ "epoch": 30.643051771117165,
+ "grad_norm": 7.056795597076416,
+ "learning_rate": 1.6252918989748333e-05,
+ "loss": 0.5388,
+ "step": 11246
+ },
+ {
+ "epoch": 30.645776566757494,
+ "grad_norm": 7.612959384918213,
+ "learning_rate": 1.625223027456982e-05,
+ "loss": 0.4792,
+ "step": 11247
+ },
+ {
+ "epoch": 30.64850136239782,
+ "grad_norm": 6.716630458831787,
+ "learning_rate": 1.625154151069914e-05,
+ "loss": 0.4965,
+ "step": 11248
+ },
+ {
+ "epoch": 30.651226158038146,
+ "grad_norm": 7.09428596496582,
+ "learning_rate": 1.6250852698141654e-05,
+ "loss": 0.3607,
+ "step": 11249
+ },
+ {
+ "epoch": 30.653950953678475,
+ "grad_norm": 6.382897853851318,
+ "learning_rate": 1.625016383690273e-05,
+ "loss": 0.3431,
+ "step": 11250
+ },
+ {
+ "epoch": 30.6566757493188,
+ "grad_norm": 7.352816104888916,
+ "learning_rate": 1.624947492698773e-05,
+ "loss": 0.5231,
+ "step": 11251
+ },
+ {
+ "epoch": 30.659400544959126,
+ "grad_norm": 15.394720077514648,
+ "learning_rate": 1.624878596840202e-05,
+ "loss": 0.4471,
+ "step": 11252
+ },
+ {
+ "epoch": 30.662125340599456,
+ "grad_norm": 9.968376159667969,
+ "learning_rate": 1.624809696115097e-05,
+ "loss": 0.476,
+ "step": 11253
+ },
+ {
+ "epoch": 30.66485013623978,
+ "grad_norm": 9.12043285369873,
+ "learning_rate": 1.624740790523994e-05,
+ "loss": 0.684,
+ "step": 11254
+ },
+ {
+ "epoch": 30.667574931880107,
+ "grad_norm": 7.758697986602783,
+ "learning_rate": 1.6246718800674296e-05,
+ "loss": 0.5054,
+ "step": 11255
+ },
+ {
+ "epoch": 30.670299727520437,
+ "grad_norm": 6.44129753112793,
+ "learning_rate": 1.624602964745941e-05,
+ "loss": 0.4493,
+ "step": 11256
+ },
+ {
+ "epoch": 30.673024523160763,
+ "grad_norm": 7.188642501831055,
+ "learning_rate": 1.6245340445600643e-05,
+ "loss": 0.3573,
+ "step": 11257
+ },
+ {
+ "epoch": 30.67574931880109,
+ "grad_norm": 8.696399688720703,
+ "learning_rate": 1.6244651195103367e-05,
+ "loss": 0.5812,
+ "step": 11258
+ },
+ {
+ "epoch": 30.678474114441418,
+ "grad_norm": 13.490169525146484,
+ "learning_rate": 1.6243961895972948e-05,
+ "loss": 0.5551,
+ "step": 11259
+ },
+ {
+ "epoch": 30.681198910081743,
+ "grad_norm": 7.445071220397949,
+ "learning_rate": 1.6243272548214758e-05,
+ "loss": 0.2846,
+ "step": 11260
+ },
+ {
+ "epoch": 30.68392370572207,
+ "grad_norm": 6.342952251434326,
+ "learning_rate": 1.624258315183416e-05,
+ "loss": 0.5732,
+ "step": 11261
+ },
+ {
+ "epoch": 30.6866485013624,
+ "grad_norm": 7.206576347351074,
+ "learning_rate": 1.6241893706836525e-05,
+ "loss": 0.621,
+ "step": 11262
+ },
+ {
+ "epoch": 30.689373297002724,
+ "grad_norm": 6.406331539154053,
+ "learning_rate": 1.6241204213227223e-05,
+ "loss": 0.4424,
+ "step": 11263
+ },
+ {
+ "epoch": 30.69209809264305,
+ "grad_norm": 6.325895309448242,
+ "learning_rate": 1.6240514671011623e-05,
+ "loss": 0.4019,
+ "step": 11264
+ },
+ {
+ "epoch": 30.69482288828338,
+ "grad_norm": 6.496794700622559,
+ "learning_rate": 1.6239825080195096e-05,
+ "loss": 0.442,
+ "step": 11265
+ },
+ {
+ "epoch": 30.697547683923705,
+ "grad_norm": 6.719447612762451,
+ "learning_rate": 1.623913544078301e-05,
+ "loss": 0.4412,
+ "step": 11266
+ },
+ {
+ "epoch": 30.70027247956403,
+ "grad_norm": 7.510452747344971,
+ "learning_rate": 1.6238445752780742e-05,
+ "loss": 0.4723,
+ "step": 11267
+ },
+ {
+ "epoch": 30.70299727520436,
+ "grad_norm": 7.245124340057373,
+ "learning_rate": 1.623775601619366e-05,
+ "loss": 0.462,
+ "step": 11268
+ },
+ {
+ "epoch": 30.705722070844686,
+ "grad_norm": 7.671139717102051,
+ "learning_rate": 1.623706623102713e-05,
+ "loss": 0.4833,
+ "step": 11269
+ },
+ {
+ "epoch": 30.708446866485012,
+ "grad_norm": 7.977005958557129,
+ "learning_rate": 1.623637639728653e-05,
+ "loss": 0.4939,
+ "step": 11270
+ },
+ {
+ "epoch": 30.71117166212534,
+ "grad_norm": 7.758381366729736,
+ "learning_rate": 1.623568651497723e-05,
+ "loss": 0.4451,
+ "step": 11271
+ },
+ {
+ "epoch": 30.713896457765667,
+ "grad_norm": 8.436704635620117,
+ "learning_rate": 1.623499658410461e-05,
+ "loss": 0.3275,
+ "step": 11272
+ },
+ {
+ "epoch": 30.716621253405993,
+ "grad_norm": 7.324213981628418,
+ "learning_rate": 1.6234306604674034e-05,
+ "loss": 0.3871,
+ "step": 11273
+ },
+ {
+ "epoch": 30.719346049046322,
+ "grad_norm": 6.613918781280518,
+ "learning_rate": 1.6233616576690876e-05,
+ "loss": 0.4449,
+ "step": 11274
+ },
+ {
+ "epoch": 30.722070844686648,
+ "grad_norm": 7.338347434997559,
+ "learning_rate": 1.6232926500160514e-05,
+ "loss": 0.5445,
+ "step": 11275
+ },
+ {
+ "epoch": 30.724795640326974,
+ "grad_norm": 7.05747652053833,
+ "learning_rate": 1.6232236375088322e-05,
+ "loss": 0.5292,
+ "step": 11276
+ },
+ {
+ "epoch": 30.727520435967303,
+ "grad_norm": 10.454824447631836,
+ "learning_rate": 1.6231546201479676e-05,
+ "loss": 0.5487,
+ "step": 11277
+ },
+ {
+ "epoch": 30.73024523160763,
+ "grad_norm": 8.207958221435547,
+ "learning_rate": 1.623085597933995e-05,
+ "loss": 0.4236,
+ "step": 11278
+ },
+ {
+ "epoch": 30.732970027247955,
+ "grad_norm": 7.944293022155762,
+ "learning_rate": 1.6230165708674513e-05,
+ "loss": 0.4565,
+ "step": 11279
+ },
+ {
+ "epoch": 30.735694822888284,
+ "grad_norm": 7.1323137283325195,
+ "learning_rate": 1.622947538948875e-05,
+ "loss": 0.4794,
+ "step": 11280
+ },
+ {
+ "epoch": 30.73841961852861,
+ "grad_norm": 7.217621803283691,
+ "learning_rate": 1.622878502178803e-05,
+ "loss": 0.5521,
+ "step": 11281
+ },
+ {
+ "epoch": 30.741144414168936,
+ "grad_norm": 6.7949652671813965,
+ "learning_rate": 1.6228094605577734e-05,
+ "loss": 0.387,
+ "step": 11282
+ },
+ {
+ "epoch": 30.743869209809265,
+ "grad_norm": 7.413728713989258,
+ "learning_rate": 1.6227404140863233e-05,
+ "loss": 0.3795,
+ "step": 11283
+ },
+ {
+ "epoch": 30.74659400544959,
+ "grad_norm": 5.315408229827881,
+ "learning_rate": 1.6226713627649914e-05,
+ "loss": 0.2813,
+ "step": 11284
+ },
+ {
+ "epoch": 30.749318801089917,
+ "grad_norm": 7.66859245300293,
+ "learning_rate": 1.622602306594315e-05,
+ "loss": 0.428,
+ "step": 11285
+ },
+ {
+ "epoch": 30.752043596730246,
+ "grad_norm": 7.728278636932373,
+ "learning_rate": 1.622533245574832e-05,
+ "loss": 0.3884,
+ "step": 11286
+ },
+ {
+ "epoch": 30.754768392370572,
+ "grad_norm": 5.734921455383301,
+ "learning_rate": 1.62246417970708e-05,
+ "loss": 0.3226,
+ "step": 11287
+ },
+ {
+ "epoch": 30.757493188010898,
+ "grad_norm": 7.37510871887207,
+ "learning_rate": 1.6223951089915968e-05,
+ "loss": 0.4894,
+ "step": 11288
+ },
+ {
+ "epoch": 30.760217983651227,
+ "grad_norm": 6.9354143142700195,
+ "learning_rate": 1.6223260334289208e-05,
+ "loss": 0.5839,
+ "step": 11289
+ },
+ {
+ "epoch": 30.762942779291553,
+ "grad_norm": 7.1436944007873535,
+ "learning_rate": 1.6222569530195894e-05,
+ "loss": 0.5088,
+ "step": 11290
+ },
+ {
+ "epoch": 30.76566757493188,
+ "grad_norm": 6.357337951660156,
+ "learning_rate": 1.622187867764141e-05,
+ "loss": 0.4811,
+ "step": 11291
+ },
+ {
+ "epoch": 30.768392370572208,
+ "grad_norm": 7.193835258483887,
+ "learning_rate": 1.6221187776631134e-05,
+ "loss": 0.3481,
+ "step": 11292
+ },
+ {
+ "epoch": 30.771117166212534,
+ "grad_norm": 6.292130470275879,
+ "learning_rate": 1.622049682717045e-05,
+ "loss": 0.4471,
+ "step": 11293
+ },
+ {
+ "epoch": 30.77384196185286,
+ "grad_norm": 7.480403900146484,
+ "learning_rate": 1.6219805829264738e-05,
+ "loss": 0.3723,
+ "step": 11294
+ },
+ {
+ "epoch": 30.77656675749319,
+ "grad_norm": 6.53055477142334,
+ "learning_rate": 1.621911478291937e-05,
+ "loss": 0.5594,
+ "step": 11295
+ },
+ {
+ "epoch": 30.779291553133515,
+ "grad_norm": 6.633364677429199,
+ "learning_rate": 1.6218423688139748e-05,
+ "loss": 0.3906,
+ "step": 11296
+ },
+ {
+ "epoch": 30.78201634877384,
+ "grad_norm": 6.3846917152404785,
+ "learning_rate": 1.6217732544931237e-05,
+ "loss": 0.3395,
+ "step": 11297
+ },
+ {
+ "epoch": 30.78474114441417,
+ "grad_norm": 5.787449359893799,
+ "learning_rate": 1.6217041353299224e-05,
+ "loss": 0.4193,
+ "step": 11298
+ },
+ {
+ "epoch": 30.787465940054496,
+ "grad_norm": 6.977640151977539,
+ "learning_rate": 1.6216350113249094e-05,
+ "loss": 0.4863,
+ "step": 11299
+ },
+ {
+ "epoch": 30.79019073569482,
+ "grad_norm": 6.857836723327637,
+ "learning_rate": 1.6215658824786226e-05,
+ "loss": 0.4244,
+ "step": 11300
+ },
+ {
+ "epoch": 30.79291553133515,
+ "grad_norm": 6.683234691619873,
+ "learning_rate": 1.6214967487916012e-05,
+ "loss": 0.3848,
+ "step": 11301
+ },
+ {
+ "epoch": 30.795640326975477,
+ "grad_norm": 6.261143684387207,
+ "learning_rate": 1.6214276102643828e-05,
+ "loss": 0.331,
+ "step": 11302
+ },
+ {
+ "epoch": 30.798365122615802,
+ "grad_norm": 8.550078392028809,
+ "learning_rate": 1.6213584668975064e-05,
+ "loss": 0.3848,
+ "step": 11303
+ },
+ {
+ "epoch": 30.80108991825613,
+ "grad_norm": 6.435115814208984,
+ "learning_rate": 1.6212893186915105e-05,
+ "loss": 0.3448,
+ "step": 11304
+ },
+ {
+ "epoch": 30.803814713896458,
+ "grad_norm": 7.466169834136963,
+ "learning_rate": 1.6212201656469328e-05,
+ "loss": 0.5968,
+ "step": 11305
+ },
+ {
+ "epoch": 30.806539509536783,
+ "grad_norm": 7.373120307922363,
+ "learning_rate": 1.621151007764313e-05,
+ "loss": 0.3631,
+ "step": 11306
+ },
+ {
+ "epoch": 30.809264305177113,
+ "grad_norm": 6.224044322967529,
+ "learning_rate": 1.621081845044189e-05,
+ "loss": 0.3088,
+ "step": 11307
+ },
+ {
+ "epoch": 30.81198910081744,
+ "grad_norm": 10.48534107208252,
+ "learning_rate": 1.6210126774870992e-05,
+ "loss": 0.44,
+ "step": 11308
+ },
+ {
+ "epoch": 30.814713896457764,
+ "grad_norm": 6.622835159301758,
+ "learning_rate": 1.620943505093583e-05,
+ "loss": 0.4076,
+ "step": 11309
+ },
+ {
+ "epoch": 30.817438692098094,
+ "grad_norm": 6.534196376800537,
+ "learning_rate": 1.620874327864179e-05,
+ "loss": 0.3479,
+ "step": 11310
+ },
+ {
+ "epoch": 30.82016348773842,
+ "grad_norm": 7.377260208129883,
+ "learning_rate": 1.620805145799425e-05,
+ "loss": 0.4688,
+ "step": 11311
+ },
+ {
+ "epoch": 30.822888283378745,
+ "grad_norm": 9.587128639221191,
+ "learning_rate": 1.6207359588998608e-05,
+ "loss": 0.4082,
+ "step": 11312
+ },
+ {
+ "epoch": 30.825613079019075,
+ "grad_norm": 6.322308540344238,
+ "learning_rate": 1.620666767166025e-05,
+ "loss": 0.4466,
+ "step": 11313
+ },
+ {
+ "epoch": 30.8283378746594,
+ "grad_norm": 10.123698234558105,
+ "learning_rate": 1.6205975705984565e-05,
+ "loss": 0.3615,
+ "step": 11314
+ },
+ {
+ "epoch": 30.831062670299726,
+ "grad_norm": 7.531373977661133,
+ "learning_rate": 1.620528369197694e-05,
+ "loss": 0.3455,
+ "step": 11315
+ },
+ {
+ "epoch": 30.833787465940055,
+ "grad_norm": 6.879456996917725,
+ "learning_rate": 1.6204591629642767e-05,
+ "loss": 0.3533,
+ "step": 11316
+ },
+ {
+ "epoch": 30.83651226158038,
+ "grad_norm": 8.004433631896973,
+ "learning_rate": 1.620389951898743e-05,
+ "loss": 0.3981,
+ "step": 11317
+ },
+ {
+ "epoch": 30.839237057220707,
+ "grad_norm": 7.241403102874756,
+ "learning_rate": 1.6203207360016328e-05,
+ "loss": 0.4425,
+ "step": 11318
+ },
+ {
+ "epoch": 30.841961852861036,
+ "grad_norm": 7.608405113220215,
+ "learning_rate": 1.6202515152734844e-05,
+ "loss": 0.448,
+ "step": 11319
+ },
+ {
+ "epoch": 30.844686648501362,
+ "grad_norm": 6.407038688659668,
+ "learning_rate": 1.620182289714837e-05,
+ "loss": 0.38,
+ "step": 11320
+ },
+ {
+ "epoch": 30.847411444141688,
+ "grad_norm": 6.163354396820068,
+ "learning_rate": 1.62011305932623e-05,
+ "loss": 0.4984,
+ "step": 11321
+ },
+ {
+ "epoch": 30.850136239782017,
+ "grad_norm": 7.411386966705322,
+ "learning_rate": 1.6200438241082032e-05,
+ "loss": 0.4138,
+ "step": 11322
+ },
+ {
+ "epoch": 30.852861035422343,
+ "grad_norm": 7.78454065322876,
+ "learning_rate": 1.6199745840612942e-05,
+ "loss": 0.3887,
+ "step": 11323
+ },
+ {
+ "epoch": 30.85558583106267,
+ "grad_norm": 6.8289794921875,
+ "learning_rate": 1.619905339186043e-05,
+ "loss": 0.5495,
+ "step": 11324
+ },
+ {
+ "epoch": 30.858310626703,
+ "grad_norm": 7.852591037750244,
+ "learning_rate": 1.6198360894829893e-05,
+ "loss": 0.543,
+ "step": 11325
+ },
+ {
+ "epoch": 30.861035422343324,
+ "grad_norm": 6.447912693023682,
+ "learning_rate": 1.619766834952672e-05,
+ "loss": 0.5576,
+ "step": 11326
+ },
+ {
+ "epoch": 30.86376021798365,
+ "grad_norm": 12.491286277770996,
+ "learning_rate": 1.6196975755956308e-05,
+ "loss": 0.3752,
+ "step": 11327
+ },
+ {
+ "epoch": 30.86648501362398,
+ "grad_norm": 7.9670610427856445,
+ "learning_rate": 1.6196283114124045e-05,
+ "loss": 0.5906,
+ "step": 11328
+ },
+ {
+ "epoch": 30.869209809264305,
+ "grad_norm": 6.724163055419922,
+ "learning_rate": 1.619559042403533e-05,
+ "loss": 0.412,
+ "step": 11329
+ },
+ {
+ "epoch": 30.87193460490463,
+ "grad_norm": 7.976020336151123,
+ "learning_rate": 1.6194897685695558e-05,
+ "loss": 0.4774,
+ "step": 11330
+ },
+ {
+ "epoch": 30.87465940054496,
+ "grad_norm": 6.1216607093811035,
+ "learning_rate": 1.6194204899110118e-05,
+ "loss": 0.435,
+ "step": 11331
+ },
+ {
+ "epoch": 30.877384196185286,
+ "grad_norm": 11.007805824279785,
+ "learning_rate": 1.619351206428441e-05,
+ "loss": 0.418,
+ "step": 11332
+ },
+ {
+ "epoch": 30.88010899182561,
+ "grad_norm": 11.148780822753906,
+ "learning_rate": 1.6192819181223835e-05,
+ "loss": 0.3734,
+ "step": 11333
+ },
+ {
+ "epoch": 30.88283378746594,
+ "grad_norm": 6.831493377685547,
+ "learning_rate": 1.6192126249933776e-05,
+ "loss": 0.8787,
+ "step": 11334
+ },
+ {
+ "epoch": 30.885558583106267,
+ "grad_norm": 7.386627197265625,
+ "learning_rate": 1.619143327041964e-05,
+ "loss": 0.5354,
+ "step": 11335
+ },
+ {
+ "epoch": 30.888283378746593,
+ "grad_norm": 14.94681167602539,
+ "learning_rate": 1.619074024268682e-05,
+ "loss": 0.4447,
+ "step": 11336
+ },
+ {
+ "epoch": 30.891008174386922,
+ "grad_norm": 9.879965782165527,
+ "learning_rate": 1.619004716674072e-05,
+ "loss": 0.5003,
+ "step": 11337
+ },
+ {
+ "epoch": 30.893732970027248,
+ "grad_norm": 7.779361248016357,
+ "learning_rate": 1.6189354042586728e-05,
+ "loss": 0.4738,
+ "step": 11338
+ },
+ {
+ "epoch": 30.896457765667574,
+ "grad_norm": 6.914754390716553,
+ "learning_rate": 1.6188660870230246e-05,
+ "loss": 0.3867,
+ "step": 11339
+ },
+ {
+ "epoch": 30.899182561307903,
+ "grad_norm": 6.506638050079346,
+ "learning_rate": 1.6187967649676674e-05,
+ "loss": 0.4524,
+ "step": 11340
+ },
+ {
+ "epoch": 30.90190735694823,
+ "grad_norm": 13.945359230041504,
+ "learning_rate": 1.6187274380931403e-05,
+ "loss": 0.423,
+ "step": 11341
+ },
+ {
+ "epoch": 30.904632152588555,
+ "grad_norm": 8.164636611938477,
+ "learning_rate": 1.6186581063999844e-05,
+ "loss": 0.4088,
+ "step": 11342
+ },
+ {
+ "epoch": 30.907356948228884,
+ "grad_norm": 8.097151756286621,
+ "learning_rate": 1.6185887698887388e-05,
+ "loss": 0.5584,
+ "step": 11343
+ },
+ {
+ "epoch": 30.91008174386921,
+ "grad_norm": 6.8635149002075195,
+ "learning_rate": 1.618519428559944e-05,
+ "loss": 0.3417,
+ "step": 11344
+ },
+ {
+ "epoch": 30.912806539509535,
+ "grad_norm": 7.3902907371521,
+ "learning_rate": 1.6184500824141395e-05,
+ "loss": 0.5122,
+ "step": 11345
+ },
+ {
+ "epoch": 30.915531335149865,
+ "grad_norm": 7.98119592666626,
+ "learning_rate": 1.618380731451866e-05,
+ "loss": 0.495,
+ "step": 11346
+ },
+ {
+ "epoch": 30.91825613079019,
+ "grad_norm": 8.91533374786377,
+ "learning_rate": 1.618311375673663e-05,
+ "loss": 0.2698,
+ "step": 11347
+ },
+ {
+ "epoch": 30.920980926430516,
+ "grad_norm": 6.444336891174316,
+ "learning_rate": 1.6182420150800712e-05,
+ "loss": 0.4418,
+ "step": 11348
+ },
+ {
+ "epoch": 30.923705722070846,
+ "grad_norm": 6.765807628631592,
+ "learning_rate": 1.6181726496716304e-05,
+ "loss": 0.5147,
+ "step": 11349
+ },
+ {
+ "epoch": 30.92643051771117,
+ "grad_norm": 8.13369369506836,
+ "learning_rate": 1.6181032794488807e-05,
+ "loss": 0.43,
+ "step": 11350
+ },
+ {
+ "epoch": 30.929155313351497,
+ "grad_norm": 7.940556526184082,
+ "learning_rate": 1.6180339044123625e-05,
+ "loss": 0.4167,
+ "step": 11351
+ },
+ {
+ "epoch": 30.931880108991827,
+ "grad_norm": 8.560213088989258,
+ "learning_rate": 1.6179645245626165e-05,
+ "loss": 0.3338,
+ "step": 11352
+ },
+ {
+ "epoch": 30.934604904632153,
+ "grad_norm": 8.294337272644043,
+ "learning_rate": 1.617895139900182e-05,
+ "loss": 0.4414,
+ "step": 11353
+ },
+ {
+ "epoch": 30.93732970027248,
+ "grad_norm": 6.885270595550537,
+ "learning_rate": 1.6178257504256006e-05,
+ "loss": 0.4163,
+ "step": 11354
+ },
+ {
+ "epoch": 30.940054495912808,
+ "grad_norm": 9.962544441223145,
+ "learning_rate": 1.6177563561394123e-05,
+ "loss": 0.5212,
+ "step": 11355
+ },
+ {
+ "epoch": 30.942779291553133,
+ "grad_norm": 7.879058837890625,
+ "learning_rate": 1.617686957042157e-05,
+ "loss": 0.4608,
+ "step": 11356
+ },
+ {
+ "epoch": 30.94550408719346,
+ "grad_norm": 9.151025772094727,
+ "learning_rate": 1.617617553134376e-05,
+ "loss": 0.5252,
+ "step": 11357
+ },
+ {
+ "epoch": 30.94822888283379,
+ "grad_norm": 7.61784553527832,
+ "learning_rate": 1.617548144416609e-05,
+ "loss": 0.3527,
+ "step": 11358
+ },
+ {
+ "epoch": 30.950953678474114,
+ "grad_norm": 7.675395965576172,
+ "learning_rate": 1.617478730889397e-05,
+ "loss": 0.4101,
+ "step": 11359
+ },
+ {
+ "epoch": 30.95367847411444,
+ "grad_norm": 7.265422344207764,
+ "learning_rate": 1.6174093125532803e-05,
+ "loss": 0.5717,
+ "step": 11360
+ },
+ {
+ "epoch": 30.95640326975477,
+ "grad_norm": 8.320547103881836,
+ "learning_rate": 1.6173398894088e-05,
+ "loss": 0.5793,
+ "step": 11361
+ },
+ {
+ "epoch": 30.959128065395095,
+ "grad_norm": 7.721741676330566,
+ "learning_rate": 1.617270461456496e-05,
+ "loss": 0.3912,
+ "step": 11362
+ },
+ {
+ "epoch": 30.96185286103542,
+ "grad_norm": 7.551270961761475,
+ "learning_rate": 1.6172010286969105e-05,
+ "loss": 0.3861,
+ "step": 11363
+ },
+ {
+ "epoch": 30.96457765667575,
+ "grad_norm": 7.487505912780762,
+ "learning_rate": 1.6171315911305824e-05,
+ "loss": 0.5294,
+ "step": 11364
+ },
+ {
+ "epoch": 30.967302452316076,
+ "grad_norm": 9.483017921447754,
+ "learning_rate": 1.6170621487580538e-05,
+ "loss": 0.3951,
+ "step": 11365
+ },
+ {
+ "epoch": 30.970027247956402,
+ "grad_norm": 8.659347534179688,
+ "learning_rate": 1.616992701579865e-05,
+ "loss": 0.423,
+ "step": 11366
+ },
+ {
+ "epoch": 30.97275204359673,
+ "grad_norm": 7.702268600463867,
+ "learning_rate": 1.616923249596557e-05,
+ "loss": 0.5224,
+ "step": 11367
+ },
+ {
+ "epoch": 30.975476839237057,
+ "grad_norm": 6.881136417388916,
+ "learning_rate": 1.6168537928086703e-05,
+ "loss": 0.4398,
+ "step": 11368
+ },
+ {
+ "epoch": 30.978201634877383,
+ "grad_norm": 7.698774337768555,
+ "learning_rate": 1.616784331216746e-05,
+ "loss": 0.4814,
+ "step": 11369
+ },
+ {
+ "epoch": 30.980926430517712,
+ "grad_norm": 7.118900775909424,
+ "learning_rate": 1.6167148648213255e-05,
+ "loss": 0.5659,
+ "step": 11370
+ },
+ {
+ "epoch": 30.983651226158038,
+ "grad_norm": 6.75089693069458,
+ "learning_rate": 1.616645393622949e-05,
+ "loss": 0.4426,
+ "step": 11371
+ },
+ {
+ "epoch": 30.986376021798364,
+ "grad_norm": 8.22135066986084,
+ "learning_rate": 1.6165759176221588e-05,
+ "loss": 0.364,
+ "step": 11372
+ },
+ {
+ "epoch": 30.989100817438693,
+ "grad_norm": 6.734350204467773,
+ "learning_rate": 1.6165064368194946e-05,
+ "loss": 0.4398,
+ "step": 11373
+ },
+ {
+ "epoch": 30.99182561307902,
+ "grad_norm": 6.77470588684082,
+ "learning_rate": 1.6164369512154984e-05,
+ "loss": 0.428,
+ "step": 11374
+ },
+ {
+ "epoch": 30.994550408719345,
+ "grad_norm": 7.893370628356934,
+ "learning_rate": 1.616367460810711e-05,
+ "loss": 0.5637,
+ "step": 11375
+ },
+ {
+ "epoch": 30.997275204359674,
+ "grad_norm": 6.426718711853027,
+ "learning_rate": 1.6162979656056735e-05,
+ "loss": 0.428,
+ "step": 11376
+ },
+ {
+ "epoch": 31.0,
+ "grad_norm": 8.785823822021484,
+ "learning_rate": 1.6162284656009276e-05,
+ "loss": 0.3823,
+ "step": 11377
+ },
+ {
+ "epoch": 31.002724795640326,
+ "grad_norm": 7.742459297180176,
+ "learning_rate": 1.6161589607970137e-05,
+ "loss": 0.4664,
+ "step": 11378
+ },
+ {
+ "epoch": 31.005449591280655,
+ "grad_norm": 6.6974992752075195,
+ "learning_rate": 1.616089451194474e-05,
+ "loss": 0.3357,
+ "step": 11379
+ },
+ {
+ "epoch": 31.00817438692098,
+ "grad_norm": 8.149337768554688,
+ "learning_rate": 1.6160199367938494e-05,
+ "loss": 0.3966,
+ "step": 11380
+ },
+ {
+ "epoch": 31.010899182561307,
+ "grad_norm": 6.426740646362305,
+ "learning_rate": 1.6159504175956815e-05,
+ "loss": 0.4183,
+ "step": 11381
+ },
+ {
+ "epoch": 31.013623978201636,
+ "grad_norm": 18.186363220214844,
+ "learning_rate": 1.6158808936005116e-05,
+ "loss": 0.4672,
+ "step": 11382
+ },
+ {
+ "epoch": 31.016348773841962,
+ "grad_norm": 17.358253479003906,
+ "learning_rate": 1.615811364808881e-05,
+ "loss": 0.3635,
+ "step": 11383
+ },
+ {
+ "epoch": 31.019073569482288,
+ "grad_norm": 7.258265972137451,
+ "learning_rate": 1.6157418312213313e-05,
+ "loss": 0.4673,
+ "step": 11384
+ },
+ {
+ "epoch": 31.021798365122617,
+ "grad_norm": 5.632544040679932,
+ "learning_rate": 1.6156722928384042e-05,
+ "loss": 0.4389,
+ "step": 11385
+ },
+ {
+ "epoch": 31.024523160762943,
+ "grad_norm": 6.65710973739624,
+ "learning_rate": 1.6156027496606408e-05,
+ "loss": 0.3953,
+ "step": 11386
+ },
+ {
+ "epoch": 31.02724795640327,
+ "grad_norm": 8.200004577636719,
+ "learning_rate": 1.615533201688583e-05,
+ "loss": 0.2825,
+ "step": 11387
+ },
+ {
+ "epoch": 31.029972752043598,
+ "grad_norm": 6.341181755065918,
+ "learning_rate": 1.6154636489227726e-05,
+ "loss": 0.4567,
+ "step": 11388
+ },
+ {
+ "epoch": 31.032697547683924,
+ "grad_norm": 8.055546760559082,
+ "learning_rate": 1.615394091363751e-05,
+ "loss": 0.3899,
+ "step": 11389
+ },
+ {
+ "epoch": 31.03542234332425,
+ "grad_norm": 6.492162704467773,
+ "learning_rate": 1.6153245290120602e-05,
+ "loss": 0.3247,
+ "step": 11390
+ },
+ {
+ "epoch": 31.03814713896458,
+ "grad_norm": 5.917665958404541,
+ "learning_rate": 1.6152549618682418e-05,
+ "loss": 0.3828,
+ "step": 11391
+ },
+ {
+ "epoch": 31.040871934604905,
+ "grad_norm": 6.391448497772217,
+ "learning_rate": 1.6151853899328377e-05,
+ "loss": 0.4669,
+ "step": 11392
+ },
+ {
+ "epoch": 31.04359673024523,
+ "grad_norm": 7.711374282836914,
+ "learning_rate": 1.6151158132063892e-05,
+ "loss": 0.3836,
+ "step": 11393
+ },
+ {
+ "epoch": 31.04632152588556,
+ "grad_norm": 8.410181045532227,
+ "learning_rate": 1.615046231689439e-05,
+ "loss": 0.5526,
+ "step": 11394
+ },
+ {
+ "epoch": 31.049046321525886,
+ "grad_norm": 9.054497718811035,
+ "learning_rate": 1.614976645382528e-05,
+ "loss": 0.4236,
+ "step": 11395
+ },
+ {
+ "epoch": 31.05177111716621,
+ "grad_norm": 7.943727493286133,
+ "learning_rate": 1.614907054286199e-05,
+ "loss": 0.4403,
+ "step": 11396
+ },
+ {
+ "epoch": 31.05449591280654,
+ "grad_norm": 7.074095726013184,
+ "learning_rate": 1.6148374584009934e-05,
+ "loss": 0.2817,
+ "step": 11397
+ },
+ {
+ "epoch": 31.057220708446867,
+ "grad_norm": 11.083065032958984,
+ "learning_rate": 1.6147678577274537e-05,
+ "loss": 0.4228,
+ "step": 11398
+ },
+ {
+ "epoch": 31.059945504087192,
+ "grad_norm": 6.933168411254883,
+ "learning_rate": 1.6146982522661216e-05,
+ "loss": 0.3752,
+ "step": 11399
+ },
+ {
+ "epoch": 31.06267029972752,
+ "grad_norm": 6.469690322875977,
+ "learning_rate": 1.6146286420175393e-05,
+ "loss": 0.3382,
+ "step": 11400
+ },
+ {
+ "epoch": 31.065395095367847,
+ "grad_norm": 12.152203559875488,
+ "learning_rate": 1.6145590269822487e-05,
+ "loss": 0.3333,
+ "step": 11401
+ },
+ {
+ "epoch": 31.068119891008173,
+ "grad_norm": 6.3950724601745605,
+ "learning_rate": 1.6144894071607927e-05,
+ "loss": 0.4603,
+ "step": 11402
+ },
+ {
+ "epoch": 31.070844686648503,
+ "grad_norm": 6.445328712463379,
+ "learning_rate": 1.6144197825537127e-05,
+ "loss": 0.4309,
+ "step": 11403
+ },
+ {
+ "epoch": 31.07356948228883,
+ "grad_norm": 6.3824334144592285,
+ "learning_rate": 1.614350153161551e-05,
+ "loss": 0.4089,
+ "step": 11404
+ },
+ {
+ "epoch": 31.076294277929154,
+ "grad_norm": 6.513887882232666,
+ "learning_rate": 1.6142805189848504e-05,
+ "loss": 0.3729,
+ "step": 11405
+ },
+ {
+ "epoch": 31.079019073569484,
+ "grad_norm": 9.495572090148926,
+ "learning_rate": 1.6142108800241527e-05,
+ "loss": 0.4035,
+ "step": 11406
+ },
+ {
+ "epoch": 31.08174386920981,
+ "grad_norm": 5.747984409332275,
+ "learning_rate": 1.6141412362800007e-05,
+ "loss": 0.2485,
+ "step": 11407
+ },
+ {
+ "epoch": 31.084468664850135,
+ "grad_norm": 6.530543804168701,
+ "learning_rate": 1.6140715877529363e-05,
+ "loss": 0.287,
+ "step": 11408
+ },
+ {
+ "epoch": 31.087193460490465,
+ "grad_norm": 6.833845615386963,
+ "learning_rate": 1.614001934443502e-05,
+ "loss": 0.3145,
+ "step": 11409
+ },
+ {
+ "epoch": 31.08991825613079,
+ "grad_norm": 6.342391014099121,
+ "learning_rate": 1.613932276352241e-05,
+ "loss": 0.4034,
+ "step": 11410
+ },
+ {
+ "epoch": 31.092643051771116,
+ "grad_norm": 6.921346664428711,
+ "learning_rate": 1.6138626134796945e-05,
+ "loss": 0.3413,
+ "step": 11411
+ },
+ {
+ "epoch": 31.095367847411445,
+ "grad_norm": 5.6658525466918945,
+ "learning_rate": 1.613792945826406e-05,
+ "loss": 0.4648,
+ "step": 11412
+ },
+ {
+ "epoch": 31.09809264305177,
+ "grad_norm": 6.347414493560791,
+ "learning_rate": 1.6137232733929176e-05,
+ "loss": 0.3158,
+ "step": 11413
+ },
+ {
+ "epoch": 31.100817438692097,
+ "grad_norm": 6.033417701721191,
+ "learning_rate": 1.6136535961797722e-05,
+ "loss": 0.6105,
+ "step": 11414
+ },
+ {
+ "epoch": 31.103542234332426,
+ "grad_norm": 8.13783073425293,
+ "learning_rate": 1.6135839141875127e-05,
+ "loss": 0.3212,
+ "step": 11415
+ },
+ {
+ "epoch": 31.106267029972752,
+ "grad_norm": 6.720310688018799,
+ "learning_rate": 1.613514227416681e-05,
+ "loss": 0.2846,
+ "step": 11416
+ },
+ {
+ "epoch": 31.108991825613078,
+ "grad_norm": 6.779971122741699,
+ "learning_rate": 1.6134445358678205e-05,
+ "loss": 0.287,
+ "step": 11417
+ },
+ {
+ "epoch": 31.111716621253407,
+ "grad_norm": 7.640523433685303,
+ "learning_rate": 1.613374839541474e-05,
+ "loss": 0.3868,
+ "step": 11418
+ },
+ {
+ "epoch": 31.114441416893733,
+ "grad_norm": 8.470203399658203,
+ "learning_rate": 1.6133051384381833e-05,
+ "loss": 0.3141,
+ "step": 11419
+ },
+ {
+ "epoch": 31.11716621253406,
+ "grad_norm": 8.201193809509277,
+ "learning_rate": 1.613235432558492e-05,
+ "loss": 0.3012,
+ "step": 11420
+ },
+ {
+ "epoch": 31.11989100817439,
+ "grad_norm": 8.012935638427734,
+ "learning_rate": 1.6131657219029428e-05,
+ "loss": 0.5099,
+ "step": 11421
+ },
+ {
+ "epoch": 31.122615803814714,
+ "grad_norm": 9.044227600097656,
+ "learning_rate": 1.613096006472079e-05,
+ "loss": 0.3509,
+ "step": 11422
+ },
+ {
+ "epoch": 31.12534059945504,
+ "grad_norm": 7.542146682739258,
+ "learning_rate": 1.6130262862664432e-05,
+ "loss": 0.3584,
+ "step": 11423
+ },
+ {
+ "epoch": 31.12806539509537,
+ "grad_norm": 6.187380313873291,
+ "learning_rate": 1.6129565612865786e-05,
+ "loss": 0.511,
+ "step": 11424
+ },
+ {
+ "epoch": 31.130790190735695,
+ "grad_norm": 7.63981294631958,
+ "learning_rate": 1.6128868315330278e-05,
+ "loss": 0.4031,
+ "step": 11425
+ },
+ {
+ "epoch": 31.13351498637602,
+ "grad_norm": 6.212061405181885,
+ "learning_rate": 1.612817097006334e-05,
+ "loss": 0.4166,
+ "step": 11426
+ },
+ {
+ "epoch": 31.13623978201635,
+ "grad_norm": 6.52099609375,
+ "learning_rate": 1.6127473577070408e-05,
+ "loss": 0.4107,
+ "step": 11427
+ },
+ {
+ "epoch": 31.138964577656676,
+ "grad_norm": 7.275450706481934,
+ "learning_rate": 1.6126776136356906e-05,
+ "loss": 0.365,
+ "step": 11428
+ },
+ {
+ "epoch": 31.141689373297,
+ "grad_norm": 7.747114181518555,
+ "learning_rate": 1.6126078647928266e-05,
+ "loss": 0.3631,
+ "step": 11429
+ },
+ {
+ "epoch": 31.14441416893733,
+ "grad_norm": 6.333340644836426,
+ "learning_rate": 1.6125381111789926e-05,
+ "loss": 0.3771,
+ "step": 11430
+ },
+ {
+ "epoch": 31.147138964577657,
+ "grad_norm": 6.653792381286621,
+ "learning_rate": 1.6124683527947317e-05,
+ "loss": 0.3546,
+ "step": 11431
+ },
+ {
+ "epoch": 31.149863760217983,
+ "grad_norm": 7.549876689910889,
+ "learning_rate": 1.6123985896405863e-05,
+ "loss": 0.3541,
+ "step": 11432
+ },
+ {
+ "epoch": 31.152588555858312,
+ "grad_norm": 8.709712982177734,
+ "learning_rate": 1.612328821717101e-05,
+ "loss": 0.4449,
+ "step": 11433
+ },
+ {
+ "epoch": 31.155313351498638,
+ "grad_norm": 7.690953254699707,
+ "learning_rate": 1.6122590490248185e-05,
+ "loss": 0.5591,
+ "step": 11434
+ },
+ {
+ "epoch": 31.158038147138964,
+ "grad_norm": 5.91731595993042,
+ "learning_rate": 1.612189271564282e-05,
+ "loss": 0.3455,
+ "step": 11435
+ },
+ {
+ "epoch": 31.160762942779293,
+ "grad_norm": 6.265995502471924,
+ "learning_rate": 1.612119489336035e-05,
+ "loss": 0.4231,
+ "step": 11436
+ },
+ {
+ "epoch": 31.16348773841962,
+ "grad_norm": 6.31031608581543,
+ "learning_rate": 1.6120497023406215e-05,
+ "loss": 0.6752,
+ "step": 11437
+ },
+ {
+ "epoch": 31.166212534059945,
+ "grad_norm": 6.493164539337158,
+ "learning_rate": 1.6119799105785845e-05,
+ "loss": 0.2769,
+ "step": 11438
+ },
+ {
+ "epoch": 31.168937329700274,
+ "grad_norm": 5.690825939178467,
+ "learning_rate": 1.6119101140504676e-05,
+ "loss": 0.2941,
+ "step": 11439
+ },
+ {
+ "epoch": 31.1716621253406,
+ "grad_norm": 9.791960716247559,
+ "learning_rate": 1.6118403127568142e-05,
+ "loss": 0.4533,
+ "step": 11440
+ },
+ {
+ "epoch": 31.174386920980925,
+ "grad_norm": 5.588350296020508,
+ "learning_rate": 1.6117705066981685e-05,
+ "loss": 0.4198,
+ "step": 11441
+ },
+ {
+ "epoch": 31.177111716621255,
+ "grad_norm": 9.831247329711914,
+ "learning_rate": 1.611700695875074e-05,
+ "loss": 0.3397,
+ "step": 11442
+ },
+ {
+ "epoch": 31.17983651226158,
+ "grad_norm": 8.07266902923584,
+ "learning_rate": 1.6116308802880737e-05,
+ "loss": 0.4969,
+ "step": 11443
+ },
+ {
+ "epoch": 31.182561307901906,
+ "grad_norm": 9.771881103515625,
+ "learning_rate": 1.6115610599377118e-05,
+ "loss": 0.5136,
+ "step": 11444
+ },
+ {
+ "epoch": 31.185286103542236,
+ "grad_norm": 6.985413074493408,
+ "learning_rate": 1.6114912348245324e-05,
+ "loss": 0.4005,
+ "step": 11445
+ },
+ {
+ "epoch": 31.18801089918256,
+ "grad_norm": 9.464669227600098,
+ "learning_rate": 1.6114214049490787e-05,
+ "loss": 0.4031,
+ "step": 11446
+ },
+ {
+ "epoch": 31.190735694822887,
+ "grad_norm": 7.2476487159729,
+ "learning_rate": 1.6113515703118948e-05,
+ "loss": 0.3992,
+ "step": 11447
+ },
+ {
+ "epoch": 31.193460490463217,
+ "grad_norm": 8.128005981445312,
+ "learning_rate": 1.6112817309135244e-05,
+ "loss": 0.4161,
+ "step": 11448
+ },
+ {
+ "epoch": 31.196185286103542,
+ "grad_norm": 5.896011829376221,
+ "learning_rate": 1.6112118867545118e-05,
+ "loss": 0.5424,
+ "step": 11449
+ },
+ {
+ "epoch": 31.19891008174387,
+ "grad_norm": 6.663732051849365,
+ "learning_rate": 1.6111420378354003e-05,
+ "loss": 0.3523,
+ "step": 11450
+ },
+ {
+ "epoch": 31.201634877384198,
+ "grad_norm": 7.829227447509766,
+ "learning_rate": 1.611072184156735e-05,
+ "loss": 0.5641,
+ "step": 11451
+ },
+ {
+ "epoch": 31.204359673024523,
+ "grad_norm": 6.647010326385498,
+ "learning_rate": 1.6110023257190587e-05,
+ "loss": 0.5236,
+ "step": 11452
+ },
+ {
+ "epoch": 31.20708446866485,
+ "grad_norm": 7.284354209899902,
+ "learning_rate": 1.6109324625229158e-05,
+ "loss": 0.4636,
+ "step": 11453
+ },
+ {
+ "epoch": 31.20980926430518,
+ "grad_norm": 6.334175109863281,
+ "learning_rate": 1.610862594568851e-05,
+ "loss": 0.3138,
+ "step": 11454
+ },
+ {
+ "epoch": 31.212534059945504,
+ "grad_norm": 7.065399169921875,
+ "learning_rate": 1.6107927218574076e-05,
+ "loss": 0.3054,
+ "step": 11455
+ },
+ {
+ "epoch": 31.21525885558583,
+ "grad_norm": 6.003612995147705,
+ "learning_rate": 1.6107228443891303e-05,
+ "loss": 0.3783,
+ "step": 11456
+ },
+ {
+ "epoch": 31.21798365122616,
+ "grad_norm": 5.7851667404174805,
+ "learning_rate": 1.610652962164563e-05,
+ "loss": 0.3906,
+ "step": 11457
+ },
+ {
+ "epoch": 31.220708446866485,
+ "grad_norm": 7.043871879577637,
+ "learning_rate": 1.6105830751842503e-05,
+ "loss": 0.3427,
+ "step": 11458
+ },
+ {
+ "epoch": 31.22343324250681,
+ "grad_norm": 5.8861823081970215,
+ "learning_rate": 1.6105131834487364e-05,
+ "loss": 0.3306,
+ "step": 11459
+ },
+ {
+ "epoch": 31.22615803814714,
+ "grad_norm": 6.036689758300781,
+ "learning_rate": 1.6104432869585652e-05,
+ "loss": 0.455,
+ "step": 11460
+ },
+ {
+ "epoch": 31.228882833787466,
+ "grad_norm": 6.158356666564941,
+ "learning_rate": 1.610373385714281e-05,
+ "loss": 0.427,
+ "step": 11461
+ },
+ {
+ "epoch": 31.231607629427792,
+ "grad_norm": 6.051694869995117,
+ "learning_rate": 1.6103034797164294e-05,
+ "loss": 0.3,
+ "step": 11462
+ },
+ {
+ "epoch": 31.23433242506812,
+ "grad_norm": 9.04263973236084,
+ "learning_rate": 1.6102335689655533e-05,
+ "loss": 0.4077,
+ "step": 11463
+ },
+ {
+ "epoch": 31.237057220708447,
+ "grad_norm": 7.521633625030518,
+ "learning_rate": 1.610163653462198e-05,
+ "loss": 0.4977,
+ "step": 11464
+ },
+ {
+ "epoch": 31.239782016348773,
+ "grad_norm": 8.390018463134766,
+ "learning_rate": 1.6100937332069074e-05,
+ "loss": 0.3568,
+ "step": 11465
+ },
+ {
+ "epoch": 31.242506811989102,
+ "grad_norm": 6.256731033325195,
+ "learning_rate": 1.610023808200227e-05,
+ "loss": 0.5061,
+ "step": 11466
+ },
+ {
+ "epoch": 31.245231607629428,
+ "grad_norm": 6.731732368469238,
+ "learning_rate": 1.6099538784427005e-05,
+ "loss": 0.3767,
+ "step": 11467
+ },
+ {
+ "epoch": 31.247956403269754,
+ "grad_norm": 6.79564094543457,
+ "learning_rate": 1.609883943934873e-05,
+ "loss": 0.4227,
+ "step": 11468
+ },
+ {
+ "epoch": 31.250681198910083,
+ "grad_norm": 6.176658630371094,
+ "learning_rate": 1.609814004677289e-05,
+ "loss": 0.4348,
+ "step": 11469
+ },
+ {
+ "epoch": 31.25340599455041,
+ "grad_norm": 5.946808338165283,
+ "learning_rate": 1.6097440606704928e-05,
+ "loss": 0.4133,
+ "step": 11470
+ },
+ {
+ "epoch": 31.256130790190735,
+ "grad_norm": 6.666254043579102,
+ "learning_rate": 1.60967411191503e-05,
+ "loss": 0.433,
+ "step": 11471
+ },
+ {
+ "epoch": 31.258855585831064,
+ "grad_norm": 8.007935523986816,
+ "learning_rate": 1.6096041584114444e-05,
+ "loss": 0.4609,
+ "step": 11472
+ },
+ {
+ "epoch": 31.26158038147139,
+ "grad_norm": 7.5098724365234375,
+ "learning_rate": 1.6095342001602813e-05,
+ "loss": 0.4758,
+ "step": 11473
+ },
+ {
+ "epoch": 31.264305177111716,
+ "grad_norm": 6.390965938568115,
+ "learning_rate": 1.6094642371620857e-05,
+ "loss": 0.2469,
+ "step": 11474
+ },
+ {
+ "epoch": 31.267029972752045,
+ "grad_norm": 6.606525897979736,
+ "learning_rate": 1.6093942694174024e-05,
+ "loss": 0.3356,
+ "step": 11475
+ },
+ {
+ "epoch": 31.26975476839237,
+ "grad_norm": 8.822193145751953,
+ "learning_rate": 1.609324296926776e-05,
+ "loss": 0.3881,
+ "step": 11476
+ },
+ {
+ "epoch": 31.272479564032697,
+ "grad_norm": 7.46927547454834,
+ "learning_rate": 1.609254319690751e-05,
+ "loss": 0.4776,
+ "step": 11477
+ },
+ {
+ "epoch": 31.275204359673026,
+ "grad_norm": 6.187511920928955,
+ "learning_rate": 1.6091843377098734e-05,
+ "loss": 0.4377,
+ "step": 11478
+ },
+ {
+ "epoch": 31.277929155313352,
+ "grad_norm": 6.347655773162842,
+ "learning_rate": 1.609114350984688e-05,
+ "loss": 0.3725,
+ "step": 11479
+ },
+ {
+ "epoch": 31.280653950953678,
+ "grad_norm": 6.0924248695373535,
+ "learning_rate": 1.6090443595157396e-05,
+ "loss": 0.5453,
+ "step": 11480
+ },
+ {
+ "epoch": 31.283378746594007,
+ "grad_norm": 8.578104972839355,
+ "learning_rate": 1.6089743633035732e-05,
+ "loss": 0.3582,
+ "step": 11481
+ },
+ {
+ "epoch": 31.286103542234333,
+ "grad_norm": 8.714938163757324,
+ "learning_rate": 1.6089043623487338e-05,
+ "loss": 0.4052,
+ "step": 11482
+ },
+ {
+ "epoch": 31.28882833787466,
+ "grad_norm": 8.156457901000977,
+ "learning_rate": 1.608834356651767e-05,
+ "loss": 0.3929,
+ "step": 11483
+ },
+ {
+ "epoch": 31.291553133514988,
+ "grad_norm": 7.4753618240356445,
+ "learning_rate": 1.608764346213218e-05,
+ "loss": 0.4719,
+ "step": 11484
+ },
+ {
+ "epoch": 31.294277929155314,
+ "grad_norm": 6.959665775299072,
+ "learning_rate": 1.6086943310336315e-05,
+ "loss": 0.2707,
+ "step": 11485
+ },
+ {
+ "epoch": 31.29700272479564,
+ "grad_norm": 6.778475761413574,
+ "learning_rate": 1.6086243111135537e-05,
+ "loss": 0.2784,
+ "step": 11486
+ },
+ {
+ "epoch": 31.29972752043597,
+ "grad_norm": 8.395167350769043,
+ "learning_rate": 1.608554286453529e-05,
+ "loss": 0.5805,
+ "step": 11487
+ },
+ {
+ "epoch": 31.302452316076295,
+ "grad_norm": 6.569278717041016,
+ "learning_rate": 1.608484257054103e-05,
+ "loss": 0.5439,
+ "step": 11488
+ },
+ {
+ "epoch": 31.30517711171662,
+ "grad_norm": 7.05552339553833,
+ "learning_rate": 1.6084142229158214e-05,
+ "loss": 0.4718,
+ "step": 11489
+ },
+ {
+ "epoch": 31.30790190735695,
+ "grad_norm": 6.05991792678833,
+ "learning_rate": 1.608344184039229e-05,
+ "loss": 0.4052,
+ "step": 11490
+ },
+ {
+ "epoch": 31.310626702997276,
+ "grad_norm": 11.234015464782715,
+ "learning_rate": 1.6082741404248724e-05,
+ "loss": 0.4645,
+ "step": 11491
+ },
+ {
+ "epoch": 31.3133514986376,
+ "grad_norm": 6.1989006996154785,
+ "learning_rate": 1.608204092073296e-05,
+ "loss": 0.2135,
+ "step": 11492
+ },
+ {
+ "epoch": 31.31607629427793,
+ "grad_norm": 6.016495227813721,
+ "learning_rate": 1.608134038985046e-05,
+ "loss": 0.339,
+ "step": 11493
+ },
+ {
+ "epoch": 31.318801089918257,
+ "grad_norm": 7.02424955368042,
+ "learning_rate": 1.608063981160667e-05,
+ "loss": 0.4274,
+ "step": 11494
+ },
+ {
+ "epoch": 31.321525885558582,
+ "grad_norm": 6.882099628448486,
+ "learning_rate": 1.6079939186007058e-05,
+ "loss": 0.4521,
+ "step": 11495
+ },
+ {
+ "epoch": 31.32425068119891,
+ "grad_norm": 7.710224628448486,
+ "learning_rate": 1.6079238513057073e-05,
+ "loss": 0.3906,
+ "step": 11496
+ },
+ {
+ "epoch": 31.326975476839237,
+ "grad_norm": 7.994422912597656,
+ "learning_rate": 1.6078537792762174e-05,
+ "loss": 0.4096,
+ "step": 11497
+ },
+ {
+ "epoch": 31.329700272479563,
+ "grad_norm": 11.75682544708252,
+ "learning_rate": 1.6077837025127817e-05,
+ "loss": 0.4886,
+ "step": 11498
+ },
+ {
+ "epoch": 31.332425068119893,
+ "grad_norm": 7.2599077224731445,
+ "learning_rate": 1.6077136210159466e-05,
+ "loss": 0.4537,
+ "step": 11499
+ },
+ {
+ "epoch": 31.33514986376022,
+ "grad_norm": 6.902833461761475,
+ "learning_rate": 1.607643534786257e-05,
+ "loss": 0.4366,
+ "step": 11500
+ },
+ {
+ "epoch": 31.337874659400544,
+ "grad_norm": 6.804143905639648,
+ "learning_rate": 1.607573443824259e-05,
+ "loss": 0.4904,
+ "step": 11501
+ },
+ {
+ "epoch": 31.340599455040874,
+ "grad_norm": 6.350834846496582,
+ "learning_rate": 1.6075033481304993e-05,
+ "loss": 0.3763,
+ "step": 11502
+ },
+ {
+ "epoch": 31.3433242506812,
+ "grad_norm": 7.131535530090332,
+ "learning_rate": 1.6074332477055224e-05,
+ "loss": 0.3984,
+ "step": 11503
+ },
+ {
+ "epoch": 31.346049046321525,
+ "grad_norm": 6.9918389320373535,
+ "learning_rate": 1.607363142549875e-05,
+ "loss": 0.3341,
+ "step": 11504
+ },
+ {
+ "epoch": 31.348773841961854,
+ "grad_norm": 9.504937171936035,
+ "learning_rate": 1.607293032664103e-05,
+ "loss": 0.4984,
+ "step": 11505
+ },
+ {
+ "epoch": 31.35149863760218,
+ "grad_norm": 6.146029949188232,
+ "learning_rate": 1.6072229180487523e-05,
+ "loss": 0.4451,
+ "step": 11506
+ },
+ {
+ "epoch": 31.354223433242506,
+ "grad_norm": 31.787803649902344,
+ "learning_rate": 1.6071527987043693e-05,
+ "loss": 0.463,
+ "step": 11507
+ },
+ {
+ "epoch": 31.356948228882835,
+ "grad_norm": 6.9770121574401855,
+ "learning_rate": 1.6070826746314997e-05,
+ "loss": 0.3743,
+ "step": 11508
+ },
+ {
+ "epoch": 31.35967302452316,
+ "grad_norm": 6.07723331451416,
+ "learning_rate": 1.60701254583069e-05,
+ "loss": 0.4515,
+ "step": 11509
+ },
+ {
+ "epoch": 31.362397820163487,
+ "grad_norm": 6.7611985206604,
+ "learning_rate": 1.606942412302486e-05,
+ "loss": 0.4048,
+ "step": 11510
+ },
+ {
+ "epoch": 31.365122615803816,
+ "grad_norm": 5.638869762420654,
+ "learning_rate": 1.606872274047434e-05,
+ "loss": 0.4251,
+ "step": 11511
+ },
+ {
+ "epoch": 31.367847411444142,
+ "grad_norm": 13.817146301269531,
+ "learning_rate": 1.6068021310660806e-05,
+ "loss": 0.4402,
+ "step": 11512
+ },
+ {
+ "epoch": 31.370572207084468,
+ "grad_norm": 7.954291343688965,
+ "learning_rate": 1.606731983358971e-05,
+ "loss": 0.3469,
+ "step": 11513
+ },
+ {
+ "epoch": 31.373297002724797,
+ "grad_norm": 6.273427486419678,
+ "learning_rate": 1.6066618309266527e-05,
+ "loss": 0.3446,
+ "step": 11514
+ },
+ {
+ "epoch": 31.376021798365123,
+ "grad_norm": 6.062036991119385,
+ "learning_rate": 1.6065916737696713e-05,
+ "loss": 0.5062,
+ "step": 11515
+ },
+ {
+ "epoch": 31.37874659400545,
+ "grad_norm": 6.418720722198486,
+ "learning_rate": 1.6065215118885737e-05,
+ "loss": 0.4177,
+ "step": 11516
+ },
+ {
+ "epoch": 31.381471389645778,
+ "grad_norm": 5.220983028411865,
+ "learning_rate": 1.6064513452839064e-05,
+ "loss": 0.296,
+ "step": 11517
+ },
+ {
+ "epoch": 31.384196185286104,
+ "grad_norm": 13.341872215270996,
+ "learning_rate": 1.6063811739562153e-05,
+ "loss": 0.4035,
+ "step": 11518
+ },
+ {
+ "epoch": 31.38692098092643,
+ "grad_norm": 7.2220964431762695,
+ "learning_rate": 1.606310997906047e-05,
+ "loss": 0.5966,
+ "step": 11519
+ },
+ {
+ "epoch": 31.38964577656676,
+ "grad_norm": 7.388582229614258,
+ "learning_rate": 1.606240817133948e-05,
+ "loss": 0.4999,
+ "step": 11520
+ },
+ {
+ "epoch": 31.392370572207085,
+ "grad_norm": 6.779852867126465,
+ "learning_rate": 1.6061706316404653e-05,
+ "loss": 0.4079,
+ "step": 11521
+ },
+ {
+ "epoch": 31.39509536784741,
+ "grad_norm": 8.740653991699219,
+ "learning_rate": 1.606100441426145e-05,
+ "loss": 0.469,
+ "step": 11522
+ },
+ {
+ "epoch": 31.39782016348774,
+ "grad_norm": 7.6170854568481445,
+ "learning_rate": 1.6060302464915346e-05,
+ "loss": 0.3007,
+ "step": 11523
+ },
+ {
+ "epoch": 31.400544959128066,
+ "grad_norm": 9.081851959228516,
+ "learning_rate": 1.6059600468371792e-05,
+ "loss": 0.3765,
+ "step": 11524
+ },
+ {
+ "epoch": 31.40326975476839,
+ "grad_norm": 7.019375801086426,
+ "learning_rate": 1.605889842463627e-05,
+ "loss": 0.3902,
+ "step": 11525
+ },
+ {
+ "epoch": 31.40599455040872,
+ "grad_norm": 7.206212043762207,
+ "learning_rate": 1.605819633371424e-05,
+ "loss": 0.3379,
+ "step": 11526
+ },
+ {
+ "epoch": 31.408719346049047,
+ "grad_norm": 7.50978946685791,
+ "learning_rate": 1.6057494195611177e-05,
+ "loss": 0.3466,
+ "step": 11527
+ },
+ {
+ "epoch": 31.411444141689373,
+ "grad_norm": 6.506180763244629,
+ "learning_rate": 1.605679201033254e-05,
+ "loss": 0.477,
+ "step": 11528
+ },
+ {
+ "epoch": 31.414168937329702,
+ "grad_norm": 6.759514331817627,
+ "learning_rate": 1.6056089777883803e-05,
+ "loss": 0.4097,
+ "step": 11529
+ },
+ {
+ "epoch": 31.416893732970028,
+ "grad_norm": 5.902039527893066,
+ "learning_rate": 1.6055387498270435e-05,
+ "loss": 0.4765,
+ "step": 11530
+ },
+ {
+ "epoch": 31.419618528610354,
+ "grad_norm": 6.8216729164123535,
+ "learning_rate": 1.60546851714979e-05,
+ "loss": 0.4055,
+ "step": 11531
+ },
+ {
+ "epoch": 31.422343324250683,
+ "grad_norm": 6.676670074462891,
+ "learning_rate": 1.6053982797571675e-05,
+ "loss": 0.3519,
+ "step": 11532
+ },
+ {
+ "epoch": 31.42506811989101,
+ "grad_norm": 8.04570198059082,
+ "learning_rate": 1.6053280376497224e-05,
+ "loss": 0.3382,
+ "step": 11533
+ },
+ {
+ "epoch": 31.427792915531334,
+ "grad_norm": 8.004631042480469,
+ "learning_rate": 1.6052577908280022e-05,
+ "loss": 0.3306,
+ "step": 11534
+ },
+ {
+ "epoch": 31.430517711171664,
+ "grad_norm": 7.521023750305176,
+ "learning_rate": 1.605187539292554e-05,
+ "loss": 0.4975,
+ "step": 11535
+ },
+ {
+ "epoch": 31.43324250681199,
+ "grad_norm": 12.086722373962402,
+ "learning_rate": 1.6051172830439243e-05,
+ "loss": 0.3757,
+ "step": 11536
+ },
+ {
+ "epoch": 31.435967302452315,
+ "grad_norm": 6.613288879394531,
+ "learning_rate": 1.605047022082661e-05,
+ "loss": 0.3819,
+ "step": 11537
+ },
+ {
+ "epoch": 31.438692098092645,
+ "grad_norm": 6.143130779266357,
+ "learning_rate": 1.6049767564093107e-05,
+ "loss": 0.3684,
+ "step": 11538
+ },
+ {
+ "epoch": 31.44141689373297,
+ "grad_norm": 7.905948638916016,
+ "learning_rate": 1.604906486024421e-05,
+ "loss": 0.455,
+ "step": 11539
+ },
+ {
+ "epoch": 31.444141689373296,
+ "grad_norm": 11.131954193115234,
+ "learning_rate": 1.6048362109285393e-05,
+ "loss": 0.3509,
+ "step": 11540
+ },
+ {
+ "epoch": 31.446866485013626,
+ "grad_norm": 7.644253730773926,
+ "learning_rate": 1.6047659311222124e-05,
+ "loss": 0.3681,
+ "step": 11541
+ },
+ {
+ "epoch": 31.44959128065395,
+ "grad_norm": 6.650498867034912,
+ "learning_rate": 1.604695646605988e-05,
+ "loss": 0.3637,
+ "step": 11542
+ },
+ {
+ "epoch": 31.452316076294277,
+ "grad_norm": 6.839574337005615,
+ "learning_rate": 1.6046253573804134e-05,
+ "loss": 0.3998,
+ "step": 11543
+ },
+ {
+ "epoch": 31.455040871934607,
+ "grad_norm": 7.17881965637207,
+ "learning_rate": 1.6045550634460357e-05,
+ "loss": 0.3868,
+ "step": 11544
+ },
+ {
+ "epoch": 31.457765667574932,
+ "grad_norm": 6.631476402282715,
+ "learning_rate": 1.6044847648034026e-05,
+ "loss": 0.36,
+ "step": 11545
+ },
+ {
+ "epoch": 31.460490463215258,
+ "grad_norm": 11.95763874053955,
+ "learning_rate": 1.604414461453062e-05,
+ "loss": 0.343,
+ "step": 11546
+ },
+ {
+ "epoch": 31.463215258855588,
+ "grad_norm": 7.350583076477051,
+ "learning_rate": 1.604344153395561e-05,
+ "loss": 0.4047,
+ "step": 11547
+ },
+ {
+ "epoch": 31.465940054495913,
+ "grad_norm": 8.300507545471191,
+ "learning_rate": 1.604273840631447e-05,
+ "loss": 0.4782,
+ "step": 11548
+ },
+ {
+ "epoch": 31.46866485013624,
+ "grad_norm": 9.675360679626465,
+ "learning_rate": 1.6042035231612678e-05,
+ "loss": 0.412,
+ "step": 11549
+ },
+ {
+ "epoch": 31.47138964577657,
+ "grad_norm": 7.928048610687256,
+ "learning_rate": 1.604133200985571e-05,
+ "loss": 0.5042,
+ "step": 11550
+ },
+ {
+ "epoch": 31.474114441416894,
+ "grad_norm": 7.155492782592773,
+ "learning_rate": 1.6040628741049044e-05,
+ "loss": 0.4232,
+ "step": 11551
+ },
+ {
+ "epoch": 31.47683923705722,
+ "grad_norm": 10.458273887634277,
+ "learning_rate": 1.6039925425198156e-05,
+ "loss": 0.4533,
+ "step": 11552
+ },
+ {
+ "epoch": 31.479564032697546,
+ "grad_norm": 7.096415042877197,
+ "learning_rate": 1.603922206230852e-05,
+ "loss": 0.356,
+ "step": 11553
+ },
+ {
+ "epoch": 31.482288828337875,
+ "grad_norm": 6.542632102966309,
+ "learning_rate": 1.603851865238562e-05,
+ "loss": 0.4031,
+ "step": 11554
+ },
+ {
+ "epoch": 31.4850136239782,
+ "grad_norm": 6.910850524902344,
+ "learning_rate": 1.6037815195434928e-05,
+ "loss": 0.376,
+ "step": 11555
+ },
+ {
+ "epoch": 31.48773841961853,
+ "grad_norm": 6.508656978607178,
+ "learning_rate": 1.6037111691461932e-05,
+ "loss": 0.2852,
+ "step": 11556
+ },
+ {
+ "epoch": 31.490463215258856,
+ "grad_norm": 8.075109481811523,
+ "learning_rate": 1.6036408140472096e-05,
+ "loss": 0.3422,
+ "step": 11557
+ },
+ {
+ "epoch": 31.493188010899182,
+ "grad_norm": 7.133546352386475,
+ "learning_rate": 1.6035704542470915e-05,
+ "loss": 0.3654,
+ "step": 11558
+ },
+ {
+ "epoch": 31.495912806539508,
+ "grad_norm": 7.562647342681885,
+ "learning_rate": 1.6035000897463857e-05,
+ "loss": 0.4445,
+ "step": 11559
+ },
+ {
+ "epoch": 31.498637602179837,
+ "grad_norm": 6.576021194458008,
+ "learning_rate": 1.603429720545641e-05,
+ "loss": 0.5146,
+ "step": 11560
+ },
+ {
+ "epoch": 31.501362397820163,
+ "grad_norm": 6.826038837432861,
+ "learning_rate": 1.6033593466454043e-05,
+ "loss": 0.3154,
+ "step": 11561
+ },
+ {
+ "epoch": 31.504087193460492,
+ "grad_norm": 7.488579750061035,
+ "learning_rate": 1.603288968046225e-05,
+ "loss": 0.382,
+ "step": 11562
+ },
+ {
+ "epoch": 31.506811989100818,
+ "grad_norm": 7.069460391998291,
+ "learning_rate": 1.6032185847486504e-05,
+ "loss": 0.3824,
+ "step": 11563
+ },
+ {
+ "epoch": 31.509536784741144,
+ "grad_norm": 6.662590980529785,
+ "learning_rate": 1.6031481967532293e-05,
+ "loss": 0.5184,
+ "step": 11564
+ },
+ {
+ "epoch": 31.51226158038147,
+ "grad_norm": 6.6659722328186035,
+ "learning_rate": 1.603077804060509e-05,
+ "loss": 0.4854,
+ "step": 11565
+ },
+ {
+ "epoch": 31.5149863760218,
+ "grad_norm": 8.528528213500977,
+ "learning_rate": 1.6030074066710387e-05,
+ "loss": 0.479,
+ "step": 11566
+ },
+ {
+ "epoch": 31.517711171662125,
+ "grad_norm": 7.04036808013916,
+ "learning_rate": 1.6029370045853655e-05,
+ "loss": 0.3589,
+ "step": 11567
+ },
+ {
+ "epoch": 31.520435967302454,
+ "grad_norm": 8.598791122436523,
+ "learning_rate": 1.6028665978040388e-05,
+ "loss": 0.3669,
+ "step": 11568
+ },
+ {
+ "epoch": 31.52316076294278,
+ "grad_norm": 7.442421913146973,
+ "learning_rate": 1.602796186327606e-05,
+ "loss": 0.3,
+ "step": 11569
+ },
+ {
+ "epoch": 31.525885558583106,
+ "grad_norm": 7.288723468780518,
+ "learning_rate": 1.6027257701566162e-05,
+ "loss": 0.4641,
+ "step": 11570
+ },
+ {
+ "epoch": 31.52861035422343,
+ "grad_norm": 7.482388019561768,
+ "learning_rate": 1.6026553492916175e-05,
+ "loss": 0.3338,
+ "step": 11571
+ },
+ {
+ "epoch": 31.53133514986376,
+ "grad_norm": 8.168521881103516,
+ "learning_rate": 1.6025849237331583e-05,
+ "loss": 0.4507,
+ "step": 11572
+ },
+ {
+ "epoch": 31.534059945504087,
+ "grad_norm": 8.634714126586914,
+ "learning_rate": 1.602514493481787e-05,
+ "loss": 0.3071,
+ "step": 11573
+ },
+ {
+ "epoch": 31.536784741144416,
+ "grad_norm": 7.620938301086426,
+ "learning_rate": 1.6024440585380524e-05,
+ "loss": 0.452,
+ "step": 11574
+ },
+ {
+ "epoch": 31.539509536784742,
+ "grad_norm": 6.787168025970459,
+ "learning_rate": 1.6023736189025027e-05,
+ "loss": 0.4082,
+ "step": 11575
+ },
+ {
+ "epoch": 31.542234332425068,
+ "grad_norm": 7.074665069580078,
+ "learning_rate": 1.6023031745756864e-05,
+ "loss": 0.3651,
+ "step": 11576
+ },
+ {
+ "epoch": 31.544959128065393,
+ "grad_norm": 8.468385696411133,
+ "learning_rate": 1.602232725558153e-05,
+ "loss": 0.5849,
+ "step": 11577
+ },
+ {
+ "epoch": 31.547683923705723,
+ "grad_norm": 10.36236572265625,
+ "learning_rate": 1.6021622718504503e-05,
+ "loss": 0.4119,
+ "step": 11578
+ },
+ {
+ "epoch": 31.55040871934605,
+ "grad_norm": 8.830389022827148,
+ "learning_rate": 1.602091813453127e-05,
+ "loss": 0.4364,
+ "step": 11579
+ },
+ {
+ "epoch": 31.553133514986374,
+ "grad_norm": 7.7621846199035645,
+ "learning_rate": 1.602021350366732e-05,
+ "loss": 0.4208,
+ "step": 11580
+ },
+ {
+ "epoch": 31.555858310626704,
+ "grad_norm": 7.33500337600708,
+ "learning_rate": 1.6019508825918144e-05,
+ "loss": 0.427,
+ "step": 11581
+ },
+ {
+ "epoch": 31.55858310626703,
+ "grad_norm": 8.304717063903809,
+ "learning_rate": 1.6018804101289224e-05,
+ "loss": 0.6447,
+ "step": 11582
+ },
+ {
+ "epoch": 31.561307901907355,
+ "grad_norm": 7.474731922149658,
+ "learning_rate": 1.6018099329786053e-05,
+ "loss": 0.4329,
+ "step": 11583
+ },
+ {
+ "epoch": 31.564032697547685,
+ "grad_norm": 7.509472846984863,
+ "learning_rate": 1.6017394511414116e-05,
+ "loss": 0.4271,
+ "step": 11584
+ },
+ {
+ "epoch": 31.56675749318801,
+ "grad_norm": 8.360748291015625,
+ "learning_rate": 1.6016689646178906e-05,
+ "loss": 0.41,
+ "step": 11585
+ },
+ {
+ "epoch": 31.569482288828336,
+ "grad_norm": 7.341002941131592,
+ "learning_rate": 1.601598473408591e-05,
+ "loss": 0.5343,
+ "step": 11586
+ },
+ {
+ "epoch": 31.572207084468666,
+ "grad_norm": 8.834521293640137,
+ "learning_rate": 1.601527977514062e-05,
+ "loss": 0.4105,
+ "step": 11587
+ },
+ {
+ "epoch": 31.57493188010899,
+ "grad_norm": 6.91571044921875,
+ "learning_rate": 1.6014574769348526e-05,
+ "loss": 0.3516,
+ "step": 11588
+ },
+ {
+ "epoch": 31.577656675749317,
+ "grad_norm": 7.660037040710449,
+ "learning_rate": 1.6013869716715113e-05,
+ "loss": 0.4901,
+ "step": 11589
+ },
+ {
+ "epoch": 31.580381471389646,
+ "grad_norm": 7.215074062347412,
+ "learning_rate": 1.601316461724588e-05,
+ "loss": 0.4988,
+ "step": 11590
+ },
+ {
+ "epoch": 31.583106267029972,
+ "grad_norm": 5.853626251220703,
+ "learning_rate": 1.6012459470946315e-05,
+ "loss": 0.3817,
+ "step": 11591
+ },
+ {
+ "epoch": 31.585831062670298,
+ "grad_norm": 6.667288303375244,
+ "learning_rate": 1.6011754277821906e-05,
+ "loss": 0.3326,
+ "step": 11592
+ },
+ {
+ "epoch": 31.588555858310627,
+ "grad_norm": 7.225183486938477,
+ "learning_rate": 1.6011049037878145e-05,
+ "loss": 0.2822,
+ "step": 11593
+ },
+ {
+ "epoch": 31.591280653950953,
+ "grad_norm": 13.11107063293457,
+ "learning_rate": 1.6010343751120533e-05,
+ "loss": 0.4475,
+ "step": 11594
+ },
+ {
+ "epoch": 31.59400544959128,
+ "grad_norm": 6.232799053192139,
+ "learning_rate": 1.6009638417554555e-05,
+ "loss": 0.3852,
+ "step": 11595
+ },
+ {
+ "epoch": 31.59673024523161,
+ "grad_norm": 7.203550815582275,
+ "learning_rate": 1.600893303718571e-05,
+ "loss": 0.4605,
+ "step": 11596
+ },
+ {
+ "epoch": 31.599455040871934,
+ "grad_norm": 7.108577251434326,
+ "learning_rate": 1.6008227610019485e-05,
+ "loss": 0.3255,
+ "step": 11597
+ },
+ {
+ "epoch": 31.60217983651226,
+ "grad_norm": 6.979862213134766,
+ "learning_rate": 1.6007522136061378e-05,
+ "loss": 0.3233,
+ "step": 11598
+ },
+ {
+ "epoch": 31.60490463215259,
+ "grad_norm": 7.540842533111572,
+ "learning_rate": 1.600681661531688e-05,
+ "loss": 0.3895,
+ "step": 11599
+ },
+ {
+ "epoch": 31.607629427792915,
+ "grad_norm": 7.842855930328369,
+ "learning_rate": 1.600611104779149e-05,
+ "loss": 0.3889,
+ "step": 11600
+ },
+ {
+ "epoch": 31.61035422343324,
+ "grad_norm": 7.594421863555908,
+ "learning_rate": 1.6005405433490694e-05,
+ "loss": 0.3911,
+ "step": 11601
+ },
+ {
+ "epoch": 31.61307901907357,
+ "grad_norm": 5.4124908447265625,
+ "learning_rate": 1.600469977242e-05,
+ "loss": 0.5018,
+ "step": 11602
+ },
+ {
+ "epoch": 31.615803814713896,
+ "grad_norm": 6.882364749908447,
+ "learning_rate": 1.6003994064584895e-05,
+ "loss": 0.3772,
+ "step": 11603
+ },
+ {
+ "epoch": 31.618528610354222,
+ "grad_norm": 8.891324043273926,
+ "learning_rate": 1.600328830999088e-05,
+ "loss": 0.3677,
+ "step": 11604
+ },
+ {
+ "epoch": 31.62125340599455,
+ "grad_norm": 8.092884063720703,
+ "learning_rate": 1.6002582508643446e-05,
+ "loss": 0.4644,
+ "step": 11605
+ },
+ {
+ "epoch": 31.623978201634877,
+ "grad_norm": 13.51522445678711,
+ "learning_rate": 1.6001876660548098e-05,
+ "loss": 0.2916,
+ "step": 11606
+ },
+ {
+ "epoch": 31.626702997275203,
+ "grad_norm": 7.009510040283203,
+ "learning_rate": 1.6001170765710323e-05,
+ "loss": 0.4711,
+ "step": 11607
+ },
+ {
+ "epoch": 31.629427792915532,
+ "grad_norm": 6.411016941070557,
+ "learning_rate": 1.6000464824135623e-05,
+ "loss": 0.3018,
+ "step": 11608
+ },
+ {
+ "epoch": 31.632152588555858,
+ "grad_norm": 8.686745643615723,
+ "learning_rate": 1.5999758835829497e-05,
+ "loss": 0.458,
+ "step": 11609
+ },
+ {
+ "epoch": 31.634877384196184,
+ "grad_norm": 7.0936102867126465,
+ "learning_rate": 1.599905280079744e-05,
+ "loss": 0.4555,
+ "step": 11610
+ },
+ {
+ "epoch": 31.637602179836513,
+ "grad_norm": 5.631973743438721,
+ "learning_rate": 1.5998346719044956e-05,
+ "loss": 0.3708,
+ "step": 11611
+ },
+ {
+ "epoch": 31.64032697547684,
+ "grad_norm": 9.096990585327148,
+ "learning_rate": 1.5997640590577544e-05,
+ "loss": 0.4305,
+ "step": 11612
+ },
+ {
+ "epoch": 31.643051771117165,
+ "grad_norm": 8.056363105773926,
+ "learning_rate": 1.5996934415400694e-05,
+ "loss": 0.5111,
+ "step": 11613
+ },
+ {
+ "epoch": 31.645776566757494,
+ "grad_norm": 7.630584716796875,
+ "learning_rate": 1.5996228193519914e-05,
+ "loss": 0.4622,
+ "step": 11614
+ },
+ {
+ "epoch": 31.64850136239782,
+ "grad_norm": 8.496237754821777,
+ "learning_rate": 1.5995521924940704e-05,
+ "loss": 0.3883,
+ "step": 11615
+ },
+ {
+ "epoch": 31.651226158038146,
+ "grad_norm": 6.984487056732178,
+ "learning_rate": 1.5994815609668558e-05,
+ "loss": 0.5494,
+ "step": 11616
+ },
+ {
+ "epoch": 31.653950953678475,
+ "grad_norm": 8.360382080078125,
+ "learning_rate": 1.5994109247708983e-05,
+ "loss": 0.6595,
+ "step": 11617
+ },
+ {
+ "epoch": 31.6566757493188,
+ "grad_norm": 7.152622222900391,
+ "learning_rate": 1.5993402839067477e-05,
+ "loss": 0.3386,
+ "step": 11618
+ },
+ {
+ "epoch": 31.659400544959126,
+ "grad_norm": 30.050329208374023,
+ "learning_rate": 1.5992696383749543e-05,
+ "loss": 0.4098,
+ "step": 11619
+ },
+ {
+ "epoch": 31.662125340599456,
+ "grad_norm": 6.905817031860352,
+ "learning_rate": 1.5991989881760687e-05,
+ "loss": 0.4179,
+ "step": 11620
+ },
+ {
+ "epoch": 31.66485013623978,
+ "grad_norm": 6.6429572105407715,
+ "learning_rate": 1.59912833331064e-05,
+ "loss": 0.563,
+ "step": 11621
+ },
+ {
+ "epoch": 31.667574931880107,
+ "grad_norm": 7.85490608215332,
+ "learning_rate": 1.5990576737792192e-05,
+ "loss": 0.3966,
+ "step": 11622
+ },
+ {
+ "epoch": 31.670299727520437,
+ "grad_norm": 7.767920017242432,
+ "learning_rate": 1.598987009582357e-05,
+ "loss": 0.434,
+ "step": 11623
+ },
+ {
+ "epoch": 31.673024523160763,
+ "grad_norm": 6.833701133728027,
+ "learning_rate": 1.598916340720603e-05,
+ "loss": 0.4659,
+ "step": 11624
+ },
+ {
+ "epoch": 31.67574931880109,
+ "grad_norm": 7.239294052124023,
+ "learning_rate": 1.5988456671945078e-05,
+ "loss": 0.3643,
+ "step": 11625
+ },
+ {
+ "epoch": 31.678474114441418,
+ "grad_norm": 13.427486419677734,
+ "learning_rate": 1.598774989004622e-05,
+ "loss": 0.5385,
+ "step": 11626
+ },
+ {
+ "epoch": 31.681198910081743,
+ "grad_norm": 6.485818862915039,
+ "learning_rate": 1.5987043061514953e-05,
+ "loss": 0.4117,
+ "step": 11627
+ },
+ {
+ "epoch": 31.68392370572207,
+ "grad_norm": 6.466250419616699,
+ "learning_rate": 1.598633618635679e-05,
+ "loss": 0.5883,
+ "step": 11628
+ },
+ {
+ "epoch": 31.6866485013624,
+ "grad_norm": 6.980894565582275,
+ "learning_rate": 1.5985629264577237e-05,
+ "loss": 0.5242,
+ "step": 11629
+ },
+ {
+ "epoch": 31.689373297002724,
+ "grad_norm": 7.625382423400879,
+ "learning_rate": 1.5984922296181794e-05,
+ "loss": 0.5074,
+ "step": 11630
+ },
+ {
+ "epoch": 31.69209809264305,
+ "grad_norm": 9.570500373840332,
+ "learning_rate": 1.5984215281175964e-05,
+ "loss": 0.3946,
+ "step": 11631
+ },
+ {
+ "epoch": 31.69482288828338,
+ "grad_norm": 6.711041450500488,
+ "learning_rate": 1.5983508219565264e-05,
+ "loss": 0.2941,
+ "step": 11632
+ },
+ {
+ "epoch": 31.697547683923705,
+ "grad_norm": 6.9375104904174805,
+ "learning_rate": 1.5982801111355195e-05,
+ "loss": 0.3896,
+ "step": 11633
+ },
+ {
+ "epoch": 31.70027247956403,
+ "grad_norm": 9.227879524230957,
+ "learning_rate": 1.598209395655126e-05,
+ "loss": 0.5455,
+ "step": 11634
+ },
+ {
+ "epoch": 31.70299727520436,
+ "grad_norm": 7.8122687339782715,
+ "learning_rate": 1.598138675515897e-05,
+ "loss": 0.5035,
+ "step": 11635
+ },
+ {
+ "epoch": 31.705722070844686,
+ "grad_norm": 8.350142478942871,
+ "learning_rate": 1.5980679507183834e-05,
+ "loss": 0.4818,
+ "step": 11636
+ },
+ {
+ "epoch": 31.708446866485012,
+ "grad_norm": 17.139902114868164,
+ "learning_rate": 1.5979972212631358e-05,
+ "loss": 0.437,
+ "step": 11637
+ },
+ {
+ "epoch": 31.71117166212534,
+ "grad_norm": 6.634777545928955,
+ "learning_rate": 1.597926487150705e-05,
+ "loss": 0.4443,
+ "step": 11638
+ },
+ {
+ "epoch": 31.713896457765667,
+ "grad_norm": 8.797743797302246,
+ "learning_rate": 1.5978557483816423e-05,
+ "loss": 0.3745,
+ "step": 11639
+ },
+ {
+ "epoch": 31.716621253405993,
+ "grad_norm": 5.549252510070801,
+ "learning_rate": 1.5977850049564978e-05,
+ "loss": 0.4563,
+ "step": 11640
+ },
+ {
+ "epoch": 31.719346049046322,
+ "grad_norm": 7.894062519073486,
+ "learning_rate": 1.597714256875823e-05,
+ "loss": 0.3588,
+ "step": 11641
+ },
+ {
+ "epoch": 31.722070844686648,
+ "grad_norm": 7.197150707244873,
+ "learning_rate": 1.597643504140169e-05,
+ "loss": 0.4125,
+ "step": 11642
+ },
+ {
+ "epoch": 31.724795640326974,
+ "grad_norm": 7.9397687911987305,
+ "learning_rate": 1.597572746750087e-05,
+ "loss": 0.4016,
+ "step": 11643
+ },
+ {
+ "epoch": 31.727520435967303,
+ "grad_norm": 12.798469543457031,
+ "learning_rate": 1.597501984706127e-05,
+ "loss": 0.4362,
+ "step": 11644
+ },
+ {
+ "epoch": 31.73024523160763,
+ "grad_norm": 7.300980091094971,
+ "learning_rate": 1.5974312180088407e-05,
+ "loss": 0.4783,
+ "step": 11645
+ },
+ {
+ "epoch": 31.732970027247955,
+ "grad_norm": 7.096359729766846,
+ "learning_rate": 1.5973604466587797e-05,
+ "loss": 0.4644,
+ "step": 11646
+ },
+ {
+ "epoch": 31.735694822888284,
+ "grad_norm": 8.164803504943848,
+ "learning_rate": 1.597289670656495e-05,
+ "loss": 0.4043,
+ "step": 11647
+ },
+ {
+ "epoch": 31.73841961852861,
+ "grad_norm": 7.867160797119141,
+ "learning_rate": 1.5972188900025368e-05,
+ "loss": 0.4754,
+ "step": 11648
+ },
+ {
+ "epoch": 31.741144414168936,
+ "grad_norm": 8.261493682861328,
+ "learning_rate": 1.5971481046974576e-05,
+ "loss": 0.3015,
+ "step": 11649
+ },
+ {
+ "epoch": 31.743869209809265,
+ "grad_norm": 15.797551155090332,
+ "learning_rate": 1.5970773147418084e-05,
+ "loss": 0.4188,
+ "step": 11650
+ },
+ {
+ "epoch": 31.74659400544959,
+ "grad_norm": 9.968244552612305,
+ "learning_rate": 1.59700652013614e-05,
+ "loss": 0.455,
+ "step": 11651
+ },
+ {
+ "epoch": 31.749318801089917,
+ "grad_norm": 7.915208339691162,
+ "learning_rate": 1.5969357208810043e-05,
+ "loss": 0.378,
+ "step": 11652
+ },
+ {
+ "epoch": 31.752043596730246,
+ "grad_norm": 10.037928581237793,
+ "learning_rate": 1.5968649169769518e-05,
+ "loss": 0.451,
+ "step": 11653
+ },
+ {
+ "epoch": 31.754768392370572,
+ "grad_norm": 7.658346652984619,
+ "learning_rate": 1.596794108424535e-05,
+ "loss": 0.3637,
+ "step": 11654
+ },
+ {
+ "epoch": 31.757493188010898,
+ "grad_norm": 16.169321060180664,
+ "learning_rate": 1.5967232952243048e-05,
+ "loss": 0.4568,
+ "step": 11655
+ },
+ {
+ "epoch": 31.760217983651227,
+ "grad_norm": 7.466304302215576,
+ "learning_rate": 1.5966524773768127e-05,
+ "loss": 0.4997,
+ "step": 11656
+ },
+ {
+ "epoch": 31.762942779291553,
+ "grad_norm": 8.412617683410645,
+ "learning_rate": 1.5965816548826104e-05,
+ "loss": 0.4415,
+ "step": 11657
+ },
+ {
+ "epoch": 31.76566757493188,
+ "grad_norm": 8.815930366516113,
+ "learning_rate": 1.5965108277422493e-05,
+ "loss": 0.372,
+ "step": 11658
+ },
+ {
+ "epoch": 31.768392370572208,
+ "grad_norm": 9.237602233886719,
+ "learning_rate": 1.5964399959562812e-05,
+ "loss": 0.5867,
+ "step": 11659
+ },
+ {
+ "epoch": 31.771117166212534,
+ "grad_norm": 11.187580108642578,
+ "learning_rate": 1.5963691595252576e-05,
+ "loss": 0.3711,
+ "step": 11660
+ },
+ {
+ "epoch": 31.77384196185286,
+ "grad_norm": 8.331928253173828,
+ "learning_rate": 1.5962983184497304e-05,
+ "loss": 0.4207,
+ "step": 11661
+ },
+ {
+ "epoch": 31.77656675749319,
+ "grad_norm": 7.726268768310547,
+ "learning_rate": 1.5962274727302506e-05,
+ "loss": 0.4157,
+ "step": 11662
+ },
+ {
+ "epoch": 31.779291553133515,
+ "grad_norm": 7.6028594970703125,
+ "learning_rate": 1.5961566223673707e-05,
+ "loss": 0.4979,
+ "step": 11663
+ },
+ {
+ "epoch": 31.78201634877384,
+ "grad_norm": 8.230978012084961,
+ "learning_rate": 1.5960857673616423e-05,
+ "loss": 0.3914,
+ "step": 11664
+ },
+ {
+ "epoch": 31.78474114441417,
+ "grad_norm": 11.412215232849121,
+ "learning_rate": 1.5960149077136167e-05,
+ "loss": 0.3205,
+ "step": 11665
+ },
+ {
+ "epoch": 31.787465940054496,
+ "grad_norm": 7.51002311706543,
+ "learning_rate": 1.5959440434238465e-05,
+ "loss": 0.3669,
+ "step": 11666
+ },
+ {
+ "epoch": 31.79019073569482,
+ "grad_norm": 6.666199684143066,
+ "learning_rate": 1.5958731744928836e-05,
+ "loss": 0.3662,
+ "step": 11667
+ },
+ {
+ "epoch": 31.79291553133515,
+ "grad_norm": 7.396177768707275,
+ "learning_rate": 1.595802300921279e-05,
+ "loss": 0.4617,
+ "step": 11668
+ },
+ {
+ "epoch": 31.795640326975477,
+ "grad_norm": 8.355841636657715,
+ "learning_rate": 1.5957314227095854e-05,
+ "loss": 0.4491,
+ "step": 11669
+ },
+ {
+ "epoch": 31.798365122615802,
+ "grad_norm": 6.12953519821167,
+ "learning_rate": 1.5956605398583547e-05,
+ "loss": 0.4865,
+ "step": 11670
+ },
+ {
+ "epoch": 31.80108991825613,
+ "grad_norm": 8.663213729858398,
+ "learning_rate": 1.5955896523681392e-05,
+ "loss": 0.5633,
+ "step": 11671
+ },
+ {
+ "epoch": 31.803814713896458,
+ "grad_norm": 8.228528022766113,
+ "learning_rate": 1.5955187602394904e-05,
+ "loss": 0.4255,
+ "step": 11672
+ },
+ {
+ "epoch": 31.806539509536783,
+ "grad_norm": 8.043113708496094,
+ "learning_rate": 1.5954478634729605e-05,
+ "loss": 0.5658,
+ "step": 11673
+ },
+ {
+ "epoch": 31.809264305177113,
+ "grad_norm": 8.05732250213623,
+ "learning_rate": 1.595376962069102e-05,
+ "loss": 0.4994,
+ "step": 11674
+ },
+ {
+ "epoch": 31.81198910081744,
+ "grad_norm": 9.802180290222168,
+ "learning_rate": 1.5953060560284666e-05,
+ "loss": 0.4033,
+ "step": 11675
+ },
+ {
+ "epoch": 31.814713896457764,
+ "grad_norm": 9.854981422424316,
+ "learning_rate": 1.5952351453516076e-05,
+ "loss": 0.3839,
+ "step": 11676
+ },
+ {
+ "epoch": 31.817438692098094,
+ "grad_norm": 7.649071216583252,
+ "learning_rate": 1.5951642300390755e-05,
+ "loss": 0.5664,
+ "step": 11677
+ },
+ {
+ "epoch": 31.82016348773842,
+ "grad_norm": 8.393444061279297,
+ "learning_rate": 1.5950933100914242e-05,
+ "loss": 0.3582,
+ "step": 11678
+ },
+ {
+ "epoch": 31.822888283378745,
+ "grad_norm": 6.505215644836426,
+ "learning_rate": 1.5950223855092047e-05,
+ "loss": 0.4206,
+ "step": 11679
+ },
+ {
+ "epoch": 31.825613079019075,
+ "grad_norm": 9.40150260925293,
+ "learning_rate": 1.5949514562929706e-05,
+ "loss": 0.5851,
+ "step": 11680
+ },
+ {
+ "epoch": 31.8283378746594,
+ "grad_norm": 8.124299049377441,
+ "learning_rate": 1.5948805224432736e-05,
+ "loss": 0.3621,
+ "step": 11681
+ },
+ {
+ "epoch": 31.831062670299726,
+ "grad_norm": 12.069969177246094,
+ "learning_rate": 1.5948095839606657e-05,
+ "loss": 0.3731,
+ "step": 11682
+ },
+ {
+ "epoch": 31.833787465940055,
+ "grad_norm": 7.199894428253174,
+ "learning_rate": 1.5947386408457005e-05,
+ "loss": 0.3736,
+ "step": 11683
+ },
+ {
+ "epoch": 31.83651226158038,
+ "grad_norm": 7.235996723175049,
+ "learning_rate": 1.5946676930989296e-05,
+ "loss": 0.3235,
+ "step": 11684
+ },
+ {
+ "epoch": 31.839237057220707,
+ "grad_norm": 13.020691871643066,
+ "learning_rate": 1.5945967407209062e-05,
+ "loss": 0.3165,
+ "step": 11685
+ },
+ {
+ "epoch": 31.841961852861036,
+ "grad_norm": 8.26447868347168,
+ "learning_rate": 1.5945257837121825e-05,
+ "loss": 0.3387,
+ "step": 11686
+ },
+ {
+ "epoch": 31.844686648501362,
+ "grad_norm": 8.25384521484375,
+ "learning_rate": 1.5944548220733107e-05,
+ "loss": 0.3323,
+ "step": 11687
+ },
+ {
+ "epoch": 31.847411444141688,
+ "grad_norm": 7.659300804138184,
+ "learning_rate": 1.5943838558048442e-05,
+ "loss": 0.3542,
+ "step": 11688
+ },
+ {
+ "epoch": 31.850136239782017,
+ "grad_norm": 7.018349647521973,
+ "learning_rate": 1.594312884907335e-05,
+ "loss": 0.4067,
+ "step": 11689
+ },
+ {
+ "epoch": 31.852861035422343,
+ "grad_norm": 9.388994216918945,
+ "learning_rate": 1.5942419093813365e-05,
+ "loss": 0.494,
+ "step": 11690
+ },
+ {
+ "epoch": 31.85558583106267,
+ "grad_norm": 8.678350448608398,
+ "learning_rate": 1.5941709292274012e-05,
+ "loss": 0.4118,
+ "step": 11691
+ },
+ {
+ "epoch": 31.858310626703,
+ "grad_norm": 7.856499195098877,
+ "learning_rate": 1.594099944446082e-05,
+ "loss": 0.4857,
+ "step": 11692
+ },
+ {
+ "epoch": 31.861035422343324,
+ "grad_norm": 8.969182968139648,
+ "learning_rate": 1.5940289550379312e-05,
+ "loss": 0.3589,
+ "step": 11693
+ },
+ {
+ "epoch": 31.86376021798365,
+ "grad_norm": 42.84821319580078,
+ "learning_rate": 1.5939579610035017e-05,
+ "loss": 0.5277,
+ "step": 11694
+ },
+ {
+ "epoch": 31.86648501362398,
+ "grad_norm": 6.726892471313477,
+ "learning_rate": 1.5938869623433474e-05,
+ "loss": 0.2977,
+ "step": 11695
+ },
+ {
+ "epoch": 31.869209809264305,
+ "grad_norm": 7.893887996673584,
+ "learning_rate": 1.59381595905802e-05,
+ "loss": 0.3669,
+ "step": 11696
+ },
+ {
+ "epoch": 31.87193460490463,
+ "grad_norm": 8.389455795288086,
+ "learning_rate": 1.5937449511480735e-05,
+ "loss": 0.4604,
+ "step": 11697
+ },
+ {
+ "epoch": 31.87465940054496,
+ "grad_norm": 7.12132453918457,
+ "learning_rate": 1.5936739386140602e-05,
+ "loss": 0.5257,
+ "step": 11698
+ },
+ {
+ "epoch": 31.877384196185286,
+ "grad_norm": 9.241552352905273,
+ "learning_rate": 1.593602921456533e-05,
+ "loss": 0.4019,
+ "step": 11699
+ },
+ {
+ "epoch": 31.88010899182561,
+ "grad_norm": 8.437087059020996,
+ "learning_rate": 1.593531899676046e-05,
+ "loss": 0.3466,
+ "step": 11700
+ },
+ {
+ "epoch": 31.88283378746594,
+ "grad_norm": 11.758437156677246,
+ "learning_rate": 1.5934608732731516e-05,
+ "loss": 0.3138,
+ "step": 11701
+ },
+ {
+ "epoch": 31.885558583106267,
+ "grad_norm": 7.625300407409668,
+ "learning_rate": 1.5933898422484026e-05,
+ "loss": 0.5699,
+ "step": 11702
+ },
+ {
+ "epoch": 31.888283378746593,
+ "grad_norm": 12.781292915344238,
+ "learning_rate": 1.593318806602353e-05,
+ "loss": 0.4352,
+ "step": 11703
+ },
+ {
+ "epoch": 31.891008174386922,
+ "grad_norm": 9.552247047424316,
+ "learning_rate": 1.5932477663355554e-05,
+ "loss": 0.3774,
+ "step": 11704
+ },
+ {
+ "epoch": 31.893732970027248,
+ "grad_norm": 6.996197700500488,
+ "learning_rate": 1.593176721448563e-05,
+ "loss": 0.3453,
+ "step": 11705
+ },
+ {
+ "epoch": 31.896457765667574,
+ "grad_norm": 16.7490177154541,
+ "learning_rate": 1.59310567194193e-05,
+ "loss": 0.3861,
+ "step": 11706
+ },
+ {
+ "epoch": 31.899182561307903,
+ "grad_norm": 7.065978050231934,
+ "learning_rate": 1.593034617816209e-05,
+ "loss": 0.5357,
+ "step": 11707
+ },
+ {
+ "epoch": 31.90190735694823,
+ "grad_norm": 10.968025207519531,
+ "learning_rate": 1.592963559071953e-05,
+ "loss": 0.3481,
+ "step": 11708
+ },
+ {
+ "epoch": 31.904632152588555,
+ "grad_norm": 12.107632637023926,
+ "learning_rate": 1.5928924957097166e-05,
+ "loss": 0.3795,
+ "step": 11709
+ },
+ {
+ "epoch": 31.907356948228884,
+ "grad_norm": 8.137904167175293,
+ "learning_rate": 1.5928214277300517e-05,
+ "loss": 0.4666,
+ "step": 11710
+ },
+ {
+ "epoch": 31.91008174386921,
+ "grad_norm": 7.665256500244141,
+ "learning_rate": 1.5927503551335132e-05,
+ "loss": 0.3523,
+ "step": 11711
+ },
+ {
+ "epoch": 31.912806539509535,
+ "grad_norm": 8.476051330566406,
+ "learning_rate": 1.592679277920654e-05,
+ "loss": 0.454,
+ "step": 11712
+ },
+ {
+ "epoch": 31.915531335149865,
+ "grad_norm": 8.426595687866211,
+ "learning_rate": 1.5926081960920276e-05,
+ "loss": 0.4902,
+ "step": 11713
+ },
+ {
+ "epoch": 31.91825613079019,
+ "grad_norm": 8.372299194335938,
+ "learning_rate": 1.5925371096481873e-05,
+ "loss": 0.4849,
+ "step": 11714
+ },
+ {
+ "epoch": 31.920980926430516,
+ "grad_norm": 9.851797103881836,
+ "learning_rate": 1.592466018589687e-05,
+ "loss": 0.3605,
+ "step": 11715
+ },
+ {
+ "epoch": 31.923705722070846,
+ "grad_norm": 7.402262210845947,
+ "learning_rate": 1.592394922917081e-05,
+ "loss": 0.4611,
+ "step": 11716
+ },
+ {
+ "epoch": 31.92643051771117,
+ "grad_norm": 8.301385879516602,
+ "learning_rate": 1.592323822630922e-05,
+ "loss": 0.4348,
+ "step": 11717
+ },
+ {
+ "epoch": 31.929155313351497,
+ "grad_norm": 10.224685668945312,
+ "learning_rate": 1.5922527177317646e-05,
+ "loss": 0.4246,
+ "step": 11718
+ },
+ {
+ "epoch": 31.931880108991827,
+ "grad_norm": 7.9992451667785645,
+ "learning_rate": 1.5921816082201614e-05,
+ "loss": 0.4367,
+ "step": 11719
+ },
+ {
+ "epoch": 31.934604904632153,
+ "grad_norm": 9.548096656799316,
+ "learning_rate": 1.5921104940966675e-05,
+ "loss": 0.6477,
+ "step": 11720
+ },
+ {
+ "epoch": 31.93732970027248,
+ "grad_norm": 8.109225273132324,
+ "learning_rate": 1.592039375361836e-05,
+ "loss": 0.4449,
+ "step": 11721
+ },
+ {
+ "epoch": 31.940054495912808,
+ "grad_norm": 8.547680854797363,
+ "learning_rate": 1.5919682520162208e-05,
+ "loss": 0.5069,
+ "step": 11722
+ },
+ {
+ "epoch": 31.942779291553133,
+ "grad_norm": 9.245973587036133,
+ "learning_rate": 1.591897124060376e-05,
+ "loss": 0.6393,
+ "step": 11723
+ },
+ {
+ "epoch": 31.94550408719346,
+ "grad_norm": 11.543919563293457,
+ "learning_rate": 1.591825991494855e-05,
+ "loss": 0.3292,
+ "step": 11724
+ },
+ {
+ "epoch": 31.94822888283379,
+ "grad_norm": 9.651740074157715,
+ "learning_rate": 1.5917548543202127e-05,
+ "loss": 0.4369,
+ "step": 11725
+ },
+ {
+ "epoch": 31.950953678474114,
+ "grad_norm": 12.728254318237305,
+ "learning_rate": 1.5916837125370025e-05,
+ "loss": 0.4299,
+ "step": 11726
+ },
+ {
+ "epoch": 31.95367847411444,
+ "grad_norm": 10.07304859161377,
+ "learning_rate": 1.5916125661457786e-05,
+ "loss": 0.4309,
+ "step": 11727
+ },
+ {
+ "epoch": 31.95640326975477,
+ "grad_norm": 8.557503700256348,
+ "learning_rate": 1.5915414151470953e-05,
+ "loss": 0.5154,
+ "step": 11728
+ },
+ {
+ "epoch": 31.959128065395095,
+ "grad_norm": 9.72024154663086,
+ "learning_rate": 1.5914702595415062e-05,
+ "loss": 0.3552,
+ "step": 11729
+ },
+ {
+ "epoch": 31.96185286103542,
+ "grad_norm": 8.9443998336792,
+ "learning_rate": 1.5913990993295655e-05,
+ "loss": 0.4208,
+ "step": 11730
+ },
+ {
+ "epoch": 31.96457765667575,
+ "grad_norm": 9.49070930480957,
+ "learning_rate": 1.5913279345118284e-05,
+ "loss": 0.4914,
+ "step": 11731
+ },
+ {
+ "epoch": 31.967302452316076,
+ "grad_norm": 7.919051647186279,
+ "learning_rate": 1.5912567650888476e-05,
+ "loss": 0.3918,
+ "step": 11732
+ },
+ {
+ "epoch": 31.970027247956402,
+ "grad_norm": 8.020977973937988,
+ "learning_rate": 1.5911855910611785e-05,
+ "loss": 0.519,
+ "step": 11733
+ },
+ {
+ "epoch": 31.97275204359673,
+ "grad_norm": 7.276769161224365,
+ "learning_rate": 1.591114412429375e-05,
+ "loss": 0.4469,
+ "step": 11734
+ },
+ {
+ "epoch": 31.975476839237057,
+ "grad_norm": 13.29661750793457,
+ "learning_rate": 1.5910432291939917e-05,
+ "loss": 0.4273,
+ "step": 11735
+ },
+ {
+ "epoch": 31.978201634877383,
+ "grad_norm": 7.530263423919678,
+ "learning_rate": 1.5909720413555826e-05,
+ "loss": 0.4412,
+ "step": 11736
+ },
+ {
+ "epoch": 31.980926430517712,
+ "grad_norm": 8.672321319580078,
+ "learning_rate": 1.590900848914702e-05,
+ "loss": 0.3605,
+ "step": 11737
+ },
+ {
+ "epoch": 31.983651226158038,
+ "grad_norm": 8.137622833251953,
+ "learning_rate": 1.590829651871905e-05,
+ "loss": 0.4903,
+ "step": 11738
+ },
+ {
+ "epoch": 31.986376021798364,
+ "grad_norm": 15.847869873046875,
+ "learning_rate": 1.5907584502277456e-05,
+ "loss": 0.3915,
+ "step": 11739
+ },
+ {
+ "epoch": 31.989100817438693,
+ "grad_norm": 6.88349723815918,
+ "learning_rate": 1.5906872439827782e-05,
+ "loss": 0.5171,
+ "step": 11740
+ },
+ {
+ "epoch": 31.99182561307902,
+ "grad_norm": 7.6084160804748535,
+ "learning_rate": 1.5906160331375577e-05,
+ "loss": 0.4654,
+ "step": 11741
+ },
+ {
+ "epoch": 31.994550408719345,
+ "grad_norm": 11.99288558959961,
+ "learning_rate": 1.5905448176926385e-05,
+ "loss": 0.3553,
+ "step": 11742
+ },
+ {
+ "epoch": 31.997275204359674,
+ "grad_norm": 9.274868965148926,
+ "learning_rate": 1.5904735976485754e-05,
+ "loss": 0.6314,
+ "step": 11743
+ },
+ {
+ "epoch": 32.0,
+ "grad_norm": 7.692490100860596,
+ "learning_rate": 1.5904023730059227e-05,
+ "loss": 0.5656,
+ "step": 11744
+ },
+ {
+ "epoch": 32.002724795640326,
+ "grad_norm": 6.655430793762207,
+ "learning_rate": 1.5903311437652357e-05,
+ "loss": 0.3511,
+ "step": 11745
+ },
+ {
+ "epoch": 32.00544959128065,
+ "grad_norm": 7.963028907775879,
+ "learning_rate": 1.5902599099270686e-05,
+ "loss": 0.4009,
+ "step": 11746
+ },
+ {
+ "epoch": 32.00817438692098,
+ "grad_norm": 11.768818855285645,
+ "learning_rate": 1.5901886714919758e-05,
+ "loss": 0.275,
+ "step": 11747
+ },
+ {
+ "epoch": 32.01089918256131,
+ "grad_norm": 7.126332759857178,
+ "learning_rate": 1.5901174284605132e-05,
+ "loss": 0.2981,
+ "step": 11748
+ },
+ {
+ "epoch": 32.013623978201636,
+ "grad_norm": 9.119898796081543,
+ "learning_rate": 1.590046180833235e-05,
+ "loss": 0.3867,
+ "step": 11749
+ },
+ {
+ "epoch": 32.01634877384196,
+ "grad_norm": 6.50003719329834,
+ "learning_rate": 1.5899749286106957e-05,
+ "loss": 0.4581,
+ "step": 11750
+ },
+ {
+ "epoch": 32.01907356948229,
+ "grad_norm": 8.52955436706543,
+ "learning_rate": 1.5899036717934514e-05,
+ "loss": 0.3926,
+ "step": 11751
+ },
+ {
+ "epoch": 32.02179836512261,
+ "grad_norm": 7.3344244956970215,
+ "learning_rate": 1.5898324103820556e-05,
+ "loss": 0.3102,
+ "step": 11752
+ },
+ {
+ "epoch": 32.02452316076294,
+ "grad_norm": 7.1891679763793945,
+ "learning_rate": 1.5897611443770643e-05,
+ "loss": 0.3102,
+ "step": 11753
+ },
+ {
+ "epoch": 32.02724795640327,
+ "grad_norm": 8.859405517578125,
+ "learning_rate": 1.5896898737790323e-05,
+ "loss": 0.5104,
+ "step": 11754
+ },
+ {
+ "epoch": 32.0299727520436,
+ "grad_norm": 7.968280792236328,
+ "learning_rate": 1.589618598588514e-05,
+ "loss": 0.4209,
+ "step": 11755
+ },
+ {
+ "epoch": 32.032697547683924,
+ "grad_norm": 7.986744403839111,
+ "learning_rate": 1.5895473188060654e-05,
+ "loss": 0.386,
+ "step": 11756
+ },
+ {
+ "epoch": 32.03542234332425,
+ "grad_norm": 20.042699813842773,
+ "learning_rate": 1.5894760344322416e-05,
+ "loss": 0.3549,
+ "step": 11757
+ },
+ {
+ "epoch": 32.038147138964575,
+ "grad_norm": 7.735237121582031,
+ "learning_rate": 1.589404745467597e-05,
+ "loss": 0.359,
+ "step": 11758
+ },
+ {
+ "epoch": 32.0408719346049,
+ "grad_norm": 8.201799392700195,
+ "learning_rate": 1.589333451912687e-05,
+ "loss": 0.6518,
+ "step": 11759
+ },
+ {
+ "epoch": 32.043596730245234,
+ "grad_norm": 7.063997268676758,
+ "learning_rate": 1.5892621537680674e-05,
+ "loss": 0.2672,
+ "step": 11760
+ },
+ {
+ "epoch": 32.04632152588556,
+ "grad_norm": 7.970167636871338,
+ "learning_rate": 1.5891908510342932e-05,
+ "loss": 0.3202,
+ "step": 11761
+ },
+ {
+ "epoch": 32.049046321525886,
+ "grad_norm": 7.34511137008667,
+ "learning_rate": 1.5891195437119193e-05,
+ "loss": 0.4982,
+ "step": 11762
+ },
+ {
+ "epoch": 32.05177111716621,
+ "grad_norm": 21.53789710998535,
+ "learning_rate": 1.5890482318015017e-05,
+ "loss": 0.3787,
+ "step": 11763
+ },
+ {
+ "epoch": 32.05449591280654,
+ "grad_norm": 14.992596626281738,
+ "learning_rate": 1.5889769153035953e-05,
+ "loss": 0.4414,
+ "step": 11764
+ },
+ {
+ "epoch": 32.05722070844686,
+ "grad_norm": 8.265618324279785,
+ "learning_rate": 1.588905594218755e-05,
+ "loss": 0.3199,
+ "step": 11765
+ },
+ {
+ "epoch": 32.059945504087196,
+ "grad_norm": 7.635008335113525,
+ "learning_rate": 1.588834268547538e-05,
+ "loss": 0.3056,
+ "step": 11766
+ },
+ {
+ "epoch": 32.06267029972752,
+ "grad_norm": 7.344765663146973,
+ "learning_rate": 1.588762938290498e-05,
+ "loss": 0.5309,
+ "step": 11767
+ },
+ {
+ "epoch": 32.06539509536785,
+ "grad_norm": 9.463160514831543,
+ "learning_rate": 1.5886916034481914e-05,
+ "loss": 0.5813,
+ "step": 11768
+ },
+ {
+ "epoch": 32.06811989100817,
+ "grad_norm": 9.012089729309082,
+ "learning_rate": 1.5886202640211733e-05,
+ "loss": 0.5155,
+ "step": 11769
+ },
+ {
+ "epoch": 32.0708446866485,
+ "grad_norm": 10.00454044342041,
+ "learning_rate": 1.5885489200099996e-05,
+ "loss": 0.3176,
+ "step": 11770
+ },
+ {
+ "epoch": 32.073569482288825,
+ "grad_norm": 7.091330051422119,
+ "learning_rate": 1.588477571415226e-05,
+ "loss": 0.3793,
+ "step": 11771
+ },
+ {
+ "epoch": 32.07629427792916,
+ "grad_norm": 8.165772438049316,
+ "learning_rate": 1.5884062182374083e-05,
+ "loss": 0.2841,
+ "step": 11772
+ },
+ {
+ "epoch": 32.079019073569484,
+ "grad_norm": 8.757858276367188,
+ "learning_rate": 1.5883348604771013e-05,
+ "loss": 0.2816,
+ "step": 11773
+ },
+ {
+ "epoch": 32.08174386920981,
+ "grad_norm": 6.973340034484863,
+ "learning_rate": 1.5882634981348614e-05,
+ "loss": 0.4262,
+ "step": 11774
+ },
+ {
+ "epoch": 32.084468664850135,
+ "grad_norm": 7.131436347961426,
+ "learning_rate": 1.5881921312112446e-05,
+ "loss": 0.3938,
+ "step": 11775
+ },
+ {
+ "epoch": 32.08719346049046,
+ "grad_norm": 8.54784870147705,
+ "learning_rate": 1.5881207597068065e-05,
+ "loss": 0.3687,
+ "step": 11776
+ },
+ {
+ "epoch": 32.08991825613079,
+ "grad_norm": 7.42059850692749,
+ "learning_rate": 1.5880493836221025e-05,
+ "loss": 0.3914,
+ "step": 11777
+ },
+ {
+ "epoch": 32.09264305177112,
+ "grad_norm": 8.61288070678711,
+ "learning_rate": 1.587978002957689e-05,
+ "loss": 0.4535,
+ "step": 11778
+ },
+ {
+ "epoch": 32.095367847411445,
+ "grad_norm": 9.793703079223633,
+ "learning_rate": 1.587906617714122e-05,
+ "loss": 0.3553,
+ "step": 11779
+ },
+ {
+ "epoch": 32.09809264305177,
+ "grad_norm": 7.9810004234313965,
+ "learning_rate": 1.587835227891957e-05,
+ "loss": 0.3646,
+ "step": 11780
+ },
+ {
+ "epoch": 32.1008174386921,
+ "grad_norm": 6.956366062164307,
+ "learning_rate": 1.58776383349175e-05,
+ "loss": 0.3989,
+ "step": 11781
+ },
+ {
+ "epoch": 32.10354223433242,
+ "grad_norm": 9.917304992675781,
+ "learning_rate": 1.587692434514057e-05,
+ "loss": 0.3329,
+ "step": 11782
+ },
+ {
+ "epoch": 32.10626702997275,
+ "grad_norm": 9.136825561523438,
+ "learning_rate": 1.5876210309594347e-05,
+ "loss": 0.2871,
+ "step": 11783
+ },
+ {
+ "epoch": 32.10899182561308,
+ "grad_norm": 7.9324469566345215,
+ "learning_rate": 1.5875496228284385e-05,
+ "loss": 0.4206,
+ "step": 11784
+ },
+ {
+ "epoch": 32.11171662125341,
+ "grad_norm": 17.721887588500977,
+ "learning_rate": 1.5874782101216246e-05,
+ "loss": 0.4341,
+ "step": 11785
+ },
+ {
+ "epoch": 32.11444141689373,
+ "grad_norm": 12.41125202178955,
+ "learning_rate": 1.5874067928395497e-05,
+ "loss": 0.4029,
+ "step": 11786
+ },
+ {
+ "epoch": 32.11716621253406,
+ "grad_norm": 9.059920310974121,
+ "learning_rate": 1.5873353709827695e-05,
+ "loss": 0.4584,
+ "step": 11787
+ },
+ {
+ "epoch": 32.119891008174385,
+ "grad_norm": 9.27950382232666,
+ "learning_rate": 1.58726394455184e-05,
+ "loss": 0.3017,
+ "step": 11788
+ },
+ {
+ "epoch": 32.12261580381471,
+ "grad_norm": 6.377040386199951,
+ "learning_rate": 1.587192513547318e-05,
+ "loss": 0.3109,
+ "step": 11789
+ },
+ {
+ "epoch": 32.12534059945504,
+ "grad_norm": 7.2704243659973145,
+ "learning_rate": 1.5871210779697598e-05,
+ "loss": 0.3922,
+ "step": 11790
+ },
+ {
+ "epoch": 32.12806539509537,
+ "grad_norm": 8.584101676940918,
+ "learning_rate": 1.587049637819721e-05,
+ "loss": 0.4524,
+ "step": 11791
+ },
+ {
+ "epoch": 32.130790190735695,
+ "grad_norm": 12.669682502746582,
+ "learning_rate": 1.586978193097759e-05,
+ "loss": 0.4226,
+ "step": 11792
+ },
+ {
+ "epoch": 32.13351498637602,
+ "grad_norm": 8.62442398071289,
+ "learning_rate": 1.5869067438044298e-05,
+ "loss": 0.3394,
+ "step": 11793
+ },
+ {
+ "epoch": 32.13623978201635,
+ "grad_norm": 7.36232328414917,
+ "learning_rate": 1.5868352899402895e-05,
+ "loss": 0.5303,
+ "step": 11794
+ },
+ {
+ "epoch": 32.13896457765667,
+ "grad_norm": 9.210404396057129,
+ "learning_rate": 1.5867638315058947e-05,
+ "loss": 0.6094,
+ "step": 11795
+ },
+ {
+ "epoch": 32.141689373297005,
+ "grad_norm": 6.262637615203857,
+ "learning_rate": 1.5866923685018026e-05,
+ "loss": 0.4605,
+ "step": 11796
+ },
+ {
+ "epoch": 32.14441416893733,
+ "grad_norm": 13.885269165039062,
+ "learning_rate": 1.586620900928569e-05,
+ "loss": 0.3381,
+ "step": 11797
+ },
+ {
+ "epoch": 32.14713896457766,
+ "grad_norm": 6.554561614990234,
+ "learning_rate": 1.5865494287867504e-05,
+ "loss": 0.3335,
+ "step": 11798
+ },
+ {
+ "epoch": 32.14986376021798,
+ "grad_norm": 7.8454108238220215,
+ "learning_rate": 1.586477952076904e-05,
+ "loss": 0.4303,
+ "step": 11799
+ },
+ {
+ "epoch": 32.15258855585831,
+ "grad_norm": 7.831639289855957,
+ "learning_rate": 1.586406470799586e-05,
+ "loss": 0.5651,
+ "step": 11800
+ },
+ {
+ "epoch": 32.155313351498634,
+ "grad_norm": 12.072447776794434,
+ "learning_rate": 1.5863349849553533e-05,
+ "loss": 0.4243,
+ "step": 11801
+ },
+ {
+ "epoch": 32.15803814713897,
+ "grad_norm": 7.685490608215332,
+ "learning_rate": 1.5862634945447628e-05,
+ "loss": 0.3981,
+ "step": 11802
+ },
+ {
+ "epoch": 32.16076294277929,
+ "grad_norm": 8.947986602783203,
+ "learning_rate": 1.5861919995683713e-05,
+ "loss": 0.4612,
+ "step": 11803
+ },
+ {
+ "epoch": 32.16348773841962,
+ "grad_norm": 10.897587776184082,
+ "learning_rate": 1.586120500026735e-05,
+ "loss": 0.3702,
+ "step": 11804
+ },
+ {
+ "epoch": 32.166212534059945,
+ "grad_norm": 8.40881061553955,
+ "learning_rate": 1.586048995920411e-05,
+ "loss": 0.4109,
+ "step": 11805
+ },
+ {
+ "epoch": 32.16893732970027,
+ "grad_norm": 6.445413112640381,
+ "learning_rate": 1.5859774872499564e-05,
+ "loss": 0.3076,
+ "step": 11806
+ },
+ {
+ "epoch": 32.171662125340596,
+ "grad_norm": 7.084362030029297,
+ "learning_rate": 1.5859059740159283e-05,
+ "loss": 0.5631,
+ "step": 11807
+ },
+ {
+ "epoch": 32.17438692098093,
+ "grad_norm": 6.634472846984863,
+ "learning_rate": 1.585834456218883e-05,
+ "loss": 0.2851,
+ "step": 11808
+ },
+ {
+ "epoch": 32.177111716621255,
+ "grad_norm": 6.578856468200684,
+ "learning_rate": 1.585762933859378e-05,
+ "loss": 0.4152,
+ "step": 11809
+ },
+ {
+ "epoch": 32.17983651226158,
+ "grad_norm": 9.397659301757812,
+ "learning_rate": 1.58569140693797e-05,
+ "loss": 0.4192,
+ "step": 11810
+ },
+ {
+ "epoch": 32.182561307901906,
+ "grad_norm": 6.69155740737915,
+ "learning_rate": 1.585619875455216e-05,
+ "loss": 0.306,
+ "step": 11811
+ },
+ {
+ "epoch": 32.18528610354223,
+ "grad_norm": 7.759404182434082,
+ "learning_rate": 1.5855483394116734e-05,
+ "loss": 0.4203,
+ "step": 11812
+ },
+ {
+ "epoch": 32.18801089918256,
+ "grad_norm": 7.001629829406738,
+ "learning_rate": 1.5854767988078992e-05,
+ "loss": 0.3216,
+ "step": 11813
+ },
+ {
+ "epoch": 32.19073569482289,
+ "grad_norm": 9.282877922058105,
+ "learning_rate": 1.5854052536444505e-05,
+ "loss": 0.4682,
+ "step": 11814
+ },
+ {
+ "epoch": 32.19346049046322,
+ "grad_norm": 7.756398677825928,
+ "learning_rate": 1.5853337039218846e-05,
+ "loss": 0.4177,
+ "step": 11815
+ },
+ {
+ "epoch": 32.19618528610354,
+ "grad_norm": 8.572132110595703,
+ "learning_rate": 1.5852621496407584e-05,
+ "loss": 0.4274,
+ "step": 11816
+ },
+ {
+ "epoch": 32.19891008174387,
+ "grad_norm": 6.335931777954102,
+ "learning_rate": 1.5851905908016297e-05,
+ "loss": 0.395,
+ "step": 11817
+ },
+ {
+ "epoch": 32.201634877384194,
+ "grad_norm": 6.162834167480469,
+ "learning_rate": 1.5851190274050555e-05,
+ "loss": 0.3054,
+ "step": 11818
+ },
+ {
+ "epoch": 32.20435967302452,
+ "grad_norm": 6.942822456359863,
+ "learning_rate": 1.585047459451593e-05,
+ "loss": 0.4146,
+ "step": 11819
+ },
+ {
+ "epoch": 32.20708446866485,
+ "grad_norm": 5.796833038330078,
+ "learning_rate": 1.5849758869418002e-05,
+ "loss": 0.2725,
+ "step": 11820
+ },
+ {
+ "epoch": 32.20980926430518,
+ "grad_norm": 9.037385940551758,
+ "learning_rate": 1.5849043098762335e-05,
+ "loss": 0.3282,
+ "step": 11821
+ },
+ {
+ "epoch": 32.212534059945504,
+ "grad_norm": 9.565847396850586,
+ "learning_rate": 1.584832728255451e-05,
+ "loss": 0.4362,
+ "step": 11822
+ },
+ {
+ "epoch": 32.21525885558583,
+ "grad_norm": 9.69047737121582,
+ "learning_rate": 1.58476114208001e-05,
+ "loss": 0.3274,
+ "step": 11823
+ },
+ {
+ "epoch": 32.217983651226156,
+ "grad_norm": 8.620555877685547,
+ "learning_rate": 1.584689551350468e-05,
+ "loss": 0.3643,
+ "step": 11824
+ },
+ {
+ "epoch": 32.22070844686648,
+ "grad_norm": 9.036141395568848,
+ "learning_rate": 1.5846179560673825e-05,
+ "loss": 0.3236,
+ "step": 11825
+ },
+ {
+ "epoch": 32.223433242506815,
+ "grad_norm": 5.609255313873291,
+ "learning_rate": 1.5845463562313113e-05,
+ "loss": 0.4547,
+ "step": 11826
+ },
+ {
+ "epoch": 32.22615803814714,
+ "grad_norm": 8.770671844482422,
+ "learning_rate": 1.5844747518428124e-05,
+ "loss": 0.5427,
+ "step": 11827
+ },
+ {
+ "epoch": 32.228882833787466,
+ "grad_norm": 11.33442497253418,
+ "learning_rate": 1.584403142902442e-05,
+ "loss": 0.4137,
+ "step": 11828
+ },
+ {
+ "epoch": 32.23160762942779,
+ "grad_norm": 6.859502792358398,
+ "learning_rate": 1.5843315294107595e-05,
+ "loss": 0.2459,
+ "step": 11829
+ },
+ {
+ "epoch": 32.23433242506812,
+ "grad_norm": 7.492730140686035,
+ "learning_rate": 1.5842599113683216e-05,
+ "loss": 0.3889,
+ "step": 11830
+ },
+ {
+ "epoch": 32.237057220708444,
+ "grad_norm": 7.895528316497803,
+ "learning_rate": 1.5841882887756864e-05,
+ "loss": 0.4388,
+ "step": 11831
+ },
+ {
+ "epoch": 32.23978201634878,
+ "grad_norm": 12.864253044128418,
+ "learning_rate": 1.5841166616334112e-05,
+ "loss": 0.4497,
+ "step": 11832
+ },
+ {
+ "epoch": 32.2425068119891,
+ "grad_norm": 6.970122337341309,
+ "learning_rate": 1.5840450299420548e-05,
+ "loss": 0.4554,
+ "step": 11833
+ },
+ {
+ "epoch": 32.24523160762943,
+ "grad_norm": 8.694933891296387,
+ "learning_rate": 1.5839733937021738e-05,
+ "loss": 0.2998,
+ "step": 11834
+ },
+ {
+ "epoch": 32.247956403269754,
+ "grad_norm": 8.716221809387207,
+ "learning_rate": 1.5839017529143276e-05,
+ "loss": 0.4441,
+ "step": 11835
+ },
+ {
+ "epoch": 32.25068119891008,
+ "grad_norm": 6.544258117675781,
+ "learning_rate": 1.5838301075790726e-05,
+ "loss": 0.343,
+ "step": 11836
+ },
+ {
+ "epoch": 32.253405994550405,
+ "grad_norm": 7.905789375305176,
+ "learning_rate": 1.583758457696968e-05,
+ "loss": 0.3984,
+ "step": 11837
+ },
+ {
+ "epoch": 32.25613079019074,
+ "grad_norm": 7.267482757568359,
+ "learning_rate": 1.5836868032685714e-05,
+ "loss": 0.3942,
+ "step": 11838
+ },
+ {
+ "epoch": 32.258855585831064,
+ "grad_norm": 7.333285331726074,
+ "learning_rate": 1.5836151442944406e-05,
+ "loss": 0.2985,
+ "step": 11839
+ },
+ {
+ "epoch": 32.26158038147139,
+ "grad_norm": 7.183562278747559,
+ "learning_rate": 1.5835434807751337e-05,
+ "loss": 0.3709,
+ "step": 11840
+ },
+ {
+ "epoch": 32.264305177111716,
+ "grad_norm": 6.645139217376709,
+ "learning_rate": 1.583471812711209e-05,
+ "loss": 0.442,
+ "step": 11841
+ },
+ {
+ "epoch": 32.26702997275204,
+ "grad_norm": 26.506385803222656,
+ "learning_rate": 1.583400140103225e-05,
+ "loss": 0.3225,
+ "step": 11842
+ },
+ {
+ "epoch": 32.26975476839237,
+ "grad_norm": 25.365419387817383,
+ "learning_rate": 1.583328462951739e-05,
+ "loss": 0.4845,
+ "step": 11843
+ },
+ {
+ "epoch": 32.2724795640327,
+ "grad_norm": 6.552819728851318,
+ "learning_rate": 1.5832567812573097e-05,
+ "loss": 0.3095,
+ "step": 11844
+ },
+ {
+ "epoch": 32.275204359673026,
+ "grad_norm": 7.264756202697754,
+ "learning_rate": 1.5831850950204955e-05,
+ "loss": 0.3252,
+ "step": 11845
+ },
+ {
+ "epoch": 32.27792915531335,
+ "grad_norm": 6.431404113769531,
+ "learning_rate": 1.5831134042418547e-05,
+ "loss": 0.4528,
+ "step": 11846
+ },
+ {
+ "epoch": 32.28065395095368,
+ "grad_norm": 8.371557235717773,
+ "learning_rate": 1.5830417089219454e-05,
+ "loss": 0.2578,
+ "step": 11847
+ },
+ {
+ "epoch": 32.283378746594,
+ "grad_norm": 7.391849517822266,
+ "learning_rate": 1.582970009061326e-05,
+ "loss": 0.3527,
+ "step": 11848
+ },
+ {
+ "epoch": 32.28610354223433,
+ "grad_norm": 8.503427505493164,
+ "learning_rate": 1.582898304660555e-05,
+ "loss": 0.2731,
+ "step": 11849
+ },
+ {
+ "epoch": 32.28882833787466,
+ "grad_norm": 8.949432373046875,
+ "learning_rate": 1.5828265957201904e-05,
+ "loss": 0.3873,
+ "step": 11850
+ },
+ {
+ "epoch": 32.29155313351499,
+ "grad_norm": 6.752440452575684,
+ "learning_rate": 1.5827548822407912e-05,
+ "loss": 0.4052,
+ "step": 11851
+ },
+ {
+ "epoch": 32.294277929155314,
+ "grad_norm": 6.268543243408203,
+ "learning_rate": 1.582683164222916e-05,
+ "loss": 0.3759,
+ "step": 11852
+ },
+ {
+ "epoch": 32.29700272479564,
+ "grad_norm": 6.491923809051514,
+ "learning_rate": 1.582611441667123e-05,
+ "loss": 0.3365,
+ "step": 11853
+ },
+ {
+ "epoch": 32.299727520435965,
+ "grad_norm": 6.925135612487793,
+ "learning_rate": 1.5825397145739704e-05,
+ "loss": 0.3329,
+ "step": 11854
+ },
+ {
+ "epoch": 32.30245231607629,
+ "grad_norm": 7.322439193725586,
+ "learning_rate": 1.582467982944018e-05,
+ "loss": 0.4421,
+ "step": 11855
+ },
+ {
+ "epoch": 32.305177111716624,
+ "grad_norm": 5.905395984649658,
+ "learning_rate": 1.582396246777823e-05,
+ "loss": 0.4805,
+ "step": 11856
+ },
+ {
+ "epoch": 32.30790190735695,
+ "grad_norm": 7.987797260284424,
+ "learning_rate": 1.582324506075945e-05,
+ "loss": 0.4595,
+ "step": 11857
+ },
+ {
+ "epoch": 32.310626702997276,
+ "grad_norm": 8.10444164276123,
+ "learning_rate": 1.5822527608389428e-05,
+ "loss": 0.3066,
+ "step": 11858
+ },
+ {
+ "epoch": 32.3133514986376,
+ "grad_norm": 7.959553241729736,
+ "learning_rate": 1.5821810110673744e-05,
+ "loss": 0.2758,
+ "step": 11859
+ },
+ {
+ "epoch": 32.31607629427793,
+ "grad_norm": 7.548391819000244,
+ "learning_rate": 1.5821092567617993e-05,
+ "loss": 0.4469,
+ "step": 11860
+ },
+ {
+ "epoch": 32.31880108991825,
+ "grad_norm": 6.731222629547119,
+ "learning_rate": 1.582037497922776e-05,
+ "loss": 0.4565,
+ "step": 11861
+ },
+ {
+ "epoch": 32.321525885558586,
+ "grad_norm": 7.5333991050720215,
+ "learning_rate": 1.581965734550863e-05,
+ "loss": 0.3308,
+ "step": 11862
+ },
+ {
+ "epoch": 32.32425068119891,
+ "grad_norm": 13.58120059967041,
+ "learning_rate": 1.5818939666466203e-05,
+ "loss": 0.3882,
+ "step": 11863
+ },
+ {
+ "epoch": 32.32697547683924,
+ "grad_norm": 13.837489128112793,
+ "learning_rate": 1.5818221942106058e-05,
+ "loss": 0.3484,
+ "step": 11864
+ },
+ {
+ "epoch": 32.32970027247956,
+ "grad_norm": 9.037531852722168,
+ "learning_rate": 1.581750417243379e-05,
+ "loss": 0.4246,
+ "step": 11865
+ },
+ {
+ "epoch": 32.33242506811989,
+ "grad_norm": 6.657193660736084,
+ "learning_rate": 1.5816786357454984e-05,
+ "loss": 0.3333,
+ "step": 11866
+ },
+ {
+ "epoch": 32.335149863760215,
+ "grad_norm": 7.076379299163818,
+ "learning_rate": 1.5816068497175233e-05,
+ "loss": 0.264,
+ "step": 11867
+ },
+ {
+ "epoch": 32.33787465940055,
+ "grad_norm": 7.124920845031738,
+ "learning_rate": 1.5815350591600124e-05,
+ "loss": 0.4204,
+ "step": 11868
+ },
+ {
+ "epoch": 32.34059945504087,
+ "grad_norm": 7.654149055480957,
+ "learning_rate": 1.5814632640735258e-05,
+ "loss": 0.4473,
+ "step": 11869
+ },
+ {
+ "epoch": 32.3433242506812,
+ "grad_norm": 9.05989933013916,
+ "learning_rate": 1.5813914644586218e-05,
+ "loss": 0.3142,
+ "step": 11870
+ },
+ {
+ "epoch": 32.346049046321525,
+ "grad_norm": 6.905852794647217,
+ "learning_rate": 1.5813196603158594e-05,
+ "loss": 0.4329,
+ "step": 11871
+ },
+ {
+ "epoch": 32.34877384196185,
+ "grad_norm": 7.0673933029174805,
+ "learning_rate": 1.581247851645799e-05,
+ "loss": 0.3491,
+ "step": 11872
+ },
+ {
+ "epoch": 32.35149863760218,
+ "grad_norm": 7.70352840423584,
+ "learning_rate": 1.5811760384489983e-05,
+ "loss": 0.2582,
+ "step": 11873
+ },
+ {
+ "epoch": 32.35422343324251,
+ "grad_norm": 12.85704517364502,
+ "learning_rate": 1.581104220726018e-05,
+ "loss": 0.4186,
+ "step": 11874
+ },
+ {
+ "epoch": 32.356948228882835,
+ "grad_norm": 8.48851490020752,
+ "learning_rate": 1.581032398477416e-05,
+ "loss": 0.3688,
+ "step": 11875
+ },
+ {
+ "epoch": 32.35967302452316,
+ "grad_norm": 5.9951934814453125,
+ "learning_rate": 1.580960571703753e-05,
+ "loss": 0.3363,
+ "step": 11876
+ },
+ {
+ "epoch": 32.36239782016349,
+ "grad_norm": 6.69450044631958,
+ "learning_rate": 1.5808887404055876e-05,
+ "loss": 0.3303,
+ "step": 11877
+ },
+ {
+ "epoch": 32.36512261580381,
+ "grad_norm": 9.448138236999512,
+ "learning_rate": 1.580816904583479e-05,
+ "loss": 0.4879,
+ "step": 11878
+ },
+ {
+ "epoch": 32.36784741144414,
+ "grad_norm": 6.074221134185791,
+ "learning_rate": 1.5807450642379874e-05,
+ "loss": 0.2635,
+ "step": 11879
+ },
+ {
+ "epoch": 32.37057220708447,
+ "grad_norm": 8.59503173828125,
+ "learning_rate": 1.580673219369672e-05,
+ "loss": 0.3106,
+ "step": 11880
+ },
+ {
+ "epoch": 32.3732970027248,
+ "grad_norm": 9.456225395202637,
+ "learning_rate": 1.580601369979092e-05,
+ "loss": 0.42,
+ "step": 11881
+ },
+ {
+ "epoch": 32.37602179836512,
+ "grad_norm": 6.988005638122559,
+ "learning_rate": 1.5805295160668075e-05,
+ "loss": 0.4572,
+ "step": 11882
+ },
+ {
+ "epoch": 32.37874659400545,
+ "grad_norm": 15.075167655944824,
+ "learning_rate": 1.5804576576333776e-05,
+ "loss": 0.3986,
+ "step": 11883
+ },
+ {
+ "epoch": 32.381471389645775,
+ "grad_norm": 7.345865249633789,
+ "learning_rate": 1.580385794679362e-05,
+ "loss": 0.4762,
+ "step": 11884
+ },
+ {
+ "epoch": 32.3841961852861,
+ "grad_norm": 5.510758876800537,
+ "learning_rate": 1.580313927205321e-05,
+ "loss": 0.437,
+ "step": 11885
+ },
+ {
+ "epoch": 32.38692098092643,
+ "grad_norm": 7.573642253875732,
+ "learning_rate": 1.5802420552118133e-05,
+ "loss": 0.3484,
+ "step": 11886
+ },
+ {
+ "epoch": 32.38964577656676,
+ "grad_norm": 7.1016011238098145,
+ "learning_rate": 1.5801701786993992e-05,
+ "loss": 0.5948,
+ "step": 11887
+ },
+ {
+ "epoch": 32.392370572207085,
+ "grad_norm": 7.032326698303223,
+ "learning_rate": 1.5800982976686387e-05,
+ "loss": 0.3499,
+ "step": 11888
+ },
+ {
+ "epoch": 32.39509536784741,
+ "grad_norm": 7.155482292175293,
+ "learning_rate": 1.580026412120091e-05,
+ "loss": 0.4247,
+ "step": 11889
+ },
+ {
+ "epoch": 32.39782016348774,
+ "grad_norm": 6.175853729248047,
+ "learning_rate": 1.5799545220543168e-05,
+ "loss": 0.3085,
+ "step": 11890
+ },
+ {
+ "epoch": 32.40054495912806,
+ "grad_norm": 9.193768501281738,
+ "learning_rate": 1.579882627471875e-05,
+ "loss": 0.33,
+ "step": 11891
+ },
+ {
+ "epoch": 32.403269754768395,
+ "grad_norm": 7.0792388916015625,
+ "learning_rate": 1.5798107283733265e-05,
+ "loss": 0.3567,
+ "step": 11892
+ },
+ {
+ "epoch": 32.40599455040872,
+ "grad_norm": 6.419934272766113,
+ "learning_rate": 1.5797388247592304e-05,
+ "loss": 0.3961,
+ "step": 11893
+ },
+ {
+ "epoch": 32.40871934604905,
+ "grad_norm": 6.680984973907471,
+ "learning_rate": 1.5796669166301468e-05,
+ "loss": 0.4934,
+ "step": 11894
+ },
+ {
+ "epoch": 32.41144414168937,
+ "grad_norm": 9.507497787475586,
+ "learning_rate": 1.579595003986636e-05,
+ "loss": 0.346,
+ "step": 11895
+ },
+ {
+ "epoch": 32.4141689373297,
+ "grad_norm": 7.483531951904297,
+ "learning_rate": 1.5795230868292576e-05,
+ "loss": 0.4828,
+ "step": 11896
+ },
+ {
+ "epoch": 32.416893732970024,
+ "grad_norm": 6.597445487976074,
+ "learning_rate": 1.5794511651585725e-05,
+ "loss": 0.3551,
+ "step": 11897
+ },
+ {
+ "epoch": 32.41961852861036,
+ "grad_norm": 7.840703964233398,
+ "learning_rate": 1.5793792389751402e-05,
+ "loss": 0.3699,
+ "step": 11898
+ },
+ {
+ "epoch": 32.42234332425068,
+ "grad_norm": 6.960693836212158,
+ "learning_rate": 1.5793073082795213e-05,
+ "loss": 0.3769,
+ "step": 11899
+ },
+ {
+ "epoch": 32.42506811989101,
+ "grad_norm": 12.177355766296387,
+ "learning_rate": 1.5792353730722757e-05,
+ "loss": 0.3799,
+ "step": 11900
+ },
+ {
+ "epoch": 32.427792915531334,
+ "grad_norm": 8.627708435058594,
+ "learning_rate": 1.5791634333539632e-05,
+ "loss": 0.4571,
+ "step": 11901
+ },
+ {
+ "epoch": 32.43051771117166,
+ "grad_norm": 7.5197434425354,
+ "learning_rate": 1.5790914891251448e-05,
+ "loss": 0.4738,
+ "step": 11902
+ },
+ {
+ "epoch": 32.433242506811986,
+ "grad_norm": 9.005895614624023,
+ "learning_rate": 1.5790195403863808e-05,
+ "loss": 0.3651,
+ "step": 11903
+ },
+ {
+ "epoch": 32.43596730245232,
+ "grad_norm": 8.538691520690918,
+ "learning_rate": 1.578947587138231e-05,
+ "loss": 0.3392,
+ "step": 11904
+ },
+ {
+ "epoch": 32.438692098092645,
+ "grad_norm": 7.353978633880615,
+ "learning_rate": 1.578875629381256e-05,
+ "loss": 0.3974,
+ "step": 11905
+ },
+ {
+ "epoch": 32.44141689373297,
+ "grad_norm": 8.60916519165039,
+ "learning_rate": 1.5788036671160163e-05,
+ "loss": 0.3304,
+ "step": 11906
+ },
+ {
+ "epoch": 32.444141689373296,
+ "grad_norm": 6.569250583648682,
+ "learning_rate": 1.578731700343072e-05,
+ "loss": 0.4344,
+ "step": 11907
+ },
+ {
+ "epoch": 32.44686648501362,
+ "grad_norm": 7.190419673919678,
+ "learning_rate": 1.5786597290629843e-05,
+ "loss": 0.2899,
+ "step": 11908
+ },
+ {
+ "epoch": 32.44959128065395,
+ "grad_norm": 7.1112141609191895,
+ "learning_rate": 1.5785877532763132e-05,
+ "loss": 0.4316,
+ "step": 11909
+ },
+ {
+ "epoch": 32.45231607629428,
+ "grad_norm": 6.34969425201416,
+ "learning_rate": 1.578515772983619e-05,
+ "loss": 0.3689,
+ "step": 11910
+ },
+ {
+ "epoch": 32.45504087193461,
+ "grad_norm": 8.304433822631836,
+ "learning_rate": 1.5784437881854626e-05,
+ "loss": 0.4647,
+ "step": 11911
+ },
+ {
+ "epoch": 32.45776566757493,
+ "grad_norm": 27.573606491088867,
+ "learning_rate": 1.578371798882405e-05,
+ "loss": 0.4462,
+ "step": 11912
+ },
+ {
+ "epoch": 32.46049046321526,
+ "grad_norm": 5.862417697906494,
+ "learning_rate": 1.578299805075006e-05,
+ "loss": 0.4507,
+ "step": 11913
+ },
+ {
+ "epoch": 32.463215258855584,
+ "grad_norm": 9.314671516418457,
+ "learning_rate": 1.5782278067638267e-05,
+ "loss": 0.4748,
+ "step": 11914
+ },
+ {
+ "epoch": 32.46594005449591,
+ "grad_norm": 6.722378253936768,
+ "learning_rate": 1.5781558039494283e-05,
+ "loss": 0.3104,
+ "step": 11915
+ },
+ {
+ "epoch": 32.46866485013624,
+ "grad_norm": 8.106048583984375,
+ "learning_rate": 1.578083796632371e-05,
+ "loss": 0.4258,
+ "step": 11916
+ },
+ {
+ "epoch": 32.47138964577657,
+ "grad_norm": 8.299581527709961,
+ "learning_rate": 1.5780117848132154e-05,
+ "loss": 0.438,
+ "step": 11917
+ },
+ {
+ "epoch": 32.474114441416894,
+ "grad_norm": 7.841410160064697,
+ "learning_rate": 1.5779397684925226e-05,
+ "loss": 0.3873,
+ "step": 11918
+ },
+ {
+ "epoch": 32.47683923705722,
+ "grad_norm": 6.277518272399902,
+ "learning_rate": 1.5778677476708536e-05,
+ "loss": 0.2712,
+ "step": 11919
+ },
+ {
+ "epoch": 32.479564032697546,
+ "grad_norm": 6.815647125244141,
+ "learning_rate": 1.577795722348769e-05,
+ "loss": 0.2715,
+ "step": 11920
+ },
+ {
+ "epoch": 32.48228882833787,
+ "grad_norm": 7.107115745544434,
+ "learning_rate": 1.5777236925268306e-05,
+ "loss": 0.441,
+ "step": 11921
+ },
+ {
+ "epoch": 32.485013623978205,
+ "grad_norm": 6.531349182128906,
+ "learning_rate": 1.577651658205598e-05,
+ "loss": 0.5261,
+ "step": 11922
+ },
+ {
+ "epoch": 32.48773841961853,
+ "grad_norm": 6.629528999328613,
+ "learning_rate": 1.5775796193856332e-05,
+ "loss": 0.293,
+ "step": 11923
+ },
+ {
+ "epoch": 32.490463215258856,
+ "grad_norm": 7.79941987991333,
+ "learning_rate": 1.5775075760674966e-05,
+ "loss": 0.3395,
+ "step": 11924
+ },
+ {
+ "epoch": 32.49318801089918,
+ "grad_norm": 7.020432949066162,
+ "learning_rate": 1.57743552825175e-05,
+ "loss": 0.4031,
+ "step": 11925
+ },
+ {
+ "epoch": 32.49591280653951,
+ "grad_norm": 6.841043472290039,
+ "learning_rate": 1.5773634759389537e-05,
+ "loss": 0.2846,
+ "step": 11926
+ },
+ {
+ "epoch": 32.49863760217983,
+ "grad_norm": 7.659816265106201,
+ "learning_rate": 1.5772914191296697e-05,
+ "loss": 0.3821,
+ "step": 11927
+ },
+ {
+ "epoch": 32.50136239782017,
+ "grad_norm": 7.213796138763428,
+ "learning_rate": 1.577219357824458e-05,
+ "loss": 0.3698,
+ "step": 11928
+ },
+ {
+ "epoch": 32.50408719346049,
+ "grad_norm": 5.5160369873046875,
+ "learning_rate": 1.577147292023881e-05,
+ "loss": 0.4213,
+ "step": 11929
+ },
+ {
+ "epoch": 32.50681198910082,
+ "grad_norm": 7.902105808258057,
+ "learning_rate": 1.5770752217284995e-05,
+ "loss": 0.4316,
+ "step": 11930
+ },
+ {
+ "epoch": 32.509536784741144,
+ "grad_norm": 6.753303527832031,
+ "learning_rate": 1.5770031469388747e-05,
+ "loss": 0.4515,
+ "step": 11931
+ },
+ {
+ "epoch": 32.51226158038147,
+ "grad_norm": 7.130935192108154,
+ "learning_rate": 1.576931067655568e-05,
+ "loss": 0.3441,
+ "step": 11932
+ },
+ {
+ "epoch": 32.514986376021795,
+ "grad_norm": 8.129018783569336,
+ "learning_rate": 1.5768589838791405e-05,
+ "loss": 0.2713,
+ "step": 11933
+ },
+ {
+ "epoch": 32.51771117166213,
+ "grad_norm": 7.047908782958984,
+ "learning_rate": 1.576786895610154e-05,
+ "loss": 0.3265,
+ "step": 11934
+ },
+ {
+ "epoch": 32.520435967302454,
+ "grad_norm": 7.914534568786621,
+ "learning_rate": 1.5767148028491696e-05,
+ "loss": 0.3427,
+ "step": 11935
+ },
+ {
+ "epoch": 32.52316076294278,
+ "grad_norm": 11.322606086730957,
+ "learning_rate": 1.5766427055967488e-05,
+ "loss": 0.3063,
+ "step": 11936
+ },
+ {
+ "epoch": 32.525885558583106,
+ "grad_norm": 12.04789924621582,
+ "learning_rate": 1.5765706038534534e-05,
+ "loss": 0.4918,
+ "step": 11937
+ },
+ {
+ "epoch": 32.52861035422343,
+ "grad_norm": 8.268314361572266,
+ "learning_rate": 1.5764984976198447e-05,
+ "loss": 0.4151,
+ "step": 11938
+ },
+ {
+ "epoch": 32.53133514986376,
+ "grad_norm": 5.861069202423096,
+ "learning_rate": 1.576426386896484e-05,
+ "loss": 0.3702,
+ "step": 11939
+ },
+ {
+ "epoch": 32.53405994550409,
+ "grad_norm": 6.333064556121826,
+ "learning_rate": 1.5763542716839332e-05,
+ "loss": 0.3506,
+ "step": 11940
+ },
+ {
+ "epoch": 32.536784741144416,
+ "grad_norm": 8.839204788208008,
+ "learning_rate": 1.576282151982754e-05,
+ "loss": 0.3522,
+ "step": 11941
+ },
+ {
+ "epoch": 32.53950953678474,
+ "grad_norm": 7.407595634460449,
+ "learning_rate": 1.576210027793508e-05,
+ "loss": 0.4851,
+ "step": 11942
+ },
+ {
+ "epoch": 32.54223433242507,
+ "grad_norm": 7.629887580871582,
+ "learning_rate": 1.5761378991167568e-05,
+ "loss": 0.4349,
+ "step": 11943
+ },
+ {
+ "epoch": 32.54495912806539,
+ "grad_norm": 8.962532043457031,
+ "learning_rate": 1.5760657659530622e-05,
+ "loss": 0.4535,
+ "step": 11944
+ },
+ {
+ "epoch": 32.54768392370572,
+ "grad_norm": 6.943212509155273,
+ "learning_rate": 1.575993628302986e-05,
+ "loss": 0.4005,
+ "step": 11945
+ },
+ {
+ "epoch": 32.55040871934605,
+ "grad_norm": 8.85571575164795,
+ "learning_rate": 1.5759214861670894e-05,
+ "loss": 0.3887,
+ "step": 11946
+ },
+ {
+ "epoch": 32.55313351498638,
+ "grad_norm": 7.18424654006958,
+ "learning_rate": 1.5758493395459353e-05,
+ "loss": 0.4333,
+ "step": 11947
+ },
+ {
+ "epoch": 32.555858310626704,
+ "grad_norm": 6.862495422363281,
+ "learning_rate": 1.5757771884400853e-05,
+ "loss": 0.3755,
+ "step": 11948
+ },
+ {
+ "epoch": 32.55858310626703,
+ "grad_norm": 12.841184616088867,
+ "learning_rate": 1.5757050328501005e-05,
+ "loss": 0.4854,
+ "step": 11949
+ },
+ {
+ "epoch": 32.561307901907355,
+ "grad_norm": 6.726277828216553,
+ "learning_rate": 1.5756328727765443e-05,
+ "loss": 0.3418,
+ "step": 11950
+ },
+ {
+ "epoch": 32.56403269754768,
+ "grad_norm": 7.365610122680664,
+ "learning_rate": 1.575560708219977e-05,
+ "loss": 0.388,
+ "step": 11951
+ },
+ {
+ "epoch": 32.566757493188014,
+ "grad_norm": 8.58881664276123,
+ "learning_rate": 1.5754885391809618e-05,
+ "loss": 0.5242,
+ "step": 11952
+ },
+ {
+ "epoch": 32.56948228882834,
+ "grad_norm": 7.2528533935546875,
+ "learning_rate": 1.5754163656600602e-05,
+ "loss": 0.3458,
+ "step": 11953
+ },
+ {
+ "epoch": 32.572207084468666,
+ "grad_norm": 7.158148288726807,
+ "learning_rate": 1.5753441876578347e-05,
+ "loss": 0.4552,
+ "step": 11954
+ },
+ {
+ "epoch": 32.57493188010899,
+ "grad_norm": 8.406827926635742,
+ "learning_rate": 1.575272005174847e-05,
+ "loss": 0.3913,
+ "step": 11955
+ },
+ {
+ "epoch": 32.57765667574932,
+ "grad_norm": 6.260662078857422,
+ "learning_rate": 1.5751998182116595e-05,
+ "loss": 0.4446,
+ "step": 11956
+ },
+ {
+ "epoch": 32.58038147138964,
+ "grad_norm": 6.576188087463379,
+ "learning_rate": 1.575127626768834e-05,
+ "loss": 0.4244,
+ "step": 11957
+ },
+ {
+ "epoch": 32.583106267029976,
+ "grad_norm": 7.728090763092041,
+ "learning_rate": 1.5750554308469337e-05,
+ "loss": 0.3572,
+ "step": 11958
+ },
+ {
+ "epoch": 32.5858310626703,
+ "grad_norm": 10.058018684387207,
+ "learning_rate": 1.5749832304465197e-05,
+ "loss": 0.3777,
+ "step": 11959
+ },
+ {
+ "epoch": 32.58855585831063,
+ "grad_norm": 9.505508422851562,
+ "learning_rate": 1.574911025568155e-05,
+ "loss": 0.3886,
+ "step": 11960
+ },
+ {
+ "epoch": 32.59128065395095,
+ "grad_norm": 10.549141883850098,
+ "learning_rate": 1.5748388162124017e-05,
+ "loss": 0.3792,
+ "step": 11961
+ },
+ {
+ "epoch": 32.59400544959128,
+ "grad_norm": 6.701169490814209,
+ "learning_rate": 1.5747666023798226e-05,
+ "loss": 0.3253,
+ "step": 11962
+ },
+ {
+ "epoch": 32.596730245231605,
+ "grad_norm": 7.991512775421143,
+ "learning_rate": 1.5746943840709786e-05,
+ "loss": 0.2688,
+ "step": 11963
+ },
+ {
+ "epoch": 32.59945504087194,
+ "grad_norm": 7.135027885437012,
+ "learning_rate": 1.5746221612864342e-05,
+ "loss": 0.3714,
+ "step": 11964
+ },
+ {
+ "epoch": 32.60217983651226,
+ "grad_norm": 9.023070335388184,
+ "learning_rate": 1.5745499340267508e-05,
+ "loss": 0.5009,
+ "step": 11965
+ },
+ {
+ "epoch": 32.60490463215259,
+ "grad_norm": 6.113072395324707,
+ "learning_rate": 1.574477702292491e-05,
+ "loss": 0.4158,
+ "step": 11966
+ },
+ {
+ "epoch": 32.607629427792915,
+ "grad_norm": 6.196746349334717,
+ "learning_rate": 1.574405466084217e-05,
+ "loss": 0.2893,
+ "step": 11967
+ },
+ {
+ "epoch": 32.61035422343324,
+ "grad_norm": 7.036569595336914,
+ "learning_rate": 1.574333225402492e-05,
+ "loss": 0.3227,
+ "step": 11968
+ },
+ {
+ "epoch": 32.61307901907357,
+ "grad_norm": 9.898079872131348,
+ "learning_rate": 1.5742609802478782e-05,
+ "loss": 0.2725,
+ "step": 11969
+ },
+ {
+ "epoch": 32.6158038147139,
+ "grad_norm": 9.416449546813965,
+ "learning_rate": 1.5741887306209383e-05,
+ "loss": 0.5483,
+ "step": 11970
+ },
+ {
+ "epoch": 32.618528610354225,
+ "grad_norm": 12.58320426940918,
+ "learning_rate": 1.574116476522235e-05,
+ "loss": 0.3538,
+ "step": 11971
+ },
+ {
+ "epoch": 32.62125340599455,
+ "grad_norm": 9.070144653320312,
+ "learning_rate": 1.5740442179523315e-05,
+ "loss": 0.4606,
+ "step": 11972
+ },
+ {
+ "epoch": 32.62397820163488,
+ "grad_norm": 12.15832805633545,
+ "learning_rate": 1.5739719549117897e-05,
+ "loss": 0.3821,
+ "step": 11973
+ },
+ {
+ "epoch": 32.6267029972752,
+ "grad_norm": 7.7303547859191895,
+ "learning_rate": 1.5738996874011728e-05,
+ "loss": 0.3867,
+ "step": 11974
+ },
+ {
+ "epoch": 32.62942779291553,
+ "grad_norm": 11.707273483276367,
+ "learning_rate": 1.573827415421044e-05,
+ "loss": 0.4366,
+ "step": 11975
+ },
+ {
+ "epoch": 32.63215258855586,
+ "grad_norm": 6.971134662628174,
+ "learning_rate": 1.5737551389719655e-05,
+ "loss": 0.4473,
+ "step": 11976
+ },
+ {
+ "epoch": 32.63487738419619,
+ "grad_norm": 7.204379081726074,
+ "learning_rate": 1.5736828580545003e-05,
+ "loss": 0.2962,
+ "step": 11977
+ },
+ {
+ "epoch": 32.63760217983651,
+ "grad_norm": 7.457752704620361,
+ "learning_rate": 1.5736105726692117e-05,
+ "loss": 0.3885,
+ "step": 11978
+ },
+ {
+ "epoch": 32.64032697547684,
+ "grad_norm": 6.843810081481934,
+ "learning_rate": 1.5735382828166623e-05,
+ "loss": 0.5171,
+ "step": 11979
+ },
+ {
+ "epoch": 32.643051771117165,
+ "grad_norm": 7.744211673736572,
+ "learning_rate": 1.573465988497415e-05,
+ "loss": 0.4914,
+ "step": 11980
+ },
+ {
+ "epoch": 32.64577656675749,
+ "grad_norm": 8.346298217773438,
+ "learning_rate": 1.5733936897120333e-05,
+ "loss": 0.3502,
+ "step": 11981
+ },
+ {
+ "epoch": 32.64850136239782,
+ "grad_norm": 10.77584457397461,
+ "learning_rate": 1.57332138646108e-05,
+ "loss": 0.3922,
+ "step": 11982
+ },
+ {
+ "epoch": 32.65122615803815,
+ "grad_norm": 6.4791693687438965,
+ "learning_rate": 1.573249078745118e-05,
+ "loss": 0.4125,
+ "step": 11983
+ },
+ {
+ "epoch": 32.653950953678475,
+ "grad_norm": 10.286407470703125,
+ "learning_rate": 1.573176766564711e-05,
+ "loss": 0.4296,
+ "step": 11984
+ },
+ {
+ "epoch": 32.6566757493188,
+ "grad_norm": 7.827480316162109,
+ "learning_rate": 1.5731044499204213e-05,
+ "loss": 0.4174,
+ "step": 11985
+ },
+ {
+ "epoch": 32.65940054495913,
+ "grad_norm": 7.769915580749512,
+ "learning_rate": 1.5730321288128128e-05,
+ "loss": 0.292,
+ "step": 11986
+ },
+ {
+ "epoch": 32.66212534059945,
+ "grad_norm": 7.813076972961426,
+ "learning_rate": 1.5729598032424486e-05,
+ "loss": 0.4645,
+ "step": 11987
+ },
+ {
+ "epoch": 32.664850136239785,
+ "grad_norm": 7.816955089569092,
+ "learning_rate": 1.572887473209892e-05,
+ "loss": 0.3946,
+ "step": 11988
+ },
+ {
+ "epoch": 32.66757493188011,
+ "grad_norm": 7.383937835693359,
+ "learning_rate": 1.572815138715706e-05,
+ "loss": 0.4445,
+ "step": 11989
+ },
+ {
+ "epoch": 32.67029972752044,
+ "grad_norm": 11.780363082885742,
+ "learning_rate": 1.5727427997604545e-05,
+ "loss": 0.3294,
+ "step": 11990
+ },
+ {
+ "epoch": 32.67302452316076,
+ "grad_norm": 10.708660125732422,
+ "learning_rate": 1.5726704563446998e-05,
+ "loss": 0.2985,
+ "step": 11991
+ },
+ {
+ "epoch": 32.67574931880109,
+ "grad_norm": 8.770447731018066,
+ "learning_rate": 1.5725981084690067e-05,
+ "loss": 0.3227,
+ "step": 11992
+ },
+ {
+ "epoch": 32.678474114441414,
+ "grad_norm": 8.673264503479004,
+ "learning_rate": 1.5725257561339375e-05,
+ "loss": 0.4449,
+ "step": 11993
+ },
+ {
+ "epoch": 32.68119891008175,
+ "grad_norm": 9.200652122497559,
+ "learning_rate": 1.5724533993400564e-05,
+ "loss": 0.3591,
+ "step": 11994
+ },
+ {
+ "epoch": 32.68392370572207,
+ "grad_norm": 7.240207195281982,
+ "learning_rate": 1.572381038087927e-05,
+ "loss": 0.5212,
+ "step": 11995
+ },
+ {
+ "epoch": 32.6866485013624,
+ "grad_norm": 9.379121780395508,
+ "learning_rate": 1.5723086723781116e-05,
+ "loss": 0.3761,
+ "step": 11996
+ },
+ {
+ "epoch": 32.689373297002724,
+ "grad_norm": 6.244917392730713,
+ "learning_rate": 1.572236302211175e-05,
+ "loss": 0.2638,
+ "step": 11997
+ },
+ {
+ "epoch": 32.69209809264305,
+ "grad_norm": 8.620534896850586,
+ "learning_rate": 1.5721639275876807e-05,
+ "loss": 0.3557,
+ "step": 11998
+ },
+ {
+ "epoch": 32.694822888283376,
+ "grad_norm": 8.94057559967041,
+ "learning_rate": 1.5720915485081923e-05,
+ "loss": 0.3119,
+ "step": 11999
+ },
+ {
+ "epoch": 32.69754768392371,
+ "grad_norm": 15.445932388305664,
+ "learning_rate": 1.572019164973273e-05,
+ "loss": 0.3889,
+ "step": 12000
+ },
+ {
+ "epoch": 32.700272479564035,
+ "grad_norm": 7.084281921386719,
+ "learning_rate": 1.571946776983487e-05,
+ "loss": 0.3085,
+ "step": 12001
+ },
+ {
+ "epoch": 32.70299727520436,
+ "grad_norm": 6.626097679138184,
+ "learning_rate": 1.571874384539398e-05,
+ "loss": 0.3419,
+ "step": 12002
+ },
+ {
+ "epoch": 32.705722070844686,
+ "grad_norm": 6.412007808685303,
+ "learning_rate": 1.5718019876415696e-05,
+ "loss": 0.473,
+ "step": 12003
+ },
+ {
+ "epoch": 32.70844686648501,
+ "grad_norm": 8.777931213378906,
+ "learning_rate": 1.571729586290566e-05,
+ "loss": 0.4618,
+ "step": 12004
+ },
+ {
+ "epoch": 32.71117166212534,
+ "grad_norm": 7.052206039428711,
+ "learning_rate": 1.5716571804869502e-05,
+ "loss": 0.3517,
+ "step": 12005
+ },
+ {
+ "epoch": 32.71389645776567,
+ "grad_norm": 7.550273895263672,
+ "learning_rate": 1.571584770231287e-05,
+ "loss": 0.5114,
+ "step": 12006
+ },
+ {
+ "epoch": 32.716621253406,
+ "grad_norm": 8.385041236877441,
+ "learning_rate": 1.5715123555241397e-05,
+ "loss": 0.4684,
+ "step": 12007
+ },
+ {
+ "epoch": 32.71934604904632,
+ "grad_norm": 7.535192966461182,
+ "learning_rate": 1.571439936366073e-05,
+ "loss": 0.5306,
+ "step": 12008
+ },
+ {
+ "epoch": 32.72207084468665,
+ "grad_norm": 6.882071495056152,
+ "learning_rate": 1.5713675127576504e-05,
+ "loss": 0.5009,
+ "step": 12009
+ },
+ {
+ "epoch": 32.724795640326974,
+ "grad_norm": 9.158919334411621,
+ "learning_rate": 1.571295084699436e-05,
+ "loss": 0.4095,
+ "step": 12010
+ },
+ {
+ "epoch": 32.7275204359673,
+ "grad_norm": 7.361640930175781,
+ "learning_rate": 1.5712226521919936e-05,
+ "loss": 0.4253,
+ "step": 12011
+ },
+ {
+ "epoch": 32.73024523160763,
+ "grad_norm": 7.760611534118652,
+ "learning_rate": 1.5711502152358878e-05,
+ "loss": 0.3644,
+ "step": 12012
+ },
+ {
+ "epoch": 32.73297002724796,
+ "grad_norm": 6.2527756690979,
+ "learning_rate": 1.5710777738316827e-05,
+ "loss": 0.3277,
+ "step": 12013
+ },
+ {
+ "epoch": 32.735694822888284,
+ "grad_norm": 8.708322525024414,
+ "learning_rate": 1.5710053279799416e-05,
+ "loss": 0.455,
+ "step": 12014
+ },
+ {
+ "epoch": 32.73841961852861,
+ "grad_norm": 10.21238899230957,
+ "learning_rate": 1.5709328776812302e-05,
+ "loss": 0.4052,
+ "step": 12015
+ },
+ {
+ "epoch": 32.741144414168936,
+ "grad_norm": 8.482315063476562,
+ "learning_rate": 1.5708604229361115e-05,
+ "loss": 0.3911,
+ "step": 12016
+ },
+ {
+ "epoch": 32.74386920980926,
+ "grad_norm": 7.245648384094238,
+ "learning_rate": 1.5707879637451502e-05,
+ "loss": 0.4201,
+ "step": 12017
+ },
+ {
+ "epoch": 32.746594005449595,
+ "grad_norm": 9.180356979370117,
+ "learning_rate": 1.5707155001089106e-05,
+ "loss": 0.4395,
+ "step": 12018
+ },
+ {
+ "epoch": 32.74931880108992,
+ "grad_norm": 9.307323455810547,
+ "learning_rate": 1.570643032027957e-05,
+ "loss": 0.3676,
+ "step": 12019
+ },
+ {
+ "epoch": 32.752043596730246,
+ "grad_norm": 7.687534809112549,
+ "learning_rate": 1.570570559502854e-05,
+ "loss": 0.3707,
+ "step": 12020
+ },
+ {
+ "epoch": 32.75476839237057,
+ "grad_norm": 6.333620071411133,
+ "learning_rate": 1.570498082534166e-05,
+ "loss": 0.4487,
+ "step": 12021
+ },
+ {
+ "epoch": 32.7574931880109,
+ "grad_norm": 6.845382213592529,
+ "learning_rate": 1.570425601122457e-05,
+ "loss": 0.3813,
+ "step": 12022
+ },
+ {
+ "epoch": 32.76021798365122,
+ "grad_norm": 6.706961154937744,
+ "learning_rate": 1.5703531152682918e-05,
+ "loss": 0.466,
+ "step": 12023
+ },
+ {
+ "epoch": 32.762942779291556,
+ "grad_norm": 8.425186157226562,
+ "learning_rate": 1.570280624972235e-05,
+ "loss": 0.4315,
+ "step": 12024
+ },
+ {
+ "epoch": 32.76566757493188,
+ "grad_norm": 7.779570579528809,
+ "learning_rate": 1.570208130234851e-05,
+ "loss": 0.3782,
+ "step": 12025
+ },
+ {
+ "epoch": 32.76839237057221,
+ "grad_norm": 39.01546096801758,
+ "learning_rate": 1.5701356310567044e-05,
+ "loss": 0.3603,
+ "step": 12026
+ },
+ {
+ "epoch": 32.771117166212534,
+ "grad_norm": 8.052181243896484,
+ "learning_rate": 1.57006312743836e-05,
+ "loss": 0.5454,
+ "step": 12027
+ },
+ {
+ "epoch": 32.77384196185286,
+ "grad_norm": 8.000152587890625,
+ "learning_rate": 1.569990619380382e-05,
+ "loss": 0.2993,
+ "step": 12028
+ },
+ {
+ "epoch": 32.776566757493185,
+ "grad_norm": 8.588805198669434,
+ "learning_rate": 1.5699181068833355e-05,
+ "loss": 0.3774,
+ "step": 12029
+ },
+ {
+ "epoch": 32.77929155313352,
+ "grad_norm": 6.751492023468018,
+ "learning_rate": 1.5698455899477852e-05,
+ "loss": 0.3899,
+ "step": 12030
+ },
+ {
+ "epoch": 32.782016348773844,
+ "grad_norm": 6.409905433654785,
+ "learning_rate": 1.569773068574296e-05,
+ "loss": 0.2914,
+ "step": 12031
+ },
+ {
+ "epoch": 32.78474114441417,
+ "grad_norm": 7.139047145843506,
+ "learning_rate": 1.5697005427634324e-05,
+ "loss": 0.331,
+ "step": 12032
+ },
+ {
+ "epoch": 32.787465940054496,
+ "grad_norm": 6.8841094970703125,
+ "learning_rate": 1.569628012515759e-05,
+ "loss": 0.3943,
+ "step": 12033
+ },
+ {
+ "epoch": 32.79019073569482,
+ "grad_norm": 8.627446174621582,
+ "learning_rate": 1.5695554778318413e-05,
+ "loss": 0.534,
+ "step": 12034
+ },
+ {
+ "epoch": 32.79291553133515,
+ "grad_norm": 7.6862311363220215,
+ "learning_rate": 1.5694829387122436e-05,
+ "loss": 0.28,
+ "step": 12035
+ },
+ {
+ "epoch": 32.79564032697548,
+ "grad_norm": 9.490158081054688,
+ "learning_rate": 1.5694103951575313e-05,
+ "loss": 0.4632,
+ "step": 12036
+ },
+ {
+ "epoch": 32.798365122615806,
+ "grad_norm": 6.376895904541016,
+ "learning_rate": 1.5693378471682688e-05,
+ "loss": 0.3123,
+ "step": 12037
+ },
+ {
+ "epoch": 32.80108991825613,
+ "grad_norm": 8.53414535522461,
+ "learning_rate": 1.569265294745022e-05,
+ "loss": 0.5134,
+ "step": 12038
+ },
+ {
+ "epoch": 32.80381471389646,
+ "grad_norm": 8.084589004516602,
+ "learning_rate": 1.5691927378883555e-05,
+ "loss": 0.4007,
+ "step": 12039
+ },
+ {
+ "epoch": 32.80653950953678,
+ "grad_norm": 9.008152961730957,
+ "learning_rate": 1.5691201765988336e-05,
+ "loss": 0.4251,
+ "step": 12040
+ },
+ {
+ "epoch": 32.80926430517711,
+ "grad_norm": 7.938703536987305,
+ "learning_rate": 1.5690476108770224e-05,
+ "loss": 0.5161,
+ "step": 12041
+ },
+ {
+ "epoch": 32.81198910081744,
+ "grad_norm": 8.03249454498291,
+ "learning_rate": 1.568975040723487e-05,
+ "loss": 0.3499,
+ "step": 12042
+ },
+ {
+ "epoch": 32.81471389645777,
+ "grad_norm": 8.85582447052002,
+ "learning_rate": 1.568902466138792e-05,
+ "loss": 0.4211,
+ "step": 12043
+ },
+ {
+ "epoch": 32.817438692098094,
+ "grad_norm": 7.650516033172607,
+ "learning_rate": 1.5688298871235028e-05,
+ "loss": 0.445,
+ "step": 12044
+ },
+ {
+ "epoch": 32.82016348773842,
+ "grad_norm": 7.037267208099365,
+ "learning_rate": 1.568757303678185e-05,
+ "loss": 0.3871,
+ "step": 12045
+ },
+ {
+ "epoch": 32.822888283378745,
+ "grad_norm": 8.33869743347168,
+ "learning_rate": 1.5686847158034036e-05,
+ "loss": 0.4173,
+ "step": 12046
+ },
+ {
+ "epoch": 32.82561307901907,
+ "grad_norm": 9.3466796875,
+ "learning_rate": 1.568612123499724e-05,
+ "loss": 0.4705,
+ "step": 12047
+ },
+ {
+ "epoch": 32.828337874659404,
+ "grad_norm": 7.2523417472839355,
+ "learning_rate": 1.5685395267677113e-05,
+ "loss": 0.4606,
+ "step": 12048
+ },
+ {
+ "epoch": 32.83106267029973,
+ "grad_norm": 7.06911563873291,
+ "learning_rate": 1.568466925607931e-05,
+ "loss": 0.4572,
+ "step": 12049
+ },
+ {
+ "epoch": 32.833787465940055,
+ "grad_norm": 8.29034423828125,
+ "learning_rate": 1.5683943200209486e-05,
+ "loss": 0.347,
+ "step": 12050
+ },
+ {
+ "epoch": 32.83651226158038,
+ "grad_norm": 7.922194480895996,
+ "learning_rate": 1.56832171000733e-05,
+ "loss": 0.4034,
+ "step": 12051
+ },
+ {
+ "epoch": 32.83923705722071,
+ "grad_norm": 7.565577030181885,
+ "learning_rate": 1.5682490955676395e-05,
+ "loss": 0.3679,
+ "step": 12052
+ },
+ {
+ "epoch": 32.84196185286103,
+ "grad_norm": 8.645038604736328,
+ "learning_rate": 1.5681764767024435e-05,
+ "loss": 0.42,
+ "step": 12053
+ },
+ {
+ "epoch": 32.844686648501366,
+ "grad_norm": 7.09843111038208,
+ "learning_rate": 1.5681038534123078e-05,
+ "loss": 0.5084,
+ "step": 12054
+ },
+ {
+ "epoch": 32.84741144414169,
+ "grad_norm": 8.0593843460083,
+ "learning_rate": 1.5680312256977974e-05,
+ "loss": 0.3346,
+ "step": 12055
+ },
+ {
+ "epoch": 32.85013623978202,
+ "grad_norm": 5.948692798614502,
+ "learning_rate": 1.5679585935594782e-05,
+ "loss": 0.493,
+ "step": 12056
+ },
+ {
+ "epoch": 32.85286103542234,
+ "grad_norm": 6.850461959838867,
+ "learning_rate": 1.5678859569979154e-05,
+ "loss": 0.3345,
+ "step": 12057
+ },
+ {
+ "epoch": 32.85558583106267,
+ "grad_norm": 6.771362781524658,
+ "learning_rate": 1.5678133160136754e-05,
+ "loss": 0.4419,
+ "step": 12058
+ },
+ {
+ "epoch": 32.858310626702995,
+ "grad_norm": 7.2968878746032715,
+ "learning_rate": 1.5677406706073234e-05,
+ "loss": 0.3654,
+ "step": 12059
+ },
+ {
+ "epoch": 32.86103542234333,
+ "grad_norm": 6.3690643310546875,
+ "learning_rate": 1.5676680207794252e-05,
+ "loss": 0.3576,
+ "step": 12060
+ },
+ {
+ "epoch": 32.86376021798365,
+ "grad_norm": 7.52684211730957,
+ "learning_rate": 1.567595366530547e-05,
+ "loss": 0.6186,
+ "step": 12061
+ },
+ {
+ "epoch": 32.86648501362398,
+ "grad_norm": 6.275260925292969,
+ "learning_rate": 1.567522707861254e-05,
+ "loss": 0.5436,
+ "step": 12062
+ },
+ {
+ "epoch": 32.869209809264305,
+ "grad_norm": 7.670266628265381,
+ "learning_rate": 1.567450044772113e-05,
+ "loss": 0.5059,
+ "step": 12063
+ },
+ {
+ "epoch": 32.87193460490463,
+ "grad_norm": 7.877997875213623,
+ "learning_rate": 1.5673773772636887e-05,
+ "loss": 0.4254,
+ "step": 12064
+ },
+ {
+ "epoch": 32.87465940054496,
+ "grad_norm": 7.987328052520752,
+ "learning_rate": 1.567304705336548e-05,
+ "loss": 0.3008,
+ "step": 12065
+ },
+ {
+ "epoch": 32.87738419618529,
+ "grad_norm": 6.786599159240723,
+ "learning_rate": 1.567232028991256e-05,
+ "loss": 0.4849,
+ "step": 12066
+ },
+ {
+ "epoch": 32.880108991825615,
+ "grad_norm": 7.205345630645752,
+ "learning_rate": 1.5671593482283797e-05,
+ "loss": 0.3793,
+ "step": 12067
+ },
+ {
+ "epoch": 32.88283378746594,
+ "grad_norm": 8.275880813598633,
+ "learning_rate": 1.5670866630484847e-05,
+ "loss": 0.4988,
+ "step": 12068
+ },
+ {
+ "epoch": 32.88555858310627,
+ "grad_norm": 6.805363655090332,
+ "learning_rate": 1.567013973452137e-05,
+ "loss": 0.3616,
+ "step": 12069
+ },
+ {
+ "epoch": 32.88828337874659,
+ "grad_norm": 7.106833457946777,
+ "learning_rate": 1.5669412794399027e-05,
+ "loss": 0.5326,
+ "step": 12070
+ },
+ {
+ "epoch": 32.89100817438692,
+ "grad_norm": 9.400209426879883,
+ "learning_rate": 1.5668685810123477e-05,
+ "loss": 0.472,
+ "step": 12071
+ },
+ {
+ "epoch": 32.89373297002725,
+ "grad_norm": 8.801173210144043,
+ "learning_rate": 1.5667958781700386e-05,
+ "loss": 0.3932,
+ "step": 12072
+ },
+ {
+ "epoch": 32.89645776566758,
+ "grad_norm": 7.403770446777344,
+ "learning_rate": 1.5667231709135414e-05,
+ "loss": 0.4413,
+ "step": 12073
+ },
+ {
+ "epoch": 32.8991825613079,
+ "grad_norm": 8.15301513671875,
+ "learning_rate": 1.5666504592434228e-05,
+ "loss": 0.313,
+ "step": 12074
+ },
+ {
+ "epoch": 32.90190735694823,
+ "grad_norm": 8.188809394836426,
+ "learning_rate": 1.566577743160248e-05,
+ "loss": 0.4168,
+ "step": 12075
+ },
+ {
+ "epoch": 32.904632152588555,
+ "grad_norm": 6.774173259735107,
+ "learning_rate": 1.566505022664584e-05,
+ "loss": 0.3796,
+ "step": 12076
+ },
+ {
+ "epoch": 32.90735694822888,
+ "grad_norm": 8.598569869995117,
+ "learning_rate": 1.5664322977569976e-05,
+ "loss": 0.4853,
+ "step": 12077
+ },
+ {
+ "epoch": 32.91008174386921,
+ "grad_norm": 9.037574768066406,
+ "learning_rate": 1.5663595684380544e-05,
+ "loss": 0.3386,
+ "step": 12078
+ },
+ {
+ "epoch": 32.91280653950954,
+ "grad_norm": 8.221321105957031,
+ "learning_rate": 1.5662868347083213e-05,
+ "loss": 0.4525,
+ "step": 12079
+ },
+ {
+ "epoch": 32.915531335149865,
+ "grad_norm": 8.122885704040527,
+ "learning_rate": 1.5662140965683645e-05,
+ "loss": 0.511,
+ "step": 12080
+ },
+ {
+ "epoch": 32.91825613079019,
+ "grad_norm": 12.633194923400879,
+ "learning_rate": 1.5661413540187504e-05,
+ "loss": 0.448,
+ "step": 12081
+ },
+ {
+ "epoch": 32.920980926430516,
+ "grad_norm": 7.939639091491699,
+ "learning_rate": 1.566068607060046e-05,
+ "loss": 0.4385,
+ "step": 12082
+ },
+ {
+ "epoch": 32.92370572207084,
+ "grad_norm": 6.504891395568848,
+ "learning_rate": 1.565995855692817e-05,
+ "loss": 0.3574,
+ "step": 12083
+ },
+ {
+ "epoch": 32.926430517711175,
+ "grad_norm": 7.92395544052124,
+ "learning_rate": 1.5659230999176307e-05,
+ "loss": 0.3979,
+ "step": 12084
+ },
+ {
+ "epoch": 32.9291553133515,
+ "grad_norm": 7.3674635887146,
+ "learning_rate": 1.5658503397350536e-05,
+ "loss": 0.5131,
+ "step": 12085
+ },
+ {
+ "epoch": 32.93188010899183,
+ "grad_norm": 5.609498023986816,
+ "learning_rate": 1.5657775751456524e-05,
+ "loss": 0.3665,
+ "step": 12086
+ },
+ {
+ "epoch": 32.93460490463215,
+ "grad_norm": 11.792949676513672,
+ "learning_rate": 1.5657048061499932e-05,
+ "loss": 0.4108,
+ "step": 12087
+ },
+ {
+ "epoch": 32.93732970027248,
+ "grad_norm": 7.255577087402344,
+ "learning_rate": 1.5656320327486433e-05,
+ "loss": 0.37,
+ "step": 12088
+ },
+ {
+ "epoch": 32.940054495912804,
+ "grad_norm": 17.582035064697266,
+ "learning_rate": 1.5655592549421695e-05,
+ "loss": 0.4506,
+ "step": 12089
+ },
+ {
+ "epoch": 32.94277929155314,
+ "grad_norm": 10.486715316772461,
+ "learning_rate": 1.565486472731139e-05,
+ "loss": 0.4735,
+ "step": 12090
+ },
+ {
+ "epoch": 32.94550408719346,
+ "grad_norm": 7.075913429260254,
+ "learning_rate": 1.5654136861161174e-05,
+ "loss": 0.4352,
+ "step": 12091
+ },
+ {
+ "epoch": 32.94822888283379,
+ "grad_norm": 9.81493091583252,
+ "learning_rate": 1.5653408950976717e-05,
+ "loss": 0.3662,
+ "step": 12092
+ },
+ {
+ "epoch": 32.950953678474114,
+ "grad_norm": 11.64074420928955,
+ "learning_rate": 1.5652680996763702e-05,
+ "loss": 0.4028,
+ "step": 12093
+ },
+ {
+ "epoch": 32.95367847411444,
+ "grad_norm": 6.694557189941406,
+ "learning_rate": 1.5651952998527786e-05,
+ "loss": 0.3807,
+ "step": 12094
+ },
+ {
+ "epoch": 32.956403269754766,
+ "grad_norm": 8.660942077636719,
+ "learning_rate": 1.5651224956274643e-05,
+ "loss": 0.3384,
+ "step": 12095
+ },
+ {
+ "epoch": 32.95912806539509,
+ "grad_norm": 7.801591873168945,
+ "learning_rate": 1.565049687000994e-05,
+ "loss": 0.4241,
+ "step": 12096
+ },
+ {
+ "epoch": 32.961852861035425,
+ "grad_norm": 6.360088348388672,
+ "learning_rate": 1.5649768739739348e-05,
+ "loss": 0.5128,
+ "step": 12097
+ },
+ {
+ "epoch": 32.96457765667575,
+ "grad_norm": 5.70269775390625,
+ "learning_rate": 1.564904056546854e-05,
+ "loss": 0.3537,
+ "step": 12098
+ },
+ {
+ "epoch": 32.967302452316076,
+ "grad_norm": 7.237667560577393,
+ "learning_rate": 1.564831234720319e-05,
+ "loss": 0.4069,
+ "step": 12099
+ },
+ {
+ "epoch": 32.9700272479564,
+ "grad_norm": 9.81737232208252,
+ "learning_rate": 1.564758408494896e-05,
+ "loss": 0.5043,
+ "step": 12100
+ },
+ {
+ "epoch": 32.97275204359673,
+ "grad_norm": 6.362037181854248,
+ "learning_rate": 1.564685577871153e-05,
+ "loss": 0.4174,
+ "step": 12101
+ },
+ {
+ "epoch": 32.97547683923706,
+ "grad_norm": 6.462863922119141,
+ "learning_rate": 1.564612742849657e-05,
+ "loss": 0.4637,
+ "step": 12102
+ },
+ {
+ "epoch": 32.97820163487739,
+ "grad_norm": 12.043787956237793,
+ "learning_rate": 1.564539903430975e-05,
+ "loss": 0.4103,
+ "step": 12103
+ },
+ {
+ "epoch": 32.98092643051771,
+ "grad_norm": 7.939565181732178,
+ "learning_rate": 1.564467059615674e-05,
+ "loss": 0.4692,
+ "step": 12104
+ },
+ {
+ "epoch": 32.98365122615804,
+ "grad_norm": 8.781482696533203,
+ "learning_rate": 1.564394211404322e-05,
+ "loss": 0.3722,
+ "step": 12105
+ },
+ {
+ "epoch": 32.986376021798364,
+ "grad_norm": 8.51310920715332,
+ "learning_rate": 1.564321358797486e-05,
+ "loss": 0.4591,
+ "step": 12106
+ },
+ {
+ "epoch": 32.98910081743869,
+ "grad_norm": 5.838075160980225,
+ "learning_rate": 1.564248501795734e-05,
+ "loss": 0.4764,
+ "step": 12107
+ },
+ {
+ "epoch": 32.991825613079016,
+ "grad_norm": 6.868386745452881,
+ "learning_rate": 1.564175640399632e-05,
+ "loss": 0.3613,
+ "step": 12108
+ },
+ {
+ "epoch": 32.99455040871935,
+ "grad_norm": 6.692442417144775,
+ "learning_rate": 1.5641027746097484e-05,
+ "loss": 0.6792,
+ "step": 12109
+ },
+ {
+ "epoch": 32.997275204359674,
+ "grad_norm": 8.148579597473145,
+ "learning_rate": 1.564029904426651e-05,
+ "loss": 0.4401,
+ "step": 12110
+ },
+ {
+ "epoch": 33.0,
+ "grad_norm": 6.626377105712891,
+ "learning_rate": 1.5639570298509067e-05,
+ "loss": 0.2638,
+ "step": 12111
+ },
+ {
+ "epoch": 33.002724795640326,
+ "grad_norm": 7.323823928833008,
+ "learning_rate": 1.563884150883083e-05,
+ "loss": 0.5676,
+ "step": 12112
+ },
+ {
+ "epoch": 33.00544959128065,
+ "grad_norm": 6.628137588500977,
+ "learning_rate": 1.563811267523748e-05,
+ "loss": 0.3055,
+ "step": 12113
+ },
+ {
+ "epoch": 33.00817438692098,
+ "grad_norm": 10.509965896606445,
+ "learning_rate": 1.5637383797734685e-05,
+ "loss": 0.5372,
+ "step": 12114
+ },
+ {
+ "epoch": 33.01089918256131,
+ "grad_norm": 7.332951068878174,
+ "learning_rate": 1.5636654876328134e-05,
+ "loss": 0.3818,
+ "step": 12115
+ },
+ {
+ "epoch": 33.013623978201636,
+ "grad_norm": 5.587296009063721,
+ "learning_rate": 1.563592591102349e-05,
+ "loss": 0.4557,
+ "step": 12116
+ },
+ {
+ "epoch": 33.01634877384196,
+ "grad_norm": 7.477775573730469,
+ "learning_rate": 1.5635196901826436e-05,
+ "loss": 0.6977,
+ "step": 12117
+ },
+ {
+ "epoch": 33.01907356948229,
+ "grad_norm": 6.747099876403809,
+ "learning_rate": 1.563446784874265e-05,
+ "loss": 0.3499,
+ "step": 12118
+ },
+ {
+ "epoch": 33.02179836512261,
+ "grad_norm": 6.576713562011719,
+ "learning_rate": 1.5633738751777814e-05,
+ "loss": 0.3163,
+ "step": 12119
+ },
+ {
+ "epoch": 33.02452316076294,
+ "grad_norm": 5.987857818603516,
+ "learning_rate": 1.56330096109376e-05,
+ "loss": 0.3235,
+ "step": 12120
+ },
+ {
+ "epoch": 33.02724795640327,
+ "grad_norm": 9.134624481201172,
+ "learning_rate": 1.5632280426227685e-05,
+ "loss": 0.5594,
+ "step": 12121
+ },
+ {
+ "epoch": 33.0299727520436,
+ "grad_norm": 6.8406829833984375,
+ "learning_rate": 1.5631551197653756e-05,
+ "loss": 0.3962,
+ "step": 12122
+ },
+ {
+ "epoch": 33.032697547683924,
+ "grad_norm": 7.628662586212158,
+ "learning_rate": 1.5630821925221488e-05,
+ "loss": 0.2757,
+ "step": 12123
+ },
+ {
+ "epoch": 33.03542234332425,
+ "grad_norm": 6.215722560882568,
+ "learning_rate": 1.563009260893656e-05,
+ "loss": 0.3205,
+ "step": 12124
+ },
+ {
+ "epoch": 33.038147138964575,
+ "grad_norm": 9.666122436523438,
+ "learning_rate": 1.5629363248804644e-05,
+ "loss": 0.2663,
+ "step": 12125
+ },
+ {
+ "epoch": 33.0408719346049,
+ "grad_norm": 6.604397296905518,
+ "learning_rate": 1.5628633844831436e-05,
+ "loss": 0.3544,
+ "step": 12126
+ },
+ {
+ "epoch": 33.043596730245234,
+ "grad_norm": 5.744869232177734,
+ "learning_rate": 1.5627904397022605e-05,
+ "loss": 0.4654,
+ "step": 12127
+ },
+ {
+ "epoch": 33.04632152588556,
+ "grad_norm": 9.151631355285645,
+ "learning_rate": 1.5627174905383838e-05,
+ "loss": 0.3775,
+ "step": 12128
+ },
+ {
+ "epoch": 33.049046321525886,
+ "grad_norm": 7.482045650482178,
+ "learning_rate": 1.5626445369920816e-05,
+ "loss": 0.3073,
+ "step": 12129
+ },
+ {
+ "epoch": 33.05177111716621,
+ "grad_norm": 6.341897487640381,
+ "learning_rate": 1.5625715790639214e-05,
+ "loss": 0.3134,
+ "step": 12130
+ },
+ {
+ "epoch": 33.05449591280654,
+ "grad_norm": 8.26285457611084,
+ "learning_rate": 1.562498616754472e-05,
+ "loss": 0.4222,
+ "step": 12131
+ },
+ {
+ "epoch": 33.05722070844686,
+ "grad_norm": 7.009021282196045,
+ "learning_rate": 1.5624256500643016e-05,
+ "loss": 0.3741,
+ "step": 12132
+ },
+ {
+ "epoch": 33.059945504087196,
+ "grad_norm": 7.427831172943115,
+ "learning_rate": 1.5623526789939784e-05,
+ "loss": 0.4128,
+ "step": 12133
+ },
+ {
+ "epoch": 33.06267029972752,
+ "grad_norm": 5.852236270904541,
+ "learning_rate": 1.5622797035440703e-05,
+ "loss": 0.4782,
+ "step": 12134
+ },
+ {
+ "epoch": 33.06539509536785,
+ "grad_norm": 6.832294940948486,
+ "learning_rate": 1.5622067237151465e-05,
+ "loss": 0.2744,
+ "step": 12135
+ },
+ {
+ "epoch": 33.06811989100817,
+ "grad_norm": 6.296779155731201,
+ "learning_rate": 1.5621337395077742e-05,
+ "loss": 0.2502,
+ "step": 12136
+ },
+ {
+ "epoch": 33.0708446866485,
+ "grad_norm": 9.04610538482666,
+ "learning_rate": 1.5620607509225227e-05,
+ "loss": 0.5152,
+ "step": 12137
+ },
+ {
+ "epoch": 33.073569482288825,
+ "grad_norm": 6.3163909912109375,
+ "learning_rate": 1.5619877579599604e-05,
+ "loss": 0.4043,
+ "step": 12138
+ },
+ {
+ "epoch": 33.07629427792916,
+ "grad_norm": 6.203168869018555,
+ "learning_rate": 1.5619147606206552e-05,
+ "loss": 0.4096,
+ "step": 12139
+ },
+ {
+ "epoch": 33.079019073569484,
+ "grad_norm": 6.571667671203613,
+ "learning_rate": 1.561841758905176e-05,
+ "loss": 0.3661,
+ "step": 12140
+ },
+ {
+ "epoch": 33.08174386920981,
+ "grad_norm": 6.468061447143555,
+ "learning_rate": 1.5617687528140915e-05,
+ "loss": 0.4316,
+ "step": 12141
+ },
+ {
+ "epoch": 33.084468664850135,
+ "grad_norm": 4.98010778427124,
+ "learning_rate": 1.5616957423479698e-05,
+ "loss": 0.2972,
+ "step": 12142
+ },
+ {
+ "epoch": 33.08719346049046,
+ "grad_norm": 7.058682441711426,
+ "learning_rate": 1.5616227275073796e-05,
+ "loss": 0.3562,
+ "step": 12143
+ },
+ {
+ "epoch": 33.08991825613079,
+ "grad_norm": 5.501753807067871,
+ "learning_rate": 1.56154970829289e-05,
+ "loss": 0.4178,
+ "step": 12144
+ },
+ {
+ "epoch": 33.09264305177112,
+ "grad_norm": 6.312686920166016,
+ "learning_rate": 1.561476684705069e-05,
+ "loss": 0.2449,
+ "step": 12145
+ },
+ {
+ "epoch": 33.095367847411445,
+ "grad_norm": 6.514692783355713,
+ "learning_rate": 1.561403656744486e-05,
+ "loss": 0.2487,
+ "step": 12146
+ },
+ {
+ "epoch": 33.09809264305177,
+ "grad_norm": 7.077640056610107,
+ "learning_rate": 1.5613306244117092e-05,
+ "loss": 0.4452,
+ "step": 12147
+ },
+ {
+ "epoch": 33.1008174386921,
+ "grad_norm": 8.67483901977539,
+ "learning_rate": 1.5612575877073078e-05,
+ "loss": 0.3589,
+ "step": 12148
+ },
+ {
+ "epoch": 33.10354223433242,
+ "grad_norm": 5.831808090209961,
+ "learning_rate": 1.56118454663185e-05,
+ "loss": 0.3697,
+ "step": 12149
+ },
+ {
+ "epoch": 33.10626702997275,
+ "grad_norm": 6.515407562255859,
+ "learning_rate": 1.5611115011859052e-05,
+ "loss": 0.3438,
+ "step": 12150
+ },
+ {
+ "epoch": 33.10899182561308,
+ "grad_norm": 8.445128440856934,
+ "learning_rate": 1.5610384513700422e-05,
+ "loss": 0.3747,
+ "step": 12151
+ },
+ {
+ "epoch": 33.11171662125341,
+ "grad_norm": 11.156426429748535,
+ "learning_rate": 1.5609653971848296e-05,
+ "loss": 0.3044,
+ "step": 12152
+ },
+ {
+ "epoch": 33.11444141689373,
+ "grad_norm": 10.229217529296875,
+ "learning_rate": 1.5608923386308365e-05,
+ "loss": 0.2704,
+ "step": 12153
+ },
+ {
+ "epoch": 33.11716621253406,
+ "grad_norm": 6.33029842376709,
+ "learning_rate": 1.560819275708632e-05,
+ "loss": 0.3672,
+ "step": 12154
+ },
+ {
+ "epoch": 33.119891008174385,
+ "grad_norm": 7.576890468597412,
+ "learning_rate": 1.5607462084187853e-05,
+ "loss": 0.2351,
+ "step": 12155
+ },
+ {
+ "epoch": 33.12261580381471,
+ "grad_norm": 7.682079792022705,
+ "learning_rate": 1.5606731367618647e-05,
+ "loss": 0.3261,
+ "step": 12156
+ },
+ {
+ "epoch": 33.12534059945504,
+ "grad_norm": 6.63905668258667,
+ "learning_rate": 1.5606000607384402e-05,
+ "loss": 0.3571,
+ "step": 12157
+ },
+ {
+ "epoch": 33.12806539509537,
+ "grad_norm": 7.063698768615723,
+ "learning_rate": 1.56052698034908e-05,
+ "loss": 0.3713,
+ "step": 12158
+ },
+ {
+ "epoch": 33.130790190735695,
+ "grad_norm": 6.658858299255371,
+ "learning_rate": 1.5604538955943542e-05,
+ "loss": 0.3423,
+ "step": 12159
+ },
+ {
+ "epoch": 33.13351498637602,
+ "grad_norm": 9.059860229492188,
+ "learning_rate": 1.5603808064748313e-05,
+ "loss": 0.3508,
+ "step": 12160
+ },
+ {
+ "epoch": 33.13623978201635,
+ "grad_norm": 7.219796657562256,
+ "learning_rate": 1.5603077129910805e-05,
+ "loss": 0.3313,
+ "step": 12161
+ },
+ {
+ "epoch": 33.13896457765667,
+ "grad_norm": 11.955741882324219,
+ "learning_rate": 1.5602346151436715e-05,
+ "loss": 0.3326,
+ "step": 12162
+ },
+ {
+ "epoch": 33.141689373297005,
+ "grad_norm": 6.73663854598999,
+ "learning_rate": 1.5601615129331734e-05,
+ "loss": 0.4324,
+ "step": 12163
+ },
+ {
+ "epoch": 33.14441416893733,
+ "grad_norm": 6.877493858337402,
+ "learning_rate": 1.5600884063601554e-05,
+ "loss": 0.4032,
+ "step": 12164
+ },
+ {
+ "epoch": 33.14713896457766,
+ "grad_norm": 6.520141124725342,
+ "learning_rate": 1.560015295425187e-05,
+ "loss": 0.3725,
+ "step": 12165
+ },
+ {
+ "epoch": 33.14986376021798,
+ "grad_norm": 6.258823871612549,
+ "learning_rate": 1.5599421801288373e-05,
+ "loss": 0.3919,
+ "step": 12166
+ },
+ {
+ "epoch": 33.15258855585831,
+ "grad_norm": 6.118670463562012,
+ "learning_rate": 1.5598690604716763e-05,
+ "loss": 0.3483,
+ "step": 12167
+ },
+ {
+ "epoch": 33.155313351498634,
+ "grad_norm": 8.57835865020752,
+ "learning_rate": 1.5597959364542726e-05,
+ "loss": 0.401,
+ "step": 12168
+ },
+ {
+ "epoch": 33.15803814713897,
+ "grad_norm": 8.096592903137207,
+ "learning_rate": 1.559722808077196e-05,
+ "loss": 0.3821,
+ "step": 12169
+ },
+ {
+ "epoch": 33.16076294277929,
+ "grad_norm": 6.646443843841553,
+ "learning_rate": 1.559649675341017e-05,
+ "loss": 0.3525,
+ "step": 12170
+ },
+ {
+ "epoch": 33.16348773841962,
+ "grad_norm": 6.403456211090088,
+ "learning_rate": 1.5595765382463035e-05,
+ "loss": 0.3165,
+ "step": 12171
+ },
+ {
+ "epoch": 33.166212534059945,
+ "grad_norm": 6.006011009216309,
+ "learning_rate": 1.5595033967936264e-05,
+ "loss": 0.4086,
+ "step": 12172
+ },
+ {
+ "epoch": 33.16893732970027,
+ "grad_norm": 6.651188850402832,
+ "learning_rate": 1.5594302509835548e-05,
+ "loss": 0.4548,
+ "step": 12173
+ },
+ {
+ "epoch": 33.171662125340596,
+ "grad_norm": 11.389019966125488,
+ "learning_rate": 1.5593571008166587e-05,
+ "loss": 0.3697,
+ "step": 12174
+ },
+ {
+ "epoch": 33.17438692098093,
+ "grad_norm": 5.870072841644287,
+ "learning_rate": 1.559283946293507e-05,
+ "loss": 0.2602,
+ "step": 12175
+ },
+ {
+ "epoch": 33.177111716621255,
+ "grad_norm": 5.876684665679932,
+ "learning_rate": 1.55921078741467e-05,
+ "loss": 0.2562,
+ "step": 12176
+ },
+ {
+ "epoch": 33.17983651226158,
+ "grad_norm": 7.102714538574219,
+ "learning_rate": 1.5591376241807177e-05,
+ "loss": 0.3668,
+ "step": 12177
+ },
+ {
+ "epoch": 33.182561307901906,
+ "grad_norm": 8.703709602355957,
+ "learning_rate": 1.559064456592219e-05,
+ "loss": 0.346,
+ "step": 12178
+ },
+ {
+ "epoch": 33.18528610354223,
+ "grad_norm": 6.849244117736816,
+ "learning_rate": 1.5589912846497447e-05,
+ "loss": 0.3544,
+ "step": 12179
+ },
+ {
+ "epoch": 33.18801089918256,
+ "grad_norm": 5.676214218139648,
+ "learning_rate": 1.5589181083538646e-05,
+ "loss": 0.385,
+ "step": 12180
+ },
+ {
+ "epoch": 33.19073569482289,
+ "grad_norm": 7.680464744567871,
+ "learning_rate": 1.5588449277051476e-05,
+ "loss": 0.4911,
+ "step": 12181
+ },
+ {
+ "epoch": 33.19346049046322,
+ "grad_norm": 8.966886520385742,
+ "learning_rate": 1.5587717427041645e-05,
+ "loss": 0.4529,
+ "step": 12182
+ },
+ {
+ "epoch": 33.19618528610354,
+ "grad_norm": 8.935302734375,
+ "learning_rate": 1.5586985533514853e-05,
+ "loss": 0.334,
+ "step": 12183
+ },
+ {
+ "epoch": 33.19891008174387,
+ "grad_norm": 6.224770545959473,
+ "learning_rate": 1.5586253596476798e-05,
+ "loss": 0.3634,
+ "step": 12184
+ },
+ {
+ "epoch": 33.201634877384194,
+ "grad_norm": 8.594982147216797,
+ "learning_rate": 1.5585521615933176e-05,
+ "loss": 0.3778,
+ "step": 12185
+ },
+ {
+ "epoch": 33.20435967302452,
+ "grad_norm": 6.484743595123291,
+ "learning_rate": 1.5584789591889693e-05,
+ "loss": 0.4342,
+ "step": 12186
+ },
+ {
+ "epoch": 33.20708446866485,
+ "grad_norm": 6.004835605621338,
+ "learning_rate": 1.5584057524352047e-05,
+ "loss": 0.2728,
+ "step": 12187
+ },
+ {
+ "epoch": 33.20980926430518,
+ "grad_norm": 6.681808948516846,
+ "learning_rate": 1.5583325413325944e-05,
+ "loss": 0.4458,
+ "step": 12188
+ },
+ {
+ "epoch": 33.212534059945504,
+ "grad_norm": 7.355443000793457,
+ "learning_rate": 1.558259325881708e-05,
+ "loss": 0.6285,
+ "step": 12189
+ },
+ {
+ "epoch": 33.21525885558583,
+ "grad_norm": 6.397506237030029,
+ "learning_rate": 1.558186106083116e-05,
+ "loss": 0.4643,
+ "step": 12190
+ },
+ {
+ "epoch": 33.217983651226156,
+ "grad_norm": 7.421044826507568,
+ "learning_rate": 1.5581128819373885e-05,
+ "loss": 0.3742,
+ "step": 12191
+ },
+ {
+ "epoch": 33.22070844686648,
+ "grad_norm": 7.265703201293945,
+ "learning_rate": 1.558039653445096e-05,
+ "loss": 0.3751,
+ "step": 12192
+ },
+ {
+ "epoch": 33.223433242506815,
+ "grad_norm": 7.574958801269531,
+ "learning_rate": 1.5579664206068087e-05,
+ "loss": 0.2934,
+ "step": 12193
+ },
+ {
+ "epoch": 33.22615803814714,
+ "grad_norm": 12.124749183654785,
+ "learning_rate": 1.5578931834230968e-05,
+ "loss": 0.3745,
+ "step": 12194
+ },
+ {
+ "epoch": 33.228882833787466,
+ "grad_norm": 8.5874605178833,
+ "learning_rate": 1.5578199418945304e-05,
+ "loss": 0.4017,
+ "step": 12195
+ },
+ {
+ "epoch": 33.23160762942779,
+ "grad_norm": 5.97220516204834,
+ "learning_rate": 1.5577466960216805e-05,
+ "loss": 0.2773,
+ "step": 12196
+ },
+ {
+ "epoch": 33.23433242506812,
+ "grad_norm": 7.527440547943115,
+ "learning_rate": 1.557673445805117e-05,
+ "loss": 0.3442,
+ "step": 12197
+ },
+ {
+ "epoch": 33.237057220708444,
+ "grad_norm": 10.769542694091797,
+ "learning_rate": 1.5576001912454114e-05,
+ "loss": 0.3999,
+ "step": 12198
+ },
+ {
+ "epoch": 33.23978201634878,
+ "grad_norm": 5.666802406311035,
+ "learning_rate": 1.5575269323431327e-05,
+ "loss": 0.3604,
+ "step": 12199
+ },
+ {
+ "epoch": 33.2425068119891,
+ "grad_norm": 7.8562092781066895,
+ "learning_rate": 1.5574536690988526e-05,
+ "loss": 0.3625,
+ "step": 12200
+ },
+ {
+ "epoch": 33.24523160762943,
+ "grad_norm": 7.768949508666992,
+ "learning_rate": 1.5573804015131414e-05,
+ "loss": 0.3944,
+ "step": 12201
+ },
+ {
+ "epoch": 33.247956403269754,
+ "grad_norm": 6.802807807922363,
+ "learning_rate": 1.5573071295865694e-05,
+ "loss": 0.2741,
+ "step": 12202
+ },
+ {
+ "epoch": 33.25068119891008,
+ "grad_norm": 7.93035364151001,
+ "learning_rate": 1.557233853319707e-05,
+ "loss": 0.3,
+ "step": 12203
+ },
+ {
+ "epoch": 33.253405994550405,
+ "grad_norm": 7.202589511871338,
+ "learning_rate": 1.5571605727131255e-05,
+ "loss": 0.3619,
+ "step": 12204
+ },
+ {
+ "epoch": 33.25613079019074,
+ "grad_norm": 9.372316360473633,
+ "learning_rate": 1.5570872877673958e-05,
+ "loss": 0.3482,
+ "step": 12205
+ },
+ {
+ "epoch": 33.258855585831064,
+ "grad_norm": 7.737120628356934,
+ "learning_rate": 1.5570139984830878e-05,
+ "loss": 0.2645,
+ "step": 12206
+ },
+ {
+ "epoch": 33.26158038147139,
+ "grad_norm": 10.476534843444824,
+ "learning_rate": 1.556940704860773e-05,
+ "loss": 0.4134,
+ "step": 12207
+ },
+ {
+ "epoch": 33.264305177111716,
+ "grad_norm": 10.893311500549316,
+ "learning_rate": 1.5568674069010218e-05,
+ "loss": 0.4485,
+ "step": 12208
+ },
+ {
+ "epoch": 33.26702997275204,
+ "grad_norm": 7.452104568481445,
+ "learning_rate": 1.5567941046044053e-05,
+ "loss": 0.4108,
+ "step": 12209
+ },
+ {
+ "epoch": 33.26975476839237,
+ "grad_norm": 6.8772382736206055,
+ "learning_rate": 1.556720797971494e-05,
+ "loss": 0.2637,
+ "step": 12210
+ },
+ {
+ "epoch": 33.2724795640327,
+ "grad_norm": 7.585111618041992,
+ "learning_rate": 1.556647487002859e-05,
+ "loss": 0.3127,
+ "step": 12211
+ },
+ {
+ "epoch": 33.275204359673026,
+ "grad_norm": 11.086917877197266,
+ "learning_rate": 1.5565741716990714e-05,
+ "loss": 0.5108,
+ "step": 12212
+ },
+ {
+ "epoch": 33.27792915531335,
+ "grad_norm": 8.147093772888184,
+ "learning_rate": 1.556500852060702e-05,
+ "loss": 0.3434,
+ "step": 12213
+ },
+ {
+ "epoch": 33.28065395095368,
+ "grad_norm": 7.377264022827148,
+ "learning_rate": 1.556427528088322e-05,
+ "loss": 0.4055,
+ "step": 12214
+ },
+ {
+ "epoch": 33.283378746594,
+ "grad_norm": 6.8624725341796875,
+ "learning_rate": 1.5563541997825025e-05,
+ "loss": 0.5069,
+ "step": 12215
+ },
+ {
+ "epoch": 33.28610354223433,
+ "grad_norm": 9.36638069152832,
+ "learning_rate": 1.556280867143814e-05,
+ "loss": 0.425,
+ "step": 12216
+ },
+ {
+ "epoch": 33.28882833787466,
+ "grad_norm": 5.822850227355957,
+ "learning_rate": 1.556207530172828e-05,
+ "loss": 0.3252,
+ "step": 12217
+ },
+ {
+ "epoch": 33.29155313351499,
+ "grad_norm": 6.872265338897705,
+ "learning_rate": 1.556134188870116e-05,
+ "loss": 0.2645,
+ "step": 12218
+ },
+ {
+ "epoch": 33.294277929155314,
+ "grad_norm": 6.900471210479736,
+ "learning_rate": 1.5560608432362486e-05,
+ "loss": 0.2932,
+ "step": 12219
+ },
+ {
+ "epoch": 33.29700272479564,
+ "grad_norm": 7.023861408233643,
+ "learning_rate": 1.5559874932717972e-05,
+ "loss": 0.5451,
+ "step": 12220
+ },
+ {
+ "epoch": 33.299727520435965,
+ "grad_norm": 8.168889999389648,
+ "learning_rate": 1.5559141389773334e-05,
+ "loss": 0.2791,
+ "step": 12221
+ },
+ {
+ "epoch": 33.30245231607629,
+ "grad_norm": 8.27985954284668,
+ "learning_rate": 1.555840780353428e-05,
+ "loss": 0.3385,
+ "step": 12222
+ },
+ {
+ "epoch": 33.305177111716624,
+ "grad_norm": 6.772516250610352,
+ "learning_rate": 1.5557674174006525e-05,
+ "loss": 0.2226,
+ "step": 12223
+ },
+ {
+ "epoch": 33.30790190735695,
+ "grad_norm": 9.39065933227539,
+ "learning_rate": 1.5556940501195784e-05,
+ "loss": 0.2984,
+ "step": 12224
+ },
+ {
+ "epoch": 33.310626702997276,
+ "grad_norm": 7.225677013397217,
+ "learning_rate": 1.5556206785107766e-05,
+ "loss": 0.3233,
+ "step": 12225
+ },
+ {
+ "epoch": 33.3133514986376,
+ "grad_norm": 6.888895034790039,
+ "learning_rate": 1.555547302574819e-05,
+ "loss": 0.3261,
+ "step": 12226
+ },
+ {
+ "epoch": 33.31607629427793,
+ "grad_norm": 6.585740089416504,
+ "learning_rate": 1.5554739223122768e-05,
+ "loss": 0.3632,
+ "step": 12227
+ },
+ {
+ "epoch": 33.31880108991825,
+ "grad_norm": 6.724668979644775,
+ "learning_rate": 1.5554005377237217e-05,
+ "loss": 0.3252,
+ "step": 12228
+ },
+ {
+ "epoch": 33.321525885558586,
+ "grad_norm": 7.033156394958496,
+ "learning_rate": 1.5553271488097247e-05,
+ "loss": 0.3376,
+ "step": 12229
+ },
+ {
+ "epoch": 33.32425068119891,
+ "grad_norm": 6.2989959716796875,
+ "learning_rate": 1.5552537555708584e-05,
+ "loss": 0.4559,
+ "step": 12230
+ },
+ {
+ "epoch": 33.32697547683924,
+ "grad_norm": 7.348972320556641,
+ "learning_rate": 1.5551803580076935e-05,
+ "loss": 0.2397,
+ "step": 12231
+ },
+ {
+ "epoch": 33.32970027247956,
+ "grad_norm": 6.269176483154297,
+ "learning_rate": 1.5551069561208018e-05,
+ "loss": 0.2628,
+ "step": 12232
+ },
+ {
+ "epoch": 33.33242506811989,
+ "grad_norm": 7.6189093589782715,
+ "learning_rate": 1.555033549910755e-05,
+ "loss": 0.3294,
+ "step": 12233
+ },
+ {
+ "epoch": 33.335149863760215,
+ "grad_norm": 8.982177734375,
+ "learning_rate": 1.5549601393781244e-05,
+ "loss": 0.504,
+ "step": 12234
+ },
+ {
+ "epoch": 33.33787465940055,
+ "grad_norm": 7.15234899520874,
+ "learning_rate": 1.5548867245234825e-05,
+ "loss": 0.4194,
+ "step": 12235
+ },
+ {
+ "epoch": 33.34059945504087,
+ "grad_norm": 5.938183307647705,
+ "learning_rate": 1.5548133053474004e-05,
+ "loss": 0.264,
+ "step": 12236
+ },
+ {
+ "epoch": 33.3433242506812,
+ "grad_norm": 7.6514482498168945,
+ "learning_rate": 1.5547398818504502e-05,
+ "loss": 0.4264,
+ "step": 12237
+ },
+ {
+ "epoch": 33.346049046321525,
+ "grad_norm": 6.497241020202637,
+ "learning_rate": 1.5546664540332037e-05,
+ "loss": 0.2015,
+ "step": 12238
+ },
+ {
+ "epoch": 33.34877384196185,
+ "grad_norm": 6.456487655639648,
+ "learning_rate": 1.554593021896233e-05,
+ "loss": 0.257,
+ "step": 12239
+ },
+ {
+ "epoch": 33.35149863760218,
+ "grad_norm": 7.130777359008789,
+ "learning_rate": 1.5545195854401095e-05,
+ "loss": 0.3681,
+ "step": 12240
+ },
+ {
+ "epoch": 33.35422343324251,
+ "grad_norm": 6.268331050872803,
+ "learning_rate": 1.5544461446654053e-05,
+ "loss": 0.2092,
+ "step": 12241
+ },
+ {
+ "epoch": 33.356948228882835,
+ "grad_norm": 7.931918144226074,
+ "learning_rate": 1.554372699572692e-05,
+ "loss": 0.3724,
+ "step": 12242
+ },
+ {
+ "epoch": 33.35967302452316,
+ "grad_norm": 6.673097610473633,
+ "learning_rate": 1.5542992501625425e-05,
+ "loss": 0.3635,
+ "step": 12243
+ },
+ {
+ "epoch": 33.36239782016349,
+ "grad_norm": 7.56607723236084,
+ "learning_rate": 1.5542257964355282e-05,
+ "loss": 0.3472,
+ "step": 12244
+ },
+ {
+ "epoch": 33.36512261580381,
+ "grad_norm": 5.374823093414307,
+ "learning_rate": 1.5541523383922206e-05,
+ "loss": 0.3676,
+ "step": 12245
+ },
+ {
+ "epoch": 33.36784741144414,
+ "grad_norm": 7.16453218460083,
+ "learning_rate": 1.554078876033193e-05,
+ "loss": 0.416,
+ "step": 12246
+ },
+ {
+ "epoch": 33.37057220708447,
+ "grad_norm": 6.608232498168945,
+ "learning_rate": 1.5540054093590173e-05,
+ "loss": 0.4185,
+ "step": 12247
+ },
+ {
+ "epoch": 33.3732970027248,
+ "grad_norm": 6.824566841125488,
+ "learning_rate": 1.5539319383702646e-05,
+ "loss": 0.3732,
+ "step": 12248
+ },
+ {
+ "epoch": 33.37602179836512,
+ "grad_norm": 6.502536296844482,
+ "learning_rate": 1.553858463067508e-05,
+ "loss": 0.3053,
+ "step": 12249
+ },
+ {
+ "epoch": 33.37874659400545,
+ "grad_norm": 6.010274887084961,
+ "learning_rate": 1.5537849834513197e-05,
+ "loss": 0.2581,
+ "step": 12250
+ },
+ {
+ "epoch": 33.381471389645775,
+ "grad_norm": 7.1450371742248535,
+ "learning_rate": 1.5537114995222716e-05,
+ "loss": 0.4281,
+ "step": 12251
+ },
+ {
+ "epoch": 33.3841961852861,
+ "grad_norm": 6.057378768920898,
+ "learning_rate": 1.553638011280936e-05,
+ "loss": 0.4492,
+ "step": 12252
+ },
+ {
+ "epoch": 33.38692098092643,
+ "grad_norm": 5.5235772132873535,
+ "learning_rate": 1.553564518727886e-05,
+ "loss": 0.4549,
+ "step": 12253
+ },
+ {
+ "epoch": 33.38964577656676,
+ "grad_norm": 5.668849468231201,
+ "learning_rate": 1.553491021863693e-05,
+ "loss": 0.2589,
+ "step": 12254
+ },
+ {
+ "epoch": 33.392370572207085,
+ "grad_norm": 6.622274875640869,
+ "learning_rate": 1.553417520688929e-05,
+ "loss": 0.297,
+ "step": 12255
+ },
+ {
+ "epoch": 33.39509536784741,
+ "grad_norm": 6.553107738494873,
+ "learning_rate": 1.553344015204168e-05,
+ "loss": 0.3379,
+ "step": 12256
+ },
+ {
+ "epoch": 33.39782016348774,
+ "grad_norm": 7.671754360198975,
+ "learning_rate": 1.5532705054099816e-05,
+ "loss": 0.4111,
+ "step": 12257
+ },
+ {
+ "epoch": 33.40054495912806,
+ "grad_norm": 5.965877056121826,
+ "learning_rate": 1.5531969913069423e-05,
+ "loss": 0.3313,
+ "step": 12258
+ },
+ {
+ "epoch": 33.403269754768395,
+ "grad_norm": 10.241011619567871,
+ "learning_rate": 1.5531234728956227e-05,
+ "loss": 0.4214,
+ "step": 12259
+ },
+ {
+ "epoch": 33.40599455040872,
+ "grad_norm": 9.025012969970703,
+ "learning_rate": 1.553049950176595e-05,
+ "loss": 0.4389,
+ "step": 12260
+ },
+ {
+ "epoch": 33.40871934604905,
+ "grad_norm": 6.43281888961792,
+ "learning_rate": 1.552976423150432e-05,
+ "loss": 0.3975,
+ "step": 12261
+ },
+ {
+ "epoch": 33.41144414168937,
+ "grad_norm": 8.139632225036621,
+ "learning_rate": 1.5529028918177067e-05,
+ "loss": 0.5136,
+ "step": 12262
+ },
+ {
+ "epoch": 33.4141689373297,
+ "grad_norm": 7.0361833572387695,
+ "learning_rate": 1.5528293561789912e-05,
+ "loss": 0.4117,
+ "step": 12263
+ },
+ {
+ "epoch": 33.416893732970024,
+ "grad_norm": 7.069800853729248,
+ "learning_rate": 1.5527558162348588e-05,
+ "loss": 0.4446,
+ "step": 12264
+ },
+ {
+ "epoch": 33.41961852861036,
+ "grad_norm": 6.559822082519531,
+ "learning_rate": 1.5526822719858816e-05,
+ "loss": 0.3782,
+ "step": 12265
+ },
+ {
+ "epoch": 33.42234332425068,
+ "grad_norm": 7.176815032958984,
+ "learning_rate": 1.5526087234326327e-05,
+ "loss": 0.3492,
+ "step": 12266
+ },
+ {
+ "epoch": 33.42506811989101,
+ "grad_norm": 6.263866901397705,
+ "learning_rate": 1.5525351705756852e-05,
+ "loss": 0.4857,
+ "step": 12267
+ },
+ {
+ "epoch": 33.427792915531334,
+ "grad_norm": 5.193022727966309,
+ "learning_rate": 1.552461613415611e-05,
+ "loss": 0.6106,
+ "step": 12268
+ },
+ {
+ "epoch": 33.43051771117166,
+ "grad_norm": 6.027821063995361,
+ "learning_rate": 1.5523880519529838e-05,
+ "loss": 0.5298,
+ "step": 12269
+ },
+ {
+ "epoch": 33.433242506811986,
+ "grad_norm": 7.548738956451416,
+ "learning_rate": 1.5523144861883767e-05,
+ "loss": 0.4398,
+ "step": 12270
+ },
+ {
+ "epoch": 33.43596730245232,
+ "grad_norm": 9.499189376831055,
+ "learning_rate": 1.5522409161223614e-05,
+ "loss": 0.4428,
+ "step": 12271
+ },
+ {
+ "epoch": 33.438692098092645,
+ "grad_norm": 7.346479892730713,
+ "learning_rate": 1.5521673417555117e-05,
+ "loss": 0.3069,
+ "step": 12272
+ },
+ {
+ "epoch": 33.44141689373297,
+ "grad_norm": 7.802134037017822,
+ "learning_rate": 1.552093763088401e-05,
+ "loss": 0.3533,
+ "step": 12273
+ },
+ {
+ "epoch": 33.444141689373296,
+ "grad_norm": 6.074779033660889,
+ "learning_rate": 1.5520201801216017e-05,
+ "loss": 0.3179,
+ "step": 12274
+ },
+ {
+ "epoch": 33.44686648501362,
+ "grad_norm": 6.945800304412842,
+ "learning_rate": 1.551946592855687e-05,
+ "loss": 0.4674,
+ "step": 12275
+ },
+ {
+ "epoch": 33.44959128065395,
+ "grad_norm": 5.797735214233398,
+ "learning_rate": 1.55187300129123e-05,
+ "loss": 0.5052,
+ "step": 12276
+ },
+ {
+ "epoch": 33.45231607629428,
+ "grad_norm": 10.462039947509766,
+ "learning_rate": 1.5517994054288035e-05,
+ "loss": 0.3609,
+ "step": 12277
+ },
+ {
+ "epoch": 33.45504087193461,
+ "grad_norm": 6.354482650756836,
+ "learning_rate": 1.5517258052689813e-05,
+ "loss": 0.2659,
+ "step": 12278
+ },
+ {
+ "epoch": 33.45776566757493,
+ "grad_norm": 6.137086868286133,
+ "learning_rate": 1.5516522008123364e-05,
+ "loss": 0.29,
+ "step": 12279
+ },
+ {
+ "epoch": 33.46049046321526,
+ "grad_norm": 6.347009181976318,
+ "learning_rate": 1.551578592059442e-05,
+ "loss": 0.307,
+ "step": 12280
+ },
+ {
+ "epoch": 33.463215258855584,
+ "grad_norm": 19.688533782958984,
+ "learning_rate": 1.5515049790108705e-05,
+ "loss": 0.3366,
+ "step": 12281
+ },
+ {
+ "epoch": 33.46594005449591,
+ "grad_norm": 7.231790065765381,
+ "learning_rate": 1.5514313616671967e-05,
+ "loss": 0.4257,
+ "step": 12282
+ },
+ {
+ "epoch": 33.46866485013624,
+ "grad_norm": 6.826254367828369,
+ "learning_rate": 1.5513577400289926e-05,
+ "loss": 0.3163,
+ "step": 12283
+ },
+ {
+ "epoch": 33.47138964577657,
+ "grad_norm": 6.485746383666992,
+ "learning_rate": 1.551284114096833e-05,
+ "loss": 0.2806,
+ "step": 12284
+ },
+ {
+ "epoch": 33.474114441416894,
+ "grad_norm": 5.880269527435303,
+ "learning_rate": 1.55121048387129e-05,
+ "loss": 0.6014,
+ "step": 12285
+ },
+ {
+ "epoch": 33.47683923705722,
+ "grad_norm": 5.744699954986572,
+ "learning_rate": 1.5511368493529375e-05,
+ "loss": 0.3055,
+ "step": 12286
+ },
+ {
+ "epoch": 33.479564032697546,
+ "grad_norm": 6.363956451416016,
+ "learning_rate": 1.551063210542349e-05,
+ "loss": 0.3838,
+ "step": 12287
+ },
+ {
+ "epoch": 33.48228882833787,
+ "grad_norm": 6.764632701873779,
+ "learning_rate": 1.5509895674400977e-05,
+ "loss": 0.3948,
+ "step": 12288
+ },
+ {
+ "epoch": 33.485013623978205,
+ "grad_norm": 9.482726097106934,
+ "learning_rate": 1.5509159200467577e-05,
+ "loss": 0.3629,
+ "step": 12289
+ },
+ {
+ "epoch": 33.48773841961853,
+ "grad_norm": 9.39960765838623,
+ "learning_rate": 1.5508422683629022e-05,
+ "loss": 0.3287,
+ "step": 12290
+ },
+ {
+ "epoch": 33.490463215258856,
+ "grad_norm": 9.882277488708496,
+ "learning_rate": 1.5507686123891046e-05,
+ "loss": 0.3516,
+ "step": 12291
+ },
+ {
+ "epoch": 33.49318801089918,
+ "grad_norm": 6.911797046661377,
+ "learning_rate": 1.5506949521259393e-05,
+ "loss": 0.352,
+ "step": 12292
+ },
+ {
+ "epoch": 33.49591280653951,
+ "grad_norm": 9.063674926757812,
+ "learning_rate": 1.550621287573979e-05,
+ "loss": 0.5132,
+ "step": 12293
+ },
+ {
+ "epoch": 33.49863760217983,
+ "grad_norm": 8.968364715576172,
+ "learning_rate": 1.550547618733798e-05,
+ "loss": 0.5012,
+ "step": 12294
+ },
+ {
+ "epoch": 33.50136239782017,
+ "grad_norm": 5.682219505310059,
+ "learning_rate": 1.5504739456059694e-05,
+ "loss": 0.4999,
+ "step": 12295
+ },
+ {
+ "epoch": 33.50408719346049,
+ "grad_norm": 6.653972625732422,
+ "learning_rate": 1.550400268191068e-05,
+ "loss": 0.2708,
+ "step": 12296
+ },
+ {
+ "epoch": 33.50681198910082,
+ "grad_norm": 7.9966888427734375,
+ "learning_rate": 1.5503265864896668e-05,
+ "loss": 0.33,
+ "step": 12297
+ },
+ {
+ "epoch": 33.509536784741144,
+ "grad_norm": 6.977714538574219,
+ "learning_rate": 1.55025290050234e-05,
+ "loss": 0.3494,
+ "step": 12298
+ },
+ {
+ "epoch": 33.51226158038147,
+ "grad_norm": 6.731818199157715,
+ "learning_rate": 1.550179210229661e-05,
+ "loss": 0.4812,
+ "step": 12299
+ },
+ {
+ "epoch": 33.514986376021795,
+ "grad_norm": 7.986743927001953,
+ "learning_rate": 1.5501055156722044e-05,
+ "loss": 0.4796,
+ "step": 12300
+ },
+ {
+ "epoch": 33.51771117166213,
+ "grad_norm": 29.076562881469727,
+ "learning_rate": 1.5500318168305434e-05,
+ "loss": 0.4885,
+ "step": 12301
+ },
+ {
+ "epoch": 33.520435967302454,
+ "grad_norm": 12.162221908569336,
+ "learning_rate": 1.5499581137052527e-05,
+ "loss": 0.4968,
+ "step": 12302
+ },
+ {
+ "epoch": 33.52316076294278,
+ "grad_norm": 5.864055156707764,
+ "learning_rate": 1.5498844062969055e-05,
+ "loss": 0.2878,
+ "step": 12303
+ },
+ {
+ "epoch": 33.525885558583106,
+ "grad_norm": 7.06923770904541,
+ "learning_rate": 1.5498106946060768e-05,
+ "loss": 0.4002,
+ "step": 12304
+ },
+ {
+ "epoch": 33.52861035422343,
+ "grad_norm": 8.66711711883545,
+ "learning_rate": 1.5497369786333398e-05,
+ "loss": 0.3882,
+ "step": 12305
+ },
+ {
+ "epoch": 33.53133514986376,
+ "grad_norm": 7.390394687652588,
+ "learning_rate": 1.5496632583792686e-05,
+ "loss": 0.416,
+ "step": 12306
+ },
+ {
+ "epoch": 33.53405994550409,
+ "grad_norm": 10.1567964553833,
+ "learning_rate": 1.549589533844438e-05,
+ "loss": 0.3127,
+ "step": 12307
+ },
+ {
+ "epoch": 33.536784741144416,
+ "grad_norm": 7.279140472412109,
+ "learning_rate": 1.5495158050294216e-05,
+ "loss": 0.4403,
+ "step": 12308
+ },
+ {
+ "epoch": 33.53950953678474,
+ "grad_norm": 7.6444902420043945,
+ "learning_rate": 1.549442071934794e-05,
+ "loss": 0.2965,
+ "step": 12309
+ },
+ {
+ "epoch": 33.54223433242507,
+ "grad_norm": 7.107326984405518,
+ "learning_rate": 1.549368334561129e-05,
+ "loss": 0.3421,
+ "step": 12310
+ },
+ {
+ "epoch": 33.54495912806539,
+ "grad_norm": 6.362401485443115,
+ "learning_rate": 1.5492945929090015e-05,
+ "loss": 0.3637,
+ "step": 12311
+ },
+ {
+ "epoch": 33.54768392370572,
+ "grad_norm": 7.301507472991943,
+ "learning_rate": 1.549220846978985e-05,
+ "loss": 0.368,
+ "step": 12312
+ },
+ {
+ "epoch": 33.55040871934605,
+ "grad_norm": 7.936252117156982,
+ "learning_rate": 1.549147096771654e-05,
+ "loss": 0.3716,
+ "step": 12313
+ },
+ {
+ "epoch": 33.55313351498638,
+ "grad_norm": 6.499980449676514,
+ "learning_rate": 1.5490733422875836e-05,
+ "loss": 0.5402,
+ "step": 12314
+ },
+ {
+ "epoch": 33.555858310626704,
+ "grad_norm": 7.899421215057373,
+ "learning_rate": 1.5489995835273476e-05,
+ "loss": 0.3173,
+ "step": 12315
+ },
+ {
+ "epoch": 33.55858310626703,
+ "grad_norm": 9.74738883972168,
+ "learning_rate": 1.5489258204915203e-05,
+ "loss": 0.5145,
+ "step": 12316
+ },
+ {
+ "epoch": 33.561307901907355,
+ "grad_norm": 8.830711364746094,
+ "learning_rate": 1.5488520531806767e-05,
+ "loss": 0.2935,
+ "step": 12317
+ },
+ {
+ "epoch": 33.56403269754768,
+ "grad_norm": 5.760073661804199,
+ "learning_rate": 1.5487782815953908e-05,
+ "loss": 0.3943,
+ "step": 12318
+ },
+ {
+ "epoch": 33.566757493188014,
+ "grad_norm": 7.559969902038574,
+ "learning_rate": 1.548704505736237e-05,
+ "loss": 0.3832,
+ "step": 12319
+ },
+ {
+ "epoch": 33.56948228882834,
+ "grad_norm": 7.594951629638672,
+ "learning_rate": 1.5486307256037908e-05,
+ "loss": 0.4699,
+ "step": 12320
+ },
+ {
+ "epoch": 33.572207084468666,
+ "grad_norm": 6.055371284484863,
+ "learning_rate": 1.5485569411986253e-05,
+ "loss": 0.3524,
+ "step": 12321
+ },
+ {
+ "epoch": 33.57493188010899,
+ "grad_norm": 7.1531596183776855,
+ "learning_rate": 1.5484831525213166e-05,
+ "loss": 0.5202,
+ "step": 12322
+ },
+ {
+ "epoch": 33.57765667574932,
+ "grad_norm": 6.895809650421143,
+ "learning_rate": 1.5484093595724388e-05,
+ "loss": 0.3055,
+ "step": 12323
+ },
+ {
+ "epoch": 33.58038147138964,
+ "grad_norm": 6.4066057205200195,
+ "learning_rate": 1.548335562352566e-05,
+ "loss": 0.2988,
+ "step": 12324
+ },
+ {
+ "epoch": 33.583106267029976,
+ "grad_norm": 9.409860610961914,
+ "learning_rate": 1.5482617608622744e-05,
+ "loss": 0.3773,
+ "step": 12325
+ },
+ {
+ "epoch": 33.5858310626703,
+ "grad_norm": 7.044551849365234,
+ "learning_rate": 1.548187955102137e-05,
+ "loss": 0.3474,
+ "step": 12326
+ },
+ {
+ "epoch": 33.58855585831063,
+ "grad_norm": 6.563586235046387,
+ "learning_rate": 1.54811414507273e-05,
+ "loss": 0.2838,
+ "step": 12327
+ },
+ {
+ "epoch": 33.59128065395095,
+ "grad_norm": 6.07274055480957,
+ "learning_rate": 1.5480403307746274e-05,
+ "loss": 0.3144,
+ "step": 12328
+ },
+ {
+ "epoch": 33.59400544959128,
+ "grad_norm": 6.972324371337891,
+ "learning_rate": 1.5479665122084046e-05,
+ "loss": 0.4146,
+ "step": 12329
+ },
+ {
+ "epoch": 33.596730245231605,
+ "grad_norm": 7.334195613861084,
+ "learning_rate": 1.547892689374636e-05,
+ "loss": 0.368,
+ "step": 12330
+ },
+ {
+ "epoch": 33.59945504087194,
+ "grad_norm": 6.988025188446045,
+ "learning_rate": 1.547818862273897e-05,
+ "loss": 0.2876,
+ "step": 12331
+ },
+ {
+ "epoch": 33.60217983651226,
+ "grad_norm": 5.555150985717773,
+ "learning_rate": 1.547745030906762e-05,
+ "loss": 0.3261,
+ "step": 12332
+ },
+ {
+ "epoch": 33.60490463215259,
+ "grad_norm": 7.14247989654541,
+ "learning_rate": 1.5476711952738065e-05,
+ "loss": 0.4326,
+ "step": 12333
+ },
+ {
+ "epoch": 33.607629427792915,
+ "grad_norm": 6.2259626388549805,
+ "learning_rate": 1.547597355375605e-05,
+ "loss": 0.3841,
+ "step": 12334
+ },
+ {
+ "epoch": 33.61035422343324,
+ "grad_norm": 6.5841288566589355,
+ "learning_rate": 1.5475235112127334e-05,
+ "loss": 0.3844,
+ "step": 12335
+ },
+ {
+ "epoch": 33.61307901907357,
+ "grad_norm": 7.561180114746094,
+ "learning_rate": 1.547449662785766e-05,
+ "loss": 0.3694,
+ "step": 12336
+ },
+ {
+ "epoch": 33.6158038147139,
+ "grad_norm": 10.145565032958984,
+ "learning_rate": 1.5473758100952788e-05,
+ "loss": 0.2518,
+ "step": 12337
+ },
+ {
+ "epoch": 33.618528610354225,
+ "grad_norm": 7.336001873016357,
+ "learning_rate": 1.547301953141846e-05,
+ "loss": 0.3024,
+ "step": 12338
+ },
+ {
+ "epoch": 33.62125340599455,
+ "grad_norm": 6.709211826324463,
+ "learning_rate": 1.5472280919260436e-05,
+ "loss": 0.305,
+ "step": 12339
+ },
+ {
+ "epoch": 33.62397820163488,
+ "grad_norm": 7.38783073425293,
+ "learning_rate": 1.547154226448446e-05,
+ "loss": 0.4097,
+ "step": 12340
+ },
+ {
+ "epoch": 33.6267029972752,
+ "grad_norm": 7.559239387512207,
+ "learning_rate": 1.5470803567096286e-05,
+ "loss": 0.2374,
+ "step": 12341
+ },
+ {
+ "epoch": 33.62942779291553,
+ "grad_norm": 11.160633087158203,
+ "learning_rate": 1.5470064827101677e-05,
+ "loss": 0.4155,
+ "step": 12342
+ },
+ {
+ "epoch": 33.63215258855586,
+ "grad_norm": 8.600433349609375,
+ "learning_rate": 1.5469326044506373e-05,
+ "loss": 0.4086,
+ "step": 12343
+ },
+ {
+ "epoch": 33.63487738419619,
+ "grad_norm": 8.076839447021484,
+ "learning_rate": 1.5468587219316136e-05,
+ "loss": 0.5254,
+ "step": 12344
+ },
+ {
+ "epoch": 33.63760217983651,
+ "grad_norm": 6.322586536407471,
+ "learning_rate": 1.5467848351536717e-05,
+ "loss": 0.487,
+ "step": 12345
+ },
+ {
+ "epoch": 33.64032697547684,
+ "grad_norm": 7.030972480773926,
+ "learning_rate": 1.5467109441173876e-05,
+ "loss": 0.3795,
+ "step": 12346
+ },
+ {
+ "epoch": 33.643051771117165,
+ "grad_norm": 6.812682628631592,
+ "learning_rate": 1.5466370488233358e-05,
+ "loss": 0.4005,
+ "step": 12347
+ },
+ {
+ "epoch": 33.64577656675749,
+ "grad_norm": 7.285449028015137,
+ "learning_rate": 1.5465631492720923e-05,
+ "loss": 0.3118,
+ "step": 12348
+ },
+ {
+ "epoch": 33.64850136239782,
+ "grad_norm": 7.952854633331299,
+ "learning_rate": 1.546489245464233e-05,
+ "loss": 0.3741,
+ "step": 12349
+ },
+ {
+ "epoch": 33.65122615803815,
+ "grad_norm": 7.379002094268799,
+ "learning_rate": 1.5464153374003323e-05,
+ "loss": 0.5068,
+ "step": 12350
+ },
+ {
+ "epoch": 33.653950953678475,
+ "grad_norm": 7.423781394958496,
+ "learning_rate": 1.546341425080967e-05,
+ "loss": 0.4805,
+ "step": 12351
+ },
+ {
+ "epoch": 33.6566757493188,
+ "grad_norm": 10.176163673400879,
+ "learning_rate": 1.546267508506712e-05,
+ "loss": 0.3536,
+ "step": 12352
+ },
+ {
+ "epoch": 33.65940054495913,
+ "grad_norm": 7.722346782684326,
+ "learning_rate": 1.5461935876781436e-05,
+ "loss": 0.4416,
+ "step": 12353
+ },
+ {
+ "epoch": 33.66212534059945,
+ "grad_norm": 8.772095680236816,
+ "learning_rate": 1.546119662595837e-05,
+ "loss": 0.3454,
+ "step": 12354
+ },
+ {
+ "epoch": 33.664850136239785,
+ "grad_norm": 9.018723487854004,
+ "learning_rate": 1.546045733260368e-05,
+ "loss": 0.3676,
+ "step": 12355
+ },
+ {
+ "epoch": 33.66757493188011,
+ "grad_norm": 8.277616500854492,
+ "learning_rate": 1.5459717996723124e-05,
+ "loss": 0.3713,
+ "step": 12356
+ },
+ {
+ "epoch": 33.67029972752044,
+ "grad_norm": 7.505500793457031,
+ "learning_rate": 1.545897861832246e-05,
+ "loss": 0.372,
+ "step": 12357
+ },
+ {
+ "epoch": 33.67302452316076,
+ "grad_norm": 8.260039329528809,
+ "learning_rate": 1.5458239197407446e-05,
+ "loss": 0.3753,
+ "step": 12358
+ },
+ {
+ "epoch": 33.67574931880109,
+ "grad_norm": 5.778948783874512,
+ "learning_rate": 1.545749973398384e-05,
+ "loss": 0.3793,
+ "step": 12359
+ },
+ {
+ "epoch": 33.678474114441414,
+ "grad_norm": 7.623692512512207,
+ "learning_rate": 1.5456760228057405e-05,
+ "loss": 0.2953,
+ "step": 12360
+ },
+ {
+ "epoch": 33.68119891008175,
+ "grad_norm": 8.117790222167969,
+ "learning_rate": 1.545602067963389e-05,
+ "loss": 0.3764,
+ "step": 12361
+ },
+ {
+ "epoch": 33.68392370572207,
+ "grad_norm": 8.630905151367188,
+ "learning_rate": 1.5455281088719067e-05,
+ "loss": 0.306,
+ "step": 12362
+ },
+ {
+ "epoch": 33.6866485013624,
+ "grad_norm": 7.467883110046387,
+ "learning_rate": 1.5454541455318693e-05,
+ "loss": 0.3481,
+ "step": 12363
+ },
+ {
+ "epoch": 33.689373297002724,
+ "grad_norm": 7.620356559753418,
+ "learning_rate": 1.545380177943852e-05,
+ "loss": 0.4457,
+ "step": 12364
+ },
+ {
+ "epoch": 33.69209809264305,
+ "grad_norm": 8.849483489990234,
+ "learning_rate": 1.545306206108432e-05,
+ "loss": 0.3399,
+ "step": 12365
+ },
+ {
+ "epoch": 33.694822888283376,
+ "grad_norm": 7.455567836761475,
+ "learning_rate": 1.545232230026184e-05,
+ "loss": 0.3523,
+ "step": 12366
+ },
+ {
+ "epoch": 33.69754768392371,
+ "grad_norm": 7.081930637359619,
+ "learning_rate": 1.5451582496976856e-05,
+ "loss": 0.3188,
+ "step": 12367
+ },
+ {
+ "epoch": 33.700272479564035,
+ "grad_norm": 6.795620441436768,
+ "learning_rate": 1.5450842651235118e-05,
+ "loss": 0.3658,
+ "step": 12368
+ },
+ {
+ "epoch": 33.70299727520436,
+ "grad_norm": 7.435014724731445,
+ "learning_rate": 1.5450102763042395e-05,
+ "loss": 0.3736,
+ "step": 12369
+ },
+ {
+ "epoch": 33.705722070844686,
+ "grad_norm": 6.455586910247803,
+ "learning_rate": 1.5449362832404452e-05,
+ "loss": 0.3816,
+ "step": 12370
+ },
+ {
+ "epoch": 33.70844686648501,
+ "grad_norm": 7.806655406951904,
+ "learning_rate": 1.544862285932704e-05,
+ "loss": 0.2928,
+ "step": 12371
+ },
+ {
+ "epoch": 33.71117166212534,
+ "grad_norm": 6.863977432250977,
+ "learning_rate": 1.5447882843815932e-05,
+ "loss": 0.4536,
+ "step": 12372
+ },
+ {
+ "epoch": 33.71389645776567,
+ "grad_norm": 7.690101623535156,
+ "learning_rate": 1.544714278587689e-05,
+ "loss": 0.3547,
+ "step": 12373
+ },
+ {
+ "epoch": 33.716621253406,
+ "grad_norm": 9.301826477050781,
+ "learning_rate": 1.544640268551567e-05,
+ "loss": 0.3386,
+ "step": 12374
+ },
+ {
+ "epoch": 33.71934604904632,
+ "grad_norm": 7.949379920959473,
+ "learning_rate": 1.5445662542738044e-05,
+ "loss": 0.407,
+ "step": 12375
+ },
+ {
+ "epoch": 33.72207084468665,
+ "grad_norm": 7.628628253936768,
+ "learning_rate": 1.544492235754977e-05,
+ "loss": 0.2996,
+ "step": 12376
+ },
+ {
+ "epoch": 33.724795640326974,
+ "grad_norm": 5.911596298217773,
+ "learning_rate": 1.544418212995662e-05,
+ "loss": 0.3972,
+ "step": 12377
+ },
+ {
+ "epoch": 33.7275204359673,
+ "grad_norm": 6.364374160766602,
+ "learning_rate": 1.5443441859964353e-05,
+ "loss": 0.3899,
+ "step": 12378
+ },
+ {
+ "epoch": 33.73024523160763,
+ "grad_norm": 7.083815097808838,
+ "learning_rate": 1.5442701547578736e-05,
+ "loss": 0.2889,
+ "step": 12379
+ },
+ {
+ "epoch": 33.73297002724796,
+ "grad_norm": 7.262183666229248,
+ "learning_rate": 1.5441961192805538e-05,
+ "loss": 0.4041,
+ "step": 12380
+ },
+ {
+ "epoch": 33.735694822888284,
+ "grad_norm": 9.222476959228516,
+ "learning_rate": 1.5441220795650518e-05,
+ "loss": 0.2729,
+ "step": 12381
+ },
+ {
+ "epoch": 33.73841961852861,
+ "grad_norm": 5.661161422729492,
+ "learning_rate": 1.5440480356119445e-05,
+ "loss": 0.2729,
+ "step": 12382
+ },
+ {
+ "epoch": 33.741144414168936,
+ "grad_norm": 6.561127662658691,
+ "learning_rate": 1.5439739874218087e-05,
+ "loss": 0.5112,
+ "step": 12383
+ },
+ {
+ "epoch": 33.74386920980926,
+ "grad_norm": 19.514482498168945,
+ "learning_rate": 1.543899934995221e-05,
+ "loss": 0.4377,
+ "step": 12384
+ },
+ {
+ "epoch": 33.746594005449595,
+ "grad_norm": 7.370982646942139,
+ "learning_rate": 1.543825878332758e-05,
+ "loss": 0.4215,
+ "step": 12385
+ },
+ {
+ "epoch": 33.74931880108992,
+ "grad_norm": 6.5547285079956055,
+ "learning_rate": 1.5437518174349967e-05,
+ "loss": 0.3623,
+ "step": 12386
+ },
+ {
+ "epoch": 33.752043596730246,
+ "grad_norm": 6.507667064666748,
+ "learning_rate": 1.543677752302514e-05,
+ "loss": 0.3861,
+ "step": 12387
+ },
+ {
+ "epoch": 33.75476839237057,
+ "grad_norm": 7.1478986740112305,
+ "learning_rate": 1.543603682935886e-05,
+ "loss": 0.4197,
+ "step": 12388
+ },
+ {
+ "epoch": 33.7574931880109,
+ "grad_norm": 6.728658676147461,
+ "learning_rate": 1.5435296093356902e-05,
+ "loss": 0.3558,
+ "step": 12389
+ },
+ {
+ "epoch": 33.76021798365122,
+ "grad_norm": 7.442631244659424,
+ "learning_rate": 1.5434555315025034e-05,
+ "loss": 0.3505,
+ "step": 12390
+ },
+ {
+ "epoch": 33.762942779291556,
+ "grad_norm": 9.225476264953613,
+ "learning_rate": 1.543381449436902e-05,
+ "loss": 0.341,
+ "step": 12391
+ },
+ {
+ "epoch": 33.76566757493188,
+ "grad_norm": 12.1233491897583,
+ "learning_rate": 1.5433073631394638e-05,
+ "loss": 0.3384,
+ "step": 12392
+ },
+ {
+ "epoch": 33.76839237057221,
+ "grad_norm": 7.165793418884277,
+ "learning_rate": 1.5432332726107653e-05,
+ "loss": 0.3573,
+ "step": 12393
+ },
+ {
+ "epoch": 33.771117166212534,
+ "grad_norm": 7.290248870849609,
+ "learning_rate": 1.5431591778513835e-05,
+ "loss": 0.4198,
+ "step": 12394
+ },
+ {
+ "epoch": 33.77384196185286,
+ "grad_norm": 6.255857467651367,
+ "learning_rate": 1.5430850788618955e-05,
+ "loss": 0.4251,
+ "step": 12395
+ },
+ {
+ "epoch": 33.776566757493185,
+ "grad_norm": 9.753196716308594,
+ "learning_rate": 1.5430109756428785e-05,
+ "loss": 0.3881,
+ "step": 12396
+ },
+ {
+ "epoch": 33.77929155313352,
+ "grad_norm": 7.622660160064697,
+ "learning_rate": 1.542936868194909e-05,
+ "loss": 0.3523,
+ "step": 12397
+ },
+ {
+ "epoch": 33.782016348773844,
+ "grad_norm": 6.863631725311279,
+ "learning_rate": 1.5428627565185652e-05,
+ "loss": 0.3501,
+ "step": 12398
+ },
+ {
+ "epoch": 33.78474114441417,
+ "grad_norm": 7.674832820892334,
+ "learning_rate": 1.5427886406144235e-05,
+ "loss": 0.3888,
+ "step": 12399
+ },
+ {
+ "epoch": 33.787465940054496,
+ "grad_norm": 4.952965259552002,
+ "learning_rate": 1.5427145204830615e-05,
+ "loss": 0.3384,
+ "step": 12400
+ },
+ {
+ "epoch": 33.79019073569482,
+ "grad_norm": 6.492983818054199,
+ "learning_rate": 1.542640396125056e-05,
+ "loss": 0.3019,
+ "step": 12401
+ },
+ {
+ "epoch": 33.79291553133515,
+ "grad_norm": 6.460616111755371,
+ "learning_rate": 1.5425662675409845e-05,
+ "loss": 0.3652,
+ "step": 12402
+ },
+ {
+ "epoch": 33.79564032697548,
+ "grad_norm": 8.286467552185059,
+ "learning_rate": 1.5424921347314245e-05,
+ "loss": 0.403,
+ "step": 12403
+ },
+ {
+ "epoch": 33.798365122615806,
+ "grad_norm": 6.715384006500244,
+ "learning_rate": 1.5424179976969536e-05,
+ "loss": 0.408,
+ "step": 12404
+ },
+ {
+ "epoch": 33.80108991825613,
+ "grad_norm": 9.546368598937988,
+ "learning_rate": 1.5423438564381484e-05,
+ "loss": 0.3706,
+ "step": 12405
+ },
+ {
+ "epoch": 33.80381471389646,
+ "grad_norm": 6.578489780426025,
+ "learning_rate": 1.5422697109555867e-05,
+ "loss": 0.3626,
+ "step": 12406
+ },
+ {
+ "epoch": 33.80653950953678,
+ "grad_norm": 6.979336738586426,
+ "learning_rate": 1.542195561249846e-05,
+ "loss": 0.3411,
+ "step": 12407
+ },
+ {
+ "epoch": 33.80926430517711,
+ "grad_norm": 10.89571762084961,
+ "learning_rate": 1.5421214073215037e-05,
+ "loss": 0.4416,
+ "step": 12408
+ },
+ {
+ "epoch": 33.81198910081744,
+ "grad_norm": 5.769643783569336,
+ "learning_rate": 1.5420472491711373e-05,
+ "loss": 0.3075,
+ "step": 12409
+ },
+ {
+ "epoch": 33.81471389645777,
+ "grad_norm": 7.007720470428467,
+ "learning_rate": 1.5419730867993245e-05,
+ "loss": 0.6479,
+ "step": 12410
+ },
+ {
+ "epoch": 33.817438692098094,
+ "grad_norm": 6.751010894775391,
+ "learning_rate": 1.5418989202066427e-05,
+ "loss": 0.3234,
+ "step": 12411
+ },
+ {
+ "epoch": 33.82016348773842,
+ "grad_norm": 7.3624749183654785,
+ "learning_rate": 1.5418247493936695e-05,
+ "loss": 0.2687,
+ "step": 12412
+ },
+ {
+ "epoch": 33.822888283378745,
+ "grad_norm": 6.650275230407715,
+ "learning_rate": 1.5417505743609828e-05,
+ "loss": 0.2815,
+ "step": 12413
+ },
+ {
+ "epoch": 33.82561307901907,
+ "grad_norm": 6.142333030700684,
+ "learning_rate": 1.54167639510916e-05,
+ "loss": 0.4532,
+ "step": 12414
+ },
+ {
+ "epoch": 33.828337874659404,
+ "grad_norm": 11.933963775634766,
+ "learning_rate": 1.5416022116387785e-05,
+ "loss": 0.5086,
+ "step": 12415
+ },
+ {
+ "epoch": 33.83106267029973,
+ "grad_norm": 7.944046497344971,
+ "learning_rate": 1.541528023950417e-05,
+ "loss": 0.4072,
+ "step": 12416
+ },
+ {
+ "epoch": 33.833787465940055,
+ "grad_norm": 6.637248992919922,
+ "learning_rate": 1.5414538320446523e-05,
+ "loss": 0.2994,
+ "step": 12417
+ },
+ {
+ "epoch": 33.83651226158038,
+ "grad_norm": 7.869789123535156,
+ "learning_rate": 1.5413796359220622e-05,
+ "loss": 0.4477,
+ "step": 12418
+ },
+ {
+ "epoch": 33.83923705722071,
+ "grad_norm": 7.0807342529296875,
+ "learning_rate": 1.5413054355832257e-05,
+ "loss": 0.3052,
+ "step": 12419
+ },
+ {
+ "epoch": 33.84196185286103,
+ "grad_norm": 12.607836723327637,
+ "learning_rate": 1.541231231028719e-05,
+ "loss": 0.3612,
+ "step": 12420
+ },
+ {
+ "epoch": 33.844686648501366,
+ "grad_norm": 7.435271263122559,
+ "learning_rate": 1.5411570222591217e-05,
+ "loss": 0.3848,
+ "step": 12421
+ },
+ {
+ "epoch": 33.84741144414169,
+ "grad_norm": 7.234927177429199,
+ "learning_rate": 1.5410828092750106e-05,
+ "loss": 0.3199,
+ "step": 12422
+ },
+ {
+ "epoch": 33.85013623978202,
+ "grad_norm": 12.723918914794922,
+ "learning_rate": 1.541008592076964e-05,
+ "loss": 0.3752,
+ "step": 12423
+ },
+ {
+ "epoch": 33.85286103542234,
+ "grad_norm": 7.345337390899658,
+ "learning_rate": 1.5409343706655603e-05,
+ "loss": 0.3937,
+ "step": 12424
+ },
+ {
+ "epoch": 33.85558583106267,
+ "grad_norm": 7.744995594024658,
+ "learning_rate": 1.5408601450413767e-05,
+ "loss": 0.3183,
+ "step": 12425
+ },
+ {
+ "epoch": 33.858310626702995,
+ "grad_norm": 5.900259494781494,
+ "learning_rate": 1.5407859152049915e-05,
+ "loss": 0.2372,
+ "step": 12426
+ },
+ {
+ "epoch": 33.86103542234333,
+ "grad_norm": 7.837316036224365,
+ "learning_rate": 1.5407116811569833e-05,
+ "loss": 0.4977,
+ "step": 12427
+ },
+ {
+ "epoch": 33.86376021798365,
+ "grad_norm": 6.400331974029541,
+ "learning_rate": 1.54063744289793e-05,
+ "loss": 0.3331,
+ "step": 12428
+ },
+ {
+ "epoch": 33.86648501362398,
+ "grad_norm": 7.602609634399414,
+ "learning_rate": 1.5405632004284097e-05,
+ "loss": 0.4165,
+ "step": 12429
+ },
+ {
+ "epoch": 33.869209809264305,
+ "grad_norm": 14.240015983581543,
+ "learning_rate": 1.5404889537490004e-05,
+ "loss": 0.2772,
+ "step": 12430
+ },
+ {
+ "epoch": 33.87193460490463,
+ "grad_norm": 6.371674060821533,
+ "learning_rate": 1.5404147028602804e-05,
+ "loss": 0.4153,
+ "step": 12431
+ },
+ {
+ "epoch": 33.87465940054496,
+ "grad_norm": 7.883369445800781,
+ "learning_rate": 1.5403404477628286e-05,
+ "loss": 0.2592,
+ "step": 12432
+ },
+ {
+ "epoch": 33.87738419618529,
+ "grad_norm": 7.574853897094727,
+ "learning_rate": 1.5402661884572222e-05,
+ "loss": 0.3174,
+ "step": 12433
+ },
+ {
+ "epoch": 33.880108991825615,
+ "grad_norm": 7.4124884605407715,
+ "learning_rate": 1.5401919249440406e-05,
+ "loss": 0.3696,
+ "step": 12434
+ },
+ {
+ "epoch": 33.88283378746594,
+ "grad_norm": 6.390591144561768,
+ "learning_rate": 1.5401176572238615e-05,
+ "loss": 0.2631,
+ "step": 12435
+ },
+ {
+ "epoch": 33.88555858310627,
+ "grad_norm": 5.953117370605469,
+ "learning_rate": 1.5400433852972633e-05,
+ "loss": 0.3632,
+ "step": 12436
+ },
+ {
+ "epoch": 33.88828337874659,
+ "grad_norm": 6.461482048034668,
+ "learning_rate": 1.5399691091648246e-05,
+ "loss": 0.3871,
+ "step": 12437
+ },
+ {
+ "epoch": 33.89100817438692,
+ "grad_norm": 8.403675079345703,
+ "learning_rate": 1.5398948288271242e-05,
+ "loss": 0.2888,
+ "step": 12438
+ },
+ {
+ "epoch": 33.89373297002725,
+ "grad_norm": 7.038022518157959,
+ "learning_rate": 1.53982054428474e-05,
+ "loss": 0.3359,
+ "step": 12439
+ },
+ {
+ "epoch": 33.89645776566758,
+ "grad_norm": 6.362793922424316,
+ "learning_rate": 1.5397462555382508e-05,
+ "loss": 0.3172,
+ "step": 12440
+ },
+ {
+ "epoch": 33.8991825613079,
+ "grad_norm": 6.867793560028076,
+ "learning_rate": 1.539671962588235e-05,
+ "loss": 0.382,
+ "step": 12441
+ },
+ {
+ "epoch": 33.90190735694823,
+ "grad_norm": 10.121224403381348,
+ "learning_rate": 1.5395976654352715e-05,
+ "loss": 0.3347,
+ "step": 12442
+ },
+ {
+ "epoch": 33.904632152588555,
+ "grad_norm": 7.618274688720703,
+ "learning_rate": 1.539523364079939e-05,
+ "loss": 0.3734,
+ "step": 12443
+ },
+ {
+ "epoch": 33.90735694822888,
+ "grad_norm": 6.563361167907715,
+ "learning_rate": 1.5394490585228154e-05,
+ "loss": 0.2395,
+ "step": 12444
+ },
+ {
+ "epoch": 33.91008174386921,
+ "grad_norm": 6.725279808044434,
+ "learning_rate": 1.5393747487644803e-05,
+ "loss": 0.3066,
+ "step": 12445
+ },
+ {
+ "epoch": 33.91280653950954,
+ "grad_norm": 5.6815619468688965,
+ "learning_rate": 1.539300434805512e-05,
+ "loss": 0.3529,
+ "step": 12446
+ },
+ {
+ "epoch": 33.915531335149865,
+ "grad_norm": 6.796170234680176,
+ "learning_rate": 1.5392261166464886e-05,
+ "loss": 0.3427,
+ "step": 12447
+ },
+ {
+ "epoch": 33.91825613079019,
+ "grad_norm": 5.836400032043457,
+ "learning_rate": 1.5391517942879905e-05,
+ "loss": 0.3239,
+ "step": 12448
+ },
+ {
+ "epoch": 33.920980926430516,
+ "grad_norm": 6.661625385284424,
+ "learning_rate": 1.539077467730595e-05,
+ "loss": 0.4078,
+ "step": 12449
+ },
+ {
+ "epoch": 33.92370572207084,
+ "grad_norm": 12.549825668334961,
+ "learning_rate": 1.539003136974882e-05,
+ "loss": 0.3369,
+ "step": 12450
+ },
+ {
+ "epoch": 33.926430517711175,
+ "grad_norm": 7.375289440155029,
+ "learning_rate": 1.538928802021429e-05,
+ "loss": 0.3853,
+ "step": 12451
+ },
+ {
+ "epoch": 33.9291553133515,
+ "grad_norm": 9.283988952636719,
+ "learning_rate": 1.5388544628708166e-05,
+ "loss": 0.3829,
+ "step": 12452
+ },
+ {
+ "epoch": 33.93188010899183,
+ "grad_norm": 5.844550132751465,
+ "learning_rate": 1.5387801195236227e-05,
+ "loss": 0.3329,
+ "step": 12453
+ },
+ {
+ "epoch": 33.93460490463215,
+ "grad_norm": 6.188870906829834,
+ "learning_rate": 1.538705771980427e-05,
+ "loss": 0.4023,
+ "step": 12454
+ },
+ {
+ "epoch": 33.93732970027248,
+ "grad_norm": 8.369707107543945,
+ "learning_rate": 1.5386314202418076e-05,
+ "loss": 0.3803,
+ "step": 12455
+ },
+ {
+ "epoch": 33.940054495912804,
+ "grad_norm": 12.039058685302734,
+ "learning_rate": 1.538557064308344e-05,
+ "loss": 0.3149,
+ "step": 12456
+ },
+ {
+ "epoch": 33.94277929155314,
+ "grad_norm": 14.115557670593262,
+ "learning_rate": 1.5384827041806157e-05,
+ "loss": 0.4344,
+ "step": 12457
+ },
+ {
+ "epoch": 33.94550408719346,
+ "grad_norm": 7.214237689971924,
+ "learning_rate": 1.5384083398592015e-05,
+ "loss": 0.4768,
+ "step": 12458
+ },
+ {
+ "epoch": 33.94822888283379,
+ "grad_norm": 7.765081405639648,
+ "learning_rate": 1.53833397134468e-05,
+ "loss": 0.3866,
+ "step": 12459
+ },
+ {
+ "epoch": 33.950953678474114,
+ "grad_norm": 13.63409423828125,
+ "learning_rate": 1.5382595986376312e-05,
+ "loss": 0.3347,
+ "step": 12460
+ },
+ {
+ "epoch": 33.95367847411444,
+ "grad_norm": 6.552498817443848,
+ "learning_rate": 1.538185221738634e-05,
+ "loss": 0.3456,
+ "step": 12461
+ },
+ {
+ "epoch": 33.956403269754766,
+ "grad_norm": 7.624207496643066,
+ "learning_rate": 1.538110840648267e-05,
+ "loss": 0.4122,
+ "step": 12462
+ },
+ {
+ "epoch": 33.95912806539509,
+ "grad_norm": 7.696471691131592,
+ "learning_rate": 1.5380364553671107e-05,
+ "loss": 0.4084,
+ "step": 12463
+ },
+ {
+ "epoch": 33.961852861035425,
+ "grad_norm": 6.774961471557617,
+ "learning_rate": 1.537962065895744e-05,
+ "loss": 0.3287,
+ "step": 12464
+ },
+ {
+ "epoch": 33.96457765667575,
+ "grad_norm": 7.877649307250977,
+ "learning_rate": 1.5378876722347455e-05,
+ "loss": 0.5164,
+ "step": 12465
+ },
+ {
+ "epoch": 33.967302452316076,
+ "grad_norm": 7.891627311706543,
+ "learning_rate": 1.5378132743846955e-05,
+ "loss": 0.3705,
+ "step": 12466
+ },
+ {
+ "epoch": 33.9700272479564,
+ "grad_norm": 9.303549766540527,
+ "learning_rate": 1.537738872346173e-05,
+ "loss": 0.292,
+ "step": 12467
+ },
+ {
+ "epoch": 33.97275204359673,
+ "grad_norm": 7.350878715515137,
+ "learning_rate": 1.537664466119757e-05,
+ "loss": 0.3803,
+ "step": 12468
+ },
+ {
+ "epoch": 33.97547683923706,
+ "grad_norm": 8.583620071411133,
+ "learning_rate": 1.537590055706028e-05,
+ "loss": 0.3895,
+ "step": 12469
+ },
+ {
+ "epoch": 33.97820163487739,
+ "grad_norm": 6.492166042327881,
+ "learning_rate": 1.5375156411055644e-05,
+ "loss": 0.3654,
+ "step": 12470
+ },
+ {
+ "epoch": 33.98092643051771,
+ "grad_norm": 7.747386455535889,
+ "learning_rate": 1.5374412223189467e-05,
+ "loss": 0.2872,
+ "step": 12471
+ },
+ {
+ "epoch": 33.98365122615804,
+ "grad_norm": 5.402212619781494,
+ "learning_rate": 1.537366799346754e-05,
+ "loss": 0.4095,
+ "step": 12472
+ },
+ {
+ "epoch": 33.986376021798364,
+ "grad_norm": 11.660005569458008,
+ "learning_rate": 1.537292372189566e-05,
+ "loss": 0.3462,
+ "step": 12473
+ },
+ {
+ "epoch": 33.98910081743869,
+ "grad_norm": 6.122496128082275,
+ "learning_rate": 1.5372179408479624e-05,
+ "loss": 0.2592,
+ "step": 12474
+ },
+ {
+ "epoch": 33.991825613079016,
+ "grad_norm": 6.724801540374756,
+ "learning_rate": 1.5371435053225222e-05,
+ "loss": 0.3505,
+ "step": 12475
+ },
+ {
+ "epoch": 33.99455040871935,
+ "grad_norm": 5.974119186401367,
+ "learning_rate": 1.5370690656138265e-05,
+ "loss": 0.4124,
+ "step": 12476
+ },
+ {
+ "epoch": 33.997275204359674,
+ "grad_norm": 6.9660820960998535,
+ "learning_rate": 1.5369946217224536e-05,
+ "loss": 0.3219,
+ "step": 12477
+ },
+ {
+ "epoch": 34.0,
+ "grad_norm": 7.865757465362549,
+ "learning_rate": 1.536920173648984e-05,
+ "loss": 0.5123,
+ "step": 12478
+ },
+ {
+ "epoch": 34.002724795640326,
+ "grad_norm": 6.852688789367676,
+ "learning_rate": 1.5368457213939973e-05,
+ "loss": 0.2488,
+ "step": 12479
+ },
+ {
+ "epoch": 34.00544959128065,
+ "grad_norm": 7.923671245574951,
+ "learning_rate": 1.5367712649580736e-05,
+ "loss": 0.3334,
+ "step": 12480
+ },
+ {
+ "epoch": 34.00817438692098,
+ "grad_norm": 6.53236198425293,
+ "learning_rate": 1.5366968043417926e-05,
+ "loss": 0.313,
+ "step": 12481
+ },
+ {
+ "epoch": 34.01089918256131,
+ "grad_norm": 6.657381534576416,
+ "learning_rate": 1.5366223395457337e-05,
+ "loss": 0.2969,
+ "step": 12482
+ },
+ {
+ "epoch": 34.013623978201636,
+ "grad_norm": 6.5685038566589355,
+ "learning_rate": 1.536547870570478e-05,
+ "loss": 0.3204,
+ "step": 12483
+ },
+ {
+ "epoch": 34.01634877384196,
+ "grad_norm": 6.03550386428833,
+ "learning_rate": 1.5364733974166042e-05,
+ "loss": 0.3785,
+ "step": 12484
+ },
+ {
+ "epoch": 34.01907356948229,
+ "grad_norm": 6.594084739685059,
+ "learning_rate": 1.536398920084693e-05,
+ "loss": 0.4122,
+ "step": 12485
+ },
+ {
+ "epoch": 34.02179836512261,
+ "grad_norm": 6.372106075286865,
+ "learning_rate": 1.5363244385753244e-05,
+ "loss": 0.2687,
+ "step": 12486
+ },
+ {
+ "epoch": 34.02452316076294,
+ "grad_norm": 6.909015655517578,
+ "learning_rate": 1.5362499528890782e-05,
+ "loss": 0.2734,
+ "step": 12487
+ },
+ {
+ "epoch": 34.02724795640327,
+ "grad_norm": 39.4537239074707,
+ "learning_rate": 1.5361754630265347e-05,
+ "loss": 0.34,
+ "step": 12488
+ },
+ {
+ "epoch": 34.0299727520436,
+ "grad_norm": 6.2265448570251465,
+ "learning_rate": 1.5361009689882737e-05,
+ "loss": 0.2168,
+ "step": 12489
+ },
+ {
+ "epoch": 34.032697547683924,
+ "grad_norm": 7.566519260406494,
+ "learning_rate": 1.5360264707748758e-05,
+ "loss": 0.4664,
+ "step": 12490
+ },
+ {
+ "epoch": 34.03542234332425,
+ "grad_norm": 6.685686111450195,
+ "learning_rate": 1.5359519683869207e-05,
+ "loss": 0.2734,
+ "step": 12491
+ },
+ {
+ "epoch": 34.038147138964575,
+ "grad_norm": 8.083074569702148,
+ "learning_rate": 1.5358774618249895e-05,
+ "loss": 0.4032,
+ "step": 12492
+ },
+ {
+ "epoch": 34.0408719346049,
+ "grad_norm": 5.474445343017578,
+ "learning_rate": 1.5358029510896616e-05,
+ "loss": 0.4359,
+ "step": 12493
+ },
+ {
+ "epoch": 34.043596730245234,
+ "grad_norm": 8.933283805847168,
+ "learning_rate": 1.5357284361815178e-05,
+ "loss": 0.3463,
+ "step": 12494
+ },
+ {
+ "epoch": 34.04632152588556,
+ "grad_norm": 7.755788803100586,
+ "learning_rate": 1.535653917101138e-05,
+ "loss": 0.3312,
+ "step": 12495
+ },
+ {
+ "epoch": 34.049046321525886,
+ "grad_norm": 8.029553413391113,
+ "learning_rate": 1.5355793938491025e-05,
+ "loss": 0.2626,
+ "step": 12496
+ },
+ {
+ "epoch": 34.05177111716621,
+ "grad_norm": 8.580611228942871,
+ "learning_rate": 1.535504866425992e-05,
+ "loss": 0.3463,
+ "step": 12497
+ },
+ {
+ "epoch": 34.05449591280654,
+ "grad_norm": 9.165595054626465,
+ "learning_rate": 1.5354303348323873e-05,
+ "loss": 0.3956,
+ "step": 12498
+ },
+ {
+ "epoch": 34.05722070844686,
+ "grad_norm": 10.379510879516602,
+ "learning_rate": 1.5353557990688675e-05,
+ "loss": 0.3011,
+ "step": 12499
+ },
+ {
+ "epoch": 34.059945504087196,
+ "grad_norm": 8.267645835876465,
+ "learning_rate": 1.5352812591360148e-05,
+ "loss": 0.4059,
+ "step": 12500
+ },
+ {
+ "epoch": 34.06267029972752,
+ "grad_norm": 6.728059768676758,
+ "learning_rate": 1.5352067150344084e-05,
+ "loss": 0.4751,
+ "step": 12501
+ },
+ {
+ "epoch": 34.06539509536785,
+ "grad_norm": 6.893502712249756,
+ "learning_rate": 1.5351321667646298e-05,
+ "loss": 0.3395,
+ "step": 12502
+ },
+ {
+ "epoch": 34.06811989100817,
+ "grad_norm": 7.514678478240967,
+ "learning_rate": 1.5350576143272587e-05,
+ "loss": 0.325,
+ "step": 12503
+ },
+ {
+ "epoch": 34.0708446866485,
+ "grad_norm": 6.598287105560303,
+ "learning_rate": 1.534983057722876e-05,
+ "loss": 0.3159,
+ "step": 12504
+ },
+ {
+ "epoch": 34.073569482288825,
+ "grad_norm": 8.37763500213623,
+ "learning_rate": 1.5349084969520628e-05,
+ "loss": 0.3809,
+ "step": 12505
+ },
+ {
+ "epoch": 34.07629427792916,
+ "grad_norm": 6.894758701324463,
+ "learning_rate": 1.5348339320153992e-05,
+ "loss": 0.3809,
+ "step": 12506
+ },
+ {
+ "epoch": 34.079019073569484,
+ "grad_norm": 7.859985828399658,
+ "learning_rate": 1.5347593629134663e-05,
+ "loss": 0.2865,
+ "step": 12507
+ },
+ {
+ "epoch": 34.08174386920981,
+ "grad_norm": 7.461994647979736,
+ "learning_rate": 1.534684789646845e-05,
+ "loss": 0.3677,
+ "step": 12508
+ },
+ {
+ "epoch": 34.084468664850135,
+ "grad_norm": 8.27462100982666,
+ "learning_rate": 1.5346102122161152e-05,
+ "loss": 0.369,
+ "step": 12509
+ },
+ {
+ "epoch": 34.08719346049046,
+ "grad_norm": 5.675178050994873,
+ "learning_rate": 1.5345356306218586e-05,
+ "loss": 0.3832,
+ "step": 12510
+ },
+ {
+ "epoch": 34.08991825613079,
+ "grad_norm": 7.228993892669678,
+ "learning_rate": 1.5344610448646555e-05,
+ "loss": 0.3028,
+ "step": 12511
+ },
+ {
+ "epoch": 34.09264305177112,
+ "grad_norm": 8.06761360168457,
+ "learning_rate": 1.534386454945087e-05,
+ "loss": 0.4328,
+ "step": 12512
+ },
+ {
+ "epoch": 34.095367847411445,
+ "grad_norm": 9.210061073303223,
+ "learning_rate": 1.5343118608637345e-05,
+ "loss": 0.3381,
+ "step": 12513
+ },
+ {
+ "epoch": 34.09809264305177,
+ "grad_norm": 7.22993803024292,
+ "learning_rate": 1.534237262621178e-05,
+ "loss": 0.425,
+ "step": 12514
+ },
+ {
+ "epoch": 34.1008174386921,
+ "grad_norm": 7.0670599937438965,
+ "learning_rate": 1.5341626602179988e-05,
+ "loss": 0.3392,
+ "step": 12515
+ },
+ {
+ "epoch": 34.10354223433242,
+ "grad_norm": 7.207448959350586,
+ "learning_rate": 1.534088053654778e-05,
+ "loss": 0.4464,
+ "step": 12516
+ },
+ {
+ "epoch": 34.10626702997275,
+ "grad_norm": 8.390975952148438,
+ "learning_rate": 1.534013442932097e-05,
+ "loss": 0.3948,
+ "step": 12517
+ },
+ {
+ "epoch": 34.10899182561308,
+ "grad_norm": 6.45070743560791,
+ "learning_rate": 1.533938828050536e-05,
+ "loss": 0.3434,
+ "step": 12518
+ },
+ {
+ "epoch": 34.11171662125341,
+ "grad_norm": 6.419523239135742,
+ "learning_rate": 1.533864209010677e-05,
+ "loss": 0.4856,
+ "step": 12519
+ },
+ {
+ "epoch": 34.11444141689373,
+ "grad_norm": 7.4021525382995605,
+ "learning_rate": 1.5337895858131004e-05,
+ "loss": 0.3211,
+ "step": 12520
+ },
+ {
+ "epoch": 34.11716621253406,
+ "grad_norm": 5.476337909698486,
+ "learning_rate": 1.5337149584583878e-05,
+ "loss": 0.4803,
+ "step": 12521
+ },
+ {
+ "epoch": 34.119891008174385,
+ "grad_norm": 7.536069393157959,
+ "learning_rate": 1.5336403269471202e-05,
+ "loss": 0.4091,
+ "step": 12522
+ },
+ {
+ "epoch": 34.12261580381471,
+ "grad_norm": 6.384524345397949,
+ "learning_rate": 1.533565691279879e-05,
+ "loss": 0.256,
+ "step": 12523
+ },
+ {
+ "epoch": 34.12534059945504,
+ "grad_norm": 5.690863132476807,
+ "learning_rate": 1.5334910514572453e-05,
+ "loss": 0.2987,
+ "step": 12524
+ },
+ {
+ "epoch": 34.12806539509537,
+ "grad_norm": 7.242108345031738,
+ "learning_rate": 1.5334164074798008e-05,
+ "loss": 0.3978,
+ "step": 12525
+ },
+ {
+ "epoch": 34.130790190735695,
+ "grad_norm": 7.1291890144348145,
+ "learning_rate": 1.5333417593481262e-05,
+ "loss": 0.3231,
+ "step": 12526
+ },
+ {
+ "epoch": 34.13351498637602,
+ "grad_norm": 5.386416912078857,
+ "learning_rate": 1.533267107062803e-05,
+ "loss": 0.4016,
+ "step": 12527
+ },
+ {
+ "epoch": 34.13623978201635,
+ "grad_norm": 6.721260070800781,
+ "learning_rate": 1.5331924506244132e-05,
+ "loss": 0.2899,
+ "step": 12528
+ },
+ {
+ "epoch": 34.13896457765667,
+ "grad_norm": 10.538313865661621,
+ "learning_rate": 1.5331177900335372e-05,
+ "loss": 0.3217,
+ "step": 12529
+ },
+ {
+ "epoch": 34.141689373297005,
+ "grad_norm": 6.040736675262451,
+ "learning_rate": 1.5330431252907575e-05,
+ "loss": 0.2218,
+ "step": 12530
+ },
+ {
+ "epoch": 34.14441416893733,
+ "grad_norm": 5.292067050933838,
+ "learning_rate": 1.5329684563966547e-05,
+ "loss": 0.2944,
+ "step": 12531
+ },
+ {
+ "epoch": 34.14713896457766,
+ "grad_norm": 6.043910026550293,
+ "learning_rate": 1.532893783351811e-05,
+ "loss": 0.3723,
+ "step": 12532
+ },
+ {
+ "epoch": 34.14986376021798,
+ "grad_norm": 6.5580573081970215,
+ "learning_rate": 1.5328191061568076e-05,
+ "loss": 0.2774,
+ "step": 12533
+ },
+ {
+ "epoch": 34.15258855585831,
+ "grad_norm": 8.724053382873535,
+ "learning_rate": 1.532744424812226e-05,
+ "loss": 0.2576,
+ "step": 12534
+ },
+ {
+ "epoch": 34.155313351498634,
+ "grad_norm": 6.399105548858643,
+ "learning_rate": 1.5326697393186482e-05,
+ "loss": 0.4534,
+ "step": 12535
+ },
+ {
+ "epoch": 34.15803814713897,
+ "grad_norm": 7.29347038269043,
+ "learning_rate": 1.5325950496766557e-05,
+ "loss": 0.2491,
+ "step": 12536
+ },
+ {
+ "epoch": 34.16076294277929,
+ "grad_norm": 7.133385181427002,
+ "learning_rate": 1.53252035588683e-05,
+ "loss": 0.3222,
+ "step": 12537
+ },
+ {
+ "epoch": 34.16348773841962,
+ "grad_norm": 7.860514163970947,
+ "learning_rate": 1.5324456579497525e-05,
+ "loss": 0.3557,
+ "step": 12538
+ },
+ {
+ "epoch": 34.166212534059945,
+ "grad_norm": 6.143589496612549,
+ "learning_rate": 1.5323709558660057e-05,
+ "loss": 0.3087,
+ "step": 12539
+ },
+ {
+ "epoch": 34.16893732970027,
+ "grad_norm": 7.355077743530273,
+ "learning_rate": 1.5322962496361705e-05,
+ "loss": 0.5696,
+ "step": 12540
+ },
+ {
+ "epoch": 34.171662125340596,
+ "grad_norm": 6.451420783996582,
+ "learning_rate": 1.53222153926083e-05,
+ "loss": 0.2737,
+ "step": 12541
+ },
+ {
+ "epoch": 34.17438692098093,
+ "grad_norm": 6.261687278747559,
+ "learning_rate": 1.532146824740565e-05,
+ "loss": 0.4085,
+ "step": 12542
+ },
+ {
+ "epoch": 34.177111716621255,
+ "grad_norm": 6.657192707061768,
+ "learning_rate": 1.532072106075958e-05,
+ "loss": 0.3685,
+ "step": 12543
+ },
+ {
+ "epoch": 34.17983651226158,
+ "grad_norm": 10.220606803894043,
+ "learning_rate": 1.53199738326759e-05,
+ "loss": 0.3737,
+ "step": 12544
+ },
+ {
+ "epoch": 34.182561307901906,
+ "grad_norm": 5.563790321350098,
+ "learning_rate": 1.5319226563160438e-05,
+ "loss": 0.3335,
+ "step": 12545
+ },
+ {
+ "epoch": 34.18528610354223,
+ "grad_norm": 6.351738929748535,
+ "learning_rate": 1.531847925221901e-05,
+ "loss": 0.4303,
+ "step": 12546
+ },
+ {
+ "epoch": 34.18801089918256,
+ "grad_norm": 7.620738506317139,
+ "learning_rate": 1.5317731899857434e-05,
+ "loss": 0.3871,
+ "step": 12547
+ },
+ {
+ "epoch": 34.19073569482289,
+ "grad_norm": 8.398337364196777,
+ "learning_rate": 1.5316984506081537e-05,
+ "loss": 0.3358,
+ "step": 12548
+ },
+ {
+ "epoch": 34.19346049046322,
+ "grad_norm": 6.083836555480957,
+ "learning_rate": 1.5316237070897134e-05,
+ "loss": 0.2913,
+ "step": 12549
+ },
+ {
+ "epoch": 34.19618528610354,
+ "grad_norm": 6.6067681312561035,
+ "learning_rate": 1.5315489594310048e-05,
+ "loss": 0.3098,
+ "step": 12550
+ },
+ {
+ "epoch": 34.19891008174387,
+ "grad_norm": 10.521763801574707,
+ "learning_rate": 1.53147420763261e-05,
+ "loss": 0.5455,
+ "step": 12551
+ },
+ {
+ "epoch": 34.201634877384194,
+ "grad_norm": 6.089521884918213,
+ "learning_rate": 1.5313994516951112e-05,
+ "loss": 0.2724,
+ "step": 12552
+ },
+ {
+ "epoch": 34.20435967302452,
+ "grad_norm": 5.61362361907959,
+ "learning_rate": 1.5313246916190907e-05,
+ "loss": 0.3512,
+ "step": 12553
+ },
+ {
+ "epoch": 34.20708446866485,
+ "grad_norm": 6.106107234954834,
+ "learning_rate": 1.5312499274051303e-05,
+ "loss": 0.2629,
+ "step": 12554
+ },
+ {
+ "epoch": 34.20980926430518,
+ "grad_norm": 6.168601036071777,
+ "learning_rate": 1.531175159053813e-05,
+ "loss": 0.3591,
+ "step": 12555
+ },
+ {
+ "epoch": 34.212534059945504,
+ "grad_norm": 6.565435886383057,
+ "learning_rate": 1.5311003865657204e-05,
+ "loss": 0.3029,
+ "step": 12556
+ },
+ {
+ "epoch": 34.21525885558583,
+ "grad_norm": 6.768796443939209,
+ "learning_rate": 1.531025609941435e-05,
+ "loss": 0.2982,
+ "step": 12557
+ },
+ {
+ "epoch": 34.217983651226156,
+ "grad_norm": 9.92309856414795,
+ "learning_rate": 1.5309508291815395e-05,
+ "loss": 0.2703,
+ "step": 12558
+ },
+ {
+ "epoch": 34.22070844686648,
+ "grad_norm": 6.509314060211182,
+ "learning_rate": 1.530876044286616e-05,
+ "loss": 0.344,
+ "step": 12559
+ },
+ {
+ "epoch": 34.223433242506815,
+ "grad_norm": 6.4309234619140625,
+ "learning_rate": 1.5308012552572466e-05,
+ "loss": 0.3406,
+ "step": 12560
+ },
+ {
+ "epoch": 34.22615803814714,
+ "grad_norm": 6.504822731018066,
+ "learning_rate": 1.5307264620940145e-05,
+ "loss": 0.3438,
+ "step": 12561
+ },
+ {
+ "epoch": 34.228882833787466,
+ "grad_norm": 7.467302322387695,
+ "learning_rate": 1.5306516647975014e-05,
+ "loss": 0.3404,
+ "step": 12562
+ },
+ {
+ "epoch": 34.23160762942779,
+ "grad_norm": 7.2365288734436035,
+ "learning_rate": 1.5305768633682906e-05,
+ "loss": 0.3845,
+ "step": 12563
+ },
+ {
+ "epoch": 34.23433242506812,
+ "grad_norm": 6.837965965270996,
+ "learning_rate": 1.530502057806964e-05,
+ "loss": 0.2961,
+ "step": 12564
+ },
+ {
+ "epoch": 34.237057220708444,
+ "grad_norm": 6.4085774421691895,
+ "learning_rate": 1.5304272481141045e-05,
+ "loss": 0.1936,
+ "step": 12565
+ },
+ {
+ "epoch": 34.23978201634878,
+ "grad_norm": 6.5254130363464355,
+ "learning_rate": 1.5303524342902948e-05,
+ "loss": 0.2939,
+ "step": 12566
+ },
+ {
+ "epoch": 34.2425068119891,
+ "grad_norm": 7.245466709136963,
+ "learning_rate": 1.5302776163361173e-05,
+ "loss": 0.3392,
+ "step": 12567
+ },
+ {
+ "epoch": 34.24523160762943,
+ "grad_norm": 11.342859268188477,
+ "learning_rate": 1.530202794252155e-05,
+ "loss": 0.4028,
+ "step": 12568
+ },
+ {
+ "epoch": 34.247956403269754,
+ "grad_norm": 8.174638748168945,
+ "learning_rate": 1.5301279680389902e-05,
+ "loss": 0.33,
+ "step": 12569
+ },
+ {
+ "epoch": 34.25068119891008,
+ "grad_norm": 5.684847354888916,
+ "learning_rate": 1.530053137697206e-05,
+ "loss": 0.2464,
+ "step": 12570
+ },
+ {
+ "epoch": 34.253405994550405,
+ "grad_norm": 5.457337379455566,
+ "learning_rate": 1.5299783032273848e-05,
+ "loss": 0.4058,
+ "step": 12571
+ },
+ {
+ "epoch": 34.25613079019074,
+ "grad_norm": 6.069042205810547,
+ "learning_rate": 1.5299034646301097e-05,
+ "loss": 0.2861,
+ "step": 12572
+ },
+ {
+ "epoch": 34.258855585831064,
+ "grad_norm": 6.74777364730835,
+ "learning_rate": 1.5298286219059634e-05,
+ "loss": 0.2883,
+ "step": 12573
+ },
+ {
+ "epoch": 34.26158038147139,
+ "grad_norm": 6.886902809143066,
+ "learning_rate": 1.5297537750555286e-05,
+ "loss": 0.3531,
+ "step": 12574
+ },
+ {
+ "epoch": 34.264305177111716,
+ "grad_norm": 7.231983184814453,
+ "learning_rate": 1.529678924079389e-05,
+ "loss": 0.2516,
+ "step": 12575
+ },
+ {
+ "epoch": 34.26702997275204,
+ "grad_norm": 8.084550857543945,
+ "learning_rate": 1.5296040689781267e-05,
+ "loss": 0.2573,
+ "step": 12576
+ },
+ {
+ "epoch": 34.26975476839237,
+ "grad_norm": 8.349410057067871,
+ "learning_rate": 1.529529209752325e-05,
+ "loss": 0.3591,
+ "step": 12577
+ },
+ {
+ "epoch": 34.2724795640327,
+ "grad_norm": 5.445027828216553,
+ "learning_rate": 1.529454346402567e-05,
+ "loss": 0.3697,
+ "step": 12578
+ },
+ {
+ "epoch": 34.275204359673026,
+ "grad_norm": 12.19077205657959,
+ "learning_rate": 1.529379478929436e-05,
+ "loss": 0.4547,
+ "step": 12579
+ },
+ {
+ "epoch": 34.27792915531335,
+ "grad_norm": 6.323980808258057,
+ "learning_rate": 1.5293046073335137e-05,
+ "loss": 0.352,
+ "step": 12580
+ },
+ {
+ "epoch": 34.28065395095368,
+ "grad_norm": 7.025436878204346,
+ "learning_rate": 1.529229731615385e-05,
+ "loss": 0.293,
+ "step": 12581
+ },
+ {
+ "epoch": 34.283378746594,
+ "grad_norm": 7.498295783996582,
+ "learning_rate": 1.529154851775631e-05,
+ "loss": 0.264,
+ "step": 12582
+ },
+ {
+ "epoch": 34.28610354223433,
+ "grad_norm": 6.7955780029296875,
+ "learning_rate": 1.529079967814837e-05,
+ "loss": 0.3305,
+ "step": 12583
+ },
+ {
+ "epoch": 34.28882833787466,
+ "grad_norm": 7.907827377319336,
+ "learning_rate": 1.529005079733585e-05,
+ "loss": 0.3605,
+ "step": 12584
+ },
+ {
+ "epoch": 34.29155313351499,
+ "grad_norm": 7.189267158508301,
+ "learning_rate": 1.528930187532459e-05,
+ "loss": 0.3698,
+ "step": 12585
+ },
+ {
+ "epoch": 34.294277929155314,
+ "grad_norm": 8.38147258758545,
+ "learning_rate": 1.528855291212041e-05,
+ "loss": 0.435,
+ "step": 12586
+ },
+ {
+ "epoch": 34.29700272479564,
+ "grad_norm": 6.848021507263184,
+ "learning_rate": 1.5287803907729154e-05,
+ "loss": 0.349,
+ "step": 12587
+ },
+ {
+ "epoch": 34.299727520435965,
+ "grad_norm": 5.953732490539551,
+ "learning_rate": 1.5287054862156648e-05,
+ "loss": 0.3755,
+ "step": 12588
+ },
+ {
+ "epoch": 34.30245231607629,
+ "grad_norm": 6.992973804473877,
+ "learning_rate": 1.5286305775408732e-05,
+ "loss": 0.4518,
+ "step": 12589
+ },
+ {
+ "epoch": 34.305177111716624,
+ "grad_norm": 6.778861999511719,
+ "learning_rate": 1.5285556647491237e-05,
+ "loss": 0.3205,
+ "step": 12590
+ },
+ {
+ "epoch": 34.30790190735695,
+ "grad_norm": 6.7751078605651855,
+ "learning_rate": 1.5284807478409994e-05,
+ "loss": 0.2394,
+ "step": 12591
+ },
+ {
+ "epoch": 34.310626702997276,
+ "grad_norm": 6.508416175842285,
+ "learning_rate": 1.528405826817084e-05,
+ "loss": 0.3088,
+ "step": 12592
+ },
+ {
+ "epoch": 34.3133514986376,
+ "grad_norm": 6.094081878662109,
+ "learning_rate": 1.5283309016779615e-05,
+ "loss": 0.3897,
+ "step": 12593
+ },
+ {
+ "epoch": 34.31607629427793,
+ "grad_norm": 6.154423713684082,
+ "learning_rate": 1.5282559724242145e-05,
+ "loss": 0.2567,
+ "step": 12594
+ },
+ {
+ "epoch": 34.31880108991825,
+ "grad_norm": 6.5120038986206055,
+ "learning_rate": 1.5281810390564274e-05,
+ "loss": 0.3162,
+ "step": 12595
+ },
+ {
+ "epoch": 34.321525885558586,
+ "grad_norm": 6.46196985244751,
+ "learning_rate": 1.528106101575183e-05,
+ "loss": 0.3739,
+ "step": 12596
+ },
+ {
+ "epoch": 34.32425068119891,
+ "grad_norm": 7.718747615814209,
+ "learning_rate": 1.5280311599810654e-05,
+ "loss": 0.2753,
+ "step": 12597
+ },
+ {
+ "epoch": 34.32697547683924,
+ "grad_norm": 5.9966816902160645,
+ "learning_rate": 1.527956214274658e-05,
+ "loss": 0.3034,
+ "step": 12598
+ },
+ {
+ "epoch": 34.32970027247956,
+ "grad_norm": 6.607402801513672,
+ "learning_rate": 1.527881264456545e-05,
+ "loss": 0.2888,
+ "step": 12599
+ },
+ {
+ "epoch": 34.33242506811989,
+ "grad_norm": 6.733821392059326,
+ "learning_rate": 1.5278063105273094e-05,
+ "loss": 0.3195,
+ "step": 12600
+ },
+ {
+ "epoch": 34.335149863760215,
+ "grad_norm": 7.093853950500488,
+ "learning_rate": 1.527731352487535e-05,
+ "loss": 0.3503,
+ "step": 12601
+ },
+ {
+ "epoch": 34.33787465940055,
+ "grad_norm": 6.891481399536133,
+ "learning_rate": 1.5276563903378064e-05,
+ "loss": 0.3297,
+ "step": 12602
+ },
+ {
+ "epoch": 34.34059945504087,
+ "grad_norm": 11.526920318603516,
+ "learning_rate": 1.5275814240787064e-05,
+ "loss": 0.3038,
+ "step": 12603
+ },
+ {
+ "epoch": 34.3433242506812,
+ "grad_norm": 5.182687282562256,
+ "learning_rate": 1.527506453710819e-05,
+ "loss": 0.4803,
+ "step": 12604
+ },
+ {
+ "epoch": 34.346049046321525,
+ "grad_norm": 6.055121421813965,
+ "learning_rate": 1.527431479234729e-05,
+ "loss": 0.3439,
+ "step": 12605
+ },
+ {
+ "epoch": 34.34877384196185,
+ "grad_norm": 7.062063694000244,
+ "learning_rate": 1.527356500651019e-05,
+ "loss": 0.4901,
+ "step": 12606
+ },
+ {
+ "epoch": 34.35149863760218,
+ "grad_norm": 6.244130611419678,
+ "learning_rate": 1.5272815179602743e-05,
+ "loss": 0.3791,
+ "step": 12607
+ },
+ {
+ "epoch": 34.35422343324251,
+ "grad_norm": 7.249322891235352,
+ "learning_rate": 1.5272065311630773e-05,
+ "loss": 0.2953,
+ "step": 12608
+ },
+ {
+ "epoch": 34.356948228882835,
+ "grad_norm": 5.700298309326172,
+ "learning_rate": 1.5271315402600132e-05,
+ "loss": 0.2553,
+ "step": 12609
+ },
+ {
+ "epoch": 34.35967302452316,
+ "grad_norm": 6.6068267822265625,
+ "learning_rate": 1.5270565452516656e-05,
+ "loss": 0.3201,
+ "step": 12610
+ },
+ {
+ "epoch": 34.36239782016349,
+ "grad_norm": 8.201449394226074,
+ "learning_rate": 1.5269815461386187e-05,
+ "loss": 0.2877,
+ "step": 12611
+ },
+ {
+ "epoch": 34.36512261580381,
+ "grad_norm": 5.591947555541992,
+ "learning_rate": 1.5269065429214563e-05,
+ "loss": 0.2398,
+ "step": 12612
+ },
+ {
+ "epoch": 34.36784741144414,
+ "grad_norm": 11.065263748168945,
+ "learning_rate": 1.5268315356007624e-05,
+ "loss": 0.2484,
+ "step": 12613
+ },
+ {
+ "epoch": 34.37057220708447,
+ "grad_norm": 6.8644490242004395,
+ "learning_rate": 1.526756524177122e-05,
+ "loss": 0.3565,
+ "step": 12614
+ },
+ {
+ "epoch": 34.3732970027248,
+ "grad_norm": 8.553791046142578,
+ "learning_rate": 1.5266815086511187e-05,
+ "loss": 0.392,
+ "step": 12615
+ },
+ {
+ "epoch": 34.37602179836512,
+ "grad_norm": 5.286713600158691,
+ "learning_rate": 1.5266064890233363e-05,
+ "loss": 0.3876,
+ "step": 12616
+ },
+ {
+ "epoch": 34.37874659400545,
+ "grad_norm": 5.502371311187744,
+ "learning_rate": 1.52653146529436e-05,
+ "loss": 0.2347,
+ "step": 12617
+ },
+ {
+ "epoch": 34.381471389645775,
+ "grad_norm": 15.500739097595215,
+ "learning_rate": 1.5264564374647732e-05,
+ "loss": 0.523,
+ "step": 12618
+ },
+ {
+ "epoch": 34.3841961852861,
+ "grad_norm": 5.708557605743408,
+ "learning_rate": 1.526381405535161e-05,
+ "loss": 0.4802,
+ "step": 12619
+ },
+ {
+ "epoch": 34.38692098092643,
+ "grad_norm": 7.145052433013916,
+ "learning_rate": 1.5263063695061072e-05,
+ "loss": 0.3866,
+ "step": 12620
+ },
+ {
+ "epoch": 34.38964577656676,
+ "grad_norm": 6.679152488708496,
+ "learning_rate": 1.526231329378196e-05,
+ "loss": 0.3762,
+ "step": 12621
+ },
+ {
+ "epoch": 34.392370572207085,
+ "grad_norm": 6.710231304168701,
+ "learning_rate": 1.5261562851520127e-05,
+ "loss": 0.4016,
+ "step": 12622
+ },
+ {
+ "epoch": 34.39509536784741,
+ "grad_norm": 7.736103534698486,
+ "learning_rate": 1.526081236828141e-05,
+ "loss": 0.2979,
+ "step": 12623
+ },
+ {
+ "epoch": 34.39782016348774,
+ "grad_norm": 5.453094005584717,
+ "learning_rate": 1.5260061844071655e-05,
+ "loss": 0.2635,
+ "step": 12624
+ },
+ {
+ "epoch": 34.40054495912806,
+ "grad_norm": 6.7206292152404785,
+ "learning_rate": 1.5259311278896706e-05,
+ "loss": 0.449,
+ "step": 12625
+ },
+ {
+ "epoch": 34.403269754768395,
+ "grad_norm": 6.7119221687316895,
+ "learning_rate": 1.525856067276241e-05,
+ "loss": 0.3656,
+ "step": 12626
+ },
+ {
+ "epoch": 34.40599455040872,
+ "grad_norm": 7.327425479888916,
+ "learning_rate": 1.5257810025674613e-05,
+ "loss": 0.2811,
+ "step": 12627
+ },
+ {
+ "epoch": 34.40871934604905,
+ "grad_norm": 9.062700271606445,
+ "learning_rate": 1.5257059337639164e-05,
+ "loss": 0.3171,
+ "step": 12628
+ },
+ {
+ "epoch": 34.41144414168937,
+ "grad_norm": 6.503924369812012,
+ "learning_rate": 1.5256308608661904e-05,
+ "loss": 0.2482,
+ "step": 12629
+ },
+ {
+ "epoch": 34.4141689373297,
+ "grad_norm": 7.556908130645752,
+ "learning_rate": 1.5255557838748683e-05,
+ "loss": 0.2938,
+ "step": 12630
+ },
+ {
+ "epoch": 34.416893732970024,
+ "grad_norm": 5.482861042022705,
+ "learning_rate": 1.5254807027905342e-05,
+ "loss": 0.2621,
+ "step": 12631
+ },
+ {
+ "epoch": 34.41961852861036,
+ "grad_norm": 8.334380149841309,
+ "learning_rate": 1.5254056176137742e-05,
+ "loss": 0.3419,
+ "step": 12632
+ },
+ {
+ "epoch": 34.42234332425068,
+ "grad_norm": 8.406848907470703,
+ "learning_rate": 1.5253305283451714e-05,
+ "loss": 0.369,
+ "step": 12633
+ },
+ {
+ "epoch": 34.42506811989101,
+ "grad_norm": 7.206605434417725,
+ "learning_rate": 1.5252554349853114e-05,
+ "loss": 0.3595,
+ "step": 12634
+ },
+ {
+ "epoch": 34.427792915531334,
+ "grad_norm": 5.960251331329346,
+ "learning_rate": 1.5251803375347792e-05,
+ "loss": 0.2827,
+ "step": 12635
+ },
+ {
+ "epoch": 34.43051771117166,
+ "grad_norm": 11.61844253540039,
+ "learning_rate": 1.5251052359941593e-05,
+ "loss": 0.4728,
+ "step": 12636
+ },
+ {
+ "epoch": 34.433242506811986,
+ "grad_norm": 7.506865978240967,
+ "learning_rate": 1.5250301303640368e-05,
+ "loss": 0.3216,
+ "step": 12637
+ },
+ {
+ "epoch": 34.43596730245232,
+ "grad_norm": 11.855709075927734,
+ "learning_rate": 1.5249550206449968e-05,
+ "loss": 0.398,
+ "step": 12638
+ },
+ {
+ "epoch": 34.438692098092645,
+ "grad_norm": 6.202294826507568,
+ "learning_rate": 1.5248799068376236e-05,
+ "loss": 0.4269,
+ "step": 12639
+ },
+ {
+ "epoch": 34.44141689373297,
+ "grad_norm": 7.376853942871094,
+ "learning_rate": 1.5248047889425026e-05,
+ "loss": 0.4138,
+ "step": 12640
+ },
+ {
+ "epoch": 34.444141689373296,
+ "grad_norm": 6.544391632080078,
+ "learning_rate": 1.5247296669602189e-05,
+ "loss": 0.3949,
+ "step": 12641
+ },
+ {
+ "epoch": 34.44686648501362,
+ "grad_norm": 6.126943111419678,
+ "learning_rate": 1.5246545408913575e-05,
+ "loss": 0.262,
+ "step": 12642
+ },
+ {
+ "epoch": 34.44959128065395,
+ "grad_norm": 6.744805812835693,
+ "learning_rate": 1.5245794107365034e-05,
+ "loss": 0.308,
+ "step": 12643
+ },
+ {
+ "epoch": 34.45231607629428,
+ "grad_norm": 8.80776309967041,
+ "learning_rate": 1.5245042764962416e-05,
+ "loss": 0.4443,
+ "step": 12644
+ },
+ {
+ "epoch": 34.45504087193461,
+ "grad_norm": 6.651944637298584,
+ "learning_rate": 1.5244291381711574e-05,
+ "loss": 0.2739,
+ "step": 12645
+ },
+ {
+ "epoch": 34.45776566757493,
+ "grad_norm": 6.812028884887695,
+ "learning_rate": 1.5243539957618363e-05,
+ "loss": 0.4237,
+ "step": 12646
+ },
+ {
+ "epoch": 34.46049046321526,
+ "grad_norm": 12.600976943969727,
+ "learning_rate": 1.5242788492688628e-05,
+ "loss": 0.4821,
+ "step": 12647
+ },
+ {
+ "epoch": 34.463215258855584,
+ "grad_norm": 21.884811401367188,
+ "learning_rate": 1.5242036986928225e-05,
+ "loss": 0.3579,
+ "step": 12648
+ },
+ {
+ "epoch": 34.46594005449591,
+ "grad_norm": 7.988901615142822,
+ "learning_rate": 1.5241285440343008e-05,
+ "loss": 0.3257,
+ "step": 12649
+ },
+ {
+ "epoch": 34.46866485013624,
+ "grad_norm": 7.309326171875,
+ "learning_rate": 1.524053385293883e-05,
+ "loss": 0.3538,
+ "step": 12650
+ },
+ {
+ "epoch": 34.47138964577657,
+ "grad_norm": 8.580944061279297,
+ "learning_rate": 1.5239782224721537e-05,
+ "loss": 0.4138,
+ "step": 12651
+ },
+ {
+ "epoch": 34.474114441416894,
+ "grad_norm": 7.301868438720703,
+ "learning_rate": 1.5239030555696995e-05,
+ "loss": 0.2907,
+ "step": 12652
+ },
+ {
+ "epoch": 34.47683923705722,
+ "grad_norm": 16.115550994873047,
+ "learning_rate": 1.5238278845871048e-05,
+ "loss": 0.4512,
+ "step": 12653
+ },
+ {
+ "epoch": 34.479564032697546,
+ "grad_norm": 6.847012996673584,
+ "learning_rate": 1.5237527095249558e-05,
+ "loss": 0.3115,
+ "step": 12654
+ },
+ {
+ "epoch": 34.48228882833787,
+ "grad_norm": 11.58302116394043,
+ "learning_rate": 1.5236775303838371e-05,
+ "loss": 0.3449,
+ "step": 12655
+ },
+ {
+ "epoch": 34.485013623978205,
+ "grad_norm": 10.742802619934082,
+ "learning_rate": 1.5236023471643352e-05,
+ "loss": 0.2906,
+ "step": 12656
+ },
+ {
+ "epoch": 34.48773841961853,
+ "grad_norm": 7.742465972900391,
+ "learning_rate": 1.5235271598670345e-05,
+ "loss": 0.5452,
+ "step": 12657
+ },
+ {
+ "epoch": 34.490463215258856,
+ "grad_norm": 7.01248025894165,
+ "learning_rate": 1.5234519684925215e-05,
+ "loss": 0.3445,
+ "step": 12658
+ },
+ {
+ "epoch": 34.49318801089918,
+ "grad_norm": 11.43049144744873,
+ "learning_rate": 1.5233767730413811e-05,
+ "loss": 0.261,
+ "step": 12659
+ },
+ {
+ "epoch": 34.49591280653951,
+ "grad_norm": 6.926109313964844,
+ "learning_rate": 1.5233015735141995e-05,
+ "loss": 0.3703,
+ "step": 12660
+ },
+ {
+ "epoch": 34.49863760217983,
+ "grad_norm": 6.705916881561279,
+ "learning_rate": 1.5232263699115616e-05,
+ "loss": 0.4207,
+ "step": 12661
+ },
+ {
+ "epoch": 34.50136239782017,
+ "grad_norm": 6.926370620727539,
+ "learning_rate": 1.5231511622340543e-05,
+ "loss": 0.2558,
+ "step": 12662
+ },
+ {
+ "epoch": 34.50408719346049,
+ "grad_norm": 7.000466823577881,
+ "learning_rate": 1.523075950482262e-05,
+ "loss": 0.4001,
+ "step": 12663
+ },
+ {
+ "epoch": 34.50681198910082,
+ "grad_norm": 7.390921592712402,
+ "learning_rate": 1.5230007346567717e-05,
+ "loss": 0.2559,
+ "step": 12664
+ },
+ {
+ "epoch": 34.509536784741144,
+ "grad_norm": 7.2458343505859375,
+ "learning_rate": 1.5229255147581678e-05,
+ "loss": 0.5916,
+ "step": 12665
+ },
+ {
+ "epoch": 34.51226158038147,
+ "grad_norm": 7.20648717880249,
+ "learning_rate": 1.5228502907870373e-05,
+ "loss": 0.375,
+ "step": 12666
+ },
+ {
+ "epoch": 34.514986376021795,
+ "grad_norm": 13.891578674316406,
+ "learning_rate": 1.5227750627439652e-05,
+ "loss": 0.5149,
+ "step": 12667
+ },
+ {
+ "epoch": 34.51771117166213,
+ "grad_norm": 8.530945777893066,
+ "learning_rate": 1.522699830629538e-05,
+ "loss": 0.4329,
+ "step": 12668
+ },
+ {
+ "epoch": 34.520435967302454,
+ "grad_norm": 6.637569427490234,
+ "learning_rate": 1.522624594444341e-05,
+ "loss": 0.3663,
+ "step": 12669
+ },
+ {
+ "epoch": 34.52316076294278,
+ "grad_norm": 9.173357963562012,
+ "learning_rate": 1.5225493541889609e-05,
+ "loss": 0.3019,
+ "step": 12670
+ },
+ {
+ "epoch": 34.525885558583106,
+ "grad_norm": 10.640692710876465,
+ "learning_rate": 1.522474109863983e-05,
+ "loss": 0.3535,
+ "step": 12671
+ },
+ {
+ "epoch": 34.52861035422343,
+ "grad_norm": 8.41413688659668,
+ "learning_rate": 1.5223988614699939e-05,
+ "loss": 0.4613,
+ "step": 12672
+ },
+ {
+ "epoch": 34.53133514986376,
+ "grad_norm": 8.539817810058594,
+ "learning_rate": 1.5223236090075788e-05,
+ "loss": 0.3545,
+ "step": 12673
+ },
+ {
+ "epoch": 34.53405994550409,
+ "grad_norm": 6.650314807891846,
+ "learning_rate": 1.5222483524773246e-05,
+ "loss": 0.4908,
+ "step": 12674
+ },
+ {
+ "epoch": 34.536784741144416,
+ "grad_norm": 7.6259331703186035,
+ "learning_rate": 1.5221730918798168e-05,
+ "loss": 0.4193,
+ "step": 12675
+ },
+ {
+ "epoch": 34.53950953678474,
+ "grad_norm": 7.47517204284668,
+ "learning_rate": 1.522097827215642e-05,
+ "loss": 0.312,
+ "step": 12676
+ },
+ {
+ "epoch": 34.54223433242507,
+ "grad_norm": 8.829288482666016,
+ "learning_rate": 1.5220225584853858e-05,
+ "loss": 0.419,
+ "step": 12677
+ },
+ {
+ "epoch": 34.54495912806539,
+ "grad_norm": 6.424598217010498,
+ "learning_rate": 1.5219472856896348e-05,
+ "loss": 0.2655,
+ "step": 12678
+ },
+ {
+ "epoch": 34.54768392370572,
+ "grad_norm": 7.619609355926514,
+ "learning_rate": 1.5218720088289753e-05,
+ "loss": 0.2967,
+ "step": 12679
+ },
+ {
+ "epoch": 34.55040871934605,
+ "grad_norm": 5.812038898468018,
+ "learning_rate": 1.5217967279039933e-05,
+ "loss": 0.4395,
+ "step": 12680
+ },
+ {
+ "epoch": 34.55313351498638,
+ "grad_norm": 7.461119174957275,
+ "learning_rate": 1.5217214429152752e-05,
+ "loss": 0.3044,
+ "step": 12681
+ },
+ {
+ "epoch": 34.555858310626704,
+ "grad_norm": 6.197144031524658,
+ "learning_rate": 1.5216461538634076e-05,
+ "loss": 0.3132,
+ "step": 12682
+ },
+ {
+ "epoch": 34.55858310626703,
+ "grad_norm": 7.825538158416748,
+ "learning_rate": 1.521570860748976e-05,
+ "loss": 0.3924,
+ "step": 12683
+ },
+ {
+ "epoch": 34.561307901907355,
+ "grad_norm": 8.52588176727295,
+ "learning_rate": 1.5214955635725677e-05,
+ "loss": 0.5195,
+ "step": 12684
+ },
+ {
+ "epoch": 34.56403269754768,
+ "grad_norm": 7.078782081604004,
+ "learning_rate": 1.5214202623347687e-05,
+ "loss": 0.2614,
+ "step": 12685
+ },
+ {
+ "epoch": 34.566757493188014,
+ "grad_norm": 7.565918922424316,
+ "learning_rate": 1.521344957036165e-05,
+ "loss": 0.3388,
+ "step": 12686
+ },
+ {
+ "epoch": 34.56948228882834,
+ "grad_norm": 6.790742874145508,
+ "learning_rate": 1.5212696476773441e-05,
+ "loss": 0.2745,
+ "step": 12687
+ },
+ {
+ "epoch": 34.572207084468666,
+ "grad_norm": 8.860798835754395,
+ "learning_rate": 1.5211943342588918e-05,
+ "loss": 0.4206,
+ "step": 12688
+ },
+ {
+ "epoch": 34.57493188010899,
+ "grad_norm": 9.137691497802734,
+ "learning_rate": 1.521119016781395e-05,
+ "loss": 0.4454,
+ "step": 12689
+ },
+ {
+ "epoch": 34.57765667574932,
+ "grad_norm": 12.674605369567871,
+ "learning_rate": 1.5210436952454398e-05,
+ "loss": 0.4881,
+ "step": 12690
+ },
+ {
+ "epoch": 34.58038147138964,
+ "grad_norm": 6.639235019683838,
+ "learning_rate": 1.5209683696516129e-05,
+ "loss": 0.2416,
+ "step": 12691
+ },
+ {
+ "epoch": 34.583106267029976,
+ "grad_norm": 8.917923927307129,
+ "learning_rate": 1.5208930400005016e-05,
+ "loss": 0.3309,
+ "step": 12692
+ },
+ {
+ "epoch": 34.5858310626703,
+ "grad_norm": 9.904099464416504,
+ "learning_rate": 1.5208177062926916e-05,
+ "loss": 0.2929,
+ "step": 12693
+ },
+ {
+ "epoch": 34.58855585831063,
+ "grad_norm": 7.763059616088867,
+ "learning_rate": 1.5207423685287704e-05,
+ "loss": 0.3746,
+ "step": 12694
+ },
+ {
+ "epoch": 34.59128065395095,
+ "grad_norm": 6.761361122131348,
+ "learning_rate": 1.5206670267093242e-05,
+ "loss": 0.2741,
+ "step": 12695
+ },
+ {
+ "epoch": 34.59400544959128,
+ "grad_norm": 10.17188835144043,
+ "learning_rate": 1.5205916808349401e-05,
+ "loss": 0.2814,
+ "step": 12696
+ },
+ {
+ "epoch": 34.596730245231605,
+ "grad_norm": 7.0764594078063965,
+ "learning_rate": 1.5205163309062048e-05,
+ "loss": 0.3881,
+ "step": 12697
+ },
+ {
+ "epoch": 34.59945504087194,
+ "grad_norm": 8.067386627197266,
+ "learning_rate": 1.5204409769237048e-05,
+ "loss": 0.3437,
+ "step": 12698
+ },
+ {
+ "epoch": 34.60217983651226,
+ "grad_norm": 11.958366394042969,
+ "learning_rate": 1.5203656188880276e-05,
+ "loss": 0.3264,
+ "step": 12699
+ },
+ {
+ "epoch": 34.60490463215259,
+ "grad_norm": 6.704128742218018,
+ "learning_rate": 1.5202902567997592e-05,
+ "loss": 0.3314,
+ "step": 12700
+ },
+ {
+ "epoch": 34.607629427792915,
+ "grad_norm": 7.999274730682373,
+ "learning_rate": 1.5202148906594874e-05,
+ "loss": 0.3633,
+ "step": 12701
+ },
+ {
+ "epoch": 34.61035422343324,
+ "grad_norm": 10.331748962402344,
+ "learning_rate": 1.5201395204677986e-05,
+ "loss": 0.4229,
+ "step": 12702
+ },
+ {
+ "epoch": 34.61307901907357,
+ "grad_norm": 5.908962726593018,
+ "learning_rate": 1.5200641462252802e-05,
+ "loss": 0.242,
+ "step": 12703
+ },
+ {
+ "epoch": 34.6158038147139,
+ "grad_norm": 9.226425170898438,
+ "learning_rate": 1.5199887679325185e-05,
+ "loss": 0.3636,
+ "step": 12704
+ },
+ {
+ "epoch": 34.618528610354225,
+ "grad_norm": 8.724287986755371,
+ "learning_rate": 1.5199133855901013e-05,
+ "loss": 0.3567,
+ "step": 12705
+ },
+ {
+ "epoch": 34.62125340599455,
+ "grad_norm": 9.33549976348877,
+ "learning_rate": 1.5198379991986154e-05,
+ "loss": 0.5277,
+ "step": 12706
+ },
+ {
+ "epoch": 34.62397820163488,
+ "grad_norm": 7.487105369567871,
+ "learning_rate": 1.519762608758648e-05,
+ "loss": 0.4089,
+ "step": 12707
+ },
+ {
+ "epoch": 34.6267029972752,
+ "grad_norm": 6.3186750411987305,
+ "learning_rate": 1.5196872142707859e-05,
+ "loss": 0.2189,
+ "step": 12708
+ },
+ {
+ "epoch": 34.62942779291553,
+ "grad_norm": 13.810160636901855,
+ "learning_rate": 1.5196118157356168e-05,
+ "loss": 0.4644,
+ "step": 12709
+ },
+ {
+ "epoch": 34.63215258855586,
+ "grad_norm": 7.9806413650512695,
+ "learning_rate": 1.5195364131537273e-05,
+ "loss": 0.363,
+ "step": 12710
+ },
+ {
+ "epoch": 34.63487738419619,
+ "grad_norm": 7.039987564086914,
+ "learning_rate": 1.5194610065257052e-05,
+ "loss": 0.3934,
+ "step": 12711
+ },
+ {
+ "epoch": 34.63760217983651,
+ "grad_norm": 6.936146259307861,
+ "learning_rate": 1.519385595852137e-05,
+ "loss": 0.3399,
+ "step": 12712
+ },
+ {
+ "epoch": 34.64032697547684,
+ "grad_norm": 6.270376205444336,
+ "learning_rate": 1.519310181133611e-05,
+ "loss": 0.4134,
+ "step": 12713
+ },
+ {
+ "epoch": 34.643051771117165,
+ "grad_norm": 7.317523956298828,
+ "learning_rate": 1.5192347623707138e-05,
+ "loss": 0.4918,
+ "step": 12714
+ },
+ {
+ "epoch": 34.64577656675749,
+ "grad_norm": 7.332164764404297,
+ "learning_rate": 1.5191593395640331e-05,
+ "loss": 0.331,
+ "step": 12715
+ },
+ {
+ "epoch": 34.64850136239782,
+ "grad_norm": 6.766537189483643,
+ "learning_rate": 1.5190839127141562e-05,
+ "loss": 0.5164,
+ "step": 12716
+ },
+ {
+ "epoch": 34.65122615803815,
+ "grad_norm": 8.445927619934082,
+ "learning_rate": 1.5190084818216705e-05,
+ "loss": 0.3835,
+ "step": 12717
+ },
+ {
+ "epoch": 34.653950953678475,
+ "grad_norm": 7.979760646820068,
+ "learning_rate": 1.5189330468871633e-05,
+ "loss": 0.2907,
+ "step": 12718
+ },
+ {
+ "epoch": 34.6566757493188,
+ "grad_norm": 10.70372486114502,
+ "learning_rate": 1.5188576079112225e-05,
+ "loss": 0.3962,
+ "step": 12719
+ },
+ {
+ "epoch": 34.65940054495913,
+ "grad_norm": 11.06981086730957,
+ "learning_rate": 1.5187821648944348e-05,
+ "loss": 0.2766,
+ "step": 12720
+ },
+ {
+ "epoch": 34.66212534059945,
+ "grad_norm": 6.434134483337402,
+ "learning_rate": 1.5187067178373887e-05,
+ "loss": 0.3264,
+ "step": 12721
+ },
+ {
+ "epoch": 34.664850136239785,
+ "grad_norm": 7.828649044036865,
+ "learning_rate": 1.5186312667406712e-05,
+ "loss": 0.3538,
+ "step": 12722
+ },
+ {
+ "epoch": 34.66757493188011,
+ "grad_norm": 6.914149761199951,
+ "learning_rate": 1.5185558116048704e-05,
+ "loss": 0.2717,
+ "step": 12723
+ },
+ {
+ "epoch": 34.67029972752044,
+ "grad_norm": 12.35200309753418,
+ "learning_rate": 1.5184803524305733e-05,
+ "loss": 0.2907,
+ "step": 12724
+ },
+ {
+ "epoch": 34.67302452316076,
+ "grad_norm": 9.508199691772461,
+ "learning_rate": 1.5184048892183683e-05,
+ "loss": 0.2726,
+ "step": 12725
+ },
+ {
+ "epoch": 34.67574931880109,
+ "grad_norm": 7.7572712898254395,
+ "learning_rate": 1.5183294219688423e-05,
+ "loss": 0.2978,
+ "step": 12726
+ },
+ {
+ "epoch": 34.678474114441414,
+ "grad_norm": 5.914263725280762,
+ "learning_rate": 1.5182539506825837e-05,
+ "loss": 0.3403,
+ "step": 12727
+ },
+ {
+ "epoch": 34.68119891008175,
+ "grad_norm": 7.788616180419922,
+ "learning_rate": 1.5181784753601797e-05,
+ "loss": 0.4465,
+ "step": 12728
+ },
+ {
+ "epoch": 34.68392370572207,
+ "grad_norm": 5.874246120452881,
+ "learning_rate": 1.5181029960022187e-05,
+ "loss": 0.3644,
+ "step": 12729
+ },
+ {
+ "epoch": 34.6866485013624,
+ "grad_norm": 11.232590675354004,
+ "learning_rate": 1.518027512609288e-05,
+ "loss": 0.3675,
+ "step": 12730
+ },
+ {
+ "epoch": 34.689373297002724,
+ "grad_norm": 6.877134323120117,
+ "learning_rate": 1.5179520251819758e-05,
+ "loss": 0.2774,
+ "step": 12731
+ },
+ {
+ "epoch": 34.69209809264305,
+ "grad_norm": 22.318862915039062,
+ "learning_rate": 1.51787653372087e-05,
+ "loss": 0.3995,
+ "step": 12732
+ },
+ {
+ "epoch": 34.694822888283376,
+ "grad_norm": 6.460038185119629,
+ "learning_rate": 1.5178010382265586e-05,
+ "loss": 0.2565,
+ "step": 12733
+ },
+ {
+ "epoch": 34.69754768392371,
+ "grad_norm": 7.191373825073242,
+ "learning_rate": 1.517725538699629e-05,
+ "loss": 0.3623,
+ "step": 12734
+ },
+ {
+ "epoch": 34.700272479564035,
+ "grad_norm": 6.409982681274414,
+ "learning_rate": 1.51765003514067e-05,
+ "loss": 0.3607,
+ "step": 12735
+ },
+ {
+ "epoch": 34.70299727520436,
+ "grad_norm": 6.087721347808838,
+ "learning_rate": 1.5175745275502686e-05,
+ "loss": 0.3006,
+ "step": 12736
+ },
+ {
+ "epoch": 34.705722070844686,
+ "grad_norm": 16.11115264892578,
+ "learning_rate": 1.5174990159290137e-05,
+ "loss": 0.3904,
+ "step": 12737
+ },
+ {
+ "epoch": 34.70844686648501,
+ "grad_norm": 8.521676063537598,
+ "learning_rate": 1.5174235002774933e-05,
+ "loss": 0.4363,
+ "step": 12738
+ },
+ {
+ "epoch": 34.71117166212534,
+ "grad_norm": 7.016096591949463,
+ "learning_rate": 1.5173479805962954e-05,
+ "loss": 0.2871,
+ "step": 12739
+ },
+ {
+ "epoch": 34.71389645776567,
+ "grad_norm": 8.119922637939453,
+ "learning_rate": 1.5172724568860075e-05,
+ "loss": 0.4052,
+ "step": 12740
+ },
+ {
+ "epoch": 34.716621253406,
+ "grad_norm": 10.564770698547363,
+ "learning_rate": 1.517196929147219e-05,
+ "loss": 0.351,
+ "step": 12741
+ },
+ {
+ "epoch": 34.71934604904632,
+ "grad_norm": 5.689218521118164,
+ "learning_rate": 1.517121397380517e-05,
+ "loss": 0.3754,
+ "step": 12742
+ },
+ {
+ "epoch": 34.72207084468665,
+ "grad_norm": 7.102179050445557,
+ "learning_rate": 1.5170458615864906e-05,
+ "loss": 0.4146,
+ "step": 12743
+ },
+ {
+ "epoch": 34.724795640326974,
+ "grad_norm": 7.624054908752441,
+ "learning_rate": 1.5169703217657274e-05,
+ "loss": 0.4538,
+ "step": 12744
+ },
+ {
+ "epoch": 34.7275204359673,
+ "grad_norm": 8.589566230773926,
+ "learning_rate": 1.5168947779188163e-05,
+ "loss": 0.5319,
+ "step": 12745
+ },
+ {
+ "epoch": 34.73024523160763,
+ "grad_norm": 6.940329074859619,
+ "learning_rate": 1.5168192300463447e-05,
+ "loss": 0.3917,
+ "step": 12746
+ },
+ {
+ "epoch": 34.73297002724796,
+ "grad_norm": 6.856508731842041,
+ "learning_rate": 1.516743678148902e-05,
+ "loss": 0.4256,
+ "step": 12747
+ },
+ {
+ "epoch": 34.735694822888284,
+ "grad_norm": 6.467329978942871,
+ "learning_rate": 1.516668122227076e-05,
+ "loss": 0.3243,
+ "step": 12748
+ },
+ {
+ "epoch": 34.73841961852861,
+ "grad_norm": 12.759373664855957,
+ "learning_rate": 1.5165925622814554e-05,
+ "loss": 0.241,
+ "step": 12749
+ },
+ {
+ "epoch": 34.741144414168936,
+ "grad_norm": 6.045810222625732,
+ "learning_rate": 1.5165169983126287e-05,
+ "loss": 0.2975,
+ "step": 12750
+ },
+ {
+ "epoch": 34.74386920980926,
+ "grad_norm": 25.1729736328125,
+ "learning_rate": 1.516441430321184e-05,
+ "loss": 0.3225,
+ "step": 12751
+ },
+ {
+ "epoch": 34.746594005449595,
+ "grad_norm": 7.094336032867432,
+ "learning_rate": 1.5163658583077103e-05,
+ "loss": 0.2514,
+ "step": 12752
+ },
+ {
+ "epoch": 34.74931880108992,
+ "grad_norm": 12.75036334991455,
+ "learning_rate": 1.5162902822727956e-05,
+ "loss": 0.3227,
+ "step": 12753
+ },
+ {
+ "epoch": 34.752043596730246,
+ "grad_norm": 9.665423393249512,
+ "learning_rate": 1.5162147022170288e-05,
+ "loss": 0.3798,
+ "step": 12754
+ },
+ {
+ "epoch": 34.75476839237057,
+ "grad_norm": 8.1179838180542,
+ "learning_rate": 1.5161391181409987e-05,
+ "loss": 0.3344,
+ "step": 12755
+ },
+ {
+ "epoch": 34.7574931880109,
+ "grad_norm": 25.28486442565918,
+ "learning_rate": 1.5160635300452936e-05,
+ "loss": 0.3,
+ "step": 12756
+ },
+ {
+ "epoch": 34.76021798365122,
+ "grad_norm": 8.724785804748535,
+ "learning_rate": 1.5159879379305028e-05,
+ "loss": 0.3551,
+ "step": 12757
+ },
+ {
+ "epoch": 34.762942779291556,
+ "grad_norm": 7.74306058883667,
+ "learning_rate": 1.515912341797214e-05,
+ "loss": 0.3218,
+ "step": 12758
+ },
+ {
+ "epoch": 34.76566757493188,
+ "grad_norm": 7.537326335906982,
+ "learning_rate": 1.515836741646017e-05,
+ "loss": 0.3193,
+ "step": 12759
+ },
+ {
+ "epoch": 34.76839237057221,
+ "grad_norm": 6.181797504425049,
+ "learning_rate": 1.5157611374774997e-05,
+ "loss": 0.4611,
+ "step": 12760
+ },
+ {
+ "epoch": 34.771117166212534,
+ "grad_norm": 7.308982849121094,
+ "learning_rate": 1.5156855292922512e-05,
+ "loss": 0.29,
+ "step": 12761
+ },
+ {
+ "epoch": 34.77384196185286,
+ "grad_norm": 9.729423522949219,
+ "learning_rate": 1.5156099170908605e-05,
+ "loss": 0.4969,
+ "step": 12762
+ },
+ {
+ "epoch": 34.776566757493185,
+ "grad_norm": 7.62312650680542,
+ "learning_rate": 1.5155343008739162e-05,
+ "loss": 0.3237,
+ "step": 12763
+ },
+ {
+ "epoch": 34.77929155313352,
+ "grad_norm": 7.187760353088379,
+ "learning_rate": 1.5154586806420078e-05,
+ "loss": 0.3556,
+ "step": 12764
+ },
+ {
+ "epoch": 34.782016348773844,
+ "grad_norm": 7.4792561531066895,
+ "learning_rate": 1.5153830563957232e-05,
+ "loss": 0.4765,
+ "step": 12765
+ },
+ {
+ "epoch": 34.78474114441417,
+ "grad_norm": 8.713623046875,
+ "learning_rate": 1.5153074281356523e-05,
+ "loss": 0.3162,
+ "step": 12766
+ },
+ {
+ "epoch": 34.787465940054496,
+ "grad_norm": 6.846462726593018,
+ "learning_rate": 1.5152317958623836e-05,
+ "loss": 0.3005,
+ "step": 12767
+ },
+ {
+ "epoch": 34.79019073569482,
+ "grad_norm": 7.01962423324585,
+ "learning_rate": 1.5151561595765066e-05,
+ "loss": 0.267,
+ "step": 12768
+ },
+ {
+ "epoch": 34.79291553133515,
+ "grad_norm": 8.18949031829834,
+ "learning_rate": 1.5150805192786097e-05,
+ "loss": 0.297,
+ "step": 12769
+ },
+ {
+ "epoch": 34.79564032697548,
+ "grad_norm": 7.413372039794922,
+ "learning_rate": 1.5150048749692822e-05,
+ "loss": 0.3751,
+ "step": 12770
+ },
+ {
+ "epoch": 34.798365122615806,
+ "grad_norm": 10.343478202819824,
+ "learning_rate": 1.5149292266491133e-05,
+ "loss": 0.3061,
+ "step": 12771
+ },
+ {
+ "epoch": 34.80108991825613,
+ "grad_norm": 6.774062633514404,
+ "learning_rate": 1.5148535743186928e-05,
+ "loss": 0.498,
+ "step": 12772
+ },
+ {
+ "epoch": 34.80381471389646,
+ "grad_norm": 6.852293491363525,
+ "learning_rate": 1.5147779179786084e-05,
+ "loss": 0.3989,
+ "step": 12773
+ },
+ {
+ "epoch": 34.80653950953678,
+ "grad_norm": 21.525096893310547,
+ "learning_rate": 1.5147022576294506e-05,
+ "loss": 0.4672,
+ "step": 12774
+ },
+ {
+ "epoch": 34.80926430517711,
+ "grad_norm": 9.819718360900879,
+ "learning_rate": 1.514626593271808e-05,
+ "loss": 0.3227,
+ "step": 12775
+ },
+ {
+ "epoch": 34.81198910081744,
+ "grad_norm": 7.6693572998046875,
+ "learning_rate": 1.5145509249062702e-05,
+ "loss": 0.2576,
+ "step": 12776
+ },
+ {
+ "epoch": 34.81471389645777,
+ "grad_norm": 6.69463586807251,
+ "learning_rate": 1.5144752525334264e-05,
+ "loss": 0.3507,
+ "step": 12777
+ },
+ {
+ "epoch": 34.817438692098094,
+ "grad_norm": 8.588858604431152,
+ "learning_rate": 1.5143995761538657e-05,
+ "loss": 0.4889,
+ "step": 12778
+ },
+ {
+ "epoch": 34.82016348773842,
+ "grad_norm": 10.772705078125,
+ "learning_rate": 1.5143238957681776e-05,
+ "loss": 0.3785,
+ "step": 12779
+ },
+ {
+ "epoch": 34.822888283378745,
+ "grad_norm": 6.9552154541015625,
+ "learning_rate": 1.5142482113769519e-05,
+ "loss": 0.4968,
+ "step": 12780
+ },
+ {
+ "epoch": 34.82561307901907,
+ "grad_norm": 6.593571662902832,
+ "learning_rate": 1.5141725229807773e-05,
+ "loss": 0.3855,
+ "step": 12781
+ },
+ {
+ "epoch": 34.828337874659404,
+ "grad_norm": 7.897350311279297,
+ "learning_rate": 1.5140968305802438e-05,
+ "loss": 0.2631,
+ "step": 12782
+ },
+ {
+ "epoch": 34.83106267029973,
+ "grad_norm": 7.923161506652832,
+ "learning_rate": 1.5140211341759408e-05,
+ "loss": 0.287,
+ "step": 12783
+ },
+ {
+ "epoch": 34.833787465940055,
+ "grad_norm": 7.426450729370117,
+ "learning_rate": 1.5139454337684577e-05,
+ "loss": 0.3377,
+ "step": 12784
+ },
+ {
+ "epoch": 34.83651226158038,
+ "grad_norm": 7.1171088218688965,
+ "learning_rate": 1.5138697293583842e-05,
+ "loss": 0.3357,
+ "step": 12785
+ },
+ {
+ "epoch": 34.83923705722071,
+ "grad_norm": 8.326007843017578,
+ "learning_rate": 1.5137940209463095e-05,
+ "loss": 0.3349,
+ "step": 12786
+ },
+ {
+ "epoch": 34.84196185286103,
+ "grad_norm": 6.74309778213501,
+ "learning_rate": 1.5137183085328237e-05,
+ "loss": 0.3382,
+ "step": 12787
+ },
+ {
+ "epoch": 34.844686648501366,
+ "grad_norm": 7.596869468688965,
+ "learning_rate": 1.5136425921185162e-05,
+ "loss": 0.4407,
+ "step": 12788
+ },
+ {
+ "epoch": 34.84741144414169,
+ "grad_norm": 9.84290885925293,
+ "learning_rate": 1.5135668717039767e-05,
+ "loss": 0.4174,
+ "step": 12789
+ },
+ {
+ "epoch": 34.85013623978202,
+ "grad_norm": 8.881937980651855,
+ "learning_rate": 1.513491147289795e-05,
+ "loss": 0.3128,
+ "step": 12790
+ },
+ {
+ "epoch": 34.85286103542234,
+ "grad_norm": 7.489529609680176,
+ "learning_rate": 1.5134154188765608e-05,
+ "loss": 0.2996,
+ "step": 12791
+ },
+ {
+ "epoch": 34.85558583106267,
+ "grad_norm": 5.962601661682129,
+ "learning_rate": 1.513339686464864e-05,
+ "loss": 0.2526,
+ "step": 12792
+ },
+ {
+ "epoch": 34.858310626702995,
+ "grad_norm": 5.978816509246826,
+ "learning_rate": 1.513263950055294e-05,
+ "loss": 0.3769,
+ "step": 12793
+ },
+ {
+ "epoch": 34.86103542234333,
+ "grad_norm": 7.779540538787842,
+ "learning_rate": 1.5131882096484409e-05,
+ "loss": 0.3186,
+ "step": 12794
+ },
+ {
+ "epoch": 34.86376021798365,
+ "grad_norm": 9.456623077392578,
+ "learning_rate": 1.5131124652448943e-05,
+ "loss": 0.3513,
+ "step": 12795
+ },
+ {
+ "epoch": 34.86648501362398,
+ "grad_norm": 7.130842208862305,
+ "learning_rate": 1.5130367168452449e-05,
+ "loss": 0.4387,
+ "step": 12796
+ },
+ {
+ "epoch": 34.869209809264305,
+ "grad_norm": 6.189455986022949,
+ "learning_rate": 1.5129609644500813e-05,
+ "loss": 0.4162,
+ "step": 12797
+ },
+ {
+ "epoch": 34.87193460490463,
+ "grad_norm": 7.358476161956787,
+ "learning_rate": 1.5128852080599949e-05,
+ "loss": 0.2995,
+ "step": 12798
+ },
+ {
+ "epoch": 34.87465940054496,
+ "grad_norm": 6.125901222229004,
+ "learning_rate": 1.5128094476755747e-05,
+ "loss": 0.457,
+ "step": 12799
+ },
+ {
+ "epoch": 34.87738419618529,
+ "grad_norm": 5.849795818328857,
+ "learning_rate": 1.5127336832974111e-05,
+ "loss": 0.4403,
+ "step": 12800
+ },
+ {
+ "epoch": 34.880108991825615,
+ "grad_norm": 6.29843807220459,
+ "learning_rate": 1.512657914926094e-05,
+ "loss": 0.2894,
+ "step": 12801
+ },
+ {
+ "epoch": 34.88283378746594,
+ "grad_norm": 7.504866600036621,
+ "learning_rate": 1.5125821425622137e-05,
+ "loss": 0.4162,
+ "step": 12802
+ },
+ {
+ "epoch": 34.88555858310627,
+ "grad_norm": 7.649609565734863,
+ "learning_rate": 1.5125063662063602e-05,
+ "loss": 0.5047,
+ "step": 12803
+ },
+ {
+ "epoch": 34.88828337874659,
+ "grad_norm": 6.444530010223389,
+ "learning_rate": 1.5124305858591238e-05,
+ "loss": 0.4594,
+ "step": 12804
+ },
+ {
+ "epoch": 34.89100817438692,
+ "grad_norm": 9.201496124267578,
+ "learning_rate": 1.5123548015210941e-05,
+ "loss": 0.315,
+ "step": 12805
+ },
+ {
+ "epoch": 34.89373297002725,
+ "grad_norm": 9.123472213745117,
+ "learning_rate": 1.5122790131928615e-05,
+ "loss": 0.3701,
+ "step": 12806
+ },
+ {
+ "epoch": 34.89645776566758,
+ "grad_norm": 7.393870830535889,
+ "learning_rate": 1.5122032208750168e-05,
+ "loss": 0.3359,
+ "step": 12807
+ },
+ {
+ "epoch": 34.8991825613079,
+ "grad_norm": 8.265925407409668,
+ "learning_rate": 1.51212742456815e-05,
+ "loss": 0.3147,
+ "step": 12808
+ },
+ {
+ "epoch": 34.90190735694823,
+ "grad_norm": 6.999871253967285,
+ "learning_rate": 1.5120516242728508e-05,
+ "loss": 0.3462,
+ "step": 12809
+ },
+ {
+ "epoch": 34.904632152588555,
+ "grad_norm": 9.759187698364258,
+ "learning_rate": 1.5119758199897106e-05,
+ "loss": 0.4647,
+ "step": 12810
+ },
+ {
+ "epoch": 34.90735694822888,
+ "grad_norm": 12.058571815490723,
+ "learning_rate": 1.511900011719319e-05,
+ "loss": 0.4572,
+ "step": 12811
+ },
+ {
+ "epoch": 34.91008174386921,
+ "grad_norm": 5.392372131347656,
+ "learning_rate": 1.5118241994622666e-05,
+ "loss": 0.3235,
+ "step": 12812
+ },
+ {
+ "epoch": 34.91280653950954,
+ "grad_norm": 6.347375869750977,
+ "learning_rate": 1.5117483832191438e-05,
+ "loss": 0.2578,
+ "step": 12813
+ },
+ {
+ "epoch": 34.915531335149865,
+ "grad_norm": 5.794153690338135,
+ "learning_rate": 1.5116725629905408e-05,
+ "loss": 0.4393,
+ "step": 12814
+ },
+ {
+ "epoch": 34.91825613079019,
+ "grad_norm": 7.6299028396606445,
+ "learning_rate": 1.5115967387770484e-05,
+ "loss": 0.2598,
+ "step": 12815
+ },
+ {
+ "epoch": 34.920980926430516,
+ "grad_norm": 6.074033260345459,
+ "learning_rate": 1.5115209105792574e-05,
+ "loss": 0.2385,
+ "step": 12816
+ },
+ {
+ "epoch": 34.92370572207084,
+ "grad_norm": 7.3379411697387695,
+ "learning_rate": 1.5114450783977579e-05,
+ "loss": 0.4849,
+ "step": 12817
+ },
+ {
+ "epoch": 34.926430517711175,
+ "grad_norm": 8.817684173583984,
+ "learning_rate": 1.5113692422331406e-05,
+ "loss": 0.446,
+ "step": 12818
+ },
+ {
+ "epoch": 34.9291553133515,
+ "grad_norm": 6.351326942443848,
+ "learning_rate": 1.511293402085996e-05,
+ "loss": 0.4822,
+ "step": 12819
+ },
+ {
+ "epoch": 34.93188010899183,
+ "grad_norm": 14.489463806152344,
+ "learning_rate": 1.5112175579569149e-05,
+ "loss": 0.3636,
+ "step": 12820
+ },
+ {
+ "epoch": 34.93460490463215,
+ "grad_norm": 7.836480617523193,
+ "learning_rate": 1.5111417098464879e-05,
+ "loss": 0.3438,
+ "step": 12821
+ },
+ {
+ "epoch": 34.93732970027248,
+ "grad_norm": 7.352789878845215,
+ "learning_rate": 1.5110658577553058e-05,
+ "loss": 0.5103,
+ "step": 12822
+ },
+ {
+ "epoch": 34.940054495912804,
+ "grad_norm": 6.39596700668335,
+ "learning_rate": 1.510990001683959e-05,
+ "loss": 0.2738,
+ "step": 12823
+ },
+ {
+ "epoch": 34.94277929155314,
+ "grad_norm": 6.166970729827881,
+ "learning_rate": 1.5109141416330386e-05,
+ "loss": 0.3428,
+ "step": 12824
+ },
+ {
+ "epoch": 34.94550408719346,
+ "grad_norm": 5.944089889526367,
+ "learning_rate": 1.5108382776031354e-05,
+ "loss": 0.4155,
+ "step": 12825
+ },
+ {
+ "epoch": 34.94822888283379,
+ "grad_norm": 6.506803512573242,
+ "learning_rate": 1.51076240959484e-05,
+ "loss": 0.294,
+ "step": 12826
+ },
+ {
+ "epoch": 34.950953678474114,
+ "grad_norm": 7.878262519836426,
+ "learning_rate": 1.5106865376087437e-05,
+ "loss": 0.4139,
+ "step": 12827
+ },
+ {
+ "epoch": 34.95367847411444,
+ "grad_norm": 7.29544734954834,
+ "learning_rate": 1.5106106616454371e-05,
+ "loss": 0.3418,
+ "step": 12828
+ },
+ {
+ "epoch": 34.956403269754766,
+ "grad_norm": 6.37436580657959,
+ "learning_rate": 1.5105347817055106e-05,
+ "loss": 0.3661,
+ "step": 12829
+ },
+ {
+ "epoch": 34.95912806539509,
+ "grad_norm": 6.1794633865356445,
+ "learning_rate": 1.510458897789556e-05,
+ "loss": 0.434,
+ "step": 12830
+ },
+ {
+ "epoch": 34.961852861035425,
+ "grad_norm": 7.422924518585205,
+ "learning_rate": 1.5103830098981637e-05,
+ "loss": 0.3311,
+ "step": 12831
+ },
+ {
+ "epoch": 34.96457765667575,
+ "grad_norm": 6.644876480102539,
+ "learning_rate": 1.5103071180319254e-05,
+ "loss": 0.337,
+ "step": 12832
+ },
+ {
+ "epoch": 34.967302452316076,
+ "grad_norm": 7.06466007232666,
+ "learning_rate": 1.510231222191431e-05,
+ "loss": 0.3248,
+ "step": 12833
+ },
+ {
+ "epoch": 34.9700272479564,
+ "grad_norm": 6.119283676147461,
+ "learning_rate": 1.5101553223772728e-05,
+ "loss": 0.2797,
+ "step": 12834
+ },
+ {
+ "epoch": 34.97275204359673,
+ "grad_norm": 8.348386764526367,
+ "learning_rate": 1.5100794185900411e-05,
+ "loss": 0.3005,
+ "step": 12835
+ },
+ {
+ "epoch": 34.97547683923706,
+ "grad_norm": 6.874670505523682,
+ "learning_rate": 1.5100035108303278e-05,
+ "loss": 0.4833,
+ "step": 12836
+ },
+ {
+ "epoch": 34.97820163487739,
+ "grad_norm": 6.618953227996826,
+ "learning_rate": 1.509927599098723e-05,
+ "loss": 0.2442,
+ "step": 12837
+ },
+ {
+ "epoch": 34.98092643051771,
+ "grad_norm": 10.766705513000488,
+ "learning_rate": 1.5098516833958187e-05,
+ "loss": 0.3206,
+ "step": 12838
+ },
+ {
+ "epoch": 34.98365122615804,
+ "grad_norm": 9.001296997070312,
+ "learning_rate": 1.509775763722206e-05,
+ "loss": 0.4433,
+ "step": 12839
+ },
+ {
+ "epoch": 34.986376021798364,
+ "grad_norm": 8.988316535949707,
+ "learning_rate": 1.5096998400784756e-05,
+ "loss": 0.4554,
+ "step": 12840
+ },
+ {
+ "epoch": 34.98910081743869,
+ "grad_norm": 6.756176948547363,
+ "learning_rate": 1.5096239124652197e-05,
+ "loss": 0.2471,
+ "step": 12841
+ },
+ {
+ "epoch": 34.991825613079016,
+ "grad_norm": 7.477931022644043,
+ "learning_rate": 1.5095479808830292e-05,
+ "loss": 0.7057,
+ "step": 12842
+ },
+ {
+ "epoch": 34.99455040871935,
+ "grad_norm": 9.176545143127441,
+ "learning_rate": 1.5094720453324952e-05,
+ "loss": 0.3825,
+ "step": 12843
+ },
+ {
+ "epoch": 34.997275204359674,
+ "grad_norm": 7.517789363861084,
+ "learning_rate": 1.5093961058142095e-05,
+ "loss": 0.4518,
+ "step": 12844
+ },
+ {
+ "epoch": 35.0,
+ "grad_norm": 6.629086017608643,
+ "learning_rate": 1.5093201623287631e-05,
+ "loss": 0.3144,
+ "step": 12845
+ },
+ {
+ "epoch": 35.002724795640326,
+ "grad_norm": 5.785049915313721,
+ "learning_rate": 1.509244214876748e-05,
+ "loss": 0.4406,
+ "step": 12846
+ },
+ {
+ "epoch": 35.00544959128065,
+ "grad_norm": 5.573185443878174,
+ "learning_rate": 1.5091682634587547e-05,
+ "loss": 0.3493,
+ "step": 12847
+ },
+ {
+ "epoch": 35.00817438692098,
+ "grad_norm": 7.0667548179626465,
+ "learning_rate": 1.509092308075376e-05,
+ "loss": 0.3315,
+ "step": 12848
+ },
+ {
+ "epoch": 35.01089918256131,
+ "grad_norm": 8.357725143432617,
+ "learning_rate": 1.5090163487272027e-05,
+ "loss": 0.3625,
+ "step": 12849
+ },
+ {
+ "epoch": 35.013623978201636,
+ "grad_norm": 5.935133457183838,
+ "learning_rate": 1.5089403854148261e-05,
+ "loss": 0.2876,
+ "step": 12850
+ },
+ {
+ "epoch": 35.01634877384196,
+ "grad_norm": 7.409773826599121,
+ "learning_rate": 1.5088644181388386e-05,
+ "loss": 0.191,
+ "step": 12851
+ },
+ {
+ "epoch": 35.01907356948229,
+ "grad_norm": 6.038036823272705,
+ "learning_rate": 1.508788446899831e-05,
+ "loss": 0.4126,
+ "step": 12852
+ },
+ {
+ "epoch": 35.02179836512261,
+ "grad_norm": 5.311971187591553,
+ "learning_rate": 1.5087124716983956e-05,
+ "loss": 0.2346,
+ "step": 12853
+ },
+ {
+ "epoch": 35.02452316076294,
+ "grad_norm": 8.31474494934082,
+ "learning_rate": 1.5086364925351238e-05,
+ "loss": 0.2484,
+ "step": 12854
+ },
+ {
+ "epoch": 35.02724795640327,
+ "grad_norm": 6.290774822235107,
+ "learning_rate": 1.5085605094106072e-05,
+ "loss": 0.374,
+ "step": 12855
+ },
+ {
+ "epoch": 35.0299727520436,
+ "grad_norm": 6.906851768493652,
+ "learning_rate": 1.5084845223254381e-05,
+ "loss": 0.2697,
+ "step": 12856
+ },
+ {
+ "epoch": 35.032697547683924,
+ "grad_norm": 6.9600982666015625,
+ "learning_rate": 1.5084085312802075e-05,
+ "loss": 0.2094,
+ "step": 12857
+ },
+ {
+ "epoch": 35.03542234332425,
+ "grad_norm": 8.362553596496582,
+ "learning_rate": 1.5083325362755077e-05,
+ "loss": 0.3174,
+ "step": 12858
+ },
+ {
+ "epoch": 35.038147138964575,
+ "grad_norm": 6.994814872741699,
+ "learning_rate": 1.5082565373119307e-05,
+ "loss": 0.2646,
+ "step": 12859
+ },
+ {
+ "epoch": 35.0408719346049,
+ "grad_norm": 5.494656562805176,
+ "learning_rate": 1.508180534390068e-05,
+ "loss": 0.3244,
+ "step": 12860
+ },
+ {
+ "epoch": 35.043596730245234,
+ "grad_norm": 6.103918552398682,
+ "learning_rate": 1.5081045275105117e-05,
+ "loss": 0.3241,
+ "step": 12861
+ },
+ {
+ "epoch": 35.04632152588556,
+ "grad_norm": 5.130848407745361,
+ "learning_rate": 1.5080285166738535e-05,
+ "loss": 0.3754,
+ "step": 12862
+ },
+ {
+ "epoch": 35.049046321525886,
+ "grad_norm": 5.91086483001709,
+ "learning_rate": 1.5079525018806856e-05,
+ "loss": 0.2361,
+ "step": 12863
+ },
+ {
+ "epoch": 35.05177111716621,
+ "grad_norm": 5.534972667694092,
+ "learning_rate": 1.5078764831316002e-05,
+ "loss": 0.2357,
+ "step": 12864
+ },
+ {
+ "epoch": 35.05449591280654,
+ "grad_norm": 13.435774803161621,
+ "learning_rate": 1.507800460427189e-05,
+ "loss": 0.3418,
+ "step": 12865
+ },
+ {
+ "epoch": 35.05722070844686,
+ "grad_norm": 6.177347660064697,
+ "learning_rate": 1.5077244337680439e-05,
+ "loss": 0.2652,
+ "step": 12866
+ },
+ {
+ "epoch": 35.059945504087196,
+ "grad_norm": 5.603326320648193,
+ "learning_rate": 1.5076484031547578e-05,
+ "loss": 0.5273,
+ "step": 12867
+ },
+ {
+ "epoch": 35.06267029972752,
+ "grad_norm": 7.058253765106201,
+ "learning_rate": 1.5075723685879218e-05,
+ "loss": 0.3388,
+ "step": 12868
+ },
+ {
+ "epoch": 35.06539509536785,
+ "grad_norm": 6.102175235748291,
+ "learning_rate": 1.5074963300681286e-05,
+ "loss": 0.2981,
+ "step": 12869
+ },
+ {
+ "epoch": 35.06811989100817,
+ "grad_norm": 5.3113203048706055,
+ "learning_rate": 1.5074202875959704e-05,
+ "loss": 0.2601,
+ "step": 12870
+ },
+ {
+ "epoch": 35.0708446866485,
+ "grad_norm": 5.491559028625488,
+ "learning_rate": 1.5073442411720397e-05,
+ "loss": 0.4017,
+ "step": 12871
+ },
+ {
+ "epoch": 35.073569482288825,
+ "grad_norm": 7.598811626434326,
+ "learning_rate": 1.5072681907969277e-05,
+ "loss": 0.3106,
+ "step": 12872
+ },
+ {
+ "epoch": 35.07629427792916,
+ "grad_norm": 9.770064353942871,
+ "learning_rate": 1.5071921364712278e-05,
+ "loss": 0.2632,
+ "step": 12873
+ },
+ {
+ "epoch": 35.079019073569484,
+ "grad_norm": 9.12311840057373,
+ "learning_rate": 1.5071160781955316e-05,
+ "loss": 0.3592,
+ "step": 12874
+ },
+ {
+ "epoch": 35.08174386920981,
+ "grad_norm": 6.149101734161377,
+ "learning_rate": 1.5070400159704317e-05,
+ "loss": 0.3208,
+ "step": 12875
+ },
+ {
+ "epoch": 35.084468664850135,
+ "grad_norm": 5.999884128570557,
+ "learning_rate": 1.5069639497965205e-05,
+ "loss": 0.2534,
+ "step": 12876
+ },
+ {
+ "epoch": 35.08719346049046,
+ "grad_norm": 8.41357421875,
+ "learning_rate": 1.5068878796743907e-05,
+ "loss": 0.3031,
+ "step": 12877
+ },
+ {
+ "epoch": 35.08991825613079,
+ "grad_norm": 7.803460597991943,
+ "learning_rate": 1.5068118056046342e-05,
+ "loss": 0.2934,
+ "step": 12878
+ },
+ {
+ "epoch": 35.09264305177112,
+ "grad_norm": 13.252748489379883,
+ "learning_rate": 1.5067357275878438e-05,
+ "loss": 0.3236,
+ "step": 12879
+ },
+ {
+ "epoch": 35.095367847411445,
+ "grad_norm": 5.52808141708374,
+ "learning_rate": 1.5066596456246116e-05,
+ "loss": 0.2805,
+ "step": 12880
+ },
+ {
+ "epoch": 35.09809264305177,
+ "grad_norm": 6.531493663787842,
+ "learning_rate": 1.5065835597155305e-05,
+ "loss": 0.3039,
+ "step": 12881
+ },
+ {
+ "epoch": 35.1008174386921,
+ "grad_norm": 6.289060592651367,
+ "learning_rate": 1.506507469861193e-05,
+ "loss": 0.2648,
+ "step": 12882
+ },
+ {
+ "epoch": 35.10354223433242,
+ "grad_norm": 5.346847057342529,
+ "learning_rate": 1.5064313760621913e-05,
+ "loss": 0.1923,
+ "step": 12883
+ },
+ {
+ "epoch": 35.10626702997275,
+ "grad_norm": 6.987293243408203,
+ "learning_rate": 1.5063552783191186e-05,
+ "loss": 0.3647,
+ "step": 12884
+ },
+ {
+ "epoch": 35.10899182561308,
+ "grad_norm": 6.071861267089844,
+ "learning_rate": 1.5062791766325676e-05,
+ "loss": 0.2628,
+ "step": 12885
+ },
+ {
+ "epoch": 35.11171662125341,
+ "grad_norm": 6.821843147277832,
+ "learning_rate": 1.5062030710031304e-05,
+ "loss": 0.2214,
+ "step": 12886
+ },
+ {
+ "epoch": 35.11444141689373,
+ "grad_norm": 6.0386643409729,
+ "learning_rate": 1.5061269614314e-05,
+ "loss": 0.3656,
+ "step": 12887
+ },
+ {
+ "epoch": 35.11716621253406,
+ "grad_norm": 12.071297645568848,
+ "learning_rate": 1.506050847917969e-05,
+ "loss": 0.2701,
+ "step": 12888
+ },
+ {
+ "epoch": 35.119891008174385,
+ "grad_norm": 8.566832542419434,
+ "learning_rate": 1.5059747304634304e-05,
+ "loss": 0.4954,
+ "step": 12889
+ },
+ {
+ "epoch": 35.12261580381471,
+ "grad_norm": 6.731941223144531,
+ "learning_rate": 1.5058986090683767e-05,
+ "loss": 0.4046,
+ "step": 12890
+ },
+ {
+ "epoch": 35.12534059945504,
+ "grad_norm": 5.576921463012695,
+ "learning_rate": 1.5058224837334012e-05,
+ "loss": 0.3425,
+ "step": 12891
+ },
+ {
+ "epoch": 35.12806539509537,
+ "grad_norm": 7.817747592926025,
+ "learning_rate": 1.505746354459096e-05,
+ "loss": 0.3054,
+ "step": 12892
+ },
+ {
+ "epoch": 35.130790190735695,
+ "grad_norm": 5.836747646331787,
+ "learning_rate": 1.5056702212460547e-05,
+ "loss": 0.1724,
+ "step": 12893
+ },
+ {
+ "epoch": 35.13351498637602,
+ "grad_norm": 7.261024475097656,
+ "learning_rate": 1.5055940840948702e-05,
+ "loss": 0.2533,
+ "step": 12894
+ },
+ {
+ "epoch": 35.13623978201635,
+ "grad_norm": 6.892082691192627,
+ "learning_rate": 1.5055179430061354e-05,
+ "loss": 0.3005,
+ "step": 12895
+ },
+ {
+ "epoch": 35.13896457765667,
+ "grad_norm": 11.652900695800781,
+ "learning_rate": 1.5054417979804426e-05,
+ "loss": 0.2771,
+ "step": 12896
+ },
+ {
+ "epoch": 35.141689373297005,
+ "grad_norm": 6.214851379394531,
+ "learning_rate": 1.5053656490183856e-05,
+ "loss": 0.2691,
+ "step": 12897
+ },
+ {
+ "epoch": 35.14441416893733,
+ "grad_norm": 9.134818077087402,
+ "learning_rate": 1.5052894961205573e-05,
+ "loss": 0.3449,
+ "step": 12898
+ },
+ {
+ "epoch": 35.14713896457766,
+ "grad_norm": 6.546474933624268,
+ "learning_rate": 1.5052133392875505e-05,
+ "loss": 0.1782,
+ "step": 12899
+ },
+ {
+ "epoch": 35.14986376021798,
+ "grad_norm": 6.9917988777160645,
+ "learning_rate": 1.5051371785199585e-05,
+ "loss": 0.3135,
+ "step": 12900
+ },
+ {
+ "epoch": 35.15258855585831,
+ "grad_norm": 6.644484043121338,
+ "learning_rate": 1.5050610138183746e-05,
+ "loss": 0.3666,
+ "step": 12901
+ },
+ {
+ "epoch": 35.155313351498634,
+ "grad_norm": 5.416781902313232,
+ "learning_rate": 1.5049848451833912e-05,
+ "loss": 0.2019,
+ "step": 12902
+ },
+ {
+ "epoch": 35.15803814713897,
+ "grad_norm": 8.030413627624512,
+ "learning_rate": 1.5049086726156028e-05,
+ "loss": 0.2774,
+ "step": 12903
+ },
+ {
+ "epoch": 35.16076294277929,
+ "grad_norm": 6.396627902984619,
+ "learning_rate": 1.5048324961156016e-05,
+ "loss": 0.267,
+ "step": 12904
+ },
+ {
+ "epoch": 35.16348773841962,
+ "grad_norm": 5.942184925079346,
+ "learning_rate": 1.5047563156839812e-05,
+ "loss": 0.2117,
+ "step": 12905
+ },
+ {
+ "epoch": 35.166212534059945,
+ "grad_norm": 6.416858196258545,
+ "learning_rate": 1.5046801313213349e-05,
+ "loss": 0.3,
+ "step": 12906
+ },
+ {
+ "epoch": 35.16893732970027,
+ "grad_norm": 6.120514869689941,
+ "learning_rate": 1.5046039430282559e-05,
+ "loss": 0.4378,
+ "step": 12907
+ },
+ {
+ "epoch": 35.171662125340596,
+ "grad_norm": 8.632964134216309,
+ "learning_rate": 1.5045277508053376e-05,
+ "loss": 0.236,
+ "step": 12908
+ },
+ {
+ "epoch": 35.17438692098093,
+ "grad_norm": 7.408965110778809,
+ "learning_rate": 1.5044515546531733e-05,
+ "loss": 0.3813,
+ "step": 12909
+ },
+ {
+ "epoch": 35.177111716621255,
+ "grad_norm": 7.03118371963501,
+ "learning_rate": 1.5043753545723568e-05,
+ "loss": 0.2874,
+ "step": 12910
+ },
+ {
+ "epoch": 35.17983651226158,
+ "grad_norm": 7.311297416687012,
+ "learning_rate": 1.5042991505634812e-05,
+ "loss": 0.3885,
+ "step": 12911
+ },
+ {
+ "epoch": 35.182561307901906,
+ "grad_norm": 6.356116771697998,
+ "learning_rate": 1.50422294262714e-05,
+ "loss": 0.2529,
+ "step": 12912
+ },
+ {
+ "epoch": 35.18528610354223,
+ "grad_norm": 7.108633041381836,
+ "learning_rate": 1.5041467307639268e-05,
+ "loss": 0.2782,
+ "step": 12913
+ },
+ {
+ "epoch": 35.18801089918256,
+ "grad_norm": 47.94351577758789,
+ "learning_rate": 1.504070514974435e-05,
+ "loss": 0.3183,
+ "step": 12914
+ },
+ {
+ "epoch": 35.19073569482289,
+ "grad_norm": 5.8043365478515625,
+ "learning_rate": 1.5039942952592585e-05,
+ "loss": 0.2344,
+ "step": 12915
+ },
+ {
+ "epoch": 35.19346049046322,
+ "grad_norm": 9.831428527832031,
+ "learning_rate": 1.5039180716189903e-05,
+ "loss": 0.2695,
+ "step": 12916
+ },
+ {
+ "epoch": 35.19618528610354,
+ "grad_norm": 6.711259365081787,
+ "learning_rate": 1.5038418440542247e-05,
+ "loss": 0.2715,
+ "step": 12917
+ },
+ {
+ "epoch": 35.19891008174387,
+ "grad_norm": 7.609066009521484,
+ "learning_rate": 1.5037656125655543e-05,
+ "loss": 0.468,
+ "step": 12918
+ },
+ {
+ "epoch": 35.201634877384194,
+ "grad_norm": 6.482602119445801,
+ "learning_rate": 1.5036893771535743e-05,
+ "loss": 0.4118,
+ "step": 12919
+ },
+ {
+ "epoch": 35.20435967302452,
+ "grad_norm": 8.60822868347168,
+ "learning_rate": 1.5036131378188774e-05,
+ "loss": 0.4206,
+ "step": 12920
+ },
+ {
+ "epoch": 35.20708446866485,
+ "grad_norm": 7.4198689460754395,
+ "learning_rate": 1.5035368945620578e-05,
+ "loss": 0.332,
+ "step": 12921
+ },
+ {
+ "epoch": 35.20980926430518,
+ "grad_norm": 7.01581335067749,
+ "learning_rate": 1.503460647383709e-05,
+ "loss": 0.3773,
+ "step": 12922
+ },
+ {
+ "epoch": 35.212534059945504,
+ "grad_norm": 7.587332725524902,
+ "learning_rate": 1.5033843962844246e-05,
+ "loss": 0.3295,
+ "step": 12923
+ },
+ {
+ "epoch": 35.21525885558583,
+ "grad_norm": 10.930032730102539,
+ "learning_rate": 1.503308141264799e-05,
+ "loss": 0.6685,
+ "step": 12924
+ },
+ {
+ "epoch": 35.217983651226156,
+ "grad_norm": 6.387872695922852,
+ "learning_rate": 1.5032318823254257e-05,
+ "loss": 0.3438,
+ "step": 12925
+ },
+ {
+ "epoch": 35.22070844686648,
+ "grad_norm": 11.000805854797363,
+ "learning_rate": 1.5031556194668988e-05,
+ "loss": 0.3216,
+ "step": 12926
+ },
+ {
+ "epoch": 35.223433242506815,
+ "grad_norm": 12.715154647827148,
+ "learning_rate": 1.5030793526898118e-05,
+ "loss": 0.2976,
+ "step": 12927
+ },
+ {
+ "epoch": 35.22615803814714,
+ "grad_norm": 6.091267108917236,
+ "learning_rate": 1.5030030819947592e-05,
+ "loss": 0.3266,
+ "step": 12928
+ },
+ {
+ "epoch": 35.228882833787466,
+ "grad_norm": 7.640657901763916,
+ "learning_rate": 1.5029268073823349e-05,
+ "loss": 0.4821,
+ "step": 12929
+ },
+ {
+ "epoch": 35.23160762942779,
+ "grad_norm": 25.278005599975586,
+ "learning_rate": 1.5028505288531325e-05,
+ "loss": 0.2789,
+ "step": 12930
+ },
+ {
+ "epoch": 35.23433242506812,
+ "grad_norm": 9.08450984954834,
+ "learning_rate": 1.5027742464077468e-05,
+ "loss": 0.3575,
+ "step": 12931
+ },
+ {
+ "epoch": 35.237057220708444,
+ "grad_norm": 18.064441680908203,
+ "learning_rate": 1.502697960046771e-05,
+ "loss": 0.5448,
+ "step": 12932
+ },
+ {
+ "epoch": 35.23978201634878,
+ "grad_norm": 9.034799575805664,
+ "learning_rate": 1.5026216697708002e-05,
+ "loss": 0.425,
+ "step": 12933
+ },
+ {
+ "epoch": 35.2425068119891,
+ "grad_norm": 9.033137321472168,
+ "learning_rate": 1.5025453755804275e-05,
+ "loss": 0.4044,
+ "step": 12934
+ },
+ {
+ "epoch": 35.24523160762943,
+ "grad_norm": 6.852743625640869,
+ "learning_rate": 1.5024690774762478e-05,
+ "loss": 0.2435,
+ "step": 12935
+ },
+ {
+ "epoch": 35.247956403269754,
+ "grad_norm": 6.676074981689453,
+ "learning_rate": 1.5023927754588551e-05,
+ "loss": 0.2675,
+ "step": 12936
+ },
+ {
+ "epoch": 35.25068119891008,
+ "grad_norm": 5.360869884490967,
+ "learning_rate": 1.5023164695288435e-05,
+ "loss": 0.4157,
+ "step": 12937
+ },
+ {
+ "epoch": 35.253405994550405,
+ "grad_norm": 7.680437088012695,
+ "learning_rate": 1.502240159686808e-05,
+ "loss": 0.3692,
+ "step": 12938
+ },
+ {
+ "epoch": 35.25613079019074,
+ "grad_norm": 8.144967079162598,
+ "learning_rate": 1.5021638459333417e-05,
+ "loss": 0.3655,
+ "step": 12939
+ },
+ {
+ "epoch": 35.258855585831064,
+ "grad_norm": 7.062442779541016,
+ "learning_rate": 1.5020875282690392e-05,
+ "loss": 0.2522,
+ "step": 12940
+ },
+ {
+ "epoch": 35.26158038147139,
+ "grad_norm": 7.588070869445801,
+ "learning_rate": 1.502011206694496e-05,
+ "loss": 0.3133,
+ "step": 12941
+ },
+ {
+ "epoch": 35.264305177111716,
+ "grad_norm": 5.228339195251465,
+ "learning_rate": 1.5019348812103052e-05,
+ "loss": 0.276,
+ "step": 12942
+ },
+ {
+ "epoch": 35.26702997275204,
+ "grad_norm": 7.7266411781311035,
+ "learning_rate": 1.501858551817062e-05,
+ "loss": 0.2988,
+ "step": 12943
+ },
+ {
+ "epoch": 35.26975476839237,
+ "grad_norm": 9.450374603271484,
+ "learning_rate": 1.5017822185153602e-05,
+ "loss": 0.3086,
+ "step": 12944
+ },
+ {
+ "epoch": 35.2724795640327,
+ "grad_norm": 8.649518966674805,
+ "learning_rate": 1.5017058813057948e-05,
+ "loss": 0.4817,
+ "step": 12945
+ },
+ {
+ "epoch": 35.275204359673026,
+ "grad_norm": 7.016547679901123,
+ "learning_rate": 1.5016295401889602e-05,
+ "loss": 0.5093,
+ "step": 12946
+ },
+ {
+ "epoch": 35.27792915531335,
+ "grad_norm": 15.65822982788086,
+ "learning_rate": 1.501553195165451e-05,
+ "loss": 0.2648,
+ "step": 12947
+ },
+ {
+ "epoch": 35.28065395095368,
+ "grad_norm": 7.363132953643799,
+ "learning_rate": 1.5014768462358613e-05,
+ "loss": 0.3209,
+ "step": 12948
+ },
+ {
+ "epoch": 35.283378746594,
+ "grad_norm": 8.958174705505371,
+ "learning_rate": 1.5014004934007864e-05,
+ "loss": 0.3528,
+ "step": 12949
+ },
+ {
+ "epoch": 35.28610354223433,
+ "grad_norm": 6.925446033477783,
+ "learning_rate": 1.5013241366608202e-05,
+ "loss": 0.2886,
+ "step": 12950
+ },
+ {
+ "epoch": 35.28882833787466,
+ "grad_norm": 6.035683631896973,
+ "learning_rate": 1.5012477760165581e-05,
+ "loss": 0.2489,
+ "step": 12951
+ },
+ {
+ "epoch": 35.29155313351499,
+ "grad_norm": 7.717945575714111,
+ "learning_rate": 1.5011714114685942e-05,
+ "loss": 0.5134,
+ "step": 12952
+ },
+ {
+ "epoch": 35.294277929155314,
+ "grad_norm": 6.433282375335693,
+ "learning_rate": 1.5010950430175237e-05,
+ "loss": 0.2674,
+ "step": 12953
+ },
+ {
+ "epoch": 35.29700272479564,
+ "grad_norm": 7.275332450866699,
+ "learning_rate": 1.5010186706639412e-05,
+ "loss": 0.3405,
+ "step": 12954
+ },
+ {
+ "epoch": 35.299727520435965,
+ "grad_norm": 6.948375225067139,
+ "learning_rate": 1.5009422944084411e-05,
+ "loss": 0.3185,
+ "step": 12955
+ },
+ {
+ "epoch": 35.30245231607629,
+ "grad_norm": 9.078147888183594,
+ "learning_rate": 1.500865914251619e-05,
+ "loss": 0.4474,
+ "step": 12956
+ },
+ {
+ "epoch": 35.305177111716624,
+ "grad_norm": 7.218676567077637,
+ "learning_rate": 1.500789530194069e-05,
+ "loss": 0.3599,
+ "step": 12957
+ },
+ {
+ "epoch": 35.30790190735695,
+ "grad_norm": 8.05556869506836,
+ "learning_rate": 1.5007131422363864e-05,
+ "loss": 0.4174,
+ "step": 12958
+ },
+ {
+ "epoch": 35.310626702997276,
+ "grad_norm": 8.176007270812988,
+ "learning_rate": 1.5006367503791657e-05,
+ "loss": 0.3093,
+ "step": 12959
+ },
+ {
+ "epoch": 35.3133514986376,
+ "grad_norm": 8.308642387390137,
+ "learning_rate": 1.5005603546230024e-05,
+ "loss": 0.2853,
+ "step": 12960
+ },
+ {
+ "epoch": 35.31607629427793,
+ "grad_norm": 7.603718280792236,
+ "learning_rate": 1.5004839549684907e-05,
+ "loss": 0.2453,
+ "step": 12961
+ },
+ {
+ "epoch": 35.31880108991825,
+ "grad_norm": 8.311637878417969,
+ "learning_rate": 1.5004075514162264e-05,
+ "loss": 0.3121,
+ "step": 12962
+ },
+ {
+ "epoch": 35.321525885558586,
+ "grad_norm": 6.768898963928223,
+ "learning_rate": 1.5003311439668041e-05,
+ "loss": 0.3403,
+ "step": 12963
+ },
+ {
+ "epoch": 35.32425068119891,
+ "grad_norm": 9.002680778503418,
+ "learning_rate": 1.5002547326208193e-05,
+ "loss": 0.3454,
+ "step": 12964
+ },
+ {
+ "epoch": 35.32697547683924,
+ "grad_norm": 6.46567964553833,
+ "learning_rate": 1.5001783173788661e-05,
+ "loss": 0.2999,
+ "step": 12965
+ },
+ {
+ "epoch": 35.32970027247956,
+ "grad_norm": 8.28508472442627,
+ "learning_rate": 1.5001018982415407e-05,
+ "loss": 0.2375,
+ "step": 12966
+ },
+ {
+ "epoch": 35.33242506811989,
+ "grad_norm": 7.745180130004883,
+ "learning_rate": 1.5000254752094376e-05,
+ "loss": 0.3192,
+ "step": 12967
+ },
+ {
+ "epoch": 35.335149863760215,
+ "grad_norm": 6.4640913009643555,
+ "learning_rate": 1.4999490482831526e-05,
+ "loss": 0.3266,
+ "step": 12968
+ },
+ {
+ "epoch": 35.33787465940055,
+ "grad_norm": 6.967803001403809,
+ "learning_rate": 1.49987261746328e-05,
+ "loss": 0.2811,
+ "step": 12969
+ },
+ {
+ "epoch": 35.34059945504087,
+ "grad_norm": 6.355371952056885,
+ "learning_rate": 1.4997961827504156e-05,
+ "loss": 0.5119,
+ "step": 12970
+ },
+ {
+ "epoch": 35.3433242506812,
+ "grad_norm": 6.229894638061523,
+ "learning_rate": 1.499719744145155e-05,
+ "loss": 0.48,
+ "step": 12971
+ },
+ {
+ "epoch": 35.346049046321525,
+ "grad_norm": 6.700027942657471,
+ "learning_rate": 1.499643301648093e-05,
+ "loss": 0.3835,
+ "step": 12972
+ },
+ {
+ "epoch": 35.34877384196185,
+ "grad_norm": 6.299387454986572,
+ "learning_rate": 1.4995668552598249e-05,
+ "loss": 0.3477,
+ "step": 12973
+ },
+ {
+ "epoch": 35.35149863760218,
+ "grad_norm": 7.223231315612793,
+ "learning_rate": 1.4994904049809463e-05,
+ "loss": 0.3934,
+ "step": 12974
+ },
+ {
+ "epoch": 35.35422343324251,
+ "grad_norm": 6.085124969482422,
+ "learning_rate": 1.4994139508120524e-05,
+ "loss": 0.3353,
+ "step": 12975
+ },
+ {
+ "epoch": 35.356948228882835,
+ "grad_norm": 9.593476295471191,
+ "learning_rate": 1.499337492753739e-05,
+ "loss": 0.4173,
+ "step": 12976
+ },
+ {
+ "epoch": 35.35967302452316,
+ "grad_norm": 7.308346748352051,
+ "learning_rate": 1.4992610308066008e-05,
+ "loss": 0.3616,
+ "step": 12977
+ },
+ {
+ "epoch": 35.36239782016349,
+ "grad_norm": 8.746541976928711,
+ "learning_rate": 1.499184564971234e-05,
+ "loss": 0.3167,
+ "step": 12978
+ },
+ {
+ "epoch": 35.36512261580381,
+ "grad_norm": 8.048002243041992,
+ "learning_rate": 1.4991080952482337e-05,
+ "loss": 0.2381,
+ "step": 12979
+ },
+ {
+ "epoch": 35.36784741144414,
+ "grad_norm": 7.211552619934082,
+ "learning_rate": 1.4990316216381961e-05,
+ "loss": 0.2842,
+ "step": 12980
+ },
+ {
+ "epoch": 35.37057220708447,
+ "grad_norm": 6.82273530960083,
+ "learning_rate": 1.4989551441417159e-05,
+ "loss": 0.4873,
+ "step": 12981
+ },
+ {
+ "epoch": 35.3732970027248,
+ "grad_norm": 7.440096378326416,
+ "learning_rate": 1.4988786627593891e-05,
+ "loss": 0.428,
+ "step": 12982
+ },
+ {
+ "epoch": 35.37602179836512,
+ "grad_norm": 6.173402309417725,
+ "learning_rate": 1.4988021774918116e-05,
+ "loss": 0.3199,
+ "step": 12983
+ },
+ {
+ "epoch": 35.37874659400545,
+ "grad_norm": 7.369758605957031,
+ "learning_rate": 1.4987256883395786e-05,
+ "loss": 0.2651,
+ "step": 12984
+ },
+ {
+ "epoch": 35.381471389645775,
+ "grad_norm": 6.719857692718506,
+ "learning_rate": 1.498649195303286e-05,
+ "loss": 0.4166,
+ "step": 12985
+ },
+ {
+ "epoch": 35.3841961852861,
+ "grad_norm": 7.939483642578125,
+ "learning_rate": 1.4985726983835296e-05,
+ "loss": 0.3062,
+ "step": 12986
+ },
+ {
+ "epoch": 35.38692098092643,
+ "grad_norm": 8.635056495666504,
+ "learning_rate": 1.498496197580905e-05,
+ "loss": 0.3906,
+ "step": 12987
+ },
+ {
+ "epoch": 35.38964577656676,
+ "grad_norm": 5.695560455322266,
+ "learning_rate": 1.498419692896008e-05,
+ "loss": 0.2885,
+ "step": 12988
+ },
+ {
+ "epoch": 35.392370572207085,
+ "grad_norm": 12.678315162658691,
+ "learning_rate": 1.4983431843294345e-05,
+ "loss": 0.2282,
+ "step": 12989
+ },
+ {
+ "epoch": 35.39509536784741,
+ "grad_norm": 5.157857894897461,
+ "learning_rate": 1.4982666718817804e-05,
+ "loss": 0.2074,
+ "step": 12990
+ },
+ {
+ "epoch": 35.39782016348774,
+ "grad_norm": 7.161243438720703,
+ "learning_rate": 1.4981901555536414e-05,
+ "loss": 0.4799,
+ "step": 12991
+ },
+ {
+ "epoch": 35.40054495912806,
+ "grad_norm": 6.926211833953857,
+ "learning_rate": 1.4981136353456135e-05,
+ "loss": 0.3473,
+ "step": 12992
+ },
+ {
+ "epoch": 35.403269754768395,
+ "grad_norm": 5.929111003875732,
+ "learning_rate": 1.4980371112582927e-05,
+ "loss": 0.2735,
+ "step": 12993
+ },
+ {
+ "epoch": 35.40599455040872,
+ "grad_norm": 7.072702884674072,
+ "learning_rate": 1.497960583292275e-05,
+ "loss": 0.3306,
+ "step": 12994
+ },
+ {
+ "epoch": 35.40871934604905,
+ "grad_norm": 9.228020668029785,
+ "learning_rate": 1.497884051448156e-05,
+ "loss": 0.3293,
+ "step": 12995
+ },
+ {
+ "epoch": 35.41144414168937,
+ "grad_norm": 7.056519031524658,
+ "learning_rate": 1.4978075157265324e-05,
+ "loss": 0.3887,
+ "step": 12996
+ },
+ {
+ "epoch": 35.4141689373297,
+ "grad_norm": 5.909057140350342,
+ "learning_rate": 1.4977309761279997e-05,
+ "loss": 0.2881,
+ "step": 12997
+ },
+ {
+ "epoch": 35.416893732970024,
+ "grad_norm": 8.001152038574219,
+ "learning_rate": 1.4976544326531542e-05,
+ "loss": 0.3256,
+ "step": 12998
+ },
+ {
+ "epoch": 35.41961852861036,
+ "grad_norm": 7.966976642608643,
+ "learning_rate": 1.497577885302592e-05,
+ "loss": 0.3325,
+ "step": 12999
+ },
+ {
+ "epoch": 35.42234332425068,
+ "grad_norm": 7.403523921966553,
+ "learning_rate": 1.4975013340769094e-05,
+ "loss": 0.2838,
+ "step": 13000
+ },
+ {
+ "epoch": 35.42506811989101,
+ "grad_norm": 8.983705520629883,
+ "learning_rate": 1.497424778976702e-05,
+ "loss": 0.2521,
+ "step": 13001
+ },
+ {
+ "epoch": 35.427792915531334,
+ "grad_norm": 16.565153121948242,
+ "learning_rate": 1.4973482200025669e-05,
+ "loss": 0.395,
+ "step": 13002
+ },
+ {
+ "epoch": 35.43051771117166,
+ "grad_norm": 8.130942344665527,
+ "learning_rate": 1.4972716571550996e-05,
+ "loss": 0.3645,
+ "step": 13003
+ },
+ {
+ "epoch": 35.433242506811986,
+ "grad_norm": 6.450094223022461,
+ "learning_rate": 1.4971950904348966e-05,
+ "loss": 0.2584,
+ "step": 13004
+ },
+ {
+ "epoch": 35.43596730245232,
+ "grad_norm": 14.972867012023926,
+ "learning_rate": 1.4971185198425544e-05,
+ "loss": 0.3554,
+ "step": 13005
+ },
+ {
+ "epoch": 35.438692098092645,
+ "grad_norm": 8.811211585998535,
+ "learning_rate": 1.497041945378669e-05,
+ "loss": 0.4207,
+ "step": 13006
+ },
+ {
+ "epoch": 35.44141689373297,
+ "grad_norm": 10.867773056030273,
+ "learning_rate": 1.4969653670438372e-05,
+ "loss": 0.2978,
+ "step": 13007
+ },
+ {
+ "epoch": 35.444141689373296,
+ "grad_norm": 7.401322841644287,
+ "learning_rate": 1.496888784838655e-05,
+ "loss": 0.4389,
+ "step": 13008
+ },
+ {
+ "epoch": 35.44686648501362,
+ "grad_norm": 9.335734367370605,
+ "learning_rate": 1.4968121987637188e-05,
+ "loss": 0.4746,
+ "step": 13009
+ },
+ {
+ "epoch": 35.44959128065395,
+ "grad_norm": 12.53529167175293,
+ "learning_rate": 1.4967356088196252e-05,
+ "loss": 0.3506,
+ "step": 13010
+ },
+ {
+ "epoch": 35.45231607629428,
+ "grad_norm": 8.071320533752441,
+ "learning_rate": 1.496659015006971e-05,
+ "loss": 0.2522,
+ "step": 13011
+ },
+ {
+ "epoch": 35.45504087193461,
+ "grad_norm": 7.37003755569458,
+ "learning_rate": 1.4965824173263519e-05,
+ "loss": 0.2563,
+ "step": 13012
+ },
+ {
+ "epoch": 35.45776566757493,
+ "grad_norm": 6.280857563018799,
+ "learning_rate": 1.4965058157783651e-05,
+ "loss": 0.2775,
+ "step": 13013
+ },
+ {
+ "epoch": 35.46049046321526,
+ "grad_norm": 7.227498531341553,
+ "learning_rate": 1.4964292103636072e-05,
+ "loss": 0.3485,
+ "step": 13014
+ },
+ {
+ "epoch": 35.463215258855584,
+ "grad_norm": 7.105706691741943,
+ "learning_rate": 1.496352601082674e-05,
+ "loss": 0.3675,
+ "step": 13015
+ },
+ {
+ "epoch": 35.46594005449591,
+ "grad_norm": 7.031396865844727,
+ "learning_rate": 1.4962759879361635e-05,
+ "loss": 0.2964,
+ "step": 13016
+ },
+ {
+ "epoch": 35.46866485013624,
+ "grad_norm": 7.706293106079102,
+ "learning_rate": 1.4961993709246709e-05,
+ "loss": 0.4787,
+ "step": 13017
+ },
+ {
+ "epoch": 35.47138964577657,
+ "grad_norm": 6.265936374664307,
+ "learning_rate": 1.496122750048794e-05,
+ "loss": 0.2879,
+ "step": 13018
+ },
+ {
+ "epoch": 35.474114441416894,
+ "grad_norm": 9.70106315612793,
+ "learning_rate": 1.496046125309129e-05,
+ "loss": 0.3036,
+ "step": 13019
+ },
+ {
+ "epoch": 35.47683923705722,
+ "grad_norm": 9.175358772277832,
+ "learning_rate": 1.4959694967062727e-05,
+ "loss": 0.4707,
+ "step": 13020
+ },
+ {
+ "epoch": 35.479564032697546,
+ "grad_norm": 9.831436157226562,
+ "learning_rate": 1.4958928642408219e-05,
+ "loss": 0.3326,
+ "step": 13021
+ },
+ {
+ "epoch": 35.48228882833787,
+ "grad_norm": 18.738372802734375,
+ "learning_rate": 1.4958162279133734e-05,
+ "loss": 0.3783,
+ "step": 13022
+ },
+ {
+ "epoch": 35.485013623978205,
+ "grad_norm": 7.148810863494873,
+ "learning_rate": 1.4957395877245242e-05,
+ "loss": 0.4752,
+ "step": 13023
+ },
+ {
+ "epoch": 35.48773841961853,
+ "grad_norm": 8.935877799987793,
+ "learning_rate": 1.4956629436748712e-05,
+ "loss": 0.2694,
+ "step": 13024
+ },
+ {
+ "epoch": 35.490463215258856,
+ "grad_norm": 7.80535888671875,
+ "learning_rate": 1.4955862957650108e-05,
+ "loss": 0.4427,
+ "step": 13025
+ },
+ {
+ "epoch": 35.49318801089918,
+ "grad_norm": 8.087099075317383,
+ "learning_rate": 1.4955096439955404e-05,
+ "loss": 0.37,
+ "step": 13026
+ },
+ {
+ "epoch": 35.49591280653951,
+ "grad_norm": 6.996232032775879,
+ "learning_rate": 1.4954329883670569e-05,
+ "loss": 0.4202,
+ "step": 13027
+ },
+ {
+ "epoch": 35.49863760217983,
+ "grad_norm": 5.583734512329102,
+ "learning_rate": 1.4953563288801571e-05,
+ "loss": 0.3756,
+ "step": 13028
+ },
+ {
+ "epoch": 35.50136239782017,
+ "grad_norm": 12.677495002746582,
+ "learning_rate": 1.4952796655354383e-05,
+ "loss": 0.3509,
+ "step": 13029
+ },
+ {
+ "epoch": 35.50408719346049,
+ "grad_norm": 7.13171911239624,
+ "learning_rate": 1.4952029983334973e-05,
+ "loss": 0.2833,
+ "step": 13030
+ },
+ {
+ "epoch": 35.50681198910082,
+ "grad_norm": 9.175862312316895,
+ "learning_rate": 1.4951263272749313e-05,
+ "loss": 0.4503,
+ "step": 13031
+ },
+ {
+ "epoch": 35.509536784741144,
+ "grad_norm": 40.1395149230957,
+ "learning_rate": 1.4950496523603373e-05,
+ "loss": 0.2751,
+ "step": 13032
+ },
+ {
+ "epoch": 35.51226158038147,
+ "grad_norm": 8.28769588470459,
+ "learning_rate": 1.4949729735903127e-05,
+ "loss": 0.3824,
+ "step": 13033
+ },
+ {
+ "epoch": 35.514986376021795,
+ "grad_norm": 8.487380027770996,
+ "learning_rate": 1.4948962909654545e-05,
+ "loss": 0.3179,
+ "step": 13034
+ },
+ {
+ "epoch": 35.51771117166213,
+ "grad_norm": 8.022058486938477,
+ "learning_rate": 1.4948196044863599e-05,
+ "loss": 0.3322,
+ "step": 13035
+ },
+ {
+ "epoch": 35.520435967302454,
+ "grad_norm": 7.599024295806885,
+ "learning_rate": 1.4947429141536262e-05,
+ "loss": 0.5132,
+ "step": 13036
+ },
+ {
+ "epoch": 35.52316076294278,
+ "grad_norm": 6.896925926208496,
+ "learning_rate": 1.4946662199678503e-05,
+ "loss": 0.4443,
+ "step": 13037
+ },
+ {
+ "epoch": 35.525885558583106,
+ "grad_norm": 7.097535133361816,
+ "learning_rate": 1.49458952192963e-05,
+ "loss": 0.3708,
+ "step": 13038
+ },
+ {
+ "epoch": 35.52861035422343,
+ "grad_norm": 7.393113613128662,
+ "learning_rate": 1.4945128200395627e-05,
+ "loss": 0.4984,
+ "step": 13039
+ },
+ {
+ "epoch": 35.53133514986376,
+ "grad_norm": 16.788925170898438,
+ "learning_rate": 1.494436114298245e-05,
+ "loss": 0.339,
+ "step": 13040
+ },
+ {
+ "epoch": 35.53405994550409,
+ "grad_norm": 6.135458469390869,
+ "learning_rate": 1.4943594047062752e-05,
+ "loss": 0.3078,
+ "step": 13041
+ },
+ {
+ "epoch": 35.536784741144416,
+ "grad_norm": 22.487558364868164,
+ "learning_rate": 1.4942826912642501e-05,
+ "loss": 0.3701,
+ "step": 13042
+ },
+ {
+ "epoch": 35.53950953678474,
+ "grad_norm": 5.258029937744141,
+ "learning_rate": 1.4942059739727674e-05,
+ "loss": 0.2841,
+ "step": 13043
+ },
+ {
+ "epoch": 35.54223433242507,
+ "grad_norm": 6.1360039710998535,
+ "learning_rate": 1.4941292528324243e-05,
+ "loss": 0.4158,
+ "step": 13044
+ },
+ {
+ "epoch": 35.54495912806539,
+ "grad_norm": 17.92101287841797,
+ "learning_rate": 1.4940525278438185e-05,
+ "loss": 0.2211,
+ "step": 13045
+ },
+ {
+ "epoch": 35.54768392370572,
+ "grad_norm": 5.610847473144531,
+ "learning_rate": 1.4939757990075477e-05,
+ "loss": 0.3317,
+ "step": 13046
+ },
+ {
+ "epoch": 35.55040871934605,
+ "grad_norm": 7.047835826873779,
+ "learning_rate": 1.4938990663242088e-05,
+ "loss": 0.3626,
+ "step": 13047
+ },
+ {
+ "epoch": 35.55313351498638,
+ "grad_norm": 8.515892028808594,
+ "learning_rate": 1.4938223297944002e-05,
+ "loss": 0.4571,
+ "step": 13048
+ },
+ {
+ "epoch": 35.555858310626704,
+ "grad_norm": 8.290979385375977,
+ "learning_rate": 1.4937455894187194e-05,
+ "loss": 0.282,
+ "step": 13049
+ },
+ {
+ "epoch": 35.55858310626703,
+ "grad_norm": 8.804868698120117,
+ "learning_rate": 1.4936688451977634e-05,
+ "loss": 0.2292,
+ "step": 13050
+ },
+ {
+ "epoch": 35.561307901907355,
+ "grad_norm": 9.756802558898926,
+ "learning_rate": 1.4935920971321307e-05,
+ "loss": 0.4769,
+ "step": 13051
+ },
+ {
+ "epoch": 35.56403269754768,
+ "grad_norm": 9.684371948242188,
+ "learning_rate": 1.4935153452224182e-05,
+ "loss": 0.2839,
+ "step": 13052
+ },
+ {
+ "epoch": 35.566757493188014,
+ "grad_norm": 7.277624130249023,
+ "learning_rate": 1.4934385894692247e-05,
+ "loss": 0.3809,
+ "step": 13053
+ },
+ {
+ "epoch": 35.56948228882834,
+ "grad_norm": 7.828587055206299,
+ "learning_rate": 1.493361829873147e-05,
+ "loss": 0.3798,
+ "step": 13054
+ },
+ {
+ "epoch": 35.572207084468666,
+ "grad_norm": 6.445404052734375,
+ "learning_rate": 1.493285066434783e-05,
+ "loss": 0.4615,
+ "step": 13055
+ },
+ {
+ "epoch": 35.57493188010899,
+ "grad_norm": 8.173526763916016,
+ "learning_rate": 1.493208299154731e-05,
+ "loss": 0.3491,
+ "step": 13056
+ },
+ {
+ "epoch": 35.57765667574932,
+ "grad_norm": 13.190991401672363,
+ "learning_rate": 1.4931315280335888e-05,
+ "loss": 0.3542,
+ "step": 13057
+ },
+ {
+ "epoch": 35.58038147138964,
+ "grad_norm": 8.441964149475098,
+ "learning_rate": 1.4930547530719539e-05,
+ "loss": 0.2137,
+ "step": 13058
+ },
+ {
+ "epoch": 35.583106267029976,
+ "grad_norm": 15.430624008178711,
+ "learning_rate": 1.4929779742704246e-05,
+ "loss": 0.4155,
+ "step": 13059
+ },
+ {
+ "epoch": 35.5858310626703,
+ "grad_norm": 9.153474807739258,
+ "learning_rate": 1.4929011916295986e-05,
+ "loss": 0.2364,
+ "step": 13060
+ },
+ {
+ "epoch": 35.58855585831063,
+ "grad_norm": 8.394576072692871,
+ "learning_rate": 1.4928244051500742e-05,
+ "loss": 0.277,
+ "step": 13061
+ },
+ {
+ "epoch": 35.59128065395095,
+ "grad_norm": 6.277867317199707,
+ "learning_rate": 1.4927476148324488e-05,
+ "loss": 0.3002,
+ "step": 13062
+ },
+ {
+ "epoch": 35.59400544959128,
+ "grad_norm": 6.191000938415527,
+ "learning_rate": 1.4926708206773213e-05,
+ "loss": 0.4512,
+ "step": 13063
+ },
+ {
+ "epoch": 35.596730245231605,
+ "grad_norm": 6.844345569610596,
+ "learning_rate": 1.4925940226852889e-05,
+ "loss": 0.4242,
+ "step": 13064
+ },
+ {
+ "epoch": 35.59945504087194,
+ "grad_norm": 6.637400150299072,
+ "learning_rate": 1.4925172208569502e-05,
+ "loss": 0.3007,
+ "step": 13065
+ },
+ {
+ "epoch": 35.60217983651226,
+ "grad_norm": 14.81370735168457,
+ "learning_rate": 1.4924404151929033e-05,
+ "loss": 0.4465,
+ "step": 13066
+ },
+ {
+ "epoch": 35.60490463215259,
+ "grad_norm": 9.97683048248291,
+ "learning_rate": 1.4923636056937466e-05,
+ "loss": 0.2724,
+ "step": 13067
+ },
+ {
+ "epoch": 35.607629427792915,
+ "grad_norm": 28.20574378967285,
+ "learning_rate": 1.4922867923600774e-05,
+ "loss": 0.3198,
+ "step": 13068
+ },
+ {
+ "epoch": 35.61035422343324,
+ "grad_norm": 8.994606971740723,
+ "learning_rate": 1.492209975192495e-05,
+ "loss": 0.3557,
+ "step": 13069
+ },
+ {
+ "epoch": 35.61307901907357,
+ "grad_norm": 7.081641674041748,
+ "learning_rate": 1.492133154191597e-05,
+ "loss": 0.3023,
+ "step": 13070
+ },
+ {
+ "epoch": 35.6158038147139,
+ "grad_norm": 7.818090915679932,
+ "learning_rate": 1.4920563293579817e-05,
+ "loss": 0.4968,
+ "step": 13071
+ },
+ {
+ "epoch": 35.618528610354225,
+ "grad_norm": 6.1535162925720215,
+ "learning_rate": 1.4919795006922475e-05,
+ "loss": 0.2741,
+ "step": 13072
+ },
+ {
+ "epoch": 35.62125340599455,
+ "grad_norm": 7.111542701721191,
+ "learning_rate": 1.491902668194993e-05,
+ "loss": 0.3892,
+ "step": 13073
+ },
+ {
+ "epoch": 35.62397820163488,
+ "grad_norm": 12.075234413146973,
+ "learning_rate": 1.491825831866816e-05,
+ "loss": 0.2781,
+ "step": 13074
+ },
+ {
+ "epoch": 35.6267029972752,
+ "grad_norm": 7.627728462219238,
+ "learning_rate": 1.4917489917083157e-05,
+ "loss": 0.3509,
+ "step": 13075
+ },
+ {
+ "epoch": 35.62942779291553,
+ "grad_norm": 6.458619594573975,
+ "learning_rate": 1.49167214772009e-05,
+ "loss": 0.3506,
+ "step": 13076
+ },
+ {
+ "epoch": 35.63215258855586,
+ "grad_norm": 7.432330131530762,
+ "learning_rate": 1.4915952999027371e-05,
+ "loss": 0.359,
+ "step": 13077
+ },
+ {
+ "epoch": 35.63487738419619,
+ "grad_norm": 6.9332146644592285,
+ "learning_rate": 1.4915184482568562e-05,
+ "loss": 0.3243,
+ "step": 13078
+ },
+ {
+ "epoch": 35.63760217983651,
+ "grad_norm": 6.224339008331299,
+ "learning_rate": 1.4914415927830455e-05,
+ "loss": 0.3245,
+ "step": 13079
+ },
+ {
+ "epoch": 35.64032697547684,
+ "grad_norm": 7.042000770568848,
+ "learning_rate": 1.491364733481903e-05,
+ "loss": 0.4737,
+ "step": 13080
+ },
+ {
+ "epoch": 35.643051771117165,
+ "grad_norm": 6.224331855773926,
+ "learning_rate": 1.4912878703540281e-05,
+ "loss": 0.2442,
+ "step": 13081
+ },
+ {
+ "epoch": 35.64577656675749,
+ "grad_norm": 7.393121719360352,
+ "learning_rate": 1.4912110034000189e-05,
+ "loss": 0.403,
+ "step": 13082
+ },
+ {
+ "epoch": 35.64850136239782,
+ "grad_norm": 11.491524696350098,
+ "learning_rate": 1.4911341326204744e-05,
+ "loss": 0.2932,
+ "step": 13083
+ },
+ {
+ "epoch": 35.65122615803815,
+ "grad_norm": 5.53161096572876,
+ "learning_rate": 1.491057258015993e-05,
+ "loss": 0.2961,
+ "step": 13084
+ },
+ {
+ "epoch": 35.653950953678475,
+ "grad_norm": 8.468855857849121,
+ "learning_rate": 1.4909803795871738e-05,
+ "loss": 0.2301,
+ "step": 13085
+ },
+ {
+ "epoch": 35.6566757493188,
+ "grad_norm": 5.951993942260742,
+ "learning_rate": 1.4909034973346148e-05,
+ "loss": 0.3076,
+ "step": 13086
+ },
+ {
+ "epoch": 35.65940054495913,
+ "grad_norm": 7.281175136566162,
+ "learning_rate": 1.4908266112589154e-05,
+ "loss": 0.5266,
+ "step": 13087
+ },
+ {
+ "epoch": 35.66212534059945,
+ "grad_norm": 6.1608428955078125,
+ "learning_rate": 1.4907497213606738e-05,
+ "loss": 0.4055,
+ "step": 13088
+ },
+ {
+ "epoch": 35.664850136239785,
+ "grad_norm": 9.514596939086914,
+ "learning_rate": 1.4906728276404897e-05,
+ "loss": 0.3609,
+ "step": 13089
+ },
+ {
+ "epoch": 35.66757493188011,
+ "grad_norm": 8.773531913757324,
+ "learning_rate": 1.4905959300989607e-05,
+ "loss": 0.4261,
+ "step": 13090
+ },
+ {
+ "epoch": 35.67029972752044,
+ "grad_norm": 10.161262512207031,
+ "learning_rate": 1.4905190287366868e-05,
+ "loss": 0.305,
+ "step": 13091
+ },
+ {
+ "epoch": 35.67302452316076,
+ "grad_norm": 7.274245262145996,
+ "learning_rate": 1.4904421235542666e-05,
+ "loss": 0.2856,
+ "step": 13092
+ },
+ {
+ "epoch": 35.67574931880109,
+ "grad_norm": 6.7615227699279785,
+ "learning_rate": 1.4903652145522989e-05,
+ "loss": 0.3203,
+ "step": 13093
+ },
+ {
+ "epoch": 35.678474114441414,
+ "grad_norm": 5.8968095779418945,
+ "learning_rate": 1.4902883017313825e-05,
+ "loss": 0.3685,
+ "step": 13094
+ },
+ {
+ "epoch": 35.68119891008175,
+ "grad_norm": 8.771279335021973,
+ "learning_rate": 1.4902113850921169e-05,
+ "loss": 0.4639,
+ "step": 13095
+ },
+ {
+ "epoch": 35.68392370572207,
+ "grad_norm": 6.069421291351318,
+ "learning_rate": 1.4901344646351006e-05,
+ "loss": 0.2535,
+ "step": 13096
+ },
+ {
+ "epoch": 35.6866485013624,
+ "grad_norm": 6.342672348022461,
+ "learning_rate": 1.4900575403609328e-05,
+ "loss": 0.2945,
+ "step": 13097
+ },
+ {
+ "epoch": 35.689373297002724,
+ "grad_norm": 6.845711708068848,
+ "learning_rate": 1.4899806122702127e-05,
+ "loss": 0.4431,
+ "step": 13098
+ },
+ {
+ "epoch": 35.69209809264305,
+ "grad_norm": 7.4353814125061035,
+ "learning_rate": 1.4899036803635393e-05,
+ "loss": 0.4305,
+ "step": 13099
+ },
+ {
+ "epoch": 35.694822888283376,
+ "grad_norm": 7.208191871643066,
+ "learning_rate": 1.489826744641512e-05,
+ "loss": 0.2509,
+ "step": 13100
+ },
+ {
+ "epoch": 35.69754768392371,
+ "grad_norm": 7.7229156494140625,
+ "learning_rate": 1.4897498051047297e-05,
+ "loss": 0.2904,
+ "step": 13101
+ },
+ {
+ "epoch": 35.700272479564035,
+ "grad_norm": 6.398213863372803,
+ "learning_rate": 1.4896728617537914e-05,
+ "loss": 0.5042,
+ "step": 13102
+ },
+ {
+ "epoch": 35.70299727520436,
+ "grad_norm": 19.481176376342773,
+ "learning_rate": 1.489595914589297e-05,
+ "loss": 0.3272,
+ "step": 13103
+ },
+ {
+ "epoch": 35.705722070844686,
+ "grad_norm": 7.918393611907959,
+ "learning_rate": 1.4895189636118453e-05,
+ "loss": 0.3833,
+ "step": 13104
+ },
+ {
+ "epoch": 35.70844686648501,
+ "grad_norm": 6.956137657165527,
+ "learning_rate": 1.4894420088220356e-05,
+ "loss": 0.3163,
+ "step": 13105
+ },
+ {
+ "epoch": 35.71117166212534,
+ "grad_norm": 8.419601440429688,
+ "learning_rate": 1.4893650502204673e-05,
+ "loss": 0.311,
+ "step": 13106
+ },
+ {
+ "epoch": 35.71389645776567,
+ "grad_norm": 6.122564315795898,
+ "learning_rate": 1.4892880878077396e-05,
+ "loss": 0.5188,
+ "step": 13107
+ },
+ {
+ "epoch": 35.716621253406,
+ "grad_norm": 14.754682540893555,
+ "learning_rate": 1.4892111215844523e-05,
+ "loss": 0.2638,
+ "step": 13108
+ },
+ {
+ "epoch": 35.71934604904632,
+ "grad_norm": 8.965763092041016,
+ "learning_rate": 1.489134151551204e-05,
+ "loss": 0.4526,
+ "step": 13109
+ },
+ {
+ "epoch": 35.72207084468665,
+ "grad_norm": 7.389782428741455,
+ "learning_rate": 1.4890571777085954e-05,
+ "loss": 0.2732,
+ "step": 13110
+ },
+ {
+ "epoch": 35.724795640326974,
+ "grad_norm": 6.4090118408203125,
+ "learning_rate": 1.4889802000572247e-05,
+ "loss": 0.3694,
+ "step": 13111
+ },
+ {
+ "epoch": 35.7275204359673,
+ "grad_norm": 7.850404739379883,
+ "learning_rate": 1.4889032185976922e-05,
+ "loss": 0.3446,
+ "step": 13112
+ },
+ {
+ "epoch": 35.73024523160763,
+ "grad_norm": 7.053712844848633,
+ "learning_rate": 1.4888262333305971e-05,
+ "loss": 0.3712,
+ "step": 13113
+ },
+ {
+ "epoch": 35.73297002724796,
+ "grad_norm": 15.967446327209473,
+ "learning_rate": 1.488749244256539e-05,
+ "loss": 0.4603,
+ "step": 13114
+ },
+ {
+ "epoch": 35.735694822888284,
+ "grad_norm": 9.032360076904297,
+ "learning_rate": 1.4886722513761176e-05,
+ "loss": 0.3412,
+ "step": 13115
+ },
+ {
+ "epoch": 35.73841961852861,
+ "grad_norm": 6.181352138519287,
+ "learning_rate": 1.4885952546899323e-05,
+ "loss": 0.3625,
+ "step": 13116
+ },
+ {
+ "epoch": 35.741144414168936,
+ "grad_norm": 6.852163314819336,
+ "learning_rate": 1.4885182541985827e-05,
+ "loss": 0.3344,
+ "step": 13117
+ },
+ {
+ "epoch": 35.74386920980926,
+ "grad_norm": 6.599365711212158,
+ "learning_rate": 1.4884412499026693e-05,
+ "loss": 0.3532,
+ "step": 13118
+ },
+ {
+ "epoch": 35.746594005449595,
+ "grad_norm": 9.913313865661621,
+ "learning_rate": 1.4883642418027906e-05,
+ "loss": 0.3358,
+ "step": 13119
+ },
+ {
+ "epoch": 35.74931880108992,
+ "grad_norm": 7.836754322052002,
+ "learning_rate": 1.4882872298995472e-05,
+ "loss": 0.3151,
+ "step": 13120
+ },
+ {
+ "epoch": 35.752043596730246,
+ "grad_norm": 6.892861843109131,
+ "learning_rate": 1.4882102141935381e-05,
+ "loss": 0.2828,
+ "step": 13121
+ },
+ {
+ "epoch": 35.75476839237057,
+ "grad_norm": 6.486696243286133,
+ "learning_rate": 1.4881331946853643e-05,
+ "loss": 0.3953,
+ "step": 13122
+ },
+ {
+ "epoch": 35.7574931880109,
+ "grad_norm": 8.368975639343262,
+ "learning_rate": 1.4880561713756243e-05,
+ "loss": 0.3417,
+ "step": 13123
+ },
+ {
+ "epoch": 35.76021798365122,
+ "grad_norm": 6.539047718048096,
+ "learning_rate": 1.4879791442649188e-05,
+ "loss": 0.3057,
+ "step": 13124
+ },
+ {
+ "epoch": 35.762942779291556,
+ "grad_norm": 6.887070655822754,
+ "learning_rate": 1.4879021133538471e-05,
+ "loss": 0.4626,
+ "step": 13125
+ },
+ {
+ "epoch": 35.76566757493188,
+ "grad_norm": 5.815514087677002,
+ "learning_rate": 1.4878250786430099e-05,
+ "loss": 0.2421,
+ "step": 13126
+ },
+ {
+ "epoch": 35.76839237057221,
+ "grad_norm": 9.211060523986816,
+ "learning_rate": 1.4877480401330065e-05,
+ "loss": 0.4502,
+ "step": 13127
+ },
+ {
+ "epoch": 35.771117166212534,
+ "grad_norm": 11.286864280700684,
+ "learning_rate": 1.4876709978244372e-05,
+ "loss": 0.3573,
+ "step": 13128
+ },
+ {
+ "epoch": 35.77384196185286,
+ "grad_norm": 11.223306655883789,
+ "learning_rate": 1.4875939517179016e-05,
+ "loss": 0.3916,
+ "step": 13129
+ },
+ {
+ "epoch": 35.776566757493185,
+ "grad_norm": 12.014117240905762,
+ "learning_rate": 1.4875169018140003e-05,
+ "loss": 0.3492,
+ "step": 13130
+ },
+ {
+ "epoch": 35.77929155313352,
+ "grad_norm": 7.441474914550781,
+ "learning_rate": 1.4874398481133327e-05,
+ "loss": 0.4038,
+ "step": 13131
+ },
+ {
+ "epoch": 35.782016348773844,
+ "grad_norm": 12.697399139404297,
+ "learning_rate": 1.4873627906164997e-05,
+ "loss": 0.2928,
+ "step": 13132
+ },
+ {
+ "epoch": 35.78474114441417,
+ "grad_norm": 8.545955657958984,
+ "learning_rate": 1.4872857293241002e-05,
+ "loss": 0.2599,
+ "step": 13133
+ },
+ {
+ "epoch": 35.787465940054496,
+ "grad_norm": 10.86761474609375,
+ "learning_rate": 1.487208664236736e-05,
+ "loss": 0.1661,
+ "step": 13134
+ },
+ {
+ "epoch": 35.79019073569482,
+ "grad_norm": 9.067625045776367,
+ "learning_rate": 1.487131595355006e-05,
+ "loss": 0.3055,
+ "step": 13135
+ },
+ {
+ "epoch": 35.79291553133515,
+ "grad_norm": 7.21870231628418,
+ "learning_rate": 1.487054522679511e-05,
+ "loss": 0.3204,
+ "step": 13136
+ },
+ {
+ "epoch": 35.79564032697548,
+ "grad_norm": 6.984853744506836,
+ "learning_rate": 1.4869774462108506e-05,
+ "loss": 0.2603,
+ "step": 13137
+ },
+ {
+ "epoch": 35.798365122615806,
+ "grad_norm": 6.351567268371582,
+ "learning_rate": 1.4869003659496262e-05,
+ "loss": 0.2962,
+ "step": 13138
+ },
+ {
+ "epoch": 35.80108991825613,
+ "grad_norm": 8.221277236938477,
+ "learning_rate": 1.4868232818964368e-05,
+ "loss": 0.3925,
+ "step": 13139
+ },
+ {
+ "epoch": 35.80381471389646,
+ "grad_norm": 6.445461273193359,
+ "learning_rate": 1.4867461940518836e-05,
+ "loss": 0.2764,
+ "step": 13140
+ },
+ {
+ "epoch": 35.80653950953678,
+ "grad_norm": 10.9315185546875,
+ "learning_rate": 1.4866691024165665e-05,
+ "loss": 0.3392,
+ "step": 13141
+ },
+ {
+ "epoch": 35.80926430517711,
+ "grad_norm": 7.6769890785217285,
+ "learning_rate": 1.4865920069910865e-05,
+ "loss": 0.4421,
+ "step": 13142
+ },
+ {
+ "epoch": 35.81198910081744,
+ "grad_norm": 6.350608825683594,
+ "learning_rate": 1.4865149077760435e-05,
+ "loss": 0.3172,
+ "step": 13143
+ },
+ {
+ "epoch": 35.81471389645777,
+ "grad_norm": 7.1840291023254395,
+ "learning_rate": 1.486437804772038e-05,
+ "loss": 0.3192,
+ "step": 13144
+ },
+ {
+ "epoch": 35.817438692098094,
+ "grad_norm": 6.86708402633667,
+ "learning_rate": 1.4863606979796703e-05,
+ "loss": 0.3418,
+ "step": 13145
+ },
+ {
+ "epoch": 35.82016348773842,
+ "grad_norm": 7.209695339202881,
+ "learning_rate": 1.4862835873995416e-05,
+ "loss": 0.2687,
+ "step": 13146
+ },
+ {
+ "epoch": 35.822888283378745,
+ "grad_norm": 6.7395524978637695,
+ "learning_rate": 1.4862064730322516e-05,
+ "loss": 0.2544,
+ "step": 13147
+ },
+ {
+ "epoch": 35.82561307901907,
+ "grad_norm": 7.084775447845459,
+ "learning_rate": 1.4861293548784016e-05,
+ "loss": 0.2883,
+ "step": 13148
+ },
+ {
+ "epoch": 35.828337874659404,
+ "grad_norm": 9.86668872833252,
+ "learning_rate": 1.4860522329385914e-05,
+ "loss": 0.3532,
+ "step": 13149
+ },
+ {
+ "epoch": 35.83106267029973,
+ "grad_norm": 8.076080322265625,
+ "learning_rate": 1.485975107213422e-05,
+ "loss": 0.3002,
+ "step": 13150
+ },
+ {
+ "epoch": 35.833787465940055,
+ "grad_norm": 6.871728897094727,
+ "learning_rate": 1.4858979777034943e-05,
+ "loss": 0.2149,
+ "step": 13151
+ },
+ {
+ "epoch": 35.83651226158038,
+ "grad_norm": 6.7171759605407715,
+ "learning_rate": 1.4858208444094092e-05,
+ "loss": 0.3418,
+ "step": 13152
+ },
+ {
+ "epoch": 35.83923705722071,
+ "grad_norm": 7.652675151824951,
+ "learning_rate": 1.4857437073317665e-05,
+ "loss": 0.4183,
+ "step": 13153
+ },
+ {
+ "epoch": 35.84196185286103,
+ "grad_norm": 8.919107437133789,
+ "learning_rate": 1.4856665664711676e-05,
+ "loss": 0.3783,
+ "step": 13154
+ },
+ {
+ "epoch": 35.844686648501366,
+ "grad_norm": 12.379136085510254,
+ "learning_rate": 1.485589421828213e-05,
+ "loss": 0.4065,
+ "step": 13155
+ },
+ {
+ "epoch": 35.84741144414169,
+ "grad_norm": 8.966519355773926,
+ "learning_rate": 1.4855122734035037e-05,
+ "loss": 0.3304,
+ "step": 13156
+ },
+ {
+ "epoch": 35.85013623978202,
+ "grad_norm": 6.137722969055176,
+ "learning_rate": 1.4854351211976403e-05,
+ "loss": 0.3392,
+ "step": 13157
+ },
+ {
+ "epoch": 35.85286103542234,
+ "grad_norm": 7.204695701599121,
+ "learning_rate": 1.485357965211224e-05,
+ "loss": 0.4766,
+ "step": 13158
+ },
+ {
+ "epoch": 35.85558583106267,
+ "grad_norm": 5.848073482513428,
+ "learning_rate": 1.4852808054448553e-05,
+ "loss": 0.3183,
+ "step": 13159
+ },
+ {
+ "epoch": 35.858310626702995,
+ "grad_norm": 6.540821552276611,
+ "learning_rate": 1.4852036418991356e-05,
+ "loss": 0.2634,
+ "step": 13160
+ },
+ {
+ "epoch": 35.86103542234333,
+ "grad_norm": 7.086192607879639,
+ "learning_rate": 1.4851264745746653e-05,
+ "loss": 0.2425,
+ "step": 13161
+ },
+ {
+ "epoch": 35.86376021798365,
+ "grad_norm": 7.513698577880859,
+ "learning_rate": 1.4850493034720457e-05,
+ "loss": 0.2538,
+ "step": 13162
+ },
+ {
+ "epoch": 35.86648501362398,
+ "grad_norm": 9.127217292785645,
+ "learning_rate": 1.4849721285918777e-05,
+ "loss": 0.3346,
+ "step": 13163
+ },
+ {
+ "epoch": 35.869209809264305,
+ "grad_norm": 6.7912373542785645,
+ "learning_rate": 1.4848949499347625e-05,
+ "loss": 0.2762,
+ "step": 13164
+ },
+ {
+ "epoch": 35.87193460490463,
+ "grad_norm": 8.182476997375488,
+ "learning_rate": 1.4848177675013009e-05,
+ "loss": 0.2885,
+ "step": 13165
+ },
+ {
+ "epoch": 35.87465940054496,
+ "grad_norm": 7.489778518676758,
+ "learning_rate": 1.4847405812920943e-05,
+ "loss": 0.6197,
+ "step": 13166
+ },
+ {
+ "epoch": 35.87738419618529,
+ "grad_norm": 7.308894157409668,
+ "learning_rate": 1.4846633913077432e-05,
+ "loss": 0.2206,
+ "step": 13167
+ },
+ {
+ "epoch": 35.880108991825615,
+ "grad_norm": 7.15823221206665,
+ "learning_rate": 1.4845861975488495e-05,
+ "loss": 0.402,
+ "step": 13168
+ },
+ {
+ "epoch": 35.88283378746594,
+ "grad_norm": 5.423677444458008,
+ "learning_rate": 1.4845090000160142e-05,
+ "loss": 0.3098,
+ "step": 13169
+ },
+ {
+ "epoch": 35.88555858310627,
+ "grad_norm": 6.926116466522217,
+ "learning_rate": 1.4844317987098384e-05,
+ "loss": 0.2586,
+ "step": 13170
+ },
+ {
+ "epoch": 35.88828337874659,
+ "grad_norm": 6.592591762542725,
+ "learning_rate": 1.4843545936309233e-05,
+ "loss": 0.2909,
+ "step": 13171
+ },
+ {
+ "epoch": 35.89100817438692,
+ "grad_norm": 6.371806621551514,
+ "learning_rate": 1.4842773847798703e-05,
+ "loss": 0.3787,
+ "step": 13172
+ },
+ {
+ "epoch": 35.89373297002725,
+ "grad_norm": 6.53985595703125,
+ "learning_rate": 1.4842001721572804e-05,
+ "loss": 0.2646,
+ "step": 13173
+ },
+ {
+ "epoch": 35.89645776566758,
+ "grad_norm": 7.660606384277344,
+ "learning_rate": 1.4841229557637553e-05,
+ "loss": 0.3408,
+ "step": 13174
+ },
+ {
+ "epoch": 35.8991825613079,
+ "grad_norm": 9.842541694641113,
+ "learning_rate": 1.4840457355998963e-05,
+ "loss": 0.3557,
+ "step": 13175
+ },
+ {
+ "epoch": 35.90190735694823,
+ "grad_norm": 8.344846725463867,
+ "learning_rate": 1.4839685116663042e-05,
+ "loss": 0.2732,
+ "step": 13176
+ },
+ {
+ "epoch": 35.904632152588555,
+ "grad_norm": 5.782425880432129,
+ "learning_rate": 1.4838912839635813e-05,
+ "loss": 0.2045,
+ "step": 13177
+ },
+ {
+ "epoch": 35.90735694822888,
+ "grad_norm": 8.65829086303711,
+ "learning_rate": 1.4838140524923286e-05,
+ "loss": 0.3608,
+ "step": 13178
+ },
+ {
+ "epoch": 35.91008174386921,
+ "grad_norm": 7.713167667388916,
+ "learning_rate": 1.4837368172531477e-05,
+ "loss": 0.4244,
+ "step": 13179
+ },
+ {
+ "epoch": 35.91280653950954,
+ "grad_norm": 5.795069694519043,
+ "learning_rate": 1.4836595782466401e-05,
+ "loss": 0.462,
+ "step": 13180
+ },
+ {
+ "epoch": 35.915531335149865,
+ "grad_norm": 6.473036766052246,
+ "learning_rate": 1.4835823354734072e-05,
+ "loss": 0.366,
+ "step": 13181
+ },
+ {
+ "epoch": 35.91825613079019,
+ "grad_norm": 7.549315929412842,
+ "learning_rate": 1.4835050889340506e-05,
+ "loss": 0.3901,
+ "step": 13182
+ },
+ {
+ "epoch": 35.920980926430516,
+ "grad_norm": 8.299123764038086,
+ "learning_rate": 1.4834278386291718e-05,
+ "loss": 0.3112,
+ "step": 13183
+ },
+ {
+ "epoch": 35.92370572207084,
+ "grad_norm": 9.232878684997559,
+ "learning_rate": 1.4833505845593725e-05,
+ "loss": 0.4068,
+ "step": 13184
+ },
+ {
+ "epoch": 35.926430517711175,
+ "grad_norm": 7.171113967895508,
+ "learning_rate": 1.4832733267252545e-05,
+ "loss": 0.2828,
+ "step": 13185
+ },
+ {
+ "epoch": 35.9291553133515,
+ "grad_norm": 7.342721939086914,
+ "learning_rate": 1.4831960651274196e-05,
+ "loss": 0.2781,
+ "step": 13186
+ },
+ {
+ "epoch": 35.93188010899183,
+ "grad_norm": 7.980126857757568,
+ "learning_rate": 1.4831187997664691e-05,
+ "loss": 0.4585,
+ "step": 13187
+ },
+ {
+ "epoch": 35.93460490463215,
+ "grad_norm": 10.442893028259277,
+ "learning_rate": 1.4830415306430051e-05,
+ "loss": 0.5404,
+ "step": 13188
+ },
+ {
+ "epoch": 35.93732970027248,
+ "grad_norm": 7.508268356323242,
+ "learning_rate": 1.4829642577576289e-05,
+ "loss": 0.3302,
+ "step": 13189
+ },
+ {
+ "epoch": 35.940054495912804,
+ "grad_norm": 6.966134071350098,
+ "learning_rate": 1.482886981110943e-05,
+ "loss": 0.3431,
+ "step": 13190
+ },
+ {
+ "epoch": 35.94277929155314,
+ "grad_norm": 7.196403503417969,
+ "learning_rate": 1.4828097007035484e-05,
+ "loss": 0.3547,
+ "step": 13191
+ },
+ {
+ "epoch": 35.94550408719346,
+ "grad_norm": 7.072295188903809,
+ "learning_rate": 1.4827324165360478e-05,
+ "loss": 0.3083,
+ "step": 13192
+ },
+ {
+ "epoch": 35.94822888283379,
+ "grad_norm": 7.4165802001953125,
+ "learning_rate": 1.4826551286090425e-05,
+ "loss": 0.5513,
+ "step": 13193
+ },
+ {
+ "epoch": 35.950953678474114,
+ "grad_norm": 6.74781608581543,
+ "learning_rate": 1.4825778369231344e-05,
+ "loss": 0.2412,
+ "step": 13194
+ },
+ {
+ "epoch": 35.95367847411444,
+ "grad_norm": 7.24605131149292,
+ "learning_rate": 1.482500541478926e-05,
+ "loss": 0.45,
+ "step": 13195
+ },
+ {
+ "epoch": 35.956403269754766,
+ "grad_norm": 6.660770416259766,
+ "learning_rate": 1.4824232422770185e-05,
+ "loss": 0.3214,
+ "step": 13196
+ },
+ {
+ "epoch": 35.95912806539509,
+ "grad_norm": 11.896281242370605,
+ "learning_rate": 1.4823459393180147e-05,
+ "loss": 0.3054,
+ "step": 13197
+ },
+ {
+ "epoch": 35.961852861035425,
+ "grad_norm": 6.343620300292969,
+ "learning_rate": 1.482268632602516e-05,
+ "loss": 0.3669,
+ "step": 13198
+ },
+ {
+ "epoch": 35.96457765667575,
+ "grad_norm": 5.846088886260986,
+ "learning_rate": 1.4821913221311249e-05,
+ "loss": 0.315,
+ "step": 13199
+ },
+ {
+ "epoch": 35.967302452316076,
+ "grad_norm": 6.030350685119629,
+ "learning_rate": 1.482114007904443e-05,
+ "loss": 0.3785,
+ "step": 13200
+ },
+ {
+ "epoch": 35.9700272479564,
+ "grad_norm": 5.9081549644470215,
+ "learning_rate": 1.4820366899230729e-05,
+ "loss": 0.2973,
+ "step": 13201
+ },
+ {
+ "epoch": 35.97275204359673,
+ "grad_norm": 8.589384078979492,
+ "learning_rate": 1.4819593681876168e-05,
+ "loss": 0.4471,
+ "step": 13202
+ },
+ {
+ "epoch": 35.97547683923706,
+ "grad_norm": 9.04414176940918,
+ "learning_rate": 1.4818820426986763e-05,
+ "loss": 0.3004,
+ "step": 13203
+ },
+ {
+ "epoch": 35.97820163487739,
+ "grad_norm": 5.686853885650635,
+ "learning_rate": 1.481804713456854e-05,
+ "loss": 0.3357,
+ "step": 13204
+ },
+ {
+ "epoch": 35.98092643051771,
+ "grad_norm": 6.3393330574035645,
+ "learning_rate": 1.4817273804627526e-05,
+ "loss": 0.4384,
+ "step": 13205
+ },
+ {
+ "epoch": 35.98365122615804,
+ "grad_norm": 8.94064998626709,
+ "learning_rate": 1.4816500437169735e-05,
+ "loss": 0.4419,
+ "step": 13206
+ },
+ {
+ "epoch": 35.986376021798364,
+ "grad_norm": 6.159207820892334,
+ "learning_rate": 1.4815727032201192e-05,
+ "loss": 0.3942,
+ "step": 13207
+ },
+ {
+ "epoch": 35.98910081743869,
+ "grad_norm": 8.340045928955078,
+ "learning_rate": 1.4814953589727922e-05,
+ "loss": 0.2921,
+ "step": 13208
+ },
+ {
+ "epoch": 35.991825613079016,
+ "grad_norm": 9.072864532470703,
+ "learning_rate": 1.4814180109755954e-05,
+ "loss": 0.3489,
+ "step": 13209
+ },
+ {
+ "epoch": 35.99455040871935,
+ "grad_norm": 5.044756889343262,
+ "learning_rate": 1.4813406592291298e-05,
+ "loss": 0.4151,
+ "step": 13210
+ },
+ {
+ "epoch": 35.997275204359674,
+ "grad_norm": 7.601471424102783,
+ "learning_rate": 1.4812633037339992e-05,
+ "loss": 0.4428,
+ "step": 13211
+ },
+ {
+ "epoch": 36.0,
+ "grad_norm": 5.451930046081543,
+ "learning_rate": 1.4811859444908053e-05,
+ "loss": 0.5436,
+ "step": 13212
+ },
+ {
+ "epoch": 36.002724795640326,
+ "grad_norm": 8.351494789123535,
+ "learning_rate": 1.4811085815001507e-05,
+ "loss": 0.3569,
+ "step": 13213
+ },
+ {
+ "epoch": 36.00544959128065,
+ "grad_norm": 6.551837921142578,
+ "learning_rate": 1.481031214762638e-05,
+ "loss": 0.2808,
+ "step": 13214
+ },
+ {
+ "epoch": 36.00817438692098,
+ "grad_norm": 5.7202863693237305,
+ "learning_rate": 1.4809538442788698e-05,
+ "loss": 0.3351,
+ "step": 13215
+ },
+ {
+ "epoch": 36.01089918256131,
+ "grad_norm": 8.296695709228516,
+ "learning_rate": 1.4808764700494482e-05,
+ "loss": 0.3342,
+ "step": 13216
+ },
+ {
+ "epoch": 36.013623978201636,
+ "grad_norm": 5.594487190246582,
+ "learning_rate": 1.4807990920749766e-05,
+ "loss": 0.3683,
+ "step": 13217
+ },
+ {
+ "epoch": 36.01634877384196,
+ "grad_norm": 8.664252281188965,
+ "learning_rate": 1.4807217103560567e-05,
+ "loss": 0.3099,
+ "step": 13218
+ },
+ {
+ "epoch": 36.01907356948229,
+ "grad_norm": 7.050753593444824,
+ "learning_rate": 1.4806443248932917e-05,
+ "loss": 0.4896,
+ "step": 13219
+ },
+ {
+ "epoch": 36.02179836512261,
+ "grad_norm": 6.4368438720703125,
+ "learning_rate": 1.4805669356872843e-05,
+ "loss": 0.3148,
+ "step": 13220
+ },
+ {
+ "epoch": 36.02452316076294,
+ "grad_norm": 7.973339557647705,
+ "learning_rate": 1.4804895427386371e-05,
+ "loss": 0.3784,
+ "step": 13221
+ },
+ {
+ "epoch": 36.02724795640327,
+ "grad_norm": 7.606378555297852,
+ "learning_rate": 1.4804121460479528e-05,
+ "loss": 0.2506,
+ "step": 13222
+ },
+ {
+ "epoch": 36.0299727520436,
+ "grad_norm": 7.317055702209473,
+ "learning_rate": 1.4803347456158341e-05,
+ "loss": 0.4169,
+ "step": 13223
+ },
+ {
+ "epoch": 36.032697547683924,
+ "grad_norm": 6.236683368682861,
+ "learning_rate": 1.4802573414428837e-05,
+ "loss": 0.2888,
+ "step": 13224
+ },
+ {
+ "epoch": 36.03542234332425,
+ "grad_norm": 7.838255405426025,
+ "learning_rate": 1.4801799335297052e-05,
+ "loss": 0.2142,
+ "step": 13225
+ },
+ {
+ "epoch": 36.038147138964575,
+ "grad_norm": 5.358719348907471,
+ "learning_rate": 1.4801025218769001e-05,
+ "loss": 0.2151,
+ "step": 13226
+ },
+ {
+ "epoch": 36.0408719346049,
+ "grad_norm": 8.163990020751953,
+ "learning_rate": 1.4800251064850723e-05,
+ "loss": 0.4248,
+ "step": 13227
+ },
+ {
+ "epoch": 36.043596730245234,
+ "grad_norm": 9.340973854064941,
+ "learning_rate": 1.4799476873548244e-05,
+ "loss": 0.2144,
+ "step": 13228
+ },
+ {
+ "epoch": 36.04632152588556,
+ "grad_norm": 5.8173322677612305,
+ "learning_rate": 1.4798702644867596e-05,
+ "loss": 0.3967,
+ "step": 13229
+ },
+ {
+ "epoch": 36.049046321525886,
+ "grad_norm": 5.602415561676025,
+ "learning_rate": 1.47979283788148e-05,
+ "loss": 0.2408,
+ "step": 13230
+ },
+ {
+ "epoch": 36.05177111716621,
+ "grad_norm": 5.840487957000732,
+ "learning_rate": 1.4797154075395899e-05,
+ "loss": 0.2478,
+ "step": 13231
+ },
+ {
+ "epoch": 36.05449591280654,
+ "grad_norm": 6.682070732116699,
+ "learning_rate": 1.4796379734616912e-05,
+ "loss": 0.2356,
+ "step": 13232
+ },
+ {
+ "epoch": 36.05722070844686,
+ "grad_norm": 5.006386756896973,
+ "learning_rate": 1.4795605356483877e-05,
+ "loss": 0.3284,
+ "step": 13233
+ },
+ {
+ "epoch": 36.059945504087196,
+ "grad_norm": 7.425999641418457,
+ "learning_rate": 1.479483094100282e-05,
+ "loss": 0.5058,
+ "step": 13234
+ },
+ {
+ "epoch": 36.06267029972752,
+ "grad_norm": 6.135932445526123,
+ "learning_rate": 1.4794056488179776e-05,
+ "loss": 0.2256,
+ "step": 13235
+ },
+ {
+ "epoch": 36.06539509536785,
+ "grad_norm": 21.26055908203125,
+ "learning_rate": 1.479328199802077e-05,
+ "loss": 0.2314,
+ "step": 13236
+ },
+ {
+ "epoch": 36.06811989100817,
+ "grad_norm": 5.896805763244629,
+ "learning_rate": 1.4792507470531842e-05,
+ "loss": 0.3028,
+ "step": 13237
+ },
+ {
+ "epoch": 36.0708446866485,
+ "grad_norm": 8.05986213684082,
+ "learning_rate": 1.4791732905719019e-05,
+ "loss": 0.3826,
+ "step": 13238
+ },
+ {
+ "epoch": 36.073569482288825,
+ "grad_norm": 6.583298683166504,
+ "learning_rate": 1.4790958303588334e-05,
+ "loss": 0.2308,
+ "step": 13239
+ },
+ {
+ "epoch": 36.07629427792916,
+ "grad_norm": 5.833327293395996,
+ "learning_rate": 1.4790183664145821e-05,
+ "loss": 0.278,
+ "step": 13240
+ },
+ {
+ "epoch": 36.079019073569484,
+ "grad_norm": 6.4417924880981445,
+ "learning_rate": 1.4789408987397512e-05,
+ "loss": 0.4019,
+ "step": 13241
+ },
+ {
+ "epoch": 36.08174386920981,
+ "grad_norm": 8.08556842803955,
+ "learning_rate": 1.4788634273349439e-05,
+ "loss": 0.3405,
+ "step": 13242
+ },
+ {
+ "epoch": 36.084468664850135,
+ "grad_norm": 20.261943817138672,
+ "learning_rate": 1.4787859522007638e-05,
+ "loss": 0.3115,
+ "step": 13243
+ },
+ {
+ "epoch": 36.08719346049046,
+ "grad_norm": 5.491735458374023,
+ "learning_rate": 1.4787084733378138e-05,
+ "loss": 0.25,
+ "step": 13244
+ },
+ {
+ "epoch": 36.08991825613079,
+ "grad_norm": 5.954740524291992,
+ "learning_rate": 1.4786309907466975e-05,
+ "loss": 0.2966,
+ "step": 13245
+ },
+ {
+ "epoch": 36.09264305177112,
+ "grad_norm": 7.659736156463623,
+ "learning_rate": 1.4785535044280189e-05,
+ "loss": 0.2715,
+ "step": 13246
+ },
+ {
+ "epoch": 36.095367847411445,
+ "grad_norm": 5.393923759460449,
+ "learning_rate": 1.478476014382381e-05,
+ "loss": 0.2464,
+ "step": 13247
+ },
+ {
+ "epoch": 36.09809264305177,
+ "grad_norm": 6.913016319274902,
+ "learning_rate": 1.4783985206103868e-05,
+ "loss": 0.3614,
+ "step": 13248
+ },
+ {
+ "epoch": 36.1008174386921,
+ "grad_norm": 5.978140830993652,
+ "learning_rate": 1.4783210231126411e-05,
+ "loss": 0.2519,
+ "step": 13249
+ },
+ {
+ "epoch": 36.10354223433242,
+ "grad_norm": 6.325464725494385,
+ "learning_rate": 1.4782435218897459e-05,
+ "loss": 0.2686,
+ "step": 13250
+ },
+ {
+ "epoch": 36.10626702997275,
+ "grad_norm": 5.510571479797363,
+ "learning_rate": 1.478166016942306e-05,
+ "loss": 0.1749,
+ "step": 13251
+ },
+ {
+ "epoch": 36.10899182561308,
+ "grad_norm": 12.347222328186035,
+ "learning_rate": 1.4780885082709242e-05,
+ "loss": 0.3969,
+ "step": 13252
+ },
+ {
+ "epoch": 36.11171662125341,
+ "grad_norm": 7.096447944641113,
+ "learning_rate": 1.4780109958762049e-05,
+ "loss": 0.331,
+ "step": 13253
+ },
+ {
+ "epoch": 36.11444141689373,
+ "grad_norm": 6.075213432312012,
+ "learning_rate": 1.4779334797587508e-05,
+ "loss": 0.2931,
+ "step": 13254
+ },
+ {
+ "epoch": 36.11716621253406,
+ "grad_norm": 6.677272319793701,
+ "learning_rate": 1.4778559599191668e-05,
+ "loss": 0.2206,
+ "step": 13255
+ },
+ {
+ "epoch": 36.119891008174385,
+ "grad_norm": 8.224448204040527,
+ "learning_rate": 1.4777784363580553e-05,
+ "loss": 0.4144,
+ "step": 13256
+ },
+ {
+ "epoch": 36.12261580381471,
+ "grad_norm": 22.851787567138672,
+ "learning_rate": 1.4777009090760213e-05,
+ "loss": 0.3081,
+ "step": 13257
+ },
+ {
+ "epoch": 36.12534059945504,
+ "grad_norm": 6.327375888824463,
+ "learning_rate": 1.4776233780736677e-05,
+ "loss": 0.184,
+ "step": 13258
+ },
+ {
+ "epoch": 36.12806539509537,
+ "grad_norm": 6.861517429351807,
+ "learning_rate": 1.4775458433515988e-05,
+ "loss": 0.2499,
+ "step": 13259
+ },
+ {
+ "epoch": 36.130790190735695,
+ "grad_norm": 5.776194095611572,
+ "learning_rate": 1.477468304910418e-05,
+ "loss": 0.2825,
+ "step": 13260
+ },
+ {
+ "epoch": 36.13351498637602,
+ "grad_norm": 6.355883598327637,
+ "learning_rate": 1.4773907627507296e-05,
+ "loss": 0.2797,
+ "step": 13261
+ },
+ {
+ "epoch": 36.13623978201635,
+ "grad_norm": 7.135884761810303,
+ "learning_rate": 1.4773132168731372e-05,
+ "loss": 0.2202,
+ "step": 13262
+ },
+ {
+ "epoch": 36.13896457765667,
+ "grad_norm": 5.922659397125244,
+ "learning_rate": 1.4772356672782448e-05,
+ "loss": 0.4088,
+ "step": 13263
+ },
+ {
+ "epoch": 36.141689373297005,
+ "grad_norm": 4.835375785827637,
+ "learning_rate": 1.4771581139666564e-05,
+ "loss": 0.3039,
+ "step": 13264
+ },
+ {
+ "epoch": 36.14441416893733,
+ "grad_norm": 5.040340900421143,
+ "learning_rate": 1.4770805569389762e-05,
+ "loss": 0.3017,
+ "step": 13265
+ },
+ {
+ "epoch": 36.14713896457766,
+ "grad_norm": 6.48061466217041,
+ "learning_rate": 1.4770029961958075e-05,
+ "loss": 0.3271,
+ "step": 13266
+ },
+ {
+ "epoch": 36.14986376021798,
+ "grad_norm": 6.813900947570801,
+ "learning_rate": 1.4769254317377553e-05,
+ "loss": 0.2408,
+ "step": 13267
+ },
+ {
+ "epoch": 36.15258855585831,
+ "grad_norm": 4.941844940185547,
+ "learning_rate": 1.476847863565423e-05,
+ "loss": 0.3785,
+ "step": 13268
+ },
+ {
+ "epoch": 36.155313351498634,
+ "grad_norm": 7.042545318603516,
+ "learning_rate": 1.4767702916794149e-05,
+ "loss": 0.3079,
+ "step": 13269
+ },
+ {
+ "epoch": 36.15803814713897,
+ "grad_norm": 5.209319114685059,
+ "learning_rate": 1.476692716080335e-05,
+ "loss": 0.2709,
+ "step": 13270
+ },
+ {
+ "epoch": 36.16076294277929,
+ "grad_norm": 5.897314548492432,
+ "learning_rate": 1.4766151367687875e-05,
+ "loss": 0.2773,
+ "step": 13271
+ },
+ {
+ "epoch": 36.16348773841962,
+ "grad_norm": 6.35041618347168,
+ "learning_rate": 1.476537553745377e-05,
+ "loss": 0.6002,
+ "step": 13272
+ },
+ {
+ "epoch": 36.166212534059945,
+ "grad_norm": 6.693200588226318,
+ "learning_rate": 1.476459967010707e-05,
+ "loss": 0.2687,
+ "step": 13273
+ },
+ {
+ "epoch": 36.16893732970027,
+ "grad_norm": 6.460749626159668,
+ "learning_rate": 1.4763823765653824e-05,
+ "loss": 0.3471,
+ "step": 13274
+ },
+ {
+ "epoch": 36.171662125340596,
+ "grad_norm": 8.597285270690918,
+ "learning_rate": 1.476304782410007e-05,
+ "loss": 0.357,
+ "step": 13275
+ },
+ {
+ "epoch": 36.17438692098093,
+ "grad_norm": 6.624594211578369,
+ "learning_rate": 1.4762271845451852e-05,
+ "loss": 0.2743,
+ "step": 13276
+ },
+ {
+ "epoch": 36.177111716621255,
+ "grad_norm": 4.66386079788208,
+ "learning_rate": 1.4761495829715219e-05,
+ "loss": 0.3172,
+ "step": 13277
+ },
+ {
+ "epoch": 36.17983651226158,
+ "grad_norm": 5.907938003540039,
+ "learning_rate": 1.4760719776896205e-05,
+ "loss": 0.3369,
+ "step": 13278
+ },
+ {
+ "epoch": 36.182561307901906,
+ "grad_norm": 6.306649684906006,
+ "learning_rate": 1.4759943687000858e-05,
+ "loss": 0.4182,
+ "step": 13279
+ },
+ {
+ "epoch": 36.18528610354223,
+ "grad_norm": 5.4794230461120605,
+ "learning_rate": 1.4759167560035226e-05,
+ "loss": 0.2356,
+ "step": 13280
+ },
+ {
+ "epoch": 36.18801089918256,
+ "grad_norm": 6.161020755767822,
+ "learning_rate": 1.475839139600535e-05,
+ "loss": 0.3469,
+ "step": 13281
+ },
+ {
+ "epoch": 36.19073569482289,
+ "grad_norm": 7.272459030151367,
+ "learning_rate": 1.4757615194917274e-05,
+ "loss": 0.3511,
+ "step": 13282
+ },
+ {
+ "epoch": 36.19346049046322,
+ "grad_norm": 5.768618106842041,
+ "learning_rate": 1.4756838956777043e-05,
+ "loss": 0.2256,
+ "step": 13283
+ },
+ {
+ "epoch": 36.19618528610354,
+ "grad_norm": 5.862088680267334,
+ "learning_rate": 1.4756062681590706e-05,
+ "loss": 0.286,
+ "step": 13284
+ },
+ {
+ "epoch": 36.19891008174387,
+ "grad_norm": 4.525655269622803,
+ "learning_rate": 1.4755286369364301e-05,
+ "loss": 0.3037,
+ "step": 13285
+ },
+ {
+ "epoch": 36.201634877384194,
+ "grad_norm": 6.0322113037109375,
+ "learning_rate": 1.4754510020103883e-05,
+ "loss": 0.2969,
+ "step": 13286
+ },
+ {
+ "epoch": 36.20435967302452,
+ "grad_norm": 6.035339832305908,
+ "learning_rate": 1.4753733633815492e-05,
+ "loss": 0.2284,
+ "step": 13287
+ },
+ {
+ "epoch": 36.20708446866485,
+ "grad_norm": 5.587437629699707,
+ "learning_rate": 1.4752957210505179e-05,
+ "loss": 0.185,
+ "step": 13288
+ },
+ {
+ "epoch": 36.20980926430518,
+ "grad_norm": 5.474676132202148,
+ "learning_rate": 1.4752180750178986e-05,
+ "loss": 0.2577,
+ "step": 13289
+ },
+ {
+ "epoch": 36.212534059945504,
+ "grad_norm": 7.268446922302246,
+ "learning_rate": 1.4751404252842962e-05,
+ "loss": 0.3511,
+ "step": 13290
+ },
+ {
+ "epoch": 36.21525885558583,
+ "grad_norm": 7.861775875091553,
+ "learning_rate": 1.4750627718503156e-05,
+ "loss": 0.3217,
+ "step": 13291
+ },
+ {
+ "epoch": 36.217983651226156,
+ "grad_norm": 5.511539459228516,
+ "learning_rate": 1.4749851147165615e-05,
+ "loss": 0.3541,
+ "step": 13292
+ },
+ {
+ "epoch": 36.22070844686648,
+ "grad_norm": 6.481141567230225,
+ "learning_rate": 1.4749074538836384e-05,
+ "loss": 0.2819,
+ "step": 13293
+ },
+ {
+ "epoch": 36.223433242506815,
+ "grad_norm": 5.233092784881592,
+ "learning_rate": 1.4748297893521515e-05,
+ "loss": 0.3057,
+ "step": 13294
+ },
+ {
+ "epoch": 36.22615803814714,
+ "grad_norm": 5.9000115394592285,
+ "learning_rate": 1.4747521211227054e-05,
+ "loss": 0.3302,
+ "step": 13295
+ },
+ {
+ "epoch": 36.228882833787466,
+ "grad_norm": 6.1863694190979,
+ "learning_rate": 1.4746744491959049e-05,
+ "loss": 0.341,
+ "step": 13296
+ },
+ {
+ "epoch": 36.23160762942779,
+ "grad_norm": 7.300392150878906,
+ "learning_rate": 1.4745967735723552e-05,
+ "loss": 0.3684,
+ "step": 13297
+ },
+ {
+ "epoch": 36.23433242506812,
+ "grad_norm": 5.948448181152344,
+ "learning_rate": 1.4745190942526613e-05,
+ "loss": 0.3226,
+ "step": 13298
+ },
+ {
+ "epoch": 36.237057220708444,
+ "grad_norm": 5.368710041046143,
+ "learning_rate": 1.4744414112374274e-05,
+ "loss": 0.3194,
+ "step": 13299
+ },
+ {
+ "epoch": 36.23978201634878,
+ "grad_norm": 5.769564151763916,
+ "learning_rate": 1.4743637245272598e-05,
+ "loss": 0.2969,
+ "step": 13300
+ },
+ {
+ "epoch": 36.2425068119891,
+ "grad_norm": 6.390039920806885,
+ "learning_rate": 1.4742860341227622e-05,
+ "loss": 0.2234,
+ "step": 13301
+ },
+ {
+ "epoch": 36.24523160762943,
+ "grad_norm": 5.80669641494751,
+ "learning_rate": 1.4742083400245406e-05,
+ "loss": 0.3753,
+ "step": 13302
+ },
+ {
+ "epoch": 36.247956403269754,
+ "grad_norm": 6.172638416290283,
+ "learning_rate": 1.4741306422331995e-05,
+ "loss": 0.2963,
+ "step": 13303
+ },
+ {
+ "epoch": 36.25068119891008,
+ "grad_norm": 6.281661510467529,
+ "learning_rate": 1.4740529407493444e-05,
+ "loss": 0.2376,
+ "step": 13304
+ },
+ {
+ "epoch": 36.253405994550405,
+ "grad_norm": 6.107354164123535,
+ "learning_rate": 1.4739752355735799e-05,
+ "loss": 0.3358,
+ "step": 13305
+ },
+ {
+ "epoch": 36.25613079019074,
+ "grad_norm": 6.2487969398498535,
+ "learning_rate": 1.4738975267065118e-05,
+ "loss": 0.3114,
+ "step": 13306
+ },
+ {
+ "epoch": 36.258855585831064,
+ "grad_norm": 6.440620422363281,
+ "learning_rate": 1.473819814148745e-05,
+ "loss": 0.2623,
+ "step": 13307
+ },
+ {
+ "epoch": 36.26158038147139,
+ "grad_norm": 6.070278167724609,
+ "learning_rate": 1.473742097900885e-05,
+ "loss": 0.29,
+ "step": 13308
+ },
+ {
+ "epoch": 36.264305177111716,
+ "grad_norm": 6.380928039550781,
+ "learning_rate": 1.4736643779635362e-05,
+ "loss": 0.2677,
+ "step": 13309
+ },
+ {
+ "epoch": 36.26702997275204,
+ "grad_norm": 5.88615083694458,
+ "learning_rate": 1.473586654337305e-05,
+ "loss": 0.3181,
+ "step": 13310
+ },
+ {
+ "epoch": 36.26975476839237,
+ "grad_norm": 4.7790327072143555,
+ "learning_rate": 1.4735089270227958e-05,
+ "loss": 0.3222,
+ "step": 13311
+ },
+ {
+ "epoch": 36.2724795640327,
+ "grad_norm": 5.748852252960205,
+ "learning_rate": 1.4734311960206147e-05,
+ "loss": 0.3753,
+ "step": 13312
+ },
+ {
+ "epoch": 36.275204359673026,
+ "grad_norm": 6.661259174346924,
+ "learning_rate": 1.473353461331366e-05,
+ "loss": 0.3835,
+ "step": 13313
+ },
+ {
+ "epoch": 36.27792915531335,
+ "grad_norm": 5.821951389312744,
+ "learning_rate": 1.4732757229556565e-05,
+ "loss": 0.2562,
+ "step": 13314
+ },
+ {
+ "epoch": 36.28065395095368,
+ "grad_norm": 6.301092624664307,
+ "learning_rate": 1.4731979808940906e-05,
+ "loss": 0.3367,
+ "step": 13315
+ },
+ {
+ "epoch": 36.283378746594,
+ "grad_norm": 7.271420001983643,
+ "learning_rate": 1.4731202351472741e-05,
+ "loss": 0.3906,
+ "step": 13316
+ },
+ {
+ "epoch": 36.28610354223433,
+ "grad_norm": 6.201592445373535,
+ "learning_rate": 1.4730424857158123e-05,
+ "loss": 0.2709,
+ "step": 13317
+ },
+ {
+ "epoch": 36.28882833787466,
+ "grad_norm": 8.571123123168945,
+ "learning_rate": 1.472964732600311e-05,
+ "loss": 0.2953,
+ "step": 13318
+ },
+ {
+ "epoch": 36.29155313351499,
+ "grad_norm": 4.723077297210693,
+ "learning_rate": 1.4728869758013758e-05,
+ "loss": 0.2857,
+ "step": 13319
+ },
+ {
+ "epoch": 36.294277929155314,
+ "grad_norm": 6.588447570800781,
+ "learning_rate": 1.4728092153196119e-05,
+ "loss": 0.2544,
+ "step": 13320
+ },
+ {
+ "epoch": 36.29700272479564,
+ "grad_norm": 5.947713851928711,
+ "learning_rate": 1.4727314511556248e-05,
+ "loss": 0.5516,
+ "step": 13321
+ },
+ {
+ "epoch": 36.299727520435965,
+ "grad_norm": 5.802780628204346,
+ "learning_rate": 1.4726536833100204e-05,
+ "loss": 0.3207,
+ "step": 13322
+ },
+ {
+ "epoch": 36.30245231607629,
+ "grad_norm": 7.036726474761963,
+ "learning_rate": 1.4725759117834045e-05,
+ "loss": 0.2175,
+ "step": 13323
+ },
+ {
+ "epoch": 36.305177111716624,
+ "grad_norm": 5.762254238128662,
+ "learning_rate": 1.4724981365763826e-05,
+ "loss": 0.3055,
+ "step": 13324
+ },
+ {
+ "epoch": 36.30790190735695,
+ "grad_norm": 6.607092380523682,
+ "learning_rate": 1.4724203576895604e-05,
+ "loss": 0.2481,
+ "step": 13325
+ },
+ {
+ "epoch": 36.310626702997276,
+ "grad_norm": 7.0382914543151855,
+ "learning_rate": 1.4723425751235436e-05,
+ "loss": 0.273,
+ "step": 13326
+ },
+ {
+ "epoch": 36.3133514986376,
+ "grad_norm": 5.677168846130371,
+ "learning_rate": 1.4722647888789382e-05,
+ "loss": 0.2465,
+ "step": 13327
+ },
+ {
+ "epoch": 36.31607629427793,
+ "grad_norm": 5.887604713439941,
+ "learning_rate": 1.4721869989563495e-05,
+ "loss": 0.1993,
+ "step": 13328
+ },
+ {
+ "epoch": 36.31880108991825,
+ "grad_norm": 5.209313869476318,
+ "learning_rate": 1.472109205356384e-05,
+ "loss": 0.2846,
+ "step": 13329
+ },
+ {
+ "epoch": 36.321525885558586,
+ "grad_norm": 5.660128593444824,
+ "learning_rate": 1.4720314080796469e-05,
+ "loss": 0.4316,
+ "step": 13330
+ },
+ {
+ "epoch": 36.32425068119891,
+ "grad_norm": 5.628818035125732,
+ "learning_rate": 1.4719536071267443e-05,
+ "loss": 0.1807,
+ "step": 13331
+ },
+ {
+ "epoch": 36.32697547683924,
+ "grad_norm": 7.614799499511719,
+ "learning_rate": 1.4718758024982827e-05,
+ "loss": 0.2442,
+ "step": 13332
+ },
+ {
+ "epoch": 36.32970027247956,
+ "grad_norm": 6.920741081237793,
+ "learning_rate": 1.4717979941948672e-05,
+ "loss": 0.2404,
+ "step": 13333
+ },
+ {
+ "epoch": 36.33242506811989,
+ "grad_norm": 6.268089771270752,
+ "learning_rate": 1.4717201822171043e-05,
+ "loss": 0.2939,
+ "step": 13334
+ },
+ {
+ "epoch": 36.335149863760215,
+ "grad_norm": 7.400482654571533,
+ "learning_rate": 1.4716423665655995e-05,
+ "loss": 0.2523,
+ "step": 13335
+ },
+ {
+ "epoch": 36.33787465940055,
+ "grad_norm": 6.6051506996154785,
+ "learning_rate": 1.4715645472409594e-05,
+ "loss": 0.4303,
+ "step": 13336
+ },
+ {
+ "epoch": 36.34059945504087,
+ "grad_norm": 5.198501110076904,
+ "learning_rate": 1.4714867242437896e-05,
+ "loss": 0.2853,
+ "step": 13337
+ },
+ {
+ "epoch": 36.3433242506812,
+ "grad_norm": 7.610172271728516,
+ "learning_rate": 1.4714088975746967e-05,
+ "loss": 0.2253,
+ "step": 13338
+ },
+ {
+ "epoch": 36.346049046321525,
+ "grad_norm": 5.972766876220703,
+ "learning_rate": 1.471331067234286e-05,
+ "loss": 0.3062,
+ "step": 13339
+ },
+ {
+ "epoch": 36.34877384196185,
+ "grad_norm": 5.427735805511475,
+ "learning_rate": 1.4712532332231644e-05,
+ "loss": 0.2979,
+ "step": 13340
+ },
+ {
+ "epoch": 36.35149863760218,
+ "grad_norm": 5.4658684730529785,
+ "learning_rate": 1.4711753955419376e-05,
+ "loss": 0.2765,
+ "step": 13341
+ },
+ {
+ "epoch": 36.35422343324251,
+ "grad_norm": 9.625960350036621,
+ "learning_rate": 1.4710975541912122e-05,
+ "loss": 0.2669,
+ "step": 13342
+ },
+ {
+ "epoch": 36.356948228882835,
+ "grad_norm": 6.750884532928467,
+ "learning_rate": 1.471019709171594e-05,
+ "loss": 0.2986,
+ "step": 13343
+ },
+ {
+ "epoch": 36.35967302452316,
+ "grad_norm": 8.63830852508545,
+ "learning_rate": 1.4709418604836898e-05,
+ "loss": 0.4565,
+ "step": 13344
+ },
+ {
+ "epoch": 36.36239782016349,
+ "grad_norm": 6.362757205963135,
+ "learning_rate": 1.4708640081281054e-05,
+ "loss": 0.2891,
+ "step": 13345
+ },
+ {
+ "epoch": 36.36512261580381,
+ "grad_norm": 6.810002326965332,
+ "learning_rate": 1.4707861521054471e-05,
+ "loss": 0.1971,
+ "step": 13346
+ },
+ {
+ "epoch": 36.36784741144414,
+ "grad_norm": 5.628415107727051,
+ "learning_rate": 1.4707082924163216e-05,
+ "loss": 0.3101,
+ "step": 13347
+ },
+ {
+ "epoch": 36.37057220708447,
+ "grad_norm": 6.321719169616699,
+ "learning_rate": 1.470630429061335e-05,
+ "loss": 0.2809,
+ "step": 13348
+ },
+ {
+ "epoch": 36.3732970027248,
+ "grad_norm": 9.022990226745605,
+ "learning_rate": 1.4705525620410936e-05,
+ "loss": 0.2779,
+ "step": 13349
+ },
+ {
+ "epoch": 36.37602179836512,
+ "grad_norm": 13.800345420837402,
+ "learning_rate": 1.4704746913562043e-05,
+ "loss": 0.2912,
+ "step": 13350
+ },
+ {
+ "epoch": 36.37874659400545,
+ "grad_norm": 7.537498950958252,
+ "learning_rate": 1.470396817007273e-05,
+ "loss": 0.2954,
+ "step": 13351
+ },
+ {
+ "epoch": 36.381471389645775,
+ "grad_norm": 5.671634197235107,
+ "learning_rate": 1.4703189389949066e-05,
+ "loss": 0.2158,
+ "step": 13352
+ },
+ {
+ "epoch": 36.3841961852861,
+ "grad_norm": 6.502307891845703,
+ "learning_rate": 1.4702410573197112e-05,
+ "loss": 0.3534,
+ "step": 13353
+ },
+ {
+ "epoch": 36.38692098092643,
+ "grad_norm": 5.736046314239502,
+ "learning_rate": 1.4701631719822937e-05,
+ "loss": 0.3752,
+ "step": 13354
+ },
+ {
+ "epoch": 36.38964577656676,
+ "grad_norm": 5.479292869567871,
+ "learning_rate": 1.4700852829832605e-05,
+ "loss": 0.221,
+ "step": 13355
+ },
+ {
+ "epoch": 36.392370572207085,
+ "grad_norm": 5.3284196853637695,
+ "learning_rate": 1.4700073903232184e-05,
+ "loss": 0.2644,
+ "step": 13356
+ },
+ {
+ "epoch": 36.39509536784741,
+ "grad_norm": 5.863639831542969,
+ "learning_rate": 1.469929494002774e-05,
+ "loss": 0.395,
+ "step": 13357
+ },
+ {
+ "epoch": 36.39782016348774,
+ "grad_norm": 6.0642523765563965,
+ "learning_rate": 1.4698515940225333e-05,
+ "loss": 0.2675,
+ "step": 13358
+ },
+ {
+ "epoch": 36.40054495912806,
+ "grad_norm": 7.674149513244629,
+ "learning_rate": 1.4697736903831041e-05,
+ "loss": 0.2501,
+ "step": 13359
+ },
+ {
+ "epoch": 36.403269754768395,
+ "grad_norm": 6.642250061035156,
+ "learning_rate": 1.4696957830850922e-05,
+ "loss": 0.3921,
+ "step": 13360
+ },
+ {
+ "epoch": 36.40599455040872,
+ "grad_norm": 8.71288776397705,
+ "learning_rate": 1.4696178721291048e-05,
+ "loss": 0.3495,
+ "step": 13361
+ },
+ {
+ "epoch": 36.40871934604905,
+ "grad_norm": 8.118603706359863,
+ "learning_rate": 1.4695399575157483e-05,
+ "loss": 0.357,
+ "step": 13362
+ },
+ {
+ "epoch": 36.41144414168937,
+ "grad_norm": 7.166381359100342,
+ "learning_rate": 1.4694620392456299e-05,
+ "loss": 0.2482,
+ "step": 13363
+ },
+ {
+ "epoch": 36.4141689373297,
+ "grad_norm": 6.337353229522705,
+ "learning_rate": 1.4693841173193562e-05,
+ "loss": 0.2439,
+ "step": 13364
+ },
+ {
+ "epoch": 36.416893732970024,
+ "grad_norm": 5.224032402038574,
+ "learning_rate": 1.469306191737534e-05,
+ "loss": 0.306,
+ "step": 13365
+ },
+ {
+ "epoch": 36.41961852861036,
+ "grad_norm": 6.916603088378906,
+ "learning_rate": 1.4692282625007703e-05,
+ "loss": 0.3333,
+ "step": 13366
+ },
+ {
+ "epoch": 36.42234332425068,
+ "grad_norm": 10.736503601074219,
+ "learning_rate": 1.4691503296096721e-05,
+ "loss": 0.3271,
+ "step": 13367
+ },
+ {
+ "epoch": 36.42506811989101,
+ "grad_norm": 6.419002056121826,
+ "learning_rate": 1.4690723930648463e-05,
+ "loss": 0.2392,
+ "step": 13368
+ },
+ {
+ "epoch": 36.427792915531334,
+ "grad_norm": 6.702088832855225,
+ "learning_rate": 1.4689944528668997e-05,
+ "loss": 0.2708,
+ "step": 13369
+ },
+ {
+ "epoch": 36.43051771117166,
+ "grad_norm": 6.408752918243408,
+ "learning_rate": 1.4689165090164395e-05,
+ "loss": 0.2514,
+ "step": 13370
+ },
+ {
+ "epoch": 36.433242506811986,
+ "grad_norm": 6.2014617919921875,
+ "learning_rate": 1.4688385615140726e-05,
+ "loss": 0.2501,
+ "step": 13371
+ },
+ {
+ "epoch": 36.43596730245232,
+ "grad_norm": 8.093091011047363,
+ "learning_rate": 1.4687606103604057e-05,
+ "loss": 0.3111,
+ "step": 13372
+ },
+ {
+ "epoch": 36.438692098092645,
+ "grad_norm": 7.146554946899414,
+ "learning_rate": 1.4686826555560468e-05,
+ "loss": 0.435,
+ "step": 13373
+ },
+ {
+ "epoch": 36.44141689373297,
+ "grad_norm": 5.736241817474365,
+ "learning_rate": 1.468604697101602e-05,
+ "loss": 0.2479,
+ "step": 13374
+ },
+ {
+ "epoch": 36.444141689373296,
+ "grad_norm": 5.841864585876465,
+ "learning_rate": 1.468526734997679e-05,
+ "loss": 0.2032,
+ "step": 13375
+ },
+ {
+ "epoch": 36.44686648501362,
+ "grad_norm": 6.242249965667725,
+ "learning_rate": 1.468448769244885e-05,
+ "loss": 0.2147,
+ "step": 13376
+ },
+ {
+ "epoch": 36.44959128065395,
+ "grad_norm": 5.7653303146362305,
+ "learning_rate": 1.4683707998438273e-05,
+ "loss": 0.3541,
+ "step": 13377
+ },
+ {
+ "epoch": 36.45231607629428,
+ "grad_norm": 6.387267589569092,
+ "learning_rate": 1.4682928267951124e-05,
+ "loss": 0.2736,
+ "step": 13378
+ },
+ {
+ "epoch": 36.45504087193461,
+ "grad_norm": 6.599924087524414,
+ "learning_rate": 1.4682148500993486e-05,
+ "loss": 0.4249,
+ "step": 13379
+ },
+ {
+ "epoch": 36.45776566757493,
+ "grad_norm": 5.238255500793457,
+ "learning_rate": 1.4681368697571421e-05,
+ "loss": 0.2681,
+ "step": 13380
+ },
+ {
+ "epoch": 36.46049046321526,
+ "grad_norm": 5.064724922180176,
+ "learning_rate": 1.4680588857691009e-05,
+ "loss": 0.3273,
+ "step": 13381
+ },
+ {
+ "epoch": 36.463215258855584,
+ "grad_norm": 6.155890464782715,
+ "learning_rate": 1.4679808981358319e-05,
+ "loss": 0.1873,
+ "step": 13382
+ },
+ {
+ "epoch": 36.46594005449591,
+ "grad_norm": 5.978591442108154,
+ "learning_rate": 1.4679029068579432e-05,
+ "loss": 0.3087,
+ "step": 13383
+ },
+ {
+ "epoch": 36.46866485013624,
+ "grad_norm": 5.726358890533447,
+ "learning_rate": 1.4678249119360415e-05,
+ "loss": 0.3177,
+ "step": 13384
+ },
+ {
+ "epoch": 36.47138964577657,
+ "grad_norm": 5.267200469970703,
+ "learning_rate": 1.4677469133707346e-05,
+ "loss": 0.3525,
+ "step": 13385
+ },
+ {
+ "epoch": 36.474114441416894,
+ "grad_norm": 5.896948337554932,
+ "learning_rate": 1.4676689111626294e-05,
+ "loss": 0.3116,
+ "step": 13386
+ },
+ {
+ "epoch": 36.47683923705722,
+ "grad_norm": 5.342823505401611,
+ "learning_rate": 1.4675909053123342e-05,
+ "loss": 0.2621,
+ "step": 13387
+ },
+ {
+ "epoch": 36.479564032697546,
+ "grad_norm": 5.99827241897583,
+ "learning_rate": 1.4675128958204559e-05,
+ "loss": 0.2905,
+ "step": 13388
+ },
+ {
+ "epoch": 36.48228882833787,
+ "grad_norm": 5.374172210693359,
+ "learning_rate": 1.4674348826876024e-05,
+ "loss": 0.4813,
+ "step": 13389
+ },
+ {
+ "epoch": 36.485013623978205,
+ "grad_norm": 5.049845218658447,
+ "learning_rate": 1.4673568659143806e-05,
+ "loss": 0.2846,
+ "step": 13390
+ },
+ {
+ "epoch": 36.48773841961853,
+ "grad_norm": 5.735440731048584,
+ "learning_rate": 1.4672788455013988e-05,
+ "loss": 0.2975,
+ "step": 13391
+ },
+ {
+ "epoch": 36.490463215258856,
+ "grad_norm": 5.560763835906982,
+ "learning_rate": 1.4672008214492643e-05,
+ "loss": 0.3355,
+ "step": 13392
+ },
+ {
+ "epoch": 36.49318801089918,
+ "grad_norm": 7.372814655303955,
+ "learning_rate": 1.4671227937585853e-05,
+ "loss": 0.3286,
+ "step": 13393
+ },
+ {
+ "epoch": 36.49591280653951,
+ "grad_norm": 11.579628944396973,
+ "learning_rate": 1.4670447624299685e-05,
+ "loss": 0.1994,
+ "step": 13394
+ },
+ {
+ "epoch": 36.49863760217983,
+ "grad_norm": 5.694832801818848,
+ "learning_rate": 1.4669667274640227e-05,
+ "loss": 0.249,
+ "step": 13395
+ },
+ {
+ "epoch": 36.50136239782017,
+ "grad_norm": 7.621641159057617,
+ "learning_rate": 1.4668886888613545e-05,
+ "loss": 0.5377,
+ "step": 13396
+ },
+ {
+ "epoch": 36.50408719346049,
+ "grad_norm": 5.279268741607666,
+ "learning_rate": 1.4668106466225724e-05,
+ "loss": 0.3796,
+ "step": 13397
+ },
+ {
+ "epoch": 36.50681198910082,
+ "grad_norm": 5.475941181182861,
+ "learning_rate": 1.466732600748284e-05,
+ "loss": 0.2565,
+ "step": 13398
+ },
+ {
+ "epoch": 36.509536784741144,
+ "grad_norm": 5.412313461303711,
+ "learning_rate": 1.4666545512390971e-05,
+ "loss": 0.3062,
+ "step": 13399
+ },
+ {
+ "epoch": 36.51226158038147,
+ "grad_norm": 6.111344337463379,
+ "learning_rate": 1.4665764980956196e-05,
+ "loss": 0.5159,
+ "step": 13400
+ },
+ {
+ "epoch": 36.514986376021795,
+ "grad_norm": 6.7449564933776855,
+ "learning_rate": 1.4664984413184595e-05,
+ "loss": 0.3046,
+ "step": 13401
+ },
+ {
+ "epoch": 36.51771117166213,
+ "grad_norm": 6.346858501434326,
+ "learning_rate": 1.4664203809082242e-05,
+ "loss": 0.3814,
+ "step": 13402
+ },
+ {
+ "epoch": 36.520435967302454,
+ "grad_norm": 5.561699867248535,
+ "learning_rate": 1.4663423168655224e-05,
+ "loss": 0.3898,
+ "step": 13403
+ },
+ {
+ "epoch": 36.52316076294278,
+ "grad_norm": 7.484636306762695,
+ "learning_rate": 1.4662642491909613e-05,
+ "loss": 0.2744,
+ "step": 13404
+ },
+ {
+ "epoch": 36.525885558583106,
+ "grad_norm": 7.572459697723389,
+ "learning_rate": 1.4661861778851495e-05,
+ "loss": 0.3589,
+ "step": 13405
+ },
+ {
+ "epoch": 36.52861035422343,
+ "grad_norm": 5.904122352600098,
+ "learning_rate": 1.4661081029486947e-05,
+ "loss": 0.2995,
+ "step": 13406
+ },
+ {
+ "epoch": 36.53133514986376,
+ "grad_norm": 6.616388320922852,
+ "learning_rate": 1.466030024382205e-05,
+ "loss": 0.3282,
+ "step": 13407
+ },
+ {
+ "epoch": 36.53405994550409,
+ "grad_norm": 9.58329963684082,
+ "learning_rate": 1.4659519421862882e-05,
+ "loss": 0.3186,
+ "step": 13408
+ },
+ {
+ "epoch": 36.536784741144416,
+ "grad_norm": 4.5477705001831055,
+ "learning_rate": 1.4658738563615528e-05,
+ "loss": 0.3818,
+ "step": 13409
+ },
+ {
+ "epoch": 36.53950953678474,
+ "grad_norm": 6.984385013580322,
+ "learning_rate": 1.4657957669086068e-05,
+ "loss": 0.2544,
+ "step": 13410
+ },
+ {
+ "epoch": 36.54223433242507,
+ "grad_norm": 6.979449272155762,
+ "learning_rate": 1.4657176738280587e-05,
+ "loss": 0.4612,
+ "step": 13411
+ },
+ {
+ "epoch": 36.54495912806539,
+ "grad_norm": 9.876516342163086,
+ "learning_rate": 1.4656395771205159e-05,
+ "loss": 0.2459,
+ "step": 13412
+ },
+ {
+ "epoch": 36.54768392370572,
+ "grad_norm": 8.801257133483887,
+ "learning_rate": 1.4655614767865874e-05,
+ "loss": 0.2674,
+ "step": 13413
+ },
+ {
+ "epoch": 36.55040871934605,
+ "grad_norm": 5.759488105773926,
+ "learning_rate": 1.4654833728268809e-05,
+ "loss": 0.2815,
+ "step": 13414
+ },
+ {
+ "epoch": 36.55313351498638,
+ "grad_norm": 6.719549179077148,
+ "learning_rate": 1.465405265242005e-05,
+ "loss": 0.2354,
+ "step": 13415
+ },
+ {
+ "epoch": 36.555858310626704,
+ "grad_norm": 5.147261619567871,
+ "learning_rate": 1.4653271540325678e-05,
+ "loss": 0.2369,
+ "step": 13416
+ },
+ {
+ "epoch": 36.55858310626703,
+ "grad_norm": 4.3034892082214355,
+ "learning_rate": 1.4652490391991776e-05,
+ "loss": 0.3875,
+ "step": 13417
+ },
+ {
+ "epoch": 36.561307901907355,
+ "grad_norm": 5.992101192474365,
+ "learning_rate": 1.4651709207424427e-05,
+ "loss": 0.2996,
+ "step": 13418
+ },
+ {
+ "epoch": 36.56403269754768,
+ "grad_norm": 7.512600421905518,
+ "learning_rate": 1.4650927986629721e-05,
+ "loss": 0.304,
+ "step": 13419
+ },
+ {
+ "epoch": 36.566757493188014,
+ "grad_norm": 8.687450408935547,
+ "learning_rate": 1.4650146729613735e-05,
+ "loss": 0.315,
+ "step": 13420
+ },
+ {
+ "epoch": 36.56948228882834,
+ "grad_norm": 8.934673309326172,
+ "learning_rate": 1.4649365436382557e-05,
+ "loss": 0.2188,
+ "step": 13421
+ },
+ {
+ "epoch": 36.572207084468666,
+ "grad_norm": 7.995282173156738,
+ "learning_rate": 1.464858410694227e-05,
+ "loss": 0.3398,
+ "step": 13422
+ },
+ {
+ "epoch": 36.57493188010899,
+ "grad_norm": 6.303302764892578,
+ "learning_rate": 1.464780274129896e-05,
+ "loss": 0.6181,
+ "step": 13423
+ },
+ {
+ "epoch": 36.57765667574932,
+ "grad_norm": 5.564570903778076,
+ "learning_rate": 1.464702133945871e-05,
+ "loss": 0.3231,
+ "step": 13424
+ },
+ {
+ "epoch": 36.58038147138964,
+ "grad_norm": 5.620957851409912,
+ "learning_rate": 1.4646239901427608e-05,
+ "loss": 0.2775,
+ "step": 13425
+ },
+ {
+ "epoch": 36.583106267029976,
+ "grad_norm": 7.0095744132995605,
+ "learning_rate": 1.464545842721174e-05,
+ "loss": 0.3576,
+ "step": 13426
+ },
+ {
+ "epoch": 36.5858310626703,
+ "grad_norm": 6.371780872344971,
+ "learning_rate": 1.4644676916817191e-05,
+ "loss": 0.3585,
+ "step": 13427
+ },
+ {
+ "epoch": 36.58855585831063,
+ "grad_norm": 6.885015964508057,
+ "learning_rate": 1.4643895370250048e-05,
+ "loss": 0.232,
+ "step": 13428
+ },
+ {
+ "epoch": 36.59128065395095,
+ "grad_norm": 6.714498996734619,
+ "learning_rate": 1.4643113787516398e-05,
+ "loss": 0.1946,
+ "step": 13429
+ },
+ {
+ "epoch": 36.59400544959128,
+ "grad_norm": 5.592657566070557,
+ "learning_rate": 1.4642332168622326e-05,
+ "loss": 0.3248,
+ "step": 13430
+ },
+ {
+ "epoch": 36.596730245231605,
+ "grad_norm": 5.791368007659912,
+ "learning_rate": 1.4641550513573922e-05,
+ "loss": 0.1738,
+ "step": 13431
+ },
+ {
+ "epoch": 36.59945504087194,
+ "grad_norm": 6.553666591644287,
+ "learning_rate": 1.464076882237727e-05,
+ "loss": 0.3313,
+ "step": 13432
+ },
+ {
+ "epoch": 36.60217983651226,
+ "grad_norm": 5.692700386047363,
+ "learning_rate": 1.4639987095038462e-05,
+ "loss": 0.2475,
+ "step": 13433
+ },
+ {
+ "epoch": 36.60490463215259,
+ "grad_norm": 6.713046073913574,
+ "learning_rate": 1.4639205331563582e-05,
+ "loss": 0.2303,
+ "step": 13434
+ },
+ {
+ "epoch": 36.607629427792915,
+ "grad_norm": 6.671408176422119,
+ "learning_rate": 1.4638423531958719e-05,
+ "loss": 0.3086,
+ "step": 13435
+ },
+ {
+ "epoch": 36.61035422343324,
+ "grad_norm": 7.590618133544922,
+ "learning_rate": 1.4637641696229967e-05,
+ "loss": 0.2469,
+ "step": 13436
+ },
+ {
+ "epoch": 36.61307901907357,
+ "grad_norm": 6.4383087158203125,
+ "learning_rate": 1.4636859824383406e-05,
+ "loss": 0.1952,
+ "step": 13437
+ },
+ {
+ "epoch": 36.6158038147139,
+ "grad_norm": 6.405405044555664,
+ "learning_rate": 1.4636077916425133e-05,
+ "loss": 0.2763,
+ "step": 13438
+ },
+ {
+ "epoch": 36.618528610354225,
+ "grad_norm": 6.324481010437012,
+ "learning_rate": 1.4635295972361235e-05,
+ "loss": 0.3177,
+ "step": 13439
+ },
+ {
+ "epoch": 36.62125340599455,
+ "grad_norm": 6.219964027404785,
+ "learning_rate": 1.4634513992197798e-05,
+ "loss": 0.2487,
+ "step": 13440
+ },
+ {
+ "epoch": 36.62397820163488,
+ "grad_norm": 7.315922737121582,
+ "learning_rate": 1.463373197594092e-05,
+ "loss": 0.2831,
+ "step": 13441
+ },
+ {
+ "epoch": 36.6267029972752,
+ "grad_norm": 6.487116813659668,
+ "learning_rate": 1.4632949923596681e-05,
+ "loss": 0.3255,
+ "step": 13442
+ },
+ {
+ "epoch": 36.62942779291553,
+ "grad_norm": 11.113147735595703,
+ "learning_rate": 1.4632167835171177e-05,
+ "loss": 0.2622,
+ "step": 13443
+ },
+ {
+ "epoch": 36.63215258855586,
+ "grad_norm": 5.978334903717041,
+ "learning_rate": 1.4631385710670505e-05,
+ "loss": 0.4852,
+ "step": 13444
+ },
+ {
+ "epoch": 36.63487738419619,
+ "grad_norm": 5.589931488037109,
+ "learning_rate": 1.4630603550100747e-05,
+ "loss": 0.3033,
+ "step": 13445
+ },
+ {
+ "epoch": 36.63760217983651,
+ "grad_norm": 5.926933288574219,
+ "learning_rate": 1.4629821353467997e-05,
+ "loss": 0.2702,
+ "step": 13446
+ },
+ {
+ "epoch": 36.64032697547684,
+ "grad_norm": 10.75122356414795,
+ "learning_rate": 1.4629039120778345e-05,
+ "loss": 0.2697,
+ "step": 13447
+ },
+ {
+ "epoch": 36.643051771117165,
+ "grad_norm": 7.649288654327393,
+ "learning_rate": 1.462825685203789e-05,
+ "loss": 0.2147,
+ "step": 13448
+ },
+ {
+ "epoch": 36.64577656675749,
+ "grad_norm": 7.236257076263428,
+ "learning_rate": 1.4627474547252718e-05,
+ "loss": 0.3286,
+ "step": 13449
+ },
+ {
+ "epoch": 36.64850136239782,
+ "grad_norm": 7.800262928009033,
+ "learning_rate": 1.462669220642892e-05,
+ "loss": 0.2531,
+ "step": 13450
+ },
+ {
+ "epoch": 36.65122615803815,
+ "grad_norm": 6.149899005889893,
+ "learning_rate": 1.4625909829572596e-05,
+ "loss": 0.2659,
+ "step": 13451
+ },
+ {
+ "epoch": 36.653950953678475,
+ "grad_norm": 10.267043113708496,
+ "learning_rate": 1.4625127416689834e-05,
+ "loss": 0.3417,
+ "step": 13452
+ },
+ {
+ "epoch": 36.6566757493188,
+ "grad_norm": 7.2573652267456055,
+ "learning_rate": 1.4624344967786729e-05,
+ "loss": 0.2353,
+ "step": 13453
+ },
+ {
+ "epoch": 36.65940054495913,
+ "grad_norm": 7.371579170227051,
+ "learning_rate": 1.4623562482869373e-05,
+ "loss": 0.3017,
+ "step": 13454
+ },
+ {
+ "epoch": 36.66212534059945,
+ "grad_norm": 5.899842262268066,
+ "learning_rate": 1.462277996194386e-05,
+ "loss": 0.321,
+ "step": 13455
+ },
+ {
+ "epoch": 36.664850136239785,
+ "grad_norm": 7.154221534729004,
+ "learning_rate": 1.462199740501629e-05,
+ "loss": 0.257,
+ "step": 13456
+ },
+ {
+ "epoch": 36.66757493188011,
+ "grad_norm": 7.6316118240356445,
+ "learning_rate": 1.462121481209275e-05,
+ "loss": 0.4272,
+ "step": 13457
+ },
+ {
+ "epoch": 36.67029972752044,
+ "grad_norm": 6.10270881652832,
+ "learning_rate": 1.4620432183179339e-05,
+ "loss": 0.3264,
+ "step": 13458
+ },
+ {
+ "epoch": 36.67302452316076,
+ "grad_norm": 7.653482913970947,
+ "learning_rate": 1.461964951828215e-05,
+ "loss": 0.3745,
+ "step": 13459
+ },
+ {
+ "epoch": 36.67574931880109,
+ "grad_norm": 6.101099014282227,
+ "learning_rate": 1.4618866817407276e-05,
+ "loss": 0.2604,
+ "step": 13460
+ },
+ {
+ "epoch": 36.678474114441414,
+ "grad_norm": 5.745018482208252,
+ "learning_rate": 1.4618084080560819e-05,
+ "loss": 0.2885,
+ "step": 13461
+ },
+ {
+ "epoch": 36.68119891008175,
+ "grad_norm": 6.850214004516602,
+ "learning_rate": 1.4617301307748872e-05,
+ "loss": 0.2923,
+ "step": 13462
+ },
+ {
+ "epoch": 36.68392370572207,
+ "grad_norm": 6.942055702209473,
+ "learning_rate": 1.461651849897753e-05,
+ "loss": 0.2498,
+ "step": 13463
+ },
+ {
+ "epoch": 36.6866485013624,
+ "grad_norm": 6.727579116821289,
+ "learning_rate": 1.4615735654252894e-05,
+ "loss": 0.2479,
+ "step": 13464
+ },
+ {
+ "epoch": 36.689373297002724,
+ "grad_norm": 5.656120300292969,
+ "learning_rate": 1.4614952773581052e-05,
+ "loss": 0.3414,
+ "step": 13465
+ },
+ {
+ "epoch": 36.69209809264305,
+ "grad_norm": 8.685868263244629,
+ "learning_rate": 1.461416985696811e-05,
+ "loss": 0.335,
+ "step": 13466
+ },
+ {
+ "epoch": 36.694822888283376,
+ "grad_norm": 7.29338264465332,
+ "learning_rate": 1.4613386904420161e-05,
+ "loss": 0.3169,
+ "step": 13467
+ },
+ {
+ "epoch": 36.69754768392371,
+ "grad_norm": 7.772313117980957,
+ "learning_rate": 1.4612603915943302e-05,
+ "loss": 0.422,
+ "step": 13468
+ },
+ {
+ "epoch": 36.700272479564035,
+ "grad_norm": 6.467717170715332,
+ "learning_rate": 1.4611820891543632e-05,
+ "loss": 0.2767,
+ "step": 13469
+ },
+ {
+ "epoch": 36.70299727520436,
+ "grad_norm": 11.327056884765625,
+ "learning_rate": 1.461103783122725e-05,
+ "loss": 0.2394,
+ "step": 13470
+ },
+ {
+ "epoch": 36.705722070844686,
+ "grad_norm": 6.666938781738281,
+ "learning_rate": 1.4610254735000254e-05,
+ "loss": 0.2871,
+ "step": 13471
+ },
+ {
+ "epoch": 36.70844686648501,
+ "grad_norm": 5.195796489715576,
+ "learning_rate": 1.4609471602868743e-05,
+ "loss": 0.4612,
+ "step": 13472
+ },
+ {
+ "epoch": 36.71117166212534,
+ "grad_norm": 6.200788974761963,
+ "learning_rate": 1.4608688434838816e-05,
+ "loss": 0.4299,
+ "step": 13473
+ },
+ {
+ "epoch": 36.71389645776567,
+ "grad_norm": 6.3313140869140625,
+ "learning_rate": 1.460790523091657e-05,
+ "loss": 0.3321,
+ "step": 13474
+ },
+ {
+ "epoch": 36.716621253406,
+ "grad_norm": 6.990638732910156,
+ "learning_rate": 1.4607121991108109e-05,
+ "loss": 0.2406,
+ "step": 13475
+ },
+ {
+ "epoch": 36.71934604904632,
+ "grad_norm": 6.073096752166748,
+ "learning_rate": 1.4606338715419528e-05,
+ "loss": 0.1578,
+ "step": 13476
+ },
+ {
+ "epoch": 36.72207084468665,
+ "grad_norm": 8.439026832580566,
+ "learning_rate": 1.4605555403856928e-05,
+ "loss": 0.3236,
+ "step": 13477
+ },
+ {
+ "epoch": 36.724795640326974,
+ "grad_norm": 5.879141330718994,
+ "learning_rate": 1.4604772056426412e-05,
+ "loss": 0.2809,
+ "step": 13478
+ },
+ {
+ "epoch": 36.7275204359673,
+ "grad_norm": 5.959609031677246,
+ "learning_rate": 1.460398867313408e-05,
+ "loss": 0.3346,
+ "step": 13479
+ },
+ {
+ "epoch": 36.73024523160763,
+ "grad_norm": 7.834115982055664,
+ "learning_rate": 1.4603205253986034e-05,
+ "loss": 0.358,
+ "step": 13480
+ },
+ {
+ "epoch": 36.73297002724796,
+ "grad_norm": 10.48446273803711,
+ "learning_rate": 1.4602421798988371e-05,
+ "loss": 0.39,
+ "step": 13481
+ },
+ {
+ "epoch": 36.735694822888284,
+ "grad_norm": 5.4694366455078125,
+ "learning_rate": 1.4601638308147196e-05,
+ "loss": 0.2053,
+ "step": 13482
+ },
+ {
+ "epoch": 36.73841961852861,
+ "grad_norm": 6.326745986938477,
+ "learning_rate": 1.4600854781468611e-05,
+ "loss": 0.2877,
+ "step": 13483
+ },
+ {
+ "epoch": 36.741144414168936,
+ "grad_norm": 7.83394193649292,
+ "learning_rate": 1.4600071218958718e-05,
+ "loss": 0.2609,
+ "step": 13484
+ },
+ {
+ "epoch": 36.74386920980926,
+ "grad_norm": 6.081604957580566,
+ "learning_rate": 1.4599287620623612e-05,
+ "loss": 0.2216,
+ "step": 13485
+ },
+ {
+ "epoch": 36.746594005449595,
+ "grad_norm": 6.674520969390869,
+ "learning_rate": 1.4598503986469408e-05,
+ "loss": 0.3105,
+ "step": 13486
+ },
+ {
+ "epoch": 36.74931880108992,
+ "grad_norm": 13.587553977966309,
+ "learning_rate": 1.4597720316502201e-05,
+ "loss": 0.3659,
+ "step": 13487
+ },
+ {
+ "epoch": 36.752043596730246,
+ "grad_norm": 5.815481662750244,
+ "learning_rate": 1.4596936610728098e-05,
+ "loss": 0.2341,
+ "step": 13488
+ },
+ {
+ "epoch": 36.75476839237057,
+ "grad_norm": 6.632508754730225,
+ "learning_rate": 1.4596152869153199e-05,
+ "loss": 0.2267,
+ "step": 13489
+ },
+ {
+ "epoch": 36.7574931880109,
+ "grad_norm": 14.098983764648438,
+ "learning_rate": 1.459536909178361e-05,
+ "loss": 0.3257,
+ "step": 13490
+ },
+ {
+ "epoch": 36.76021798365122,
+ "grad_norm": 6.832345485687256,
+ "learning_rate": 1.4594585278625435e-05,
+ "loss": 0.2021,
+ "step": 13491
+ },
+ {
+ "epoch": 36.762942779291556,
+ "grad_norm": 6.347101211547852,
+ "learning_rate": 1.4593801429684778e-05,
+ "loss": 0.4977,
+ "step": 13492
+ },
+ {
+ "epoch": 36.76566757493188,
+ "grad_norm": 6.067656993865967,
+ "learning_rate": 1.4593017544967741e-05,
+ "loss": 0.3394,
+ "step": 13493
+ },
+ {
+ "epoch": 36.76839237057221,
+ "grad_norm": 6.473677635192871,
+ "learning_rate": 1.4592233624480432e-05,
+ "loss": 0.2516,
+ "step": 13494
+ },
+ {
+ "epoch": 36.771117166212534,
+ "grad_norm": 6.269806385040283,
+ "learning_rate": 1.4591449668228954e-05,
+ "loss": 0.3989,
+ "step": 13495
+ },
+ {
+ "epoch": 36.77384196185286,
+ "grad_norm": 6.156412124633789,
+ "learning_rate": 1.4590665676219416e-05,
+ "loss": 0.2751,
+ "step": 13496
+ },
+ {
+ "epoch": 36.776566757493185,
+ "grad_norm": 5.466747760772705,
+ "learning_rate": 1.458988164845792e-05,
+ "loss": 0.2327,
+ "step": 13497
+ },
+ {
+ "epoch": 36.77929155313352,
+ "grad_norm": 6.75571346282959,
+ "learning_rate": 1.4589097584950576e-05,
+ "loss": 0.2463,
+ "step": 13498
+ },
+ {
+ "epoch": 36.782016348773844,
+ "grad_norm": 7.74921178817749,
+ "learning_rate": 1.4588313485703484e-05,
+ "loss": 0.1803,
+ "step": 13499
+ },
+ {
+ "epoch": 36.78474114441417,
+ "grad_norm": 6.87742805480957,
+ "learning_rate": 1.4587529350722758e-05,
+ "loss": 0.3144,
+ "step": 13500
+ },
+ {
+ "epoch": 36.787465940054496,
+ "grad_norm": 6.258539199829102,
+ "learning_rate": 1.4586745180014498e-05,
+ "loss": 0.291,
+ "step": 13501
+ },
+ {
+ "epoch": 36.79019073569482,
+ "grad_norm": 6.405124664306641,
+ "learning_rate": 1.4585960973584819e-05,
+ "loss": 0.2778,
+ "step": 13502
+ },
+ {
+ "epoch": 36.79291553133515,
+ "grad_norm": 6.355350494384766,
+ "learning_rate": 1.4585176731439816e-05,
+ "loss": 0.5846,
+ "step": 13503
+ },
+ {
+ "epoch": 36.79564032697548,
+ "grad_norm": 6.275414943695068,
+ "learning_rate": 1.458439245358561e-05,
+ "loss": 0.2856,
+ "step": 13504
+ },
+ {
+ "epoch": 36.798365122615806,
+ "grad_norm": 6.55458402633667,
+ "learning_rate": 1.4583608140028301e-05,
+ "loss": 0.4235,
+ "step": 13505
+ },
+ {
+ "epoch": 36.80108991825613,
+ "grad_norm": 6.362923622131348,
+ "learning_rate": 1.4582823790774001e-05,
+ "loss": 0.1937,
+ "step": 13506
+ },
+ {
+ "epoch": 36.80381471389646,
+ "grad_norm": 6.119221210479736,
+ "learning_rate": 1.4582039405828813e-05,
+ "loss": 0.2638,
+ "step": 13507
+ },
+ {
+ "epoch": 36.80653950953678,
+ "grad_norm": 6.98737907409668,
+ "learning_rate": 1.4581254985198854e-05,
+ "loss": 0.4198,
+ "step": 13508
+ },
+ {
+ "epoch": 36.80926430517711,
+ "grad_norm": 8.595921516418457,
+ "learning_rate": 1.4580470528890227e-05,
+ "loss": 0.3013,
+ "step": 13509
+ },
+ {
+ "epoch": 36.81198910081744,
+ "grad_norm": 6.572314739227295,
+ "learning_rate": 1.4579686036909043e-05,
+ "loss": 0.2438,
+ "step": 13510
+ },
+ {
+ "epoch": 36.81471389645777,
+ "grad_norm": 6.793776035308838,
+ "learning_rate": 1.457890150926141e-05,
+ "loss": 0.3829,
+ "step": 13511
+ },
+ {
+ "epoch": 36.817438692098094,
+ "grad_norm": 7.48348331451416,
+ "learning_rate": 1.457811694595344e-05,
+ "loss": 0.3203,
+ "step": 13512
+ },
+ {
+ "epoch": 36.82016348773842,
+ "grad_norm": 8.285489082336426,
+ "learning_rate": 1.4577332346991244e-05,
+ "loss": 0.3666,
+ "step": 13513
+ },
+ {
+ "epoch": 36.822888283378745,
+ "grad_norm": 5.748161792755127,
+ "learning_rate": 1.4576547712380931e-05,
+ "loss": 0.2483,
+ "step": 13514
+ },
+ {
+ "epoch": 36.82561307901907,
+ "grad_norm": 8.75537395477295,
+ "learning_rate": 1.457576304212861e-05,
+ "loss": 0.4648,
+ "step": 13515
+ },
+ {
+ "epoch": 36.828337874659404,
+ "grad_norm": 6.129855632781982,
+ "learning_rate": 1.4574978336240396e-05,
+ "loss": 0.3243,
+ "step": 13516
+ },
+ {
+ "epoch": 36.83106267029973,
+ "grad_norm": 6.249845504760742,
+ "learning_rate": 1.4574193594722394e-05,
+ "loss": 0.4031,
+ "step": 13517
+ },
+ {
+ "epoch": 36.833787465940055,
+ "grad_norm": 13.521490097045898,
+ "learning_rate": 1.4573408817580723e-05,
+ "loss": 0.2516,
+ "step": 13518
+ },
+ {
+ "epoch": 36.83651226158038,
+ "grad_norm": 8.591753959655762,
+ "learning_rate": 1.457262400482149e-05,
+ "loss": 0.3831,
+ "step": 13519
+ },
+ {
+ "epoch": 36.83923705722071,
+ "grad_norm": 9.518485069274902,
+ "learning_rate": 1.4571839156450809e-05,
+ "loss": 0.3139,
+ "step": 13520
+ },
+ {
+ "epoch": 36.84196185286103,
+ "grad_norm": 7.928452491760254,
+ "learning_rate": 1.4571054272474791e-05,
+ "loss": 0.3539,
+ "step": 13521
+ },
+ {
+ "epoch": 36.844686648501366,
+ "grad_norm": 6.2169294357299805,
+ "learning_rate": 1.457026935289955e-05,
+ "loss": 0.2234,
+ "step": 13522
+ },
+ {
+ "epoch": 36.84741144414169,
+ "grad_norm": 5.923735618591309,
+ "learning_rate": 1.45694843977312e-05,
+ "loss": 0.2801,
+ "step": 13523
+ },
+ {
+ "epoch": 36.85013623978202,
+ "grad_norm": 6.010656833648682,
+ "learning_rate": 1.456869940697585e-05,
+ "loss": 0.2323,
+ "step": 13524
+ },
+ {
+ "epoch": 36.85286103542234,
+ "grad_norm": 6.384903430938721,
+ "learning_rate": 1.4567914380639617e-05,
+ "loss": 0.3567,
+ "step": 13525
+ },
+ {
+ "epoch": 36.85558583106267,
+ "grad_norm": 6.307415962219238,
+ "learning_rate": 1.4567129318728614e-05,
+ "loss": 0.2615,
+ "step": 13526
+ },
+ {
+ "epoch": 36.858310626702995,
+ "grad_norm": 5.263106346130371,
+ "learning_rate": 1.4566344221248957e-05,
+ "loss": 0.3254,
+ "step": 13527
+ },
+ {
+ "epoch": 36.86103542234333,
+ "grad_norm": 8.703821182250977,
+ "learning_rate": 1.4565559088206753e-05,
+ "loss": 0.2455,
+ "step": 13528
+ },
+ {
+ "epoch": 36.86376021798365,
+ "grad_norm": 7.47613000869751,
+ "learning_rate": 1.4564773919608125e-05,
+ "loss": 0.3584,
+ "step": 13529
+ },
+ {
+ "epoch": 36.86648501362398,
+ "grad_norm": 5.817327499389648,
+ "learning_rate": 1.4563988715459185e-05,
+ "loss": 0.2518,
+ "step": 13530
+ },
+ {
+ "epoch": 36.869209809264305,
+ "grad_norm": 6.253386974334717,
+ "learning_rate": 1.4563203475766048e-05,
+ "loss": 0.3105,
+ "step": 13531
+ },
+ {
+ "epoch": 36.87193460490463,
+ "grad_norm": 6.917342662811279,
+ "learning_rate": 1.4562418200534827e-05,
+ "loss": 0.3243,
+ "step": 13532
+ },
+ {
+ "epoch": 36.87465940054496,
+ "grad_norm": 9.005016326904297,
+ "learning_rate": 1.4561632889771642e-05,
+ "loss": 0.2649,
+ "step": 13533
+ },
+ {
+ "epoch": 36.87738419618529,
+ "grad_norm": 6.099979400634766,
+ "learning_rate": 1.4560847543482605e-05,
+ "loss": 0.4409,
+ "step": 13534
+ },
+ {
+ "epoch": 36.880108991825615,
+ "grad_norm": 6.624093532562256,
+ "learning_rate": 1.4560062161673838e-05,
+ "loss": 0.3391,
+ "step": 13535
+ },
+ {
+ "epoch": 36.88283378746594,
+ "grad_norm": 5.857081413269043,
+ "learning_rate": 1.455927674435145e-05,
+ "loss": 0.3004,
+ "step": 13536
+ },
+ {
+ "epoch": 36.88555858310627,
+ "grad_norm": 6.330967426300049,
+ "learning_rate": 1.4558491291521561e-05,
+ "loss": 0.2773,
+ "step": 13537
+ },
+ {
+ "epoch": 36.88828337874659,
+ "grad_norm": 6.213892459869385,
+ "learning_rate": 1.455770580319029e-05,
+ "loss": 0.4926,
+ "step": 13538
+ },
+ {
+ "epoch": 36.89100817438692,
+ "grad_norm": 6.335833549499512,
+ "learning_rate": 1.4556920279363754e-05,
+ "loss": 0.404,
+ "step": 13539
+ },
+ {
+ "epoch": 36.89373297002725,
+ "grad_norm": 7.174566745758057,
+ "learning_rate": 1.4556134720048066e-05,
+ "loss": 0.3728,
+ "step": 13540
+ },
+ {
+ "epoch": 36.89645776566758,
+ "grad_norm": 12.14997673034668,
+ "learning_rate": 1.4555349125249353e-05,
+ "loss": 0.357,
+ "step": 13541
+ },
+ {
+ "epoch": 36.8991825613079,
+ "grad_norm": 5.641149997711182,
+ "learning_rate": 1.4554563494973721e-05,
+ "loss": 0.5276,
+ "step": 13542
+ },
+ {
+ "epoch": 36.90190735694823,
+ "grad_norm": 7.460294723510742,
+ "learning_rate": 1.45537778292273e-05,
+ "loss": 0.229,
+ "step": 13543
+ },
+ {
+ "epoch": 36.904632152588555,
+ "grad_norm": 5.240541458129883,
+ "learning_rate": 1.4552992128016202e-05,
+ "loss": 0.337,
+ "step": 13544
+ },
+ {
+ "epoch": 36.90735694822888,
+ "grad_norm": 7.271333694458008,
+ "learning_rate": 1.4552206391346548e-05,
+ "loss": 0.521,
+ "step": 13545
+ },
+ {
+ "epoch": 36.91008174386921,
+ "grad_norm": 5.819964408874512,
+ "learning_rate": 1.4551420619224455e-05,
+ "loss": 0.322,
+ "step": 13546
+ },
+ {
+ "epoch": 36.91280653950954,
+ "grad_norm": 6.316477298736572,
+ "learning_rate": 1.4550634811656048e-05,
+ "loss": 0.3957,
+ "step": 13547
+ },
+ {
+ "epoch": 36.915531335149865,
+ "grad_norm": 7.788074016571045,
+ "learning_rate": 1.4549848968647441e-05,
+ "loss": 0.2825,
+ "step": 13548
+ },
+ {
+ "epoch": 36.91825613079019,
+ "grad_norm": 6.44636869430542,
+ "learning_rate": 1.454906309020476e-05,
+ "loss": 0.3064,
+ "step": 13549
+ },
+ {
+ "epoch": 36.920980926430516,
+ "grad_norm": 7.1698832511901855,
+ "learning_rate": 1.4548277176334121e-05,
+ "loss": 0.3694,
+ "step": 13550
+ },
+ {
+ "epoch": 36.92370572207084,
+ "grad_norm": 7.369454860687256,
+ "learning_rate": 1.4547491227041643e-05,
+ "loss": 0.3172,
+ "step": 13551
+ },
+ {
+ "epoch": 36.926430517711175,
+ "grad_norm": 5.6260271072387695,
+ "learning_rate": 1.4546705242333452e-05,
+ "loss": 0.3223,
+ "step": 13552
+ },
+ {
+ "epoch": 36.9291553133515,
+ "grad_norm": 6.899228096008301,
+ "learning_rate": 1.4545919222215668e-05,
+ "loss": 0.5161,
+ "step": 13553
+ },
+ {
+ "epoch": 36.93188010899183,
+ "grad_norm": 5.509049892425537,
+ "learning_rate": 1.4545133166694408e-05,
+ "loss": 0.3986,
+ "step": 13554
+ },
+ {
+ "epoch": 36.93460490463215,
+ "grad_norm": 5.448057174682617,
+ "learning_rate": 1.45443470757758e-05,
+ "loss": 0.2816,
+ "step": 13555
+ },
+ {
+ "epoch": 36.93732970027248,
+ "grad_norm": 6.382065296173096,
+ "learning_rate": 1.4543560949465963e-05,
+ "loss": 0.2829,
+ "step": 13556
+ },
+ {
+ "epoch": 36.940054495912804,
+ "grad_norm": 5.697299003601074,
+ "learning_rate": 1.4542774787771019e-05,
+ "loss": 0.2551,
+ "step": 13557
+ },
+ {
+ "epoch": 36.94277929155314,
+ "grad_norm": 6.731752872467041,
+ "learning_rate": 1.4541988590697089e-05,
+ "loss": 0.3117,
+ "step": 13558
+ },
+ {
+ "epoch": 36.94550408719346,
+ "grad_norm": 6.797028541564941,
+ "learning_rate": 1.4541202358250301e-05,
+ "loss": 0.2345,
+ "step": 13559
+ },
+ {
+ "epoch": 36.94822888283379,
+ "grad_norm": 6.267938613891602,
+ "learning_rate": 1.4540416090436775e-05,
+ "loss": 0.3517,
+ "step": 13560
+ },
+ {
+ "epoch": 36.950953678474114,
+ "grad_norm": 7.315567493438721,
+ "learning_rate": 1.4539629787262635e-05,
+ "loss": 0.3029,
+ "step": 13561
+ },
+ {
+ "epoch": 36.95367847411444,
+ "grad_norm": 5.532219409942627,
+ "learning_rate": 1.4538843448734001e-05,
+ "loss": 0.3416,
+ "step": 13562
+ },
+ {
+ "epoch": 36.956403269754766,
+ "grad_norm": 6.393294334411621,
+ "learning_rate": 1.4538057074857004e-05,
+ "loss": 0.4073,
+ "step": 13563
+ },
+ {
+ "epoch": 36.95912806539509,
+ "grad_norm": 6.493333339691162,
+ "learning_rate": 1.4537270665637762e-05,
+ "loss": 0.2682,
+ "step": 13564
+ },
+ {
+ "epoch": 36.961852861035425,
+ "grad_norm": 6.927456378936768,
+ "learning_rate": 1.4536484221082403e-05,
+ "loss": 0.2459,
+ "step": 13565
+ },
+ {
+ "epoch": 36.96457765667575,
+ "grad_norm": 5.922084808349609,
+ "learning_rate": 1.453569774119705e-05,
+ "loss": 0.3593,
+ "step": 13566
+ },
+ {
+ "epoch": 36.967302452316076,
+ "grad_norm": 5.5476884841918945,
+ "learning_rate": 1.4534911225987832e-05,
+ "loss": 0.4234,
+ "step": 13567
+ },
+ {
+ "epoch": 36.9700272479564,
+ "grad_norm": 6.00234842300415,
+ "learning_rate": 1.4534124675460868e-05,
+ "loss": 0.3124,
+ "step": 13568
+ },
+ {
+ "epoch": 36.97275204359673,
+ "grad_norm": 7.949798583984375,
+ "learning_rate": 1.453333808962229e-05,
+ "loss": 0.3183,
+ "step": 13569
+ },
+ {
+ "epoch": 36.97547683923706,
+ "grad_norm": 12.44044017791748,
+ "learning_rate": 1.4532551468478217e-05,
+ "loss": 0.3472,
+ "step": 13570
+ },
+ {
+ "epoch": 36.97820163487739,
+ "grad_norm": 5.803534030914307,
+ "learning_rate": 1.4531764812034781e-05,
+ "loss": 0.3768,
+ "step": 13571
+ },
+ {
+ "epoch": 36.98092643051771,
+ "grad_norm": 6.589306354522705,
+ "learning_rate": 1.4530978120298108e-05,
+ "loss": 0.2889,
+ "step": 13572
+ },
+ {
+ "epoch": 36.98365122615804,
+ "grad_norm": 7.242832183837891,
+ "learning_rate": 1.4530191393274322e-05,
+ "loss": 0.2752,
+ "step": 13573
+ },
+ {
+ "epoch": 36.986376021798364,
+ "grad_norm": 10.549457550048828,
+ "learning_rate": 1.452940463096955e-05,
+ "loss": 0.2005,
+ "step": 13574
+ },
+ {
+ "epoch": 36.98910081743869,
+ "grad_norm": 8.42289924621582,
+ "learning_rate": 1.4528617833389925e-05,
+ "loss": 0.3764,
+ "step": 13575
+ },
+ {
+ "epoch": 36.991825613079016,
+ "grad_norm": 5.723546981811523,
+ "learning_rate": 1.4527831000541564e-05,
+ "loss": 0.3205,
+ "step": 13576
+ },
+ {
+ "epoch": 36.99455040871935,
+ "grad_norm": 7.526780605316162,
+ "learning_rate": 1.4527044132430605e-05,
+ "loss": 0.4643,
+ "step": 13577
+ },
+ {
+ "epoch": 36.997275204359674,
+ "grad_norm": 5.826638698577881,
+ "learning_rate": 1.452625722906317e-05,
+ "loss": 0.3167,
+ "step": 13578
+ },
+ {
+ "epoch": 37.0,
+ "grad_norm": 6.392323970794678,
+ "learning_rate": 1.4525470290445392e-05,
+ "loss": 0.2362,
+ "step": 13579
+ },
+ {
+ "epoch": 37.002724795640326,
+ "grad_norm": 5.40487003326416,
+ "learning_rate": 1.4524683316583392e-05,
+ "loss": 0.3614,
+ "step": 13580
+ },
+ {
+ "epoch": 37.00544959128065,
+ "grad_norm": 6.00352668762207,
+ "learning_rate": 1.4523896307483308e-05,
+ "loss": 0.3345,
+ "step": 13581
+ },
+ {
+ "epoch": 37.00817438692098,
+ "grad_norm": 5.279332160949707,
+ "learning_rate": 1.4523109263151262e-05,
+ "loss": 0.2882,
+ "step": 13582
+ },
+ {
+ "epoch": 37.01089918256131,
+ "grad_norm": 5.116689682006836,
+ "learning_rate": 1.4522322183593392e-05,
+ "loss": 0.2096,
+ "step": 13583
+ },
+ {
+ "epoch": 37.013623978201636,
+ "grad_norm": 5.397965908050537,
+ "learning_rate": 1.4521535068815817e-05,
+ "loss": 0.3013,
+ "step": 13584
+ },
+ {
+ "epoch": 37.01634877384196,
+ "grad_norm": 10.295614242553711,
+ "learning_rate": 1.4520747918824676e-05,
+ "loss": 0.2728,
+ "step": 13585
+ },
+ {
+ "epoch": 37.01907356948229,
+ "grad_norm": 6.142119884490967,
+ "learning_rate": 1.4519960733626093e-05,
+ "loss": 0.2662,
+ "step": 13586
+ },
+ {
+ "epoch": 37.02179836512261,
+ "grad_norm": 5.42104434967041,
+ "learning_rate": 1.4519173513226203e-05,
+ "loss": 0.255,
+ "step": 13587
+ },
+ {
+ "epoch": 37.02452316076294,
+ "grad_norm": 6.4026618003845215,
+ "learning_rate": 1.4518386257631135e-05,
+ "loss": 0.2265,
+ "step": 13588
+ },
+ {
+ "epoch": 37.02724795640327,
+ "grad_norm": 5.611619472503662,
+ "learning_rate": 1.4517598966847019e-05,
+ "loss": 0.3412,
+ "step": 13589
+ },
+ {
+ "epoch": 37.0299727520436,
+ "grad_norm": 5.409390926361084,
+ "learning_rate": 1.4516811640879988e-05,
+ "loss": 0.2619,
+ "step": 13590
+ },
+ {
+ "epoch": 37.032697547683924,
+ "grad_norm": 4.898901462554932,
+ "learning_rate": 1.4516024279736177e-05,
+ "loss": 0.3071,
+ "step": 13591
+ },
+ {
+ "epoch": 37.03542234332425,
+ "grad_norm": 5.6210479736328125,
+ "learning_rate": 1.4515236883421708e-05,
+ "loss": 0.1871,
+ "step": 13592
+ },
+ {
+ "epoch": 37.038147138964575,
+ "grad_norm": 5.9645161628723145,
+ "learning_rate": 1.4514449451942725e-05,
+ "loss": 0.3825,
+ "step": 13593
+ },
+ {
+ "epoch": 37.0408719346049,
+ "grad_norm": 5.265384674072266,
+ "learning_rate": 1.4513661985305351e-05,
+ "loss": 0.3369,
+ "step": 13594
+ },
+ {
+ "epoch": 37.043596730245234,
+ "grad_norm": 6.3180832862854,
+ "learning_rate": 1.4512874483515727e-05,
+ "loss": 0.3513,
+ "step": 13595
+ },
+ {
+ "epoch": 37.04632152588556,
+ "grad_norm": 5.28624153137207,
+ "learning_rate": 1.4512086946579977e-05,
+ "loss": 0.4906,
+ "step": 13596
+ },
+ {
+ "epoch": 37.049046321525886,
+ "grad_norm": 5.494368553161621,
+ "learning_rate": 1.4511299374504242e-05,
+ "loss": 0.3748,
+ "step": 13597
+ },
+ {
+ "epoch": 37.05177111716621,
+ "grad_norm": 6.383624076843262,
+ "learning_rate": 1.4510511767294653e-05,
+ "loss": 0.1972,
+ "step": 13598
+ },
+ {
+ "epoch": 37.05449591280654,
+ "grad_norm": 7.064739227294922,
+ "learning_rate": 1.4509724124957341e-05,
+ "loss": 0.2488,
+ "step": 13599
+ },
+ {
+ "epoch": 37.05722070844686,
+ "grad_norm": 5.792699337005615,
+ "learning_rate": 1.4508936447498442e-05,
+ "loss": 0.2599,
+ "step": 13600
+ },
+ {
+ "epoch": 37.059945504087196,
+ "grad_norm": 6.29413366317749,
+ "learning_rate": 1.4508148734924095e-05,
+ "loss": 0.2135,
+ "step": 13601
+ },
+ {
+ "epoch": 37.06267029972752,
+ "grad_norm": 11.314350128173828,
+ "learning_rate": 1.4507360987240429e-05,
+ "loss": 0.2141,
+ "step": 13602
+ },
+ {
+ "epoch": 37.06539509536785,
+ "grad_norm": 6.594211101531982,
+ "learning_rate": 1.450657320445358e-05,
+ "loss": 0.4008,
+ "step": 13603
+ },
+ {
+ "epoch": 37.06811989100817,
+ "grad_norm": 6.072294235229492,
+ "learning_rate": 1.4505785386569686e-05,
+ "loss": 0.2754,
+ "step": 13604
+ },
+ {
+ "epoch": 37.0708446866485,
+ "grad_norm": 7.498562812805176,
+ "learning_rate": 1.4504997533594881e-05,
+ "loss": 0.2602,
+ "step": 13605
+ },
+ {
+ "epoch": 37.073569482288825,
+ "grad_norm": 7.032705307006836,
+ "learning_rate": 1.4504209645535294e-05,
+ "loss": 0.259,
+ "step": 13606
+ },
+ {
+ "epoch": 37.07629427792916,
+ "grad_norm": 6.204941749572754,
+ "learning_rate": 1.450342172239707e-05,
+ "loss": 0.2395,
+ "step": 13607
+ },
+ {
+ "epoch": 37.079019073569484,
+ "grad_norm": 6.8277907371521,
+ "learning_rate": 1.4502633764186346e-05,
+ "loss": 0.3278,
+ "step": 13608
+ },
+ {
+ "epoch": 37.08174386920981,
+ "grad_norm": 5.717363357543945,
+ "learning_rate": 1.4501845770909253e-05,
+ "loss": 0.2976,
+ "step": 13609
+ },
+ {
+ "epoch": 37.084468664850135,
+ "grad_norm": 4.983062267303467,
+ "learning_rate": 1.4501057742571931e-05,
+ "loss": 0.2898,
+ "step": 13610
+ },
+ {
+ "epoch": 37.08719346049046,
+ "grad_norm": 6.429154396057129,
+ "learning_rate": 1.4500269679180513e-05,
+ "loss": 0.4847,
+ "step": 13611
+ },
+ {
+ "epoch": 37.08991825613079,
+ "grad_norm": 5.963826656341553,
+ "learning_rate": 1.4499481580741144e-05,
+ "loss": 0.2522,
+ "step": 13612
+ },
+ {
+ "epoch": 37.09264305177112,
+ "grad_norm": 6.59958028793335,
+ "learning_rate": 1.4498693447259956e-05,
+ "loss": 0.3997,
+ "step": 13613
+ },
+ {
+ "epoch": 37.095367847411445,
+ "grad_norm": 4.506076812744141,
+ "learning_rate": 1.4497905278743086e-05,
+ "loss": 0.2088,
+ "step": 13614
+ },
+ {
+ "epoch": 37.09809264305177,
+ "grad_norm": 6.12763786315918,
+ "learning_rate": 1.4497117075196677e-05,
+ "loss": 0.2474,
+ "step": 13615
+ },
+ {
+ "epoch": 37.1008174386921,
+ "grad_norm": 7.154154300689697,
+ "learning_rate": 1.4496328836626863e-05,
+ "loss": 0.3685,
+ "step": 13616
+ },
+ {
+ "epoch": 37.10354223433242,
+ "grad_norm": 6.3774285316467285,
+ "learning_rate": 1.4495540563039785e-05,
+ "loss": 0.2685,
+ "step": 13617
+ },
+ {
+ "epoch": 37.10626702997275,
+ "grad_norm": 4.6779279708862305,
+ "learning_rate": 1.4494752254441585e-05,
+ "loss": 0.2375,
+ "step": 13618
+ },
+ {
+ "epoch": 37.10899182561308,
+ "grad_norm": 5.380875110626221,
+ "learning_rate": 1.4493963910838393e-05,
+ "loss": 0.391,
+ "step": 13619
+ },
+ {
+ "epoch": 37.11171662125341,
+ "grad_norm": 5.728816986083984,
+ "learning_rate": 1.4493175532236361e-05,
+ "loss": 0.2866,
+ "step": 13620
+ },
+ {
+ "epoch": 37.11444141689373,
+ "grad_norm": 5.909167289733887,
+ "learning_rate": 1.4492387118641618e-05,
+ "loss": 0.2805,
+ "step": 13621
+ },
+ {
+ "epoch": 37.11716621253406,
+ "grad_norm": 5.537550926208496,
+ "learning_rate": 1.4491598670060312e-05,
+ "loss": 0.3844,
+ "step": 13622
+ },
+ {
+ "epoch": 37.119891008174385,
+ "grad_norm": 5.119868278503418,
+ "learning_rate": 1.4490810186498577e-05,
+ "loss": 0.2268,
+ "step": 13623
+ },
+ {
+ "epoch": 37.12261580381471,
+ "grad_norm": 7.367032051086426,
+ "learning_rate": 1.4490021667962556e-05,
+ "loss": 0.2613,
+ "step": 13624
+ },
+ {
+ "epoch": 37.12534059945504,
+ "grad_norm": 5.83549690246582,
+ "learning_rate": 1.4489233114458394e-05,
+ "loss": 0.3523,
+ "step": 13625
+ },
+ {
+ "epoch": 37.12806539509537,
+ "grad_norm": 5.785162448883057,
+ "learning_rate": 1.448844452599223e-05,
+ "loss": 0.3449,
+ "step": 13626
+ },
+ {
+ "epoch": 37.130790190735695,
+ "grad_norm": 5.571055889129639,
+ "learning_rate": 1.4487655902570201e-05,
+ "loss": 0.3671,
+ "step": 13627
+ },
+ {
+ "epoch": 37.13351498637602,
+ "grad_norm": 6.009766578674316,
+ "learning_rate": 1.4486867244198455e-05,
+ "loss": 0.3368,
+ "step": 13628
+ },
+ {
+ "epoch": 37.13623978201635,
+ "grad_norm": 6.343024730682373,
+ "learning_rate": 1.4486078550883129e-05,
+ "loss": 0.2497,
+ "step": 13629
+ },
+ {
+ "epoch": 37.13896457765667,
+ "grad_norm": 5.5884599685668945,
+ "learning_rate": 1.448528982263037e-05,
+ "loss": 0.224,
+ "step": 13630
+ },
+ {
+ "epoch": 37.141689373297005,
+ "grad_norm": 5.679103851318359,
+ "learning_rate": 1.4484501059446317e-05,
+ "loss": 0.3214,
+ "step": 13631
+ },
+ {
+ "epoch": 37.14441416893733,
+ "grad_norm": 4.739778518676758,
+ "learning_rate": 1.4483712261337113e-05,
+ "loss": 0.3524,
+ "step": 13632
+ },
+ {
+ "epoch": 37.14713896457766,
+ "grad_norm": 8.464988708496094,
+ "learning_rate": 1.4482923428308904e-05,
+ "loss": 0.4272,
+ "step": 13633
+ },
+ {
+ "epoch": 37.14986376021798,
+ "grad_norm": 5.842249870300293,
+ "learning_rate": 1.448213456036783e-05,
+ "loss": 0.2496,
+ "step": 13634
+ },
+ {
+ "epoch": 37.15258855585831,
+ "grad_norm": 5.07939338684082,
+ "learning_rate": 1.4481345657520036e-05,
+ "loss": 0.4718,
+ "step": 13635
+ },
+ {
+ "epoch": 37.155313351498634,
+ "grad_norm": 6.1155595779418945,
+ "learning_rate": 1.4480556719771671e-05,
+ "loss": 0.2461,
+ "step": 13636
+ },
+ {
+ "epoch": 37.15803814713897,
+ "grad_norm": 7.305619239807129,
+ "learning_rate": 1.447976774712887e-05,
+ "loss": 0.1876,
+ "step": 13637
+ },
+ {
+ "epoch": 37.16076294277929,
+ "grad_norm": 5.101131916046143,
+ "learning_rate": 1.4478978739597781e-05,
+ "loss": 0.2981,
+ "step": 13638
+ },
+ {
+ "epoch": 37.16348773841962,
+ "grad_norm": 6.35480260848999,
+ "learning_rate": 1.4478189697184553e-05,
+ "loss": 0.1937,
+ "step": 13639
+ },
+ {
+ "epoch": 37.166212534059945,
+ "grad_norm": 4.870874881744385,
+ "learning_rate": 1.4477400619895326e-05,
+ "loss": 0.1893,
+ "step": 13640
+ },
+ {
+ "epoch": 37.16893732970027,
+ "grad_norm": 5.622579574584961,
+ "learning_rate": 1.4476611507736244e-05,
+ "loss": 0.2455,
+ "step": 13641
+ },
+ {
+ "epoch": 37.171662125340596,
+ "grad_norm": 6.2390947341918945,
+ "learning_rate": 1.4475822360713463e-05,
+ "loss": 0.3851,
+ "step": 13642
+ },
+ {
+ "epoch": 37.17438692098093,
+ "grad_norm": 7.213648319244385,
+ "learning_rate": 1.4475033178833116e-05,
+ "loss": 0.2074,
+ "step": 13643
+ },
+ {
+ "epoch": 37.177111716621255,
+ "grad_norm": 5.573960304260254,
+ "learning_rate": 1.4474243962101357e-05,
+ "loss": 0.2524,
+ "step": 13644
+ },
+ {
+ "epoch": 37.17983651226158,
+ "grad_norm": 6.93544340133667,
+ "learning_rate": 1.4473454710524328e-05,
+ "loss": 0.2539,
+ "step": 13645
+ },
+ {
+ "epoch": 37.182561307901906,
+ "grad_norm": 6.557056903839111,
+ "learning_rate": 1.447266542410818e-05,
+ "loss": 0.2092,
+ "step": 13646
+ },
+ {
+ "epoch": 37.18528610354223,
+ "grad_norm": 6.192226409912109,
+ "learning_rate": 1.4471876102859057e-05,
+ "loss": 0.2141,
+ "step": 13647
+ },
+ {
+ "epoch": 37.18801089918256,
+ "grad_norm": 6.104713439941406,
+ "learning_rate": 1.4471086746783108e-05,
+ "loss": 0.3153,
+ "step": 13648
+ },
+ {
+ "epoch": 37.19073569482289,
+ "grad_norm": 6.464320182800293,
+ "learning_rate": 1.4470297355886476e-05,
+ "loss": 0.2886,
+ "step": 13649
+ },
+ {
+ "epoch": 37.19346049046322,
+ "grad_norm": 6.354846954345703,
+ "learning_rate": 1.4469507930175313e-05,
+ "loss": 0.2008,
+ "step": 13650
+ },
+ {
+ "epoch": 37.19618528610354,
+ "grad_norm": 6.795820236206055,
+ "learning_rate": 1.4468718469655766e-05,
+ "loss": 0.2286,
+ "step": 13651
+ },
+ {
+ "epoch": 37.19891008174387,
+ "grad_norm": 6.503321647644043,
+ "learning_rate": 1.4467928974333987e-05,
+ "loss": 0.3454,
+ "step": 13652
+ },
+ {
+ "epoch": 37.201634877384194,
+ "grad_norm": 5.964447975158691,
+ "learning_rate": 1.4467139444216117e-05,
+ "loss": 0.3126,
+ "step": 13653
+ },
+ {
+ "epoch": 37.20435967302452,
+ "grad_norm": 5.265637397766113,
+ "learning_rate": 1.446634987930831e-05,
+ "loss": 0.2384,
+ "step": 13654
+ },
+ {
+ "epoch": 37.20708446866485,
+ "grad_norm": 5.736026287078857,
+ "learning_rate": 1.4465560279616714e-05,
+ "loss": 0.1817,
+ "step": 13655
+ },
+ {
+ "epoch": 37.20980926430518,
+ "grad_norm": 6.372326850891113,
+ "learning_rate": 1.446477064514748e-05,
+ "loss": 0.2786,
+ "step": 13656
+ },
+ {
+ "epoch": 37.212534059945504,
+ "grad_norm": 9.852974891662598,
+ "learning_rate": 1.4463980975906753e-05,
+ "loss": 0.293,
+ "step": 13657
+ },
+ {
+ "epoch": 37.21525885558583,
+ "grad_norm": 5.008190631866455,
+ "learning_rate": 1.4463191271900686e-05,
+ "loss": 0.1955,
+ "step": 13658
+ },
+ {
+ "epoch": 37.217983651226156,
+ "grad_norm": 5.530735015869141,
+ "learning_rate": 1.4462401533135429e-05,
+ "loss": 0.2639,
+ "step": 13659
+ },
+ {
+ "epoch": 37.22070844686648,
+ "grad_norm": 6.269716739654541,
+ "learning_rate": 1.4461611759617134e-05,
+ "loss": 0.1737,
+ "step": 13660
+ },
+ {
+ "epoch": 37.223433242506815,
+ "grad_norm": 6.597443580627441,
+ "learning_rate": 1.446082195135195e-05,
+ "loss": 0.3604,
+ "step": 13661
+ },
+ {
+ "epoch": 37.22615803814714,
+ "grad_norm": 7.4416375160217285,
+ "learning_rate": 1.4460032108346029e-05,
+ "loss": 0.3043,
+ "step": 13662
+ },
+ {
+ "epoch": 37.228882833787466,
+ "grad_norm": 6.190356731414795,
+ "learning_rate": 1.445924223060552e-05,
+ "loss": 0.4641,
+ "step": 13663
+ },
+ {
+ "epoch": 37.23160762942779,
+ "grad_norm": 5.487213134765625,
+ "learning_rate": 1.4458452318136575e-05,
+ "loss": 0.2169,
+ "step": 13664
+ },
+ {
+ "epoch": 37.23433242506812,
+ "grad_norm": 7.421302795410156,
+ "learning_rate": 1.4457662370945348e-05,
+ "loss": 0.2897,
+ "step": 13665
+ },
+ {
+ "epoch": 37.237057220708444,
+ "grad_norm": 6.267577171325684,
+ "learning_rate": 1.445687238903799e-05,
+ "loss": 0.3732,
+ "step": 13666
+ },
+ {
+ "epoch": 37.23978201634878,
+ "grad_norm": 5.17593240737915,
+ "learning_rate": 1.4456082372420652e-05,
+ "loss": 0.3845,
+ "step": 13667
+ },
+ {
+ "epoch": 37.2425068119891,
+ "grad_norm": 4.650514602661133,
+ "learning_rate": 1.4455292321099492e-05,
+ "loss": 0.4111,
+ "step": 13668
+ },
+ {
+ "epoch": 37.24523160762943,
+ "grad_norm": 5.345720291137695,
+ "learning_rate": 1.4454502235080654e-05,
+ "loss": 0.2173,
+ "step": 13669
+ },
+ {
+ "epoch": 37.247956403269754,
+ "grad_norm": 5.987113952636719,
+ "learning_rate": 1.44537121143703e-05,
+ "loss": 0.3471,
+ "step": 13670
+ },
+ {
+ "epoch": 37.25068119891008,
+ "grad_norm": 5.843854904174805,
+ "learning_rate": 1.4452921958974578e-05,
+ "loss": 0.2214,
+ "step": 13671
+ },
+ {
+ "epoch": 37.253405994550405,
+ "grad_norm": 6.542635917663574,
+ "learning_rate": 1.4452131768899641e-05,
+ "loss": 0.2692,
+ "step": 13672
+ },
+ {
+ "epoch": 37.25613079019074,
+ "grad_norm": 12.215797424316406,
+ "learning_rate": 1.4451341544151647e-05,
+ "loss": 0.3048,
+ "step": 13673
+ },
+ {
+ "epoch": 37.258855585831064,
+ "grad_norm": 6.043381214141846,
+ "learning_rate": 1.4450551284736748e-05,
+ "loss": 0.3226,
+ "step": 13674
+ },
+ {
+ "epoch": 37.26158038147139,
+ "grad_norm": 6.124060153961182,
+ "learning_rate": 1.4449760990661098e-05,
+ "loss": 0.2841,
+ "step": 13675
+ },
+ {
+ "epoch": 37.264305177111716,
+ "grad_norm": 5.762239456176758,
+ "learning_rate": 1.4448970661930854e-05,
+ "loss": 0.2475,
+ "step": 13676
+ },
+ {
+ "epoch": 37.26702997275204,
+ "grad_norm": 6.271738052368164,
+ "learning_rate": 1.4448180298552168e-05,
+ "loss": 0.2762,
+ "step": 13677
+ },
+ {
+ "epoch": 37.26975476839237,
+ "grad_norm": 5.748197555541992,
+ "learning_rate": 1.4447389900531199e-05,
+ "loss": 0.2891,
+ "step": 13678
+ },
+ {
+ "epoch": 37.2724795640327,
+ "grad_norm": 5.341134071350098,
+ "learning_rate": 1.44465994678741e-05,
+ "loss": 0.2315,
+ "step": 13679
+ },
+ {
+ "epoch": 37.275204359673026,
+ "grad_norm": 6.73088264465332,
+ "learning_rate": 1.4445809000587027e-05,
+ "loss": 0.3155,
+ "step": 13680
+ },
+ {
+ "epoch": 37.27792915531335,
+ "grad_norm": 10.141463279724121,
+ "learning_rate": 1.4445018498676135e-05,
+ "loss": 0.4325,
+ "step": 13681
+ },
+ {
+ "epoch": 37.28065395095368,
+ "grad_norm": 6.6343207359313965,
+ "learning_rate": 1.4444227962147586e-05,
+ "loss": 0.4275,
+ "step": 13682
+ },
+ {
+ "epoch": 37.283378746594,
+ "grad_norm": 6.762706756591797,
+ "learning_rate": 1.4443437391007531e-05,
+ "loss": 0.2278,
+ "step": 13683
+ },
+ {
+ "epoch": 37.28610354223433,
+ "grad_norm": 6.540870189666748,
+ "learning_rate": 1.4442646785262126e-05,
+ "loss": 0.4446,
+ "step": 13684
+ },
+ {
+ "epoch": 37.28882833787466,
+ "grad_norm": 5.8193206787109375,
+ "learning_rate": 1.4441856144917535e-05,
+ "loss": 0.4615,
+ "step": 13685
+ },
+ {
+ "epoch": 37.29155313351499,
+ "grad_norm": 5.472895622253418,
+ "learning_rate": 1.4441065469979908e-05,
+ "loss": 0.3626,
+ "step": 13686
+ },
+ {
+ "epoch": 37.294277929155314,
+ "grad_norm": 5.899320602416992,
+ "learning_rate": 1.4440274760455406e-05,
+ "loss": 0.3423,
+ "step": 13687
+ },
+ {
+ "epoch": 37.29700272479564,
+ "grad_norm": 6.971601486206055,
+ "learning_rate": 1.443948401635019e-05,
+ "loss": 0.2655,
+ "step": 13688
+ },
+ {
+ "epoch": 37.299727520435965,
+ "grad_norm": 5.75792932510376,
+ "learning_rate": 1.4438693237670412e-05,
+ "loss": 0.3479,
+ "step": 13689
+ },
+ {
+ "epoch": 37.30245231607629,
+ "grad_norm": 5.564891815185547,
+ "learning_rate": 1.4437902424422236e-05,
+ "loss": 0.468,
+ "step": 13690
+ },
+ {
+ "epoch": 37.305177111716624,
+ "grad_norm": 5.492071628570557,
+ "learning_rate": 1.443711157661182e-05,
+ "loss": 0.2078,
+ "step": 13691
+ },
+ {
+ "epoch": 37.30790190735695,
+ "grad_norm": 4.296332359313965,
+ "learning_rate": 1.4436320694245318e-05,
+ "loss": 0.1584,
+ "step": 13692
+ },
+ {
+ "epoch": 37.310626702997276,
+ "grad_norm": 4.209894180297852,
+ "learning_rate": 1.4435529777328895e-05,
+ "loss": 0.1995,
+ "step": 13693
+ },
+ {
+ "epoch": 37.3133514986376,
+ "grad_norm": 5.265773296356201,
+ "learning_rate": 1.443473882586871e-05,
+ "loss": 0.2421,
+ "step": 13694
+ },
+ {
+ "epoch": 37.31607629427793,
+ "grad_norm": 4.542918682098389,
+ "learning_rate": 1.4433947839870924e-05,
+ "loss": 0.2087,
+ "step": 13695
+ },
+ {
+ "epoch": 37.31880108991825,
+ "grad_norm": 9.200000762939453,
+ "learning_rate": 1.443315681934169e-05,
+ "loss": 0.2547,
+ "step": 13696
+ },
+ {
+ "epoch": 37.321525885558586,
+ "grad_norm": 6.090592861175537,
+ "learning_rate": 1.4432365764287175e-05,
+ "loss": 0.325,
+ "step": 13697
+ },
+ {
+ "epoch": 37.32425068119891,
+ "grad_norm": 6.258579730987549,
+ "learning_rate": 1.4431574674713538e-05,
+ "loss": 0.312,
+ "step": 13698
+ },
+ {
+ "epoch": 37.32697547683924,
+ "grad_norm": 5.172791004180908,
+ "learning_rate": 1.443078355062694e-05,
+ "loss": 0.1498,
+ "step": 13699
+ },
+ {
+ "epoch": 37.32970027247956,
+ "grad_norm": 5.496511459350586,
+ "learning_rate": 1.4429992392033545e-05,
+ "loss": 0.4258,
+ "step": 13700
+ },
+ {
+ "epoch": 37.33242506811989,
+ "grad_norm": 6.028332710266113,
+ "learning_rate": 1.4429201198939508e-05,
+ "loss": 0.2749,
+ "step": 13701
+ },
+ {
+ "epoch": 37.335149863760215,
+ "grad_norm": 7.874242305755615,
+ "learning_rate": 1.4428409971350994e-05,
+ "loss": 0.2789,
+ "step": 13702
+ },
+ {
+ "epoch": 37.33787465940055,
+ "grad_norm": 5.639641284942627,
+ "learning_rate": 1.442761870927417e-05,
+ "loss": 0.1975,
+ "step": 13703
+ },
+ {
+ "epoch": 37.34059945504087,
+ "grad_norm": 6.8148884773254395,
+ "learning_rate": 1.4426827412715192e-05,
+ "loss": 0.3941,
+ "step": 13704
+ },
+ {
+ "epoch": 37.3433242506812,
+ "grad_norm": 8.138447761535645,
+ "learning_rate": 1.4426036081680223e-05,
+ "loss": 0.2075,
+ "step": 13705
+ },
+ {
+ "epoch": 37.346049046321525,
+ "grad_norm": 5.802258014678955,
+ "learning_rate": 1.4425244716175431e-05,
+ "loss": 0.4133,
+ "step": 13706
+ },
+ {
+ "epoch": 37.34877384196185,
+ "grad_norm": 8.083141326904297,
+ "learning_rate": 1.4424453316206974e-05,
+ "loss": 0.3503,
+ "step": 13707
+ },
+ {
+ "epoch": 37.35149863760218,
+ "grad_norm": 4.53306770324707,
+ "learning_rate": 1.4423661881781014e-05,
+ "loss": 0.1835,
+ "step": 13708
+ },
+ {
+ "epoch": 37.35422343324251,
+ "grad_norm": 6.26450777053833,
+ "learning_rate": 1.442287041290372e-05,
+ "loss": 0.3317,
+ "step": 13709
+ },
+ {
+ "epoch": 37.356948228882835,
+ "grad_norm": 5.232570648193359,
+ "learning_rate": 1.4422078909581253e-05,
+ "loss": 0.25,
+ "step": 13710
+ },
+ {
+ "epoch": 37.35967302452316,
+ "grad_norm": 5.264657974243164,
+ "learning_rate": 1.4421287371819781e-05,
+ "loss": 0.2209,
+ "step": 13711
+ },
+ {
+ "epoch": 37.36239782016349,
+ "grad_norm": 5.533340930938721,
+ "learning_rate": 1.442049579962546e-05,
+ "loss": 0.2596,
+ "step": 13712
+ },
+ {
+ "epoch": 37.36512261580381,
+ "grad_norm": 6.200746059417725,
+ "learning_rate": 1.4419704193004464e-05,
+ "loss": 0.2444,
+ "step": 13713
+ },
+ {
+ "epoch": 37.36784741144414,
+ "grad_norm": 6.443899631500244,
+ "learning_rate": 1.4418912551962953e-05,
+ "loss": 0.2205,
+ "step": 13714
+ },
+ {
+ "epoch": 37.37057220708447,
+ "grad_norm": 7.062668323516846,
+ "learning_rate": 1.4418120876507093e-05,
+ "loss": 0.1915,
+ "step": 13715
+ },
+ {
+ "epoch": 37.3732970027248,
+ "grad_norm": 7.006562232971191,
+ "learning_rate": 1.441732916664305e-05,
+ "loss": 0.333,
+ "step": 13716
+ },
+ {
+ "epoch": 37.37602179836512,
+ "grad_norm": 6.008820533752441,
+ "learning_rate": 1.441653742237699e-05,
+ "loss": 0.3147,
+ "step": 13717
+ },
+ {
+ "epoch": 37.37874659400545,
+ "grad_norm": 6.851540565490723,
+ "learning_rate": 1.4415745643715075e-05,
+ "loss": 0.2743,
+ "step": 13718
+ },
+ {
+ "epoch": 37.381471389645775,
+ "grad_norm": 5.677096843719482,
+ "learning_rate": 1.4414953830663478e-05,
+ "loss": 0.4421,
+ "step": 13719
+ },
+ {
+ "epoch": 37.3841961852861,
+ "grad_norm": 5.402856349945068,
+ "learning_rate": 1.4414161983228362e-05,
+ "loss": 0.297,
+ "step": 13720
+ },
+ {
+ "epoch": 37.38692098092643,
+ "grad_norm": 4.693260192871094,
+ "learning_rate": 1.4413370101415898e-05,
+ "loss": 0.189,
+ "step": 13721
+ },
+ {
+ "epoch": 37.38964577656676,
+ "grad_norm": 7.506068706512451,
+ "learning_rate": 1.4412578185232246e-05,
+ "loss": 0.435,
+ "step": 13722
+ },
+ {
+ "epoch": 37.392370572207085,
+ "grad_norm": 6.2235283851623535,
+ "learning_rate": 1.441178623468358e-05,
+ "loss": 0.3595,
+ "step": 13723
+ },
+ {
+ "epoch": 37.39509536784741,
+ "grad_norm": 6.36119270324707,
+ "learning_rate": 1.441099424977606e-05,
+ "loss": 0.2841,
+ "step": 13724
+ },
+ {
+ "epoch": 37.39782016348774,
+ "grad_norm": 5.588457107543945,
+ "learning_rate": 1.4410202230515865e-05,
+ "loss": 0.162,
+ "step": 13725
+ },
+ {
+ "epoch": 37.40054495912806,
+ "grad_norm": 5.098292827606201,
+ "learning_rate": 1.440941017690915e-05,
+ "loss": 0.1873,
+ "step": 13726
+ },
+ {
+ "epoch": 37.403269754768395,
+ "grad_norm": 7.046430587768555,
+ "learning_rate": 1.4408618088962096e-05,
+ "loss": 0.3149,
+ "step": 13727
+ },
+ {
+ "epoch": 37.40599455040872,
+ "grad_norm": 5.249959468841553,
+ "learning_rate": 1.4407825966680862e-05,
+ "loss": 0.2182,
+ "step": 13728
+ },
+ {
+ "epoch": 37.40871934604905,
+ "grad_norm": 9.688139915466309,
+ "learning_rate": 1.4407033810071624e-05,
+ "loss": 0.2852,
+ "step": 13729
+ },
+ {
+ "epoch": 37.41144414168937,
+ "grad_norm": 4.626587867736816,
+ "learning_rate": 1.4406241619140549e-05,
+ "loss": 0.1972,
+ "step": 13730
+ },
+ {
+ "epoch": 37.4141689373297,
+ "grad_norm": 5.785120964050293,
+ "learning_rate": 1.4405449393893807e-05,
+ "loss": 0.2773,
+ "step": 13731
+ },
+ {
+ "epoch": 37.416893732970024,
+ "grad_norm": 6.856450080871582,
+ "learning_rate": 1.4404657134337562e-05,
+ "loss": 0.2383,
+ "step": 13732
+ },
+ {
+ "epoch": 37.41961852861036,
+ "grad_norm": 5.6097259521484375,
+ "learning_rate": 1.4403864840477994e-05,
+ "loss": 0.4141,
+ "step": 13733
+ },
+ {
+ "epoch": 37.42234332425068,
+ "grad_norm": 8.284987449645996,
+ "learning_rate": 1.4403072512321266e-05,
+ "loss": 0.2511,
+ "step": 13734
+ },
+ {
+ "epoch": 37.42506811989101,
+ "grad_norm": 8.898246765136719,
+ "learning_rate": 1.440228014987355e-05,
+ "loss": 0.2932,
+ "step": 13735
+ },
+ {
+ "epoch": 37.427792915531334,
+ "grad_norm": 5.818563461303711,
+ "learning_rate": 1.440148775314102e-05,
+ "loss": 0.2899,
+ "step": 13736
+ },
+ {
+ "epoch": 37.43051771117166,
+ "grad_norm": 5.395720481872559,
+ "learning_rate": 1.4400695322129846e-05,
+ "loss": 0.3019,
+ "step": 13737
+ },
+ {
+ "epoch": 37.433242506811986,
+ "grad_norm": 5.264636039733887,
+ "learning_rate": 1.4399902856846195e-05,
+ "loss": 0.2049,
+ "step": 13738
+ },
+ {
+ "epoch": 37.43596730245232,
+ "grad_norm": 6.397223949432373,
+ "learning_rate": 1.4399110357296244e-05,
+ "loss": 0.3132,
+ "step": 13739
+ },
+ {
+ "epoch": 37.438692098092645,
+ "grad_norm": 5.450150489807129,
+ "learning_rate": 1.4398317823486164e-05,
+ "loss": 0.2116,
+ "step": 13740
+ },
+ {
+ "epoch": 37.44141689373297,
+ "grad_norm": 5.349878311157227,
+ "learning_rate": 1.4397525255422125e-05,
+ "loss": 0.2759,
+ "step": 13741
+ },
+ {
+ "epoch": 37.444141689373296,
+ "grad_norm": 7.868896961212158,
+ "learning_rate": 1.4396732653110302e-05,
+ "loss": 0.2057,
+ "step": 13742
+ },
+ {
+ "epoch": 37.44686648501362,
+ "grad_norm": 10.411602973937988,
+ "learning_rate": 1.4395940016556867e-05,
+ "loss": 0.2873,
+ "step": 13743
+ },
+ {
+ "epoch": 37.44959128065395,
+ "grad_norm": 7.2601542472839355,
+ "learning_rate": 1.4395147345767988e-05,
+ "loss": 0.4367,
+ "step": 13744
+ },
+ {
+ "epoch": 37.45231607629428,
+ "grad_norm": 5.517092227935791,
+ "learning_rate": 1.4394354640749848e-05,
+ "loss": 0.2008,
+ "step": 13745
+ },
+ {
+ "epoch": 37.45504087193461,
+ "grad_norm": 8.747833251953125,
+ "learning_rate": 1.4393561901508613e-05,
+ "loss": 0.2881,
+ "step": 13746
+ },
+ {
+ "epoch": 37.45776566757493,
+ "grad_norm": 5.685414791107178,
+ "learning_rate": 1.439276912805046e-05,
+ "loss": 0.2178,
+ "step": 13747
+ },
+ {
+ "epoch": 37.46049046321526,
+ "grad_norm": 5.122185230255127,
+ "learning_rate": 1.4391976320381562e-05,
+ "loss": 0.166,
+ "step": 13748
+ },
+ {
+ "epoch": 37.463215258855584,
+ "grad_norm": 7.064228057861328,
+ "learning_rate": 1.4391183478508098e-05,
+ "loss": 0.2955,
+ "step": 13749
+ },
+ {
+ "epoch": 37.46594005449591,
+ "grad_norm": 7.867053031921387,
+ "learning_rate": 1.4390390602436232e-05,
+ "loss": 0.2117,
+ "step": 13750
+ },
+ {
+ "epoch": 37.46866485013624,
+ "grad_norm": 5.2257466316223145,
+ "learning_rate": 1.438959769217215e-05,
+ "loss": 0.3257,
+ "step": 13751
+ },
+ {
+ "epoch": 37.47138964577657,
+ "grad_norm": 6.032914638519287,
+ "learning_rate": 1.4388804747722018e-05,
+ "loss": 0.2724,
+ "step": 13752
+ },
+ {
+ "epoch": 37.474114441416894,
+ "grad_norm": 5.87555456161499,
+ "learning_rate": 1.4388011769092018e-05,
+ "loss": 0.2836,
+ "step": 13753
+ },
+ {
+ "epoch": 37.47683923705722,
+ "grad_norm": 5.952106952667236,
+ "learning_rate": 1.4387218756288323e-05,
+ "loss": 0.3994,
+ "step": 13754
+ },
+ {
+ "epoch": 37.479564032697546,
+ "grad_norm": 6.191522598266602,
+ "learning_rate": 1.4386425709317113e-05,
+ "loss": 0.2023,
+ "step": 13755
+ },
+ {
+ "epoch": 37.48228882833787,
+ "grad_norm": 6.224193096160889,
+ "learning_rate": 1.4385632628184558e-05,
+ "loss": 0.2334,
+ "step": 13756
+ },
+ {
+ "epoch": 37.485013623978205,
+ "grad_norm": 7.023881912231445,
+ "learning_rate": 1.4384839512896837e-05,
+ "loss": 0.2537,
+ "step": 13757
+ },
+ {
+ "epoch": 37.48773841961853,
+ "grad_norm": 6.266427516937256,
+ "learning_rate": 1.4384046363460129e-05,
+ "loss": 0.2319,
+ "step": 13758
+ },
+ {
+ "epoch": 37.490463215258856,
+ "grad_norm": 6.77350378036499,
+ "learning_rate": 1.4383253179880607e-05,
+ "loss": 0.5074,
+ "step": 13759
+ },
+ {
+ "epoch": 37.49318801089918,
+ "grad_norm": 5.959731101989746,
+ "learning_rate": 1.4382459962164452e-05,
+ "loss": 0.2427,
+ "step": 13760
+ },
+ {
+ "epoch": 37.49591280653951,
+ "grad_norm": 6.488434314727783,
+ "learning_rate": 1.4381666710317837e-05,
+ "loss": 0.2007,
+ "step": 13761
+ },
+ {
+ "epoch": 37.49863760217983,
+ "grad_norm": 7.6190185546875,
+ "learning_rate": 1.4380873424346945e-05,
+ "loss": 0.2081,
+ "step": 13762
+ },
+ {
+ "epoch": 37.50136239782017,
+ "grad_norm": 8.222481727600098,
+ "learning_rate": 1.438008010425795e-05,
+ "loss": 0.3317,
+ "step": 13763
+ },
+ {
+ "epoch": 37.50408719346049,
+ "grad_norm": 7.253337860107422,
+ "learning_rate": 1.4379286750057033e-05,
+ "loss": 0.2043,
+ "step": 13764
+ },
+ {
+ "epoch": 37.50681198910082,
+ "grad_norm": 18.86480140686035,
+ "learning_rate": 1.4378493361750374e-05,
+ "loss": 0.3537,
+ "step": 13765
+ },
+ {
+ "epoch": 37.509536784741144,
+ "grad_norm": 6.140002250671387,
+ "learning_rate": 1.4377699939344148e-05,
+ "loss": 0.2787,
+ "step": 13766
+ },
+ {
+ "epoch": 37.51226158038147,
+ "grad_norm": 6.517630100250244,
+ "learning_rate": 1.4376906482844534e-05,
+ "loss": 0.2522,
+ "step": 13767
+ },
+ {
+ "epoch": 37.514986376021795,
+ "grad_norm": 5.6096649169921875,
+ "learning_rate": 1.4376112992257714e-05,
+ "loss": 0.2505,
+ "step": 13768
+ },
+ {
+ "epoch": 37.51771117166213,
+ "grad_norm": 6.280866622924805,
+ "learning_rate": 1.4375319467589868e-05,
+ "loss": 0.3471,
+ "step": 13769
+ },
+ {
+ "epoch": 37.520435967302454,
+ "grad_norm": 5.432213306427002,
+ "learning_rate": 1.4374525908847175e-05,
+ "loss": 0.24,
+ "step": 13770
+ },
+ {
+ "epoch": 37.52316076294278,
+ "grad_norm": 6.034014701843262,
+ "learning_rate": 1.4373732316035813e-05,
+ "loss": 0.2612,
+ "step": 13771
+ },
+ {
+ "epoch": 37.525885558583106,
+ "grad_norm": 5.9695000648498535,
+ "learning_rate": 1.4372938689161969e-05,
+ "loss": 0.3268,
+ "step": 13772
+ },
+ {
+ "epoch": 37.52861035422343,
+ "grad_norm": 6.036328315734863,
+ "learning_rate": 1.4372145028231814e-05,
+ "loss": 0.2262,
+ "step": 13773
+ },
+ {
+ "epoch": 37.53133514986376,
+ "grad_norm": 5.686705112457275,
+ "learning_rate": 1.4371351333251535e-05,
+ "loss": 0.2376,
+ "step": 13774
+ },
+ {
+ "epoch": 37.53405994550409,
+ "grad_norm": 6.202902793884277,
+ "learning_rate": 1.4370557604227316e-05,
+ "loss": 0.3719,
+ "step": 13775
+ },
+ {
+ "epoch": 37.536784741144416,
+ "grad_norm": 6.547354698181152,
+ "learning_rate": 1.4369763841165331e-05,
+ "loss": 0.2327,
+ "step": 13776
+ },
+ {
+ "epoch": 37.53950953678474,
+ "grad_norm": 12.354787826538086,
+ "learning_rate": 1.4368970044071768e-05,
+ "loss": 0.2022,
+ "step": 13777
+ },
+ {
+ "epoch": 37.54223433242507,
+ "grad_norm": 4.935760974884033,
+ "learning_rate": 1.4368176212952807e-05,
+ "loss": 0.2329,
+ "step": 13778
+ },
+ {
+ "epoch": 37.54495912806539,
+ "grad_norm": 6.330197811126709,
+ "learning_rate": 1.4367382347814628e-05,
+ "loss": 0.226,
+ "step": 13779
+ },
+ {
+ "epoch": 37.54768392370572,
+ "grad_norm": 5.834701061248779,
+ "learning_rate": 1.436658844866342e-05,
+ "loss": 0.3147,
+ "step": 13780
+ },
+ {
+ "epoch": 37.55040871934605,
+ "grad_norm": 5.683170795440674,
+ "learning_rate": 1.4365794515505359e-05,
+ "loss": 0.2083,
+ "step": 13781
+ },
+ {
+ "epoch": 37.55313351498638,
+ "grad_norm": 7.662569046020508,
+ "learning_rate": 1.4365000548346633e-05,
+ "loss": 0.3043,
+ "step": 13782
+ },
+ {
+ "epoch": 37.555858310626704,
+ "grad_norm": 6.115015506744385,
+ "learning_rate": 1.436420654719342e-05,
+ "loss": 0.2692,
+ "step": 13783
+ },
+ {
+ "epoch": 37.55858310626703,
+ "grad_norm": 7.078417778015137,
+ "learning_rate": 1.4363412512051908e-05,
+ "loss": 0.228,
+ "step": 13784
+ },
+ {
+ "epoch": 37.561307901907355,
+ "grad_norm": 6.246332168579102,
+ "learning_rate": 1.436261844292828e-05,
+ "loss": 0.3627,
+ "step": 13785
+ },
+ {
+ "epoch": 37.56403269754768,
+ "grad_norm": 6.897421836853027,
+ "learning_rate": 1.4361824339828718e-05,
+ "loss": 0.3459,
+ "step": 13786
+ },
+ {
+ "epoch": 37.566757493188014,
+ "grad_norm": 6.10270357131958,
+ "learning_rate": 1.4361030202759412e-05,
+ "loss": 0.3805,
+ "step": 13787
+ },
+ {
+ "epoch": 37.56948228882834,
+ "grad_norm": 6.087770938873291,
+ "learning_rate": 1.4360236031726543e-05,
+ "loss": 0.2395,
+ "step": 13788
+ },
+ {
+ "epoch": 37.572207084468666,
+ "grad_norm": 5.868922233581543,
+ "learning_rate": 1.4359441826736294e-05,
+ "loss": 0.3105,
+ "step": 13789
+ },
+ {
+ "epoch": 37.57493188010899,
+ "grad_norm": 6.516274452209473,
+ "learning_rate": 1.4358647587794851e-05,
+ "loss": 0.285,
+ "step": 13790
+ },
+ {
+ "epoch": 37.57765667574932,
+ "grad_norm": 6.568358898162842,
+ "learning_rate": 1.4357853314908403e-05,
+ "loss": 0.2906,
+ "step": 13791
+ },
+ {
+ "epoch": 37.58038147138964,
+ "grad_norm": 5.451956272125244,
+ "learning_rate": 1.4357059008083133e-05,
+ "loss": 0.3814,
+ "step": 13792
+ },
+ {
+ "epoch": 37.583106267029976,
+ "grad_norm": 6.1217427253723145,
+ "learning_rate": 1.4356264667325231e-05,
+ "loss": 0.2633,
+ "step": 13793
+ },
+ {
+ "epoch": 37.5858310626703,
+ "grad_norm": 5.793474197387695,
+ "learning_rate": 1.4355470292640879e-05,
+ "loss": 0.3409,
+ "step": 13794
+ },
+ {
+ "epoch": 37.58855585831063,
+ "grad_norm": 7.553661823272705,
+ "learning_rate": 1.4354675884036257e-05,
+ "loss": 0.3251,
+ "step": 13795
+ },
+ {
+ "epoch": 37.59128065395095,
+ "grad_norm": 5.576457500457764,
+ "learning_rate": 1.4353881441517568e-05,
+ "loss": 0.3749,
+ "step": 13796
+ },
+ {
+ "epoch": 37.59400544959128,
+ "grad_norm": 4.476280212402344,
+ "learning_rate": 1.4353086965090985e-05,
+ "loss": 0.2102,
+ "step": 13797
+ },
+ {
+ "epoch": 37.596730245231605,
+ "grad_norm": 5.663008689880371,
+ "learning_rate": 1.4352292454762705e-05,
+ "loss": 0.2438,
+ "step": 13798
+ },
+ {
+ "epoch": 37.59945504087194,
+ "grad_norm": 7.217907428741455,
+ "learning_rate": 1.435149791053891e-05,
+ "loss": 0.296,
+ "step": 13799
+ },
+ {
+ "epoch": 37.60217983651226,
+ "grad_norm": 6.813621997833252,
+ "learning_rate": 1.4350703332425791e-05,
+ "loss": 0.3095,
+ "step": 13800
+ },
+ {
+ "epoch": 37.60490463215259,
+ "grad_norm": 6.3153815269470215,
+ "learning_rate": 1.4349908720429531e-05,
+ "loss": 0.4815,
+ "step": 13801
+ },
+ {
+ "epoch": 37.607629427792915,
+ "grad_norm": 6.94346809387207,
+ "learning_rate": 1.4349114074556326e-05,
+ "loss": 0.3065,
+ "step": 13802
+ },
+ {
+ "epoch": 37.61035422343324,
+ "grad_norm": 6.070793151855469,
+ "learning_rate": 1.4348319394812355e-05,
+ "loss": 0.227,
+ "step": 13803
+ },
+ {
+ "epoch": 37.61307901907357,
+ "grad_norm": 9.789314270019531,
+ "learning_rate": 1.4347524681203817e-05,
+ "loss": 0.2587,
+ "step": 13804
+ },
+ {
+ "epoch": 37.6158038147139,
+ "grad_norm": 5.945764064788818,
+ "learning_rate": 1.4346729933736894e-05,
+ "loss": 0.3088,
+ "step": 13805
+ },
+ {
+ "epoch": 37.618528610354225,
+ "grad_norm": 5.794508457183838,
+ "learning_rate": 1.434593515241778e-05,
+ "loss": 0.3408,
+ "step": 13806
+ },
+ {
+ "epoch": 37.62125340599455,
+ "grad_norm": 5.566441059112549,
+ "learning_rate": 1.4345140337252663e-05,
+ "loss": 0.412,
+ "step": 13807
+ },
+ {
+ "epoch": 37.62397820163488,
+ "grad_norm": 5.600670337677002,
+ "learning_rate": 1.4344345488247733e-05,
+ "loss": 0.2984,
+ "step": 13808
+ },
+ {
+ "epoch": 37.6267029972752,
+ "grad_norm": 6.36623477935791,
+ "learning_rate": 1.4343550605409178e-05,
+ "loss": 0.374,
+ "step": 13809
+ },
+ {
+ "epoch": 37.62942779291553,
+ "grad_norm": 7.658454895019531,
+ "learning_rate": 1.4342755688743192e-05,
+ "loss": 0.2512,
+ "step": 13810
+ },
+ {
+ "epoch": 37.63215258855586,
+ "grad_norm": 6.459691524505615,
+ "learning_rate": 1.4341960738255965e-05,
+ "loss": 0.3131,
+ "step": 13811
+ },
+ {
+ "epoch": 37.63487738419619,
+ "grad_norm": 5.796911239624023,
+ "learning_rate": 1.4341165753953688e-05,
+ "loss": 0.2245,
+ "step": 13812
+ },
+ {
+ "epoch": 37.63760217983651,
+ "grad_norm": 6.59001350402832,
+ "learning_rate": 1.4340370735842548e-05,
+ "loss": 0.3234,
+ "step": 13813
+ },
+ {
+ "epoch": 37.64032697547684,
+ "grad_norm": 5.7899370193481445,
+ "learning_rate": 1.4339575683928746e-05,
+ "loss": 0.2126,
+ "step": 13814
+ },
+ {
+ "epoch": 37.643051771117165,
+ "grad_norm": 5.424726963043213,
+ "learning_rate": 1.4338780598218465e-05,
+ "loss": 0.3813,
+ "step": 13815
+ },
+ {
+ "epoch": 37.64577656675749,
+ "grad_norm": 6.8555989265441895,
+ "learning_rate": 1.4337985478717902e-05,
+ "loss": 0.2491,
+ "step": 13816
+ },
+ {
+ "epoch": 37.64850136239782,
+ "grad_norm": 7.039730548858643,
+ "learning_rate": 1.4337190325433246e-05,
+ "loss": 0.2726,
+ "step": 13817
+ },
+ {
+ "epoch": 37.65122615803815,
+ "grad_norm": 5.639499664306641,
+ "learning_rate": 1.4336395138370694e-05,
+ "loss": 0.2294,
+ "step": 13818
+ },
+ {
+ "epoch": 37.653950953678475,
+ "grad_norm": 6.956472873687744,
+ "learning_rate": 1.4335599917536432e-05,
+ "loss": 0.252,
+ "step": 13819
+ },
+ {
+ "epoch": 37.6566757493188,
+ "grad_norm": 10.79681396484375,
+ "learning_rate": 1.4334804662936661e-05,
+ "loss": 0.3697,
+ "step": 13820
+ },
+ {
+ "epoch": 37.65940054495913,
+ "grad_norm": 6.606871128082275,
+ "learning_rate": 1.4334009374577566e-05,
+ "loss": 0.2361,
+ "step": 13821
+ },
+ {
+ "epoch": 37.66212534059945,
+ "grad_norm": 6.776033401489258,
+ "learning_rate": 1.433321405246535e-05,
+ "loss": 0.2047,
+ "step": 13822
+ },
+ {
+ "epoch": 37.664850136239785,
+ "grad_norm": 6.886871814727783,
+ "learning_rate": 1.43324186966062e-05,
+ "loss": 0.2916,
+ "step": 13823
+ },
+ {
+ "epoch": 37.66757493188011,
+ "grad_norm": 5.7386040687561035,
+ "learning_rate": 1.4331623307006316e-05,
+ "loss": 0.2835,
+ "step": 13824
+ },
+ {
+ "epoch": 37.67029972752044,
+ "grad_norm": 7.095458030700684,
+ "learning_rate": 1.4330827883671885e-05,
+ "loss": 0.258,
+ "step": 13825
+ },
+ {
+ "epoch": 37.67302452316076,
+ "grad_norm": 9.257341384887695,
+ "learning_rate": 1.433003242660911e-05,
+ "loss": 0.3476,
+ "step": 13826
+ },
+ {
+ "epoch": 37.67574931880109,
+ "grad_norm": 11.596256256103516,
+ "learning_rate": 1.432923693582418e-05,
+ "loss": 0.287,
+ "step": 13827
+ },
+ {
+ "epoch": 37.678474114441414,
+ "grad_norm": 4.983880043029785,
+ "learning_rate": 1.4328441411323292e-05,
+ "loss": 0.3643,
+ "step": 13828
+ },
+ {
+ "epoch": 37.68119891008175,
+ "grad_norm": 8.73643970489502,
+ "learning_rate": 1.432764585311264e-05,
+ "loss": 0.2546,
+ "step": 13829
+ },
+ {
+ "epoch": 37.68392370572207,
+ "grad_norm": 14.080904960632324,
+ "learning_rate": 1.4326850261198422e-05,
+ "loss": 0.4435,
+ "step": 13830
+ },
+ {
+ "epoch": 37.6866485013624,
+ "grad_norm": 7.07788610458374,
+ "learning_rate": 1.4326054635586833e-05,
+ "loss": 0.1955,
+ "step": 13831
+ },
+ {
+ "epoch": 37.689373297002724,
+ "grad_norm": 6.612051486968994,
+ "learning_rate": 1.4325258976284073e-05,
+ "loss": 0.346,
+ "step": 13832
+ },
+ {
+ "epoch": 37.69209809264305,
+ "grad_norm": 8.311551094055176,
+ "learning_rate": 1.4324463283296332e-05,
+ "loss": 0.235,
+ "step": 13833
+ },
+ {
+ "epoch": 37.694822888283376,
+ "grad_norm": 6.00632381439209,
+ "learning_rate": 1.4323667556629812e-05,
+ "loss": 0.2324,
+ "step": 13834
+ },
+ {
+ "epoch": 37.69754768392371,
+ "grad_norm": 24.169116973876953,
+ "learning_rate": 1.4322871796290707e-05,
+ "loss": 0.3493,
+ "step": 13835
+ },
+ {
+ "epoch": 37.700272479564035,
+ "grad_norm": 5.777043342590332,
+ "learning_rate": 1.4322076002285216e-05,
+ "loss": 0.3258,
+ "step": 13836
+ },
+ {
+ "epoch": 37.70299727520436,
+ "grad_norm": 7.018303871154785,
+ "learning_rate": 1.4321280174619538e-05,
+ "loss": 0.351,
+ "step": 13837
+ },
+ {
+ "epoch": 37.705722070844686,
+ "grad_norm": 8.782502174377441,
+ "learning_rate": 1.4320484313299865e-05,
+ "loss": 0.2552,
+ "step": 13838
+ },
+ {
+ "epoch": 37.70844686648501,
+ "grad_norm": 7.098335266113281,
+ "learning_rate": 1.43196884183324e-05,
+ "loss": 0.2238,
+ "step": 13839
+ },
+ {
+ "epoch": 37.71117166212534,
+ "grad_norm": 5.654666900634766,
+ "learning_rate": 1.4318892489723345e-05,
+ "loss": 0.3625,
+ "step": 13840
+ },
+ {
+ "epoch": 37.71389645776567,
+ "grad_norm": 6.63136625289917,
+ "learning_rate": 1.431809652747889e-05,
+ "loss": 0.2601,
+ "step": 13841
+ },
+ {
+ "epoch": 37.716621253406,
+ "grad_norm": 15.09497356414795,
+ "learning_rate": 1.4317300531605241e-05,
+ "loss": 0.4105,
+ "step": 13842
+ },
+ {
+ "epoch": 37.71934604904632,
+ "grad_norm": 8.670364379882812,
+ "learning_rate": 1.4316504502108592e-05,
+ "loss": 0.3698,
+ "step": 13843
+ },
+ {
+ "epoch": 37.72207084468665,
+ "grad_norm": 7.739365577697754,
+ "learning_rate": 1.4315708438995148e-05,
+ "loss": 0.2654,
+ "step": 13844
+ },
+ {
+ "epoch": 37.724795640326974,
+ "grad_norm": 7.329006195068359,
+ "learning_rate": 1.4314912342271103e-05,
+ "loss": 0.3591,
+ "step": 13845
+ },
+ {
+ "epoch": 37.7275204359673,
+ "grad_norm": 5.840755462646484,
+ "learning_rate": 1.431411621194266e-05,
+ "loss": 0.2794,
+ "step": 13846
+ },
+ {
+ "epoch": 37.73024523160763,
+ "grad_norm": 5.9024200439453125,
+ "learning_rate": 1.431332004801602e-05,
+ "loss": 0.26,
+ "step": 13847
+ },
+ {
+ "epoch": 37.73297002724796,
+ "grad_norm": 7.745482921600342,
+ "learning_rate": 1.431252385049738e-05,
+ "loss": 0.2239,
+ "step": 13848
+ },
+ {
+ "epoch": 37.735694822888284,
+ "grad_norm": 7.3622145652771,
+ "learning_rate": 1.4311727619392944e-05,
+ "loss": 0.3758,
+ "step": 13849
+ },
+ {
+ "epoch": 37.73841961852861,
+ "grad_norm": 10.321468353271484,
+ "learning_rate": 1.4310931354708913e-05,
+ "loss": 0.4225,
+ "step": 13850
+ },
+ {
+ "epoch": 37.741144414168936,
+ "grad_norm": 6.619589328765869,
+ "learning_rate": 1.4310135056451486e-05,
+ "loss": 0.3065,
+ "step": 13851
+ },
+ {
+ "epoch": 37.74386920980926,
+ "grad_norm": 7.6803483963012695,
+ "learning_rate": 1.4309338724626869e-05,
+ "loss": 0.6291,
+ "step": 13852
+ },
+ {
+ "epoch": 37.746594005449595,
+ "grad_norm": 6.695158958435059,
+ "learning_rate": 1.4308542359241257e-05,
+ "loss": 0.4344,
+ "step": 13853
+ },
+ {
+ "epoch": 37.74931880108992,
+ "grad_norm": 11.790595054626465,
+ "learning_rate": 1.4307745960300858e-05,
+ "loss": 0.3157,
+ "step": 13854
+ },
+ {
+ "epoch": 37.752043596730246,
+ "grad_norm": 7.67926549911499,
+ "learning_rate": 1.430694952781187e-05,
+ "loss": 0.2043,
+ "step": 13855
+ },
+ {
+ "epoch": 37.75476839237057,
+ "grad_norm": 5.822719097137451,
+ "learning_rate": 1.43061530617805e-05,
+ "loss": 0.2033,
+ "step": 13856
+ },
+ {
+ "epoch": 37.7574931880109,
+ "grad_norm": 7.06847620010376,
+ "learning_rate": 1.4305356562212947e-05,
+ "loss": 0.2908,
+ "step": 13857
+ },
+ {
+ "epoch": 37.76021798365122,
+ "grad_norm": 5.968804836273193,
+ "learning_rate": 1.4304560029115415e-05,
+ "loss": 0.2198,
+ "step": 13858
+ },
+ {
+ "epoch": 37.762942779291556,
+ "grad_norm": 8.030414581298828,
+ "learning_rate": 1.4303763462494112e-05,
+ "loss": 0.2816,
+ "step": 13859
+ },
+ {
+ "epoch": 37.76566757493188,
+ "grad_norm": 10.792121887207031,
+ "learning_rate": 1.4302966862355235e-05,
+ "loss": 0.2744,
+ "step": 13860
+ },
+ {
+ "epoch": 37.76839237057221,
+ "grad_norm": 7.105438709259033,
+ "learning_rate": 1.4302170228704987e-05,
+ "loss": 0.2207,
+ "step": 13861
+ },
+ {
+ "epoch": 37.771117166212534,
+ "grad_norm": 5.91572904586792,
+ "learning_rate": 1.430137356154958e-05,
+ "loss": 0.1683,
+ "step": 13862
+ },
+ {
+ "epoch": 37.77384196185286,
+ "grad_norm": 6.855401515960693,
+ "learning_rate": 1.4300576860895215e-05,
+ "loss": 0.3463,
+ "step": 13863
+ },
+ {
+ "epoch": 37.776566757493185,
+ "grad_norm": 6.339083671569824,
+ "learning_rate": 1.4299780126748091e-05,
+ "loss": 0.2751,
+ "step": 13864
+ },
+ {
+ "epoch": 37.77929155313352,
+ "grad_norm": 6.983968257904053,
+ "learning_rate": 1.4298983359114422e-05,
+ "loss": 0.565,
+ "step": 13865
+ },
+ {
+ "epoch": 37.782016348773844,
+ "grad_norm": 7.245323657989502,
+ "learning_rate": 1.4298186558000406e-05,
+ "loss": 0.3568,
+ "step": 13866
+ },
+ {
+ "epoch": 37.78474114441417,
+ "grad_norm": 6.835300445556641,
+ "learning_rate": 1.4297389723412256e-05,
+ "loss": 0.3072,
+ "step": 13867
+ },
+ {
+ "epoch": 37.787465940054496,
+ "grad_norm": 5.132641792297363,
+ "learning_rate": 1.429659285535617e-05,
+ "loss": 0.2679,
+ "step": 13868
+ },
+ {
+ "epoch": 37.79019073569482,
+ "grad_norm": 18.43865394592285,
+ "learning_rate": 1.4295795953838358e-05,
+ "loss": 0.284,
+ "step": 13869
+ },
+ {
+ "epoch": 37.79291553133515,
+ "grad_norm": 5.493300914764404,
+ "learning_rate": 1.4294999018865023e-05,
+ "loss": 0.4596,
+ "step": 13870
+ },
+ {
+ "epoch": 37.79564032697548,
+ "grad_norm": 6.84777307510376,
+ "learning_rate": 1.4294202050442379e-05,
+ "loss": 0.4657,
+ "step": 13871
+ },
+ {
+ "epoch": 37.798365122615806,
+ "grad_norm": 5.2925124168396,
+ "learning_rate": 1.4293405048576623e-05,
+ "loss": 0.2627,
+ "step": 13872
+ },
+ {
+ "epoch": 37.80108991825613,
+ "grad_norm": 6.45269250869751,
+ "learning_rate": 1.4292608013273968e-05,
+ "loss": 0.1688,
+ "step": 13873
+ },
+ {
+ "epoch": 37.80381471389646,
+ "grad_norm": 5.663297176361084,
+ "learning_rate": 1.4291810944540619e-05,
+ "loss": 0.3882,
+ "step": 13874
+ },
+ {
+ "epoch": 37.80653950953678,
+ "grad_norm": 5.370720863342285,
+ "learning_rate": 1.4291013842382785e-05,
+ "loss": 0.4996,
+ "step": 13875
+ },
+ {
+ "epoch": 37.80926430517711,
+ "grad_norm": 7.206972122192383,
+ "learning_rate": 1.4290216706806675e-05,
+ "loss": 0.23,
+ "step": 13876
+ },
+ {
+ "epoch": 37.81198910081744,
+ "grad_norm": 7.181276321411133,
+ "learning_rate": 1.4289419537818494e-05,
+ "loss": 0.3261,
+ "step": 13877
+ },
+ {
+ "epoch": 37.81471389645777,
+ "grad_norm": 6.361824035644531,
+ "learning_rate": 1.4288622335424452e-05,
+ "loss": 0.3921,
+ "step": 13878
+ },
+ {
+ "epoch": 37.817438692098094,
+ "grad_norm": 6.072926998138428,
+ "learning_rate": 1.4287825099630759e-05,
+ "loss": 0.2404,
+ "step": 13879
+ },
+ {
+ "epoch": 37.82016348773842,
+ "grad_norm": 6.359704494476318,
+ "learning_rate": 1.4287027830443618e-05,
+ "loss": 0.2664,
+ "step": 13880
+ },
+ {
+ "epoch": 37.822888283378745,
+ "grad_norm": 5.395126819610596,
+ "learning_rate": 1.4286230527869245e-05,
+ "loss": 0.1834,
+ "step": 13881
+ },
+ {
+ "epoch": 37.82561307901907,
+ "grad_norm": 5.825087070465088,
+ "learning_rate": 1.4285433191913845e-05,
+ "loss": 0.2545,
+ "step": 13882
+ },
+ {
+ "epoch": 37.828337874659404,
+ "grad_norm": 6.945882797241211,
+ "learning_rate": 1.4284635822583632e-05,
+ "loss": 0.3561,
+ "step": 13883
+ },
+ {
+ "epoch": 37.83106267029973,
+ "grad_norm": 6.538568019866943,
+ "learning_rate": 1.428383841988481e-05,
+ "loss": 0.2595,
+ "step": 13884
+ },
+ {
+ "epoch": 37.833787465940055,
+ "grad_norm": 5.49812650680542,
+ "learning_rate": 1.4283040983823594e-05,
+ "loss": 0.2719,
+ "step": 13885
+ },
+ {
+ "epoch": 37.83651226158038,
+ "grad_norm": 7.490963459014893,
+ "learning_rate": 1.4282243514406192e-05,
+ "loss": 0.3662,
+ "step": 13886
+ },
+ {
+ "epoch": 37.83923705722071,
+ "grad_norm": 5.736569881439209,
+ "learning_rate": 1.4281446011638818e-05,
+ "loss": 0.3821,
+ "step": 13887
+ },
+ {
+ "epoch": 37.84196185286103,
+ "grad_norm": 6.814878463745117,
+ "learning_rate": 1.4280648475527676e-05,
+ "loss": 0.3307,
+ "step": 13888
+ },
+ {
+ "epoch": 37.844686648501366,
+ "grad_norm": 7.027327537536621,
+ "learning_rate": 1.4279850906078984e-05,
+ "loss": 0.3086,
+ "step": 13889
+ },
+ {
+ "epoch": 37.84741144414169,
+ "grad_norm": 5.297640323638916,
+ "learning_rate": 1.427905330329895e-05,
+ "loss": 0.3211,
+ "step": 13890
+ },
+ {
+ "epoch": 37.85013623978202,
+ "grad_norm": 5.85853385925293,
+ "learning_rate": 1.4278255667193785e-05,
+ "loss": 0.2456,
+ "step": 13891
+ },
+ {
+ "epoch": 37.85286103542234,
+ "grad_norm": 8.093560218811035,
+ "learning_rate": 1.4277457997769707e-05,
+ "loss": 0.2427,
+ "step": 13892
+ },
+ {
+ "epoch": 37.85558583106267,
+ "grad_norm": 5.991091728210449,
+ "learning_rate": 1.427666029503292e-05,
+ "loss": 0.2615,
+ "step": 13893
+ },
+ {
+ "epoch": 37.858310626702995,
+ "grad_norm": 5.490238666534424,
+ "learning_rate": 1.4275862558989642e-05,
+ "loss": 0.2807,
+ "step": 13894
+ },
+ {
+ "epoch": 37.86103542234333,
+ "grad_norm": 5.897800445556641,
+ "learning_rate": 1.4275064789646085e-05,
+ "loss": 0.2792,
+ "step": 13895
+ },
+ {
+ "epoch": 37.86376021798365,
+ "grad_norm": 5.740957260131836,
+ "learning_rate": 1.4274266987008459e-05,
+ "loss": 0.3357,
+ "step": 13896
+ },
+ {
+ "epoch": 37.86648501362398,
+ "grad_norm": 5.91965389251709,
+ "learning_rate": 1.427346915108298e-05,
+ "loss": 0.4214,
+ "step": 13897
+ },
+ {
+ "epoch": 37.869209809264305,
+ "grad_norm": 6.701809883117676,
+ "learning_rate": 1.4272671281875857e-05,
+ "loss": 0.3539,
+ "step": 13898
+ },
+ {
+ "epoch": 37.87193460490463,
+ "grad_norm": 5.178858280181885,
+ "learning_rate": 1.4271873379393314e-05,
+ "loss": 0.3049,
+ "step": 13899
+ },
+ {
+ "epoch": 37.87465940054496,
+ "grad_norm": 6.695412635803223,
+ "learning_rate": 1.4271075443641552e-05,
+ "loss": 0.2471,
+ "step": 13900
+ },
+ {
+ "epoch": 37.87738419618529,
+ "grad_norm": 6.38279390335083,
+ "learning_rate": 1.4270277474626799e-05,
+ "loss": 0.4324,
+ "step": 13901
+ },
+ {
+ "epoch": 37.880108991825615,
+ "grad_norm": 5.44714879989624,
+ "learning_rate": 1.4269479472355259e-05,
+ "loss": 0.2364,
+ "step": 13902
+ },
+ {
+ "epoch": 37.88283378746594,
+ "grad_norm": 6.585297584533691,
+ "learning_rate": 1.4268681436833149e-05,
+ "loss": 0.2476,
+ "step": 13903
+ },
+ {
+ "epoch": 37.88555858310627,
+ "grad_norm": 5.468698024749756,
+ "learning_rate": 1.4267883368066688e-05,
+ "loss": 0.2676,
+ "step": 13904
+ },
+ {
+ "epoch": 37.88828337874659,
+ "grad_norm": 6.195644378662109,
+ "learning_rate": 1.4267085266062088e-05,
+ "loss": 0.2874,
+ "step": 13905
+ },
+ {
+ "epoch": 37.89100817438692,
+ "grad_norm": 9.75532341003418,
+ "learning_rate": 1.4266287130825564e-05,
+ "loss": 0.3411,
+ "step": 13906
+ },
+ {
+ "epoch": 37.89373297002725,
+ "grad_norm": 5.855805397033691,
+ "learning_rate": 1.4265488962363334e-05,
+ "loss": 0.2052,
+ "step": 13907
+ },
+ {
+ "epoch": 37.89645776566758,
+ "grad_norm": 7.247859954833984,
+ "learning_rate": 1.4264690760681613e-05,
+ "loss": 0.4378,
+ "step": 13908
+ },
+ {
+ "epoch": 37.8991825613079,
+ "grad_norm": 6.3888654708862305,
+ "learning_rate": 1.4263892525786617e-05,
+ "loss": 0.3044,
+ "step": 13909
+ },
+ {
+ "epoch": 37.90190735694823,
+ "grad_norm": 6.496111869812012,
+ "learning_rate": 1.4263094257684564e-05,
+ "loss": 0.4275,
+ "step": 13910
+ },
+ {
+ "epoch": 37.904632152588555,
+ "grad_norm": 6.1391825675964355,
+ "learning_rate": 1.426229595638167e-05,
+ "loss": 0.2492,
+ "step": 13911
+ },
+ {
+ "epoch": 37.90735694822888,
+ "grad_norm": 11.097859382629395,
+ "learning_rate": 1.4261497621884152e-05,
+ "loss": 0.2425,
+ "step": 13912
+ },
+ {
+ "epoch": 37.91008174386921,
+ "grad_norm": 5.487829685211182,
+ "learning_rate": 1.4260699254198231e-05,
+ "loss": 0.2703,
+ "step": 13913
+ },
+ {
+ "epoch": 37.91280653950954,
+ "grad_norm": 6.309706211090088,
+ "learning_rate": 1.4259900853330116e-05,
+ "loss": 0.2534,
+ "step": 13914
+ },
+ {
+ "epoch": 37.915531335149865,
+ "grad_norm": 6.878724575042725,
+ "learning_rate": 1.4259102419286035e-05,
+ "loss": 0.2386,
+ "step": 13915
+ },
+ {
+ "epoch": 37.91825613079019,
+ "grad_norm": 5.6779985427856445,
+ "learning_rate": 1.4258303952072197e-05,
+ "loss": 0.3365,
+ "step": 13916
+ },
+ {
+ "epoch": 37.920980926430516,
+ "grad_norm": 6.016035079956055,
+ "learning_rate": 1.4257505451694826e-05,
+ "loss": 0.2068,
+ "step": 13917
+ },
+ {
+ "epoch": 37.92370572207084,
+ "grad_norm": 5.624186992645264,
+ "learning_rate": 1.4256706918160142e-05,
+ "loss": 0.3402,
+ "step": 13918
+ },
+ {
+ "epoch": 37.926430517711175,
+ "grad_norm": 6.045122146606445,
+ "learning_rate": 1.4255908351474358e-05,
+ "loss": 0.195,
+ "step": 13919
+ },
+ {
+ "epoch": 37.9291553133515,
+ "grad_norm": 7.068624973297119,
+ "learning_rate": 1.4255109751643698e-05,
+ "loss": 0.2797,
+ "step": 13920
+ },
+ {
+ "epoch": 37.93188010899183,
+ "grad_norm": 5.509274959564209,
+ "learning_rate": 1.4254311118674385e-05,
+ "loss": 0.3661,
+ "step": 13921
+ },
+ {
+ "epoch": 37.93460490463215,
+ "grad_norm": 6.219267845153809,
+ "learning_rate": 1.4253512452572629e-05,
+ "loss": 0.1712,
+ "step": 13922
+ },
+ {
+ "epoch": 37.93732970027248,
+ "grad_norm": 5.982593059539795,
+ "learning_rate": 1.4252713753344656e-05,
+ "loss": 0.33,
+ "step": 13923
+ },
+ {
+ "epoch": 37.940054495912804,
+ "grad_norm": 9.742803573608398,
+ "learning_rate": 1.4251915020996686e-05,
+ "loss": 0.3737,
+ "step": 13924
+ },
+ {
+ "epoch": 37.94277929155314,
+ "grad_norm": 5.775113105773926,
+ "learning_rate": 1.4251116255534936e-05,
+ "loss": 0.3099,
+ "step": 13925
+ },
+ {
+ "epoch": 37.94550408719346,
+ "grad_norm": 7.870527744293213,
+ "learning_rate": 1.425031745696563e-05,
+ "loss": 0.1759,
+ "step": 13926
+ },
+ {
+ "epoch": 37.94822888283379,
+ "grad_norm": 9.597245216369629,
+ "learning_rate": 1.4249518625294991e-05,
+ "loss": 0.3413,
+ "step": 13927
+ },
+ {
+ "epoch": 37.950953678474114,
+ "grad_norm": 5.649352073669434,
+ "learning_rate": 1.4248719760529235e-05,
+ "loss": 0.3091,
+ "step": 13928
+ },
+ {
+ "epoch": 37.95367847411444,
+ "grad_norm": 6.283723831176758,
+ "learning_rate": 1.4247920862674589e-05,
+ "loss": 0.3779,
+ "step": 13929
+ },
+ {
+ "epoch": 37.956403269754766,
+ "grad_norm": 7.923952579498291,
+ "learning_rate": 1.4247121931737269e-05,
+ "loss": 0.4114,
+ "step": 13930
+ },
+ {
+ "epoch": 37.95912806539509,
+ "grad_norm": 7.428585529327393,
+ "learning_rate": 1.4246322967723502e-05,
+ "loss": 0.1706,
+ "step": 13931
+ },
+ {
+ "epoch": 37.961852861035425,
+ "grad_norm": 5.831275939941406,
+ "learning_rate": 1.424552397063951e-05,
+ "loss": 0.4125,
+ "step": 13932
+ },
+ {
+ "epoch": 37.96457765667575,
+ "grad_norm": 6.238661766052246,
+ "learning_rate": 1.424472494049151e-05,
+ "loss": 0.2897,
+ "step": 13933
+ },
+ {
+ "epoch": 37.967302452316076,
+ "grad_norm": 6.399302959442139,
+ "learning_rate": 1.4243925877285731e-05,
+ "loss": 0.369,
+ "step": 13934
+ },
+ {
+ "epoch": 37.9700272479564,
+ "grad_norm": 7.374026298522949,
+ "learning_rate": 1.4243126781028393e-05,
+ "loss": 0.3454,
+ "step": 13935
+ },
+ {
+ "epoch": 37.97275204359673,
+ "grad_norm": 6.311505317687988,
+ "learning_rate": 1.424232765172572e-05,
+ "loss": 0.2968,
+ "step": 13936
+ },
+ {
+ "epoch": 37.97547683923706,
+ "grad_norm": 7.2645955085754395,
+ "learning_rate": 1.4241528489383938e-05,
+ "loss": 0.2826,
+ "step": 13937
+ },
+ {
+ "epoch": 37.97820163487739,
+ "grad_norm": 6.588016986846924,
+ "learning_rate": 1.4240729294009268e-05,
+ "loss": 0.2749,
+ "step": 13938
+ },
+ {
+ "epoch": 37.98092643051771,
+ "grad_norm": 7.065012454986572,
+ "learning_rate": 1.4239930065607934e-05,
+ "loss": 0.326,
+ "step": 13939
+ },
+ {
+ "epoch": 37.98365122615804,
+ "grad_norm": 9.638312339782715,
+ "learning_rate": 1.4239130804186161e-05,
+ "loss": 0.2731,
+ "step": 13940
+ },
+ {
+ "epoch": 37.986376021798364,
+ "grad_norm": 7.051853179931641,
+ "learning_rate": 1.4238331509750173e-05,
+ "loss": 0.4256,
+ "step": 13941
+ },
+ {
+ "epoch": 37.98910081743869,
+ "grad_norm": 7.029924392700195,
+ "learning_rate": 1.4237532182306198e-05,
+ "loss": 0.2442,
+ "step": 13942
+ },
+ {
+ "epoch": 37.991825613079016,
+ "grad_norm": 6.4894633293151855,
+ "learning_rate": 1.4236732821860456e-05,
+ "loss": 0.1772,
+ "step": 13943
+ },
+ {
+ "epoch": 37.99455040871935,
+ "grad_norm": 6.099433898925781,
+ "learning_rate": 1.4235933428419177e-05,
+ "loss": 0.2225,
+ "step": 13944
+ },
+ {
+ "epoch": 37.997275204359674,
+ "grad_norm": 9.0189847946167,
+ "learning_rate": 1.4235134001988584e-05,
+ "loss": 0.3329,
+ "step": 13945
+ },
+ {
+ "epoch": 38.0,
+ "grad_norm": 6.745449066162109,
+ "learning_rate": 1.4234334542574906e-05,
+ "loss": 0.3312,
+ "step": 13946
+ },
+ {
+ "epoch": 38.002724795640326,
+ "grad_norm": 5.828391075134277,
+ "learning_rate": 1.4233535050184362e-05,
+ "loss": 0.1915,
+ "step": 13947
+ },
+ {
+ "epoch": 38.00544959128065,
+ "grad_norm": 6.628112316131592,
+ "learning_rate": 1.4232735524823187e-05,
+ "loss": 0.3048,
+ "step": 13948
+ },
+ {
+ "epoch": 38.00817438692098,
+ "grad_norm": 7.644171714782715,
+ "learning_rate": 1.4231935966497603e-05,
+ "loss": 0.211,
+ "step": 13949
+ },
+ {
+ "epoch": 38.01089918256131,
+ "grad_norm": 7.779391288757324,
+ "learning_rate": 1.4231136375213837e-05,
+ "loss": 0.34,
+ "step": 13950
+ },
+ {
+ "epoch": 38.013623978201636,
+ "grad_norm": 5.219463348388672,
+ "learning_rate": 1.4230336750978117e-05,
+ "loss": 0.1672,
+ "step": 13951
+ },
+ {
+ "epoch": 38.01634877384196,
+ "grad_norm": 6.442633628845215,
+ "learning_rate": 1.4229537093796672e-05,
+ "loss": 0.363,
+ "step": 13952
+ },
+ {
+ "epoch": 38.01907356948229,
+ "grad_norm": 5.483616828918457,
+ "learning_rate": 1.4228737403675727e-05,
+ "loss": 0.21,
+ "step": 13953
+ },
+ {
+ "epoch": 38.02179836512261,
+ "grad_norm": 5.897453784942627,
+ "learning_rate": 1.4227937680621513e-05,
+ "loss": 0.3088,
+ "step": 13954
+ },
+ {
+ "epoch": 38.02452316076294,
+ "grad_norm": 5.241434574127197,
+ "learning_rate": 1.4227137924640255e-05,
+ "loss": 0.2805,
+ "step": 13955
+ },
+ {
+ "epoch": 38.02724795640327,
+ "grad_norm": 4.7049126625061035,
+ "learning_rate": 1.4226338135738185e-05,
+ "loss": 0.234,
+ "step": 13956
+ },
+ {
+ "epoch": 38.0299727520436,
+ "grad_norm": 6.1228413581848145,
+ "learning_rate": 1.4225538313921527e-05,
+ "loss": 0.2327,
+ "step": 13957
+ },
+ {
+ "epoch": 38.032697547683924,
+ "grad_norm": 6.522132873535156,
+ "learning_rate": 1.4224738459196514e-05,
+ "loss": 0.2843,
+ "step": 13958
+ },
+ {
+ "epoch": 38.03542234332425,
+ "grad_norm": 5.426480770111084,
+ "learning_rate": 1.4223938571569371e-05,
+ "loss": 0.2536,
+ "step": 13959
+ },
+ {
+ "epoch": 38.038147138964575,
+ "grad_norm": 7.3476409912109375,
+ "learning_rate": 1.4223138651046333e-05,
+ "loss": 0.292,
+ "step": 13960
+ },
+ {
+ "epoch": 38.0408719346049,
+ "grad_norm": 5.566215515136719,
+ "learning_rate": 1.4222338697633627e-05,
+ "loss": 0.2537,
+ "step": 13961
+ },
+ {
+ "epoch": 38.043596730245234,
+ "grad_norm": 5.8920207023620605,
+ "learning_rate": 1.4221538711337483e-05,
+ "loss": 0.1773,
+ "step": 13962
+ },
+ {
+ "epoch": 38.04632152588556,
+ "grad_norm": 7.461595058441162,
+ "learning_rate": 1.4220738692164132e-05,
+ "loss": 0.2825,
+ "step": 13963
+ },
+ {
+ "epoch": 38.049046321525886,
+ "grad_norm": 5.866862773895264,
+ "learning_rate": 1.4219938640119803e-05,
+ "loss": 0.2876,
+ "step": 13964
+ },
+ {
+ "epoch": 38.05177111716621,
+ "grad_norm": 5.897693157196045,
+ "learning_rate": 1.4219138555210727e-05,
+ "loss": 0.4412,
+ "step": 13965
+ },
+ {
+ "epoch": 38.05449591280654,
+ "grad_norm": 5.753302097320557,
+ "learning_rate": 1.421833843744314e-05,
+ "loss": 0.2656,
+ "step": 13966
+ },
+ {
+ "epoch": 38.05722070844686,
+ "grad_norm": 6.437390327453613,
+ "learning_rate": 1.4217538286823262e-05,
+ "loss": 0.1365,
+ "step": 13967
+ },
+ {
+ "epoch": 38.059945504087196,
+ "grad_norm": 5.829328536987305,
+ "learning_rate": 1.4216738103357335e-05,
+ "loss": 0.2829,
+ "step": 13968
+ },
+ {
+ "epoch": 38.06267029972752,
+ "grad_norm": 9.179716110229492,
+ "learning_rate": 1.4215937887051588e-05,
+ "loss": 0.2632,
+ "step": 13969
+ },
+ {
+ "epoch": 38.06539509536785,
+ "grad_norm": 6.491574287414551,
+ "learning_rate": 1.4215137637912252e-05,
+ "loss": 0.3179,
+ "step": 13970
+ },
+ {
+ "epoch": 38.06811989100817,
+ "grad_norm": 8.215079307556152,
+ "learning_rate": 1.421433735594556e-05,
+ "loss": 0.2418,
+ "step": 13971
+ },
+ {
+ "epoch": 38.0708446866485,
+ "grad_norm": 5.035507678985596,
+ "learning_rate": 1.4213537041157746e-05,
+ "loss": 0.1278,
+ "step": 13972
+ },
+ {
+ "epoch": 38.073569482288825,
+ "grad_norm": 7.004916191101074,
+ "learning_rate": 1.4212736693555038e-05,
+ "loss": 0.2279,
+ "step": 13973
+ },
+ {
+ "epoch": 38.07629427792916,
+ "grad_norm": 5.82853364944458,
+ "learning_rate": 1.4211936313143673e-05,
+ "loss": 0.2233,
+ "step": 13974
+ },
+ {
+ "epoch": 38.079019073569484,
+ "grad_norm": 6.827931880950928,
+ "learning_rate": 1.4211135899929885e-05,
+ "loss": 0.2453,
+ "step": 13975
+ },
+ {
+ "epoch": 38.08174386920981,
+ "grad_norm": 5.678162574768066,
+ "learning_rate": 1.4210335453919904e-05,
+ "loss": 0.2307,
+ "step": 13976
+ },
+ {
+ "epoch": 38.084468664850135,
+ "grad_norm": 6.095455169677734,
+ "learning_rate": 1.4209534975119965e-05,
+ "loss": 0.2744,
+ "step": 13977
+ },
+ {
+ "epoch": 38.08719346049046,
+ "grad_norm": 7.953395366668701,
+ "learning_rate": 1.4208734463536307e-05,
+ "loss": 0.215,
+ "step": 13978
+ },
+ {
+ "epoch": 38.08991825613079,
+ "grad_norm": 6.966280460357666,
+ "learning_rate": 1.4207933919175157e-05,
+ "loss": 0.2914,
+ "step": 13979
+ },
+ {
+ "epoch": 38.09264305177112,
+ "grad_norm": 5.814003944396973,
+ "learning_rate": 1.4207133342042756e-05,
+ "loss": 0.3221,
+ "step": 13980
+ },
+ {
+ "epoch": 38.095367847411445,
+ "grad_norm": 6.032495021820068,
+ "learning_rate": 1.4206332732145334e-05,
+ "loss": 0.3495,
+ "step": 13981
+ },
+ {
+ "epoch": 38.09809264305177,
+ "grad_norm": 7.486771106719971,
+ "learning_rate": 1.420553208948913e-05,
+ "loss": 0.2506,
+ "step": 13982
+ },
+ {
+ "epoch": 38.1008174386921,
+ "grad_norm": 5.105815410614014,
+ "learning_rate": 1.4204731414080375e-05,
+ "loss": 0.3923,
+ "step": 13983
+ },
+ {
+ "epoch": 38.10354223433242,
+ "grad_norm": 5.73434591293335,
+ "learning_rate": 1.4203930705925308e-05,
+ "loss": 0.3165,
+ "step": 13984
+ },
+ {
+ "epoch": 38.10626702997275,
+ "grad_norm": 5.713719367980957,
+ "learning_rate": 1.4203129965030162e-05,
+ "loss": 0.1771,
+ "step": 13985
+ },
+ {
+ "epoch": 38.10899182561308,
+ "grad_norm": 8.072136878967285,
+ "learning_rate": 1.4202329191401178e-05,
+ "loss": 0.2828,
+ "step": 13986
+ },
+ {
+ "epoch": 38.11171662125341,
+ "grad_norm": 6.253368854522705,
+ "learning_rate": 1.4201528385044589e-05,
+ "loss": 0.2762,
+ "step": 13987
+ },
+ {
+ "epoch": 38.11444141689373,
+ "grad_norm": 7.055810451507568,
+ "learning_rate": 1.4200727545966633e-05,
+ "loss": 0.3133,
+ "step": 13988
+ },
+ {
+ "epoch": 38.11716621253406,
+ "grad_norm": 4.999205589294434,
+ "learning_rate": 1.4199926674173545e-05,
+ "loss": 0.2086,
+ "step": 13989
+ },
+ {
+ "epoch": 38.119891008174385,
+ "grad_norm": 5.597371578216553,
+ "learning_rate": 1.4199125769671564e-05,
+ "loss": 0.3203,
+ "step": 13990
+ },
+ {
+ "epoch": 38.12261580381471,
+ "grad_norm": 5.3502373695373535,
+ "learning_rate": 1.4198324832466925e-05,
+ "loss": 0.32,
+ "step": 13991
+ },
+ {
+ "epoch": 38.12534059945504,
+ "grad_norm": 8.164291381835938,
+ "learning_rate": 1.419752386256587e-05,
+ "loss": 0.4567,
+ "step": 13992
+ },
+ {
+ "epoch": 38.12806539509537,
+ "grad_norm": 5.968377590179443,
+ "learning_rate": 1.4196722859974629e-05,
+ "loss": 0.2638,
+ "step": 13993
+ },
+ {
+ "epoch": 38.130790190735695,
+ "grad_norm": 6.087549209594727,
+ "learning_rate": 1.419592182469945e-05,
+ "loss": 0.1793,
+ "step": 13994
+ },
+ {
+ "epoch": 38.13351498637602,
+ "grad_norm": 6.813994884490967,
+ "learning_rate": 1.4195120756746566e-05,
+ "loss": 0.3072,
+ "step": 13995
+ },
+ {
+ "epoch": 38.13623978201635,
+ "grad_norm": 7.23217248916626,
+ "learning_rate": 1.4194319656122217e-05,
+ "loss": 0.2021,
+ "step": 13996
+ },
+ {
+ "epoch": 38.13896457765667,
+ "grad_norm": 4.884246349334717,
+ "learning_rate": 1.4193518522832642e-05,
+ "loss": 0.2717,
+ "step": 13997
+ },
+ {
+ "epoch": 38.141689373297005,
+ "grad_norm": 5.066684722900391,
+ "learning_rate": 1.4192717356884078e-05,
+ "loss": 0.2404,
+ "step": 13998
+ },
+ {
+ "epoch": 38.14441416893733,
+ "grad_norm": 6.179629325866699,
+ "learning_rate": 1.4191916158282766e-05,
+ "loss": 0.2885,
+ "step": 13999
+ },
+ {
+ "epoch": 38.14713896457766,
+ "grad_norm": 5.496793270111084,
+ "learning_rate": 1.4191114927034949e-05,
+ "loss": 0.1613,
+ "step": 14000
+ },
+ {
+ "epoch": 38.14986376021798,
+ "grad_norm": 5.1892290115356445,
+ "learning_rate": 1.4190313663146859e-05,
+ "loss": 0.2329,
+ "step": 14001
+ },
+ {
+ "epoch": 38.15258855585831,
+ "grad_norm": 6.829507827758789,
+ "learning_rate": 1.4189512366624745e-05,
+ "loss": 0.3313,
+ "step": 14002
+ },
+ {
+ "epoch": 38.155313351498634,
+ "grad_norm": 6.3000054359436035,
+ "learning_rate": 1.418871103747484e-05,
+ "loss": 0.2714,
+ "step": 14003
+ },
+ {
+ "epoch": 38.15803814713897,
+ "grad_norm": 7.200273513793945,
+ "learning_rate": 1.4187909675703391e-05,
+ "loss": 0.2042,
+ "step": 14004
+ },
+ {
+ "epoch": 38.16076294277929,
+ "grad_norm": 6.331015586853027,
+ "learning_rate": 1.4187108281316635e-05,
+ "loss": 0.3781,
+ "step": 14005
+ },
+ {
+ "epoch": 38.16348773841962,
+ "grad_norm": 6.415987014770508,
+ "learning_rate": 1.4186306854320817e-05,
+ "loss": 0.2836,
+ "step": 14006
+ },
+ {
+ "epoch": 38.166212534059945,
+ "grad_norm": 7.1509199142456055,
+ "learning_rate": 1.4185505394722172e-05,
+ "loss": 0.283,
+ "step": 14007
+ },
+ {
+ "epoch": 38.16893732970027,
+ "grad_norm": 5.582503795623779,
+ "learning_rate": 1.418470390252695e-05,
+ "loss": 0.2593,
+ "step": 14008
+ },
+ {
+ "epoch": 38.171662125340596,
+ "grad_norm": 7.300879001617432,
+ "learning_rate": 1.4183902377741385e-05,
+ "loss": 0.3265,
+ "step": 14009
+ },
+ {
+ "epoch": 38.17438692098093,
+ "grad_norm": 5.514047145843506,
+ "learning_rate": 1.4183100820371723e-05,
+ "loss": 0.2384,
+ "step": 14010
+ },
+ {
+ "epoch": 38.177111716621255,
+ "grad_norm": 6.768276691436768,
+ "learning_rate": 1.418229923042421e-05,
+ "loss": 0.3659,
+ "step": 14011
+ },
+ {
+ "epoch": 38.17983651226158,
+ "grad_norm": 7.209909439086914,
+ "learning_rate": 1.4181497607905082e-05,
+ "loss": 0.3259,
+ "step": 14012
+ },
+ {
+ "epoch": 38.182561307901906,
+ "grad_norm": 6.693050384521484,
+ "learning_rate": 1.4180695952820585e-05,
+ "loss": 0.2859,
+ "step": 14013
+ },
+ {
+ "epoch": 38.18528610354223,
+ "grad_norm": 5.3056206703186035,
+ "learning_rate": 1.4179894265176964e-05,
+ "loss": 0.3568,
+ "step": 14014
+ },
+ {
+ "epoch": 38.18801089918256,
+ "grad_norm": 6.389018535614014,
+ "learning_rate": 1.4179092544980459e-05,
+ "loss": 0.1603,
+ "step": 14015
+ },
+ {
+ "epoch": 38.19073569482289,
+ "grad_norm": 11.500627517700195,
+ "learning_rate": 1.4178290792237319e-05,
+ "loss": 0.2413,
+ "step": 14016
+ },
+ {
+ "epoch": 38.19346049046322,
+ "grad_norm": 4.9877214431762695,
+ "learning_rate": 1.4177489006953784e-05,
+ "loss": 0.2359,
+ "step": 14017
+ },
+ {
+ "epoch": 38.19618528610354,
+ "grad_norm": 4.357906341552734,
+ "learning_rate": 1.4176687189136098e-05,
+ "loss": 0.1855,
+ "step": 14018
+ },
+ {
+ "epoch": 38.19891008174387,
+ "grad_norm": 6.749527931213379,
+ "learning_rate": 1.4175885338790507e-05,
+ "loss": 0.4336,
+ "step": 14019
+ },
+ {
+ "epoch": 38.201634877384194,
+ "grad_norm": 5.563653945922852,
+ "learning_rate": 1.4175083455923254e-05,
+ "loss": 0.2687,
+ "step": 14020
+ },
+ {
+ "epoch": 38.20435967302452,
+ "grad_norm": 6.073885917663574,
+ "learning_rate": 1.417428154054059e-05,
+ "loss": 0.3654,
+ "step": 14021
+ },
+ {
+ "epoch": 38.20708446866485,
+ "grad_norm": 5.087289810180664,
+ "learning_rate": 1.417347959264875e-05,
+ "loss": 0.2058,
+ "step": 14022
+ },
+ {
+ "epoch": 38.20980926430518,
+ "grad_norm": 6.296276092529297,
+ "learning_rate": 1.4172677612253987e-05,
+ "loss": 0.2492,
+ "step": 14023
+ },
+ {
+ "epoch": 38.212534059945504,
+ "grad_norm": 7.721444606781006,
+ "learning_rate": 1.4171875599362545e-05,
+ "loss": 0.3712,
+ "step": 14024
+ },
+ {
+ "epoch": 38.21525885558583,
+ "grad_norm": 5.24257230758667,
+ "learning_rate": 1.4171073553980673e-05,
+ "loss": 0.2746,
+ "step": 14025
+ },
+ {
+ "epoch": 38.217983651226156,
+ "grad_norm": 7.223959922790527,
+ "learning_rate": 1.4170271476114612e-05,
+ "loss": 0.1926,
+ "step": 14026
+ },
+ {
+ "epoch": 38.22070844686648,
+ "grad_norm": 5.934112071990967,
+ "learning_rate": 1.416946936577061e-05,
+ "loss": 0.1913,
+ "step": 14027
+ },
+ {
+ "epoch": 38.223433242506815,
+ "grad_norm": 5.871982574462891,
+ "learning_rate": 1.4168667222954915e-05,
+ "loss": 0.2797,
+ "step": 14028
+ },
+ {
+ "epoch": 38.22615803814714,
+ "grad_norm": 5.042227745056152,
+ "learning_rate": 1.4167865047673775e-05,
+ "loss": 0.283,
+ "step": 14029
+ },
+ {
+ "epoch": 38.228882833787466,
+ "grad_norm": 5.960148811340332,
+ "learning_rate": 1.4167062839933437e-05,
+ "loss": 0.2523,
+ "step": 14030
+ },
+ {
+ "epoch": 38.23160762942779,
+ "grad_norm": 11.43106746673584,
+ "learning_rate": 1.4166260599740148e-05,
+ "loss": 0.2967,
+ "step": 14031
+ },
+ {
+ "epoch": 38.23433242506812,
+ "grad_norm": 6.651676177978516,
+ "learning_rate": 1.4165458327100152e-05,
+ "loss": 0.2797,
+ "step": 14032
+ },
+ {
+ "epoch": 38.237057220708444,
+ "grad_norm": 5.880712985992432,
+ "learning_rate": 1.4164656022019702e-05,
+ "loss": 0.3331,
+ "step": 14033
+ },
+ {
+ "epoch": 38.23978201634878,
+ "grad_norm": 6.207973957061768,
+ "learning_rate": 1.4163853684505046e-05,
+ "loss": 0.3976,
+ "step": 14034
+ },
+ {
+ "epoch": 38.2425068119891,
+ "grad_norm": 4.574272155761719,
+ "learning_rate": 1.416305131456243e-05,
+ "loss": 0.1279,
+ "step": 14035
+ },
+ {
+ "epoch": 38.24523160762943,
+ "grad_norm": 4.726644992828369,
+ "learning_rate": 1.4162248912198107e-05,
+ "loss": 0.256,
+ "step": 14036
+ },
+ {
+ "epoch": 38.247956403269754,
+ "grad_norm": 5.637514591217041,
+ "learning_rate": 1.4161446477418322e-05,
+ "loss": 0.2778,
+ "step": 14037
+ },
+ {
+ "epoch": 38.25068119891008,
+ "grad_norm": 5.931151390075684,
+ "learning_rate": 1.4160644010229325e-05,
+ "loss": 0.2351,
+ "step": 14038
+ },
+ {
+ "epoch": 38.253405994550405,
+ "grad_norm": 5.666237831115723,
+ "learning_rate": 1.4159841510637368e-05,
+ "loss": 0.2453,
+ "step": 14039
+ },
+ {
+ "epoch": 38.25613079019074,
+ "grad_norm": 5.902411460876465,
+ "learning_rate": 1.4159038978648698e-05,
+ "loss": 0.3376,
+ "step": 14040
+ },
+ {
+ "epoch": 38.258855585831064,
+ "grad_norm": 5.361380100250244,
+ "learning_rate": 1.4158236414269569e-05,
+ "loss": 0.2046,
+ "step": 14041
+ },
+ {
+ "epoch": 38.26158038147139,
+ "grad_norm": 5.141907691955566,
+ "learning_rate": 1.4157433817506224e-05,
+ "loss": 0.2404,
+ "step": 14042
+ },
+ {
+ "epoch": 38.264305177111716,
+ "grad_norm": 5.590311527252197,
+ "learning_rate": 1.4156631188364922e-05,
+ "loss": 0.2377,
+ "step": 14043
+ },
+ {
+ "epoch": 38.26702997275204,
+ "grad_norm": 5.858974933624268,
+ "learning_rate": 1.4155828526851907e-05,
+ "loss": 0.1895,
+ "step": 14044
+ },
+ {
+ "epoch": 38.26975476839237,
+ "grad_norm": 5.813584804534912,
+ "learning_rate": 1.4155025832973435e-05,
+ "loss": 0.2008,
+ "step": 14045
+ },
+ {
+ "epoch": 38.2724795640327,
+ "grad_norm": 5.5272369384765625,
+ "learning_rate": 1.4154223106735754e-05,
+ "loss": 0.2745,
+ "step": 14046
+ },
+ {
+ "epoch": 38.275204359673026,
+ "grad_norm": 5.37410831451416,
+ "learning_rate": 1.415342034814512e-05,
+ "loss": 0.4397,
+ "step": 14047
+ },
+ {
+ "epoch": 38.27792915531335,
+ "grad_norm": 6.916401386260986,
+ "learning_rate": 1.4152617557207779e-05,
+ "loss": 0.2548,
+ "step": 14048
+ },
+ {
+ "epoch": 38.28065395095368,
+ "grad_norm": 5.114424705505371,
+ "learning_rate": 1.4151814733929989e-05,
+ "loss": 0.1748,
+ "step": 14049
+ },
+ {
+ "epoch": 38.283378746594,
+ "grad_norm": 7.644888401031494,
+ "learning_rate": 1.4151011878317998e-05,
+ "loss": 0.2413,
+ "step": 14050
+ },
+ {
+ "epoch": 38.28610354223433,
+ "grad_norm": 5.31462287902832,
+ "learning_rate": 1.415020899037806e-05,
+ "loss": 0.27,
+ "step": 14051
+ },
+ {
+ "epoch": 38.28882833787466,
+ "grad_norm": 11.65475082397461,
+ "learning_rate": 1.4149406070116429e-05,
+ "loss": 0.3211,
+ "step": 14052
+ },
+ {
+ "epoch": 38.29155313351499,
+ "grad_norm": 12.475391387939453,
+ "learning_rate": 1.4148603117539354e-05,
+ "loss": 0.1888,
+ "step": 14053
+ },
+ {
+ "epoch": 38.294277929155314,
+ "grad_norm": 5.723780155181885,
+ "learning_rate": 1.4147800132653093e-05,
+ "loss": 0.3493,
+ "step": 14054
+ },
+ {
+ "epoch": 38.29700272479564,
+ "grad_norm": 5.613542556762695,
+ "learning_rate": 1.4146997115463901e-05,
+ "loss": 0.4031,
+ "step": 14055
+ },
+ {
+ "epoch": 38.299727520435965,
+ "grad_norm": 7.107828617095947,
+ "learning_rate": 1.4146194065978024e-05,
+ "loss": 0.4164,
+ "step": 14056
+ },
+ {
+ "epoch": 38.30245231607629,
+ "grad_norm": 5.172051906585693,
+ "learning_rate": 1.4145390984201726e-05,
+ "loss": 0.1524,
+ "step": 14057
+ },
+ {
+ "epoch": 38.305177111716624,
+ "grad_norm": 5.915720462799072,
+ "learning_rate": 1.4144587870141252e-05,
+ "loss": 0.362,
+ "step": 14058
+ },
+ {
+ "epoch": 38.30790190735695,
+ "grad_norm": 7.770023822784424,
+ "learning_rate": 1.4143784723802865e-05,
+ "loss": 0.3484,
+ "step": 14059
+ },
+ {
+ "epoch": 38.310626702997276,
+ "grad_norm": 5.6410698890686035,
+ "learning_rate": 1.4142981545192814e-05,
+ "loss": 0.2348,
+ "step": 14060
+ },
+ {
+ "epoch": 38.3133514986376,
+ "grad_norm": 5.968530178070068,
+ "learning_rate": 1.4142178334317356e-05,
+ "loss": 0.3093,
+ "step": 14061
+ },
+ {
+ "epoch": 38.31607629427793,
+ "grad_norm": 6.009503364562988,
+ "learning_rate": 1.4141375091182746e-05,
+ "loss": 0.274,
+ "step": 14062
+ },
+ {
+ "epoch": 38.31880108991825,
+ "grad_norm": 5.930474758148193,
+ "learning_rate": 1.4140571815795242e-05,
+ "loss": 0.2842,
+ "step": 14063
+ },
+ {
+ "epoch": 38.321525885558586,
+ "grad_norm": 7.296756744384766,
+ "learning_rate": 1.4139768508161097e-05,
+ "loss": 0.413,
+ "step": 14064
+ },
+ {
+ "epoch": 38.32425068119891,
+ "grad_norm": 6.180625915527344,
+ "learning_rate": 1.4138965168286567e-05,
+ "loss": 0.2228,
+ "step": 14065
+ },
+ {
+ "epoch": 38.32697547683924,
+ "grad_norm": 5.570156574249268,
+ "learning_rate": 1.4138161796177909e-05,
+ "loss": 0.3784,
+ "step": 14066
+ },
+ {
+ "epoch": 38.32970027247956,
+ "grad_norm": 6.180319786071777,
+ "learning_rate": 1.4137358391841383e-05,
+ "loss": 0.2585,
+ "step": 14067
+ },
+ {
+ "epoch": 38.33242506811989,
+ "grad_norm": 13.237462997436523,
+ "learning_rate": 1.413655495528324e-05,
+ "loss": 0.2354,
+ "step": 14068
+ },
+ {
+ "epoch": 38.335149863760215,
+ "grad_norm": 5.750713348388672,
+ "learning_rate": 1.4135751486509743e-05,
+ "loss": 0.3899,
+ "step": 14069
+ },
+ {
+ "epoch": 38.33787465940055,
+ "grad_norm": 5.069406032562256,
+ "learning_rate": 1.4134947985527143e-05,
+ "loss": 0.2599,
+ "step": 14070
+ },
+ {
+ "epoch": 38.34059945504087,
+ "grad_norm": 5.973121643066406,
+ "learning_rate": 1.4134144452341702e-05,
+ "loss": 0.3579,
+ "step": 14071
+ },
+ {
+ "epoch": 38.3433242506812,
+ "grad_norm": 7.9918904304504395,
+ "learning_rate": 1.4133340886959678e-05,
+ "loss": 0.2699,
+ "step": 14072
+ },
+ {
+ "epoch": 38.346049046321525,
+ "grad_norm": 5.275363922119141,
+ "learning_rate": 1.4132537289387331e-05,
+ "loss": 0.2417,
+ "step": 14073
+ },
+ {
+ "epoch": 38.34877384196185,
+ "grad_norm": 10.604673385620117,
+ "learning_rate": 1.4131733659630913e-05,
+ "loss": 0.2502,
+ "step": 14074
+ },
+ {
+ "epoch": 38.35149863760218,
+ "grad_norm": 4.963611602783203,
+ "learning_rate": 1.4130929997696688e-05,
+ "loss": 0.3596,
+ "step": 14075
+ },
+ {
+ "epoch": 38.35422343324251,
+ "grad_norm": 6.919105052947998,
+ "learning_rate": 1.4130126303590911e-05,
+ "loss": 0.3586,
+ "step": 14076
+ },
+ {
+ "epoch": 38.356948228882835,
+ "grad_norm": 7.2395501136779785,
+ "learning_rate": 1.4129322577319846e-05,
+ "loss": 0.2636,
+ "step": 14077
+ },
+ {
+ "epoch": 38.35967302452316,
+ "grad_norm": 6.036019802093506,
+ "learning_rate": 1.4128518818889747e-05,
+ "loss": 0.424,
+ "step": 14078
+ },
+ {
+ "epoch": 38.36239782016349,
+ "grad_norm": 8.016825675964355,
+ "learning_rate": 1.4127715028306879e-05,
+ "loss": 0.2052,
+ "step": 14079
+ },
+ {
+ "epoch": 38.36512261580381,
+ "grad_norm": 7.741454601287842,
+ "learning_rate": 1.4126911205577495e-05,
+ "loss": 0.2644,
+ "step": 14080
+ },
+ {
+ "epoch": 38.36784741144414,
+ "grad_norm": 6.438891887664795,
+ "learning_rate": 1.4126107350707865e-05,
+ "loss": 0.3134,
+ "step": 14081
+ },
+ {
+ "epoch": 38.37057220708447,
+ "grad_norm": 5.113155364990234,
+ "learning_rate": 1.4125303463704241e-05,
+ "loss": 0.2095,
+ "step": 14082
+ },
+ {
+ "epoch": 38.3732970027248,
+ "grad_norm": 5.299055576324463,
+ "learning_rate": 1.4124499544572887e-05,
+ "loss": 0.355,
+ "step": 14083
+ },
+ {
+ "epoch": 38.37602179836512,
+ "grad_norm": 6.142955780029297,
+ "learning_rate": 1.4123695593320062e-05,
+ "loss": 0.2477,
+ "step": 14084
+ },
+ {
+ "epoch": 38.37874659400545,
+ "grad_norm": 6.0444488525390625,
+ "learning_rate": 1.4122891609952029e-05,
+ "loss": 0.2831,
+ "step": 14085
+ },
+ {
+ "epoch": 38.381471389645775,
+ "grad_norm": 8.738221168518066,
+ "learning_rate": 1.4122087594475049e-05,
+ "loss": 0.2417,
+ "step": 14086
+ },
+ {
+ "epoch": 38.3841961852861,
+ "grad_norm": 6.144389629364014,
+ "learning_rate": 1.4121283546895384e-05,
+ "loss": 0.2614,
+ "step": 14087
+ },
+ {
+ "epoch": 38.38692098092643,
+ "grad_norm": 6.7994384765625,
+ "learning_rate": 1.4120479467219292e-05,
+ "loss": 0.2132,
+ "step": 14088
+ },
+ {
+ "epoch": 38.38964577656676,
+ "grad_norm": 5.979526042938232,
+ "learning_rate": 1.4119675355453044e-05,
+ "loss": 0.2659,
+ "step": 14089
+ },
+ {
+ "epoch": 38.392370572207085,
+ "grad_norm": 5.767601490020752,
+ "learning_rate": 1.4118871211602893e-05,
+ "loss": 0.2061,
+ "step": 14090
+ },
+ {
+ "epoch": 38.39509536784741,
+ "grad_norm": 5.567809581756592,
+ "learning_rate": 1.411806703567511e-05,
+ "loss": 0.2214,
+ "step": 14091
+ },
+ {
+ "epoch": 38.39782016348774,
+ "grad_norm": 5.281261444091797,
+ "learning_rate": 1.4117262827675946e-05,
+ "loss": 0.1668,
+ "step": 14092
+ },
+ {
+ "epoch": 38.40054495912806,
+ "grad_norm": 5.884829044342041,
+ "learning_rate": 1.4116458587611678e-05,
+ "loss": 0.2425,
+ "step": 14093
+ },
+ {
+ "epoch": 38.403269754768395,
+ "grad_norm": 5.767762184143066,
+ "learning_rate": 1.411565431548856e-05,
+ "loss": 0.285,
+ "step": 14094
+ },
+ {
+ "epoch": 38.40599455040872,
+ "grad_norm": 5.065497398376465,
+ "learning_rate": 1.4114850011312861e-05,
+ "loss": 0.4338,
+ "step": 14095
+ },
+ {
+ "epoch": 38.40871934604905,
+ "grad_norm": 6.914985656738281,
+ "learning_rate": 1.411404567509084e-05,
+ "loss": 0.3231,
+ "step": 14096
+ },
+ {
+ "epoch": 38.41144414168937,
+ "grad_norm": 4.989675521850586,
+ "learning_rate": 1.4113241306828764e-05,
+ "loss": 0.2965,
+ "step": 14097
+ },
+ {
+ "epoch": 38.4141689373297,
+ "grad_norm": 14.356376647949219,
+ "learning_rate": 1.4112436906532898e-05,
+ "loss": 0.2072,
+ "step": 14098
+ },
+ {
+ "epoch": 38.416893732970024,
+ "grad_norm": 5.906617641448975,
+ "learning_rate": 1.4111632474209506e-05,
+ "loss": 0.2074,
+ "step": 14099
+ },
+ {
+ "epoch": 38.41961852861036,
+ "grad_norm": 5.60844612121582,
+ "learning_rate": 1.4110828009864853e-05,
+ "loss": 0.2516,
+ "step": 14100
+ },
+ {
+ "epoch": 38.42234332425068,
+ "grad_norm": 6.221306324005127,
+ "learning_rate": 1.4110023513505201e-05,
+ "loss": 0.2279,
+ "step": 14101
+ },
+ {
+ "epoch": 38.42506811989101,
+ "grad_norm": 5.365349769592285,
+ "learning_rate": 1.410921898513682e-05,
+ "loss": 0.185,
+ "step": 14102
+ },
+ {
+ "epoch": 38.427792915531334,
+ "grad_norm": 5.050516128540039,
+ "learning_rate": 1.4108414424765978e-05,
+ "loss": 0.2157,
+ "step": 14103
+ },
+ {
+ "epoch": 38.43051771117166,
+ "grad_norm": 5.983419895172119,
+ "learning_rate": 1.410760983239893e-05,
+ "loss": 0.3295,
+ "step": 14104
+ },
+ {
+ "epoch": 38.433242506811986,
+ "grad_norm": 6.8474531173706055,
+ "learning_rate": 1.4106805208041951e-05,
+ "loss": 0.2852,
+ "step": 14105
+ },
+ {
+ "epoch": 38.43596730245232,
+ "grad_norm": 7.26201057434082,
+ "learning_rate": 1.4106000551701309e-05,
+ "loss": 0.1926,
+ "step": 14106
+ },
+ {
+ "epoch": 38.438692098092645,
+ "grad_norm": 5.860100269317627,
+ "learning_rate": 1.4105195863383261e-05,
+ "loss": 0.2115,
+ "step": 14107
+ },
+ {
+ "epoch": 38.44141689373297,
+ "grad_norm": 6.6750688552856445,
+ "learning_rate": 1.4104391143094086e-05,
+ "loss": 0.2304,
+ "step": 14108
+ },
+ {
+ "epoch": 38.444141689373296,
+ "grad_norm": 9.718730926513672,
+ "learning_rate": 1.4103586390840038e-05,
+ "loss": 0.3804,
+ "step": 14109
+ },
+ {
+ "epoch": 38.44686648501362,
+ "grad_norm": 18.901268005371094,
+ "learning_rate": 1.4102781606627393e-05,
+ "loss": 0.2413,
+ "step": 14110
+ },
+ {
+ "epoch": 38.44959128065395,
+ "grad_norm": 5.725854873657227,
+ "learning_rate": 1.4101976790462421e-05,
+ "loss": 0.3876,
+ "step": 14111
+ },
+ {
+ "epoch": 38.45231607629428,
+ "grad_norm": 5.962811470031738,
+ "learning_rate": 1.4101171942351381e-05,
+ "loss": 0.3008,
+ "step": 14112
+ },
+ {
+ "epoch": 38.45504087193461,
+ "grad_norm": 8.318543434143066,
+ "learning_rate": 1.4100367062300548e-05,
+ "loss": 0.2971,
+ "step": 14113
+ },
+ {
+ "epoch": 38.45776566757493,
+ "grad_norm": 10.843289375305176,
+ "learning_rate": 1.409956215031619e-05,
+ "loss": 0.2088,
+ "step": 14114
+ },
+ {
+ "epoch": 38.46049046321526,
+ "grad_norm": 7.146448135375977,
+ "learning_rate": 1.4098757206404572e-05,
+ "loss": 0.3005,
+ "step": 14115
+ },
+ {
+ "epoch": 38.463215258855584,
+ "grad_norm": 5.454993724822998,
+ "learning_rate": 1.4097952230571965e-05,
+ "loss": 0.4388,
+ "step": 14116
+ },
+ {
+ "epoch": 38.46594005449591,
+ "grad_norm": 6.234476089477539,
+ "learning_rate": 1.4097147222824639e-05,
+ "loss": 0.2959,
+ "step": 14117
+ },
+ {
+ "epoch": 38.46866485013624,
+ "grad_norm": 5.893165111541748,
+ "learning_rate": 1.4096342183168861e-05,
+ "loss": 0.2718,
+ "step": 14118
+ },
+ {
+ "epoch": 38.47138964577657,
+ "grad_norm": 6.857761383056641,
+ "learning_rate": 1.4095537111610903e-05,
+ "loss": 0.3173,
+ "step": 14119
+ },
+ {
+ "epoch": 38.474114441416894,
+ "grad_norm": 6.331696033477783,
+ "learning_rate": 1.4094732008157032e-05,
+ "loss": 0.2225,
+ "step": 14120
+ },
+ {
+ "epoch": 38.47683923705722,
+ "grad_norm": 6.403774738311768,
+ "learning_rate": 1.409392687281352e-05,
+ "loss": 0.3651,
+ "step": 14121
+ },
+ {
+ "epoch": 38.479564032697546,
+ "grad_norm": 7.785304546356201,
+ "learning_rate": 1.4093121705586637e-05,
+ "loss": 0.2133,
+ "step": 14122
+ },
+ {
+ "epoch": 38.48228882833787,
+ "grad_norm": 6.4889397621154785,
+ "learning_rate": 1.4092316506482656e-05,
+ "loss": 0.3135,
+ "step": 14123
+ },
+ {
+ "epoch": 38.485013623978205,
+ "grad_norm": 6.590969085693359,
+ "learning_rate": 1.4091511275507845e-05,
+ "loss": 0.2579,
+ "step": 14124
+ },
+ {
+ "epoch": 38.48773841961853,
+ "grad_norm": 5.812717914581299,
+ "learning_rate": 1.4090706012668474e-05,
+ "loss": 0.1655,
+ "step": 14125
+ },
+ {
+ "epoch": 38.490463215258856,
+ "grad_norm": 6.541272163391113,
+ "learning_rate": 1.4089900717970819e-05,
+ "loss": 0.3709,
+ "step": 14126
+ },
+ {
+ "epoch": 38.49318801089918,
+ "grad_norm": 5.469993591308594,
+ "learning_rate": 1.4089095391421148e-05,
+ "loss": 0.3217,
+ "step": 14127
+ },
+ {
+ "epoch": 38.49591280653951,
+ "grad_norm": 5.711572170257568,
+ "learning_rate": 1.4088290033025736e-05,
+ "loss": 0.2817,
+ "step": 14128
+ },
+ {
+ "epoch": 38.49863760217983,
+ "grad_norm": 12.279172897338867,
+ "learning_rate": 1.4087484642790847e-05,
+ "loss": 0.1995,
+ "step": 14129
+ },
+ {
+ "epoch": 38.50136239782017,
+ "grad_norm": 8.407028198242188,
+ "learning_rate": 1.4086679220722765e-05,
+ "loss": 0.2884,
+ "step": 14130
+ },
+ {
+ "epoch": 38.50408719346049,
+ "grad_norm": 7.350332736968994,
+ "learning_rate": 1.4085873766827751e-05,
+ "loss": 0.2821,
+ "step": 14131
+ },
+ {
+ "epoch": 38.50681198910082,
+ "grad_norm": 7.881537914276123,
+ "learning_rate": 1.408506828111209e-05,
+ "loss": 0.2552,
+ "step": 14132
+ },
+ {
+ "epoch": 38.509536784741144,
+ "grad_norm": 21.630401611328125,
+ "learning_rate": 1.4084262763582044e-05,
+ "loss": 0.4385,
+ "step": 14133
+ },
+ {
+ "epoch": 38.51226158038147,
+ "grad_norm": 6.939113140106201,
+ "learning_rate": 1.4083457214243891e-05,
+ "loss": 0.3754,
+ "step": 14134
+ },
+ {
+ "epoch": 38.514986376021795,
+ "grad_norm": 5.386192798614502,
+ "learning_rate": 1.4082651633103908e-05,
+ "loss": 0.2091,
+ "step": 14135
+ },
+ {
+ "epoch": 38.51771117166213,
+ "grad_norm": 7.200022220611572,
+ "learning_rate": 1.4081846020168363e-05,
+ "loss": 0.3168,
+ "step": 14136
+ },
+ {
+ "epoch": 38.520435967302454,
+ "grad_norm": 6.039146423339844,
+ "learning_rate": 1.4081040375443533e-05,
+ "loss": 0.2479,
+ "step": 14137
+ },
+ {
+ "epoch": 38.52316076294278,
+ "grad_norm": 5.907276630401611,
+ "learning_rate": 1.4080234698935693e-05,
+ "loss": 0.3587,
+ "step": 14138
+ },
+ {
+ "epoch": 38.525885558583106,
+ "grad_norm": 7.188309669494629,
+ "learning_rate": 1.4079428990651113e-05,
+ "loss": 0.2617,
+ "step": 14139
+ },
+ {
+ "epoch": 38.52861035422343,
+ "grad_norm": 5.692146301269531,
+ "learning_rate": 1.4078623250596075e-05,
+ "loss": 0.3438,
+ "step": 14140
+ },
+ {
+ "epoch": 38.53133514986376,
+ "grad_norm": 6.520361423492432,
+ "learning_rate": 1.407781747877685e-05,
+ "loss": 0.1848,
+ "step": 14141
+ },
+ {
+ "epoch": 38.53405994550409,
+ "grad_norm": 6.540200710296631,
+ "learning_rate": 1.4077011675199713e-05,
+ "loss": 0.2134,
+ "step": 14142
+ },
+ {
+ "epoch": 38.536784741144416,
+ "grad_norm": 5.5721845626831055,
+ "learning_rate": 1.407620583987094e-05,
+ "loss": 0.2358,
+ "step": 14143
+ },
+ {
+ "epoch": 38.53950953678474,
+ "grad_norm": 6.2767510414123535,
+ "learning_rate": 1.4075399972796808e-05,
+ "loss": 0.3628,
+ "step": 14144
+ },
+ {
+ "epoch": 38.54223433242507,
+ "grad_norm": 6.600429058074951,
+ "learning_rate": 1.4074594073983592e-05,
+ "loss": 0.3173,
+ "step": 14145
+ },
+ {
+ "epoch": 38.54495912806539,
+ "grad_norm": 5.381121635437012,
+ "learning_rate": 1.4073788143437568e-05,
+ "loss": 0.2903,
+ "step": 14146
+ },
+ {
+ "epoch": 38.54768392370572,
+ "grad_norm": 8.758638381958008,
+ "learning_rate": 1.4072982181165014e-05,
+ "loss": 0.4308,
+ "step": 14147
+ },
+ {
+ "epoch": 38.55040871934605,
+ "grad_norm": 6.545938491821289,
+ "learning_rate": 1.4072176187172204e-05,
+ "loss": 0.2765,
+ "step": 14148
+ },
+ {
+ "epoch": 38.55313351498638,
+ "grad_norm": 6.275467872619629,
+ "learning_rate": 1.4071370161465417e-05,
+ "loss": 0.3501,
+ "step": 14149
+ },
+ {
+ "epoch": 38.555858310626704,
+ "grad_norm": 6.002571105957031,
+ "learning_rate": 1.407056410405093e-05,
+ "loss": 0.3592,
+ "step": 14150
+ },
+ {
+ "epoch": 38.55858310626703,
+ "grad_norm": 6.76323127746582,
+ "learning_rate": 1.4069758014935023e-05,
+ "loss": 0.2618,
+ "step": 14151
+ },
+ {
+ "epoch": 38.561307901907355,
+ "grad_norm": 5.465998649597168,
+ "learning_rate": 1.406895189412397e-05,
+ "loss": 0.2019,
+ "step": 14152
+ },
+ {
+ "epoch": 38.56403269754768,
+ "grad_norm": 5.174844741821289,
+ "learning_rate": 1.406814574162405e-05,
+ "loss": 0.2363,
+ "step": 14153
+ },
+ {
+ "epoch": 38.566757493188014,
+ "grad_norm": 5.759891033172607,
+ "learning_rate": 1.4067339557441546e-05,
+ "loss": 0.447,
+ "step": 14154
+ },
+ {
+ "epoch": 38.56948228882834,
+ "grad_norm": 7.666831970214844,
+ "learning_rate": 1.406653334158273e-05,
+ "loss": 0.2877,
+ "step": 14155
+ },
+ {
+ "epoch": 38.572207084468666,
+ "grad_norm": 8.34528923034668,
+ "learning_rate": 1.406572709405388e-05,
+ "loss": 0.293,
+ "step": 14156
+ },
+ {
+ "epoch": 38.57493188010899,
+ "grad_norm": 5.085103988647461,
+ "learning_rate": 1.406492081486128e-05,
+ "loss": 0.1782,
+ "step": 14157
+ },
+ {
+ "epoch": 38.57765667574932,
+ "grad_norm": 6.896602630615234,
+ "learning_rate": 1.406411450401121e-05,
+ "loss": 0.3162,
+ "step": 14158
+ },
+ {
+ "epoch": 38.58038147138964,
+ "grad_norm": 7.838594913482666,
+ "learning_rate": 1.4063308161509945e-05,
+ "loss": 0.2968,
+ "step": 14159
+ },
+ {
+ "epoch": 38.583106267029976,
+ "grad_norm": 6.963497638702393,
+ "learning_rate": 1.406250178736377e-05,
+ "loss": 0.1873,
+ "step": 14160
+ },
+ {
+ "epoch": 38.5858310626703,
+ "grad_norm": 12.829331398010254,
+ "learning_rate": 1.4061695381578957e-05,
+ "loss": 0.4227,
+ "step": 14161
+ },
+ {
+ "epoch": 38.58855585831063,
+ "grad_norm": 6.674540042877197,
+ "learning_rate": 1.4060888944161795e-05,
+ "loss": 0.1976,
+ "step": 14162
+ },
+ {
+ "epoch": 38.59128065395095,
+ "grad_norm": 6.406482696533203,
+ "learning_rate": 1.4060082475118558e-05,
+ "loss": 0.3204,
+ "step": 14163
+ },
+ {
+ "epoch": 38.59400544959128,
+ "grad_norm": 10.174060821533203,
+ "learning_rate": 1.4059275974455531e-05,
+ "loss": 0.2983,
+ "step": 14164
+ },
+ {
+ "epoch": 38.596730245231605,
+ "grad_norm": 5.605705738067627,
+ "learning_rate": 1.4058469442178987e-05,
+ "loss": 0.306,
+ "step": 14165
+ },
+ {
+ "epoch": 38.59945504087194,
+ "grad_norm": 6.45618200302124,
+ "learning_rate": 1.4057662878295221e-05,
+ "loss": 0.2862,
+ "step": 14166
+ },
+ {
+ "epoch": 38.60217983651226,
+ "grad_norm": 8.21015453338623,
+ "learning_rate": 1.4056856282810505e-05,
+ "loss": 0.2853,
+ "step": 14167
+ },
+ {
+ "epoch": 38.60490463215259,
+ "grad_norm": 6.817403316497803,
+ "learning_rate": 1.4056049655731125e-05,
+ "loss": 0.3779,
+ "step": 14168
+ },
+ {
+ "epoch": 38.607629427792915,
+ "grad_norm": 5.516331672668457,
+ "learning_rate": 1.4055242997063359e-05,
+ "loss": 0.2109,
+ "step": 14169
+ },
+ {
+ "epoch": 38.61035422343324,
+ "grad_norm": 6.00640869140625,
+ "learning_rate": 1.4054436306813491e-05,
+ "loss": 0.2894,
+ "step": 14170
+ },
+ {
+ "epoch": 38.61307901907357,
+ "grad_norm": 6.030162811279297,
+ "learning_rate": 1.4053629584987802e-05,
+ "loss": 0.212,
+ "step": 14171
+ },
+ {
+ "epoch": 38.6158038147139,
+ "grad_norm": 5.575711250305176,
+ "learning_rate": 1.405282283159258e-05,
+ "loss": 0.228,
+ "step": 14172
+ },
+ {
+ "epoch": 38.618528610354225,
+ "grad_norm": 5.750463962554932,
+ "learning_rate": 1.4052016046634101e-05,
+ "loss": 0.2615,
+ "step": 14173
+ },
+ {
+ "epoch": 38.62125340599455,
+ "grad_norm": 6.629801273345947,
+ "learning_rate": 1.4051209230118652e-05,
+ "loss": 0.3496,
+ "step": 14174
+ },
+ {
+ "epoch": 38.62397820163488,
+ "grad_norm": 7.826570987701416,
+ "learning_rate": 1.4050402382052514e-05,
+ "loss": 0.3402,
+ "step": 14175
+ },
+ {
+ "epoch": 38.6267029972752,
+ "grad_norm": 4.923995494842529,
+ "learning_rate": 1.4049595502441977e-05,
+ "loss": 0.2725,
+ "step": 14176
+ },
+ {
+ "epoch": 38.62942779291553,
+ "grad_norm": 5.763731956481934,
+ "learning_rate": 1.4048788591293318e-05,
+ "loss": 0.2625,
+ "step": 14177
+ },
+ {
+ "epoch": 38.63215258855586,
+ "grad_norm": 6.039249897003174,
+ "learning_rate": 1.4047981648612824e-05,
+ "loss": 0.2596,
+ "step": 14178
+ },
+ {
+ "epoch": 38.63487738419619,
+ "grad_norm": 7.992038726806641,
+ "learning_rate": 1.4047174674406781e-05,
+ "loss": 0.2342,
+ "step": 14179
+ },
+ {
+ "epoch": 38.63760217983651,
+ "grad_norm": 6.105435848236084,
+ "learning_rate": 1.4046367668681471e-05,
+ "loss": 0.2958,
+ "step": 14180
+ },
+ {
+ "epoch": 38.64032697547684,
+ "grad_norm": 5.173197269439697,
+ "learning_rate": 1.4045560631443178e-05,
+ "loss": 0.2477,
+ "step": 14181
+ },
+ {
+ "epoch": 38.643051771117165,
+ "grad_norm": 7.096261978149414,
+ "learning_rate": 1.4044753562698188e-05,
+ "loss": 0.2266,
+ "step": 14182
+ },
+ {
+ "epoch": 38.64577656675749,
+ "grad_norm": 6.047508239746094,
+ "learning_rate": 1.4043946462452791e-05,
+ "loss": 0.3668,
+ "step": 14183
+ },
+ {
+ "epoch": 38.64850136239782,
+ "grad_norm": 8.10651969909668,
+ "learning_rate": 1.4043139330713267e-05,
+ "loss": 0.1872,
+ "step": 14184
+ },
+ {
+ "epoch": 38.65122615803815,
+ "grad_norm": 7.908143997192383,
+ "learning_rate": 1.4042332167485904e-05,
+ "loss": 0.2151,
+ "step": 14185
+ },
+ {
+ "epoch": 38.653950953678475,
+ "grad_norm": 7.34572696685791,
+ "learning_rate": 1.4041524972776989e-05,
+ "loss": 0.3318,
+ "step": 14186
+ },
+ {
+ "epoch": 38.6566757493188,
+ "grad_norm": 6.163498401641846,
+ "learning_rate": 1.404071774659281e-05,
+ "loss": 0.2318,
+ "step": 14187
+ },
+ {
+ "epoch": 38.65940054495913,
+ "grad_norm": 5.7085652351379395,
+ "learning_rate": 1.4039910488939648e-05,
+ "loss": 0.5327,
+ "step": 14188
+ },
+ {
+ "epoch": 38.66212534059945,
+ "grad_norm": 6.371049880981445,
+ "learning_rate": 1.4039103199823794e-05,
+ "loss": 0.3045,
+ "step": 14189
+ },
+ {
+ "epoch": 38.664850136239785,
+ "grad_norm": 6.019608974456787,
+ "learning_rate": 1.4038295879251535e-05,
+ "loss": 0.2065,
+ "step": 14190
+ },
+ {
+ "epoch": 38.66757493188011,
+ "grad_norm": 6.799952030181885,
+ "learning_rate": 1.4037488527229156e-05,
+ "loss": 0.1905,
+ "step": 14191
+ },
+ {
+ "epoch": 38.67029972752044,
+ "grad_norm": 6.0175018310546875,
+ "learning_rate": 1.4036681143762945e-05,
+ "loss": 0.3696,
+ "step": 14192
+ },
+ {
+ "epoch": 38.67302452316076,
+ "grad_norm": 5.6262922286987305,
+ "learning_rate": 1.4035873728859195e-05,
+ "loss": 0.4247,
+ "step": 14193
+ },
+ {
+ "epoch": 38.67574931880109,
+ "grad_norm": 5.667084693908691,
+ "learning_rate": 1.4035066282524188e-05,
+ "loss": 0.1786,
+ "step": 14194
+ },
+ {
+ "epoch": 38.678474114441414,
+ "grad_norm": 6.430644512176514,
+ "learning_rate": 1.4034258804764217e-05,
+ "loss": 0.2489,
+ "step": 14195
+ },
+ {
+ "epoch": 38.68119891008175,
+ "grad_norm": 6.629088878631592,
+ "learning_rate": 1.4033451295585565e-05,
+ "loss": 0.2445,
+ "step": 14196
+ },
+ {
+ "epoch": 38.68392370572207,
+ "grad_norm": 5.922722816467285,
+ "learning_rate": 1.4032643754994526e-05,
+ "loss": 0.26,
+ "step": 14197
+ },
+ {
+ "epoch": 38.6866485013624,
+ "grad_norm": 6.801407337188721,
+ "learning_rate": 1.4031836182997387e-05,
+ "loss": 0.2057,
+ "step": 14198
+ },
+ {
+ "epoch": 38.689373297002724,
+ "grad_norm": 7.064025402069092,
+ "learning_rate": 1.4031028579600436e-05,
+ "loss": 0.2804,
+ "step": 14199
+ },
+ {
+ "epoch": 38.69209809264305,
+ "grad_norm": 6.30210018157959,
+ "learning_rate": 1.4030220944809965e-05,
+ "loss": 0.2088,
+ "step": 14200
+ },
+ {
+ "epoch": 38.694822888283376,
+ "grad_norm": 5.764710903167725,
+ "learning_rate": 1.4029413278632266e-05,
+ "loss": 0.2938,
+ "step": 14201
+ },
+ {
+ "epoch": 38.69754768392371,
+ "grad_norm": 4.9857096672058105,
+ "learning_rate": 1.4028605581073623e-05,
+ "loss": 0.3989,
+ "step": 14202
+ },
+ {
+ "epoch": 38.700272479564035,
+ "grad_norm": 5.339354038238525,
+ "learning_rate": 1.402779785214033e-05,
+ "loss": 0.3175,
+ "step": 14203
+ },
+ {
+ "epoch": 38.70299727520436,
+ "grad_norm": 7.36276912689209,
+ "learning_rate": 1.4026990091838677e-05,
+ "loss": 0.3404,
+ "step": 14204
+ },
+ {
+ "epoch": 38.705722070844686,
+ "grad_norm": 6.679203510284424,
+ "learning_rate": 1.4026182300174955e-05,
+ "loss": 0.2287,
+ "step": 14205
+ },
+ {
+ "epoch": 38.70844686648501,
+ "grad_norm": 5.4260711669921875,
+ "learning_rate": 1.4025374477155453e-05,
+ "loss": 0.2688,
+ "step": 14206
+ },
+ {
+ "epoch": 38.71117166212534,
+ "grad_norm": 6.5926079750061035,
+ "learning_rate": 1.4024566622786468e-05,
+ "loss": 0.2319,
+ "step": 14207
+ },
+ {
+ "epoch": 38.71389645776567,
+ "grad_norm": 6.10131311416626,
+ "learning_rate": 1.4023758737074284e-05,
+ "loss": 0.3527,
+ "step": 14208
+ },
+ {
+ "epoch": 38.716621253406,
+ "grad_norm": 5.418936252593994,
+ "learning_rate": 1.4022950820025198e-05,
+ "loss": 0.2347,
+ "step": 14209
+ },
+ {
+ "epoch": 38.71934604904632,
+ "grad_norm": 6.062687397003174,
+ "learning_rate": 1.40221428716455e-05,
+ "loss": 0.2633,
+ "step": 14210
+ },
+ {
+ "epoch": 38.72207084468665,
+ "grad_norm": 6.946159839630127,
+ "learning_rate": 1.4021334891941484e-05,
+ "loss": 0.2942,
+ "step": 14211
+ },
+ {
+ "epoch": 38.724795640326974,
+ "grad_norm": 7.638200283050537,
+ "learning_rate": 1.4020526880919439e-05,
+ "loss": 0.2323,
+ "step": 14212
+ },
+ {
+ "epoch": 38.7275204359673,
+ "grad_norm": 6.2911601066589355,
+ "learning_rate": 1.4019718838585664e-05,
+ "loss": 0.2085,
+ "step": 14213
+ },
+ {
+ "epoch": 38.73024523160763,
+ "grad_norm": 5.667962074279785,
+ "learning_rate": 1.4018910764946445e-05,
+ "loss": 0.3607,
+ "step": 14214
+ },
+ {
+ "epoch": 38.73297002724796,
+ "grad_norm": 5.755716800689697,
+ "learning_rate": 1.4018102660008079e-05,
+ "loss": 0.2263,
+ "step": 14215
+ },
+ {
+ "epoch": 38.735694822888284,
+ "grad_norm": 6.369229793548584,
+ "learning_rate": 1.4017294523776859e-05,
+ "loss": 0.3123,
+ "step": 14216
+ },
+ {
+ "epoch": 38.73841961852861,
+ "grad_norm": 6.430229663848877,
+ "learning_rate": 1.4016486356259076e-05,
+ "loss": 0.2245,
+ "step": 14217
+ },
+ {
+ "epoch": 38.741144414168936,
+ "grad_norm": 7.5628252029418945,
+ "learning_rate": 1.4015678157461028e-05,
+ "loss": 0.3125,
+ "step": 14218
+ },
+ {
+ "epoch": 38.74386920980926,
+ "grad_norm": 6.894842624664307,
+ "learning_rate": 1.401486992738901e-05,
+ "loss": 0.323,
+ "step": 14219
+ },
+ {
+ "epoch": 38.746594005449595,
+ "grad_norm": 5.481640338897705,
+ "learning_rate": 1.4014061666049312e-05,
+ "loss": 0.2659,
+ "step": 14220
+ },
+ {
+ "epoch": 38.74931880108992,
+ "grad_norm": 5.837904453277588,
+ "learning_rate": 1.4013253373448232e-05,
+ "loss": 0.1764,
+ "step": 14221
+ },
+ {
+ "epoch": 38.752043596730246,
+ "grad_norm": 6.2947893142700195,
+ "learning_rate": 1.4012445049592063e-05,
+ "loss": 0.3758,
+ "step": 14222
+ },
+ {
+ "epoch": 38.75476839237057,
+ "grad_norm": 6.084985733032227,
+ "learning_rate": 1.4011636694487103e-05,
+ "loss": 0.2057,
+ "step": 14223
+ },
+ {
+ "epoch": 38.7574931880109,
+ "grad_norm": 9.457454681396484,
+ "learning_rate": 1.4010828308139644e-05,
+ "loss": 0.2041,
+ "step": 14224
+ },
+ {
+ "epoch": 38.76021798365122,
+ "grad_norm": 6.452712535858154,
+ "learning_rate": 1.4010019890555982e-05,
+ "loss": 0.2663,
+ "step": 14225
+ },
+ {
+ "epoch": 38.762942779291556,
+ "grad_norm": 5.780202388763428,
+ "learning_rate": 1.4009211441742413e-05,
+ "loss": 0.394,
+ "step": 14226
+ },
+ {
+ "epoch": 38.76566757493188,
+ "grad_norm": 7.74014139175415,
+ "learning_rate": 1.4008402961705238e-05,
+ "loss": 0.3185,
+ "step": 14227
+ },
+ {
+ "epoch": 38.76839237057221,
+ "grad_norm": 6.427647590637207,
+ "learning_rate": 1.400759445045075e-05,
+ "loss": 0.2703,
+ "step": 14228
+ },
+ {
+ "epoch": 38.771117166212534,
+ "grad_norm": 6.909052848815918,
+ "learning_rate": 1.4006785907985245e-05,
+ "loss": 0.2979,
+ "step": 14229
+ },
+ {
+ "epoch": 38.77384196185286,
+ "grad_norm": 5.844265460968018,
+ "learning_rate": 1.4005977334315017e-05,
+ "loss": 0.4356,
+ "step": 14230
+ },
+ {
+ "epoch": 38.776566757493185,
+ "grad_norm": 5.299291133880615,
+ "learning_rate": 1.4005168729446372e-05,
+ "loss": 0.1722,
+ "step": 14231
+ },
+ {
+ "epoch": 38.77929155313352,
+ "grad_norm": 5.50273323059082,
+ "learning_rate": 1.4004360093385599e-05,
+ "loss": 0.3339,
+ "step": 14232
+ },
+ {
+ "epoch": 38.782016348773844,
+ "grad_norm": 6.551215171813965,
+ "learning_rate": 1.4003551426138998e-05,
+ "loss": 0.2394,
+ "step": 14233
+ },
+ {
+ "epoch": 38.78474114441417,
+ "grad_norm": 7.548563480377197,
+ "learning_rate": 1.4002742727712863e-05,
+ "loss": 0.3318,
+ "step": 14234
+ },
+ {
+ "epoch": 38.787465940054496,
+ "grad_norm": 5.244667053222656,
+ "learning_rate": 1.4001933998113504e-05,
+ "loss": 0.2234,
+ "step": 14235
+ },
+ {
+ "epoch": 38.79019073569482,
+ "grad_norm": 6.541910648345947,
+ "learning_rate": 1.4001125237347206e-05,
+ "loss": 0.2836,
+ "step": 14236
+ },
+ {
+ "epoch": 38.79291553133515,
+ "grad_norm": 5.8126091957092285,
+ "learning_rate": 1.4000316445420279e-05,
+ "loss": 0.23,
+ "step": 14237
+ },
+ {
+ "epoch": 38.79564032697548,
+ "grad_norm": 7.460387706756592,
+ "learning_rate": 1.3999507622339013e-05,
+ "loss": 0.2507,
+ "step": 14238
+ },
+ {
+ "epoch": 38.798365122615806,
+ "grad_norm": 6.648134708404541,
+ "learning_rate": 1.399869876810971e-05,
+ "loss": 0.3432,
+ "step": 14239
+ },
+ {
+ "epoch": 38.80108991825613,
+ "grad_norm": 7.125775337219238,
+ "learning_rate": 1.3997889882738671e-05,
+ "loss": 0.2813,
+ "step": 14240
+ },
+ {
+ "epoch": 38.80381471389646,
+ "grad_norm": 5.923659801483154,
+ "learning_rate": 1.3997080966232195e-05,
+ "loss": 0.1668,
+ "step": 14241
+ },
+ {
+ "epoch": 38.80653950953678,
+ "grad_norm": 7.02187442779541,
+ "learning_rate": 1.399627201859658e-05,
+ "loss": 0.2254,
+ "step": 14242
+ },
+ {
+ "epoch": 38.80926430517711,
+ "grad_norm": 8.10549259185791,
+ "learning_rate": 1.3995463039838123e-05,
+ "loss": 0.2408,
+ "step": 14243
+ },
+ {
+ "epoch": 38.81198910081744,
+ "grad_norm": 4.8937883377075195,
+ "learning_rate": 1.3994654029963132e-05,
+ "loss": 0.3194,
+ "step": 14244
+ },
+ {
+ "epoch": 38.81471389645777,
+ "grad_norm": 6.10452127456665,
+ "learning_rate": 1.3993844988977907e-05,
+ "loss": 0.2596,
+ "step": 14245
+ },
+ {
+ "epoch": 38.817438692098094,
+ "grad_norm": 7.868805408477783,
+ "learning_rate": 1.3993035916888742e-05,
+ "loss": 0.313,
+ "step": 14246
+ },
+ {
+ "epoch": 38.82016348773842,
+ "grad_norm": 8.325532913208008,
+ "learning_rate": 1.3992226813701946e-05,
+ "loss": 0.2721,
+ "step": 14247
+ },
+ {
+ "epoch": 38.822888283378745,
+ "grad_norm": 6.1731276512146,
+ "learning_rate": 1.399141767942381e-05,
+ "loss": 0.2142,
+ "step": 14248
+ },
+ {
+ "epoch": 38.82561307901907,
+ "grad_norm": 5.461709022521973,
+ "learning_rate": 1.3990608514060646e-05,
+ "loss": 0.3013,
+ "step": 14249
+ },
+ {
+ "epoch": 38.828337874659404,
+ "grad_norm": 5.8272552490234375,
+ "learning_rate": 1.3989799317618751e-05,
+ "loss": 0.2695,
+ "step": 14250
+ },
+ {
+ "epoch": 38.83106267029973,
+ "grad_norm": 5.033504962921143,
+ "learning_rate": 1.3988990090104424e-05,
+ "loss": 0.2505,
+ "step": 14251
+ },
+ {
+ "epoch": 38.833787465940055,
+ "grad_norm": 6.392061233520508,
+ "learning_rate": 1.3988180831523972e-05,
+ "loss": 0.2032,
+ "step": 14252
+ },
+ {
+ "epoch": 38.83651226158038,
+ "grad_norm": 6.937142372131348,
+ "learning_rate": 1.3987371541883699e-05,
+ "loss": 0.2637,
+ "step": 14253
+ },
+ {
+ "epoch": 38.83923705722071,
+ "grad_norm": 5.689050197601318,
+ "learning_rate": 1.3986562221189902e-05,
+ "loss": 0.3088,
+ "step": 14254
+ },
+ {
+ "epoch": 38.84196185286103,
+ "grad_norm": 5.71989631652832,
+ "learning_rate": 1.3985752869448888e-05,
+ "loss": 0.3759,
+ "step": 14255
+ },
+ {
+ "epoch": 38.844686648501366,
+ "grad_norm": 6.083313941955566,
+ "learning_rate": 1.3984943486666957e-05,
+ "loss": 0.2458,
+ "step": 14256
+ },
+ {
+ "epoch": 38.84741144414169,
+ "grad_norm": 4.9870123863220215,
+ "learning_rate": 1.3984134072850417e-05,
+ "loss": 0.2922,
+ "step": 14257
+ },
+ {
+ "epoch": 38.85013623978202,
+ "grad_norm": 5.492220401763916,
+ "learning_rate": 1.3983324628005566e-05,
+ "loss": 0.2931,
+ "step": 14258
+ },
+ {
+ "epoch": 38.85286103542234,
+ "grad_norm": 5.595819473266602,
+ "learning_rate": 1.3982515152138713e-05,
+ "loss": 0.1908,
+ "step": 14259
+ },
+ {
+ "epoch": 38.85558583106267,
+ "grad_norm": 30.5610408782959,
+ "learning_rate": 1.3981705645256161e-05,
+ "loss": 0.3721,
+ "step": 14260
+ },
+ {
+ "epoch": 38.858310626702995,
+ "grad_norm": 6.095954895019531,
+ "learning_rate": 1.3980896107364212e-05,
+ "loss": 0.3642,
+ "step": 14261
+ },
+ {
+ "epoch": 38.86103542234333,
+ "grad_norm": 7.429832935333252,
+ "learning_rate": 1.398008653846917e-05,
+ "loss": 0.3167,
+ "step": 14262
+ },
+ {
+ "epoch": 38.86376021798365,
+ "grad_norm": 5.93065071105957,
+ "learning_rate": 1.3979276938577347e-05,
+ "loss": 0.2809,
+ "step": 14263
+ },
+ {
+ "epoch": 38.86648501362398,
+ "grad_norm": 9.602701187133789,
+ "learning_rate": 1.397846730769504e-05,
+ "loss": 0.3329,
+ "step": 14264
+ },
+ {
+ "epoch": 38.869209809264305,
+ "grad_norm": 6.699948787689209,
+ "learning_rate": 1.3977657645828559e-05,
+ "loss": 0.3971,
+ "step": 14265
+ },
+ {
+ "epoch": 38.87193460490463,
+ "grad_norm": 7.0116448402404785,
+ "learning_rate": 1.3976847952984209e-05,
+ "loss": 0.2015,
+ "step": 14266
+ },
+ {
+ "epoch": 38.87465940054496,
+ "grad_norm": 5.536526679992676,
+ "learning_rate": 1.3976038229168296e-05,
+ "loss": 0.2613,
+ "step": 14267
+ },
+ {
+ "epoch": 38.87738419618529,
+ "grad_norm": 7.464479446411133,
+ "learning_rate": 1.3975228474387122e-05,
+ "loss": 0.26,
+ "step": 14268
+ },
+ {
+ "epoch": 38.880108991825615,
+ "grad_norm": 7.937355995178223,
+ "learning_rate": 1.3974418688646997e-05,
+ "loss": 0.271,
+ "step": 14269
+ },
+ {
+ "epoch": 38.88283378746594,
+ "grad_norm": 7.095129489898682,
+ "learning_rate": 1.397360887195423e-05,
+ "loss": 0.2693,
+ "step": 14270
+ },
+ {
+ "epoch": 38.88555858310627,
+ "grad_norm": 6.2759928703308105,
+ "learning_rate": 1.3972799024315123e-05,
+ "loss": 0.391,
+ "step": 14271
+ },
+ {
+ "epoch": 38.88828337874659,
+ "grad_norm": 8.566492080688477,
+ "learning_rate": 1.3971989145735982e-05,
+ "loss": 0.3997,
+ "step": 14272
+ },
+ {
+ "epoch": 38.89100817438692,
+ "grad_norm": 7.450653076171875,
+ "learning_rate": 1.3971179236223122e-05,
+ "loss": 0.2993,
+ "step": 14273
+ },
+ {
+ "epoch": 38.89373297002725,
+ "grad_norm": 7.209585189819336,
+ "learning_rate": 1.3970369295782844e-05,
+ "loss": 0.2408,
+ "step": 14274
+ },
+ {
+ "epoch": 38.89645776566758,
+ "grad_norm": 7.133180141448975,
+ "learning_rate": 1.396955932442146e-05,
+ "loss": 0.311,
+ "step": 14275
+ },
+ {
+ "epoch": 38.8991825613079,
+ "grad_norm": 9.923151016235352,
+ "learning_rate": 1.3968749322145274e-05,
+ "loss": 0.4052,
+ "step": 14276
+ },
+ {
+ "epoch": 38.90190735694823,
+ "grad_norm": 6.90376615524292,
+ "learning_rate": 1.3967939288960595e-05,
+ "loss": 0.2784,
+ "step": 14277
+ },
+ {
+ "epoch": 38.904632152588555,
+ "grad_norm": 6.0615458488464355,
+ "learning_rate": 1.3967129224873734e-05,
+ "loss": 0.1817,
+ "step": 14278
+ },
+ {
+ "epoch": 38.90735694822888,
+ "grad_norm": 5.877019882202148,
+ "learning_rate": 1.3966319129890997e-05,
+ "loss": 0.205,
+ "step": 14279
+ },
+ {
+ "epoch": 38.91008174386921,
+ "grad_norm": 6.62255859375,
+ "learning_rate": 1.3965509004018695e-05,
+ "loss": 0.2224,
+ "step": 14280
+ },
+ {
+ "epoch": 38.91280653950954,
+ "grad_norm": 6.7541656494140625,
+ "learning_rate": 1.3964698847263138e-05,
+ "loss": 0.4018,
+ "step": 14281
+ },
+ {
+ "epoch": 38.915531335149865,
+ "grad_norm": 5.898073196411133,
+ "learning_rate": 1.3963888659630634e-05,
+ "loss": 0.4525,
+ "step": 14282
+ },
+ {
+ "epoch": 38.91825613079019,
+ "grad_norm": 6.852269172668457,
+ "learning_rate": 1.396307844112749e-05,
+ "loss": 0.287,
+ "step": 14283
+ },
+ {
+ "epoch": 38.920980926430516,
+ "grad_norm": 7.012596607208252,
+ "learning_rate": 1.3962268191760019e-05,
+ "loss": 0.3561,
+ "step": 14284
+ },
+ {
+ "epoch": 38.92370572207084,
+ "grad_norm": 7.041779041290283,
+ "learning_rate": 1.3961457911534532e-05,
+ "loss": 0.2817,
+ "step": 14285
+ },
+ {
+ "epoch": 38.926430517711175,
+ "grad_norm": 7.059216022491455,
+ "learning_rate": 1.3960647600457338e-05,
+ "loss": 0.252,
+ "step": 14286
+ },
+ {
+ "epoch": 38.9291553133515,
+ "grad_norm": 7.676758766174316,
+ "learning_rate": 1.3959837258534748e-05,
+ "loss": 0.3079,
+ "step": 14287
+ },
+ {
+ "epoch": 38.93188010899183,
+ "grad_norm": 6.447818279266357,
+ "learning_rate": 1.3959026885773072e-05,
+ "loss": 0.3198,
+ "step": 14288
+ },
+ {
+ "epoch": 38.93460490463215,
+ "grad_norm": 6.1130266189575195,
+ "learning_rate": 1.3958216482178623e-05,
+ "loss": 0.2326,
+ "step": 14289
+ },
+ {
+ "epoch": 38.93732970027248,
+ "grad_norm": 6.401403427124023,
+ "learning_rate": 1.3957406047757714e-05,
+ "loss": 0.3269,
+ "step": 14290
+ },
+ {
+ "epoch": 38.940054495912804,
+ "grad_norm": 7.1712541580200195,
+ "learning_rate": 1.395659558251665e-05,
+ "loss": 0.2905,
+ "step": 14291
+ },
+ {
+ "epoch": 38.94277929155314,
+ "grad_norm": 6.875960350036621,
+ "learning_rate": 1.3955785086461749e-05,
+ "loss": 0.3475,
+ "step": 14292
+ },
+ {
+ "epoch": 38.94550408719346,
+ "grad_norm": 6.088695526123047,
+ "learning_rate": 1.395497455959932e-05,
+ "loss": 0.3795,
+ "step": 14293
+ },
+ {
+ "epoch": 38.94822888283379,
+ "grad_norm": 10.818563461303711,
+ "learning_rate": 1.3954164001935674e-05,
+ "loss": 0.4487,
+ "step": 14294
+ },
+ {
+ "epoch": 38.950953678474114,
+ "grad_norm": 5.353722095489502,
+ "learning_rate": 1.3953353413477132e-05,
+ "loss": 0.3378,
+ "step": 14295
+ },
+ {
+ "epoch": 38.95367847411444,
+ "grad_norm": 8.669241905212402,
+ "learning_rate": 1.3952542794229998e-05,
+ "loss": 0.2861,
+ "step": 14296
+ },
+ {
+ "epoch": 38.956403269754766,
+ "grad_norm": 5.692200183868408,
+ "learning_rate": 1.3951732144200584e-05,
+ "loss": 0.2019,
+ "step": 14297
+ },
+ {
+ "epoch": 38.95912806539509,
+ "grad_norm": 10.162614822387695,
+ "learning_rate": 1.3950921463395213e-05,
+ "loss": 0.1877,
+ "step": 14298
+ },
+ {
+ "epoch": 38.961852861035425,
+ "grad_norm": 6.350072383880615,
+ "learning_rate": 1.3950110751820192e-05,
+ "loss": 0.2676,
+ "step": 14299
+ },
+ {
+ "epoch": 38.96457765667575,
+ "grad_norm": 5.5919013023376465,
+ "learning_rate": 1.3949300009481835e-05,
+ "loss": 0.2422,
+ "step": 14300
+ },
+ {
+ "epoch": 38.967302452316076,
+ "grad_norm": 7.189586162567139,
+ "learning_rate": 1.3948489236386454e-05,
+ "loss": 0.1902,
+ "step": 14301
+ },
+ {
+ "epoch": 38.9700272479564,
+ "grad_norm": 7.617172718048096,
+ "learning_rate": 1.3947678432540368e-05,
+ "loss": 0.2649,
+ "step": 14302
+ },
+ {
+ "epoch": 38.97275204359673,
+ "grad_norm": 5.228553771972656,
+ "learning_rate": 1.3946867597949887e-05,
+ "loss": 0.2438,
+ "step": 14303
+ },
+ {
+ "epoch": 38.97547683923706,
+ "grad_norm": 6.238590717315674,
+ "learning_rate": 1.3946056732621332e-05,
+ "loss": 0.265,
+ "step": 14304
+ },
+ {
+ "epoch": 38.97820163487739,
+ "grad_norm": 7.42759895324707,
+ "learning_rate": 1.3945245836561013e-05,
+ "loss": 0.6329,
+ "step": 14305
+ },
+ {
+ "epoch": 38.98092643051771,
+ "grad_norm": 10.85505199432373,
+ "learning_rate": 1.3944434909775247e-05,
+ "loss": 0.3737,
+ "step": 14306
+ },
+ {
+ "epoch": 38.98365122615804,
+ "grad_norm": 6.245872497558594,
+ "learning_rate": 1.3943623952270346e-05,
+ "loss": 0.2907,
+ "step": 14307
+ },
+ {
+ "epoch": 38.986376021798364,
+ "grad_norm": 8.080317497253418,
+ "learning_rate": 1.3942812964052632e-05,
+ "loss": 0.2971,
+ "step": 14308
+ },
+ {
+ "epoch": 38.98910081743869,
+ "grad_norm": 5.9236836433410645,
+ "learning_rate": 1.3942001945128416e-05,
+ "loss": 0.2373,
+ "step": 14309
+ },
+ {
+ "epoch": 38.991825613079016,
+ "grad_norm": 6.837869644165039,
+ "learning_rate": 1.3941190895504015e-05,
+ "loss": 0.31,
+ "step": 14310
+ },
+ {
+ "epoch": 38.99455040871935,
+ "grad_norm": 6.478810787200928,
+ "learning_rate": 1.3940379815185746e-05,
+ "loss": 0.3202,
+ "step": 14311
+ },
+ {
+ "epoch": 38.997275204359674,
+ "grad_norm": 7.109516143798828,
+ "learning_rate": 1.3939568704179926e-05,
+ "loss": 0.5093,
+ "step": 14312
+ },
+ {
+ "epoch": 39.0,
+ "grad_norm": 6.694377422332764,
+ "learning_rate": 1.3938757562492873e-05,
+ "loss": 0.1959,
+ "step": 14313
+ },
+ {
+ "epoch": 39.002724795640326,
+ "grad_norm": 5.328964710235596,
+ "learning_rate": 1.3937946390130904e-05,
+ "loss": 0.2201,
+ "step": 14314
+ },
+ {
+ "epoch": 39.00544959128065,
+ "grad_norm": 5.843469142913818,
+ "learning_rate": 1.3937135187100332e-05,
+ "loss": 0.2167,
+ "step": 14315
+ },
+ {
+ "epoch": 39.00817438692098,
+ "grad_norm": 5.099860668182373,
+ "learning_rate": 1.393632395340748e-05,
+ "loss": 0.3085,
+ "step": 14316
+ },
+ {
+ "epoch": 39.01089918256131,
+ "grad_norm": 6.607177257537842,
+ "learning_rate": 1.3935512689058663e-05,
+ "loss": 0.2555,
+ "step": 14317
+ },
+ {
+ "epoch": 39.013623978201636,
+ "grad_norm": 6.643643856048584,
+ "learning_rate": 1.3934701394060202e-05,
+ "loss": 0.2245,
+ "step": 14318
+ },
+ {
+ "epoch": 39.01634877384196,
+ "grad_norm": 5.466268062591553,
+ "learning_rate": 1.393389006841841e-05,
+ "loss": 0.4362,
+ "step": 14319
+ },
+ {
+ "epoch": 39.01907356948229,
+ "grad_norm": 4.7354021072387695,
+ "learning_rate": 1.3933078712139607e-05,
+ "loss": 0.1747,
+ "step": 14320
+ },
+ {
+ "epoch": 39.02179836512261,
+ "grad_norm": 6.899024963378906,
+ "learning_rate": 1.3932267325230118e-05,
+ "loss": 0.2903,
+ "step": 14321
+ },
+ {
+ "epoch": 39.02452316076294,
+ "grad_norm": 6.467222690582275,
+ "learning_rate": 1.3931455907696257e-05,
+ "loss": 0.211,
+ "step": 14322
+ },
+ {
+ "epoch": 39.02724795640327,
+ "grad_norm": 6.949442386627197,
+ "learning_rate": 1.3930644459544343e-05,
+ "loss": 0.3762,
+ "step": 14323
+ },
+ {
+ "epoch": 39.0299727520436,
+ "grad_norm": 7.553343772888184,
+ "learning_rate": 1.3929832980780696e-05,
+ "loss": 0.2569,
+ "step": 14324
+ },
+ {
+ "epoch": 39.032697547683924,
+ "grad_norm": 5.200009822845459,
+ "learning_rate": 1.3929021471411637e-05,
+ "loss": 0.1993,
+ "step": 14325
+ },
+ {
+ "epoch": 39.03542234332425,
+ "grad_norm": 28.745405197143555,
+ "learning_rate": 1.3928209931443487e-05,
+ "loss": 0.2299,
+ "step": 14326
+ },
+ {
+ "epoch": 39.038147138964575,
+ "grad_norm": 8.111405372619629,
+ "learning_rate": 1.392739836088256e-05,
+ "loss": 0.3381,
+ "step": 14327
+ },
+ {
+ "epoch": 39.0408719346049,
+ "grad_norm": 7.686152935028076,
+ "learning_rate": 1.3926586759735185e-05,
+ "loss": 0.2045,
+ "step": 14328
+ },
+ {
+ "epoch": 39.043596730245234,
+ "grad_norm": 5.327547073364258,
+ "learning_rate": 1.3925775128007674e-05,
+ "loss": 0.3247,
+ "step": 14329
+ },
+ {
+ "epoch": 39.04632152588556,
+ "grad_norm": 5.757328033447266,
+ "learning_rate": 1.3924963465706358e-05,
+ "loss": 0.3708,
+ "step": 14330
+ },
+ {
+ "epoch": 39.049046321525886,
+ "grad_norm": 5.843682289123535,
+ "learning_rate": 1.3924151772837549e-05,
+ "loss": 0.2439,
+ "step": 14331
+ },
+ {
+ "epoch": 39.05177111716621,
+ "grad_norm": 9.030362129211426,
+ "learning_rate": 1.3923340049407576e-05,
+ "loss": 0.4127,
+ "step": 14332
+ },
+ {
+ "epoch": 39.05449591280654,
+ "grad_norm": 7.151304721832275,
+ "learning_rate": 1.3922528295422755e-05,
+ "loss": 0.3836,
+ "step": 14333
+ },
+ {
+ "epoch": 39.05722070844686,
+ "grad_norm": 6.7778096199035645,
+ "learning_rate": 1.392171651088941e-05,
+ "loss": 0.2563,
+ "step": 14334
+ },
+ {
+ "epoch": 39.059945504087196,
+ "grad_norm": 8.462702751159668,
+ "learning_rate": 1.3920904695813861e-05,
+ "loss": 0.2613,
+ "step": 14335
+ },
+ {
+ "epoch": 39.06267029972752,
+ "grad_norm": 6.116037845611572,
+ "learning_rate": 1.3920092850202435e-05,
+ "loss": 0.2851,
+ "step": 14336
+ },
+ {
+ "epoch": 39.06539509536785,
+ "grad_norm": 5.209856033325195,
+ "learning_rate": 1.391928097406145e-05,
+ "loss": 0.277,
+ "step": 14337
+ },
+ {
+ "epoch": 39.06811989100817,
+ "grad_norm": 7.555953502655029,
+ "learning_rate": 1.3918469067397233e-05,
+ "loss": 0.2476,
+ "step": 14338
+ },
+ {
+ "epoch": 39.0708446866485,
+ "grad_norm": 8.173412322998047,
+ "learning_rate": 1.3917657130216103e-05,
+ "loss": 0.3123,
+ "step": 14339
+ },
+ {
+ "epoch": 39.073569482288825,
+ "grad_norm": 6.560594081878662,
+ "learning_rate": 1.3916845162524388e-05,
+ "loss": 0.2472,
+ "step": 14340
+ },
+ {
+ "epoch": 39.07629427792916,
+ "grad_norm": 4.919372081756592,
+ "learning_rate": 1.3916033164328406e-05,
+ "loss": 0.1607,
+ "step": 14341
+ },
+ {
+ "epoch": 39.079019073569484,
+ "grad_norm": 7.3588151931762695,
+ "learning_rate": 1.3915221135634487e-05,
+ "loss": 0.2097,
+ "step": 14342
+ },
+ {
+ "epoch": 39.08174386920981,
+ "grad_norm": 6.464593887329102,
+ "learning_rate": 1.391440907644895e-05,
+ "loss": 0.3798,
+ "step": 14343
+ },
+ {
+ "epoch": 39.084468664850135,
+ "grad_norm": 7.673997402191162,
+ "learning_rate": 1.3913596986778123e-05,
+ "loss": 0.2715,
+ "step": 14344
+ },
+ {
+ "epoch": 39.08719346049046,
+ "grad_norm": 7.415081024169922,
+ "learning_rate": 1.3912784866628326e-05,
+ "loss": 0.3838,
+ "step": 14345
+ },
+ {
+ "epoch": 39.08991825613079,
+ "grad_norm": 4.880640506744385,
+ "learning_rate": 1.3911972716005887e-05,
+ "loss": 0.1909,
+ "step": 14346
+ },
+ {
+ "epoch": 39.09264305177112,
+ "grad_norm": 5.719912052154541,
+ "learning_rate": 1.391116053491713e-05,
+ "loss": 0.2416,
+ "step": 14347
+ },
+ {
+ "epoch": 39.095367847411445,
+ "grad_norm": 5.737791061401367,
+ "learning_rate": 1.3910348323368381e-05,
+ "loss": 0.1778,
+ "step": 14348
+ },
+ {
+ "epoch": 39.09809264305177,
+ "grad_norm": 7.773014545440674,
+ "learning_rate": 1.3909536081365964e-05,
+ "loss": 0.2668,
+ "step": 14349
+ },
+ {
+ "epoch": 39.1008174386921,
+ "grad_norm": 5.769792556762695,
+ "learning_rate": 1.390872380891621e-05,
+ "loss": 0.2946,
+ "step": 14350
+ },
+ {
+ "epoch": 39.10354223433242,
+ "grad_norm": 6.600955963134766,
+ "learning_rate": 1.3907911506025436e-05,
+ "loss": 0.2388,
+ "step": 14351
+ },
+ {
+ "epoch": 39.10626702997275,
+ "grad_norm": 6.24024772644043,
+ "learning_rate": 1.3907099172699976e-05,
+ "loss": 0.2556,
+ "step": 14352
+ },
+ {
+ "epoch": 39.10899182561308,
+ "grad_norm": 7.633904457092285,
+ "learning_rate": 1.390628680894615e-05,
+ "loss": 0.2729,
+ "step": 14353
+ },
+ {
+ "epoch": 39.11171662125341,
+ "grad_norm": 6.381833553314209,
+ "learning_rate": 1.390547441477029e-05,
+ "loss": 0.2037,
+ "step": 14354
+ },
+ {
+ "epoch": 39.11444141689373,
+ "grad_norm": 5.045418739318848,
+ "learning_rate": 1.3904661990178723e-05,
+ "loss": 0.187,
+ "step": 14355
+ },
+ {
+ "epoch": 39.11716621253406,
+ "grad_norm": 5.261258125305176,
+ "learning_rate": 1.390384953517777e-05,
+ "loss": 0.1665,
+ "step": 14356
+ },
+ {
+ "epoch": 39.119891008174385,
+ "grad_norm": 5.163601875305176,
+ "learning_rate": 1.3903037049773769e-05,
+ "loss": 0.3376,
+ "step": 14357
+ },
+ {
+ "epoch": 39.12261580381471,
+ "grad_norm": 6.772798538208008,
+ "learning_rate": 1.3902224533973034e-05,
+ "loss": 0.4315,
+ "step": 14358
+ },
+ {
+ "epoch": 39.12534059945504,
+ "grad_norm": 8.250518798828125,
+ "learning_rate": 1.3901411987781904e-05,
+ "loss": 0.437,
+ "step": 14359
+ },
+ {
+ "epoch": 39.12806539509537,
+ "grad_norm": 5.6278276443481445,
+ "learning_rate": 1.3900599411206704e-05,
+ "loss": 0.2517,
+ "step": 14360
+ },
+ {
+ "epoch": 39.130790190735695,
+ "grad_norm": 6.756508827209473,
+ "learning_rate": 1.3899786804253757e-05,
+ "loss": 0.321,
+ "step": 14361
+ },
+ {
+ "epoch": 39.13351498637602,
+ "grad_norm": 5.385969638824463,
+ "learning_rate": 1.3898974166929398e-05,
+ "loss": 0.3564,
+ "step": 14362
+ },
+ {
+ "epoch": 39.13623978201635,
+ "grad_norm": 5.501603126525879,
+ "learning_rate": 1.3898161499239952e-05,
+ "loss": 0.2124,
+ "step": 14363
+ },
+ {
+ "epoch": 39.13896457765667,
+ "grad_norm": 7.773250579833984,
+ "learning_rate": 1.3897348801191752e-05,
+ "loss": 0.3246,
+ "step": 14364
+ },
+ {
+ "epoch": 39.141689373297005,
+ "grad_norm": 5.84032678604126,
+ "learning_rate": 1.3896536072791125e-05,
+ "loss": 0.2693,
+ "step": 14365
+ },
+ {
+ "epoch": 39.14441416893733,
+ "grad_norm": 6.377506256103516,
+ "learning_rate": 1.38957233140444e-05,
+ "loss": 0.2886,
+ "step": 14366
+ },
+ {
+ "epoch": 39.14713896457766,
+ "grad_norm": 5.796489715576172,
+ "learning_rate": 1.3894910524957907e-05,
+ "loss": 0.2948,
+ "step": 14367
+ },
+ {
+ "epoch": 39.14986376021798,
+ "grad_norm": 11.502608299255371,
+ "learning_rate": 1.3894097705537977e-05,
+ "loss": 0.2247,
+ "step": 14368
+ },
+ {
+ "epoch": 39.15258855585831,
+ "grad_norm": 7.887616157531738,
+ "learning_rate": 1.389328485579094e-05,
+ "loss": 0.4033,
+ "step": 14369
+ },
+ {
+ "epoch": 39.155313351498634,
+ "grad_norm": 5.441971778869629,
+ "learning_rate": 1.3892471975723122e-05,
+ "loss": 0.2924,
+ "step": 14370
+ },
+ {
+ "epoch": 39.15803814713897,
+ "grad_norm": 6.963483810424805,
+ "learning_rate": 1.3891659065340861e-05,
+ "loss": 0.2221,
+ "step": 14371
+ },
+ {
+ "epoch": 39.16076294277929,
+ "grad_norm": 5.960539817810059,
+ "learning_rate": 1.3890846124650482e-05,
+ "loss": 0.2971,
+ "step": 14372
+ },
+ {
+ "epoch": 39.16348773841962,
+ "grad_norm": 5.39940881729126,
+ "learning_rate": 1.3890033153658322e-05,
+ "loss": 0.2168,
+ "step": 14373
+ },
+ {
+ "epoch": 39.166212534059945,
+ "grad_norm": 5.560946941375732,
+ "learning_rate": 1.3889220152370706e-05,
+ "loss": 0.2249,
+ "step": 14374
+ },
+ {
+ "epoch": 39.16893732970027,
+ "grad_norm": 5.56072473526001,
+ "learning_rate": 1.3888407120793973e-05,
+ "loss": 0.2118,
+ "step": 14375
+ },
+ {
+ "epoch": 39.171662125340596,
+ "grad_norm": 6.4710259437561035,
+ "learning_rate": 1.3887594058934444e-05,
+ "loss": 0.3568,
+ "step": 14376
+ },
+ {
+ "epoch": 39.17438692098093,
+ "grad_norm": 7.413678169250488,
+ "learning_rate": 1.3886780966798464e-05,
+ "loss": 0.2221,
+ "step": 14377
+ },
+ {
+ "epoch": 39.177111716621255,
+ "grad_norm": 5.558591842651367,
+ "learning_rate": 1.3885967844392354e-05,
+ "loss": 0.2545,
+ "step": 14378
+ },
+ {
+ "epoch": 39.17983651226158,
+ "grad_norm": 5.393101215362549,
+ "learning_rate": 1.3885154691722453e-05,
+ "loss": 0.2334,
+ "step": 14379
+ },
+ {
+ "epoch": 39.182561307901906,
+ "grad_norm": 6.346226215362549,
+ "learning_rate": 1.3884341508795092e-05,
+ "loss": 0.2947,
+ "step": 14380
+ },
+ {
+ "epoch": 39.18528610354223,
+ "grad_norm": 6.576112270355225,
+ "learning_rate": 1.3883528295616606e-05,
+ "loss": 0.2093,
+ "step": 14381
+ },
+ {
+ "epoch": 39.18801089918256,
+ "grad_norm": 6.0815958976745605,
+ "learning_rate": 1.3882715052193323e-05,
+ "loss": 0.273,
+ "step": 14382
+ },
+ {
+ "epoch": 39.19073569482289,
+ "grad_norm": 5.966588973999023,
+ "learning_rate": 1.3881901778531583e-05,
+ "loss": 0.5629,
+ "step": 14383
+ },
+ {
+ "epoch": 39.19346049046322,
+ "grad_norm": 8.157422065734863,
+ "learning_rate": 1.3881088474637716e-05,
+ "loss": 0.2407,
+ "step": 14384
+ },
+ {
+ "epoch": 39.19618528610354,
+ "grad_norm": 6.78936767578125,
+ "learning_rate": 1.388027514051806e-05,
+ "loss": 0.2205,
+ "step": 14385
+ },
+ {
+ "epoch": 39.19891008174387,
+ "grad_norm": 6.487745761871338,
+ "learning_rate": 1.3879461776178943e-05,
+ "loss": 0.3394,
+ "step": 14386
+ },
+ {
+ "epoch": 39.201634877384194,
+ "grad_norm": 7.317575931549072,
+ "learning_rate": 1.3878648381626704e-05,
+ "loss": 0.2415,
+ "step": 14387
+ },
+ {
+ "epoch": 39.20435967302452,
+ "grad_norm": 5.161836624145508,
+ "learning_rate": 1.3877834956867675e-05,
+ "loss": 0.2265,
+ "step": 14388
+ },
+ {
+ "epoch": 39.20708446866485,
+ "grad_norm": 5.480639457702637,
+ "learning_rate": 1.387702150190819e-05,
+ "loss": 0.2178,
+ "step": 14389
+ },
+ {
+ "epoch": 39.20980926430518,
+ "grad_norm": 8.126582145690918,
+ "learning_rate": 1.3876208016754589e-05,
+ "loss": 0.209,
+ "step": 14390
+ },
+ {
+ "epoch": 39.212534059945504,
+ "grad_norm": 7.839139461517334,
+ "learning_rate": 1.3875394501413206e-05,
+ "loss": 0.3221,
+ "step": 14391
+ },
+ {
+ "epoch": 39.21525885558583,
+ "grad_norm": 8.001127243041992,
+ "learning_rate": 1.3874580955890374e-05,
+ "loss": 0.2136,
+ "step": 14392
+ },
+ {
+ "epoch": 39.217983651226156,
+ "grad_norm": 10.482834815979004,
+ "learning_rate": 1.3873767380192431e-05,
+ "loss": 0.1745,
+ "step": 14393
+ },
+ {
+ "epoch": 39.22070844686648,
+ "grad_norm": 5.722413063049316,
+ "learning_rate": 1.387295377432571e-05,
+ "loss": 0.2396,
+ "step": 14394
+ },
+ {
+ "epoch": 39.223433242506815,
+ "grad_norm": 5.641980171203613,
+ "learning_rate": 1.3872140138296553e-05,
+ "loss": 0.2631,
+ "step": 14395
+ },
+ {
+ "epoch": 39.22615803814714,
+ "grad_norm": 4.87531852722168,
+ "learning_rate": 1.387132647211129e-05,
+ "loss": 0.2508,
+ "step": 14396
+ },
+ {
+ "epoch": 39.228882833787466,
+ "grad_norm": 6.67892599105835,
+ "learning_rate": 1.3870512775776262e-05,
+ "loss": 0.2729,
+ "step": 14397
+ },
+ {
+ "epoch": 39.23160762942779,
+ "grad_norm": 6.84233283996582,
+ "learning_rate": 1.3869699049297805e-05,
+ "loss": 0.189,
+ "step": 14398
+ },
+ {
+ "epoch": 39.23433242506812,
+ "grad_norm": 5.77467679977417,
+ "learning_rate": 1.3868885292682258e-05,
+ "loss": 0.2601,
+ "step": 14399
+ },
+ {
+ "epoch": 39.237057220708444,
+ "grad_norm": 4.727165222167969,
+ "learning_rate": 1.3868071505935953e-05,
+ "loss": 0.3941,
+ "step": 14400
+ },
+ {
+ "epoch": 39.23978201634878,
+ "grad_norm": 5.63623046875,
+ "learning_rate": 1.3867257689065237e-05,
+ "loss": 0.2054,
+ "step": 14401
+ },
+ {
+ "epoch": 39.2425068119891,
+ "grad_norm": 6.149964809417725,
+ "learning_rate": 1.3866443842076438e-05,
+ "loss": 0.2709,
+ "step": 14402
+ },
+ {
+ "epoch": 39.24523160762943,
+ "grad_norm": 7.443466663360596,
+ "learning_rate": 1.3865629964975901e-05,
+ "loss": 0.1891,
+ "step": 14403
+ },
+ {
+ "epoch": 39.247956403269754,
+ "grad_norm": 6.356564044952393,
+ "learning_rate": 1.3864816057769961e-05,
+ "loss": 0.2976,
+ "step": 14404
+ },
+ {
+ "epoch": 39.25068119891008,
+ "grad_norm": 6.187931060791016,
+ "learning_rate": 1.3864002120464962e-05,
+ "loss": 0.1702,
+ "step": 14405
+ },
+ {
+ "epoch": 39.253405994550405,
+ "grad_norm": 5.51117467880249,
+ "learning_rate": 1.3863188153067233e-05,
+ "loss": 0.3435,
+ "step": 14406
+ },
+ {
+ "epoch": 39.25613079019074,
+ "grad_norm": 5.29209041595459,
+ "learning_rate": 1.3862374155583122e-05,
+ "loss": 0.2872,
+ "step": 14407
+ },
+ {
+ "epoch": 39.258855585831064,
+ "grad_norm": 5.761871337890625,
+ "learning_rate": 1.3861560128018962e-05,
+ "loss": 0.2604,
+ "step": 14408
+ },
+ {
+ "epoch": 39.26158038147139,
+ "grad_norm": 6.281421184539795,
+ "learning_rate": 1.3860746070381101e-05,
+ "loss": 0.2898,
+ "step": 14409
+ },
+ {
+ "epoch": 39.264305177111716,
+ "grad_norm": 5.377538681030273,
+ "learning_rate": 1.3859931982675872e-05,
+ "loss": 0.2023,
+ "step": 14410
+ },
+ {
+ "epoch": 39.26702997275204,
+ "grad_norm": 5.567324161529541,
+ "learning_rate": 1.3859117864909619e-05,
+ "loss": 0.1759,
+ "step": 14411
+ },
+ {
+ "epoch": 39.26975476839237,
+ "grad_norm": 6.55522346496582,
+ "learning_rate": 1.3858303717088676e-05,
+ "loss": 0.2079,
+ "step": 14412
+ },
+ {
+ "epoch": 39.2724795640327,
+ "grad_norm": 5.562514781951904,
+ "learning_rate": 1.3857489539219393e-05,
+ "loss": 0.2517,
+ "step": 14413
+ },
+ {
+ "epoch": 39.275204359673026,
+ "grad_norm": 5.650949954986572,
+ "learning_rate": 1.38566753313081e-05,
+ "loss": 0.2165,
+ "step": 14414
+ },
+ {
+ "epoch": 39.27792915531335,
+ "grad_norm": 6.258750915527344,
+ "learning_rate": 1.3855861093361144e-05,
+ "loss": 0.3011,
+ "step": 14415
+ },
+ {
+ "epoch": 39.28065395095368,
+ "grad_norm": 6.140244960784912,
+ "learning_rate": 1.3855046825384868e-05,
+ "loss": 0.3481,
+ "step": 14416
+ },
+ {
+ "epoch": 39.283378746594,
+ "grad_norm": 10.04259967803955,
+ "learning_rate": 1.3854232527385614e-05,
+ "loss": 0.2651,
+ "step": 14417
+ },
+ {
+ "epoch": 39.28610354223433,
+ "grad_norm": 6.4561896324157715,
+ "learning_rate": 1.3853418199369717e-05,
+ "loss": 0.2029,
+ "step": 14418
+ },
+ {
+ "epoch": 39.28882833787466,
+ "grad_norm": 5.495051860809326,
+ "learning_rate": 1.3852603841343525e-05,
+ "loss": 0.1995,
+ "step": 14419
+ },
+ {
+ "epoch": 39.29155313351499,
+ "grad_norm": 5.664775848388672,
+ "learning_rate": 1.385178945331338e-05,
+ "loss": 0.2686,
+ "step": 14420
+ },
+ {
+ "epoch": 39.294277929155314,
+ "grad_norm": 7.046104431152344,
+ "learning_rate": 1.385097503528562e-05,
+ "loss": 0.2892,
+ "step": 14421
+ },
+ {
+ "epoch": 39.29700272479564,
+ "grad_norm": 5.487584114074707,
+ "learning_rate": 1.385016058726659e-05,
+ "loss": 0.2466,
+ "step": 14422
+ },
+ {
+ "epoch": 39.299727520435965,
+ "grad_norm": 6.687308311462402,
+ "learning_rate": 1.3849346109262634e-05,
+ "loss": 0.2345,
+ "step": 14423
+ },
+ {
+ "epoch": 39.30245231607629,
+ "grad_norm": 5.87015438079834,
+ "learning_rate": 1.3848531601280095e-05,
+ "loss": 0.2002,
+ "step": 14424
+ },
+ {
+ "epoch": 39.305177111716624,
+ "grad_norm": 7.049134731292725,
+ "learning_rate": 1.3847717063325316e-05,
+ "loss": 0.1947,
+ "step": 14425
+ },
+ {
+ "epoch": 39.30790190735695,
+ "grad_norm": 5.7420654296875,
+ "learning_rate": 1.384690249540464e-05,
+ "loss": 0.2124,
+ "step": 14426
+ },
+ {
+ "epoch": 39.310626702997276,
+ "grad_norm": 6.156968116760254,
+ "learning_rate": 1.3846087897524412e-05,
+ "loss": 0.1808,
+ "step": 14427
+ },
+ {
+ "epoch": 39.3133514986376,
+ "grad_norm": 6.691866397857666,
+ "learning_rate": 1.3845273269690973e-05,
+ "loss": 0.2945,
+ "step": 14428
+ },
+ {
+ "epoch": 39.31607629427793,
+ "grad_norm": 5.193544864654541,
+ "learning_rate": 1.3844458611910671e-05,
+ "loss": 0.2237,
+ "step": 14429
+ },
+ {
+ "epoch": 39.31880108991825,
+ "grad_norm": 6.388106346130371,
+ "learning_rate": 1.384364392418985e-05,
+ "loss": 0.2084,
+ "step": 14430
+ },
+ {
+ "epoch": 39.321525885558586,
+ "grad_norm": 6.0377583503723145,
+ "learning_rate": 1.3842829206534854e-05,
+ "loss": 0.4066,
+ "step": 14431
+ },
+ {
+ "epoch": 39.32425068119891,
+ "grad_norm": 5.002970218658447,
+ "learning_rate": 1.3842014458952025e-05,
+ "loss": 0.1642,
+ "step": 14432
+ },
+ {
+ "epoch": 39.32697547683924,
+ "grad_norm": 6.982475757598877,
+ "learning_rate": 1.3841199681447713e-05,
+ "loss": 0.1986,
+ "step": 14433
+ },
+ {
+ "epoch": 39.32970027247956,
+ "grad_norm": 5.248578071594238,
+ "learning_rate": 1.3840384874028262e-05,
+ "loss": 0.2947,
+ "step": 14434
+ },
+ {
+ "epoch": 39.33242506811989,
+ "grad_norm": 6.221617221832275,
+ "learning_rate": 1.3839570036700015e-05,
+ "loss": 0.3211,
+ "step": 14435
+ },
+ {
+ "epoch": 39.335149863760215,
+ "grad_norm": 6.641686916351318,
+ "learning_rate": 1.383875516946932e-05,
+ "loss": 0.2894,
+ "step": 14436
+ },
+ {
+ "epoch": 39.33787465940055,
+ "grad_norm": 6.050511360168457,
+ "learning_rate": 1.3837940272342525e-05,
+ "loss": 0.3503,
+ "step": 14437
+ },
+ {
+ "epoch": 39.34059945504087,
+ "grad_norm": 6.534960746765137,
+ "learning_rate": 1.3837125345325975e-05,
+ "loss": 0.2766,
+ "step": 14438
+ },
+ {
+ "epoch": 39.3433242506812,
+ "grad_norm": 5.614215850830078,
+ "learning_rate": 1.3836310388426015e-05,
+ "loss": 0.3974,
+ "step": 14439
+ },
+ {
+ "epoch": 39.346049046321525,
+ "grad_norm": 6.731872081756592,
+ "learning_rate": 1.3835495401648995e-05,
+ "loss": 0.3325,
+ "step": 14440
+ },
+ {
+ "epoch": 39.34877384196185,
+ "grad_norm": 8.455556869506836,
+ "learning_rate": 1.3834680385001257e-05,
+ "loss": 0.2448,
+ "step": 14441
+ },
+ {
+ "epoch": 39.35149863760218,
+ "grad_norm": 8.348003387451172,
+ "learning_rate": 1.3833865338489156e-05,
+ "loss": 0.3221,
+ "step": 14442
+ },
+ {
+ "epoch": 39.35422343324251,
+ "grad_norm": 5.993939399719238,
+ "learning_rate": 1.383305026211903e-05,
+ "loss": 0.1674,
+ "step": 14443
+ },
+ {
+ "epoch": 39.356948228882835,
+ "grad_norm": 5.404088973999023,
+ "learning_rate": 1.3832235155897237e-05,
+ "loss": 0.3732,
+ "step": 14444
+ },
+ {
+ "epoch": 39.35967302452316,
+ "grad_norm": 4.829730987548828,
+ "learning_rate": 1.3831420019830118e-05,
+ "loss": 0.2053,
+ "step": 14445
+ },
+ {
+ "epoch": 39.36239782016349,
+ "grad_norm": 6.515233516693115,
+ "learning_rate": 1.3830604853924021e-05,
+ "loss": 0.2587,
+ "step": 14446
+ },
+ {
+ "epoch": 39.36512261580381,
+ "grad_norm": 6.463160991668701,
+ "learning_rate": 1.3829789658185299e-05,
+ "loss": 0.3481,
+ "step": 14447
+ },
+ {
+ "epoch": 39.36784741144414,
+ "grad_norm": 6.9467997550964355,
+ "learning_rate": 1.3828974432620297e-05,
+ "loss": 0.3206,
+ "step": 14448
+ },
+ {
+ "epoch": 39.37057220708447,
+ "grad_norm": 6.457395553588867,
+ "learning_rate": 1.3828159177235368e-05,
+ "loss": 0.2884,
+ "step": 14449
+ },
+ {
+ "epoch": 39.3732970027248,
+ "grad_norm": 7.020283222198486,
+ "learning_rate": 1.3827343892036855e-05,
+ "loss": 0.2181,
+ "step": 14450
+ },
+ {
+ "epoch": 39.37602179836512,
+ "grad_norm": 6.745564937591553,
+ "learning_rate": 1.3826528577031113e-05,
+ "loss": 0.2353,
+ "step": 14451
+ },
+ {
+ "epoch": 39.37874659400545,
+ "grad_norm": 8.310040473937988,
+ "learning_rate": 1.3825713232224492e-05,
+ "loss": 0.2115,
+ "step": 14452
+ },
+ {
+ "epoch": 39.381471389645775,
+ "grad_norm": 5.74802827835083,
+ "learning_rate": 1.3824897857623336e-05,
+ "loss": 0.2852,
+ "step": 14453
+ },
+ {
+ "epoch": 39.3841961852861,
+ "grad_norm": 6.839849948883057,
+ "learning_rate": 1.3824082453234e-05,
+ "loss": 0.2355,
+ "step": 14454
+ },
+ {
+ "epoch": 39.38692098092643,
+ "grad_norm": 6.283200263977051,
+ "learning_rate": 1.3823267019062832e-05,
+ "loss": 0.2132,
+ "step": 14455
+ },
+ {
+ "epoch": 39.38964577656676,
+ "grad_norm": 5.922610759735107,
+ "learning_rate": 1.3822451555116186e-05,
+ "loss": 0.2582,
+ "step": 14456
+ },
+ {
+ "epoch": 39.392370572207085,
+ "grad_norm": 5.901951313018799,
+ "learning_rate": 1.3821636061400407e-05,
+ "loss": 0.3616,
+ "step": 14457
+ },
+ {
+ "epoch": 39.39509536784741,
+ "grad_norm": 5.894443988800049,
+ "learning_rate": 1.3820820537921849e-05,
+ "loss": 0.3356,
+ "step": 14458
+ },
+ {
+ "epoch": 39.39782016348774,
+ "grad_norm": 4.748549461364746,
+ "learning_rate": 1.3820004984686866e-05,
+ "loss": 0.2984,
+ "step": 14459
+ },
+ {
+ "epoch": 39.40054495912806,
+ "grad_norm": 7.824007987976074,
+ "learning_rate": 1.3819189401701807e-05,
+ "loss": 0.3224,
+ "step": 14460
+ },
+ {
+ "epoch": 39.403269754768395,
+ "grad_norm": 5.506160736083984,
+ "learning_rate": 1.381837378897302e-05,
+ "loss": 0.3262,
+ "step": 14461
+ },
+ {
+ "epoch": 39.40599455040872,
+ "grad_norm": 6.4132304191589355,
+ "learning_rate": 1.3817558146506867e-05,
+ "loss": 0.4223,
+ "step": 14462
+ },
+ {
+ "epoch": 39.40871934604905,
+ "grad_norm": 6.343233108520508,
+ "learning_rate": 1.381674247430969e-05,
+ "loss": 0.216,
+ "step": 14463
+ },
+ {
+ "epoch": 39.41144414168937,
+ "grad_norm": 7.911228656768799,
+ "learning_rate": 1.3815926772387847e-05,
+ "loss": 0.1699,
+ "step": 14464
+ },
+ {
+ "epoch": 39.4141689373297,
+ "grad_norm": 6.358527660369873,
+ "learning_rate": 1.3815111040747688e-05,
+ "loss": 0.1799,
+ "step": 14465
+ },
+ {
+ "epoch": 39.416893732970024,
+ "grad_norm": 7.4972357749938965,
+ "learning_rate": 1.3814295279395566e-05,
+ "loss": 0.2331,
+ "step": 14466
+ },
+ {
+ "epoch": 39.41961852861036,
+ "grad_norm": 10.910237312316895,
+ "learning_rate": 1.3813479488337838e-05,
+ "loss": 0.265,
+ "step": 14467
+ },
+ {
+ "epoch": 39.42234332425068,
+ "grad_norm": 7.198177337646484,
+ "learning_rate": 1.3812663667580855e-05,
+ "loss": 0.3017,
+ "step": 14468
+ },
+ {
+ "epoch": 39.42506811989101,
+ "grad_norm": 5.954398155212402,
+ "learning_rate": 1.3811847817130965e-05,
+ "loss": 0.3837,
+ "step": 14469
+ },
+ {
+ "epoch": 39.427792915531334,
+ "grad_norm": 6.609823226928711,
+ "learning_rate": 1.3811031936994533e-05,
+ "loss": 0.3177,
+ "step": 14470
+ },
+ {
+ "epoch": 39.43051771117166,
+ "grad_norm": 6.191345691680908,
+ "learning_rate": 1.3810216027177903e-05,
+ "loss": 0.2287,
+ "step": 14471
+ },
+ {
+ "epoch": 39.433242506811986,
+ "grad_norm": 5.148782730102539,
+ "learning_rate": 1.3809400087687434e-05,
+ "loss": 0.4851,
+ "step": 14472
+ },
+ {
+ "epoch": 39.43596730245232,
+ "grad_norm": 6.095325469970703,
+ "learning_rate": 1.380858411852948e-05,
+ "loss": 0.2578,
+ "step": 14473
+ },
+ {
+ "epoch": 39.438692098092645,
+ "grad_norm": 4.201200008392334,
+ "learning_rate": 1.3807768119710397e-05,
+ "loss": 0.1481,
+ "step": 14474
+ },
+ {
+ "epoch": 39.44141689373297,
+ "grad_norm": 6.30897331237793,
+ "learning_rate": 1.3806952091236533e-05,
+ "loss": 0.4306,
+ "step": 14475
+ },
+ {
+ "epoch": 39.444141689373296,
+ "grad_norm": 5.3930511474609375,
+ "learning_rate": 1.3806136033114255e-05,
+ "loss": 0.3352,
+ "step": 14476
+ },
+ {
+ "epoch": 39.44686648501362,
+ "grad_norm": 6.518143177032471,
+ "learning_rate": 1.3805319945349908e-05,
+ "loss": 0.3578,
+ "step": 14477
+ },
+ {
+ "epoch": 39.44959128065395,
+ "grad_norm": 5.120165824890137,
+ "learning_rate": 1.3804503827949855e-05,
+ "loss": 0.2277,
+ "step": 14478
+ },
+ {
+ "epoch": 39.45231607629428,
+ "grad_norm": 5.436894416809082,
+ "learning_rate": 1.3803687680920446e-05,
+ "loss": 0.2536,
+ "step": 14479
+ },
+ {
+ "epoch": 39.45504087193461,
+ "grad_norm": 6.164616584777832,
+ "learning_rate": 1.3802871504268043e-05,
+ "loss": 0.1834,
+ "step": 14480
+ },
+ {
+ "epoch": 39.45776566757493,
+ "grad_norm": 7.045543670654297,
+ "learning_rate": 1.3802055297998996e-05,
+ "loss": 0.3184,
+ "step": 14481
+ },
+ {
+ "epoch": 39.46049046321526,
+ "grad_norm": 6.383248329162598,
+ "learning_rate": 1.3801239062119666e-05,
+ "loss": 0.3735,
+ "step": 14482
+ },
+ {
+ "epoch": 39.463215258855584,
+ "grad_norm": 6.647173881530762,
+ "learning_rate": 1.3800422796636406e-05,
+ "loss": 0.2435,
+ "step": 14483
+ },
+ {
+ "epoch": 39.46594005449591,
+ "grad_norm": 5.340779781341553,
+ "learning_rate": 1.3799606501555578e-05,
+ "loss": 0.1776,
+ "step": 14484
+ },
+ {
+ "epoch": 39.46866485013624,
+ "grad_norm": 6.516035556793213,
+ "learning_rate": 1.3798790176883536e-05,
+ "loss": 0.1985,
+ "step": 14485
+ },
+ {
+ "epoch": 39.47138964577657,
+ "grad_norm": 5.881908893585205,
+ "learning_rate": 1.379797382262664e-05,
+ "loss": 0.4826,
+ "step": 14486
+ },
+ {
+ "epoch": 39.474114441416894,
+ "grad_norm": 4.972786903381348,
+ "learning_rate": 1.3797157438791244e-05,
+ "loss": 0.2321,
+ "step": 14487
+ },
+ {
+ "epoch": 39.47683923705722,
+ "grad_norm": 15.548818588256836,
+ "learning_rate": 1.379634102538371e-05,
+ "loss": 0.2608,
+ "step": 14488
+ },
+ {
+ "epoch": 39.479564032697546,
+ "grad_norm": 6.68283224105835,
+ "learning_rate": 1.3795524582410394e-05,
+ "loss": 0.2219,
+ "step": 14489
+ },
+ {
+ "epoch": 39.48228882833787,
+ "grad_norm": 5.611134052276611,
+ "learning_rate": 1.3794708109877655e-05,
+ "loss": 0.1968,
+ "step": 14490
+ },
+ {
+ "epoch": 39.485013623978205,
+ "grad_norm": 4.328458309173584,
+ "learning_rate": 1.379389160779185e-05,
+ "loss": 0.1002,
+ "step": 14491
+ },
+ {
+ "epoch": 39.48773841961853,
+ "grad_norm": 5.882762908935547,
+ "learning_rate": 1.379307507615934e-05,
+ "loss": 0.2224,
+ "step": 14492
+ },
+ {
+ "epoch": 39.490463215258856,
+ "grad_norm": 8.353507995605469,
+ "learning_rate": 1.3792258514986481e-05,
+ "loss": 0.3127,
+ "step": 14493
+ },
+ {
+ "epoch": 39.49318801089918,
+ "grad_norm": 6.130002021789551,
+ "learning_rate": 1.3791441924279638e-05,
+ "loss": 0.2527,
+ "step": 14494
+ },
+ {
+ "epoch": 39.49591280653951,
+ "grad_norm": 5.884676933288574,
+ "learning_rate": 1.3790625304045165e-05,
+ "loss": 0.2389,
+ "step": 14495
+ },
+ {
+ "epoch": 39.49863760217983,
+ "grad_norm": 7.270334243774414,
+ "learning_rate": 1.3789808654289428e-05,
+ "loss": 0.2778,
+ "step": 14496
+ },
+ {
+ "epoch": 39.50136239782017,
+ "grad_norm": 6.881333827972412,
+ "learning_rate": 1.3788991975018777e-05,
+ "loss": 0.2471,
+ "step": 14497
+ },
+ {
+ "epoch": 39.50408719346049,
+ "grad_norm": 6.791107654571533,
+ "learning_rate": 1.3788175266239585e-05,
+ "loss": 0.3028,
+ "step": 14498
+ },
+ {
+ "epoch": 39.50681198910082,
+ "grad_norm": 7.451920986175537,
+ "learning_rate": 1.37873585279582e-05,
+ "loss": 0.2419,
+ "step": 14499
+ },
+ {
+ "epoch": 39.509536784741144,
+ "grad_norm": 5.3681721687316895,
+ "learning_rate": 1.3786541760180994e-05,
+ "loss": 0.1921,
+ "step": 14500
+ },
+ {
+ "epoch": 39.51226158038147,
+ "grad_norm": 7.38743257522583,
+ "learning_rate": 1.3785724962914317e-05,
+ "loss": 0.3115,
+ "step": 14501
+ },
+ {
+ "epoch": 39.514986376021795,
+ "grad_norm": 5.627354621887207,
+ "learning_rate": 1.378490813616454e-05,
+ "loss": 0.3022,
+ "step": 14502
+ },
+ {
+ "epoch": 39.51771117166213,
+ "grad_norm": 6.181478500366211,
+ "learning_rate": 1.3784091279938019e-05,
+ "loss": 0.2282,
+ "step": 14503
+ },
+ {
+ "epoch": 39.520435967302454,
+ "grad_norm": 6.117964267730713,
+ "learning_rate": 1.3783274394241119e-05,
+ "loss": 0.3128,
+ "step": 14504
+ },
+ {
+ "epoch": 39.52316076294278,
+ "grad_norm": 5.2905964851379395,
+ "learning_rate": 1.3782457479080198e-05,
+ "loss": 0.4057,
+ "step": 14505
+ },
+ {
+ "epoch": 39.525885558583106,
+ "grad_norm": 4.802488803863525,
+ "learning_rate": 1.378164053446162e-05,
+ "loss": 0.2117,
+ "step": 14506
+ },
+ {
+ "epoch": 39.52861035422343,
+ "grad_norm": 6.579444408416748,
+ "learning_rate": 1.3780823560391748e-05,
+ "loss": 0.1497,
+ "step": 14507
+ },
+ {
+ "epoch": 39.53133514986376,
+ "grad_norm": 5.356363296508789,
+ "learning_rate": 1.378000655687694e-05,
+ "loss": 0.3481,
+ "step": 14508
+ },
+ {
+ "epoch": 39.53405994550409,
+ "grad_norm": 7.40226411819458,
+ "learning_rate": 1.3779189523923568e-05,
+ "loss": 0.2441,
+ "step": 14509
+ },
+ {
+ "epoch": 39.536784741144416,
+ "grad_norm": 6.068542003631592,
+ "learning_rate": 1.3778372461537985e-05,
+ "loss": 0.2196,
+ "step": 14510
+ },
+ {
+ "epoch": 39.53950953678474,
+ "grad_norm": 6.02263069152832,
+ "learning_rate": 1.3777555369726561e-05,
+ "loss": 0.2503,
+ "step": 14511
+ },
+ {
+ "epoch": 39.54223433242507,
+ "grad_norm": 7.612646579742432,
+ "learning_rate": 1.3776738248495659e-05,
+ "loss": 0.2763,
+ "step": 14512
+ },
+ {
+ "epoch": 39.54495912806539,
+ "grad_norm": 4.873693466186523,
+ "learning_rate": 1.3775921097851637e-05,
+ "loss": 0.2158,
+ "step": 14513
+ },
+ {
+ "epoch": 39.54768392370572,
+ "grad_norm": 5.309380054473877,
+ "learning_rate": 1.3775103917800867e-05,
+ "loss": 0.2633,
+ "step": 14514
+ },
+ {
+ "epoch": 39.55040871934605,
+ "grad_norm": 5.206650733947754,
+ "learning_rate": 1.3774286708349706e-05,
+ "loss": 0.206,
+ "step": 14515
+ },
+ {
+ "epoch": 39.55313351498638,
+ "grad_norm": 5.255007743835449,
+ "learning_rate": 1.3773469469504526e-05,
+ "loss": 0.2872,
+ "step": 14516
+ },
+ {
+ "epoch": 39.555858310626704,
+ "grad_norm": 6.5827717781066895,
+ "learning_rate": 1.3772652201271684e-05,
+ "loss": 0.265,
+ "step": 14517
+ },
+ {
+ "epoch": 39.55858310626703,
+ "grad_norm": 6.465464115142822,
+ "learning_rate": 1.3771834903657548e-05,
+ "loss": 0.2229,
+ "step": 14518
+ },
+ {
+ "epoch": 39.561307901907355,
+ "grad_norm": 5.544752597808838,
+ "learning_rate": 1.3771017576668485e-05,
+ "loss": 0.2967,
+ "step": 14519
+ },
+ {
+ "epoch": 39.56403269754768,
+ "grad_norm": 6.1680989265441895,
+ "learning_rate": 1.3770200220310855e-05,
+ "loss": 0.2068,
+ "step": 14520
+ },
+ {
+ "epoch": 39.566757493188014,
+ "grad_norm": 6.143753528594971,
+ "learning_rate": 1.3769382834591029e-05,
+ "loss": 0.2755,
+ "step": 14521
+ },
+ {
+ "epoch": 39.56948228882834,
+ "grad_norm": 4.713968753814697,
+ "learning_rate": 1.3768565419515371e-05,
+ "loss": 0.3034,
+ "step": 14522
+ },
+ {
+ "epoch": 39.572207084468666,
+ "grad_norm": 5.635724067687988,
+ "learning_rate": 1.3767747975090247e-05,
+ "loss": 0.4184,
+ "step": 14523
+ },
+ {
+ "epoch": 39.57493188010899,
+ "grad_norm": 12.68502426147461,
+ "learning_rate": 1.3766930501322024e-05,
+ "loss": 0.2532,
+ "step": 14524
+ },
+ {
+ "epoch": 39.57765667574932,
+ "grad_norm": 6.0208611488342285,
+ "learning_rate": 1.3766112998217064e-05,
+ "loss": 0.1414,
+ "step": 14525
+ },
+ {
+ "epoch": 39.58038147138964,
+ "grad_norm": 8.426074028015137,
+ "learning_rate": 1.376529546578174e-05,
+ "loss": 0.2204,
+ "step": 14526
+ },
+ {
+ "epoch": 39.583106267029976,
+ "grad_norm": 5.933780193328857,
+ "learning_rate": 1.3764477904022417e-05,
+ "loss": 0.2143,
+ "step": 14527
+ },
+ {
+ "epoch": 39.5858310626703,
+ "grad_norm": 9.801464080810547,
+ "learning_rate": 1.3763660312945459e-05,
+ "loss": 0.2581,
+ "step": 14528
+ },
+ {
+ "epoch": 39.58855585831063,
+ "grad_norm": 5.783325672149658,
+ "learning_rate": 1.3762842692557236e-05,
+ "loss": 0.2134,
+ "step": 14529
+ },
+ {
+ "epoch": 39.59128065395095,
+ "grad_norm": 7.276175498962402,
+ "learning_rate": 1.3762025042864116e-05,
+ "loss": 0.2136,
+ "step": 14530
+ },
+ {
+ "epoch": 39.59400544959128,
+ "grad_norm": 5.434111595153809,
+ "learning_rate": 1.3761207363872466e-05,
+ "loss": 0.3399,
+ "step": 14531
+ },
+ {
+ "epoch": 39.596730245231605,
+ "grad_norm": 5.848511219024658,
+ "learning_rate": 1.3760389655588656e-05,
+ "loss": 0.178,
+ "step": 14532
+ },
+ {
+ "epoch": 39.59945504087194,
+ "grad_norm": 5.863616943359375,
+ "learning_rate": 1.3759571918019048e-05,
+ "loss": 0.2931,
+ "step": 14533
+ },
+ {
+ "epoch": 39.60217983651226,
+ "grad_norm": 6.135962009429932,
+ "learning_rate": 1.375875415117002e-05,
+ "loss": 0.2129,
+ "step": 14534
+ },
+ {
+ "epoch": 39.60490463215259,
+ "grad_norm": 7.874301910400391,
+ "learning_rate": 1.375793635504793e-05,
+ "loss": 0.2667,
+ "step": 14535
+ },
+ {
+ "epoch": 39.607629427792915,
+ "grad_norm": 12.337894439697266,
+ "learning_rate": 1.3757118529659155e-05,
+ "loss": 0.3004,
+ "step": 14536
+ },
+ {
+ "epoch": 39.61035422343324,
+ "grad_norm": 5.171806812286377,
+ "learning_rate": 1.3756300675010064e-05,
+ "loss": 0.2465,
+ "step": 14537
+ },
+ {
+ "epoch": 39.61307901907357,
+ "grad_norm": 4.8838934898376465,
+ "learning_rate": 1.375548279110702e-05,
+ "loss": 0.243,
+ "step": 14538
+ },
+ {
+ "epoch": 39.6158038147139,
+ "grad_norm": 6.0601654052734375,
+ "learning_rate": 1.3754664877956401e-05,
+ "loss": 0.2417,
+ "step": 14539
+ },
+ {
+ "epoch": 39.618528610354225,
+ "grad_norm": 6.87872838973999,
+ "learning_rate": 1.375384693556457e-05,
+ "loss": 0.2371,
+ "step": 14540
+ },
+ {
+ "epoch": 39.62125340599455,
+ "grad_norm": 7.159520149230957,
+ "learning_rate": 1.3753028963937902e-05,
+ "loss": 0.2317,
+ "step": 14541
+ },
+ {
+ "epoch": 39.62397820163488,
+ "grad_norm": 6.424330711364746,
+ "learning_rate": 1.3752210963082764e-05,
+ "loss": 0.2436,
+ "step": 14542
+ },
+ {
+ "epoch": 39.6267029972752,
+ "grad_norm": 6.434669494628906,
+ "learning_rate": 1.375139293300553e-05,
+ "loss": 0.2291,
+ "step": 14543
+ },
+ {
+ "epoch": 39.62942779291553,
+ "grad_norm": 5.746603488922119,
+ "learning_rate": 1.3750574873712563e-05,
+ "loss": 0.2731,
+ "step": 14544
+ },
+ {
+ "epoch": 39.63215258855586,
+ "grad_norm": 6.475936412811279,
+ "learning_rate": 1.3749756785210245e-05,
+ "loss": 0.275,
+ "step": 14545
+ },
+ {
+ "epoch": 39.63487738419619,
+ "grad_norm": 6.085830211639404,
+ "learning_rate": 1.3748938667504938e-05,
+ "loss": 0.224,
+ "step": 14546
+ },
+ {
+ "epoch": 39.63760217983651,
+ "grad_norm": 9.126067161560059,
+ "learning_rate": 1.3748120520603022e-05,
+ "loss": 0.4167,
+ "step": 14547
+ },
+ {
+ "epoch": 39.64032697547684,
+ "grad_norm": 7.992452621459961,
+ "learning_rate": 1.374730234451086e-05,
+ "loss": 0.2461,
+ "step": 14548
+ },
+ {
+ "epoch": 39.643051771117165,
+ "grad_norm": 5.556773662567139,
+ "learning_rate": 1.374648413923483e-05,
+ "loss": 0.3287,
+ "step": 14549
+ },
+ {
+ "epoch": 39.64577656675749,
+ "grad_norm": 5.716811656951904,
+ "learning_rate": 1.37456659047813e-05,
+ "loss": 0.2177,
+ "step": 14550
+ },
+ {
+ "epoch": 39.64850136239782,
+ "grad_norm": 5.8144989013671875,
+ "learning_rate": 1.3744847641156649e-05,
+ "loss": 0.2023,
+ "step": 14551
+ },
+ {
+ "epoch": 39.65122615803815,
+ "grad_norm": 10.226764678955078,
+ "learning_rate": 1.3744029348367238e-05,
+ "loss": 0.2317,
+ "step": 14552
+ },
+ {
+ "epoch": 39.653950953678475,
+ "grad_norm": 5.7301859855651855,
+ "learning_rate": 1.3743211026419452e-05,
+ "loss": 0.2363,
+ "step": 14553
+ },
+ {
+ "epoch": 39.6566757493188,
+ "grad_norm": 8.517986297607422,
+ "learning_rate": 1.3742392675319657e-05,
+ "loss": 0.3702,
+ "step": 14554
+ },
+ {
+ "epoch": 39.65940054495913,
+ "grad_norm": 5.571247577667236,
+ "learning_rate": 1.3741574295074232e-05,
+ "loss": 0.4313,
+ "step": 14555
+ },
+ {
+ "epoch": 39.66212534059945,
+ "grad_norm": 5.858706474304199,
+ "learning_rate": 1.3740755885689541e-05,
+ "loss": 0.3682,
+ "step": 14556
+ },
+ {
+ "epoch": 39.664850136239785,
+ "grad_norm": 4.895678520202637,
+ "learning_rate": 1.373993744717197e-05,
+ "loss": 0.4425,
+ "step": 14557
+ },
+ {
+ "epoch": 39.66757493188011,
+ "grad_norm": 5.619413375854492,
+ "learning_rate": 1.3739118979527882e-05,
+ "loss": 0.2836,
+ "step": 14558
+ },
+ {
+ "epoch": 39.67029972752044,
+ "grad_norm": 5.4406046867370605,
+ "learning_rate": 1.3738300482763655e-05,
+ "loss": 0.2448,
+ "step": 14559
+ },
+ {
+ "epoch": 39.67302452316076,
+ "grad_norm": 4.460606575012207,
+ "learning_rate": 1.3737481956885668e-05,
+ "loss": 0.1949,
+ "step": 14560
+ },
+ {
+ "epoch": 39.67574931880109,
+ "grad_norm": 6.217899322509766,
+ "learning_rate": 1.3736663401900288e-05,
+ "loss": 0.2768,
+ "step": 14561
+ },
+ {
+ "epoch": 39.678474114441414,
+ "grad_norm": 5.351813793182373,
+ "learning_rate": 1.3735844817813895e-05,
+ "loss": 0.2784,
+ "step": 14562
+ },
+ {
+ "epoch": 39.68119891008175,
+ "grad_norm": 5.458523273468018,
+ "learning_rate": 1.3735026204632864e-05,
+ "loss": 0.2043,
+ "step": 14563
+ },
+ {
+ "epoch": 39.68392370572207,
+ "grad_norm": 5.464929103851318,
+ "learning_rate": 1.3734207562363568e-05,
+ "loss": 0.2792,
+ "step": 14564
+ },
+ {
+ "epoch": 39.6866485013624,
+ "grad_norm": 6.421558380126953,
+ "learning_rate": 1.3733388891012385e-05,
+ "loss": 0.2537,
+ "step": 14565
+ },
+ {
+ "epoch": 39.689373297002724,
+ "grad_norm": 6.545646667480469,
+ "learning_rate": 1.3732570190585689e-05,
+ "loss": 0.239,
+ "step": 14566
+ },
+ {
+ "epoch": 39.69209809264305,
+ "grad_norm": 6.9950432777404785,
+ "learning_rate": 1.3731751461089858e-05,
+ "loss": 0.2151,
+ "step": 14567
+ },
+ {
+ "epoch": 39.694822888283376,
+ "grad_norm": 6.908062934875488,
+ "learning_rate": 1.3730932702531261e-05,
+ "loss": 0.3112,
+ "step": 14568
+ },
+ {
+ "epoch": 39.69754768392371,
+ "grad_norm": 6.2741899490356445,
+ "learning_rate": 1.3730113914916285e-05,
+ "loss": 0.2596,
+ "step": 14569
+ },
+ {
+ "epoch": 39.700272479564035,
+ "grad_norm": 6.59345817565918,
+ "learning_rate": 1.37292950982513e-05,
+ "loss": 0.2039,
+ "step": 14570
+ },
+ {
+ "epoch": 39.70299727520436,
+ "grad_norm": 11.277990341186523,
+ "learning_rate": 1.3728476252542687e-05,
+ "loss": 0.2684,
+ "step": 14571
+ },
+ {
+ "epoch": 39.705722070844686,
+ "grad_norm": 8.434755325317383,
+ "learning_rate": 1.3727657377796816e-05,
+ "loss": 0.2751,
+ "step": 14572
+ },
+ {
+ "epoch": 39.70844686648501,
+ "grad_norm": 6.903609752655029,
+ "learning_rate": 1.3726838474020077e-05,
+ "loss": 0.238,
+ "step": 14573
+ },
+ {
+ "epoch": 39.71117166212534,
+ "grad_norm": 5.95989990234375,
+ "learning_rate": 1.3726019541218833e-05,
+ "loss": 0.2779,
+ "step": 14574
+ },
+ {
+ "epoch": 39.71389645776567,
+ "grad_norm": 6.068815231323242,
+ "learning_rate": 1.3725200579399474e-05,
+ "loss": 0.184,
+ "step": 14575
+ },
+ {
+ "epoch": 39.716621253406,
+ "grad_norm": 8.695172309875488,
+ "learning_rate": 1.372438158856837e-05,
+ "loss": 0.2631,
+ "step": 14576
+ },
+ {
+ "epoch": 39.71934604904632,
+ "grad_norm": 14.273383140563965,
+ "learning_rate": 1.3723562568731903e-05,
+ "loss": 0.2376,
+ "step": 14577
+ },
+ {
+ "epoch": 39.72207084468665,
+ "grad_norm": 7.18869686126709,
+ "learning_rate": 1.3722743519896447e-05,
+ "loss": 0.2187,
+ "step": 14578
+ },
+ {
+ "epoch": 39.724795640326974,
+ "grad_norm": 6.22044563293457,
+ "learning_rate": 1.3721924442068388e-05,
+ "loss": 0.1456,
+ "step": 14579
+ },
+ {
+ "epoch": 39.7275204359673,
+ "grad_norm": 6.530173301696777,
+ "learning_rate": 1.37211053352541e-05,
+ "loss": 0.2498,
+ "step": 14580
+ },
+ {
+ "epoch": 39.73024523160763,
+ "grad_norm": 6.607137680053711,
+ "learning_rate": 1.3720286199459967e-05,
+ "loss": 0.2833,
+ "step": 14581
+ },
+ {
+ "epoch": 39.73297002724796,
+ "grad_norm": 7.22041130065918,
+ "learning_rate": 1.371946703469236e-05,
+ "loss": 0.2257,
+ "step": 14582
+ },
+ {
+ "epoch": 39.735694822888284,
+ "grad_norm": 5.8552565574646,
+ "learning_rate": 1.3718647840957666e-05,
+ "loss": 0.2111,
+ "step": 14583
+ },
+ {
+ "epoch": 39.73841961852861,
+ "grad_norm": 6.913836479187012,
+ "learning_rate": 1.3717828618262261e-05,
+ "loss": 0.1929,
+ "step": 14584
+ },
+ {
+ "epoch": 39.741144414168936,
+ "grad_norm": 5.870815277099609,
+ "learning_rate": 1.3717009366612528e-05,
+ "loss": 0.1751,
+ "step": 14585
+ },
+ {
+ "epoch": 39.74386920980926,
+ "grad_norm": 6.600525379180908,
+ "learning_rate": 1.3716190086014844e-05,
+ "loss": 0.1993,
+ "step": 14586
+ },
+ {
+ "epoch": 39.746594005449595,
+ "grad_norm": 7.7413740158081055,
+ "learning_rate": 1.3715370776475591e-05,
+ "loss": 0.3372,
+ "step": 14587
+ },
+ {
+ "epoch": 39.74931880108992,
+ "grad_norm": 7.063012599945068,
+ "learning_rate": 1.3714551438001149e-05,
+ "loss": 0.2917,
+ "step": 14588
+ },
+ {
+ "epoch": 39.752043596730246,
+ "grad_norm": 8.96944522857666,
+ "learning_rate": 1.3713732070597902e-05,
+ "loss": 0.3526,
+ "step": 14589
+ },
+ {
+ "epoch": 39.75476839237057,
+ "grad_norm": 6.1891560554504395,
+ "learning_rate": 1.371291267427223e-05,
+ "loss": 0.2988,
+ "step": 14590
+ },
+ {
+ "epoch": 39.7574931880109,
+ "grad_norm": 10.691773414611816,
+ "learning_rate": 1.3712093249030513e-05,
+ "loss": 0.2568,
+ "step": 14591
+ },
+ {
+ "epoch": 39.76021798365122,
+ "grad_norm": 6.2613935470581055,
+ "learning_rate": 1.3711273794879131e-05,
+ "loss": 0.2761,
+ "step": 14592
+ },
+ {
+ "epoch": 39.762942779291556,
+ "grad_norm": 6.848296165466309,
+ "learning_rate": 1.3710454311824472e-05,
+ "loss": 0.2192,
+ "step": 14593
+ },
+ {
+ "epoch": 39.76566757493188,
+ "grad_norm": 8.631440162658691,
+ "learning_rate": 1.370963479987291e-05,
+ "loss": 0.278,
+ "step": 14594
+ },
+ {
+ "epoch": 39.76839237057221,
+ "grad_norm": 8.44626235961914,
+ "learning_rate": 1.3708815259030835e-05,
+ "loss": 0.2311,
+ "step": 14595
+ },
+ {
+ "epoch": 39.771117166212534,
+ "grad_norm": 5.785213470458984,
+ "learning_rate": 1.3707995689304626e-05,
+ "loss": 0.3227,
+ "step": 14596
+ },
+ {
+ "epoch": 39.77384196185286,
+ "grad_norm": 7.679196357727051,
+ "learning_rate": 1.3707176090700662e-05,
+ "loss": 0.3581,
+ "step": 14597
+ },
+ {
+ "epoch": 39.776566757493185,
+ "grad_norm": 7.344898223876953,
+ "learning_rate": 1.3706356463225332e-05,
+ "loss": 0.4623,
+ "step": 14598
+ },
+ {
+ "epoch": 39.77929155313352,
+ "grad_norm": 6.047147274017334,
+ "learning_rate": 1.3705536806885018e-05,
+ "loss": 0.2981,
+ "step": 14599
+ },
+ {
+ "epoch": 39.782016348773844,
+ "grad_norm": 4.970607280731201,
+ "learning_rate": 1.3704717121686103e-05,
+ "loss": 0.1991,
+ "step": 14600
+ },
+ {
+ "epoch": 39.78474114441417,
+ "grad_norm": 6.093405246734619,
+ "learning_rate": 1.3703897407634971e-05,
+ "loss": 0.5023,
+ "step": 14601
+ },
+ {
+ "epoch": 39.787465940054496,
+ "grad_norm": 6.924727916717529,
+ "learning_rate": 1.3703077664738002e-05,
+ "loss": 0.273,
+ "step": 14602
+ },
+ {
+ "epoch": 39.79019073569482,
+ "grad_norm": 5.4926228523254395,
+ "learning_rate": 1.3702257893001588e-05,
+ "loss": 0.2254,
+ "step": 14603
+ },
+ {
+ "epoch": 39.79291553133515,
+ "grad_norm": 6.771979331970215,
+ "learning_rate": 1.3701438092432104e-05,
+ "loss": 0.1754,
+ "step": 14604
+ },
+ {
+ "epoch": 39.79564032697548,
+ "grad_norm": 6.45460319519043,
+ "learning_rate": 1.3700618263035941e-05,
+ "loss": 0.2474,
+ "step": 14605
+ },
+ {
+ "epoch": 39.798365122615806,
+ "grad_norm": 7.092337608337402,
+ "learning_rate": 1.3699798404819485e-05,
+ "loss": 0.3309,
+ "step": 14606
+ },
+ {
+ "epoch": 39.80108991825613,
+ "grad_norm": 5.740354537963867,
+ "learning_rate": 1.3698978517789112e-05,
+ "loss": 0.1925,
+ "step": 14607
+ },
+ {
+ "epoch": 39.80381471389646,
+ "grad_norm": 5.312353610992432,
+ "learning_rate": 1.3698158601951217e-05,
+ "loss": 0.3696,
+ "step": 14608
+ },
+ {
+ "epoch": 39.80653950953678,
+ "grad_norm": 6.3158063888549805,
+ "learning_rate": 1.3697338657312183e-05,
+ "loss": 0.3152,
+ "step": 14609
+ },
+ {
+ "epoch": 39.80926430517711,
+ "grad_norm": 5.625290870666504,
+ "learning_rate": 1.3696518683878392e-05,
+ "loss": 0.1586,
+ "step": 14610
+ },
+ {
+ "epoch": 39.81198910081744,
+ "grad_norm": 10.652303695678711,
+ "learning_rate": 1.3695698681656233e-05,
+ "loss": 0.2413,
+ "step": 14611
+ },
+ {
+ "epoch": 39.81471389645777,
+ "grad_norm": 6.256007194519043,
+ "learning_rate": 1.3694878650652092e-05,
+ "loss": 0.2786,
+ "step": 14612
+ },
+ {
+ "epoch": 39.817438692098094,
+ "grad_norm": 4.749094486236572,
+ "learning_rate": 1.3694058590872354e-05,
+ "loss": 0.185,
+ "step": 14613
+ },
+ {
+ "epoch": 39.82016348773842,
+ "grad_norm": 6.310389518737793,
+ "learning_rate": 1.369323850232341e-05,
+ "loss": 0.4304,
+ "step": 14614
+ },
+ {
+ "epoch": 39.822888283378745,
+ "grad_norm": 6.497410297393799,
+ "learning_rate": 1.3692418385011639e-05,
+ "loss": 0.2418,
+ "step": 14615
+ },
+ {
+ "epoch": 39.82561307901907,
+ "grad_norm": 7.917486667633057,
+ "learning_rate": 1.3691598238943438e-05,
+ "loss": 0.3297,
+ "step": 14616
+ },
+ {
+ "epoch": 39.828337874659404,
+ "grad_norm": 6.416966438293457,
+ "learning_rate": 1.3690778064125182e-05,
+ "loss": 0.2968,
+ "step": 14617
+ },
+ {
+ "epoch": 39.83106267029973,
+ "grad_norm": 5.088503837585449,
+ "learning_rate": 1.368995786056327e-05,
+ "loss": 0.5073,
+ "step": 14618
+ },
+ {
+ "epoch": 39.833787465940055,
+ "grad_norm": 6.163337707519531,
+ "learning_rate": 1.3689137628264085e-05,
+ "loss": 0.2898,
+ "step": 14619
+ },
+ {
+ "epoch": 39.83651226158038,
+ "grad_norm": 4.374394416809082,
+ "learning_rate": 1.368831736723401e-05,
+ "loss": 0.2234,
+ "step": 14620
+ },
+ {
+ "epoch": 39.83923705722071,
+ "grad_norm": 6.270904064178467,
+ "learning_rate": 1.3687497077479441e-05,
+ "loss": 0.1773,
+ "step": 14621
+ },
+ {
+ "epoch": 39.84196185286103,
+ "grad_norm": 5.866994857788086,
+ "learning_rate": 1.3686676759006764e-05,
+ "loss": 0.3527,
+ "step": 14622
+ },
+ {
+ "epoch": 39.844686648501366,
+ "grad_norm": 5.5044426918029785,
+ "learning_rate": 1.3685856411822367e-05,
+ "loss": 0.3417,
+ "step": 14623
+ },
+ {
+ "epoch": 39.84741144414169,
+ "grad_norm": 5.12974214553833,
+ "learning_rate": 1.3685036035932639e-05,
+ "loss": 0.165,
+ "step": 14624
+ },
+ {
+ "epoch": 39.85013623978202,
+ "grad_norm": 6.531769752502441,
+ "learning_rate": 1.3684215631343969e-05,
+ "loss": 0.2958,
+ "step": 14625
+ },
+ {
+ "epoch": 39.85286103542234,
+ "grad_norm": 18.12469482421875,
+ "learning_rate": 1.3683395198062747e-05,
+ "loss": 0.4338,
+ "step": 14626
+ },
+ {
+ "epoch": 39.85558583106267,
+ "grad_norm": 5.587963581085205,
+ "learning_rate": 1.368257473609536e-05,
+ "loss": 0.3274,
+ "step": 14627
+ },
+ {
+ "epoch": 39.858310626702995,
+ "grad_norm": 6.947348117828369,
+ "learning_rate": 1.3681754245448202e-05,
+ "loss": 0.2568,
+ "step": 14628
+ },
+ {
+ "epoch": 39.86103542234333,
+ "grad_norm": 6.23321008682251,
+ "learning_rate": 1.3680933726127656e-05,
+ "loss": 0.286,
+ "step": 14629
+ },
+ {
+ "epoch": 39.86376021798365,
+ "grad_norm": 4.902149200439453,
+ "learning_rate": 1.368011317814012e-05,
+ "loss": 0.2003,
+ "step": 14630
+ },
+ {
+ "epoch": 39.86648501362398,
+ "grad_norm": 7.079772472381592,
+ "learning_rate": 1.367929260149198e-05,
+ "loss": 0.3779,
+ "step": 14631
+ },
+ {
+ "epoch": 39.869209809264305,
+ "grad_norm": 5.892935276031494,
+ "learning_rate": 1.3678471996189629e-05,
+ "loss": 0.2592,
+ "step": 14632
+ },
+ {
+ "epoch": 39.87193460490463,
+ "grad_norm": 5.965717315673828,
+ "learning_rate": 1.3677651362239454e-05,
+ "loss": 0.2357,
+ "step": 14633
+ },
+ {
+ "epoch": 39.87465940054496,
+ "grad_norm": 6.772895336151123,
+ "learning_rate": 1.3676830699647852e-05,
+ "loss": 0.1866,
+ "step": 14634
+ },
+ {
+ "epoch": 39.87738419618529,
+ "grad_norm": 6.63701057434082,
+ "learning_rate": 1.3676010008421208e-05,
+ "loss": 0.2314,
+ "step": 14635
+ },
+ {
+ "epoch": 39.880108991825615,
+ "grad_norm": 4.581226825714111,
+ "learning_rate": 1.3675189288565918e-05,
+ "loss": 0.2225,
+ "step": 14636
+ },
+ {
+ "epoch": 39.88283378746594,
+ "grad_norm": 4.762144088745117,
+ "learning_rate": 1.367436854008837e-05,
+ "loss": 0.322,
+ "step": 14637
+ },
+ {
+ "epoch": 39.88555858310627,
+ "grad_norm": 5.054895401000977,
+ "learning_rate": 1.3673547762994959e-05,
+ "loss": 0.2633,
+ "step": 14638
+ },
+ {
+ "epoch": 39.88828337874659,
+ "grad_norm": 4.342443466186523,
+ "learning_rate": 1.3672726957292075e-05,
+ "loss": 0.306,
+ "step": 14639
+ },
+ {
+ "epoch": 39.89100817438692,
+ "grad_norm": 4.6823272705078125,
+ "learning_rate": 1.3671906122986114e-05,
+ "loss": 0.4968,
+ "step": 14640
+ },
+ {
+ "epoch": 39.89373297002725,
+ "grad_norm": 6.215219974517822,
+ "learning_rate": 1.3671085260083465e-05,
+ "loss": 0.1587,
+ "step": 14641
+ },
+ {
+ "epoch": 39.89645776566758,
+ "grad_norm": 6.84375524520874,
+ "learning_rate": 1.3670264368590524e-05,
+ "loss": 0.2072,
+ "step": 14642
+ },
+ {
+ "epoch": 39.8991825613079,
+ "grad_norm": 5.9075727462768555,
+ "learning_rate": 1.3669443448513679e-05,
+ "loss": 0.316,
+ "step": 14643
+ },
+ {
+ "epoch": 39.90190735694823,
+ "grad_norm": 7.016509532928467,
+ "learning_rate": 1.366862249985933e-05,
+ "loss": 0.3074,
+ "step": 14644
+ },
+ {
+ "epoch": 39.904632152588555,
+ "grad_norm": 5.5128254890441895,
+ "learning_rate": 1.3667801522633866e-05,
+ "loss": 0.1993,
+ "step": 14645
+ },
+ {
+ "epoch": 39.90735694822888,
+ "grad_norm": 6.173662185668945,
+ "learning_rate": 1.3666980516843682e-05,
+ "loss": 0.2124,
+ "step": 14646
+ },
+ {
+ "epoch": 39.91008174386921,
+ "grad_norm": 5.529973983764648,
+ "learning_rate": 1.3666159482495167e-05,
+ "loss": 0.2811,
+ "step": 14647
+ },
+ {
+ "epoch": 39.91280653950954,
+ "grad_norm": 5.944946765899658,
+ "learning_rate": 1.3665338419594725e-05,
+ "loss": 0.1991,
+ "step": 14648
+ },
+ {
+ "epoch": 39.915531335149865,
+ "grad_norm": 4.5183820724487305,
+ "learning_rate": 1.3664517328148744e-05,
+ "loss": 0.2014,
+ "step": 14649
+ },
+ {
+ "epoch": 39.91825613079019,
+ "grad_norm": 6.031014919281006,
+ "learning_rate": 1.3663696208163622e-05,
+ "loss": 0.2306,
+ "step": 14650
+ },
+ {
+ "epoch": 39.920980926430516,
+ "grad_norm": 5.391735076904297,
+ "learning_rate": 1.366287505964575e-05,
+ "loss": 0.4026,
+ "step": 14651
+ },
+ {
+ "epoch": 39.92370572207084,
+ "grad_norm": 5.912613391876221,
+ "learning_rate": 1.3662053882601525e-05,
+ "loss": 0.2459,
+ "step": 14652
+ },
+ {
+ "epoch": 39.926430517711175,
+ "grad_norm": 6.257481098175049,
+ "learning_rate": 1.3661232677037341e-05,
+ "loss": 0.3528,
+ "step": 14653
+ },
+ {
+ "epoch": 39.9291553133515,
+ "grad_norm": 5.020956993103027,
+ "learning_rate": 1.3660411442959597e-05,
+ "loss": 0.2401,
+ "step": 14654
+ },
+ {
+ "epoch": 39.93188010899183,
+ "grad_norm": 5.578127384185791,
+ "learning_rate": 1.3659590180374685e-05,
+ "loss": 0.1824,
+ "step": 14655
+ },
+ {
+ "epoch": 39.93460490463215,
+ "grad_norm": 7.9125494956970215,
+ "learning_rate": 1.3658768889289003e-05,
+ "loss": 0.2713,
+ "step": 14656
+ },
+ {
+ "epoch": 39.93732970027248,
+ "grad_norm": 4.773212432861328,
+ "learning_rate": 1.3657947569708946e-05,
+ "loss": 0.2169,
+ "step": 14657
+ },
+ {
+ "epoch": 39.940054495912804,
+ "grad_norm": 5.907552719116211,
+ "learning_rate": 1.3657126221640914e-05,
+ "loss": 0.2264,
+ "step": 14658
+ },
+ {
+ "epoch": 39.94277929155314,
+ "grad_norm": 5.584198474884033,
+ "learning_rate": 1.3656304845091298e-05,
+ "loss": 0.3464,
+ "step": 14659
+ },
+ {
+ "epoch": 39.94550408719346,
+ "grad_norm": 6.994326591491699,
+ "learning_rate": 1.3655483440066496e-05,
+ "loss": 0.3241,
+ "step": 14660
+ },
+ {
+ "epoch": 39.94822888283379,
+ "grad_norm": 5.74834680557251,
+ "learning_rate": 1.3654662006572909e-05,
+ "loss": 0.3925,
+ "step": 14661
+ },
+ {
+ "epoch": 39.950953678474114,
+ "grad_norm": 5.148861885070801,
+ "learning_rate": 1.3653840544616932e-05,
+ "loss": 0.2659,
+ "step": 14662
+ },
+ {
+ "epoch": 39.95367847411444,
+ "grad_norm": 8.553078651428223,
+ "learning_rate": 1.3653019054204962e-05,
+ "loss": 0.2401,
+ "step": 14663
+ },
+ {
+ "epoch": 39.956403269754766,
+ "grad_norm": 5.828797817230225,
+ "learning_rate": 1.3652197535343396e-05,
+ "loss": 0.2697,
+ "step": 14664
+ },
+ {
+ "epoch": 39.95912806539509,
+ "grad_norm": 4.388965606689453,
+ "learning_rate": 1.3651375988038633e-05,
+ "loss": 0.1892,
+ "step": 14665
+ },
+ {
+ "epoch": 39.961852861035425,
+ "grad_norm": 7.490252494812012,
+ "learning_rate": 1.3650554412297075e-05,
+ "loss": 0.193,
+ "step": 14666
+ },
+ {
+ "epoch": 39.96457765667575,
+ "grad_norm": 6.492657661437988,
+ "learning_rate": 1.3649732808125114e-05,
+ "loss": 0.3375,
+ "step": 14667
+ },
+ {
+ "epoch": 39.967302452316076,
+ "grad_norm": 9.734619140625,
+ "learning_rate": 1.3648911175529151e-05,
+ "loss": 0.3243,
+ "step": 14668
+ },
+ {
+ "epoch": 39.9700272479564,
+ "grad_norm": 6.138456344604492,
+ "learning_rate": 1.3648089514515585e-05,
+ "loss": 0.2633,
+ "step": 14669
+ },
+ {
+ "epoch": 39.97275204359673,
+ "grad_norm": 6.453230381011963,
+ "learning_rate": 1.3647267825090818e-05,
+ "loss": 0.2957,
+ "step": 14670
+ },
+ {
+ "epoch": 39.97547683923706,
+ "grad_norm": 6.128805637359619,
+ "learning_rate": 1.3646446107261244e-05,
+ "loss": 0.2565,
+ "step": 14671
+ },
+ {
+ "epoch": 39.97820163487739,
+ "grad_norm": 5.4172139167785645,
+ "learning_rate": 1.3645624361033268e-05,
+ "loss": 0.1973,
+ "step": 14672
+ },
+ {
+ "epoch": 39.98092643051771,
+ "grad_norm": 5.549086093902588,
+ "learning_rate": 1.364480258641328e-05,
+ "loss": 0.2594,
+ "step": 14673
+ },
+ {
+ "epoch": 39.98365122615804,
+ "grad_norm": 5.352941989898682,
+ "learning_rate": 1.3643980783407693e-05,
+ "loss": 0.3738,
+ "step": 14674
+ },
+ {
+ "epoch": 39.986376021798364,
+ "grad_norm": 8.064535140991211,
+ "learning_rate": 1.36431589520229e-05,
+ "loss": 0.2649,
+ "step": 14675
+ },
+ {
+ "epoch": 39.98910081743869,
+ "grad_norm": 5.839471340179443,
+ "learning_rate": 1.3642337092265301e-05,
+ "loss": 0.2395,
+ "step": 14676
+ },
+ {
+ "epoch": 39.991825613079016,
+ "grad_norm": 5.32957124710083,
+ "learning_rate": 1.3641515204141297e-05,
+ "loss": 0.1831,
+ "step": 14677
+ },
+ {
+ "epoch": 39.99455040871935,
+ "grad_norm": 6.660703182220459,
+ "learning_rate": 1.3640693287657294e-05,
+ "loss": 0.2849,
+ "step": 14678
+ },
+ {
+ "epoch": 39.997275204359674,
+ "grad_norm": 5.129420757293701,
+ "learning_rate": 1.3639871342819686e-05,
+ "loss": 0.3918,
+ "step": 14679
+ },
+ {
+ "epoch": 40.0,
+ "grad_norm": 5.764123439788818,
+ "learning_rate": 1.3639049369634878e-05,
+ "loss": 0.2851,
+ "step": 14680
+ },
+ {
+ "epoch": 40.002724795640326,
+ "grad_norm": 4.670469760894775,
+ "learning_rate": 1.3638227368109268e-05,
+ "loss": 0.2391,
+ "step": 14681
+ },
+ {
+ "epoch": 40.00544959128065,
+ "grad_norm": 4.787637233734131,
+ "learning_rate": 1.3637405338249261e-05,
+ "loss": 0.1769,
+ "step": 14682
+ },
+ {
+ "epoch": 40.00817438692098,
+ "grad_norm": 4.994102478027344,
+ "learning_rate": 1.3636583280061262e-05,
+ "loss": 0.353,
+ "step": 14683
+ },
+ {
+ "epoch": 40.01089918256131,
+ "grad_norm": 5.163061618804932,
+ "learning_rate": 1.3635761193551666e-05,
+ "loss": 0.2016,
+ "step": 14684
+ },
+ {
+ "epoch": 40.013623978201636,
+ "grad_norm": 5.797138214111328,
+ "learning_rate": 1.3634939078726878e-05,
+ "loss": 0.3666,
+ "step": 14685
+ },
+ {
+ "epoch": 40.01634877384196,
+ "grad_norm": 5.63509464263916,
+ "learning_rate": 1.3634116935593307e-05,
+ "loss": 0.4189,
+ "step": 14686
+ },
+ {
+ "epoch": 40.01907356948229,
+ "grad_norm": 7.220623970031738,
+ "learning_rate": 1.3633294764157344e-05,
+ "loss": 0.3734,
+ "step": 14687
+ },
+ {
+ "epoch": 40.02179836512261,
+ "grad_norm": 20.821069717407227,
+ "learning_rate": 1.3632472564425402e-05,
+ "loss": 0.2023,
+ "step": 14688
+ },
+ {
+ "epoch": 40.02452316076294,
+ "grad_norm": 6.66929292678833,
+ "learning_rate": 1.3631650336403879e-05,
+ "loss": 0.2946,
+ "step": 14689
+ },
+ {
+ "epoch": 40.02724795640327,
+ "grad_norm": 5.437743663787842,
+ "learning_rate": 1.3630828080099181e-05,
+ "loss": 0.1693,
+ "step": 14690
+ },
+ {
+ "epoch": 40.0299727520436,
+ "grad_norm": 4.195618152618408,
+ "learning_rate": 1.3630005795517712e-05,
+ "loss": 0.1515,
+ "step": 14691
+ },
+ {
+ "epoch": 40.032697547683924,
+ "grad_norm": 6.934732913970947,
+ "learning_rate": 1.362918348266587e-05,
+ "loss": 0.2677,
+ "step": 14692
+ },
+ {
+ "epoch": 40.03542234332425,
+ "grad_norm": 5.9340996742248535,
+ "learning_rate": 1.3628361141550068e-05,
+ "loss": 0.2761,
+ "step": 14693
+ },
+ {
+ "epoch": 40.038147138964575,
+ "grad_norm": 9.502779960632324,
+ "learning_rate": 1.3627538772176705e-05,
+ "loss": 0.3185,
+ "step": 14694
+ },
+ {
+ "epoch": 40.0408719346049,
+ "grad_norm": 5.000411510467529,
+ "learning_rate": 1.3626716374552187e-05,
+ "loss": 0.1497,
+ "step": 14695
+ },
+ {
+ "epoch": 40.043596730245234,
+ "grad_norm": 5.282544136047363,
+ "learning_rate": 1.3625893948682919e-05,
+ "loss": 0.266,
+ "step": 14696
+ },
+ {
+ "epoch": 40.04632152588556,
+ "grad_norm": 5.492834091186523,
+ "learning_rate": 1.3625071494575304e-05,
+ "loss": 0.1529,
+ "step": 14697
+ },
+ {
+ "epoch": 40.049046321525886,
+ "grad_norm": 4.832657337188721,
+ "learning_rate": 1.3624249012235748e-05,
+ "loss": 0.1769,
+ "step": 14698
+ },
+ {
+ "epoch": 40.05177111716621,
+ "grad_norm": 5.096675872802734,
+ "learning_rate": 1.3623426501670662e-05,
+ "loss": 0.2924,
+ "step": 14699
+ },
+ {
+ "epoch": 40.05449591280654,
+ "grad_norm": 5.773919582366943,
+ "learning_rate": 1.3622603962886443e-05,
+ "loss": 0.2339,
+ "step": 14700
+ },
+ {
+ "epoch": 40.05722070844686,
+ "grad_norm": 8.40015697479248,
+ "learning_rate": 1.3621781395889503e-05,
+ "loss": 0.3245,
+ "step": 14701
+ },
+ {
+ "epoch": 40.059945504087196,
+ "grad_norm": 6.444672107696533,
+ "learning_rate": 1.3620958800686246e-05,
+ "loss": 0.3568,
+ "step": 14702
+ },
+ {
+ "epoch": 40.06267029972752,
+ "grad_norm": 5.762142181396484,
+ "learning_rate": 1.3620136177283078e-05,
+ "loss": 0.1714,
+ "step": 14703
+ },
+ {
+ "epoch": 40.06539509536785,
+ "grad_norm": 11.245086669921875,
+ "learning_rate": 1.3619313525686407e-05,
+ "loss": 0.2463,
+ "step": 14704
+ },
+ {
+ "epoch": 40.06811989100817,
+ "grad_norm": 4.8663411140441895,
+ "learning_rate": 1.3618490845902637e-05,
+ "loss": 0.1648,
+ "step": 14705
+ },
+ {
+ "epoch": 40.0708446866485,
+ "grad_norm": 4.974968433380127,
+ "learning_rate": 1.3617668137938176e-05,
+ "loss": 0.3024,
+ "step": 14706
+ },
+ {
+ "epoch": 40.073569482288825,
+ "grad_norm": 4.860438346862793,
+ "learning_rate": 1.3616845401799433e-05,
+ "loss": 0.2716,
+ "step": 14707
+ },
+ {
+ "epoch": 40.07629427792916,
+ "grad_norm": 5.657793998718262,
+ "learning_rate": 1.3616022637492814e-05,
+ "loss": 0.2576,
+ "step": 14708
+ },
+ {
+ "epoch": 40.079019073569484,
+ "grad_norm": 17.060792922973633,
+ "learning_rate": 1.3615199845024729e-05,
+ "loss": 0.2642,
+ "step": 14709
+ },
+ {
+ "epoch": 40.08174386920981,
+ "grad_norm": 4.534100532531738,
+ "learning_rate": 1.3614377024401581e-05,
+ "loss": 0.3705,
+ "step": 14710
+ },
+ {
+ "epoch": 40.084468664850135,
+ "grad_norm": 5.813042640686035,
+ "learning_rate": 1.3613554175629783e-05,
+ "loss": 0.2808,
+ "step": 14711
+ },
+ {
+ "epoch": 40.08719346049046,
+ "grad_norm": 5.779947280883789,
+ "learning_rate": 1.3612731298715743e-05,
+ "loss": 0.2162,
+ "step": 14712
+ },
+ {
+ "epoch": 40.08991825613079,
+ "grad_norm": 5.839858055114746,
+ "learning_rate": 1.3611908393665866e-05,
+ "loss": 0.3207,
+ "step": 14713
+ },
+ {
+ "epoch": 40.09264305177112,
+ "grad_norm": 7.131965637207031,
+ "learning_rate": 1.3611085460486561e-05,
+ "loss": 0.1586,
+ "step": 14714
+ },
+ {
+ "epoch": 40.095367847411445,
+ "grad_norm": 5.477025032043457,
+ "learning_rate": 1.3610262499184241e-05,
+ "loss": 0.2087,
+ "step": 14715
+ },
+ {
+ "epoch": 40.09809264305177,
+ "grad_norm": 8.843849182128906,
+ "learning_rate": 1.360943950976531e-05,
+ "loss": 0.2567,
+ "step": 14716
+ },
+ {
+ "epoch": 40.1008174386921,
+ "grad_norm": 5.079222679138184,
+ "learning_rate": 1.3608616492236185e-05,
+ "loss": 0.2525,
+ "step": 14717
+ },
+ {
+ "epoch": 40.10354223433242,
+ "grad_norm": 5.357724666595459,
+ "learning_rate": 1.3607793446603266e-05,
+ "loss": 0.3328,
+ "step": 14718
+ },
+ {
+ "epoch": 40.10626702997275,
+ "grad_norm": 5.058252334594727,
+ "learning_rate": 1.3606970372872972e-05,
+ "loss": 0.2778,
+ "step": 14719
+ },
+ {
+ "epoch": 40.10899182561308,
+ "grad_norm": 6.287322044372559,
+ "learning_rate": 1.3606147271051706e-05,
+ "loss": 0.1813,
+ "step": 14720
+ },
+ {
+ "epoch": 40.11171662125341,
+ "grad_norm": 5.835550308227539,
+ "learning_rate": 1.3605324141145883e-05,
+ "loss": 0.2213,
+ "step": 14721
+ },
+ {
+ "epoch": 40.11444141689373,
+ "grad_norm": 6.14241886138916,
+ "learning_rate": 1.3604500983161911e-05,
+ "loss": 0.2883,
+ "step": 14722
+ },
+ {
+ "epoch": 40.11716621253406,
+ "grad_norm": 5.560632228851318,
+ "learning_rate": 1.36036777971062e-05,
+ "loss": 0.2858,
+ "step": 14723
+ },
+ {
+ "epoch": 40.119891008174385,
+ "grad_norm": 5.573838233947754,
+ "learning_rate": 1.3602854582985163e-05,
+ "loss": 0.3586,
+ "step": 14724
+ },
+ {
+ "epoch": 40.12261580381471,
+ "grad_norm": 6.711114406585693,
+ "learning_rate": 1.360203134080521e-05,
+ "loss": 0.2218,
+ "step": 14725
+ },
+ {
+ "epoch": 40.12534059945504,
+ "grad_norm": 7.186511993408203,
+ "learning_rate": 1.3601208070572754e-05,
+ "loss": 0.2581,
+ "step": 14726
+ },
+ {
+ "epoch": 40.12806539509537,
+ "grad_norm": 9.657685279846191,
+ "learning_rate": 1.3600384772294206e-05,
+ "loss": 0.3543,
+ "step": 14727
+ },
+ {
+ "epoch": 40.130790190735695,
+ "grad_norm": 4.581483840942383,
+ "learning_rate": 1.3599561445975975e-05,
+ "loss": 0.347,
+ "step": 14728
+ },
+ {
+ "epoch": 40.13351498637602,
+ "grad_norm": 6.904247283935547,
+ "learning_rate": 1.3598738091624477e-05,
+ "loss": 0.2191,
+ "step": 14729
+ },
+ {
+ "epoch": 40.13623978201635,
+ "grad_norm": 5.889281749725342,
+ "learning_rate": 1.3597914709246122e-05,
+ "loss": 0.2881,
+ "step": 14730
+ },
+ {
+ "epoch": 40.13896457765667,
+ "grad_norm": 5.417539596557617,
+ "learning_rate": 1.3597091298847325e-05,
+ "loss": 0.2457,
+ "step": 14731
+ },
+ {
+ "epoch": 40.141689373297005,
+ "grad_norm": 6.106906414031982,
+ "learning_rate": 1.3596267860434496e-05,
+ "loss": 0.281,
+ "step": 14732
+ },
+ {
+ "epoch": 40.14441416893733,
+ "grad_norm": 5.275127410888672,
+ "learning_rate": 1.3595444394014046e-05,
+ "loss": 0.2599,
+ "step": 14733
+ },
+ {
+ "epoch": 40.14713896457766,
+ "grad_norm": 7.4308319091796875,
+ "learning_rate": 1.359462089959239e-05,
+ "loss": 0.216,
+ "step": 14734
+ },
+ {
+ "epoch": 40.14986376021798,
+ "grad_norm": 4.960119247436523,
+ "learning_rate": 1.3593797377175949e-05,
+ "loss": 0.3427,
+ "step": 14735
+ },
+ {
+ "epoch": 40.15258855585831,
+ "grad_norm": 5.1894636154174805,
+ "learning_rate": 1.3592973826771123e-05,
+ "loss": 0.2075,
+ "step": 14736
+ },
+ {
+ "epoch": 40.155313351498634,
+ "grad_norm": 6.531680583953857,
+ "learning_rate": 1.3592150248384334e-05,
+ "loss": 0.4168,
+ "step": 14737
+ },
+ {
+ "epoch": 40.15803814713897,
+ "grad_norm": 4.947193145751953,
+ "learning_rate": 1.3591326642021996e-05,
+ "loss": 0.229,
+ "step": 14738
+ },
+ {
+ "epoch": 40.16076294277929,
+ "grad_norm": 7.752299785614014,
+ "learning_rate": 1.3590503007690523e-05,
+ "loss": 0.333,
+ "step": 14739
+ },
+ {
+ "epoch": 40.16348773841962,
+ "grad_norm": 5.813737869262695,
+ "learning_rate": 1.3589679345396323e-05,
+ "loss": 0.1799,
+ "step": 14740
+ },
+ {
+ "epoch": 40.166212534059945,
+ "grad_norm": 4.673559188842773,
+ "learning_rate": 1.3588855655145819e-05,
+ "loss": 0.2692,
+ "step": 14741
+ },
+ {
+ "epoch": 40.16893732970027,
+ "grad_norm": 5.340415000915527,
+ "learning_rate": 1.3588031936945423e-05,
+ "loss": 0.3775,
+ "step": 14742
+ },
+ {
+ "epoch": 40.171662125340596,
+ "grad_norm": 5.528367519378662,
+ "learning_rate": 1.3587208190801549e-05,
+ "loss": 0.2867,
+ "step": 14743
+ },
+ {
+ "epoch": 40.17438692098093,
+ "grad_norm": 5.196868896484375,
+ "learning_rate": 1.3586384416720612e-05,
+ "loss": 0.167,
+ "step": 14744
+ },
+ {
+ "epoch": 40.177111716621255,
+ "grad_norm": 5.872586250305176,
+ "learning_rate": 1.3585560614709033e-05,
+ "loss": 0.1531,
+ "step": 14745
+ },
+ {
+ "epoch": 40.17983651226158,
+ "grad_norm": 7.798600196838379,
+ "learning_rate": 1.3584736784773218e-05,
+ "loss": 0.2896,
+ "step": 14746
+ },
+ {
+ "epoch": 40.182561307901906,
+ "grad_norm": 6.427639007568359,
+ "learning_rate": 1.3583912926919594e-05,
+ "loss": 0.1616,
+ "step": 14747
+ },
+ {
+ "epoch": 40.18528610354223,
+ "grad_norm": 5.750645637512207,
+ "learning_rate": 1.3583089041154565e-05,
+ "loss": 0.3266,
+ "step": 14748
+ },
+ {
+ "epoch": 40.18801089918256,
+ "grad_norm": 5.34175968170166,
+ "learning_rate": 1.358226512748456e-05,
+ "loss": 0.1887,
+ "step": 14749
+ },
+ {
+ "epoch": 40.19073569482289,
+ "grad_norm": 6.367232322692871,
+ "learning_rate": 1.3581441185915982e-05,
+ "loss": 0.1972,
+ "step": 14750
+ },
+ {
+ "epoch": 40.19346049046322,
+ "grad_norm": 5.012624263763428,
+ "learning_rate": 1.3580617216455261e-05,
+ "loss": 0.1836,
+ "step": 14751
+ },
+ {
+ "epoch": 40.19618528610354,
+ "grad_norm": 5.424821376800537,
+ "learning_rate": 1.3579793219108805e-05,
+ "loss": 0.2442,
+ "step": 14752
+ },
+ {
+ "epoch": 40.19891008174387,
+ "grad_norm": 5.797748565673828,
+ "learning_rate": 1.3578969193883038e-05,
+ "loss": 0.3721,
+ "step": 14753
+ },
+ {
+ "epoch": 40.201634877384194,
+ "grad_norm": 7.14633321762085,
+ "learning_rate": 1.3578145140784373e-05,
+ "loss": 0.3064,
+ "step": 14754
+ },
+ {
+ "epoch": 40.20435967302452,
+ "grad_norm": 5.756343364715576,
+ "learning_rate": 1.3577321059819229e-05,
+ "loss": 0.2394,
+ "step": 14755
+ },
+ {
+ "epoch": 40.20708446866485,
+ "grad_norm": 6.218676567077637,
+ "learning_rate": 1.3576496950994022e-05,
+ "loss": 0.1745,
+ "step": 14756
+ },
+ {
+ "epoch": 40.20980926430518,
+ "grad_norm": 7.166897296905518,
+ "learning_rate": 1.3575672814315174e-05,
+ "loss": 0.2559,
+ "step": 14757
+ },
+ {
+ "epoch": 40.212534059945504,
+ "grad_norm": 6.445605754852295,
+ "learning_rate": 1.3574848649789102e-05,
+ "loss": 0.1658,
+ "step": 14758
+ },
+ {
+ "epoch": 40.21525885558583,
+ "grad_norm": 5.106618881225586,
+ "learning_rate": 1.357402445742222e-05,
+ "loss": 0.3415,
+ "step": 14759
+ },
+ {
+ "epoch": 40.217983651226156,
+ "grad_norm": 5.6757965087890625,
+ "learning_rate": 1.3573200237220951e-05,
+ "loss": 0.2629,
+ "step": 14760
+ },
+ {
+ "epoch": 40.22070844686648,
+ "grad_norm": 6.836151599884033,
+ "learning_rate": 1.3572375989191717e-05,
+ "loss": 0.2822,
+ "step": 14761
+ },
+ {
+ "epoch": 40.223433242506815,
+ "grad_norm": 4.928470134735107,
+ "learning_rate": 1.3571551713340931e-05,
+ "loss": 0.3333,
+ "step": 14762
+ },
+ {
+ "epoch": 40.22615803814714,
+ "grad_norm": 4.809662818908691,
+ "learning_rate": 1.3570727409675018e-05,
+ "loss": 0.1796,
+ "step": 14763
+ },
+ {
+ "epoch": 40.228882833787466,
+ "grad_norm": 6.912206172943115,
+ "learning_rate": 1.3569903078200393e-05,
+ "loss": 0.1788,
+ "step": 14764
+ },
+ {
+ "epoch": 40.23160762942779,
+ "grad_norm": 5.686048984527588,
+ "learning_rate": 1.3569078718923478e-05,
+ "loss": 0.1935,
+ "step": 14765
+ },
+ {
+ "epoch": 40.23433242506812,
+ "grad_norm": 6.835017681121826,
+ "learning_rate": 1.3568254331850693e-05,
+ "loss": 0.1676,
+ "step": 14766
+ },
+ {
+ "epoch": 40.237057220708444,
+ "grad_norm": 6.015300750732422,
+ "learning_rate": 1.3567429916988457e-05,
+ "loss": 0.2258,
+ "step": 14767
+ },
+ {
+ "epoch": 40.23978201634878,
+ "grad_norm": 26.15471076965332,
+ "learning_rate": 1.3566605474343192e-05,
+ "loss": 0.2457,
+ "step": 14768
+ },
+ {
+ "epoch": 40.2425068119891,
+ "grad_norm": 5.850229740142822,
+ "learning_rate": 1.3565781003921318e-05,
+ "loss": 0.2355,
+ "step": 14769
+ },
+ {
+ "epoch": 40.24523160762943,
+ "grad_norm": 4.393250942230225,
+ "learning_rate": 1.3564956505729259e-05,
+ "loss": 0.3133,
+ "step": 14770
+ },
+ {
+ "epoch": 40.247956403269754,
+ "grad_norm": 5.310056686401367,
+ "learning_rate": 1.356413197977343e-05,
+ "loss": 0.1958,
+ "step": 14771
+ },
+ {
+ "epoch": 40.25068119891008,
+ "grad_norm": 6.719603538513184,
+ "learning_rate": 1.3563307426060258e-05,
+ "loss": 0.2014,
+ "step": 14772
+ },
+ {
+ "epoch": 40.253405994550405,
+ "grad_norm": 6.757342338562012,
+ "learning_rate": 1.3562482844596164e-05,
+ "loss": 0.2555,
+ "step": 14773
+ },
+ {
+ "epoch": 40.25613079019074,
+ "grad_norm": 4.700272560119629,
+ "learning_rate": 1.3561658235387562e-05,
+ "loss": 0.3251,
+ "step": 14774
+ },
+ {
+ "epoch": 40.258855585831064,
+ "grad_norm": 5.600427150726318,
+ "learning_rate": 1.3560833598440887e-05,
+ "loss": 0.1668,
+ "step": 14775
+ },
+ {
+ "epoch": 40.26158038147139,
+ "grad_norm": 7.44266939163208,
+ "learning_rate": 1.3560008933762552e-05,
+ "loss": 0.2774,
+ "step": 14776
+ },
+ {
+ "epoch": 40.264305177111716,
+ "grad_norm": 4.850956916809082,
+ "learning_rate": 1.355918424135898e-05,
+ "loss": 0.2892,
+ "step": 14777
+ },
+ {
+ "epoch": 40.26702997275204,
+ "grad_norm": 4.869438648223877,
+ "learning_rate": 1.35583595212366e-05,
+ "loss": 0.5064,
+ "step": 14778
+ },
+ {
+ "epoch": 40.26975476839237,
+ "grad_norm": 6.677958011627197,
+ "learning_rate": 1.3557534773401827e-05,
+ "loss": 0.3253,
+ "step": 14779
+ },
+ {
+ "epoch": 40.2724795640327,
+ "grad_norm": 6.601706504821777,
+ "learning_rate": 1.355670999786109e-05,
+ "loss": 0.2698,
+ "step": 14780
+ },
+ {
+ "epoch": 40.275204359673026,
+ "grad_norm": 4.455941677093506,
+ "learning_rate": 1.3555885194620806e-05,
+ "loss": 0.2024,
+ "step": 14781
+ },
+ {
+ "epoch": 40.27792915531335,
+ "grad_norm": 4.924816131591797,
+ "learning_rate": 1.3555060363687407e-05,
+ "loss": 0.1795,
+ "step": 14782
+ },
+ {
+ "epoch": 40.28065395095368,
+ "grad_norm": 6.3266119956970215,
+ "learning_rate": 1.355423550506731e-05,
+ "loss": 0.2472,
+ "step": 14783
+ },
+ {
+ "epoch": 40.283378746594,
+ "grad_norm": 6.0468549728393555,
+ "learning_rate": 1.3553410618766942e-05,
+ "loss": 0.2499,
+ "step": 14784
+ },
+ {
+ "epoch": 40.28610354223433,
+ "grad_norm": 4.959547519683838,
+ "learning_rate": 1.3552585704792724e-05,
+ "loss": 0.1743,
+ "step": 14785
+ },
+ {
+ "epoch": 40.28882833787466,
+ "grad_norm": 5.919888496398926,
+ "learning_rate": 1.3551760763151087e-05,
+ "loss": 0.2734,
+ "step": 14786
+ },
+ {
+ "epoch": 40.29155313351499,
+ "grad_norm": 6.15693998336792,
+ "learning_rate": 1.355093579384845e-05,
+ "loss": 0.2804,
+ "step": 14787
+ },
+ {
+ "epoch": 40.294277929155314,
+ "grad_norm": 6.691210746765137,
+ "learning_rate": 1.3550110796891241e-05,
+ "loss": 0.2145,
+ "step": 14788
+ },
+ {
+ "epoch": 40.29700272479564,
+ "grad_norm": 5.143745422363281,
+ "learning_rate": 1.3549285772285881e-05,
+ "loss": 0.2393,
+ "step": 14789
+ },
+ {
+ "epoch": 40.299727520435965,
+ "grad_norm": 7.448602199554443,
+ "learning_rate": 1.3548460720038798e-05,
+ "loss": 0.3274,
+ "step": 14790
+ },
+ {
+ "epoch": 40.30245231607629,
+ "grad_norm": 5.299944877624512,
+ "learning_rate": 1.3547635640156415e-05,
+ "loss": 0.1837,
+ "step": 14791
+ },
+ {
+ "epoch": 40.305177111716624,
+ "grad_norm": 6.9879679679870605,
+ "learning_rate": 1.3546810532645166e-05,
+ "loss": 0.2359,
+ "step": 14792
+ },
+ {
+ "epoch": 40.30790190735695,
+ "grad_norm": 5.754627227783203,
+ "learning_rate": 1.3545985397511464e-05,
+ "loss": 0.1475,
+ "step": 14793
+ },
+ {
+ "epoch": 40.310626702997276,
+ "grad_norm": 5.53333854675293,
+ "learning_rate": 1.3545160234761745e-05,
+ "loss": 0.1715,
+ "step": 14794
+ },
+ {
+ "epoch": 40.3133514986376,
+ "grad_norm": 7.198060989379883,
+ "learning_rate": 1.354433504440243e-05,
+ "loss": 0.2008,
+ "step": 14795
+ },
+ {
+ "epoch": 40.31607629427793,
+ "grad_norm": 6.643033027648926,
+ "learning_rate": 1.3543509826439951e-05,
+ "loss": 0.2318,
+ "step": 14796
+ },
+ {
+ "epoch": 40.31880108991825,
+ "grad_norm": 6.457057476043701,
+ "learning_rate": 1.3542684580880729e-05,
+ "loss": 0.3141,
+ "step": 14797
+ },
+ {
+ "epoch": 40.321525885558586,
+ "grad_norm": 5.512293815612793,
+ "learning_rate": 1.3541859307731198e-05,
+ "loss": 0.3023,
+ "step": 14798
+ },
+ {
+ "epoch": 40.32425068119891,
+ "grad_norm": 5.504129886627197,
+ "learning_rate": 1.3541034006997776e-05,
+ "loss": 0.1915,
+ "step": 14799
+ },
+ {
+ "epoch": 40.32697547683924,
+ "grad_norm": 6.146503925323486,
+ "learning_rate": 1.3540208678686897e-05,
+ "loss": 0.2172,
+ "step": 14800
+ },
+ {
+ "epoch": 40.32970027247956,
+ "grad_norm": 5.390168190002441,
+ "learning_rate": 1.3539383322804986e-05,
+ "loss": 0.1998,
+ "step": 14801
+ },
+ {
+ "epoch": 40.33242506811989,
+ "grad_norm": 5.944275379180908,
+ "learning_rate": 1.353855793935847e-05,
+ "loss": 0.3185,
+ "step": 14802
+ },
+ {
+ "epoch": 40.335149863760215,
+ "grad_norm": 6.440017223358154,
+ "learning_rate": 1.353773252835378e-05,
+ "loss": 0.245,
+ "step": 14803
+ },
+ {
+ "epoch": 40.33787465940055,
+ "grad_norm": 5.658210277557373,
+ "learning_rate": 1.3536907089797344e-05,
+ "loss": 0.1766,
+ "step": 14804
+ },
+ {
+ "epoch": 40.34059945504087,
+ "grad_norm": 6.608595371246338,
+ "learning_rate": 1.3536081623695588e-05,
+ "loss": 0.2682,
+ "step": 14805
+ },
+ {
+ "epoch": 40.3433242506812,
+ "grad_norm": 7.2391510009765625,
+ "learning_rate": 1.3535256130054943e-05,
+ "loss": 0.3797,
+ "step": 14806
+ },
+ {
+ "epoch": 40.346049046321525,
+ "grad_norm": 8.538012504577637,
+ "learning_rate": 1.3534430608881837e-05,
+ "loss": 0.229,
+ "step": 14807
+ },
+ {
+ "epoch": 40.34877384196185,
+ "grad_norm": 5.476230621337891,
+ "learning_rate": 1.35336050601827e-05,
+ "loss": 0.2702,
+ "step": 14808
+ },
+ {
+ "epoch": 40.35149863760218,
+ "grad_norm": 4.536299228668213,
+ "learning_rate": 1.353277948396396e-05,
+ "loss": 0.1606,
+ "step": 14809
+ },
+ {
+ "epoch": 40.35422343324251,
+ "grad_norm": 5.5461320877075195,
+ "learning_rate": 1.3531953880232044e-05,
+ "loss": 0.375,
+ "step": 14810
+ },
+ {
+ "epoch": 40.356948228882835,
+ "grad_norm": 5.543405532836914,
+ "learning_rate": 1.3531128248993388e-05,
+ "loss": 0.1926,
+ "step": 14811
+ },
+ {
+ "epoch": 40.35967302452316,
+ "grad_norm": 4.79237174987793,
+ "learning_rate": 1.353030259025442e-05,
+ "loss": 0.232,
+ "step": 14812
+ },
+ {
+ "epoch": 40.36239782016349,
+ "grad_norm": 4.4786200523376465,
+ "learning_rate": 1.3529476904021565e-05,
+ "loss": 0.1896,
+ "step": 14813
+ },
+ {
+ "epoch": 40.36512261580381,
+ "grad_norm": 5.660500526428223,
+ "learning_rate": 1.3528651190301263e-05,
+ "loss": 0.1839,
+ "step": 14814
+ },
+ {
+ "epoch": 40.36784741144414,
+ "grad_norm": 6.6640520095825195,
+ "learning_rate": 1.3527825449099936e-05,
+ "loss": 0.3246,
+ "step": 14815
+ },
+ {
+ "epoch": 40.37057220708447,
+ "grad_norm": 4.925924777984619,
+ "learning_rate": 1.3526999680424018e-05,
+ "loss": 0.2152,
+ "step": 14816
+ },
+ {
+ "epoch": 40.3732970027248,
+ "grad_norm": 6.950525283813477,
+ "learning_rate": 1.352617388427994e-05,
+ "loss": 0.188,
+ "step": 14817
+ },
+ {
+ "epoch": 40.37602179836512,
+ "grad_norm": 6.052989482879639,
+ "learning_rate": 1.3525348060674133e-05,
+ "loss": 0.2143,
+ "step": 14818
+ },
+ {
+ "epoch": 40.37874659400545,
+ "grad_norm": 5.452238082885742,
+ "learning_rate": 1.3524522209613027e-05,
+ "loss": 0.3057,
+ "step": 14819
+ },
+ {
+ "epoch": 40.381471389645775,
+ "grad_norm": 6.343240737915039,
+ "learning_rate": 1.3523696331103058e-05,
+ "loss": 0.2796,
+ "step": 14820
+ },
+ {
+ "epoch": 40.3841961852861,
+ "grad_norm": 4.896117687225342,
+ "learning_rate": 1.3522870425150654e-05,
+ "loss": 0.3237,
+ "step": 14821
+ },
+ {
+ "epoch": 40.38692098092643,
+ "grad_norm": 6.452795505523682,
+ "learning_rate": 1.3522044491762253e-05,
+ "loss": 0.2743,
+ "step": 14822
+ },
+ {
+ "epoch": 40.38964577656676,
+ "grad_norm": 8.737284660339355,
+ "learning_rate": 1.3521218530944276e-05,
+ "loss": 0.3762,
+ "step": 14823
+ },
+ {
+ "epoch": 40.392370572207085,
+ "grad_norm": 7.082198143005371,
+ "learning_rate": 1.3520392542703167e-05,
+ "loss": 0.3012,
+ "step": 14824
+ },
+ {
+ "epoch": 40.39509536784741,
+ "grad_norm": 6.1143879890441895,
+ "learning_rate": 1.3519566527045354e-05,
+ "loss": 0.1956,
+ "step": 14825
+ },
+ {
+ "epoch": 40.39782016348774,
+ "grad_norm": 8.48856258392334,
+ "learning_rate": 1.3518740483977268e-05,
+ "loss": 0.2278,
+ "step": 14826
+ },
+ {
+ "epoch": 40.40054495912806,
+ "grad_norm": 4.892963886260986,
+ "learning_rate": 1.3517914413505344e-05,
+ "loss": 0.2896,
+ "step": 14827
+ },
+ {
+ "epoch": 40.403269754768395,
+ "grad_norm": 5.718017101287842,
+ "learning_rate": 1.3517088315636018e-05,
+ "loss": 0.1962,
+ "step": 14828
+ },
+ {
+ "epoch": 40.40599455040872,
+ "grad_norm": 6.417229652404785,
+ "learning_rate": 1.351626219037572e-05,
+ "loss": 0.4118,
+ "step": 14829
+ },
+ {
+ "epoch": 40.40871934604905,
+ "grad_norm": 7.505584716796875,
+ "learning_rate": 1.3515436037730887e-05,
+ "loss": 0.2588,
+ "step": 14830
+ },
+ {
+ "epoch": 40.41144414168937,
+ "grad_norm": 5.5002264976501465,
+ "learning_rate": 1.3514609857707948e-05,
+ "loss": 0.1766,
+ "step": 14831
+ },
+ {
+ "epoch": 40.4141689373297,
+ "grad_norm": 5.516236305236816,
+ "learning_rate": 1.3513783650313346e-05,
+ "loss": 0.1651,
+ "step": 14832
+ },
+ {
+ "epoch": 40.416893732970024,
+ "grad_norm": 6.154860496520996,
+ "learning_rate": 1.3512957415553505e-05,
+ "loss": 0.2749,
+ "step": 14833
+ },
+ {
+ "epoch": 40.41961852861036,
+ "grad_norm": 6.072230339050293,
+ "learning_rate": 1.3512131153434867e-05,
+ "loss": 0.2501,
+ "step": 14834
+ },
+ {
+ "epoch": 40.42234332425068,
+ "grad_norm": 5.330625534057617,
+ "learning_rate": 1.3511304863963863e-05,
+ "loss": 0.2563,
+ "step": 14835
+ },
+ {
+ "epoch": 40.42506811989101,
+ "grad_norm": 4.895598888397217,
+ "learning_rate": 1.351047854714693e-05,
+ "loss": 0.1862,
+ "step": 14836
+ },
+ {
+ "epoch": 40.427792915531334,
+ "grad_norm": 5.669843673706055,
+ "learning_rate": 1.3509652202990501e-05,
+ "loss": 0.1945,
+ "step": 14837
+ },
+ {
+ "epoch": 40.43051771117166,
+ "grad_norm": 7.436789512634277,
+ "learning_rate": 1.350882583150102e-05,
+ "loss": 0.3026,
+ "step": 14838
+ },
+ {
+ "epoch": 40.433242506811986,
+ "grad_norm": 5.909114360809326,
+ "learning_rate": 1.3507999432684911e-05,
+ "loss": 0.2505,
+ "step": 14839
+ },
+ {
+ "epoch": 40.43596730245232,
+ "grad_norm": 5.152442455291748,
+ "learning_rate": 1.350717300654862e-05,
+ "loss": 0.2828,
+ "step": 14840
+ },
+ {
+ "epoch": 40.438692098092645,
+ "grad_norm": 5.967596530914307,
+ "learning_rate": 1.3506346553098573e-05,
+ "loss": 0.2723,
+ "step": 14841
+ },
+ {
+ "epoch": 40.44141689373297,
+ "grad_norm": 5.889393329620361,
+ "learning_rate": 1.3505520072341216e-05,
+ "loss": 0.1981,
+ "step": 14842
+ },
+ {
+ "epoch": 40.444141689373296,
+ "grad_norm": 5.980917930603027,
+ "learning_rate": 1.3504693564282977e-05,
+ "loss": 0.3313,
+ "step": 14843
+ },
+ {
+ "epoch": 40.44686648501362,
+ "grad_norm": 5.2491559982299805,
+ "learning_rate": 1.3503867028930305e-05,
+ "loss": 0.1679,
+ "step": 14844
+ },
+ {
+ "epoch": 40.44959128065395,
+ "grad_norm": 5.511984825134277,
+ "learning_rate": 1.350304046628962e-05,
+ "loss": 0.1712,
+ "step": 14845
+ },
+ {
+ "epoch": 40.45231607629428,
+ "grad_norm": 5.705016136169434,
+ "learning_rate": 1.3502213876367373e-05,
+ "loss": 0.2663,
+ "step": 14846
+ },
+ {
+ "epoch": 40.45504087193461,
+ "grad_norm": 5.521117687225342,
+ "learning_rate": 1.3501387259169998e-05,
+ "loss": 0.2274,
+ "step": 14847
+ },
+ {
+ "epoch": 40.45776566757493,
+ "grad_norm": 5.227612495422363,
+ "learning_rate": 1.3500560614703932e-05,
+ "loss": 0.2319,
+ "step": 14848
+ },
+ {
+ "epoch": 40.46049046321526,
+ "grad_norm": 5.669434547424316,
+ "learning_rate": 1.3499733942975611e-05,
+ "loss": 0.2661,
+ "step": 14849
+ },
+ {
+ "epoch": 40.463215258855584,
+ "grad_norm": 5.9248175621032715,
+ "learning_rate": 1.3498907243991477e-05,
+ "loss": 0.1756,
+ "step": 14850
+ },
+ {
+ "epoch": 40.46594005449591,
+ "grad_norm": 5.283051490783691,
+ "learning_rate": 1.3498080517757961e-05,
+ "loss": 0.3733,
+ "step": 14851
+ },
+ {
+ "epoch": 40.46866485013624,
+ "grad_norm": 4.850691795349121,
+ "learning_rate": 1.3497253764281513e-05,
+ "loss": 0.166,
+ "step": 14852
+ },
+ {
+ "epoch": 40.47138964577657,
+ "grad_norm": 5.2142791748046875,
+ "learning_rate": 1.3496426983568561e-05,
+ "loss": 0.1824,
+ "step": 14853
+ },
+ {
+ "epoch": 40.474114441416894,
+ "grad_norm": 4.949707508087158,
+ "learning_rate": 1.3495600175625548e-05,
+ "loss": 0.2636,
+ "step": 14854
+ },
+ {
+ "epoch": 40.47683923705722,
+ "grad_norm": 6.136460304260254,
+ "learning_rate": 1.3494773340458916e-05,
+ "loss": 0.2619,
+ "step": 14855
+ },
+ {
+ "epoch": 40.479564032697546,
+ "grad_norm": 5.417229175567627,
+ "learning_rate": 1.34939464780751e-05,
+ "loss": 0.2144,
+ "step": 14856
+ },
+ {
+ "epoch": 40.48228882833787,
+ "grad_norm": 6.840548992156982,
+ "learning_rate": 1.3493119588480541e-05,
+ "loss": 0.4061,
+ "step": 14857
+ },
+ {
+ "epoch": 40.485013623978205,
+ "grad_norm": 7.138721942901611,
+ "learning_rate": 1.349229267168168e-05,
+ "loss": 0.2626,
+ "step": 14858
+ },
+ {
+ "epoch": 40.48773841961853,
+ "grad_norm": 7.157942295074463,
+ "learning_rate": 1.3491465727684953e-05,
+ "loss": 0.3388,
+ "step": 14859
+ },
+ {
+ "epoch": 40.490463215258856,
+ "grad_norm": 6.756263732910156,
+ "learning_rate": 1.3490638756496807e-05,
+ "loss": 0.2513,
+ "step": 14860
+ },
+ {
+ "epoch": 40.49318801089918,
+ "grad_norm": 7.291346073150635,
+ "learning_rate": 1.348981175812368e-05,
+ "loss": 0.2314,
+ "step": 14861
+ },
+ {
+ "epoch": 40.49591280653951,
+ "grad_norm": 5.688564300537109,
+ "learning_rate": 1.3488984732572006e-05,
+ "loss": 0.1974,
+ "step": 14862
+ },
+ {
+ "epoch": 40.49863760217983,
+ "grad_norm": 6.727434158325195,
+ "learning_rate": 1.3488157679848235e-05,
+ "loss": 0.2977,
+ "step": 14863
+ },
+ {
+ "epoch": 40.50136239782017,
+ "grad_norm": 4.9347968101501465,
+ "learning_rate": 1.3487330599958802e-05,
+ "loss": 0.2374,
+ "step": 14864
+ },
+ {
+ "epoch": 40.50408719346049,
+ "grad_norm": 5.227428436279297,
+ "learning_rate": 1.3486503492910155e-05,
+ "loss": 0.2063,
+ "step": 14865
+ },
+ {
+ "epoch": 40.50681198910082,
+ "grad_norm": 7.073912143707275,
+ "learning_rate": 1.3485676358708725e-05,
+ "loss": 0.2745,
+ "step": 14866
+ },
+ {
+ "epoch": 40.509536784741144,
+ "grad_norm": 8.08021068572998,
+ "learning_rate": 1.3484849197360964e-05,
+ "loss": 0.1532,
+ "step": 14867
+ },
+ {
+ "epoch": 40.51226158038147,
+ "grad_norm": 5.847911834716797,
+ "learning_rate": 1.348402200887331e-05,
+ "loss": 0.3067,
+ "step": 14868
+ },
+ {
+ "epoch": 40.514986376021795,
+ "grad_norm": 5.258172035217285,
+ "learning_rate": 1.3483194793252202e-05,
+ "loss": 0.3422,
+ "step": 14869
+ },
+ {
+ "epoch": 40.51771117166213,
+ "grad_norm": 5.617648124694824,
+ "learning_rate": 1.3482367550504085e-05,
+ "loss": 0.1506,
+ "step": 14870
+ },
+ {
+ "epoch": 40.520435967302454,
+ "grad_norm": 5.911000728607178,
+ "learning_rate": 1.3481540280635403e-05,
+ "loss": 0.3285,
+ "step": 14871
+ },
+ {
+ "epoch": 40.52316076294278,
+ "grad_norm": 7.393513202667236,
+ "learning_rate": 1.3480712983652598e-05,
+ "loss": 0.2773,
+ "step": 14872
+ },
+ {
+ "epoch": 40.525885558583106,
+ "grad_norm": 5.925257682800293,
+ "learning_rate": 1.3479885659562111e-05,
+ "loss": 0.2323,
+ "step": 14873
+ },
+ {
+ "epoch": 40.52861035422343,
+ "grad_norm": 5.522267818450928,
+ "learning_rate": 1.3479058308370386e-05,
+ "loss": 0.33,
+ "step": 14874
+ },
+ {
+ "epoch": 40.53133514986376,
+ "grad_norm": 5.7643256187438965,
+ "learning_rate": 1.3478230930083868e-05,
+ "loss": 0.2511,
+ "step": 14875
+ },
+ {
+ "epoch": 40.53405994550409,
+ "grad_norm": 6.358617782592773,
+ "learning_rate": 1.3477403524708998e-05,
+ "loss": 0.229,
+ "step": 14876
+ },
+ {
+ "epoch": 40.536784741144416,
+ "grad_norm": 5.766740798950195,
+ "learning_rate": 1.3476576092252225e-05,
+ "loss": 0.2071,
+ "step": 14877
+ },
+ {
+ "epoch": 40.53950953678474,
+ "grad_norm": 4.795498847961426,
+ "learning_rate": 1.3475748632719985e-05,
+ "loss": 0.2402,
+ "step": 14878
+ },
+ {
+ "epoch": 40.54223433242507,
+ "grad_norm": 6.2379350662231445,
+ "learning_rate": 1.3474921146118728e-05,
+ "loss": 0.2724,
+ "step": 14879
+ },
+ {
+ "epoch": 40.54495912806539,
+ "grad_norm": 4.677596092224121,
+ "learning_rate": 1.3474093632454897e-05,
+ "loss": 0.2636,
+ "step": 14880
+ },
+ {
+ "epoch": 40.54768392370572,
+ "grad_norm": 5.005476951599121,
+ "learning_rate": 1.3473266091734938e-05,
+ "loss": 0.3155,
+ "step": 14881
+ },
+ {
+ "epoch": 40.55040871934605,
+ "grad_norm": 6.714357376098633,
+ "learning_rate": 1.3472438523965292e-05,
+ "loss": 0.2178,
+ "step": 14882
+ },
+ {
+ "epoch": 40.55313351498638,
+ "grad_norm": 10.46469497680664,
+ "learning_rate": 1.3471610929152408e-05,
+ "loss": 0.4024,
+ "step": 14883
+ },
+ {
+ "epoch": 40.555858310626704,
+ "grad_norm": 7.666954517364502,
+ "learning_rate": 1.3470783307302728e-05,
+ "loss": 0.2054,
+ "step": 14884
+ },
+ {
+ "epoch": 40.55858310626703,
+ "grad_norm": 6.6751179695129395,
+ "learning_rate": 1.3469955658422701e-05,
+ "loss": 0.3029,
+ "step": 14885
+ },
+ {
+ "epoch": 40.561307901907355,
+ "grad_norm": 5.923067092895508,
+ "learning_rate": 1.3469127982518773e-05,
+ "loss": 0.2173,
+ "step": 14886
+ },
+ {
+ "epoch": 40.56403269754768,
+ "grad_norm": 7.947319507598877,
+ "learning_rate": 1.3468300279597386e-05,
+ "loss": 0.2964,
+ "step": 14887
+ },
+ {
+ "epoch": 40.566757493188014,
+ "grad_norm": 5.859461307525635,
+ "learning_rate": 1.3467472549664983e-05,
+ "loss": 0.2649,
+ "step": 14888
+ },
+ {
+ "epoch": 40.56948228882834,
+ "grad_norm": 6.946326732635498,
+ "learning_rate": 1.3466644792728023e-05,
+ "loss": 0.2178,
+ "step": 14889
+ },
+ {
+ "epoch": 40.572207084468666,
+ "grad_norm": 5.288938999176025,
+ "learning_rate": 1.3465817008792943e-05,
+ "loss": 0.1667,
+ "step": 14890
+ },
+ {
+ "epoch": 40.57493188010899,
+ "grad_norm": 10.767555236816406,
+ "learning_rate": 1.3464989197866192e-05,
+ "loss": 0.3047,
+ "step": 14891
+ },
+ {
+ "epoch": 40.57765667574932,
+ "grad_norm": 5.773517608642578,
+ "learning_rate": 1.3464161359954214e-05,
+ "loss": 0.2887,
+ "step": 14892
+ },
+ {
+ "epoch": 40.58038147138964,
+ "grad_norm": 8.373126029968262,
+ "learning_rate": 1.3463333495063462e-05,
+ "loss": 0.2623,
+ "step": 14893
+ },
+ {
+ "epoch": 40.583106267029976,
+ "grad_norm": 6.424461841583252,
+ "learning_rate": 1.3462505603200377e-05,
+ "loss": 0.2723,
+ "step": 14894
+ },
+ {
+ "epoch": 40.5858310626703,
+ "grad_norm": 7.6376118659973145,
+ "learning_rate": 1.3461677684371412e-05,
+ "loss": 0.3219,
+ "step": 14895
+ },
+ {
+ "epoch": 40.58855585831063,
+ "grad_norm": 5.907564640045166,
+ "learning_rate": 1.346084973858301e-05,
+ "loss": 0.2069,
+ "step": 14896
+ },
+ {
+ "epoch": 40.59128065395095,
+ "grad_norm": 5.691221714019775,
+ "learning_rate": 1.3460021765841625e-05,
+ "loss": 0.198,
+ "step": 14897
+ },
+ {
+ "epoch": 40.59400544959128,
+ "grad_norm": 5.604295253753662,
+ "learning_rate": 1.34591937661537e-05,
+ "loss": 0.2034,
+ "step": 14898
+ },
+ {
+ "epoch": 40.596730245231605,
+ "grad_norm": 4.799344062805176,
+ "learning_rate": 1.3458365739525685e-05,
+ "loss": 0.203,
+ "step": 14899
+ },
+ {
+ "epoch": 40.59945504087194,
+ "grad_norm": 5.533874988555908,
+ "learning_rate": 1.3457537685964029e-05,
+ "loss": 0.3049,
+ "step": 14900
+ },
+ {
+ "epoch": 40.60217983651226,
+ "grad_norm": 6.924694061279297,
+ "learning_rate": 1.3456709605475182e-05,
+ "loss": 0.2093,
+ "step": 14901
+ },
+ {
+ "epoch": 40.60490463215259,
+ "grad_norm": 5.239685535430908,
+ "learning_rate": 1.345588149806559e-05,
+ "loss": 0.2447,
+ "step": 14902
+ },
+ {
+ "epoch": 40.607629427792915,
+ "grad_norm": 5.3831095695495605,
+ "learning_rate": 1.3455053363741708e-05,
+ "loss": 0.1792,
+ "step": 14903
+ },
+ {
+ "epoch": 40.61035422343324,
+ "grad_norm": 6.45353889465332,
+ "learning_rate": 1.3454225202509978e-05,
+ "loss": 0.3018,
+ "step": 14904
+ },
+ {
+ "epoch": 40.61307901907357,
+ "grad_norm": 5.3861212730407715,
+ "learning_rate": 1.3453397014376854e-05,
+ "loss": 0.2651,
+ "step": 14905
+ },
+ {
+ "epoch": 40.6158038147139,
+ "grad_norm": 5.265120983123779,
+ "learning_rate": 1.3452568799348783e-05,
+ "loss": 0.2325,
+ "step": 14906
+ },
+ {
+ "epoch": 40.618528610354225,
+ "grad_norm": 8.889595985412598,
+ "learning_rate": 1.3451740557432223e-05,
+ "loss": 0.2323,
+ "step": 14907
+ },
+ {
+ "epoch": 40.62125340599455,
+ "grad_norm": 5.120465278625488,
+ "learning_rate": 1.3450912288633614e-05,
+ "loss": 0.2641,
+ "step": 14908
+ },
+ {
+ "epoch": 40.62397820163488,
+ "grad_norm": 6.105363368988037,
+ "learning_rate": 1.3450083992959413e-05,
+ "loss": 0.1906,
+ "step": 14909
+ },
+ {
+ "epoch": 40.6267029972752,
+ "grad_norm": 9.551621437072754,
+ "learning_rate": 1.3449255670416068e-05,
+ "loss": 0.3251,
+ "step": 14910
+ },
+ {
+ "epoch": 40.62942779291553,
+ "grad_norm": 6.234216690063477,
+ "learning_rate": 1.3448427321010034e-05,
+ "loss": 0.2052,
+ "step": 14911
+ },
+ {
+ "epoch": 40.63215258855586,
+ "grad_norm": 5.134133815765381,
+ "learning_rate": 1.3447598944747755e-05,
+ "loss": 0.1361,
+ "step": 14912
+ },
+ {
+ "epoch": 40.63487738419619,
+ "grad_norm": 6.906923770904541,
+ "learning_rate": 1.3446770541635687e-05,
+ "loss": 0.2399,
+ "step": 14913
+ },
+ {
+ "epoch": 40.63760217983651,
+ "grad_norm": 5.535183429718018,
+ "learning_rate": 1.3445942111680279e-05,
+ "loss": 0.2268,
+ "step": 14914
+ },
+ {
+ "epoch": 40.64032697547684,
+ "grad_norm": 6.394478797912598,
+ "learning_rate": 1.3445113654887992e-05,
+ "loss": 0.2457,
+ "step": 14915
+ },
+ {
+ "epoch": 40.643051771117165,
+ "grad_norm": 4.879506587982178,
+ "learning_rate": 1.3444285171265263e-05,
+ "loss": 0.1335,
+ "step": 14916
+ },
+ {
+ "epoch": 40.64577656675749,
+ "grad_norm": 5.884253978729248,
+ "learning_rate": 1.3443456660818557e-05,
+ "loss": 0.2834,
+ "step": 14917
+ },
+ {
+ "epoch": 40.64850136239782,
+ "grad_norm": 4.804670333862305,
+ "learning_rate": 1.3442628123554318e-05,
+ "loss": 0.2397,
+ "step": 14918
+ },
+ {
+ "epoch": 40.65122615803815,
+ "grad_norm": 5.187518119812012,
+ "learning_rate": 1.3441799559479005e-05,
+ "loss": 0.2859,
+ "step": 14919
+ },
+ {
+ "epoch": 40.653950953678475,
+ "grad_norm": 4.903922080993652,
+ "learning_rate": 1.3440970968599065e-05,
+ "loss": 0.1925,
+ "step": 14920
+ },
+ {
+ "epoch": 40.6566757493188,
+ "grad_norm": 5.095132350921631,
+ "learning_rate": 1.3440142350920958e-05,
+ "loss": 0.2361,
+ "step": 14921
+ },
+ {
+ "epoch": 40.65940054495913,
+ "grad_norm": 5.3817901611328125,
+ "learning_rate": 1.3439313706451125e-05,
+ "loss": 0.226,
+ "step": 14922
+ },
+ {
+ "epoch": 40.66212534059945,
+ "grad_norm": 5.576498508453369,
+ "learning_rate": 1.3438485035196034e-05,
+ "loss": 0.2948,
+ "step": 14923
+ },
+ {
+ "epoch": 40.664850136239785,
+ "grad_norm": 5.794294357299805,
+ "learning_rate": 1.343765633716213e-05,
+ "loss": 0.1942,
+ "step": 14924
+ },
+ {
+ "epoch": 40.66757493188011,
+ "grad_norm": 4.943784713745117,
+ "learning_rate": 1.3436827612355871e-05,
+ "loss": 0.2043,
+ "step": 14925
+ },
+ {
+ "epoch": 40.67029972752044,
+ "grad_norm": 5.971388816833496,
+ "learning_rate": 1.3435998860783708e-05,
+ "loss": 0.2005,
+ "step": 14926
+ },
+ {
+ "epoch": 40.67302452316076,
+ "grad_norm": 5.976658821105957,
+ "learning_rate": 1.3435170082452097e-05,
+ "loss": 0.2635,
+ "step": 14927
+ },
+ {
+ "epoch": 40.67574931880109,
+ "grad_norm": 5.012649059295654,
+ "learning_rate": 1.3434341277367491e-05,
+ "loss": 0.3775,
+ "step": 14928
+ },
+ {
+ "epoch": 40.678474114441414,
+ "grad_norm": 4.810773849487305,
+ "learning_rate": 1.343351244553635e-05,
+ "loss": 0.2225,
+ "step": 14929
+ },
+ {
+ "epoch": 40.68119891008175,
+ "grad_norm": 5.172163963317871,
+ "learning_rate": 1.343268358696512e-05,
+ "loss": 0.2724,
+ "step": 14930
+ },
+ {
+ "epoch": 40.68392370572207,
+ "grad_norm": 5.959063529968262,
+ "learning_rate": 1.3431854701660259e-05,
+ "loss": 0.2525,
+ "step": 14931
+ },
+ {
+ "epoch": 40.6866485013624,
+ "grad_norm": 5.518011569976807,
+ "learning_rate": 1.3431025789628227e-05,
+ "loss": 0.2462,
+ "step": 14932
+ },
+ {
+ "epoch": 40.689373297002724,
+ "grad_norm": 5.654611110687256,
+ "learning_rate": 1.3430196850875476e-05,
+ "loss": 0.2591,
+ "step": 14933
+ },
+ {
+ "epoch": 40.69209809264305,
+ "grad_norm": 5.825628280639648,
+ "learning_rate": 1.3429367885408461e-05,
+ "loss": 0.216,
+ "step": 14934
+ },
+ {
+ "epoch": 40.694822888283376,
+ "grad_norm": 5.7777886390686035,
+ "learning_rate": 1.3428538893233642e-05,
+ "loss": 0.3862,
+ "step": 14935
+ },
+ {
+ "epoch": 40.69754768392371,
+ "grad_norm": 5.627559661865234,
+ "learning_rate": 1.3427709874357471e-05,
+ "loss": 0.2041,
+ "step": 14936
+ },
+ {
+ "epoch": 40.700272479564035,
+ "grad_norm": 5.278099060058594,
+ "learning_rate": 1.3426880828786408e-05,
+ "loss": 0.2989,
+ "step": 14937
+ },
+ {
+ "epoch": 40.70299727520436,
+ "grad_norm": 4.595234394073486,
+ "learning_rate": 1.3426051756526905e-05,
+ "loss": 0.3122,
+ "step": 14938
+ },
+ {
+ "epoch": 40.705722070844686,
+ "grad_norm": 5.167964935302734,
+ "learning_rate": 1.342522265758542e-05,
+ "loss": 0.278,
+ "step": 14939
+ },
+ {
+ "epoch": 40.70844686648501,
+ "grad_norm": 6.490757465362549,
+ "learning_rate": 1.3424393531968415e-05,
+ "loss": 0.3191,
+ "step": 14940
+ },
+ {
+ "epoch": 40.71117166212534,
+ "grad_norm": 5.710482120513916,
+ "learning_rate": 1.3423564379682339e-05,
+ "loss": 0.4288,
+ "step": 14941
+ },
+ {
+ "epoch": 40.71389645776567,
+ "grad_norm": 5.107451438903809,
+ "learning_rate": 1.342273520073366e-05,
+ "loss": 0.3045,
+ "step": 14942
+ },
+ {
+ "epoch": 40.716621253406,
+ "grad_norm": 6.680281639099121,
+ "learning_rate": 1.3421905995128821e-05,
+ "loss": 0.1385,
+ "step": 14943
+ },
+ {
+ "epoch": 40.71934604904632,
+ "grad_norm": 6.430998802185059,
+ "learning_rate": 1.3421076762874295e-05,
+ "loss": 0.2798,
+ "step": 14944
+ },
+ {
+ "epoch": 40.72207084468665,
+ "grad_norm": 5.79957389831543,
+ "learning_rate": 1.3420247503976529e-05,
+ "loss": 0.3243,
+ "step": 14945
+ },
+ {
+ "epoch": 40.724795640326974,
+ "grad_norm": 5.468590259552002,
+ "learning_rate": 1.3419418218441989e-05,
+ "loss": 0.3202,
+ "step": 14946
+ },
+ {
+ "epoch": 40.7275204359673,
+ "grad_norm": 4.622290134429932,
+ "learning_rate": 1.3418588906277128e-05,
+ "loss": 0.1476,
+ "step": 14947
+ },
+ {
+ "epoch": 40.73024523160763,
+ "grad_norm": 4.551146030426025,
+ "learning_rate": 1.3417759567488407e-05,
+ "loss": 0.2247,
+ "step": 14948
+ },
+ {
+ "epoch": 40.73297002724796,
+ "grad_norm": 5.9461774826049805,
+ "learning_rate": 1.3416930202082284e-05,
+ "loss": 0.3004,
+ "step": 14949
+ },
+ {
+ "epoch": 40.735694822888284,
+ "grad_norm": 5.845150470733643,
+ "learning_rate": 1.341610081006522e-05,
+ "loss": 0.2999,
+ "step": 14950
+ },
+ {
+ "epoch": 40.73841961852861,
+ "grad_norm": 4.415715217590332,
+ "learning_rate": 1.341527139144367e-05,
+ "loss": 0.1576,
+ "step": 14951
+ },
+ {
+ "epoch": 40.741144414168936,
+ "grad_norm": 5.789761066436768,
+ "learning_rate": 1.3414441946224099e-05,
+ "loss": 0.286,
+ "step": 14952
+ },
+ {
+ "epoch": 40.74386920980926,
+ "grad_norm": 5.601269721984863,
+ "learning_rate": 1.3413612474412965e-05,
+ "loss": 0.1891,
+ "step": 14953
+ },
+ {
+ "epoch": 40.746594005449595,
+ "grad_norm": 6.888553142547607,
+ "learning_rate": 1.3412782976016724e-05,
+ "loss": 0.2617,
+ "step": 14954
+ },
+ {
+ "epoch": 40.74931880108992,
+ "grad_norm": 5.94119119644165,
+ "learning_rate": 1.3411953451041839e-05,
+ "loss": 0.2158,
+ "step": 14955
+ },
+ {
+ "epoch": 40.752043596730246,
+ "grad_norm": 9.400856971740723,
+ "learning_rate": 1.3411123899494772e-05,
+ "loss": 0.229,
+ "step": 14956
+ },
+ {
+ "epoch": 40.75476839237057,
+ "grad_norm": 8.853175163269043,
+ "learning_rate": 1.341029432138198e-05,
+ "loss": 0.4265,
+ "step": 14957
+ },
+ {
+ "epoch": 40.7574931880109,
+ "grad_norm": 6.882060527801514,
+ "learning_rate": 1.3409464716709928e-05,
+ "loss": 0.2463,
+ "step": 14958
+ },
+ {
+ "epoch": 40.76021798365122,
+ "grad_norm": 5.097872257232666,
+ "learning_rate": 1.3408635085485074e-05,
+ "loss": 0.1524,
+ "step": 14959
+ },
+ {
+ "epoch": 40.762942779291556,
+ "grad_norm": 5.943040370941162,
+ "learning_rate": 1.340780542771388e-05,
+ "loss": 0.4234,
+ "step": 14960
+ },
+ {
+ "epoch": 40.76566757493188,
+ "grad_norm": 7.117913246154785,
+ "learning_rate": 1.3406975743402805e-05,
+ "loss": 0.2,
+ "step": 14961
+ },
+ {
+ "epoch": 40.76839237057221,
+ "grad_norm": 7.399886131286621,
+ "learning_rate": 1.3406146032558316e-05,
+ "loss": 0.3461,
+ "step": 14962
+ },
+ {
+ "epoch": 40.771117166212534,
+ "grad_norm": 5.474939823150635,
+ "learning_rate": 1.3405316295186868e-05,
+ "loss": 0.218,
+ "step": 14963
+ },
+ {
+ "epoch": 40.77384196185286,
+ "grad_norm": 4.896245956420898,
+ "learning_rate": 1.3404486531294926e-05,
+ "loss": 0.168,
+ "step": 14964
+ },
+ {
+ "epoch": 40.776566757493185,
+ "grad_norm": 6.233972549438477,
+ "learning_rate": 1.3403656740888953e-05,
+ "loss": 0.252,
+ "step": 14965
+ },
+ {
+ "epoch": 40.77929155313352,
+ "grad_norm": 5.181840419769287,
+ "learning_rate": 1.3402826923975414e-05,
+ "loss": 0.1587,
+ "step": 14966
+ },
+ {
+ "epoch": 40.782016348773844,
+ "grad_norm": 6.172066688537598,
+ "learning_rate": 1.3401997080560765e-05,
+ "loss": 0.1852,
+ "step": 14967
+ },
+ {
+ "epoch": 40.78474114441417,
+ "grad_norm": 5.824451446533203,
+ "learning_rate": 1.3401167210651474e-05,
+ "loss": 0.2186,
+ "step": 14968
+ },
+ {
+ "epoch": 40.787465940054496,
+ "grad_norm": 5.7823591232299805,
+ "learning_rate": 1.3400337314254e-05,
+ "loss": 0.2286,
+ "step": 14969
+ },
+ {
+ "epoch": 40.79019073569482,
+ "grad_norm": 5.527565002441406,
+ "learning_rate": 1.339950739137481e-05,
+ "loss": 0.2641,
+ "step": 14970
+ },
+ {
+ "epoch": 40.79291553133515,
+ "grad_norm": 6.882816791534424,
+ "learning_rate": 1.3398677442020367e-05,
+ "loss": 0.2936,
+ "step": 14971
+ },
+ {
+ "epoch": 40.79564032697548,
+ "grad_norm": 5.974388122558594,
+ "learning_rate": 1.3397847466197133e-05,
+ "loss": 0.422,
+ "step": 14972
+ },
+ {
+ "epoch": 40.798365122615806,
+ "grad_norm": 5.234097957611084,
+ "learning_rate": 1.339701746391157e-05,
+ "loss": 0.2596,
+ "step": 14973
+ },
+ {
+ "epoch": 40.80108991825613,
+ "grad_norm": 9.07652759552002,
+ "learning_rate": 1.3396187435170144e-05,
+ "loss": 0.2723,
+ "step": 14974
+ },
+ {
+ "epoch": 40.80381471389646,
+ "grad_norm": 5.8103437423706055,
+ "learning_rate": 1.3395357379979324e-05,
+ "loss": 0.1719,
+ "step": 14975
+ },
+ {
+ "epoch": 40.80653950953678,
+ "grad_norm": 5.6345534324646,
+ "learning_rate": 1.3394527298345567e-05,
+ "loss": 0.193,
+ "step": 14976
+ },
+ {
+ "epoch": 40.80926430517711,
+ "grad_norm": 5.143917083740234,
+ "learning_rate": 1.339369719027534e-05,
+ "loss": 0.1949,
+ "step": 14977
+ },
+ {
+ "epoch": 40.81198910081744,
+ "grad_norm": 5.574187278747559,
+ "learning_rate": 1.3392867055775112e-05,
+ "loss": 0.1412,
+ "step": 14978
+ },
+ {
+ "epoch": 40.81471389645777,
+ "grad_norm": 6.678638458251953,
+ "learning_rate": 1.3392036894851342e-05,
+ "loss": 0.2533,
+ "step": 14979
+ },
+ {
+ "epoch": 40.817438692098094,
+ "grad_norm": 6.180417537689209,
+ "learning_rate": 1.3391206707510498e-05,
+ "loss": 0.166,
+ "step": 14980
+ },
+ {
+ "epoch": 40.82016348773842,
+ "grad_norm": 6.180706024169922,
+ "learning_rate": 1.3390376493759045e-05,
+ "loss": 0.231,
+ "step": 14981
+ },
+ {
+ "epoch": 40.822888283378745,
+ "grad_norm": 5.376947402954102,
+ "learning_rate": 1.3389546253603447e-05,
+ "loss": 0.2622,
+ "step": 14982
+ },
+ {
+ "epoch": 40.82561307901907,
+ "grad_norm": 4.870726585388184,
+ "learning_rate": 1.3388715987050174e-05,
+ "loss": 0.2365,
+ "step": 14983
+ },
+ {
+ "epoch": 40.828337874659404,
+ "grad_norm": 6.5397138595581055,
+ "learning_rate": 1.338788569410569e-05,
+ "loss": 0.2467,
+ "step": 14984
+ },
+ {
+ "epoch": 40.83106267029973,
+ "grad_norm": 5.011137962341309,
+ "learning_rate": 1.3387055374776463e-05,
+ "loss": 0.279,
+ "step": 14985
+ },
+ {
+ "epoch": 40.833787465940055,
+ "grad_norm": 4.846118450164795,
+ "learning_rate": 1.3386225029068959e-05,
+ "loss": 0.1282,
+ "step": 14986
+ },
+ {
+ "epoch": 40.83651226158038,
+ "grad_norm": 6.057253360748291,
+ "learning_rate": 1.338539465698964e-05,
+ "loss": 0.2232,
+ "step": 14987
+ },
+ {
+ "epoch": 40.83923705722071,
+ "grad_norm": 6.4753031730651855,
+ "learning_rate": 1.3384564258544976e-05,
+ "loss": 0.2677,
+ "step": 14988
+ },
+ {
+ "epoch": 40.84196185286103,
+ "grad_norm": 7.979143142700195,
+ "learning_rate": 1.3383733833741434e-05,
+ "loss": 0.2295,
+ "step": 14989
+ },
+ {
+ "epoch": 40.844686648501366,
+ "grad_norm": 6.787848949432373,
+ "learning_rate": 1.3382903382585485e-05,
+ "loss": 0.214,
+ "step": 14990
+ },
+ {
+ "epoch": 40.84741144414169,
+ "grad_norm": 5.826859474182129,
+ "learning_rate": 1.338207290508359e-05,
+ "loss": 0.1957,
+ "step": 14991
+ },
+ {
+ "epoch": 40.85013623978202,
+ "grad_norm": 5.740458011627197,
+ "learning_rate": 1.3381242401242222e-05,
+ "loss": 0.229,
+ "step": 14992
+ },
+ {
+ "epoch": 40.85286103542234,
+ "grad_norm": 5.911404609680176,
+ "learning_rate": 1.3380411871067846e-05,
+ "loss": 0.4161,
+ "step": 14993
+ },
+ {
+ "epoch": 40.85558583106267,
+ "grad_norm": 6.816946506500244,
+ "learning_rate": 1.3379581314566931e-05,
+ "loss": 0.2727,
+ "step": 14994
+ },
+ {
+ "epoch": 40.858310626702995,
+ "grad_norm": 6.2688069343566895,
+ "learning_rate": 1.3378750731745949e-05,
+ "loss": 0.2802,
+ "step": 14995
+ },
+ {
+ "epoch": 40.86103542234333,
+ "grad_norm": 4.649788856506348,
+ "learning_rate": 1.337792012261136e-05,
+ "loss": 0.3784,
+ "step": 14996
+ },
+ {
+ "epoch": 40.86376021798365,
+ "grad_norm": 5.236213684082031,
+ "learning_rate": 1.337708948716964e-05,
+ "loss": 0.2497,
+ "step": 14997
+ },
+ {
+ "epoch": 40.86648501362398,
+ "grad_norm": 4.856684684753418,
+ "learning_rate": 1.3376258825427259e-05,
+ "loss": 0.2789,
+ "step": 14998
+ },
+ {
+ "epoch": 40.869209809264305,
+ "grad_norm": 6.627138137817383,
+ "learning_rate": 1.3375428137390678e-05,
+ "loss": 0.2303,
+ "step": 14999
+ },
+ {
+ "epoch": 40.87193460490463,
+ "grad_norm": 5.439791202545166,
+ "learning_rate": 1.3374597423066373e-05,
+ "loss": 0.3366,
+ "step": 15000
+ },
+ {
+ "epoch": 40.87465940054496,
+ "grad_norm": 5.366386413574219,
+ "learning_rate": 1.3373766682460811e-05,
+ "loss": 0.1568,
+ "step": 15001
+ },
+ {
+ "epoch": 40.87738419618529,
+ "grad_norm": 6.989178657531738,
+ "learning_rate": 1.3372935915580465e-05,
+ "loss": 0.2469,
+ "step": 15002
+ },
+ {
+ "epoch": 40.880108991825615,
+ "grad_norm": 6.559767723083496,
+ "learning_rate": 1.3372105122431801e-05,
+ "loss": 0.2893,
+ "step": 15003
+ },
+ {
+ "epoch": 40.88283378746594,
+ "grad_norm": 5.447100639343262,
+ "learning_rate": 1.3371274303021293e-05,
+ "loss": 0.1565,
+ "step": 15004
+ },
+ {
+ "epoch": 40.88555858310627,
+ "grad_norm": 6.380908012390137,
+ "learning_rate": 1.3370443457355407e-05,
+ "loss": 0.1827,
+ "step": 15005
+ },
+ {
+ "epoch": 40.88828337874659,
+ "grad_norm": 4.741380214691162,
+ "learning_rate": 1.3369612585440617e-05,
+ "loss": 0.2058,
+ "step": 15006
+ },
+ {
+ "epoch": 40.89100817438692,
+ "grad_norm": 5.247865200042725,
+ "learning_rate": 1.336878168728339e-05,
+ "loss": 0.1651,
+ "step": 15007
+ },
+ {
+ "epoch": 40.89373297002725,
+ "grad_norm": 5.421178817749023,
+ "learning_rate": 1.33679507628902e-05,
+ "loss": 0.1881,
+ "step": 15008
+ },
+ {
+ "epoch": 40.89645776566758,
+ "grad_norm": 7.068850517272949,
+ "learning_rate": 1.336711981226752e-05,
+ "loss": 0.2087,
+ "step": 15009
+ },
+ {
+ "epoch": 40.8991825613079,
+ "grad_norm": 6.348726272583008,
+ "learning_rate": 1.336628883542182e-05,
+ "loss": 0.265,
+ "step": 15010
+ },
+ {
+ "epoch": 40.90190735694823,
+ "grad_norm": 5.680532932281494,
+ "learning_rate": 1.3365457832359567e-05,
+ "loss": 0.1723,
+ "step": 15011
+ },
+ {
+ "epoch": 40.904632152588555,
+ "grad_norm": 7.25140380859375,
+ "learning_rate": 1.3364626803087242e-05,
+ "loss": 0.3176,
+ "step": 15012
+ },
+ {
+ "epoch": 40.90735694822888,
+ "grad_norm": 6.55526065826416,
+ "learning_rate": 1.3363795747611309e-05,
+ "loss": 0.3861,
+ "step": 15013
+ },
+ {
+ "epoch": 40.91008174386921,
+ "grad_norm": 5.4566473960876465,
+ "learning_rate": 1.3362964665938246e-05,
+ "loss": 0.2871,
+ "step": 15014
+ },
+ {
+ "epoch": 40.91280653950954,
+ "grad_norm": 5.61224889755249,
+ "learning_rate": 1.3362133558074517e-05,
+ "loss": 0.164,
+ "step": 15015
+ },
+ {
+ "epoch": 40.915531335149865,
+ "grad_norm": 6.36538553237915,
+ "learning_rate": 1.3361302424026603e-05,
+ "loss": 0.2852,
+ "step": 15016
+ },
+ {
+ "epoch": 40.91825613079019,
+ "grad_norm": 5.29815149307251,
+ "learning_rate": 1.3360471263800974e-05,
+ "loss": 0.2155,
+ "step": 15017
+ },
+ {
+ "epoch": 40.920980926430516,
+ "grad_norm": 5.939804553985596,
+ "learning_rate": 1.33596400774041e-05,
+ "loss": 0.3171,
+ "step": 15018
+ },
+ {
+ "epoch": 40.92370572207084,
+ "grad_norm": 4.8379693031311035,
+ "learning_rate": 1.335880886484246e-05,
+ "loss": 0.2887,
+ "step": 15019
+ },
+ {
+ "epoch": 40.926430517711175,
+ "grad_norm": 4.905444145202637,
+ "learning_rate": 1.3357977626122525e-05,
+ "loss": 0.2915,
+ "step": 15020
+ },
+ {
+ "epoch": 40.9291553133515,
+ "grad_norm": 5.513583660125732,
+ "learning_rate": 1.3357146361250765e-05,
+ "loss": 0.2451,
+ "step": 15021
+ },
+ {
+ "epoch": 40.93188010899183,
+ "grad_norm": 6.400475978851318,
+ "learning_rate": 1.3356315070233664e-05,
+ "loss": 0.247,
+ "step": 15022
+ },
+ {
+ "epoch": 40.93460490463215,
+ "grad_norm": 7.196538925170898,
+ "learning_rate": 1.3355483753077682e-05,
+ "loss": 0.2287,
+ "step": 15023
+ },
+ {
+ "epoch": 40.93732970027248,
+ "grad_norm": 5.121399402618408,
+ "learning_rate": 1.3354652409789303e-05,
+ "loss": 0.1901,
+ "step": 15024
+ },
+ {
+ "epoch": 40.940054495912804,
+ "grad_norm": 5.523329257965088,
+ "learning_rate": 1.3353821040375001e-05,
+ "loss": 0.3396,
+ "step": 15025
+ },
+ {
+ "epoch": 40.94277929155314,
+ "grad_norm": 6.12915563583374,
+ "learning_rate": 1.3352989644841245e-05,
+ "loss": 0.2905,
+ "step": 15026
+ },
+ {
+ "epoch": 40.94550408719346,
+ "grad_norm": 5.719439506530762,
+ "learning_rate": 1.3352158223194517e-05,
+ "loss": 0.3653,
+ "step": 15027
+ },
+ {
+ "epoch": 40.94822888283379,
+ "grad_norm": 5.728538990020752,
+ "learning_rate": 1.3351326775441287e-05,
+ "loss": 0.2712,
+ "step": 15028
+ },
+ {
+ "epoch": 40.950953678474114,
+ "grad_norm": 5.390470027923584,
+ "learning_rate": 1.3350495301588034e-05,
+ "loss": 0.2523,
+ "step": 15029
+ },
+ {
+ "epoch": 40.95367847411444,
+ "grad_norm": 4.868643283843994,
+ "learning_rate": 1.334966380164123e-05,
+ "loss": 0.2482,
+ "step": 15030
+ },
+ {
+ "epoch": 40.956403269754766,
+ "grad_norm": 5.358735084533691,
+ "learning_rate": 1.3348832275607351e-05,
+ "loss": 0.3782,
+ "step": 15031
+ },
+ {
+ "epoch": 40.95912806539509,
+ "grad_norm": 6.365812301635742,
+ "learning_rate": 1.3348000723492875e-05,
+ "loss": 0.2387,
+ "step": 15032
+ },
+ {
+ "epoch": 40.961852861035425,
+ "grad_norm": 6.051462173461914,
+ "learning_rate": 1.3347169145304277e-05,
+ "loss": 0.1827,
+ "step": 15033
+ },
+ {
+ "epoch": 40.96457765667575,
+ "grad_norm": 4.960656642913818,
+ "learning_rate": 1.3346337541048034e-05,
+ "loss": 0.257,
+ "step": 15034
+ },
+ {
+ "epoch": 40.967302452316076,
+ "grad_norm": 5.8224873542785645,
+ "learning_rate": 1.3345505910730621e-05,
+ "loss": 0.3081,
+ "step": 15035
+ },
+ {
+ "epoch": 40.9700272479564,
+ "grad_norm": 7.290229797363281,
+ "learning_rate": 1.3344674254358515e-05,
+ "loss": 0.2471,
+ "step": 15036
+ },
+ {
+ "epoch": 40.97275204359673,
+ "grad_norm": 8.550009727478027,
+ "learning_rate": 1.3343842571938197e-05,
+ "loss": 0.2004,
+ "step": 15037
+ },
+ {
+ "epoch": 40.97547683923706,
+ "grad_norm": 5.098455429077148,
+ "learning_rate": 1.3343010863476135e-05,
+ "loss": 0.4074,
+ "step": 15038
+ },
+ {
+ "epoch": 40.97820163487739,
+ "grad_norm": 5.775397777557373,
+ "learning_rate": 1.3342179128978818e-05,
+ "loss": 0.2965,
+ "step": 15039
+ },
+ {
+ "epoch": 40.98092643051771,
+ "grad_norm": 7.7027106285095215,
+ "learning_rate": 1.3341347368452712e-05,
+ "loss": 0.259,
+ "step": 15040
+ },
+ {
+ "epoch": 40.98365122615804,
+ "grad_norm": 6.634826183319092,
+ "learning_rate": 1.3340515581904306e-05,
+ "loss": 0.1937,
+ "step": 15041
+ },
+ {
+ "epoch": 40.986376021798364,
+ "grad_norm": 4.4922614097595215,
+ "learning_rate": 1.3339683769340069e-05,
+ "loss": 0.1159,
+ "step": 15042
+ },
+ {
+ "epoch": 40.98910081743869,
+ "grad_norm": 5.7162275314331055,
+ "learning_rate": 1.333885193076648e-05,
+ "loss": 0.2325,
+ "step": 15043
+ },
+ {
+ "epoch": 40.991825613079016,
+ "grad_norm": 5.713405609130859,
+ "learning_rate": 1.3338020066190022e-05,
+ "loss": 0.382,
+ "step": 15044
+ },
+ {
+ "epoch": 40.99455040871935,
+ "grad_norm": 5.215897560119629,
+ "learning_rate": 1.3337188175617173e-05,
+ "loss": 0.3264,
+ "step": 15045
+ },
+ {
+ "epoch": 40.997275204359674,
+ "grad_norm": 6.1874165534973145,
+ "learning_rate": 1.3336356259054406e-05,
+ "loss": 0.4108,
+ "step": 15046
+ },
+ {
+ "epoch": 41.0,
+ "grad_norm": 6.213327884674072,
+ "learning_rate": 1.3335524316508208e-05,
+ "loss": 0.2671,
+ "step": 15047
+ },
+ {
+ "epoch": 41.002724795640326,
+ "grad_norm": 5.763308048248291,
+ "learning_rate": 1.3334692347985053e-05,
+ "loss": 0.1794,
+ "step": 15048
+ },
+ {
+ "epoch": 41.00544959128065,
+ "grad_norm": 4.891640663146973,
+ "learning_rate": 1.333386035349142e-05,
+ "loss": 0.2744,
+ "step": 15049
+ },
+ {
+ "epoch": 41.00817438692098,
+ "grad_norm": 5.161420822143555,
+ "learning_rate": 1.3333028333033791e-05,
+ "loss": 0.2648,
+ "step": 15050
+ },
+ {
+ "epoch": 41.01089918256131,
+ "grad_norm": 5.25761079788208,
+ "learning_rate": 1.3332196286618641e-05,
+ "loss": 0.1408,
+ "step": 15051
+ },
+ {
+ "epoch": 41.013623978201636,
+ "grad_norm": 5.3399481773376465,
+ "learning_rate": 1.3331364214252456e-05,
+ "loss": 0.1608,
+ "step": 15052
+ },
+ {
+ "epoch": 41.01634877384196,
+ "grad_norm": 4.414523601531982,
+ "learning_rate": 1.3330532115941714e-05,
+ "loss": 0.1297,
+ "step": 15053
+ },
+ {
+ "epoch": 41.01907356948229,
+ "grad_norm": 4.573468208312988,
+ "learning_rate": 1.3329699991692894e-05,
+ "loss": 0.2599,
+ "step": 15054
+ },
+ {
+ "epoch": 41.02179836512261,
+ "grad_norm": 5.290121555328369,
+ "learning_rate": 1.3328867841512481e-05,
+ "loss": 0.1638,
+ "step": 15055
+ },
+ {
+ "epoch": 41.02452316076294,
+ "grad_norm": 5.881246089935303,
+ "learning_rate": 1.3328035665406948e-05,
+ "loss": 0.157,
+ "step": 15056
+ },
+ {
+ "epoch": 41.02724795640327,
+ "grad_norm": 5.0966033935546875,
+ "learning_rate": 1.3327203463382786e-05,
+ "loss": 0.2493,
+ "step": 15057
+ },
+ {
+ "epoch": 41.0299727520436,
+ "grad_norm": 5.441526412963867,
+ "learning_rate": 1.3326371235446464e-05,
+ "loss": 0.2309,
+ "step": 15058
+ },
+ {
+ "epoch": 41.032697547683924,
+ "grad_norm": 7.732897758483887,
+ "learning_rate": 1.3325538981604475e-05,
+ "loss": 0.1622,
+ "step": 15059
+ },
+ {
+ "epoch": 41.03542234332425,
+ "grad_norm": 5.739369869232178,
+ "learning_rate": 1.332470670186329e-05,
+ "loss": 0.2691,
+ "step": 15060
+ },
+ {
+ "epoch": 41.038147138964575,
+ "grad_norm": 6.659055709838867,
+ "learning_rate": 1.3323874396229402e-05,
+ "loss": 0.1583,
+ "step": 15061
+ },
+ {
+ "epoch": 41.0408719346049,
+ "grad_norm": 11.251084327697754,
+ "learning_rate": 1.3323042064709285e-05,
+ "loss": 0.2757,
+ "step": 15062
+ },
+ {
+ "epoch": 41.043596730245234,
+ "grad_norm": 7.61301326751709,
+ "learning_rate": 1.3322209707309424e-05,
+ "loss": 0.3217,
+ "step": 15063
+ },
+ {
+ "epoch": 41.04632152588556,
+ "grad_norm": 5.039181709289551,
+ "learning_rate": 1.3321377324036297e-05,
+ "loss": 0.251,
+ "step": 15064
+ },
+ {
+ "epoch": 41.049046321525886,
+ "grad_norm": 6.336490631103516,
+ "learning_rate": 1.3320544914896396e-05,
+ "loss": 0.1705,
+ "step": 15065
+ },
+ {
+ "epoch": 41.05177111716621,
+ "grad_norm": 4.297523021697998,
+ "learning_rate": 1.3319712479896195e-05,
+ "loss": 0.1433,
+ "step": 15066
+ },
+ {
+ "epoch": 41.05449591280654,
+ "grad_norm": 5.132529258728027,
+ "learning_rate": 1.3318880019042179e-05,
+ "loss": 0.1973,
+ "step": 15067
+ },
+ {
+ "epoch": 41.05722070844686,
+ "grad_norm": 5.375813007354736,
+ "learning_rate": 1.3318047532340833e-05,
+ "loss": 0.18,
+ "step": 15068
+ },
+ {
+ "epoch": 41.059945504087196,
+ "grad_norm": 27.851383209228516,
+ "learning_rate": 1.3317215019798639e-05,
+ "loss": 0.2283,
+ "step": 15069
+ },
+ {
+ "epoch": 41.06267029972752,
+ "grad_norm": 5.794404029846191,
+ "learning_rate": 1.3316382481422081e-05,
+ "loss": 0.3191,
+ "step": 15070
+ },
+ {
+ "epoch": 41.06539509536785,
+ "grad_norm": 5.4679670333862305,
+ "learning_rate": 1.3315549917217647e-05,
+ "loss": 0.1392,
+ "step": 15071
+ },
+ {
+ "epoch": 41.06811989100817,
+ "grad_norm": 6.183343410491943,
+ "learning_rate": 1.3314717327191814e-05,
+ "loss": 0.2343,
+ "step": 15072
+ },
+ {
+ "epoch": 41.0708446866485,
+ "grad_norm": 5.130636215209961,
+ "learning_rate": 1.331388471135107e-05,
+ "loss": 0.3179,
+ "step": 15073
+ },
+ {
+ "epoch": 41.073569482288825,
+ "grad_norm": 4.36638879776001,
+ "learning_rate": 1.3313052069701896e-05,
+ "loss": 0.1996,
+ "step": 15074
+ },
+ {
+ "epoch": 41.07629427792916,
+ "grad_norm": 5.1475629806518555,
+ "learning_rate": 1.3312219402250781e-05,
+ "loss": 0.1936,
+ "step": 15075
+ },
+ {
+ "epoch": 41.079019073569484,
+ "grad_norm": 6.122947692871094,
+ "learning_rate": 1.3311386709004208e-05,
+ "loss": 0.2562,
+ "step": 15076
+ },
+ {
+ "epoch": 41.08174386920981,
+ "grad_norm": 7.6103386878967285,
+ "learning_rate": 1.3310553989968662e-05,
+ "loss": 0.2668,
+ "step": 15077
+ },
+ {
+ "epoch": 41.084468664850135,
+ "grad_norm": 5.603167533874512,
+ "learning_rate": 1.3309721245150627e-05,
+ "loss": 0.221,
+ "step": 15078
+ },
+ {
+ "epoch": 41.08719346049046,
+ "grad_norm": 6.73805046081543,
+ "learning_rate": 1.3308888474556591e-05,
+ "loss": 0.1863,
+ "step": 15079
+ },
+ {
+ "epoch": 41.08991825613079,
+ "grad_norm": 5.044631004333496,
+ "learning_rate": 1.3308055678193037e-05,
+ "loss": 0.2452,
+ "step": 15080
+ },
+ {
+ "epoch": 41.09264305177112,
+ "grad_norm": 5.798475742340088,
+ "learning_rate": 1.3307222856066452e-05,
+ "loss": 0.1698,
+ "step": 15081
+ },
+ {
+ "epoch": 41.095367847411445,
+ "grad_norm": 5.877731800079346,
+ "learning_rate": 1.3306390008183324e-05,
+ "loss": 0.2777,
+ "step": 15082
+ },
+ {
+ "epoch": 41.09809264305177,
+ "grad_norm": 7.005524635314941,
+ "learning_rate": 1.3305557134550133e-05,
+ "loss": 0.2625,
+ "step": 15083
+ },
+ {
+ "epoch": 41.1008174386921,
+ "grad_norm": 5.313305377960205,
+ "learning_rate": 1.3304724235173372e-05,
+ "loss": 0.2115,
+ "step": 15084
+ },
+ {
+ "epoch": 41.10354223433242,
+ "grad_norm": 5.591778755187988,
+ "learning_rate": 1.3303891310059528e-05,
+ "loss": 0.2092,
+ "step": 15085
+ },
+ {
+ "epoch": 41.10626702997275,
+ "grad_norm": 6.332198143005371,
+ "learning_rate": 1.3303058359215075e-05,
+ "loss": 0.2679,
+ "step": 15086
+ },
+ {
+ "epoch": 41.10899182561308,
+ "grad_norm": 5.046824932098389,
+ "learning_rate": 1.3302225382646518e-05,
+ "loss": 0.1625,
+ "step": 15087
+ },
+ {
+ "epoch": 41.11171662125341,
+ "grad_norm": 9.898218154907227,
+ "learning_rate": 1.3301392380360334e-05,
+ "loss": 0.2491,
+ "step": 15088
+ },
+ {
+ "epoch": 41.11444141689373,
+ "grad_norm": 6.03626012802124,
+ "learning_rate": 1.3300559352363015e-05,
+ "loss": 0.2215,
+ "step": 15089
+ },
+ {
+ "epoch": 41.11716621253406,
+ "grad_norm": 5.38420295715332,
+ "learning_rate": 1.3299726298661039e-05,
+ "loss": 0.1795,
+ "step": 15090
+ },
+ {
+ "epoch": 41.119891008174385,
+ "grad_norm": 6.802674293518066,
+ "learning_rate": 1.3298893219260909e-05,
+ "loss": 0.2123,
+ "step": 15091
+ },
+ {
+ "epoch": 41.12261580381471,
+ "grad_norm": 4.805606365203857,
+ "learning_rate": 1.32980601141691e-05,
+ "loss": 0.1599,
+ "step": 15092
+ },
+ {
+ "epoch": 41.12534059945504,
+ "grad_norm": 18.50775718688965,
+ "learning_rate": 1.3297226983392106e-05,
+ "loss": 0.1739,
+ "step": 15093
+ },
+ {
+ "epoch": 41.12806539509537,
+ "grad_norm": 4.983346939086914,
+ "learning_rate": 1.3296393826936416e-05,
+ "loss": 0.2814,
+ "step": 15094
+ },
+ {
+ "epoch": 41.130790190735695,
+ "grad_norm": 6.066840171813965,
+ "learning_rate": 1.3295560644808511e-05,
+ "loss": 0.2472,
+ "step": 15095
+ },
+ {
+ "epoch": 41.13351498637602,
+ "grad_norm": 5.6400017738342285,
+ "learning_rate": 1.3294727437014891e-05,
+ "loss": 0.2128,
+ "step": 15096
+ },
+ {
+ "epoch": 41.13623978201635,
+ "grad_norm": 6.294003486633301,
+ "learning_rate": 1.3293894203562041e-05,
+ "loss": 0.4346,
+ "step": 15097
+ },
+ {
+ "epoch": 41.13896457765667,
+ "grad_norm": 5.857290267944336,
+ "learning_rate": 1.3293060944456446e-05,
+ "loss": 0.3423,
+ "step": 15098
+ },
+ {
+ "epoch": 41.141689373297005,
+ "grad_norm": 5.681890487670898,
+ "learning_rate": 1.32922276597046e-05,
+ "loss": 0.2084,
+ "step": 15099
+ },
+ {
+ "epoch": 41.14441416893733,
+ "grad_norm": 7.933870315551758,
+ "learning_rate": 1.3291394349312989e-05,
+ "loss": 0.1554,
+ "step": 15100
+ },
+ {
+ "epoch": 41.14713896457766,
+ "grad_norm": 5.457008361816406,
+ "learning_rate": 1.3290561013288108e-05,
+ "loss": 0.2418,
+ "step": 15101
+ },
+ {
+ "epoch": 41.14986376021798,
+ "grad_norm": 6.152347564697266,
+ "learning_rate": 1.3289727651636439e-05,
+ "loss": 0.162,
+ "step": 15102
+ },
+ {
+ "epoch": 41.15258855585831,
+ "grad_norm": 6.3874664306640625,
+ "learning_rate": 1.328889426436448e-05,
+ "loss": 0.3618,
+ "step": 15103
+ },
+ {
+ "epoch": 41.155313351498634,
+ "grad_norm": 7.355878829956055,
+ "learning_rate": 1.328806085147872e-05,
+ "loss": 0.2442,
+ "step": 15104
+ },
+ {
+ "epoch": 41.15803814713897,
+ "grad_norm": 5.6302876472473145,
+ "learning_rate": 1.3287227412985644e-05,
+ "loss": 0.1831,
+ "step": 15105
+ },
+ {
+ "epoch": 41.16076294277929,
+ "grad_norm": 5.576440334320068,
+ "learning_rate": 1.3286393948891749e-05,
+ "loss": 0.3528,
+ "step": 15106
+ },
+ {
+ "epoch": 41.16348773841962,
+ "grad_norm": 9.891507148742676,
+ "learning_rate": 1.3285560459203524e-05,
+ "loss": 0.1704,
+ "step": 15107
+ },
+ {
+ "epoch": 41.166212534059945,
+ "grad_norm": 14.930198669433594,
+ "learning_rate": 1.3284726943927458e-05,
+ "loss": 0.2097,
+ "step": 15108
+ },
+ {
+ "epoch": 41.16893732970027,
+ "grad_norm": 7.592243671417236,
+ "learning_rate": 1.3283893403070044e-05,
+ "loss": 0.2157,
+ "step": 15109
+ },
+ {
+ "epoch": 41.171662125340596,
+ "grad_norm": 5.6844000816345215,
+ "learning_rate": 1.3283059836637775e-05,
+ "loss": 0.2903,
+ "step": 15110
+ },
+ {
+ "epoch": 41.17438692098093,
+ "grad_norm": 5.559866905212402,
+ "learning_rate": 1.3282226244637141e-05,
+ "loss": 0.2717,
+ "step": 15111
+ },
+ {
+ "epoch": 41.177111716621255,
+ "grad_norm": 5.3150434494018555,
+ "learning_rate": 1.3281392627074638e-05,
+ "loss": 0.1836,
+ "step": 15112
+ },
+ {
+ "epoch": 41.17983651226158,
+ "grad_norm": 4.613548755645752,
+ "learning_rate": 1.3280558983956753e-05,
+ "loss": 0.2416,
+ "step": 15113
+ },
+ {
+ "epoch": 41.182561307901906,
+ "grad_norm": 5.153605937957764,
+ "learning_rate": 1.3279725315289979e-05,
+ "loss": 0.1446,
+ "step": 15114
+ },
+ {
+ "epoch": 41.18528610354223,
+ "grad_norm": 5.514246940612793,
+ "learning_rate": 1.327889162108081e-05,
+ "loss": 0.3107,
+ "step": 15115
+ },
+ {
+ "epoch": 41.18801089918256,
+ "grad_norm": 7.106926441192627,
+ "learning_rate": 1.327805790133574e-05,
+ "loss": 0.2872,
+ "step": 15116
+ },
+ {
+ "epoch": 41.19073569482289,
+ "grad_norm": 6.395162582397461,
+ "learning_rate": 1.327722415606126e-05,
+ "loss": 0.1159,
+ "step": 15117
+ },
+ {
+ "epoch": 41.19346049046322,
+ "grad_norm": 7.043217658996582,
+ "learning_rate": 1.3276390385263862e-05,
+ "loss": 0.1785,
+ "step": 15118
+ },
+ {
+ "epoch": 41.19618528610354,
+ "grad_norm": 6.702186107635498,
+ "learning_rate": 1.3275556588950043e-05,
+ "loss": 0.2931,
+ "step": 15119
+ },
+ {
+ "epoch": 41.19891008174387,
+ "grad_norm": 5.641571998596191,
+ "learning_rate": 1.3274722767126294e-05,
+ "loss": 0.1619,
+ "step": 15120
+ },
+ {
+ "epoch": 41.201634877384194,
+ "grad_norm": 5.504769325256348,
+ "learning_rate": 1.3273888919799109e-05,
+ "loss": 0.2541,
+ "step": 15121
+ },
+ {
+ "epoch": 41.20435967302452,
+ "grad_norm": 6.530135631561279,
+ "learning_rate": 1.3273055046974984e-05,
+ "loss": 0.2569,
+ "step": 15122
+ },
+ {
+ "epoch": 41.20708446866485,
+ "grad_norm": 6.953867435455322,
+ "learning_rate": 1.3272221148660409e-05,
+ "loss": 0.1993,
+ "step": 15123
+ },
+ {
+ "epoch": 41.20980926430518,
+ "grad_norm": 5.282675266265869,
+ "learning_rate": 1.3271387224861885e-05,
+ "loss": 0.3132,
+ "step": 15124
+ },
+ {
+ "epoch": 41.212534059945504,
+ "grad_norm": 6.146264553070068,
+ "learning_rate": 1.3270553275585897e-05,
+ "loss": 0.1945,
+ "step": 15125
+ },
+ {
+ "epoch": 41.21525885558583,
+ "grad_norm": 6.121618270874023,
+ "learning_rate": 1.3269719300838952e-05,
+ "loss": 0.2037,
+ "step": 15126
+ },
+ {
+ "epoch": 41.217983651226156,
+ "grad_norm": 6.169727802276611,
+ "learning_rate": 1.3268885300627534e-05,
+ "loss": 0.1898,
+ "step": 15127
+ },
+ {
+ "epoch": 41.22070844686648,
+ "grad_norm": 7.4113383293151855,
+ "learning_rate": 1.3268051274958145e-05,
+ "loss": 0.2764,
+ "step": 15128
+ },
+ {
+ "epoch": 41.223433242506815,
+ "grad_norm": 7.6999688148498535,
+ "learning_rate": 1.3267217223837273e-05,
+ "loss": 0.2147,
+ "step": 15129
+ },
+ {
+ "epoch": 41.22615803814714,
+ "grad_norm": 24.69585418701172,
+ "learning_rate": 1.3266383147271422e-05,
+ "loss": 0.178,
+ "step": 15130
+ },
+ {
+ "epoch": 41.228882833787466,
+ "grad_norm": 5.99130392074585,
+ "learning_rate": 1.3265549045267085e-05,
+ "loss": 0.1981,
+ "step": 15131
+ },
+ {
+ "epoch": 41.23160762942779,
+ "grad_norm": 7.409508228302002,
+ "learning_rate": 1.3264714917830756e-05,
+ "loss": 0.2539,
+ "step": 15132
+ },
+ {
+ "epoch": 41.23433242506812,
+ "grad_norm": 5.927445411682129,
+ "learning_rate": 1.3263880764968933e-05,
+ "loss": 0.1674,
+ "step": 15133
+ },
+ {
+ "epoch": 41.237057220708444,
+ "grad_norm": 6.339357376098633,
+ "learning_rate": 1.326304658668811e-05,
+ "loss": 0.2224,
+ "step": 15134
+ },
+ {
+ "epoch": 41.23978201634878,
+ "grad_norm": 4.94216251373291,
+ "learning_rate": 1.3262212382994786e-05,
+ "loss": 0.1854,
+ "step": 15135
+ },
+ {
+ "epoch": 41.2425068119891,
+ "grad_norm": 5.53244161605835,
+ "learning_rate": 1.3261378153895459e-05,
+ "loss": 0.2227,
+ "step": 15136
+ },
+ {
+ "epoch": 41.24523160762943,
+ "grad_norm": 4.807004928588867,
+ "learning_rate": 1.3260543899396618e-05,
+ "loss": 0.1899,
+ "step": 15137
+ },
+ {
+ "epoch": 41.247956403269754,
+ "grad_norm": 5.70207405090332,
+ "learning_rate": 1.3259709619504772e-05,
+ "loss": 0.2131,
+ "step": 15138
+ },
+ {
+ "epoch": 41.25068119891008,
+ "grad_norm": 5.638994216918945,
+ "learning_rate": 1.3258875314226409e-05,
+ "loss": 0.2647,
+ "step": 15139
+ },
+ {
+ "epoch": 41.253405994550405,
+ "grad_norm": 5.902090549468994,
+ "learning_rate": 1.3258040983568035e-05,
+ "loss": 0.3854,
+ "step": 15140
+ },
+ {
+ "epoch": 41.25613079019074,
+ "grad_norm": 5.736852169036865,
+ "learning_rate": 1.3257206627536137e-05,
+ "loss": 0.3005,
+ "step": 15141
+ },
+ {
+ "epoch": 41.258855585831064,
+ "grad_norm": 5.480114936828613,
+ "learning_rate": 1.3256372246137223e-05,
+ "loss": 0.1725,
+ "step": 15142
+ },
+ {
+ "epoch": 41.26158038147139,
+ "grad_norm": 4.521186351776123,
+ "learning_rate": 1.3255537839377784e-05,
+ "loss": 0.1908,
+ "step": 15143
+ },
+ {
+ "epoch": 41.264305177111716,
+ "grad_norm": 5.752655506134033,
+ "learning_rate": 1.3254703407264322e-05,
+ "loss": 0.2556,
+ "step": 15144
+ },
+ {
+ "epoch": 41.26702997275204,
+ "grad_norm": 5.045345306396484,
+ "learning_rate": 1.3253868949803332e-05,
+ "loss": 0.1471,
+ "step": 15145
+ },
+ {
+ "epoch": 41.26975476839237,
+ "grad_norm": 4.824075222015381,
+ "learning_rate": 1.3253034467001319e-05,
+ "loss": 0.2457,
+ "step": 15146
+ },
+ {
+ "epoch": 41.2724795640327,
+ "grad_norm": 6.3114495277404785,
+ "learning_rate": 1.3252199958864775e-05,
+ "loss": 0.263,
+ "step": 15147
+ },
+ {
+ "epoch": 41.275204359673026,
+ "grad_norm": 6.216378211975098,
+ "learning_rate": 1.3251365425400205e-05,
+ "loss": 0.2134,
+ "step": 15148
+ },
+ {
+ "epoch": 41.27792915531335,
+ "grad_norm": 5.833584308624268,
+ "learning_rate": 1.3250530866614104e-05,
+ "loss": 0.2827,
+ "step": 15149
+ },
+ {
+ "epoch": 41.28065395095368,
+ "grad_norm": 5.205456256866455,
+ "learning_rate": 1.3249696282512976e-05,
+ "loss": 0.2104,
+ "step": 15150
+ },
+ {
+ "epoch": 41.283378746594,
+ "grad_norm": 5.878049850463867,
+ "learning_rate": 1.3248861673103315e-05,
+ "loss": 0.2962,
+ "step": 15151
+ },
+ {
+ "epoch": 41.28610354223433,
+ "grad_norm": 4.970963954925537,
+ "learning_rate": 1.3248027038391626e-05,
+ "loss": 0.1247,
+ "step": 15152
+ },
+ {
+ "epoch": 41.28882833787466,
+ "grad_norm": 7.160046100616455,
+ "learning_rate": 1.3247192378384406e-05,
+ "loss": 0.1987,
+ "step": 15153
+ },
+ {
+ "epoch": 41.29155313351499,
+ "grad_norm": 5.031962871551514,
+ "learning_rate": 1.3246357693088155e-05,
+ "loss": 0.3038,
+ "step": 15154
+ },
+ {
+ "epoch": 41.294277929155314,
+ "grad_norm": 6.0762104988098145,
+ "learning_rate": 1.3245522982509376e-05,
+ "loss": 0.226,
+ "step": 15155
+ },
+ {
+ "epoch": 41.29700272479564,
+ "grad_norm": 3.9628217220306396,
+ "learning_rate": 1.3244688246654569e-05,
+ "loss": 0.1666,
+ "step": 15156
+ },
+ {
+ "epoch": 41.299727520435965,
+ "grad_norm": 4.434725284576416,
+ "learning_rate": 1.3243853485530231e-05,
+ "loss": 0.4491,
+ "step": 15157
+ },
+ {
+ "epoch": 41.30245231607629,
+ "grad_norm": 6.514955997467041,
+ "learning_rate": 1.3243018699142871e-05,
+ "loss": 0.251,
+ "step": 15158
+ },
+ {
+ "epoch": 41.305177111716624,
+ "grad_norm": 5.702577590942383,
+ "learning_rate": 1.3242183887498983e-05,
+ "loss": 0.2284,
+ "step": 15159
+ },
+ {
+ "epoch": 41.30790190735695,
+ "grad_norm": 5.384641647338867,
+ "learning_rate": 1.3241349050605074e-05,
+ "loss": 0.1658,
+ "step": 15160
+ },
+ {
+ "epoch": 41.310626702997276,
+ "grad_norm": 4.907167911529541,
+ "learning_rate": 1.324051418846764e-05,
+ "loss": 0.2739,
+ "step": 15161
+ },
+ {
+ "epoch": 41.3133514986376,
+ "grad_norm": 5.377655506134033,
+ "learning_rate": 1.323967930109319e-05,
+ "loss": 0.1862,
+ "step": 15162
+ },
+ {
+ "epoch": 41.31607629427793,
+ "grad_norm": 5.394341945648193,
+ "learning_rate": 1.3238844388488215e-05,
+ "loss": 0.2562,
+ "step": 15163
+ },
+ {
+ "epoch": 41.31880108991825,
+ "grad_norm": 4.6092424392700195,
+ "learning_rate": 1.3238009450659228e-05,
+ "loss": 0.2982,
+ "step": 15164
+ },
+ {
+ "epoch": 41.321525885558586,
+ "grad_norm": 4.88956880569458,
+ "learning_rate": 1.3237174487612727e-05,
+ "loss": 0.1864,
+ "step": 15165
+ },
+ {
+ "epoch": 41.32425068119891,
+ "grad_norm": 5.869426727294922,
+ "learning_rate": 1.3236339499355217e-05,
+ "loss": 0.1928,
+ "step": 15166
+ },
+ {
+ "epoch": 41.32697547683924,
+ "grad_norm": 6.263637065887451,
+ "learning_rate": 1.3235504485893198e-05,
+ "loss": 0.1864,
+ "step": 15167
+ },
+ {
+ "epoch": 41.32970027247956,
+ "grad_norm": 4.82780122756958,
+ "learning_rate": 1.3234669447233175e-05,
+ "loss": 0.2086,
+ "step": 15168
+ },
+ {
+ "epoch": 41.33242506811989,
+ "grad_norm": 4.812079906463623,
+ "learning_rate": 1.323383438338165e-05,
+ "loss": 0.2209,
+ "step": 15169
+ },
+ {
+ "epoch": 41.335149863760215,
+ "grad_norm": 5.495488166809082,
+ "learning_rate": 1.3232999294345126e-05,
+ "loss": 0.2713,
+ "step": 15170
+ },
+ {
+ "epoch": 41.33787465940055,
+ "grad_norm": 6.937367916107178,
+ "learning_rate": 1.3232164180130108e-05,
+ "loss": 0.3763,
+ "step": 15171
+ },
+ {
+ "epoch": 41.34059945504087,
+ "grad_norm": 7.551480293273926,
+ "learning_rate": 1.3231329040743099e-05,
+ "loss": 0.275,
+ "step": 15172
+ },
+ {
+ "epoch": 41.3433242506812,
+ "grad_norm": 5.157136917114258,
+ "learning_rate": 1.3230493876190602e-05,
+ "loss": 0.1614,
+ "step": 15173
+ },
+ {
+ "epoch": 41.346049046321525,
+ "grad_norm": 9.280787467956543,
+ "learning_rate": 1.3229658686479128e-05,
+ "loss": 0.1954,
+ "step": 15174
+ },
+ {
+ "epoch": 41.34877384196185,
+ "grad_norm": 11.969324111938477,
+ "learning_rate": 1.322882347161517e-05,
+ "loss": 0.1795,
+ "step": 15175
+ },
+ {
+ "epoch": 41.35149863760218,
+ "grad_norm": 6.5450968742370605,
+ "learning_rate": 1.3227988231605242e-05,
+ "loss": 0.337,
+ "step": 15176
+ },
+ {
+ "epoch": 41.35422343324251,
+ "grad_norm": 4.671832084655762,
+ "learning_rate": 1.3227152966455844e-05,
+ "loss": 0.3085,
+ "step": 15177
+ },
+ {
+ "epoch": 41.356948228882835,
+ "grad_norm": 5.481117248535156,
+ "learning_rate": 1.3226317676173485e-05,
+ "loss": 0.2548,
+ "step": 15178
+ },
+ {
+ "epoch": 41.35967302452316,
+ "grad_norm": 6.210432529449463,
+ "learning_rate": 1.3225482360764666e-05,
+ "loss": 0.2514,
+ "step": 15179
+ },
+ {
+ "epoch": 41.36239782016349,
+ "grad_norm": 3.732023239135742,
+ "learning_rate": 1.3224647020235894e-05,
+ "loss": 0.2427,
+ "step": 15180
+ },
+ {
+ "epoch": 41.36512261580381,
+ "grad_norm": 4.857550144195557,
+ "learning_rate": 1.3223811654593677e-05,
+ "loss": 0.199,
+ "step": 15181
+ },
+ {
+ "epoch": 41.36784741144414,
+ "grad_norm": 7.312856674194336,
+ "learning_rate": 1.3222976263844517e-05,
+ "loss": 0.2503,
+ "step": 15182
+ },
+ {
+ "epoch": 41.37057220708447,
+ "grad_norm": 5.666393756866455,
+ "learning_rate": 1.3222140847994917e-05,
+ "loss": 0.2112,
+ "step": 15183
+ },
+ {
+ "epoch": 41.3732970027248,
+ "grad_norm": 7.047507286071777,
+ "learning_rate": 1.3221305407051395e-05,
+ "loss": 0.3018,
+ "step": 15184
+ },
+ {
+ "epoch": 41.37602179836512,
+ "grad_norm": 6.197628021240234,
+ "learning_rate": 1.3220469941020447e-05,
+ "loss": 0.2899,
+ "step": 15185
+ },
+ {
+ "epoch": 41.37874659400545,
+ "grad_norm": 5.384599685668945,
+ "learning_rate": 1.3219634449908585e-05,
+ "loss": 0.3897,
+ "step": 15186
+ },
+ {
+ "epoch": 41.381471389645775,
+ "grad_norm": 5.311314582824707,
+ "learning_rate": 1.321879893372231e-05,
+ "loss": 0.2588,
+ "step": 15187
+ },
+ {
+ "epoch": 41.3841961852861,
+ "grad_norm": 5.707054138183594,
+ "learning_rate": 1.3217963392468135e-05,
+ "loss": 0.2493,
+ "step": 15188
+ },
+ {
+ "epoch": 41.38692098092643,
+ "grad_norm": 8.608099937438965,
+ "learning_rate": 1.3217127826152563e-05,
+ "loss": 0.2018,
+ "step": 15189
+ },
+ {
+ "epoch": 41.38964577656676,
+ "grad_norm": 5.823888778686523,
+ "learning_rate": 1.3216292234782104e-05,
+ "loss": 0.202,
+ "step": 15190
+ },
+ {
+ "epoch": 41.392370572207085,
+ "grad_norm": 5.694127082824707,
+ "learning_rate": 1.3215456618363264e-05,
+ "loss": 0.3065,
+ "step": 15191
+ },
+ {
+ "epoch": 41.39509536784741,
+ "grad_norm": 4.225665092468262,
+ "learning_rate": 1.3214620976902553e-05,
+ "loss": 0.1481,
+ "step": 15192
+ },
+ {
+ "epoch": 41.39782016348774,
+ "grad_norm": 7.366786003112793,
+ "learning_rate": 1.3213785310406477e-05,
+ "loss": 0.2728,
+ "step": 15193
+ },
+ {
+ "epoch": 41.40054495912806,
+ "grad_norm": 5.030938148498535,
+ "learning_rate": 1.321294961888154e-05,
+ "loss": 0.217,
+ "step": 15194
+ },
+ {
+ "epoch": 41.403269754768395,
+ "grad_norm": 4.735142230987549,
+ "learning_rate": 1.321211390233426e-05,
+ "loss": 0.1598,
+ "step": 15195
+ },
+ {
+ "epoch": 41.40599455040872,
+ "grad_norm": 4.333200931549072,
+ "learning_rate": 1.321127816077114e-05,
+ "loss": 0.2,
+ "step": 15196
+ },
+ {
+ "epoch": 41.40871934604905,
+ "grad_norm": 5.632680892944336,
+ "learning_rate": 1.3210442394198686e-05,
+ "loss": 0.1638,
+ "step": 15197
+ },
+ {
+ "epoch": 41.41144414168937,
+ "grad_norm": 6.012128829956055,
+ "learning_rate": 1.3209606602623411e-05,
+ "loss": 0.1948,
+ "step": 15198
+ },
+ {
+ "epoch": 41.4141689373297,
+ "grad_norm": 4.546900272369385,
+ "learning_rate": 1.3208770786051826e-05,
+ "loss": 0.1966,
+ "step": 15199
+ },
+ {
+ "epoch": 41.416893732970024,
+ "grad_norm": 4.972142219543457,
+ "learning_rate": 1.3207934944490433e-05,
+ "loss": 0.1824,
+ "step": 15200
+ },
+ {
+ "epoch": 41.41961852861036,
+ "grad_norm": 6.288185119628906,
+ "learning_rate": 1.3207099077945749e-05,
+ "loss": 0.2804,
+ "step": 15201
+ },
+ {
+ "epoch": 41.42234332425068,
+ "grad_norm": 5.620209217071533,
+ "learning_rate": 1.3206263186424279e-05,
+ "loss": 0.2924,
+ "step": 15202
+ },
+ {
+ "epoch": 41.42506811989101,
+ "grad_norm": 4.958395481109619,
+ "learning_rate": 1.3205427269932535e-05,
+ "loss": 0.2925,
+ "step": 15203
+ },
+ {
+ "epoch": 41.427792915531334,
+ "grad_norm": 4.600726127624512,
+ "learning_rate": 1.3204591328477028e-05,
+ "loss": 0.3718,
+ "step": 15204
+ },
+ {
+ "epoch": 41.43051771117166,
+ "grad_norm": 4.540500640869141,
+ "learning_rate": 1.3203755362064263e-05,
+ "loss": 0.17,
+ "step": 15205
+ },
+ {
+ "epoch": 41.433242506811986,
+ "grad_norm": 8.953529357910156,
+ "learning_rate": 1.3202919370700758e-05,
+ "loss": 0.2036,
+ "step": 15206
+ },
+ {
+ "epoch": 41.43596730245232,
+ "grad_norm": 3.953489065170288,
+ "learning_rate": 1.3202083354393019e-05,
+ "loss": 0.1904,
+ "step": 15207
+ },
+ {
+ "epoch": 41.438692098092645,
+ "grad_norm": 5.842988967895508,
+ "learning_rate": 1.3201247313147559e-05,
+ "loss": 0.2263,
+ "step": 15208
+ },
+ {
+ "epoch": 41.44141689373297,
+ "grad_norm": 5.583596706390381,
+ "learning_rate": 1.3200411246970885e-05,
+ "loss": 0.208,
+ "step": 15209
+ },
+ {
+ "epoch": 41.444141689373296,
+ "grad_norm": 4.909837245941162,
+ "learning_rate": 1.3199575155869514e-05,
+ "loss": 0.1663,
+ "step": 15210
+ },
+ {
+ "epoch": 41.44686648501362,
+ "grad_norm": 5.328984260559082,
+ "learning_rate": 1.3198739039849955e-05,
+ "loss": 0.3241,
+ "step": 15211
+ },
+ {
+ "epoch": 41.44959128065395,
+ "grad_norm": 6.674950122833252,
+ "learning_rate": 1.3197902898918718e-05,
+ "loss": 0.4411,
+ "step": 15212
+ },
+ {
+ "epoch": 41.45231607629428,
+ "grad_norm": 5.948317050933838,
+ "learning_rate": 1.3197066733082316e-05,
+ "loss": 0.1893,
+ "step": 15213
+ },
+ {
+ "epoch": 41.45504087193461,
+ "grad_norm": 4.927055835723877,
+ "learning_rate": 1.3196230542347259e-05,
+ "loss": 0.1572,
+ "step": 15214
+ },
+ {
+ "epoch": 41.45776566757493,
+ "grad_norm": 4.261422157287598,
+ "learning_rate": 1.3195394326720063e-05,
+ "loss": 0.2113,
+ "step": 15215
+ },
+ {
+ "epoch": 41.46049046321526,
+ "grad_norm": 5.302755355834961,
+ "learning_rate": 1.3194558086207238e-05,
+ "loss": 0.3796,
+ "step": 15216
+ },
+ {
+ "epoch": 41.463215258855584,
+ "grad_norm": 5.816093921661377,
+ "learning_rate": 1.3193721820815302e-05,
+ "loss": 0.2574,
+ "step": 15217
+ },
+ {
+ "epoch": 41.46594005449591,
+ "grad_norm": 4.7682600021362305,
+ "learning_rate": 1.3192885530550758e-05,
+ "loss": 0.5291,
+ "step": 15218
+ },
+ {
+ "epoch": 41.46866485013624,
+ "grad_norm": 7.575376987457275,
+ "learning_rate": 1.3192049215420129e-05,
+ "loss": 0.3073,
+ "step": 15219
+ },
+ {
+ "epoch": 41.47138964577657,
+ "grad_norm": 5.825736999511719,
+ "learning_rate": 1.319121287542992e-05,
+ "loss": 0.228,
+ "step": 15220
+ },
+ {
+ "epoch": 41.474114441416894,
+ "grad_norm": 5.374505519866943,
+ "learning_rate": 1.319037651058665e-05,
+ "loss": 0.3985,
+ "step": 15221
+ },
+ {
+ "epoch": 41.47683923705722,
+ "grad_norm": 5.100955009460449,
+ "learning_rate": 1.3189540120896829e-05,
+ "loss": 0.2792,
+ "step": 15222
+ },
+ {
+ "epoch": 41.479564032697546,
+ "grad_norm": 5.804059982299805,
+ "learning_rate": 1.318870370636697e-05,
+ "loss": 0.0899,
+ "step": 15223
+ },
+ {
+ "epoch": 41.48228882833787,
+ "grad_norm": 5.3307061195373535,
+ "learning_rate": 1.3187867267003592e-05,
+ "loss": 0.3647,
+ "step": 15224
+ },
+ {
+ "epoch": 41.485013623978205,
+ "grad_norm": 6.556344985961914,
+ "learning_rate": 1.3187030802813206e-05,
+ "loss": 0.3535,
+ "step": 15225
+ },
+ {
+ "epoch": 41.48773841961853,
+ "grad_norm": 5.337364673614502,
+ "learning_rate": 1.3186194313802325e-05,
+ "loss": 0.1569,
+ "step": 15226
+ },
+ {
+ "epoch": 41.490463215258856,
+ "grad_norm": 4.980561256408691,
+ "learning_rate": 1.318535779997747e-05,
+ "loss": 0.2563,
+ "step": 15227
+ },
+ {
+ "epoch": 41.49318801089918,
+ "grad_norm": 6.962838649749756,
+ "learning_rate": 1.3184521261345146e-05,
+ "loss": 0.3742,
+ "step": 15228
+ },
+ {
+ "epoch": 41.49591280653951,
+ "grad_norm": 5.183857440948486,
+ "learning_rate": 1.3183684697911875e-05,
+ "loss": 0.2242,
+ "step": 15229
+ },
+ {
+ "epoch": 41.49863760217983,
+ "grad_norm": 7.675213813781738,
+ "learning_rate": 1.318284810968417e-05,
+ "loss": 0.3745,
+ "step": 15230
+ },
+ {
+ "epoch": 41.50136239782017,
+ "grad_norm": 5.953858852386475,
+ "learning_rate": 1.3182011496668548e-05,
+ "loss": 0.2852,
+ "step": 15231
+ },
+ {
+ "epoch": 41.50408719346049,
+ "grad_norm": 6.068861484527588,
+ "learning_rate": 1.3181174858871517e-05,
+ "loss": 0.2057,
+ "step": 15232
+ },
+ {
+ "epoch": 41.50681198910082,
+ "grad_norm": 7.253425121307373,
+ "learning_rate": 1.3180338196299603e-05,
+ "loss": 0.1679,
+ "step": 15233
+ },
+ {
+ "epoch": 41.509536784741144,
+ "grad_norm": 4.526234149932861,
+ "learning_rate": 1.3179501508959315e-05,
+ "loss": 0.2014,
+ "step": 15234
+ },
+ {
+ "epoch": 41.51226158038147,
+ "grad_norm": 5.607563495635986,
+ "learning_rate": 1.3178664796857176e-05,
+ "loss": 0.2669,
+ "step": 15235
+ },
+ {
+ "epoch": 41.514986376021795,
+ "grad_norm": 6.936614990234375,
+ "learning_rate": 1.3177828059999695e-05,
+ "loss": 0.2768,
+ "step": 15236
+ },
+ {
+ "epoch": 41.51771117166213,
+ "grad_norm": 5.585014820098877,
+ "learning_rate": 1.3176991298393393e-05,
+ "loss": 0.3114,
+ "step": 15237
+ },
+ {
+ "epoch": 41.520435967302454,
+ "grad_norm": 5.922313213348389,
+ "learning_rate": 1.3176154512044783e-05,
+ "loss": 0.237,
+ "step": 15238
+ },
+ {
+ "epoch": 41.52316076294278,
+ "grad_norm": 4.764875411987305,
+ "learning_rate": 1.3175317700960386e-05,
+ "loss": 0.3261,
+ "step": 15239
+ },
+ {
+ "epoch": 41.525885558583106,
+ "grad_norm": 5.3954758644104,
+ "learning_rate": 1.3174480865146712e-05,
+ "loss": 0.3271,
+ "step": 15240
+ },
+ {
+ "epoch": 41.52861035422343,
+ "grad_norm": 4.896951198577881,
+ "learning_rate": 1.317364400461029e-05,
+ "loss": 0.4214,
+ "step": 15241
+ },
+ {
+ "epoch": 41.53133514986376,
+ "grad_norm": 9.775511741638184,
+ "learning_rate": 1.3172807119357625e-05,
+ "loss": 0.2403,
+ "step": 15242
+ },
+ {
+ "epoch": 41.53405994550409,
+ "grad_norm": 4.736580848693848,
+ "learning_rate": 1.3171970209395243e-05,
+ "loss": 0.247,
+ "step": 15243
+ },
+ {
+ "epoch": 41.536784741144416,
+ "grad_norm": 5.65787410736084,
+ "learning_rate": 1.317113327472966e-05,
+ "loss": 0.3753,
+ "step": 15244
+ },
+ {
+ "epoch": 41.53950953678474,
+ "grad_norm": 5.568493366241455,
+ "learning_rate": 1.3170296315367392e-05,
+ "loss": 0.1749,
+ "step": 15245
+ },
+ {
+ "epoch": 41.54223433242507,
+ "grad_norm": 4.574891090393066,
+ "learning_rate": 1.3169459331314958e-05,
+ "loss": 0.2714,
+ "step": 15246
+ },
+ {
+ "epoch": 41.54495912806539,
+ "grad_norm": 5.970724582672119,
+ "learning_rate": 1.3168622322578879e-05,
+ "loss": 0.1911,
+ "step": 15247
+ },
+ {
+ "epoch": 41.54768392370572,
+ "grad_norm": 4.580286026000977,
+ "learning_rate": 1.316778528916567e-05,
+ "loss": 0.1701,
+ "step": 15248
+ },
+ {
+ "epoch": 41.55040871934605,
+ "grad_norm": 6.1775336265563965,
+ "learning_rate": 1.3166948231081849e-05,
+ "loss": 0.2282,
+ "step": 15249
+ },
+ {
+ "epoch": 41.55313351498638,
+ "grad_norm": 4.816786289215088,
+ "learning_rate": 1.3166111148333935e-05,
+ "loss": 0.1585,
+ "step": 15250
+ },
+ {
+ "epoch": 41.555858310626704,
+ "grad_norm": 4.877140998840332,
+ "learning_rate": 1.3165274040928456e-05,
+ "loss": 0.2069,
+ "step": 15251
+ },
+ {
+ "epoch": 41.55858310626703,
+ "grad_norm": 5.608216762542725,
+ "learning_rate": 1.316443690887192e-05,
+ "loss": 0.2691,
+ "step": 15252
+ },
+ {
+ "epoch": 41.561307901907355,
+ "grad_norm": 5.537759780883789,
+ "learning_rate": 1.3163599752170852e-05,
+ "loss": 0.2128,
+ "step": 15253
+ },
+ {
+ "epoch": 41.56403269754768,
+ "grad_norm": 8.375011444091797,
+ "learning_rate": 1.3162762570831773e-05,
+ "loss": 0.1543,
+ "step": 15254
+ },
+ {
+ "epoch": 41.566757493188014,
+ "grad_norm": 5.1054816246032715,
+ "learning_rate": 1.31619253648612e-05,
+ "loss": 0.173,
+ "step": 15255
+ },
+ {
+ "epoch": 41.56948228882834,
+ "grad_norm": 4.622839450836182,
+ "learning_rate": 1.3161088134265651e-05,
+ "loss": 0.2326,
+ "step": 15256
+ },
+ {
+ "epoch": 41.572207084468666,
+ "grad_norm": 5.541858673095703,
+ "learning_rate": 1.3160250879051655e-05,
+ "loss": 0.2054,
+ "step": 15257
+ },
+ {
+ "epoch": 41.57493188010899,
+ "grad_norm": 5.578751087188721,
+ "learning_rate": 1.315941359922572e-05,
+ "loss": 0.2286,
+ "step": 15258
+ },
+ {
+ "epoch": 41.57765667574932,
+ "grad_norm": 5.844489574432373,
+ "learning_rate": 1.3158576294794378e-05,
+ "loss": 0.2263,
+ "step": 15259
+ },
+ {
+ "epoch": 41.58038147138964,
+ "grad_norm": 6.654881477355957,
+ "learning_rate": 1.3157738965764146e-05,
+ "loss": 0.501,
+ "step": 15260
+ },
+ {
+ "epoch": 41.583106267029976,
+ "grad_norm": 5.959126949310303,
+ "learning_rate": 1.3156901612141543e-05,
+ "loss": 0.2935,
+ "step": 15261
+ },
+ {
+ "epoch": 41.5858310626703,
+ "grad_norm": 5.3083415031433105,
+ "learning_rate": 1.3156064233933093e-05,
+ "loss": 0.1636,
+ "step": 15262
+ },
+ {
+ "epoch": 41.58855585831063,
+ "grad_norm": 7.250215530395508,
+ "learning_rate": 1.3155226831145316e-05,
+ "loss": 0.2337,
+ "step": 15263
+ },
+ {
+ "epoch": 41.59128065395095,
+ "grad_norm": 5.6582417488098145,
+ "learning_rate": 1.3154389403784733e-05,
+ "loss": 0.1862,
+ "step": 15264
+ },
+ {
+ "epoch": 41.59400544959128,
+ "grad_norm": 4.778441905975342,
+ "learning_rate": 1.3153551951857869e-05,
+ "loss": 0.298,
+ "step": 15265
+ },
+ {
+ "epoch": 41.596730245231605,
+ "grad_norm": 5.2142839431762695,
+ "learning_rate": 1.315271447537124e-05,
+ "loss": 0.2852,
+ "step": 15266
+ },
+ {
+ "epoch": 41.59945504087194,
+ "grad_norm": 4.115604877471924,
+ "learning_rate": 1.3151876974331375e-05,
+ "loss": 0.1143,
+ "step": 15267
+ },
+ {
+ "epoch": 41.60217983651226,
+ "grad_norm": 7.301044464111328,
+ "learning_rate": 1.3151039448744794e-05,
+ "loss": 0.2248,
+ "step": 15268
+ },
+ {
+ "epoch": 41.60490463215259,
+ "grad_norm": 4.621791839599609,
+ "learning_rate": 1.3150201898618019e-05,
+ "loss": 0.32,
+ "step": 15269
+ },
+ {
+ "epoch": 41.607629427792915,
+ "grad_norm": 6.88387393951416,
+ "learning_rate": 1.314936432395757e-05,
+ "loss": 0.2261,
+ "step": 15270
+ },
+ {
+ "epoch": 41.61035422343324,
+ "grad_norm": 4.959455490112305,
+ "learning_rate": 1.3148526724769976e-05,
+ "loss": 0.1509,
+ "step": 15271
+ },
+ {
+ "epoch": 41.61307901907357,
+ "grad_norm": 6.008310317993164,
+ "learning_rate": 1.3147689101061755e-05,
+ "loss": 0.4298,
+ "step": 15272
+ },
+ {
+ "epoch": 41.6158038147139,
+ "grad_norm": 5.80253267288208,
+ "learning_rate": 1.3146851452839435e-05,
+ "loss": 0.1591,
+ "step": 15273
+ },
+ {
+ "epoch": 41.618528610354225,
+ "grad_norm": 5.511794567108154,
+ "learning_rate": 1.3146013780109536e-05,
+ "loss": 0.244,
+ "step": 15274
+ },
+ {
+ "epoch": 41.62125340599455,
+ "grad_norm": 4.241323947906494,
+ "learning_rate": 1.3145176082878584e-05,
+ "loss": 0.1746,
+ "step": 15275
+ },
+ {
+ "epoch": 41.62397820163488,
+ "grad_norm": 5.244009494781494,
+ "learning_rate": 1.3144338361153101e-05,
+ "loss": 0.2232,
+ "step": 15276
+ },
+ {
+ "epoch": 41.6267029972752,
+ "grad_norm": 5.850700378417969,
+ "learning_rate": 1.314350061493961e-05,
+ "loss": 0.316,
+ "step": 15277
+ },
+ {
+ "epoch": 41.62942779291553,
+ "grad_norm": 5.898186683654785,
+ "learning_rate": 1.314266284424464e-05,
+ "loss": 0.3151,
+ "step": 15278
+ },
+ {
+ "epoch": 41.63215258855586,
+ "grad_norm": 7.902008533477783,
+ "learning_rate": 1.3141825049074712e-05,
+ "loss": 0.2866,
+ "step": 15279
+ },
+ {
+ "epoch": 41.63487738419619,
+ "grad_norm": 4.587899208068848,
+ "learning_rate": 1.3140987229436353e-05,
+ "loss": 0.2135,
+ "step": 15280
+ },
+ {
+ "epoch": 41.63760217983651,
+ "grad_norm": 4.991730213165283,
+ "learning_rate": 1.3140149385336085e-05,
+ "loss": 0.2355,
+ "step": 15281
+ },
+ {
+ "epoch": 41.64032697547684,
+ "grad_norm": 5.29056978225708,
+ "learning_rate": 1.3139311516780435e-05,
+ "loss": 0.3366,
+ "step": 15282
+ },
+ {
+ "epoch": 41.643051771117165,
+ "grad_norm": 4.8959269523620605,
+ "learning_rate": 1.3138473623775927e-05,
+ "loss": 0.242,
+ "step": 15283
+ },
+ {
+ "epoch": 41.64577656675749,
+ "grad_norm": 4.812049865722656,
+ "learning_rate": 1.3137635706329091e-05,
+ "loss": 0.2605,
+ "step": 15284
+ },
+ {
+ "epoch": 41.64850136239782,
+ "grad_norm": 5.69114875793457,
+ "learning_rate": 1.3136797764446445e-05,
+ "loss": 0.2483,
+ "step": 15285
+ },
+ {
+ "epoch": 41.65122615803815,
+ "grad_norm": 4.23663330078125,
+ "learning_rate": 1.3135959798134522e-05,
+ "loss": 0.1755,
+ "step": 15286
+ },
+ {
+ "epoch": 41.653950953678475,
+ "grad_norm": 5.8705153465271,
+ "learning_rate": 1.3135121807399842e-05,
+ "loss": 0.2071,
+ "step": 15287
+ },
+ {
+ "epoch": 41.6566757493188,
+ "grad_norm": 4.611892223358154,
+ "learning_rate": 1.3134283792248939e-05,
+ "loss": 0.1189,
+ "step": 15288
+ },
+ {
+ "epoch": 41.65940054495913,
+ "grad_norm": 6.163382530212402,
+ "learning_rate": 1.3133445752688329e-05,
+ "loss": 0.2847,
+ "step": 15289
+ },
+ {
+ "epoch": 41.66212534059945,
+ "grad_norm": 4.534838676452637,
+ "learning_rate": 1.3132607688724547e-05,
+ "loss": 0.1187,
+ "step": 15290
+ },
+ {
+ "epoch": 41.664850136239785,
+ "grad_norm": 5.232635498046875,
+ "learning_rate": 1.3131769600364117e-05,
+ "loss": 0.2185,
+ "step": 15291
+ },
+ {
+ "epoch": 41.66757493188011,
+ "grad_norm": 4.810821056365967,
+ "learning_rate": 1.3130931487613566e-05,
+ "loss": 0.1955,
+ "step": 15292
+ },
+ {
+ "epoch": 41.67029972752044,
+ "grad_norm": 5.155076026916504,
+ "learning_rate": 1.313009335047942e-05,
+ "loss": 0.2985,
+ "step": 15293
+ },
+ {
+ "epoch": 41.67302452316076,
+ "grad_norm": 5.9662604331970215,
+ "learning_rate": 1.312925518896821e-05,
+ "loss": 0.1742,
+ "step": 15294
+ },
+ {
+ "epoch": 41.67574931880109,
+ "grad_norm": 6.306094646453857,
+ "learning_rate": 1.312841700308646e-05,
+ "loss": 0.2366,
+ "step": 15295
+ },
+ {
+ "epoch": 41.678474114441414,
+ "grad_norm": 9.599309921264648,
+ "learning_rate": 1.31275787928407e-05,
+ "loss": 0.285,
+ "step": 15296
+ },
+ {
+ "epoch": 41.68119891008175,
+ "grad_norm": 7.673811435699463,
+ "learning_rate": 1.3126740558237459e-05,
+ "loss": 0.3566,
+ "step": 15297
+ },
+ {
+ "epoch": 41.68392370572207,
+ "grad_norm": 5.701015949249268,
+ "learning_rate": 1.312590229928326e-05,
+ "loss": 0.2245,
+ "step": 15298
+ },
+ {
+ "epoch": 41.6866485013624,
+ "grad_norm": 5.403347015380859,
+ "learning_rate": 1.3125064015984634e-05,
+ "loss": 0.288,
+ "step": 15299
+ },
+ {
+ "epoch": 41.689373297002724,
+ "grad_norm": 5.293545722961426,
+ "learning_rate": 1.3124225708348113e-05,
+ "loss": 0.2547,
+ "step": 15300
+ },
+ {
+ "epoch": 41.69209809264305,
+ "grad_norm": 5.065179347991943,
+ "learning_rate": 1.3123387376380218e-05,
+ "loss": 0.3229,
+ "step": 15301
+ },
+ {
+ "epoch": 41.694822888283376,
+ "grad_norm": 4.2079644203186035,
+ "learning_rate": 1.3122549020087487e-05,
+ "loss": 0.185,
+ "step": 15302
+ },
+ {
+ "epoch": 41.69754768392371,
+ "grad_norm": 5.518126964569092,
+ "learning_rate": 1.3121710639476444e-05,
+ "loss": 0.1744,
+ "step": 15303
+ },
+ {
+ "epoch": 41.700272479564035,
+ "grad_norm": 7.460519313812256,
+ "learning_rate": 1.3120872234553618e-05,
+ "loss": 0.306,
+ "step": 15304
+ },
+ {
+ "epoch": 41.70299727520436,
+ "grad_norm": 67.50646209716797,
+ "learning_rate": 1.3120033805325541e-05,
+ "loss": 0.2707,
+ "step": 15305
+ },
+ {
+ "epoch": 41.705722070844686,
+ "grad_norm": 5.967147350311279,
+ "learning_rate": 1.3119195351798742e-05,
+ "loss": 0.2522,
+ "step": 15306
+ },
+ {
+ "epoch": 41.70844686648501,
+ "grad_norm": 6.045979976654053,
+ "learning_rate": 1.3118356873979745e-05,
+ "loss": 0.2151,
+ "step": 15307
+ },
+ {
+ "epoch": 41.71117166212534,
+ "grad_norm": 10.25633716583252,
+ "learning_rate": 1.3117518371875091e-05,
+ "loss": 0.3222,
+ "step": 15308
+ },
+ {
+ "epoch": 41.71389645776567,
+ "grad_norm": 9.394362449645996,
+ "learning_rate": 1.3116679845491298e-05,
+ "loss": 0.2045,
+ "step": 15309
+ },
+ {
+ "epoch": 41.716621253406,
+ "grad_norm": 12.04206371307373,
+ "learning_rate": 1.3115841294834908e-05,
+ "loss": 0.2087,
+ "step": 15310
+ },
+ {
+ "epoch": 41.71934604904632,
+ "grad_norm": 6.293303966522217,
+ "learning_rate": 1.3115002719912443e-05,
+ "loss": 0.1517,
+ "step": 15311
+ },
+ {
+ "epoch": 41.72207084468665,
+ "grad_norm": 5.3646087646484375,
+ "learning_rate": 1.3114164120730439e-05,
+ "loss": 0.371,
+ "step": 15312
+ },
+ {
+ "epoch": 41.724795640326974,
+ "grad_norm": 8.045680046081543,
+ "learning_rate": 1.3113325497295424e-05,
+ "loss": 0.34,
+ "step": 15313
+ },
+ {
+ "epoch": 41.7275204359673,
+ "grad_norm": 6.927548885345459,
+ "learning_rate": 1.3112486849613933e-05,
+ "loss": 0.14,
+ "step": 15314
+ },
+ {
+ "epoch": 41.73024523160763,
+ "grad_norm": 6.970993518829346,
+ "learning_rate": 1.311164817769249e-05,
+ "loss": 0.1973,
+ "step": 15315
+ },
+ {
+ "epoch": 41.73297002724796,
+ "grad_norm": 5.929052352905273,
+ "learning_rate": 1.3110809481537637e-05,
+ "loss": 0.3159,
+ "step": 15316
+ },
+ {
+ "epoch": 41.735694822888284,
+ "grad_norm": 6.026272296905518,
+ "learning_rate": 1.3109970761155895e-05,
+ "loss": 0.3716,
+ "step": 15317
+ },
+ {
+ "epoch": 41.73841961852861,
+ "grad_norm": 5.031559944152832,
+ "learning_rate": 1.31091320165538e-05,
+ "loss": 0.2368,
+ "step": 15318
+ },
+ {
+ "epoch": 41.741144414168936,
+ "grad_norm": 5.375189304351807,
+ "learning_rate": 1.3108293247737886e-05,
+ "loss": 0.2339,
+ "step": 15319
+ },
+ {
+ "epoch": 41.74386920980926,
+ "grad_norm": 10.033079147338867,
+ "learning_rate": 1.3107454454714686e-05,
+ "loss": 0.1756,
+ "step": 15320
+ },
+ {
+ "epoch": 41.746594005449595,
+ "grad_norm": 7.099547863006592,
+ "learning_rate": 1.310661563749073e-05,
+ "loss": 0.2812,
+ "step": 15321
+ },
+ {
+ "epoch": 41.74931880108992,
+ "grad_norm": 6.8617048263549805,
+ "learning_rate": 1.3105776796072554e-05,
+ "loss": 0.3354,
+ "step": 15322
+ },
+ {
+ "epoch": 41.752043596730246,
+ "grad_norm": 6.954360485076904,
+ "learning_rate": 1.3104937930466684e-05,
+ "loss": 0.1971,
+ "step": 15323
+ },
+ {
+ "epoch": 41.75476839237057,
+ "grad_norm": 5.201631546020508,
+ "learning_rate": 1.3104099040679658e-05,
+ "loss": 0.2502,
+ "step": 15324
+ },
+ {
+ "epoch": 41.7574931880109,
+ "grad_norm": 6.470422267913818,
+ "learning_rate": 1.3103260126718009e-05,
+ "loss": 0.3214,
+ "step": 15325
+ },
+ {
+ "epoch": 41.76021798365122,
+ "grad_norm": 5.426015853881836,
+ "learning_rate": 1.310242118858827e-05,
+ "loss": 0.1899,
+ "step": 15326
+ },
+ {
+ "epoch": 41.762942779291556,
+ "grad_norm": 6.195144176483154,
+ "learning_rate": 1.3101582226296974e-05,
+ "loss": 0.2476,
+ "step": 15327
+ },
+ {
+ "epoch": 41.76566757493188,
+ "grad_norm": 5.391987323760986,
+ "learning_rate": 1.310074323985066e-05,
+ "loss": 0.2142,
+ "step": 15328
+ },
+ {
+ "epoch": 41.76839237057221,
+ "grad_norm": 7.920438766479492,
+ "learning_rate": 1.3099904229255853e-05,
+ "loss": 0.194,
+ "step": 15329
+ },
+ {
+ "epoch": 41.771117166212534,
+ "grad_norm": 5.797364711761475,
+ "learning_rate": 1.3099065194519094e-05,
+ "loss": 0.202,
+ "step": 15330
+ },
+ {
+ "epoch": 41.77384196185286,
+ "grad_norm": 6.113834381103516,
+ "learning_rate": 1.3098226135646913e-05,
+ "loss": 0.3482,
+ "step": 15331
+ },
+ {
+ "epoch": 41.776566757493185,
+ "grad_norm": 5.577930927276611,
+ "learning_rate": 1.3097387052645848e-05,
+ "loss": 0.3937,
+ "step": 15332
+ },
+ {
+ "epoch": 41.77929155313352,
+ "grad_norm": 5.87706184387207,
+ "learning_rate": 1.3096547945522431e-05,
+ "loss": 0.226,
+ "step": 15333
+ },
+ {
+ "epoch": 41.782016348773844,
+ "grad_norm": 8.071033477783203,
+ "learning_rate": 1.3095708814283199e-05,
+ "loss": 0.1975,
+ "step": 15334
+ },
+ {
+ "epoch": 41.78474114441417,
+ "grad_norm": 14.369377136230469,
+ "learning_rate": 1.3094869658934684e-05,
+ "loss": 0.2438,
+ "step": 15335
+ },
+ {
+ "epoch": 41.787465940054496,
+ "grad_norm": 7.034031391143799,
+ "learning_rate": 1.3094030479483428e-05,
+ "loss": 0.1746,
+ "step": 15336
+ },
+ {
+ "epoch": 41.79019073569482,
+ "grad_norm": 6.4937920570373535,
+ "learning_rate": 1.3093191275935957e-05,
+ "loss": 0.1385,
+ "step": 15337
+ },
+ {
+ "epoch": 41.79291553133515,
+ "grad_norm": 6.9117207527160645,
+ "learning_rate": 1.3092352048298817e-05,
+ "loss": 0.2037,
+ "step": 15338
+ },
+ {
+ "epoch": 41.79564032697548,
+ "grad_norm": 4.784533977508545,
+ "learning_rate": 1.3091512796578536e-05,
+ "loss": 0.1467,
+ "step": 15339
+ },
+ {
+ "epoch": 41.798365122615806,
+ "grad_norm": 7.152564525604248,
+ "learning_rate": 1.3090673520781656e-05,
+ "loss": 0.1942,
+ "step": 15340
+ },
+ {
+ "epoch": 41.80108991825613,
+ "grad_norm": 6.839911937713623,
+ "learning_rate": 1.3089834220914708e-05,
+ "loss": 0.1905,
+ "step": 15341
+ },
+ {
+ "epoch": 41.80381471389646,
+ "grad_norm": 7.334344387054443,
+ "learning_rate": 1.308899489698423e-05,
+ "loss": 0.1861,
+ "step": 15342
+ },
+ {
+ "epoch": 41.80653950953678,
+ "grad_norm": 6.282195568084717,
+ "learning_rate": 1.308815554899676e-05,
+ "loss": 0.2075,
+ "step": 15343
+ },
+ {
+ "epoch": 41.80926430517711,
+ "grad_norm": 5.372369289398193,
+ "learning_rate": 1.3087316176958831e-05,
+ "loss": 0.3172,
+ "step": 15344
+ },
+ {
+ "epoch": 41.81198910081744,
+ "grad_norm": 4.968111038208008,
+ "learning_rate": 1.3086476780876984e-05,
+ "loss": 0.2896,
+ "step": 15345
+ },
+ {
+ "epoch": 41.81471389645777,
+ "grad_norm": 5.8525776863098145,
+ "learning_rate": 1.308563736075776e-05,
+ "loss": 0.2248,
+ "step": 15346
+ },
+ {
+ "epoch": 41.817438692098094,
+ "grad_norm": 5.676025390625,
+ "learning_rate": 1.3084797916607685e-05,
+ "loss": 0.2509,
+ "step": 15347
+ },
+ {
+ "epoch": 41.82016348773842,
+ "grad_norm": 4.851386070251465,
+ "learning_rate": 1.3083958448433309e-05,
+ "loss": 0.2982,
+ "step": 15348
+ },
+ {
+ "epoch": 41.822888283378745,
+ "grad_norm": 6.4344916343688965,
+ "learning_rate": 1.308311895624116e-05,
+ "loss": 0.2299,
+ "step": 15349
+ },
+ {
+ "epoch": 41.82561307901907,
+ "grad_norm": 6.615203380584717,
+ "learning_rate": 1.3082279440037781e-05,
+ "loss": 0.2948,
+ "step": 15350
+ },
+ {
+ "epoch": 41.828337874659404,
+ "grad_norm": 5.562697887420654,
+ "learning_rate": 1.3081439899829708e-05,
+ "loss": 0.1624,
+ "step": 15351
+ },
+ {
+ "epoch": 41.83106267029973,
+ "grad_norm": 12.665985107421875,
+ "learning_rate": 1.3080600335623481e-05,
+ "loss": 0.3642,
+ "step": 15352
+ },
+ {
+ "epoch": 41.833787465940055,
+ "grad_norm": 6.387678146362305,
+ "learning_rate": 1.3079760747425639e-05,
+ "loss": 0.2876,
+ "step": 15353
+ },
+ {
+ "epoch": 41.83651226158038,
+ "grad_norm": 6.966700553894043,
+ "learning_rate": 1.3078921135242717e-05,
+ "loss": 0.3378,
+ "step": 15354
+ },
+ {
+ "epoch": 41.83923705722071,
+ "grad_norm": 6.500558376312256,
+ "learning_rate": 1.307808149908126e-05,
+ "loss": 0.2065,
+ "step": 15355
+ },
+ {
+ "epoch": 41.84196185286103,
+ "grad_norm": 5.680296897888184,
+ "learning_rate": 1.3077241838947799e-05,
+ "loss": 0.1368,
+ "step": 15356
+ },
+ {
+ "epoch": 41.844686648501366,
+ "grad_norm": 6.377245903015137,
+ "learning_rate": 1.307640215484888e-05,
+ "loss": 0.203,
+ "step": 15357
+ },
+ {
+ "epoch": 41.84741144414169,
+ "grad_norm": 22.68838119506836,
+ "learning_rate": 1.3075562446791042e-05,
+ "loss": 0.1714,
+ "step": 15358
+ },
+ {
+ "epoch": 41.85013623978202,
+ "grad_norm": 8.626298904418945,
+ "learning_rate": 1.3074722714780817e-05,
+ "loss": 0.2568,
+ "step": 15359
+ },
+ {
+ "epoch": 41.85286103542234,
+ "grad_norm": 6.1405534744262695,
+ "learning_rate": 1.3073882958824755e-05,
+ "loss": 0.1826,
+ "step": 15360
+ },
+ {
+ "epoch": 41.85558583106267,
+ "grad_norm": 7.051835060119629,
+ "learning_rate": 1.307304317892939e-05,
+ "loss": 0.2987,
+ "step": 15361
+ },
+ {
+ "epoch": 41.858310626702995,
+ "grad_norm": 6.392403602600098,
+ "learning_rate": 1.3072203375101263e-05,
+ "loss": 0.2063,
+ "step": 15362
+ },
+ {
+ "epoch": 41.86103542234333,
+ "grad_norm": 6.399654388427734,
+ "learning_rate": 1.3071363547346916e-05,
+ "loss": 0.3133,
+ "step": 15363
+ },
+ {
+ "epoch": 41.86376021798365,
+ "grad_norm": 6.283120155334473,
+ "learning_rate": 1.3070523695672887e-05,
+ "loss": 0.2275,
+ "step": 15364
+ },
+ {
+ "epoch": 41.86648501362398,
+ "grad_norm": 6.596218585968018,
+ "learning_rate": 1.3069683820085722e-05,
+ "loss": 0.3038,
+ "step": 15365
+ },
+ {
+ "epoch": 41.869209809264305,
+ "grad_norm": 7.6157097816467285,
+ "learning_rate": 1.3068843920591953e-05,
+ "loss": 0.2207,
+ "step": 15366
+ },
+ {
+ "epoch": 41.87193460490463,
+ "grad_norm": 5.655492305755615,
+ "learning_rate": 1.306800399719813e-05,
+ "loss": 0.2601,
+ "step": 15367
+ },
+ {
+ "epoch": 41.87465940054496,
+ "grad_norm": 6.912761688232422,
+ "learning_rate": 1.306716404991079e-05,
+ "loss": 0.2409,
+ "step": 15368
+ },
+ {
+ "epoch": 41.87738419618529,
+ "grad_norm": 6.548763275146484,
+ "learning_rate": 1.3066324078736474e-05,
+ "loss": 0.212,
+ "step": 15369
+ },
+ {
+ "epoch": 41.880108991825615,
+ "grad_norm": 5.032128810882568,
+ "learning_rate": 1.3065484083681726e-05,
+ "loss": 0.2292,
+ "step": 15370
+ },
+ {
+ "epoch": 41.88283378746594,
+ "grad_norm": 6.4837870597839355,
+ "learning_rate": 1.3064644064753088e-05,
+ "loss": 0.3713,
+ "step": 15371
+ },
+ {
+ "epoch": 41.88555858310627,
+ "grad_norm": 5.282232284545898,
+ "learning_rate": 1.3063804021957096e-05,
+ "loss": 0.1822,
+ "step": 15372
+ },
+ {
+ "epoch": 41.88828337874659,
+ "grad_norm": 7.438727378845215,
+ "learning_rate": 1.3062963955300301e-05,
+ "loss": 0.191,
+ "step": 15373
+ },
+ {
+ "epoch": 41.89100817438692,
+ "grad_norm": 5.965965747833252,
+ "learning_rate": 1.306212386478924e-05,
+ "loss": 0.297,
+ "step": 15374
+ },
+ {
+ "epoch": 41.89373297002725,
+ "grad_norm": 7.361672878265381,
+ "learning_rate": 1.3061283750430457e-05,
+ "loss": 0.1581,
+ "step": 15375
+ },
+ {
+ "epoch": 41.89645776566758,
+ "grad_norm": 5.851138114929199,
+ "learning_rate": 1.3060443612230493e-05,
+ "loss": 0.1822,
+ "step": 15376
+ },
+ {
+ "epoch": 41.8991825613079,
+ "grad_norm": 5.922891139984131,
+ "learning_rate": 1.3059603450195897e-05,
+ "loss": 0.2337,
+ "step": 15377
+ },
+ {
+ "epoch": 41.90190735694823,
+ "grad_norm": 5.012266635894775,
+ "learning_rate": 1.30587632643332e-05,
+ "loss": 0.2147,
+ "step": 15378
+ },
+ {
+ "epoch": 41.904632152588555,
+ "grad_norm": 5.913313388824463,
+ "learning_rate": 1.305792305464896e-05,
+ "loss": 0.2551,
+ "step": 15379
+ },
+ {
+ "epoch": 41.90735694822888,
+ "grad_norm": 6.6129608154296875,
+ "learning_rate": 1.305708282114971e-05,
+ "loss": 0.3024,
+ "step": 15380
+ },
+ {
+ "epoch": 41.91008174386921,
+ "grad_norm": 6.702880382537842,
+ "learning_rate": 1.3056242563842003e-05,
+ "loss": 0.4563,
+ "step": 15381
+ },
+ {
+ "epoch": 41.91280653950954,
+ "grad_norm": 7.25404691696167,
+ "learning_rate": 1.3055402282732372e-05,
+ "loss": 0.2057,
+ "step": 15382
+ },
+ {
+ "epoch": 41.915531335149865,
+ "grad_norm": 6.396892547607422,
+ "learning_rate": 1.3054561977827369e-05,
+ "loss": 0.2443,
+ "step": 15383
+ },
+ {
+ "epoch": 41.91825613079019,
+ "grad_norm": 6.1185479164123535,
+ "learning_rate": 1.3053721649133536e-05,
+ "loss": 0.1937,
+ "step": 15384
+ },
+ {
+ "epoch": 41.920980926430516,
+ "grad_norm": 6.4015631675720215,
+ "learning_rate": 1.3052881296657414e-05,
+ "loss": 0.1727,
+ "step": 15385
+ },
+ {
+ "epoch": 41.92370572207084,
+ "grad_norm": 6.655409336090088,
+ "learning_rate": 1.305204092040555e-05,
+ "loss": 0.1824,
+ "step": 15386
+ },
+ {
+ "epoch": 41.926430517711175,
+ "grad_norm": 5.204779148101807,
+ "learning_rate": 1.3051200520384493e-05,
+ "loss": 0.2001,
+ "step": 15387
+ },
+ {
+ "epoch": 41.9291553133515,
+ "grad_norm": 5.45819616317749,
+ "learning_rate": 1.3050360096600782e-05,
+ "loss": 0.1931,
+ "step": 15388
+ },
+ {
+ "epoch": 41.93188010899183,
+ "grad_norm": 5.179225444793701,
+ "learning_rate": 1.304951964906097e-05,
+ "loss": 0.2817,
+ "step": 15389
+ },
+ {
+ "epoch": 41.93460490463215,
+ "grad_norm": 5.597849369049072,
+ "learning_rate": 1.304867917777159e-05,
+ "loss": 0.29,
+ "step": 15390
+ },
+ {
+ "epoch": 41.93732970027248,
+ "grad_norm": 8.691641807556152,
+ "learning_rate": 1.30478386827392e-05,
+ "loss": 0.3512,
+ "step": 15391
+ },
+ {
+ "epoch": 41.940054495912804,
+ "grad_norm": 5.923669815063477,
+ "learning_rate": 1.3046998163970337e-05,
+ "loss": 0.2259,
+ "step": 15392
+ },
+ {
+ "epoch": 41.94277929155314,
+ "grad_norm": 6.423624515533447,
+ "learning_rate": 1.3046157621471554e-05,
+ "loss": 0.2494,
+ "step": 15393
+ },
+ {
+ "epoch": 41.94550408719346,
+ "grad_norm": 6.862639427185059,
+ "learning_rate": 1.304531705524939e-05,
+ "loss": 0.2584,
+ "step": 15394
+ },
+ {
+ "epoch": 41.94822888283379,
+ "grad_norm": 6.9730730056762695,
+ "learning_rate": 1.3044476465310393e-05,
+ "loss": 0.3208,
+ "step": 15395
+ },
+ {
+ "epoch": 41.950953678474114,
+ "grad_norm": 4.9324631690979,
+ "learning_rate": 1.3043635851661114e-05,
+ "loss": 0.279,
+ "step": 15396
+ },
+ {
+ "epoch": 41.95367847411444,
+ "grad_norm": 5.757242202758789,
+ "learning_rate": 1.3042795214308099e-05,
+ "loss": 0.3135,
+ "step": 15397
+ },
+ {
+ "epoch": 41.956403269754766,
+ "grad_norm": 6.020074367523193,
+ "learning_rate": 1.304195455325789e-05,
+ "loss": 0.258,
+ "step": 15398
+ },
+ {
+ "epoch": 41.95912806539509,
+ "grad_norm": 5.665360927581787,
+ "learning_rate": 1.3041113868517039e-05,
+ "loss": 0.3511,
+ "step": 15399
+ },
+ {
+ "epoch": 41.961852861035425,
+ "grad_norm": 6.090458393096924,
+ "learning_rate": 1.3040273160092089e-05,
+ "loss": 0.2254,
+ "step": 15400
+ },
+ {
+ "epoch": 41.96457765667575,
+ "grad_norm": 7.211927890777588,
+ "learning_rate": 1.3039432427989592e-05,
+ "loss": 0.1688,
+ "step": 15401
+ },
+ {
+ "epoch": 41.967302452316076,
+ "grad_norm": 6.268174648284912,
+ "learning_rate": 1.303859167221609e-05,
+ "loss": 0.3152,
+ "step": 15402
+ },
+ {
+ "epoch": 41.9700272479564,
+ "grad_norm": 4.178107261657715,
+ "learning_rate": 1.3037750892778136e-05,
+ "loss": 0.3118,
+ "step": 15403
+ },
+ {
+ "epoch": 41.97275204359673,
+ "grad_norm": 5.503861427307129,
+ "learning_rate": 1.3036910089682272e-05,
+ "loss": 0.2277,
+ "step": 15404
+ },
+ {
+ "epoch": 41.97547683923706,
+ "grad_norm": 5.349115371704102,
+ "learning_rate": 1.3036069262935057e-05,
+ "loss": 0.2132,
+ "step": 15405
+ },
+ {
+ "epoch": 41.97820163487739,
+ "grad_norm": 5.785735607147217,
+ "learning_rate": 1.3035228412543026e-05,
+ "loss": 0.2861,
+ "step": 15406
+ },
+ {
+ "epoch": 41.98092643051771,
+ "grad_norm": 6.72636604309082,
+ "learning_rate": 1.3034387538512739e-05,
+ "loss": 0.3956,
+ "step": 15407
+ },
+ {
+ "epoch": 41.98365122615804,
+ "grad_norm": 6.461788177490234,
+ "learning_rate": 1.3033546640850734e-05,
+ "loss": 0.2765,
+ "step": 15408
+ },
+ {
+ "epoch": 41.986376021798364,
+ "grad_norm": 6.205533504486084,
+ "learning_rate": 1.3032705719563569e-05,
+ "loss": 0.3482,
+ "step": 15409
+ },
+ {
+ "epoch": 41.98910081743869,
+ "grad_norm": 6.210002899169922,
+ "learning_rate": 1.3031864774657788e-05,
+ "loss": 0.1491,
+ "step": 15410
+ },
+ {
+ "epoch": 41.991825613079016,
+ "grad_norm": 6.160497665405273,
+ "learning_rate": 1.3031023806139944e-05,
+ "loss": 0.3325,
+ "step": 15411
+ },
+ {
+ "epoch": 41.99455040871935,
+ "grad_norm": 5.840280055999756,
+ "learning_rate": 1.303018281401658e-05,
+ "loss": 0.1688,
+ "step": 15412
+ },
+ {
+ "epoch": 41.997275204359674,
+ "grad_norm": 6.895257472991943,
+ "learning_rate": 1.3029341798294253e-05,
+ "loss": 0.1855,
+ "step": 15413
+ },
+ {
+ "epoch": 42.0,
+ "grad_norm": 5.932795524597168,
+ "learning_rate": 1.3028500758979507e-05,
+ "loss": 0.1838,
+ "step": 15414
+ },
+ {
+ "epoch": 42.002724795640326,
+ "grad_norm": 5.44658899307251,
+ "learning_rate": 1.3027659696078898e-05,
+ "loss": 0.2222,
+ "step": 15415
+ },
+ {
+ "epoch": 42.00544959128065,
+ "grad_norm": 5.552676677703857,
+ "learning_rate": 1.302681860959897e-05,
+ "loss": 0.2783,
+ "step": 15416
+ },
+ {
+ "epoch": 42.00817438692098,
+ "grad_norm": 4.85700798034668,
+ "learning_rate": 1.3025977499546279e-05,
+ "loss": 0.1188,
+ "step": 15417
+ },
+ {
+ "epoch": 42.01089918256131,
+ "grad_norm": 6.233191967010498,
+ "learning_rate": 1.3025136365927371e-05,
+ "loss": 0.1516,
+ "step": 15418
+ },
+ {
+ "epoch": 42.013623978201636,
+ "grad_norm": 4.825685501098633,
+ "learning_rate": 1.3024295208748798e-05,
+ "loss": 0.2505,
+ "step": 15419
+ },
+ {
+ "epoch": 42.01634877384196,
+ "grad_norm": 5.147552490234375,
+ "learning_rate": 1.3023454028017111e-05,
+ "loss": 0.1792,
+ "step": 15420
+ },
+ {
+ "epoch": 42.01907356948229,
+ "grad_norm": 4.855800628662109,
+ "learning_rate": 1.3022612823738861e-05,
+ "loss": 0.26,
+ "step": 15421
+ },
+ {
+ "epoch": 42.02179836512261,
+ "grad_norm": 5.426023960113525,
+ "learning_rate": 1.3021771595920601e-05,
+ "loss": 0.2316,
+ "step": 15422
+ },
+ {
+ "epoch": 42.02452316076294,
+ "grad_norm": 6.038941860198975,
+ "learning_rate": 1.3020930344568881e-05,
+ "loss": 0.27,
+ "step": 15423
+ },
+ {
+ "epoch": 42.02724795640327,
+ "grad_norm": 6.548643589019775,
+ "learning_rate": 1.3020089069690252e-05,
+ "loss": 0.2178,
+ "step": 15424
+ },
+ {
+ "epoch": 42.0299727520436,
+ "grad_norm": 6.110074043273926,
+ "learning_rate": 1.3019247771291265e-05,
+ "loss": 0.2289,
+ "step": 15425
+ },
+ {
+ "epoch": 42.032697547683924,
+ "grad_norm": 5.3518195152282715,
+ "learning_rate": 1.3018406449378475e-05,
+ "loss": 0.2506,
+ "step": 15426
+ },
+ {
+ "epoch": 42.03542234332425,
+ "grad_norm": 5.930940628051758,
+ "learning_rate": 1.3017565103958434e-05,
+ "loss": 0.1571,
+ "step": 15427
+ },
+ {
+ "epoch": 42.038147138964575,
+ "grad_norm": 4.607296943664551,
+ "learning_rate": 1.3016723735037693e-05,
+ "loss": 0.1317,
+ "step": 15428
+ },
+ {
+ "epoch": 42.0408719346049,
+ "grad_norm": 5.928393840789795,
+ "learning_rate": 1.3015882342622804e-05,
+ "loss": 0.3472,
+ "step": 15429
+ },
+ {
+ "epoch": 42.043596730245234,
+ "grad_norm": 6.279974937438965,
+ "learning_rate": 1.3015040926720319e-05,
+ "loss": 0.1874,
+ "step": 15430
+ },
+ {
+ "epoch": 42.04632152588556,
+ "grad_norm": 4.728000164031982,
+ "learning_rate": 1.3014199487336792e-05,
+ "loss": 0.1772,
+ "step": 15431
+ },
+ {
+ "epoch": 42.049046321525886,
+ "grad_norm": 8.560091972351074,
+ "learning_rate": 1.3013358024478778e-05,
+ "loss": 0.1634,
+ "step": 15432
+ },
+ {
+ "epoch": 42.05177111716621,
+ "grad_norm": 6.110546112060547,
+ "learning_rate": 1.3012516538152828e-05,
+ "loss": 0.1488,
+ "step": 15433
+ },
+ {
+ "epoch": 42.05449591280654,
+ "grad_norm": 5.91204309463501,
+ "learning_rate": 1.3011675028365496e-05,
+ "loss": 0.1645,
+ "step": 15434
+ },
+ {
+ "epoch": 42.05722070844686,
+ "grad_norm": 6.979456901550293,
+ "learning_rate": 1.3010833495123339e-05,
+ "loss": 0.18,
+ "step": 15435
+ },
+ {
+ "epoch": 42.059945504087196,
+ "grad_norm": 4.777736186981201,
+ "learning_rate": 1.3009991938432904e-05,
+ "loss": 0.2222,
+ "step": 15436
+ },
+ {
+ "epoch": 42.06267029972752,
+ "grad_norm": 4.932180881500244,
+ "learning_rate": 1.3009150358300751e-05,
+ "loss": 0.1425,
+ "step": 15437
+ },
+ {
+ "epoch": 42.06539509536785,
+ "grad_norm": 5.368439197540283,
+ "learning_rate": 1.3008308754733428e-05,
+ "loss": 0.1572,
+ "step": 15438
+ },
+ {
+ "epoch": 42.06811989100817,
+ "grad_norm": 6.10922908782959,
+ "learning_rate": 1.3007467127737497e-05,
+ "loss": 0.368,
+ "step": 15439
+ },
+ {
+ "epoch": 42.0708446866485,
+ "grad_norm": 10.76334285736084,
+ "learning_rate": 1.3006625477319509e-05,
+ "loss": 0.2007,
+ "step": 15440
+ },
+ {
+ "epoch": 42.073569482288825,
+ "grad_norm": 8.216444969177246,
+ "learning_rate": 1.3005783803486015e-05,
+ "loss": 0.1735,
+ "step": 15441
+ },
+ {
+ "epoch": 42.07629427792916,
+ "grad_norm": 5.379700183868408,
+ "learning_rate": 1.3004942106243576e-05,
+ "loss": 0.1608,
+ "step": 15442
+ },
+ {
+ "epoch": 42.079019073569484,
+ "grad_norm": 4.8208818435668945,
+ "learning_rate": 1.3004100385598744e-05,
+ "loss": 0.2262,
+ "step": 15443
+ },
+ {
+ "epoch": 42.08174386920981,
+ "grad_norm": 5.083765983581543,
+ "learning_rate": 1.3003258641558073e-05,
+ "loss": 0.3147,
+ "step": 15444
+ },
+ {
+ "epoch": 42.084468664850135,
+ "grad_norm": 11.18905258178711,
+ "learning_rate": 1.3002416874128125e-05,
+ "loss": 0.243,
+ "step": 15445
+ },
+ {
+ "epoch": 42.08719346049046,
+ "grad_norm": 10.343413352966309,
+ "learning_rate": 1.3001575083315447e-05,
+ "loss": 0.3232,
+ "step": 15446
+ },
+ {
+ "epoch": 42.08991825613079,
+ "grad_norm": 6.096678256988525,
+ "learning_rate": 1.30007332691266e-05,
+ "loss": 0.1783,
+ "step": 15447
+ },
+ {
+ "epoch": 42.09264305177112,
+ "grad_norm": 4.937675952911377,
+ "learning_rate": 1.2999891431568141e-05,
+ "loss": 0.1357,
+ "step": 15448
+ },
+ {
+ "epoch": 42.095367847411445,
+ "grad_norm": 5.313512802124023,
+ "learning_rate": 1.299904957064662e-05,
+ "loss": 0.1648,
+ "step": 15449
+ },
+ {
+ "epoch": 42.09809264305177,
+ "grad_norm": 6.183883190155029,
+ "learning_rate": 1.29982076863686e-05,
+ "loss": 0.1842,
+ "step": 15450
+ },
+ {
+ "epoch": 42.1008174386921,
+ "grad_norm": 6.514837265014648,
+ "learning_rate": 1.2997365778740636e-05,
+ "loss": 0.245,
+ "step": 15451
+ },
+ {
+ "epoch": 42.10354223433242,
+ "grad_norm": 5.0147504806518555,
+ "learning_rate": 1.2996523847769283e-05,
+ "loss": 0.1951,
+ "step": 15452
+ },
+ {
+ "epoch": 42.10626702997275,
+ "grad_norm": 5.101580619812012,
+ "learning_rate": 1.2995681893461098e-05,
+ "loss": 0.1931,
+ "step": 15453
+ },
+ {
+ "epoch": 42.10899182561308,
+ "grad_norm": 5.041823387145996,
+ "learning_rate": 1.2994839915822639e-05,
+ "loss": 0.1534,
+ "step": 15454
+ },
+ {
+ "epoch": 42.11171662125341,
+ "grad_norm": 5.5947585105896,
+ "learning_rate": 1.2993997914860464e-05,
+ "loss": 0.1637,
+ "step": 15455
+ },
+ {
+ "epoch": 42.11444141689373,
+ "grad_norm": 5.6965837478637695,
+ "learning_rate": 1.2993155890581127e-05,
+ "loss": 0.1769,
+ "step": 15456
+ },
+ {
+ "epoch": 42.11716621253406,
+ "grad_norm": 5.925455570220947,
+ "learning_rate": 1.2992313842991189e-05,
+ "loss": 0.2349,
+ "step": 15457
+ },
+ {
+ "epoch": 42.119891008174385,
+ "grad_norm": 10.506064414978027,
+ "learning_rate": 1.2991471772097211e-05,
+ "loss": 0.1553,
+ "step": 15458
+ },
+ {
+ "epoch": 42.12261580381471,
+ "grad_norm": 4.932344436645508,
+ "learning_rate": 1.2990629677905741e-05,
+ "loss": 0.1751,
+ "step": 15459
+ },
+ {
+ "epoch": 42.12534059945504,
+ "grad_norm": 5.502622127532959,
+ "learning_rate": 1.298978756042335e-05,
+ "loss": 0.1926,
+ "step": 15460
+ },
+ {
+ "epoch": 42.12806539509537,
+ "grad_norm": 5.065340042114258,
+ "learning_rate": 1.2988945419656585e-05,
+ "loss": 0.1705,
+ "step": 15461
+ },
+ {
+ "epoch": 42.130790190735695,
+ "grad_norm": 7.667355537414551,
+ "learning_rate": 1.2988103255612012e-05,
+ "loss": 0.2387,
+ "step": 15462
+ },
+ {
+ "epoch": 42.13351498637602,
+ "grad_norm": 12.919604301452637,
+ "learning_rate": 1.2987261068296184e-05,
+ "loss": 0.2179,
+ "step": 15463
+ },
+ {
+ "epoch": 42.13623978201635,
+ "grad_norm": 5.050688743591309,
+ "learning_rate": 1.2986418857715663e-05,
+ "loss": 0.1942,
+ "step": 15464
+ },
+ {
+ "epoch": 42.13896457765667,
+ "grad_norm": 6.5861053466796875,
+ "learning_rate": 1.298557662387701e-05,
+ "loss": 0.1959,
+ "step": 15465
+ },
+ {
+ "epoch": 42.141689373297005,
+ "grad_norm": 9.029101371765137,
+ "learning_rate": 1.2984734366786782e-05,
+ "loss": 0.2185,
+ "step": 15466
+ },
+ {
+ "epoch": 42.14441416893733,
+ "grad_norm": 6.017579078674316,
+ "learning_rate": 1.298389208645154e-05,
+ "loss": 0.2112,
+ "step": 15467
+ },
+ {
+ "epoch": 42.14713896457766,
+ "grad_norm": 5.677315711975098,
+ "learning_rate": 1.2983049782877842e-05,
+ "loss": 0.3474,
+ "step": 15468
+ },
+ {
+ "epoch": 42.14986376021798,
+ "grad_norm": 6.018444538116455,
+ "learning_rate": 1.2982207456072246e-05,
+ "loss": 0.1863,
+ "step": 15469
+ },
+ {
+ "epoch": 42.15258855585831,
+ "grad_norm": 5.981948375701904,
+ "learning_rate": 1.2981365106041317e-05,
+ "loss": 0.2695,
+ "step": 15470
+ },
+ {
+ "epoch": 42.155313351498634,
+ "grad_norm": 6.641706466674805,
+ "learning_rate": 1.298052273279161e-05,
+ "loss": 0.2976,
+ "step": 15471
+ },
+ {
+ "epoch": 42.15803814713897,
+ "grad_norm": 6.385588645935059,
+ "learning_rate": 1.297968033632969e-05,
+ "loss": 0.2371,
+ "step": 15472
+ },
+ {
+ "epoch": 42.16076294277929,
+ "grad_norm": 7.496885776519775,
+ "learning_rate": 1.2978837916662113e-05,
+ "loss": 0.392,
+ "step": 15473
+ },
+ {
+ "epoch": 42.16348773841962,
+ "grad_norm": 5.354748249053955,
+ "learning_rate": 1.2977995473795444e-05,
+ "loss": 0.2055,
+ "step": 15474
+ },
+ {
+ "epoch": 42.166212534059945,
+ "grad_norm": 9.016228675842285,
+ "learning_rate": 1.2977153007736241e-05,
+ "loss": 0.2193,
+ "step": 15475
+ },
+ {
+ "epoch": 42.16893732970027,
+ "grad_norm": 5.192065715789795,
+ "learning_rate": 1.2976310518491068e-05,
+ "loss": 0.4163,
+ "step": 15476
+ },
+ {
+ "epoch": 42.171662125340596,
+ "grad_norm": 5.013331890106201,
+ "learning_rate": 1.2975468006066483e-05,
+ "loss": 0.2784,
+ "step": 15477
+ },
+ {
+ "epoch": 42.17438692098093,
+ "grad_norm": 5.486303806304932,
+ "learning_rate": 1.2974625470469051e-05,
+ "loss": 0.4019,
+ "step": 15478
+ },
+ {
+ "epoch": 42.177111716621255,
+ "grad_norm": 10.600406646728516,
+ "learning_rate": 1.297378291170533e-05,
+ "loss": 0.2654,
+ "step": 15479
+ },
+ {
+ "epoch": 42.17983651226158,
+ "grad_norm": 22.355682373046875,
+ "learning_rate": 1.2972940329781885e-05,
+ "loss": 0.2869,
+ "step": 15480
+ },
+ {
+ "epoch": 42.182561307901906,
+ "grad_norm": 7.4673357009887695,
+ "learning_rate": 1.2972097724705273e-05,
+ "loss": 0.1731,
+ "step": 15481
+ },
+ {
+ "epoch": 42.18528610354223,
+ "grad_norm": 7.031222343444824,
+ "learning_rate": 1.2971255096482063e-05,
+ "loss": 0.2067,
+ "step": 15482
+ },
+ {
+ "epoch": 42.18801089918256,
+ "grad_norm": 7.047456741333008,
+ "learning_rate": 1.297041244511881e-05,
+ "loss": 0.1381,
+ "step": 15483
+ },
+ {
+ "epoch": 42.19073569482289,
+ "grad_norm": 5.458183288574219,
+ "learning_rate": 1.2969569770622084e-05,
+ "loss": 0.2736,
+ "step": 15484
+ },
+ {
+ "epoch": 42.19346049046322,
+ "grad_norm": 5.774094581604004,
+ "learning_rate": 1.2968727072998442e-05,
+ "loss": 0.2545,
+ "step": 15485
+ },
+ {
+ "epoch": 42.19618528610354,
+ "grad_norm": 8.14728832244873,
+ "learning_rate": 1.2967884352254451e-05,
+ "loss": 0.2662,
+ "step": 15486
+ },
+ {
+ "epoch": 42.19891008174387,
+ "grad_norm": 5.487812519073486,
+ "learning_rate": 1.2967041608396671e-05,
+ "loss": 0.2005,
+ "step": 15487
+ },
+ {
+ "epoch": 42.201634877384194,
+ "grad_norm": 5.376804351806641,
+ "learning_rate": 1.296619884143167e-05,
+ "loss": 0.3924,
+ "step": 15488
+ },
+ {
+ "epoch": 42.20435967302452,
+ "grad_norm": 7.430761337280273,
+ "learning_rate": 1.2965356051366003e-05,
+ "loss": 0.3456,
+ "step": 15489
+ },
+ {
+ "epoch": 42.20708446866485,
+ "grad_norm": 6.076028347015381,
+ "learning_rate": 1.296451323820624e-05,
+ "loss": 0.2327,
+ "step": 15490
+ },
+ {
+ "epoch": 42.20980926430518,
+ "grad_norm": 5.0028395652771,
+ "learning_rate": 1.2963670401958944e-05,
+ "loss": 0.13,
+ "step": 15491
+ },
+ {
+ "epoch": 42.212534059945504,
+ "grad_norm": 5.353379726409912,
+ "learning_rate": 1.2962827542630678e-05,
+ "loss": 0.2015,
+ "step": 15492
+ },
+ {
+ "epoch": 42.21525885558583,
+ "grad_norm": 7.217342853546143,
+ "learning_rate": 1.2961984660228005e-05,
+ "loss": 0.1236,
+ "step": 15493
+ },
+ {
+ "epoch": 42.217983651226156,
+ "grad_norm": 6.616295337677002,
+ "learning_rate": 1.2961141754757494e-05,
+ "loss": 0.2788,
+ "step": 15494
+ },
+ {
+ "epoch": 42.22070844686648,
+ "grad_norm": 5.089466094970703,
+ "learning_rate": 1.2960298826225701e-05,
+ "loss": 0.2865,
+ "step": 15495
+ },
+ {
+ "epoch": 42.223433242506815,
+ "grad_norm": 5.868330478668213,
+ "learning_rate": 1.2959455874639202e-05,
+ "loss": 0.2689,
+ "step": 15496
+ },
+ {
+ "epoch": 42.22615803814714,
+ "grad_norm": 5.696859836578369,
+ "learning_rate": 1.2958612900004552e-05,
+ "loss": 0.2144,
+ "step": 15497
+ },
+ {
+ "epoch": 42.228882833787466,
+ "grad_norm": 6.412961959838867,
+ "learning_rate": 1.2957769902328324e-05,
+ "loss": 0.2056,
+ "step": 15498
+ },
+ {
+ "epoch": 42.23160762942779,
+ "grad_norm": 6.366140842437744,
+ "learning_rate": 1.2956926881617073e-05,
+ "loss": 0.1171,
+ "step": 15499
+ },
+ {
+ "epoch": 42.23433242506812,
+ "grad_norm": 4.624966621398926,
+ "learning_rate": 1.2956083837877376e-05,
+ "loss": 0.1428,
+ "step": 15500
+ },
+ {
+ "epoch": 42.237057220708444,
+ "grad_norm": 8.231295585632324,
+ "learning_rate": 1.2955240771115788e-05,
+ "loss": 0.3253,
+ "step": 15501
+ },
+ {
+ "epoch": 42.23978201634878,
+ "grad_norm": 5.296624183654785,
+ "learning_rate": 1.2954397681338886e-05,
+ "loss": 0.1492,
+ "step": 15502
+ },
+ {
+ "epoch": 42.2425068119891,
+ "grad_norm": 5.643084526062012,
+ "learning_rate": 1.2953554568553225e-05,
+ "loss": 0.2552,
+ "step": 15503
+ },
+ {
+ "epoch": 42.24523160762943,
+ "grad_norm": 5.668529987335205,
+ "learning_rate": 1.2952711432765381e-05,
+ "loss": 0.2309,
+ "step": 15504
+ },
+ {
+ "epoch": 42.247956403269754,
+ "grad_norm": 5.27156925201416,
+ "learning_rate": 1.2951868273981912e-05,
+ "loss": 0.1807,
+ "step": 15505
+ },
+ {
+ "epoch": 42.25068119891008,
+ "grad_norm": 5.571093559265137,
+ "learning_rate": 1.2951025092209391e-05,
+ "loss": 0.2919,
+ "step": 15506
+ },
+ {
+ "epoch": 42.253405994550405,
+ "grad_norm": 13.448417663574219,
+ "learning_rate": 1.2950181887454374e-05,
+ "loss": 0.1656,
+ "step": 15507
+ },
+ {
+ "epoch": 42.25613079019074,
+ "grad_norm": 5.163852214813232,
+ "learning_rate": 1.2949338659723443e-05,
+ "loss": 0.2104,
+ "step": 15508
+ },
+ {
+ "epoch": 42.258855585831064,
+ "grad_norm": 6.779701232910156,
+ "learning_rate": 1.2948495409023155e-05,
+ "loss": 0.4256,
+ "step": 15509
+ },
+ {
+ "epoch": 42.26158038147139,
+ "grad_norm": 11.53541374206543,
+ "learning_rate": 1.294765213536008e-05,
+ "loss": 0.149,
+ "step": 15510
+ },
+ {
+ "epoch": 42.264305177111716,
+ "grad_norm": 5.645216941833496,
+ "learning_rate": 1.2946808838740786e-05,
+ "loss": 0.2024,
+ "step": 15511
+ },
+ {
+ "epoch": 42.26702997275204,
+ "grad_norm": 6.562511444091797,
+ "learning_rate": 1.2945965519171837e-05,
+ "loss": 0.2311,
+ "step": 15512
+ },
+ {
+ "epoch": 42.26975476839237,
+ "grad_norm": 5.998152732849121,
+ "learning_rate": 1.2945122176659806e-05,
+ "loss": 0.135,
+ "step": 15513
+ },
+ {
+ "epoch": 42.2724795640327,
+ "grad_norm": 7.895827770233154,
+ "learning_rate": 1.2944278811211257e-05,
+ "loss": 0.3027,
+ "step": 15514
+ },
+ {
+ "epoch": 42.275204359673026,
+ "grad_norm": 5.272707939147949,
+ "learning_rate": 1.2943435422832757e-05,
+ "loss": 0.2454,
+ "step": 15515
+ },
+ {
+ "epoch": 42.27792915531335,
+ "grad_norm": 7.751999855041504,
+ "learning_rate": 1.2942592011530878e-05,
+ "loss": 0.3795,
+ "step": 15516
+ },
+ {
+ "epoch": 42.28065395095368,
+ "grad_norm": 5.843137264251709,
+ "learning_rate": 1.294174857731219e-05,
+ "loss": 0.1421,
+ "step": 15517
+ },
+ {
+ "epoch": 42.283378746594,
+ "grad_norm": 6.004982948303223,
+ "learning_rate": 1.2940905120183256e-05,
+ "loss": 0.1472,
+ "step": 15518
+ },
+ {
+ "epoch": 42.28610354223433,
+ "grad_norm": 5.694803237915039,
+ "learning_rate": 1.2940061640150647e-05,
+ "loss": 0.2206,
+ "step": 15519
+ },
+ {
+ "epoch": 42.28882833787466,
+ "grad_norm": 6.18784236907959,
+ "learning_rate": 1.2939218137220937e-05,
+ "loss": 0.142,
+ "step": 15520
+ },
+ {
+ "epoch": 42.29155313351499,
+ "grad_norm": 6.286417484283447,
+ "learning_rate": 1.2938374611400686e-05,
+ "loss": 0.1637,
+ "step": 15521
+ },
+ {
+ "epoch": 42.294277929155314,
+ "grad_norm": 12.573493957519531,
+ "learning_rate": 1.2937531062696472e-05,
+ "loss": 0.2488,
+ "step": 15522
+ },
+ {
+ "epoch": 42.29700272479564,
+ "grad_norm": 5.91987419128418,
+ "learning_rate": 1.2936687491114857e-05,
+ "loss": 0.2027,
+ "step": 15523
+ },
+ {
+ "epoch": 42.299727520435965,
+ "grad_norm": 5.3064866065979,
+ "learning_rate": 1.2935843896662415e-05,
+ "loss": 0.2772,
+ "step": 15524
+ },
+ {
+ "epoch": 42.30245231607629,
+ "grad_norm": 7.935819149017334,
+ "learning_rate": 1.2935000279345717e-05,
+ "loss": 0.2905,
+ "step": 15525
+ },
+ {
+ "epoch": 42.305177111716624,
+ "grad_norm": 10.462241172790527,
+ "learning_rate": 1.293415663917133e-05,
+ "loss": 0.2463,
+ "step": 15526
+ },
+ {
+ "epoch": 42.30790190735695,
+ "grad_norm": 5.2981367111206055,
+ "learning_rate": 1.2933312976145827e-05,
+ "loss": 0.2498,
+ "step": 15527
+ },
+ {
+ "epoch": 42.310626702997276,
+ "grad_norm": 5.681687355041504,
+ "learning_rate": 1.2932469290275776e-05,
+ "loss": 0.2193,
+ "step": 15528
+ },
+ {
+ "epoch": 42.3133514986376,
+ "grad_norm": 4.980800151824951,
+ "learning_rate": 1.2931625581567748e-05,
+ "loss": 0.2744,
+ "step": 15529
+ },
+ {
+ "epoch": 42.31607629427793,
+ "grad_norm": 4.790737628936768,
+ "learning_rate": 1.2930781850028313e-05,
+ "loss": 0.1973,
+ "step": 15530
+ },
+ {
+ "epoch": 42.31880108991825,
+ "grad_norm": 5.458620548248291,
+ "learning_rate": 1.2929938095664045e-05,
+ "loss": 0.2656,
+ "step": 15531
+ },
+ {
+ "epoch": 42.321525885558586,
+ "grad_norm": 8.451607704162598,
+ "learning_rate": 1.2929094318481515e-05,
+ "loss": 0.3004,
+ "step": 15532
+ },
+ {
+ "epoch": 42.32425068119891,
+ "grad_norm": 5.715627193450928,
+ "learning_rate": 1.2928250518487291e-05,
+ "loss": 0.2858,
+ "step": 15533
+ },
+ {
+ "epoch": 42.32697547683924,
+ "grad_norm": 5.105525493621826,
+ "learning_rate": 1.2927406695687945e-05,
+ "loss": 0.1778,
+ "step": 15534
+ },
+ {
+ "epoch": 42.32970027247956,
+ "grad_norm": 6.924923896789551,
+ "learning_rate": 1.2926562850090052e-05,
+ "loss": 0.1534,
+ "step": 15535
+ },
+ {
+ "epoch": 42.33242506811989,
+ "grad_norm": 5.473208904266357,
+ "learning_rate": 1.2925718981700181e-05,
+ "loss": 0.1992,
+ "step": 15536
+ },
+ {
+ "epoch": 42.335149863760215,
+ "grad_norm": 5.2932610511779785,
+ "learning_rate": 1.2924875090524904e-05,
+ "loss": 0.1865,
+ "step": 15537
+ },
+ {
+ "epoch": 42.33787465940055,
+ "grad_norm": 7.486854076385498,
+ "learning_rate": 1.2924031176570794e-05,
+ "loss": 0.2947,
+ "step": 15538
+ },
+ {
+ "epoch": 42.34059945504087,
+ "grad_norm": 5.6262359619140625,
+ "learning_rate": 1.2923187239844426e-05,
+ "loss": 0.2825,
+ "step": 15539
+ },
+ {
+ "epoch": 42.3433242506812,
+ "grad_norm": 7.020451068878174,
+ "learning_rate": 1.2922343280352367e-05,
+ "loss": 0.2192,
+ "step": 15540
+ },
+ {
+ "epoch": 42.346049046321525,
+ "grad_norm": 5.153855800628662,
+ "learning_rate": 1.2921499298101193e-05,
+ "loss": 0.1758,
+ "step": 15541
+ },
+ {
+ "epoch": 42.34877384196185,
+ "grad_norm": 5.127655506134033,
+ "learning_rate": 1.2920655293097474e-05,
+ "loss": 0.2618,
+ "step": 15542
+ },
+ {
+ "epoch": 42.35149863760218,
+ "grad_norm": 10.108250617980957,
+ "learning_rate": 1.291981126534779e-05,
+ "loss": 0.2181,
+ "step": 15543
+ },
+ {
+ "epoch": 42.35422343324251,
+ "grad_norm": 6.072994709014893,
+ "learning_rate": 1.2918967214858709e-05,
+ "loss": 0.1606,
+ "step": 15544
+ },
+ {
+ "epoch": 42.356948228882835,
+ "grad_norm": 6.636490345001221,
+ "learning_rate": 1.2918123141636804e-05,
+ "loss": 0.2944,
+ "step": 15545
+ },
+ {
+ "epoch": 42.35967302452316,
+ "grad_norm": 7.909504413604736,
+ "learning_rate": 1.291727904568865e-05,
+ "loss": 0.256,
+ "step": 15546
+ },
+ {
+ "epoch": 42.36239782016349,
+ "grad_norm": 5.1938090324401855,
+ "learning_rate": 1.2916434927020825e-05,
+ "loss": 0.1128,
+ "step": 15547
+ },
+ {
+ "epoch": 42.36512261580381,
+ "grad_norm": 5.129669666290283,
+ "learning_rate": 1.291559078563989e-05,
+ "loss": 0.2096,
+ "step": 15548
+ },
+ {
+ "epoch": 42.36784741144414,
+ "grad_norm": 5.939659118652344,
+ "learning_rate": 1.2914746621552437e-05,
+ "loss": 0.173,
+ "step": 15549
+ },
+ {
+ "epoch": 42.37057220708447,
+ "grad_norm": 7.425166130065918,
+ "learning_rate": 1.2913902434765023e-05,
+ "loss": 0.2892,
+ "step": 15550
+ },
+ {
+ "epoch": 42.3732970027248,
+ "grad_norm": 6.21837043762207,
+ "learning_rate": 1.2913058225284237e-05,
+ "loss": 0.2662,
+ "step": 15551
+ },
+ {
+ "epoch": 42.37602179836512,
+ "grad_norm": 7.428950309753418,
+ "learning_rate": 1.2912213993116642e-05,
+ "loss": 0.1748,
+ "step": 15552
+ },
+ {
+ "epoch": 42.37874659400545,
+ "grad_norm": 4.864560604095459,
+ "learning_rate": 1.2911369738268823e-05,
+ "loss": 0.3374,
+ "step": 15553
+ },
+ {
+ "epoch": 42.381471389645775,
+ "grad_norm": 6.655929088592529,
+ "learning_rate": 1.2910525460747346e-05,
+ "loss": 0.3018,
+ "step": 15554
+ },
+ {
+ "epoch": 42.3841961852861,
+ "grad_norm": 4.93895959854126,
+ "learning_rate": 1.2909681160558794e-05,
+ "loss": 0.4243,
+ "step": 15555
+ },
+ {
+ "epoch": 42.38692098092643,
+ "grad_norm": 6.0697922706604,
+ "learning_rate": 1.2908836837709734e-05,
+ "loss": 0.147,
+ "step": 15556
+ },
+ {
+ "epoch": 42.38964577656676,
+ "grad_norm": 4.908973217010498,
+ "learning_rate": 1.2907992492206752e-05,
+ "loss": 0.2268,
+ "step": 15557
+ },
+ {
+ "epoch": 42.392370572207085,
+ "grad_norm": 6.194726467132568,
+ "learning_rate": 1.2907148124056415e-05,
+ "loss": 0.1345,
+ "step": 15558
+ },
+ {
+ "epoch": 42.39509536784741,
+ "grad_norm": 4.846452713012695,
+ "learning_rate": 1.2906303733265301e-05,
+ "loss": 0.1757,
+ "step": 15559
+ },
+ {
+ "epoch": 42.39782016348774,
+ "grad_norm": 4.52724552154541,
+ "learning_rate": 1.2905459319839988e-05,
+ "loss": 0.1843,
+ "step": 15560
+ },
+ {
+ "epoch": 42.40054495912806,
+ "grad_norm": 5.058575630187988,
+ "learning_rate": 1.2904614883787052e-05,
+ "loss": 0.2414,
+ "step": 15561
+ },
+ {
+ "epoch": 42.403269754768395,
+ "grad_norm": 5.1417341232299805,
+ "learning_rate": 1.290377042511307e-05,
+ "loss": 0.2135,
+ "step": 15562
+ },
+ {
+ "epoch": 42.40599455040872,
+ "grad_norm": 5.533407211303711,
+ "learning_rate": 1.2902925943824615e-05,
+ "loss": 0.2542,
+ "step": 15563
+ },
+ {
+ "epoch": 42.40871934604905,
+ "grad_norm": 5.8959503173828125,
+ "learning_rate": 1.2902081439928268e-05,
+ "loss": 0.31,
+ "step": 15564
+ },
+ {
+ "epoch": 42.41144414168937,
+ "grad_norm": 5.670324802398682,
+ "learning_rate": 1.2901236913430604e-05,
+ "loss": 0.3066,
+ "step": 15565
+ },
+ {
+ "epoch": 42.4141689373297,
+ "grad_norm": 6.487437725067139,
+ "learning_rate": 1.2900392364338199e-05,
+ "loss": 0.1703,
+ "step": 15566
+ },
+ {
+ "epoch": 42.416893732970024,
+ "grad_norm": 9.519947052001953,
+ "learning_rate": 1.2899547792657633e-05,
+ "loss": 0.2129,
+ "step": 15567
+ },
+ {
+ "epoch": 42.41961852861036,
+ "grad_norm": 6.691407203674316,
+ "learning_rate": 1.289870319839548e-05,
+ "loss": 0.1647,
+ "step": 15568
+ },
+ {
+ "epoch": 42.42234332425068,
+ "grad_norm": 5.998138904571533,
+ "learning_rate": 1.289785858155832e-05,
+ "loss": 0.2248,
+ "step": 15569
+ },
+ {
+ "epoch": 42.42506811989101,
+ "grad_norm": 5.7534685134887695,
+ "learning_rate": 1.2897013942152732e-05,
+ "loss": 0.2413,
+ "step": 15570
+ },
+ {
+ "epoch": 42.427792915531334,
+ "grad_norm": 5.390469074249268,
+ "learning_rate": 1.2896169280185293e-05,
+ "loss": 0.3113,
+ "step": 15571
+ },
+ {
+ "epoch": 42.43051771117166,
+ "grad_norm": 5.165089130401611,
+ "learning_rate": 1.289532459566258e-05,
+ "loss": 0.1694,
+ "step": 15572
+ },
+ {
+ "epoch": 42.433242506811986,
+ "grad_norm": 19.199241638183594,
+ "learning_rate": 1.2894479888591173e-05,
+ "loss": 0.2332,
+ "step": 15573
+ },
+ {
+ "epoch": 42.43596730245232,
+ "grad_norm": 5.859897136688232,
+ "learning_rate": 1.289363515897765e-05,
+ "loss": 0.2173,
+ "step": 15574
+ },
+ {
+ "epoch": 42.438692098092645,
+ "grad_norm": 5.306302547454834,
+ "learning_rate": 1.289279040682859e-05,
+ "loss": 0.2181,
+ "step": 15575
+ },
+ {
+ "epoch": 42.44141689373297,
+ "grad_norm": 5.701376438140869,
+ "learning_rate": 1.2891945632150566e-05,
+ "loss": 0.1909,
+ "step": 15576
+ },
+ {
+ "epoch": 42.444141689373296,
+ "grad_norm": 5.970940113067627,
+ "learning_rate": 1.2891100834950167e-05,
+ "loss": 0.2238,
+ "step": 15577
+ },
+ {
+ "epoch": 42.44686648501362,
+ "grad_norm": 6.2598557472229,
+ "learning_rate": 1.2890256015233968e-05,
+ "loss": 0.3004,
+ "step": 15578
+ },
+ {
+ "epoch": 42.44959128065395,
+ "grad_norm": 5.792520523071289,
+ "learning_rate": 1.2889411173008549e-05,
+ "loss": 0.2131,
+ "step": 15579
+ },
+ {
+ "epoch": 42.45231607629428,
+ "grad_norm": 4.6232805252075195,
+ "learning_rate": 1.2888566308280486e-05,
+ "loss": 0.2638,
+ "step": 15580
+ },
+ {
+ "epoch": 42.45504087193461,
+ "grad_norm": 5.799549102783203,
+ "learning_rate": 1.2887721421056366e-05,
+ "loss": 0.1464,
+ "step": 15581
+ },
+ {
+ "epoch": 42.45776566757493,
+ "grad_norm": 9.060937881469727,
+ "learning_rate": 1.2886876511342758e-05,
+ "loss": 0.3488,
+ "step": 15582
+ },
+ {
+ "epoch": 42.46049046321526,
+ "grad_norm": 5.300330638885498,
+ "learning_rate": 1.2886031579146257e-05,
+ "loss": 0.2588,
+ "step": 15583
+ },
+ {
+ "epoch": 42.463215258855584,
+ "grad_norm": 5.925723552703857,
+ "learning_rate": 1.2885186624473428e-05,
+ "loss": 0.2493,
+ "step": 15584
+ },
+ {
+ "epoch": 42.46594005449591,
+ "grad_norm": 4.02168083190918,
+ "learning_rate": 1.288434164733086e-05,
+ "loss": 0.3596,
+ "step": 15585
+ },
+ {
+ "epoch": 42.46866485013624,
+ "grad_norm": 6.255588531494141,
+ "learning_rate": 1.2883496647725131e-05,
+ "loss": 0.1687,
+ "step": 15586
+ },
+ {
+ "epoch": 42.47138964577657,
+ "grad_norm": 5.425561428070068,
+ "learning_rate": 1.2882651625662825e-05,
+ "loss": 0.1327,
+ "step": 15587
+ },
+ {
+ "epoch": 42.474114441416894,
+ "grad_norm": 6.124661922454834,
+ "learning_rate": 1.288180658115052e-05,
+ "loss": 0.1344,
+ "step": 15588
+ },
+ {
+ "epoch": 42.47683923705722,
+ "grad_norm": 6.7752366065979,
+ "learning_rate": 1.28809615141948e-05,
+ "loss": 0.297,
+ "step": 15589
+ },
+ {
+ "epoch": 42.479564032697546,
+ "grad_norm": 6.834358215332031,
+ "learning_rate": 1.2880116424802242e-05,
+ "loss": 0.3883,
+ "step": 15590
+ },
+ {
+ "epoch": 42.48228882833787,
+ "grad_norm": 5.602798938751221,
+ "learning_rate": 1.287927131297943e-05,
+ "loss": 0.3643,
+ "step": 15591
+ },
+ {
+ "epoch": 42.485013623978205,
+ "grad_norm": 6.323520183563232,
+ "learning_rate": 1.2878426178732947e-05,
+ "loss": 0.2445,
+ "step": 15592
+ },
+ {
+ "epoch": 42.48773841961853,
+ "grad_norm": 4.985516548156738,
+ "learning_rate": 1.2877581022069374e-05,
+ "loss": 0.1582,
+ "step": 15593
+ },
+ {
+ "epoch": 42.490463215258856,
+ "grad_norm": 5.517819404602051,
+ "learning_rate": 1.2876735842995291e-05,
+ "loss": 0.1748,
+ "step": 15594
+ },
+ {
+ "epoch": 42.49318801089918,
+ "grad_norm": 6.430752277374268,
+ "learning_rate": 1.2875890641517283e-05,
+ "loss": 0.1986,
+ "step": 15595
+ },
+ {
+ "epoch": 42.49591280653951,
+ "grad_norm": 8.593796730041504,
+ "learning_rate": 1.2875045417641928e-05,
+ "loss": 0.1428,
+ "step": 15596
+ },
+ {
+ "epoch": 42.49863760217983,
+ "grad_norm": 5.309615612030029,
+ "learning_rate": 1.2874200171375817e-05,
+ "loss": 0.2898,
+ "step": 15597
+ },
+ {
+ "epoch": 42.50136239782017,
+ "grad_norm": 6.958247661590576,
+ "learning_rate": 1.2873354902725525e-05,
+ "loss": 0.2751,
+ "step": 15598
+ },
+ {
+ "epoch": 42.50408719346049,
+ "grad_norm": 5.246025085449219,
+ "learning_rate": 1.2872509611697639e-05,
+ "loss": 0.1521,
+ "step": 15599
+ },
+ {
+ "epoch": 42.50681198910082,
+ "grad_norm": 5.215633869171143,
+ "learning_rate": 1.287166429829874e-05,
+ "loss": 0.1823,
+ "step": 15600
+ },
+ {
+ "epoch": 42.509536784741144,
+ "grad_norm": 7.842749118804932,
+ "learning_rate": 1.2870818962535412e-05,
+ "loss": 0.1688,
+ "step": 15601
+ },
+ {
+ "epoch": 42.51226158038147,
+ "grad_norm": 5.858428001403809,
+ "learning_rate": 1.2869973604414237e-05,
+ "loss": 0.2268,
+ "step": 15602
+ },
+ {
+ "epoch": 42.514986376021795,
+ "grad_norm": 5.467252731323242,
+ "learning_rate": 1.28691282239418e-05,
+ "loss": 0.1691,
+ "step": 15603
+ },
+ {
+ "epoch": 42.51771117166213,
+ "grad_norm": 4.986133098602295,
+ "learning_rate": 1.2868282821124685e-05,
+ "loss": 0.3136,
+ "step": 15604
+ },
+ {
+ "epoch": 42.520435967302454,
+ "grad_norm": 5.284420967102051,
+ "learning_rate": 1.2867437395969476e-05,
+ "loss": 0.1013,
+ "step": 15605
+ },
+ {
+ "epoch": 42.52316076294278,
+ "grad_norm": 5.0402607917785645,
+ "learning_rate": 1.2866591948482756e-05,
+ "loss": 0.2024,
+ "step": 15606
+ },
+ {
+ "epoch": 42.525885558583106,
+ "grad_norm": 5.158346652984619,
+ "learning_rate": 1.286574647867111e-05,
+ "loss": 0.1467,
+ "step": 15607
+ },
+ {
+ "epoch": 42.52861035422343,
+ "grad_norm": 5.764071464538574,
+ "learning_rate": 1.2864900986541125e-05,
+ "loss": 0.1802,
+ "step": 15608
+ },
+ {
+ "epoch": 42.53133514986376,
+ "grad_norm": 6.164839744567871,
+ "learning_rate": 1.2864055472099381e-05,
+ "loss": 0.2463,
+ "step": 15609
+ },
+ {
+ "epoch": 42.53405994550409,
+ "grad_norm": 7.74569845199585,
+ "learning_rate": 1.2863209935352468e-05,
+ "loss": 0.23,
+ "step": 15610
+ },
+ {
+ "epoch": 42.536784741144416,
+ "grad_norm": 5.935806751251221,
+ "learning_rate": 1.2862364376306964e-05,
+ "loss": 0.1226,
+ "step": 15611
+ },
+ {
+ "epoch": 42.53950953678474,
+ "grad_norm": 5.458498954772949,
+ "learning_rate": 1.2861518794969464e-05,
+ "loss": 0.3806,
+ "step": 15612
+ },
+ {
+ "epoch": 42.54223433242507,
+ "grad_norm": 6.322701454162598,
+ "learning_rate": 1.2860673191346542e-05,
+ "loss": 0.3062,
+ "step": 15613
+ },
+ {
+ "epoch": 42.54495912806539,
+ "grad_norm": 7.980700969696045,
+ "learning_rate": 1.2859827565444793e-05,
+ "loss": 0.1646,
+ "step": 15614
+ },
+ {
+ "epoch": 42.54768392370572,
+ "grad_norm": 6.683459758758545,
+ "learning_rate": 1.2858981917270796e-05,
+ "loss": 0.2345,
+ "step": 15615
+ },
+ {
+ "epoch": 42.55040871934605,
+ "grad_norm": 7.966632843017578,
+ "learning_rate": 1.2858136246831144e-05,
+ "loss": 0.3876,
+ "step": 15616
+ },
+ {
+ "epoch": 42.55313351498638,
+ "grad_norm": 5.730477809906006,
+ "learning_rate": 1.2857290554132416e-05,
+ "loss": 0.2682,
+ "step": 15617
+ },
+ {
+ "epoch": 42.555858310626704,
+ "grad_norm": 5.792958736419678,
+ "learning_rate": 1.2856444839181199e-05,
+ "loss": 0.1936,
+ "step": 15618
+ },
+ {
+ "epoch": 42.55858310626703,
+ "grad_norm": 8.202452659606934,
+ "learning_rate": 1.2855599101984085e-05,
+ "loss": 0.159,
+ "step": 15619
+ },
+ {
+ "epoch": 42.561307901907355,
+ "grad_norm": 5.304412364959717,
+ "learning_rate": 1.2854753342547656e-05,
+ "loss": 0.2151,
+ "step": 15620
+ },
+ {
+ "epoch": 42.56403269754768,
+ "grad_norm": 4.5617594718933105,
+ "learning_rate": 1.2853907560878499e-05,
+ "loss": 0.1409,
+ "step": 15621
+ },
+ {
+ "epoch": 42.566757493188014,
+ "grad_norm": 7.792327880859375,
+ "learning_rate": 1.2853061756983203e-05,
+ "loss": 0.3014,
+ "step": 15622
+ },
+ {
+ "epoch": 42.56948228882834,
+ "grad_norm": 10.473942756652832,
+ "learning_rate": 1.2852215930868353e-05,
+ "loss": 0.2424,
+ "step": 15623
+ },
+ {
+ "epoch": 42.572207084468666,
+ "grad_norm": 6.214908599853516,
+ "learning_rate": 1.285137008254054e-05,
+ "loss": 0.1883,
+ "step": 15624
+ },
+ {
+ "epoch": 42.57493188010899,
+ "grad_norm": 8.285236358642578,
+ "learning_rate": 1.2850524212006344e-05,
+ "loss": 0.34,
+ "step": 15625
+ },
+ {
+ "epoch": 42.57765667574932,
+ "grad_norm": 5.568668365478516,
+ "learning_rate": 1.284967831927236e-05,
+ "loss": 0.2885,
+ "step": 15626
+ },
+ {
+ "epoch": 42.58038147138964,
+ "grad_norm": 4.822712421417236,
+ "learning_rate": 1.2848832404345173e-05,
+ "loss": 0.1432,
+ "step": 15627
+ },
+ {
+ "epoch": 42.583106267029976,
+ "grad_norm": 7.120174407958984,
+ "learning_rate": 1.2847986467231368e-05,
+ "loss": 0.2746,
+ "step": 15628
+ },
+ {
+ "epoch": 42.5858310626703,
+ "grad_norm": 5.246706962585449,
+ "learning_rate": 1.2847140507937539e-05,
+ "loss": 0.3759,
+ "step": 15629
+ },
+ {
+ "epoch": 42.58855585831063,
+ "grad_norm": 6.120863437652588,
+ "learning_rate": 1.2846294526470274e-05,
+ "loss": 0.3094,
+ "step": 15630
+ },
+ {
+ "epoch": 42.59128065395095,
+ "grad_norm": 9.145034790039062,
+ "learning_rate": 1.2845448522836152e-05,
+ "loss": 0.1625,
+ "step": 15631
+ },
+ {
+ "epoch": 42.59400544959128,
+ "grad_norm": 7.596875190734863,
+ "learning_rate": 1.2844602497041774e-05,
+ "loss": 0.1904,
+ "step": 15632
+ },
+ {
+ "epoch": 42.596730245231605,
+ "grad_norm": 7.045854568481445,
+ "learning_rate": 1.2843756449093721e-05,
+ "loss": 0.2578,
+ "step": 15633
+ },
+ {
+ "epoch": 42.59945504087194,
+ "grad_norm": 5.64263916015625,
+ "learning_rate": 1.2842910378998585e-05,
+ "loss": 0.3601,
+ "step": 15634
+ },
+ {
+ "epoch": 42.60217983651226,
+ "grad_norm": 6.453949451446533,
+ "learning_rate": 1.2842064286762954e-05,
+ "loss": 0.2219,
+ "step": 15635
+ },
+ {
+ "epoch": 42.60490463215259,
+ "grad_norm": 5.985903263092041,
+ "learning_rate": 1.2841218172393417e-05,
+ "loss": 0.1634,
+ "step": 15636
+ },
+ {
+ "epoch": 42.607629427792915,
+ "grad_norm": 6.2830810546875,
+ "learning_rate": 1.2840372035896565e-05,
+ "loss": 0.3231,
+ "step": 15637
+ },
+ {
+ "epoch": 42.61035422343324,
+ "grad_norm": 5.878849983215332,
+ "learning_rate": 1.2839525877278986e-05,
+ "loss": 0.3066,
+ "step": 15638
+ },
+ {
+ "epoch": 42.61307901907357,
+ "grad_norm": 9.201489448547363,
+ "learning_rate": 1.2838679696547272e-05,
+ "loss": 0.2384,
+ "step": 15639
+ },
+ {
+ "epoch": 42.6158038147139,
+ "grad_norm": 4.6086626052856445,
+ "learning_rate": 1.2837833493708013e-05,
+ "loss": 0.2048,
+ "step": 15640
+ },
+ {
+ "epoch": 42.618528610354225,
+ "grad_norm": 7.550244331359863,
+ "learning_rate": 1.2836987268767798e-05,
+ "loss": 0.3065,
+ "step": 15641
+ },
+ {
+ "epoch": 42.62125340599455,
+ "grad_norm": 6.34338903427124,
+ "learning_rate": 1.2836141021733217e-05,
+ "loss": 0.2497,
+ "step": 15642
+ },
+ {
+ "epoch": 42.62397820163488,
+ "grad_norm": 9.32612419128418,
+ "learning_rate": 1.283529475261086e-05,
+ "loss": 0.2767,
+ "step": 15643
+ },
+ {
+ "epoch": 42.6267029972752,
+ "grad_norm": 5.956027507781982,
+ "learning_rate": 1.283444846140732e-05,
+ "loss": 0.2447,
+ "step": 15644
+ },
+ {
+ "epoch": 42.62942779291553,
+ "grad_norm": 5.47667932510376,
+ "learning_rate": 1.2833602148129184e-05,
+ "loss": 0.1846,
+ "step": 15645
+ },
+ {
+ "epoch": 42.63215258855586,
+ "grad_norm": 6.449533462524414,
+ "learning_rate": 1.2832755812783048e-05,
+ "loss": 0.3097,
+ "step": 15646
+ },
+ {
+ "epoch": 42.63487738419619,
+ "grad_norm": 5.0832905769348145,
+ "learning_rate": 1.28319094553755e-05,
+ "loss": 0.1385,
+ "step": 15647
+ },
+ {
+ "epoch": 42.63760217983651,
+ "grad_norm": 5.39228630065918,
+ "learning_rate": 1.2831063075913134e-05,
+ "loss": 0.2786,
+ "step": 15648
+ },
+ {
+ "epoch": 42.64032697547684,
+ "grad_norm": 5.079096794128418,
+ "learning_rate": 1.2830216674402539e-05,
+ "loss": 0.2716,
+ "step": 15649
+ },
+ {
+ "epoch": 42.643051771117165,
+ "grad_norm": 7.23034143447876,
+ "learning_rate": 1.2829370250850306e-05,
+ "loss": 0.4366,
+ "step": 15650
+ },
+ {
+ "epoch": 42.64577656675749,
+ "grad_norm": 6.6343560218811035,
+ "learning_rate": 1.282852380526303e-05,
+ "loss": 0.2604,
+ "step": 15651
+ },
+ {
+ "epoch": 42.64850136239782,
+ "grad_norm": 7.3391194343566895,
+ "learning_rate": 1.2827677337647302e-05,
+ "loss": 0.1819,
+ "step": 15652
+ },
+ {
+ "epoch": 42.65122615803815,
+ "grad_norm": 11.406492233276367,
+ "learning_rate": 1.2826830848009711e-05,
+ "loss": 0.1838,
+ "step": 15653
+ },
+ {
+ "epoch": 42.653950953678475,
+ "grad_norm": 7.062712669372559,
+ "learning_rate": 1.2825984336356856e-05,
+ "loss": 0.2989,
+ "step": 15654
+ },
+ {
+ "epoch": 42.6566757493188,
+ "grad_norm": 10.87055778503418,
+ "learning_rate": 1.2825137802695324e-05,
+ "loss": 0.1964,
+ "step": 15655
+ },
+ {
+ "epoch": 42.65940054495913,
+ "grad_norm": 7.037644863128662,
+ "learning_rate": 1.282429124703171e-05,
+ "loss": 0.1846,
+ "step": 15656
+ },
+ {
+ "epoch": 42.66212534059945,
+ "grad_norm": 5.161700248718262,
+ "learning_rate": 1.2823444669372606e-05,
+ "loss": 0.1318,
+ "step": 15657
+ },
+ {
+ "epoch": 42.664850136239785,
+ "grad_norm": 6.45982551574707,
+ "learning_rate": 1.282259806972461e-05,
+ "loss": 0.2821,
+ "step": 15658
+ },
+ {
+ "epoch": 42.66757493188011,
+ "grad_norm": 6.253321647644043,
+ "learning_rate": 1.2821751448094306e-05,
+ "loss": 0.3189,
+ "step": 15659
+ },
+ {
+ "epoch": 42.67029972752044,
+ "grad_norm": 5.008757591247559,
+ "learning_rate": 1.2820904804488297e-05,
+ "loss": 0.2248,
+ "step": 15660
+ },
+ {
+ "epoch": 42.67302452316076,
+ "grad_norm": 5.852625370025635,
+ "learning_rate": 1.2820058138913169e-05,
+ "loss": 0.2124,
+ "step": 15661
+ },
+ {
+ "epoch": 42.67574931880109,
+ "grad_norm": 6.222420692443848,
+ "learning_rate": 1.2819211451375517e-05,
+ "loss": 0.3006,
+ "step": 15662
+ },
+ {
+ "epoch": 42.678474114441414,
+ "grad_norm": 6.5769195556640625,
+ "learning_rate": 1.2818364741881939e-05,
+ "loss": 0.2786,
+ "step": 15663
+ },
+ {
+ "epoch": 42.68119891008175,
+ "grad_norm": 15.356090545654297,
+ "learning_rate": 1.281751801043903e-05,
+ "loss": 0.3032,
+ "step": 15664
+ },
+ {
+ "epoch": 42.68392370572207,
+ "grad_norm": 5.917220592498779,
+ "learning_rate": 1.2816671257053377e-05,
+ "loss": 0.1984,
+ "step": 15665
+ },
+ {
+ "epoch": 42.6866485013624,
+ "grad_norm": 5.45731258392334,
+ "learning_rate": 1.2815824481731582e-05,
+ "loss": 0.1677,
+ "step": 15666
+ },
+ {
+ "epoch": 42.689373297002724,
+ "grad_norm": 5.89810037612915,
+ "learning_rate": 1.2814977684480234e-05,
+ "loss": 0.262,
+ "step": 15667
+ },
+ {
+ "epoch": 42.69209809264305,
+ "grad_norm": 6.147561550140381,
+ "learning_rate": 1.2814130865305937e-05,
+ "loss": 0.2132,
+ "step": 15668
+ },
+ {
+ "epoch": 42.694822888283376,
+ "grad_norm": 5.025945663452148,
+ "learning_rate": 1.2813284024215272e-05,
+ "loss": 0.1731,
+ "step": 15669
+ },
+ {
+ "epoch": 42.69754768392371,
+ "grad_norm": 6.564162254333496,
+ "learning_rate": 1.2812437161214843e-05,
+ "loss": 0.3235,
+ "step": 15670
+ },
+ {
+ "epoch": 42.700272479564035,
+ "grad_norm": 5.934960842132568,
+ "learning_rate": 1.2811590276311243e-05,
+ "loss": 0.3416,
+ "step": 15671
+ },
+ {
+ "epoch": 42.70299727520436,
+ "grad_norm": 7.1388726234436035,
+ "learning_rate": 1.2810743369511071e-05,
+ "loss": 0.1969,
+ "step": 15672
+ },
+ {
+ "epoch": 42.705722070844686,
+ "grad_norm": 5.952902793884277,
+ "learning_rate": 1.280989644082092e-05,
+ "loss": 0.1279,
+ "step": 15673
+ },
+ {
+ "epoch": 42.70844686648501,
+ "grad_norm": 5.618162631988525,
+ "learning_rate": 1.2809049490247386e-05,
+ "loss": 0.227,
+ "step": 15674
+ },
+ {
+ "epoch": 42.71117166212534,
+ "grad_norm": 5.18951416015625,
+ "learning_rate": 1.2808202517797064e-05,
+ "loss": 0.3255,
+ "step": 15675
+ },
+ {
+ "epoch": 42.71389645776567,
+ "grad_norm": 5.392221450805664,
+ "learning_rate": 1.2807355523476552e-05,
+ "loss": 0.2909,
+ "step": 15676
+ },
+ {
+ "epoch": 42.716621253406,
+ "grad_norm": 5.3777618408203125,
+ "learning_rate": 1.2806508507292444e-05,
+ "loss": 0.1854,
+ "step": 15677
+ },
+ {
+ "epoch": 42.71934604904632,
+ "grad_norm": 6.626627445220947,
+ "learning_rate": 1.280566146925134e-05,
+ "loss": 0.1884,
+ "step": 15678
+ },
+ {
+ "epoch": 42.72207084468665,
+ "grad_norm": 5.3079681396484375,
+ "learning_rate": 1.2804814409359834e-05,
+ "loss": 0.164,
+ "step": 15679
+ },
+ {
+ "epoch": 42.724795640326974,
+ "grad_norm": 5.620943069458008,
+ "learning_rate": 1.2803967327624522e-05,
+ "loss": 0.1486,
+ "step": 15680
+ },
+ {
+ "epoch": 42.7275204359673,
+ "grad_norm": 7.279932975769043,
+ "learning_rate": 1.2803120224052004e-05,
+ "loss": 0.185,
+ "step": 15681
+ },
+ {
+ "epoch": 42.73024523160763,
+ "grad_norm": 5.815249443054199,
+ "learning_rate": 1.2802273098648876e-05,
+ "loss": 0.1892,
+ "step": 15682
+ },
+ {
+ "epoch": 42.73297002724796,
+ "grad_norm": 5.860848426818848,
+ "learning_rate": 1.2801425951421736e-05,
+ "loss": 0.1905,
+ "step": 15683
+ },
+ {
+ "epoch": 42.735694822888284,
+ "grad_norm": 7.554252624511719,
+ "learning_rate": 1.280057878237718e-05,
+ "loss": 0.2471,
+ "step": 15684
+ },
+ {
+ "epoch": 42.73841961852861,
+ "grad_norm": 6.2970356941223145,
+ "learning_rate": 1.2799731591521805e-05,
+ "loss": 0.3025,
+ "step": 15685
+ },
+ {
+ "epoch": 42.741144414168936,
+ "grad_norm": 4.874846458435059,
+ "learning_rate": 1.2798884378862213e-05,
+ "loss": 0.2105,
+ "step": 15686
+ },
+ {
+ "epoch": 42.74386920980926,
+ "grad_norm": 8.647810935974121,
+ "learning_rate": 1.2798037144405e-05,
+ "loss": 0.2013,
+ "step": 15687
+ },
+ {
+ "epoch": 42.746594005449595,
+ "grad_norm": 5.494062423706055,
+ "learning_rate": 1.2797189888156761e-05,
+ "loss": 0.1594,
+ "step": 15688
+ },
+ {
+ "epoch": 42.74931880108992,
+ "grad_norm": 4.149773597717285,
+ "learning_rate": 1.27963426101241e-05,
+ "loss": 0.1171,
+ "step": 15689
+ },
+ {
+ "epoch": 42.752043596730246,
+ "grad_norm": 5.264461994171143,
+ "learning_rate": 1.279549531031361e-05,
+ "loss": 0.1744,
+ "step": 15690
+ },
+ {
+ "epoch": 42.75476839237057,
+ "grad_norm": 8.829997062683105,
+ "learning_rate": 1.2794647988731896e-05,
+ "loss": 0.2036,
+ "step": 15691
+ },
+ {
+ "epoch": 42.7574931880109,
+ "grad_norm": 5.838218688964844,
+ "learning_rate": 1.279380064538555e-05,
+ "loss": 0.2639,
+ "step": 15692
+ },
+ {
+ "epoch": 42.76021798365122,
+ "grad_norm": 4.818917751312256,
+ "learning_rate": 1.2792953280281175e-05,
+ "loss": 0.1606,
+ "step": 15693
+ },
+ {
+ "epoch": 42.762942779291556,
+ "grad_norm": 5.961804389953613,
+ "learning_rate": 1.2792105893425373e-05,
+ "loss": 0.1779,
+ "step": 15694
+ },
+ {
+ "epoch": 42.76566757493188,
+ "grad_norm": 6.108853340148926,
+ "learning_rate": 1.2791258484824736e-05,
+ "loss": 0.1674,
+ "step": 15695
+ },
+ {
+ "epoch": 42.76839237057221,
+ "grad_norm": 5.334097385406494,
+ "learning_rate": 1.279041105448587e-05,
+ "loss": 0.3838,
+ "step": 15696
+ },
+ {
+ "epoch": 42.771117166212534,
+ "grad_norm": 6.470245838165283,
+ "learning_rate": 1.278956360241537e-05,
+ "loss": 0.2318,
+ "step": 15697
+ },
+ {
+ "epoch": 42.77384196185286,
+ "grad_norm": 4.926463603973389,
+ "learning_rate": 1.2788716128619843e-05,
+ "loss": 0.1291,
+ "step": 15698
+ },
+ {
+ "epoch": 42.776566757493185,
+ "grad_norm": 5.360116004943848,
+ "learning_rate": 1.2787868633105882e-05,
+ "loss": 0.3191,
+ "step": 15699
+ },
+ {
+ "epoch": 42.77929155313352,
+ "grad_norm": 6.295806407928467,
+ "learning_rate": 1.278702111588009e-05,
+ "loss": 0.3707,
+ "step": 15700
+ },
+ {
+ "epoch": 42.782016348773844,
+ "grad_norm": 7.457422256469727,
+ "learning_rate": 1.2786173576949068e-05,
+ "loss": 0.1382,
+ "step": 15701
+ },
+ {
+ "epoch": 42.78474114441417,
+ "grad_norm": 5.710942268371582,
+ "learning_rate": 1.2785326016319415e-05,
+ "loss": 0.1496,
+ "step": 15702
+ },
+ {
+ "epoch": 42.787465940054496,
+ "grad_norm": 6.969316005706787,
+ "learning_rate": 1.2784478433997733e-05,
+ "loss": 0.1845,
+ "step": 15703
+ },
+ {
+ "epoch": 42.79019073569482,
+ "grad_norm": 5.756155490875244,
+ "learning_rate": 1.278363082999062e-05,
+ "loss": 0.3519,
+ "step": 15704
+ },
+ {
+ "epoch": 42.79291553133515,
+ "grad_norm": 4.032855033874512,
+ "learning_rate": 1.2782783204304683e-05,
+ "loss": 0.2219,
+ "step": 15705
+ },
+ {
+ "epoch": 42.79564032697548,
+ "grad_norm": 5.56076717376709,
+ "learning_rate": 1.2781935556946517e-05,
+ "loss": 0.2272,
+ "step": 15706
+ },
+ {
+ "epoch": 42.798365122615806,
+ "grad_norm": 6.550904273986816,
+ "learning_rate": 1.2781087887922729e-05,
+ "loss": 0.1784,
+ "step": 15707
+ },
+ {
+ "epoch": 42.80108991825613,
+ "grad_norm": 5.889643669128418,
+ "learning_rate": 1.2780240197239917e-05,
+ "loss": 0.1644,
+ "step": 15708
+ },
+ {
+ "epoch": 42.80381471389646,
+ "grad_norm": 5.0112810134887695,
+ "learning_rate": 1.2779392484904685e-05,
+ "loss": 0.1532,
+ "step": 15709
+ },
+ {
+ "epoch": 42.80653950953678,
+ "grad_norm": 5.021573543548584,
+ "learning_rate": 1.2778544750923634e-05,
+ "loss": 0.1197,
+ "step": 15710
+ },
+ {
+ "epoch": 42.80926430517711,
+ "grad_norm": 7.210042953491211,
+ "learning_rate": 1.2777696995303366e-05,
+ "loss": 0.2753,
+ "step": 15711
+ },
+ {
+ "epoch": 42.81198910081744,
+ "grad_norm": 5.5177812576293945,
+ "learning_rate": 1.277684921805048e-05,
+ "loss": 0.2453,
+ "step": 15712
+ },
+ {
+ "epoch": 42.81471389645777,
+ "grad_norm": 5.005462169647217,
+ "learning_rate": 1.2776001419171585e-05,
+ "loss": 0.3069,
+ "step": 15713
+ },
+ {
+ "epoch": 42.817438692098094,
+ "grad_norm": 9.254091262817383,
+ "learning_rate": 1.2775153598673276e-05,
+ "loss": 0.3414,
+ "step": 15714
+ },
+ {
+ "epoch": 42.82016348773842,
+ "grad_norm": 4.597906112670898,
+ "learning_rate": 1.2774305756562164e-05,
+ "loss": 0.2491,
+ "step": 15715
+ },
+ {
+ "epoch": 42.822888283378745,
+ "grad_norm": 4.350356101989746,
+ "learning_rate": 1.2773457892844844e-05,
+ "loss": 0.1406,
+ "step": 15716
+ },
+ {
+ "epoch": 42.82561307901907,
+ "grad_norm": 6.244409561157227,
+ "learning_rate": 1.277261000752793e-05,
+ "loss": 0.3517,
+ "step": 15717
+ },
+ {
+ "epoch": 42.828337874659404,
+ "grad_norm": 5.680519104003906,
+ "learning_rate": 1.2771762100618012e-05,
+ "loss": 0.2949,
+ "step": 15718
+ },
+ {
+ "epoch": 42.83106267029973,
+ "grad_norm": 6.875699520111084,
+ "learning_rate": 1.2770914172121706e-05,
+ "loss": 0.2951,
+ "step": 15719
+ },
+ {
+ "epoch": 42.833787465940055,
+ "grad_norm": 6.159343242645264,
+ "learning_rate": 1.2770066222045605e-05,
+ "loss": 0.1965,
+ "step": 15720
+ },
+ {
+ "epoch": 42.83651226158038,
+ "grad_norm": 7.010004043579102,
+ "learning_rate": 1.276921825039632e-05,
+ "loss": 0.2616,
+ "step": 15721
+ },
+ {
+ "epoch": 42.83923705722071,
+ "grad_norm": 5.467535495758057,
+ "learning_rate": 1.2768370257180449e-05,
+ "loss": 0.3691,
+ "step": 15722
+ },
+ {
+ "epoch": 42.84196185286103,
+ "grad_norm": 8.308337211608887,
+ "learning_rate": 1.2767522242404602e-05,
+ "loss": 0.1829,
+ "step": 15723
+ },
+ {
+ "epoch": 42.844686648501366,
+ "grad_norm": 5.9903178215026855,
+ "learning_rate": 1.276667420607538e-05,
+ "loss": 0.3084,
+ "step": 15724
+ },
+ {
+ "epoch": 42.84741144414169,
+ "grad_norm": 6.222293376922607,
+ "learning_rate": 1.276582614819939e-05,
+ "loss": 0.3444,
+ "step": 15725
+ },
+ {
+ "epoch": 42.85013623978202,
+ "grad_norm": 4.581437587738037,
+ "learning_rate": 1.2764978068783233e-05,
+ "loss": 0.2841,
+ "step": 15726
+ },
+ {
+ "epoch": 42.85286103542234,
+ "grad_norm": 7.398552894592285,
+ "learning_rate": 1.2764129967833518e-05,
+ "loss": 0.2128,
+ "step": 15727
+ },
+ {
+ "epoch": 42.85558583106267,
+ "grad_norm": 5.676241397857666,
+ "learning_rate": 1.2763281845356845e-05,
+ "loss": 0.1577,
+ "step": 15728
+ },
+ {
+ "epoch": 42.858310626702995,
+ "grad_norm": 5.449347972869873,
+ "learning_rate": 1.2762433701359827e-05,
+ "loss": 0.2946,
+ "step": 15729
+ },
+ {
+ "epoch": 42.86103542234333,
+ "grad_norm": 5.118447780609131,
+ "learning_rate": 1.2761585535849059e-05,
+ "loss": 0.2588,
+ "step": 15730
+ },
+ {
+ "epoch": 42.86376021798365,
+ "grad_norm": 5.3504252433776855,
+ "learning_rate": 1.2760737348831152e-05,
+ "loss": 0.2406,
+ "step": 15731
+ },
+ {
+ "epoch": 42.86648501362398,
+ "grad_norm": 5.175047874450684,
+ "learning_rate": 1.2759889140312711e-05,
+ "loss": 0.2955,
+ "step": 15732
+ },
+ {
+ "epoch": 42.869209809264305,
+ "grad_norm": 5.723325252532959,
+ "learning_rate": 1.2759040910300346e-05,
+ "loss": 0.1567,
+ "step": 15733
+ },
+ {
+ "epoch": 42.87193460490463,
+ "grad_norm": 5.2911224365234375,
+ "learning_rate": 1.2758192658800657e-05,
+ "loss": 0.3188,
+ "step": 15734
+ },
+ {
+ "epoch": 42.87465940054496,
+ "grad_norm": 4.562192440032959,
+ "learning_rate": 1.2757344385820254e-05,
+ "loss": 0.2519,
+ "step": 15735
+ },
+ {
+ "epoch": 42.87738419618529,
+ "grad_norm": 5.385756969451904,
+ "learning_rate": 1.2756496091365737e-05,
+ "loss": 0.2218,
+ "step": 15736
+ },
+ {
+ "epoch": 42.880108991825615,
+ "grad_norm": 5.6548752784729,
+ "learning_rate": 1.2755647775443722e-05,
+ "loss": 0.2245,
+ "step": 15737
+ },
+ {
+ "epoch": 42.88283378746594,
+ "grad_norm": 5.487072467803955,
+ "learning_rate": 1.275479943806081e-05,
+ "loss": 0.193,
+ "step": 15738
+ },
+ {
+ "epoch": 42.88555858310627,
+ "grad_norm": 6.113552093505859,
+ "learning_rate": 1.2753951079223606e-05,
+ "loss": 0.2282,
+ "step": 15739
+ },
+ {
+ "epoch": 42.88828337874659,
+ "grad_norm": 6.495295524597168,
+ "learning_rate": 1.275310269893872e-05,
+ "loss": 0.1993,
+ "step": 15740
+ },
+ {
+ "epoch": 42.89100817438692,
+ "grad_norm": 7.8980512619018555,
+ "learning_rate": 1.2752254297212762e-05,
+ "loss": 0.204,
+ "step": 15741
+ },
+ {
+ "epoch": 42.89373297002725,
+ "grad_norm": 6.508900165557861,
+ "learning_rate": 1.2751405874052334e-05,
+ "loss": 0.3016,
+ "step": 15742
+ },
+ {
+ "epoch": 42.89645776566758,
+ "grad_norm": 5.994144439697266,
+ "learning_rate": 1.2750557429464046e-05,
+ "loss": 0.2495,
+ "step": 15743
+ },
+ {
+ "epoch": 42.8991825613079,
+ "grad_norm": 5.538070201873779,
+ "learning_rate": 1.2749708963454507e-05,
+ "loss": 0.2072,
+ "step": 15744
+ },
+ {
+ "epoch": 42.90190735694823,
+ "grad_norm": 4.820894718170166,
+ "learning_rate": 1.274886047603032e-05,
+ "loss": 0.2049,
+ "step": 15745
+ },
+ {
+ "epoch": 42.904632152588555,
+ "grad_norm": 5.188495635986328,
+ "learning_rate": 1.2748011967198097e-05,
+ "loss": 0.1993,
+ "step": 15746
+ },
+ {
+ "epoch": 42.90735694822888,
+ "grad_norm": 5.004482269287109,
+ "learning_rate": 1.2747163436964447e-05,
+ "loss": 0.2109,
+ "step": 15747
+ },
+ {
+ "epoch": 42.91008174386921,
+ "grad_norm": 4.467107772827148,
+ "learning_rate": 1.274631488533597e-05,
+ "loss": 0.1824,
+ "step": 15748
+ },
+ {
+ "epoch": 42.91280653950954,
+ "grad_norm": 7.456881046295166,
+ "learning_rate": 1.274546631231929e-05,
+ "loss": 0.3516,
+ "step": 15749
+ },
+ {
+ "epoch": 42.915531335149865,
+ "grad_norm": 5.800576686859131,
+ "learning_rate": 1.2744617717921002e-05,
+ "loss": 0.3031,
+ "step": 15750
+ },
+ {
+ "epoch": 42.91825613079019,
+ "grad_norm": 4.827005863189697,
+ "learning_rate": 1.274376910214772e-05,
+ "loss": 0.1644,
+ "step": 15751
+ },
+ {
+ "epoch": 42.920980926430516,
+ "grad_norm": 6.49036169052124,
+ "learning_rate": 1.2742920465006052e-05,
+ "loss": 0.2566,
+ "step": 15752
+ },
+ {
+ "epoch": 42.92370572207084,
+ "grad_norm": 4.562337398529053,
+ "learning_rate": 1.2742071806502612e-05,
+ "loss": 0.1349,
+ "step": 15753
+ },
+ {
+ "epoch": 42.926430517711175,
+ "grad_norm": 5.6639509201049805,
+ "learning_rate": 1.2741223126644e-05,
+ "loss": 0.1537,
+ "step": 15754
+ },
+ {
+ "epoch": 42.9291553133515,
+ "grad_norm": 5.751596927642822,
+ "learning_rate": 1.2740374425436834e-05,
+ "loss": 0.1934,
+ "step": 15755
+ },
+ {
+ "epoch": 42.93188010899183,
+ "grad_norm": 5.298120021820068,
+ "learning_rate": 1.2739525702887718e-05,
+ "loss": 0.1716,
+ "step": 15756
+ },
+ {
+ "epoch": 42.93460490463215,
+ "grad_norm": 6.753478050231934,
+ "learning_rate": 1.2738676959003262e-05,
+ "loss": 0.2581,
+ "step": 15757
+ },
+ {
+ "epoch": 42.93732970027248,
+ "grad_norm": 7.195338249206543,
+ "learning_rate": 1.2737828193790081e-05,
+ "loss": 0.3621,
+ "step": 15758
+ },
+ {
+ "epoch": 42.940054495912804,
+ "grad_norm": 6.741783142089844,
+ "learning_rate": 1.2736979407254782e-05,
+ "loss": 0.2503,
+ "step": 15759
+ },
+ {
+ "epoch": 42.94277929155314,
+ "grad_norm": 15.566309928894043,
+ "learning_rate": 1.2736130599403973e-05,
+ "loss": 0.2491,
+ "step": 15760
+ },
+ {
+ "epoch": 42.94550408719346,
+ "grad_norm": 5.59145450592041,
+ "learning_rate": 1.2735281770244272e-05,
+ "loss": 0.1539,
+ "step": 15761
+ },
+ {
+ "epoch": 42.94822888283379,
+ "grad_norm": 6.900923728942871,
+ "learning_rate": 1.273443291978228e-05,
+ "loss": 0.1658,
+ "step": 15762
+ },
+ {
+ "epoch": 42.950953678474114,
+ "grad_norm": 6.400233268737793,
+ "learning_rate": 1.2733584048024614e-05,
+ "loss": 0.153,
+ "step": 15763
+ },
+ {
+ "epoch": 42.95367847411444,
+ "grad_norm": 7.227105617523193,
+ "learning_rate": 1.2732735154977885e-05,
+ "loss": 0.3138,
+ "step": 15764
+ },
+ {
+ "epoch": 42.956403269754766,
+ "grad_norm": 6.766824722290039,
+ "learning_rate": 1.2731886240648699e-05,
+ "loss": 0.2832,
+ "step": 15765
+ },
+ {
+ "epoch": 42.95912806539509,
+ "grad_norm": 7.418117523193359,
+ "learning_rate": 1.2731037305043675e-05,
+ "loss": 0.215,
+ "step": 15766
+ },
+ {
+ "epoch": 42.961852861035425,
+ "grad_norm": 6.897304534912109,
+ "learning_rate": 1.2730188348169416e-05,
+ "loss": 0.1917,
+ "step": 15767
+ },
+ {
+ "epoch": 42.96457765667575,
+ "grad_norm": 6.344455718994141,
+ "learning_rate": 1.272933937003254e-05,
+ "loss": 0.2007,
+ "step": 15768
+ },
+ {
+ "epoch": 42.967302452316076,
+ "grad_norm": 6.0487189292907715,
+ "learning_rate": 1.2728490370639659e-05,
+ "loss": 0.2554,
+ "step": 15769
+ },
+ {
+ "epoch": 42.9700272479564,
+ "grad_norm": 4.928340911865234,
+ "learning_rate": 1.2727641349997379e-05,
+ "loss": 0.2699,
+ "step": 15770
+ },
+ {
+ "epoch": 42.97275204359673,
+ "grad_norm": 5.338281154632568,
+ "learning_rate": 1.2726792308112319e-05,
+ "loss": 0.2481,
+ "step": 15771
+ },
+ {
+ "epoch": 42.97547683923706,
+ "grad_norm": 4.367077350616455,
+ "learning_rate": 1.2725943244991089e-05,
+ "loss": 0.1288,
+ "step": 15772
+ },
+ {
+ "epoch": 42.97820163487739,
+ "grad_norm": 4.917163372039795,
+ "learning_rate": 1.27250941606403e-05,
+ "loss": 0.1928,
+ "step": 15773
+ },
+ {
+ "epoch": 42.98092643051771,
+ "grad_norm": 6.855035305023193,
+ "learning_rate": 1.2724245055066561e-05,
+ "loss": 0.1877,
+ "step": 15774
+ },
+ {
+ "epoch": 42.98365122615804,
+ "grad_norm": 5.984237194061279,
+ "learning_rate": 1.2723395928276492e-05,
+ "loss": 0.2683,
+ "step": 15775
+ },
+ {
+ "epoch": 42.986376021798364,
+ "grad_norm": 5.014121055603027,
+ "learning_rate": 1.2722546780276705e-05,
+ "loss": 0.1354,
+ "step": 15776
+ },
+ {
+ "epoch": 42.98910081743869,
+ "grad_norm": 10.273235321044922,
+ "learning_rate": 1.272169761107381e-05,
+ "loss": 0.2324,
+ "step": 15777
+ },
+ {
+ "epoch": 42.991825613079016,
+ "grad_norm": 9.372404098510742,
+ "learning_rate": 1.272084842067442e-05,
+ "loss": 0.2366,
+ "step": 15778
+ },
+ {
+ "epoch": 42.99455040871935,
+ "grad_norm": 5.833219528198242,
+ "learning_rate": 1.2719999209085152e-05,
+ "loss": 0.4153,
+ "step": 15779
+ },
+ {
+ "epoch": 42.997275204359674,
+ "grad_norm": 7.8355913162231445,
+ "learning_rate": 1.2719149976312617e-05,
+ "loss": 0.4989,
+ "step": 15780
+ },
+ {
+ "epoch": 43.0,
+ "grad_norm": 4.25089693069458,
+ "learning_rate": 1.2718300722363431e-05,
+ "loss": 0.1144,
+ "step": 15781
+ },
+ {
+ "epoch": 43.002724795640326,
+ "grad_norm": 8.438754081726074,
+ "learning_rate": 1.2717451447244205e-05,
+ "loss": 0.1911,
+ "step": 15782
+ },
+ {
+ "epoch": 43.00544959128065,
+ "grad_norm": 5.1629252433776855,
+ "learning_rate": 1.2716602150961553e-05,
+ "loss": 0.2953,
+ "step": 15783
+ },
+ {
+ "epoch": 43.00817438692098,
+ "grad_norm": 4.964519500732422,
+ "learning_rate": 1.2715752833522094e-05,
+ "loss": 0.1674,
+ "step": 15784
+ },
+ {
+ "epoch": 43.01089918256131,
+ "grad_norm": 5.678306579589844,
+ "learning_rate": 1.2714903494932438e-05,
+ "loss": 0.179,
+ "step": 15785
+ },
+ {
+ "epoch": 43.013623978201636,
+ "grad_norm": 6.6454620361328125,
+ "learning_rate": 1.2714054135199201e-05,
+ "loss": 0.1723,
+ "step": 15786
+ },
+ {
+ "epoch": 43.01634877384196,
+ "grad_norm": 6.484141826629639,
+ "learning_rate": 1.2713204754328996e-05,
+ "loss": 0.1289,
+ "step": 15787
+ },
+ {
+ "epoch": 43.01907356948229,
+ "grad_norm": 4.936593532562256,
+ "learning_rate": 1.2712355352328442e-05,
+ "loss": 0.356,
+ "step": 15788
+ },
+ {
+ "epoch": 43.02179836512261,
+ "grad_norm": 5.204105377197266,
+ "learning_rate": 1.2711505929204153e-05,
+ "loss": 0.134,
+ "step": 15789
+ },
+ {
+ "epoch": 43.02452316076294,
+ "grad_norm": 5.359770774841309,
+ "learning_rate": 1.2710656484962742e-05,
+ "loss": 0.2325,
+ "step": 15790
+ },
+ {
+ "epoch": 43.02724795640327,
+ "grad_norm": 5.6926751136779785,
+ "learning_rate": 1.2709807019610823e-05,
+ "loss": 0.1692,
+ "step": 15791
+ },
+ {
+ "epoch": 43.0299727520436,
+ "grad_norm": 5.559471130371094,
+ "learning_rate": 1.2708957533155014e-05,
+ "loss": 0.2531,
+ "step": 15792
+ },
+ {
+ "epoch": 43.032697547683924,
+ "grad_norm": 4.012047290802002,
+ "learning_rate": 1.2708108025601935e-05,
+ "loss": 0.1518,
+ "step": 15793
+ },
+ {
+ "epoch": 43.03542234332425,
+ "grad_norm": 6.4738311767578125,
+ "learning_rate": 1.2707258496958197e-05,
+ "loss": 0.2364,
+ "step": 15794
+ },
+ {
+ "epoch": 43.038147138964575,
+ "grad_norm": 4.456639289855957,
+ "learning_rate": 1.2706408947230414e-05,
+ "loss": 0.1331,
+ "step": 15795
+ },
+ {
+ "epoch": 43.0408719346049,
+ "grad_norm": 6.203889846801758,
+ "learning_rate": 1.270555937642521e-05,
+ "loss": 0.2468,
+ "step": 15796
+ },
+ {
+ "epoch": 43.043596730245234,
+ "grad_norm": 4.330617427825928,
+ "learning_rate": 1.2704709784549192e-05,
+ "loss": 0.3094,
+ "step": 15797
+ },
+ {
+ "epoch": 43.04632152588556,
+ "grad_norm": 6.280506134033203,
+ "learning_rate": 1.2703860171608985e-05,
+ "loss": 0.2799,
+ "step": 15798
+ },
+ {
+ "epoch": 43.049046321525886,
+ "grad_norm": 6.598577976226807,
+ "learning_rate": 1.2703010537611198e-05,
+ "loss": 0.1708,
+ "step": 15799
+ },
+ {
+ "epoch": 43.05177111716621,
+ "grad_norm": 5.593931198120117,
+ "learning_rate": 1.2702160882562453e-05,
+ "loss": 0.188,
+ "step": 15800
+ },
+ {
+ "epoch": 43.05449591280654,
+ "grad_norm": 4.6534199714660645,
+ "learning_rate": 1.2701311206469366e-05,
+ "loss": 0.2912,
+ "step": 15801
+ },
+ {
+ "epoch": 43.05722070844686,
+ "grad_norm": 5.074550151824951,
+ "learning_rate": 1.2700461509338555e-05,
+ "loss": 0.1516,
+ "step": 15802
+ },
+ {
+ "epoch": 43.059945504087196,
+ "grad_norm": 6.933719635009766,
+ "learning_rate": 1.2699611791176638e-05,
+ "loss": 0.2509,
+ "step": 15803
+ },
+ {
+ "epoch": 43.06267029972752,
+ "grad_norm": 5.630640983581543,
+ "learning_rate": 1.269876205199023e-05,
+ "loss": 0.132,
+ "step": 15804
+ },
+ {
+ "epoch": 43.06539509536785,
+ "grad_norm": 6.669646739959717,
+ "learning_rate": 1.269791229178595e-05,
+ "loss": 0.2525,
+ "step": 15805
+ },
+ {
+ "epoch": 43.06811989100817,
+ "grad_norm": 6.0606584548950195,
+ "learning_rate": 1.2697062510570417e-05,
+ "loss": 0.2483,
+ "step": 15806
+ },
+ {
+ "epoch": 43.0708446866485,
+ "grad_norm": 5.033213138580322,
+ "learning_rate": 1.2696212708350247e-05,
+ "loss": 0.2202,
+ "step": 15807
+ },
+ {
+ "epoch": 43.073569482288825,
+ "grad_norm": 5.555293083190918,
+ "learning_rate": 1.2695362885132057e-05,
+ "loss": 0.2937,
+ "step": 15808
+ },
+ {
+ "epoch": 43.07629427792916,
+ "grad_norm": 5.399478435516357,
+ "learning_rate": 1.269451304092247e-05,
+ "loss": 0.1889,
+ "step": 15809
+ },
+ {
+ "epoch": 43.079019073569484,
+ "grad_norm": 6.696550369262695,
+ "learning_rate": 1.2693663175728102e-05,
+ "loss": 0.3098,
+ "step": 15810
+ },
+ {
+ "epoch": 43.08174386920981,
+ "grad_norm": 5.641627788543701,
+ "learning_rate": 1.269281328955557e-05,
+ "loss": 0.2914,
+ "step": 15811
+ },
+ {
+ "epoch": 43.084468664850135,
+ "grad_norm": 5.6052680015563965,
+ "learning_rate": 1.2691963382411498e-05,
+ "loss": 0.1666,
+ "step": 15812
+ },
+ {
+ "epoch": 43.08719346049046,
+ "grad_norm": 5.3014373779296875,
+ "learning_rate": 1.26911134543025e-05,
+ "loss": 0.2783,
+ "step": 15813
+ },
+ {
+ "epoch": 43.08991825613079,
+ "grad_norm": 4.597877502441406,
+ "learning_rate": 1.2690263505235199e-05,
+ "loss": 0.286,
+ "step": 15814
+ },
+ {
+ "epoch": 43.09264305177112,
+ "grad_norm": 4.8344645500183105,
+ "learning_rate": 1.2689413535216209e-05,
+ "loss": 0.2461,
+ "step": 15815
+ },
+ {
+ "epoch": 43.095367847411445,
+ "grad_norm": 4.9873046875,
+ "learning_rate": 1.2688563544252156e-05,
+ "loss": 0.1694,
+ "step": 15816
+ },
+ {
+ "epoch": 43.09809264305177,
+ "grad_norm": 5.87472677230835,
+ "learning_rate": 1.2687713532349653e-05,
+ "loss": 0.346,
+ "step": 15817
+ },
+ {
+ "epoch": 43.1008174386921,
+ "grad_norm": 5.895587921142578,
+ "learning_rate": 1.2686863499515327e-05,
+ "loss": 0.1604,
+ "step": 15818
+ },
+ {
+ "epoch": 43.10354223433242,
+ "grad_norm": 5.016204357147217,
+ "learning_rate": 1.2686013445755792e-05,
+ "loss": 0.2268,
+ "step": 15819
+ },
+ {
+ "epoch": 43.10626702997275,
+ "grad_norm": 4.473295211791992,
+ "learning_rate": 1.2685163371077676e-05,
+ "loss": 0.1698,
+ "step": 15820
+ },
+ {
+ "epoch": 43.10899182561308,
+ "grad_norm": 5.678323745727539,
+ "learning_rate": 1.2684313275487587e-05,
+ "loss": 0.2753,
+ "step": 15821
+ },
+ {
+ "epoch": 43.11171662125341,
+ "grad_norm": 5.489089012145996,
+ "learning_rate": 1.2683463158992157e-05,
+ "loss": 0.2203,
+ "step": 15822
+ },
+ {
+ "epoch": 43.11444141689373,
+ "grad_norm": 4.795029163360596,
+ "learning_rate": 1.2682613021598e-05,
+ "loss": 0.2138,
+ "step": 15823
+ },
+ {
+ "epoch": 43.11716621253406,
+ "grad_norm": 4.624063968658447,
+ "learning_rate": 1.2681762863311744e-05,
+ "loss": 0.2654,
+ "step": 15824
+ },
+ {
+ "epoch": 43.119891008174385,
+ "grad_norm": 5.710758209228516,
+ "learning_rate": 1.2680912684139996e-05,
+ "loss": 0.2917,
+ "step": 15825
+ },
+ {
+ "epoch": 43.12261580381471,
+ "grad_norm": 6.505515098571777,
+ "learning_rate": 1.2680062484089396e-05,
+ "loss": 0.2112,
+ "step": 15826
+ },
+ {
+ "epoch": 43.12534059945504,
+ "grad_norm": 5.088910102844238,
+ "learning_rate": 1.2679212263166548e-05,
+ "loss": 0.1748,
+ "step": 15827
+ },
+ {
+ "epoch": 43.12806539509537,
+ "grad_norm": 7.963064193725586,
+ "learning_rate": 1.2678362021378085e-05,
+ "loss": 0.2247,
+ "step": 15828
+ },
+ {
+ "epoch": 43.130790190735695,
+ "grad_norm": 5.173469543457031,
+ "learning_rate": 1.2677511758730625e-05,
+ "loss": 0.3488,
+ "step": 15829
+ },
+ {
+ "epoch": 43.13351498637602,
+ "grad_norm": 5.114818572998047,
+ "learning_rate": 1.267666147523079e-05,
+ "loss": 0.2002,
+ "step": 15830
+ },
+ {
+ "epoch": 43.13623978201635,
+ "grad_norm": 5.150710582733154,
+ "learning_rate": 1.2675811170885199e-05,
+ "loss": 0.2605,
+ "step": 15831
+ },
+ {
+ "epoch": 43.13896457765667,
+ "grad_norm": 4.721823215484619,
+ "learning_rate": 1.2674960845700478e-05,
+ "loss": 0.167,
+ "step": 15832
+ },
+ {
+ "epoch": 43.141689373297005,
+ "grad_norm": 7.443442344665527,
+ "learning_rate": 1.267411049968325e-05,
+ "loss": 0.1951,
+ "step": 15833
+ },
+ {
+ "epoch": 43.14441416893733,
+ "grad_norm": 6.747244834899902,
+ "learning_rate": 1.2673260132840133e-05,
+ "loss": 0.2664,
+ "step": 15834
+ },
+ {
+ "epoch": 43.14713896457766,
+ "grad_norm": 8.787422180175781,
+ "learning_rate": 1.2672409745177752e-05,
+ "loss": 0.1762,
+ "step": 15835
+ },
+ {
+ "epoch": 43.14986376021798,
+ "grad_norm": 7.668347358703613,
+ "learning_rate": 1.267155933670273e-05,
+ "loss": 0.1555,
+ "step": 15836
+ },
+ {
+ "epoch": 43.15258855585831,
+ "grad_norm": 23.420007705688477,
+ "learning_rate": 1.267070890742169e-05,
+ "loss": 0.1536,
+ "step": 15837
+ },
+ {
+ "epoch": 43.155313351498634,
+ "grad_norm": 5.895536422729492,
+ "learning_rate": 1.2669858457341258e-05,
+ "loss": 0.2571,
+ "step": 15838
+ },
+ {
+ "epoch": 43.15803814713897,
+ "grad_norm": 4.71837043762207,
+ "learning_rate": 1.266900798646805e-05,
+ "loss": 0.161,
+ "step": 15839
+ },
+ {
+ "epoch": 43.16076294277929,
+ "grad_norm": 5.424498558044434,
+ "learning_rate": 1.2668157494808697e-05,
+ "loss": 0.1275,
+ "step": 15840
+ },
+ {
+ "epoch": 43.16348773841962,
+ "grad_norm": 5.675332069396973,
+ "learning_rate": 1.2667306982369816e-05,
+ "loss": 0.1802,
+ "step": 15841
+ },
+ {
+ "epoch": 43.166212534059945,
+ "grad_norm": 3.783858060836792,
+ "learning_rate": 1.2666456449158037e-05,
+ "loss": 0.2775,
+ "step": 15842
+ },
+ {
+ "epoch": 43.16893732970027,
+ "grad_norm": 5.900336742401123,
+ "learning_rate": 1.2665605895179977e-05,
+ "loss": 0.3205,
+ "step": 15843
+ },
+ {
+ "epoch": 43.171662125340596,
+ "grad_norm": 4.113350868225098,
+ "learning_rate": 1.266475532044227e-05,
+ "loss": 0.148,
+ "step": 15844
+ },
+ {
+ "epoch": 43.17438692098093,
+ "grad_norm": 6.5994672775268555,
+ "learning_rate": 1.266390472495153e-05,
+ "loss": 0.2427,
+ "step": 15845
+ },
+ {
+ "epoch": 43.177111716621255,
+ "grad_norm": 5.132373809814453,
+ "learning_rate": 1.2663054108714388e-05,
+ "loss": 0.2726,
+ "step": 15846
+ },
+ {
+ "epoch": 43.17983651226158,
+ "grad_norm": 6.610569477081299,
+ "learning_rate": 1.2662203471737465e-05,
+ "loss": 0.3831,
+ "step": 15847
+ },
+ {
+ "epoch": 43.182561307901906,
+ "grad_norm": 5.182617664337158,
+ "learning_rate": 1.2661352814027388e-05,
+ "loss": 0.2854,
+ "step": 15848
+ },
+ {
+ "epoch": 43.18528610354223,
+ "grad_norm": 4.746345520019531,
+ "learning_rate": 1.266050213559078e-05,
+ "loss": 0.199,
+ "step": 15849
+ },
+ {
+ "epoch": 43.18801089918256,
+ "grad_norm": 6.213058948516846,
+ "learning_rate": 1.2659651436434268e-05,
+ "loss": 0.2269,
+ "step": 15850
+ },
+ {
+ "epoch": 43.19073569482289,
+ "grad_norm": 4.184413909912109,
+ "learning_rate": 1.2658800716564474e-05,
+ "loss": 0.1484,
+ "step": 15851
+ },
+ {
+ "epoch": 43.19346049046322,
+ "grad_norm": 6.441722869873047,
+ "learning_rate": 1.2657949975988028e-05,
+ "loss": 0.3351,
+ "step": 15852
+ },
+ {
+ "epoch": 43.19618528610354,
+ "grad_norm": 4.789957523345947,
+ "learning_rate": 1.2657099214711553e-05,
+ "loss": 0.1619,
+ "step": 15853
+ },
+ {
+ "epoch": 43.19891008174387,
+ "grad_norm": 4.777517795562744,
+ "learning_rate": 1.2656248432741674e-05,
+ "loss": 0.1425,
+ "step": 15854
+ },
+ {
+ "epoch": 43.201634877384194,
+ "grad_norm": 5.650998592376709,
+ "learning_rate": 1.2655397630085015e-05,
+ "loss": 0.1421,
+ "step": 15855
+ },
+ {
+ "epoch": 43.20435967302452,
+ "grad_norm": 6.645985126495361,
+ "learning_rate": 1.2654546806748209e-05,
+ "loss": 0.1788,
+ "step": 15856
+ },
+ {
+ "epoch": 43.20708446866485,
+ "grad_norm": 6.334911346435547,
+ "learning_rate": 1.2653695962737875e-05,
+ "loss": 0.2482,
+ "step": 15857
+ },
+ {
+ "epoch": 43.20980926430518,
+ "grad_norm": 5.914535999298096,
+ "learning_rate": 1.2652845098060647e-05,
+ "loss": 0.1692,
+ "step": 15858
+ },
+ {
+ "epoch": 43.212534059945504,
+ "grad_norm": 5.427907466888428,
+ "learning_rate": 1.2651994212723142e-05,
+ "loss": 0.2051,
+ "step": 15859
+ },
+ {
+ "epoch": 43.21525885558583,
+ "grad_norm": 5.219813346862793,
+ "learning_rate": 1.2651143306731992e-05,
+ "loss": 0.2219,
+ "step": 15860
+ },
+ {
+ "epoch": 43.217983651226156,
+ "grad_norm": 4.969454765319824,
+ "learning_rate": 1.2650292380093826e-05,
+ "loss": 0.2183,
+ "step": 15861
+ },
+ {
+ "epoch": 43.22070844686648,
+ "grad_norm": 5.98974084854126,
+ "learning_rate": 1.2649441432815266e-05,
+ "loss": 0.1773,
+ "step": 15862
+ },
+ {
+ "epoch": 43.223433242506815,
+ "grad_norm": 5.0268168449401855,
+ "learning_rate": 1.2648590464902941e-05,
+ "loss": 0.2191,
+ "step": 15863
+ },
+ {
+ "epoch": 43.22615803814714,
+ "grad_norm": 6.868879318237305,
+ "learning_rate": 1.264773947636348e-05,
+ "loss": 0.3091,
+ "step": 15864
+ },
+ {
+ "epoch": 43.228882833787466,
+ "grad_norm": 5.643497943878174,
+ "learning_rate": 1.2646888467203509e-05,
+ "loss": 0.1794,
+ "step": 15865
+ },
+ {
+ "epoch": 43.23160762942779,
+ "grad_norm": 8.155420303344727,
+ "learning_rate": 1.2646037437429654e-05,
+ "loss": 0.2581,
+ "step": 15866
+ },
+ {
+ "epoch": 43.23433242506812,
+ "grad_norm": 6.457836151123047,
+ "learning_rate": 1.2645186387048546e-05,
+ "loss": 0.173,
+ "step": 15867
+ },
+ {
+ "epoch": 43.237057220708444,
+ "grad_norm": 5.538093566894531,
+ "learning_rate": 1.2644335316066811e-05,
+ "loss": 0.2043,
+ "step": 15868
+ },
+ {
+ "epoch": 43.23978201634878,
+ "grad_norm": 4.105807781219482,
+ "learning_rate": 1.2643484224491078e-05,
+ "loss": 0.2702,
+ "step": 15869
+ },
+ {
+ "epoch": 43.2425068119891,
+ "grad_norm": 5.2638726234436035,
+ "learning_rate": 1.2642633112327975e-05,
+ "loss": 0.246,
+ "step": 15870
+ },
+ {
+ "epoch": 43.24523160762943,
+ "grad_norm": 6.423031330108643,
+ "learning_rate": 1.2641781979584133e-05,
+ "loss": 0.1329,
+ "step": 15871
+ },
+ {
+ "epoch": 43.247956403269754,
+ "grad_norm": 4.938924312591553,
+ "learning_rate": 1.2640930826266176e-05,
+ "loss": 0.221,
+ "step": 15872
+ },
+ {
+ "epoch": 43.25068119891008,
+ "grad_norm": 5.241696357727051,
+ "learning_rate": 1.2640079652380734e-05,
+ "loss": 0.1771,
+ "step": 15873
+ },
+ {
+ "epoch": 43.253405994550405,
+ "grad_norm": 5.034905433654785,
+ "learning_rate": 1.2639228457934435e-05,
+ "loss": 0.1534,
+ "step": 15874
+ },
+ {
+ "epoch": 43.25613079019074,
+ "grad_norm": 8.160731315612793,
+ "learning_rate": 1.2638377242933912e-05,
+ "loss": 0.3567,
+ "step": 15875
+ },
+ {
+ "epoch": 43.258855585831064,
+ "grad_norm": 6.0418877601623535,
+ "learning_rate": 1.2637526007385792e-05,
+ "loss": 0.2643,
+ "step": 15876
+ },
+ {
+ "epoch": 43.26158038147139,
+ "grad_norm": 4.733092308044434,
+ "learning_rate": 1.2636674751296702e-05,
+ "loss": 0.276,
+ "step": 15877
+ },
+ {
+ "epoch": 43.264305177111716,
+ "grad_norm": 4.871381759643555,
+ "learning_rate": 1.2635823474673277e-05,
+ "loss": 0.163,
+ "step": 15878
+ },
+ {
+ "epoch": 43.26702997275204,
+ "grad_norm": 4.54433536529541,
+ "learning_rate": 1.2634972177522143e-05,
+ "loss": 0.3121,
+ "step": 15879
+ },
+ {
+ "epoch": 43.26975476839237,
+ "grad_norm": 4.6075758934021,
+ "learning_rate": 1.263412085984993e-05,
+ "loss": 0.2503,
+ "step": 15880
+ },
+ {
+ "epoch": 43.2724795640327,
+ "grad_norm": 6.629269123077393,
+ "learning_rate": 1.2633269521663269e-05,
+ "loss": 0.2072,
+ "step": 15881
+ },
+ {
+ "epoch": 43.275204359673026,
+ "grad_norm": 8.31963062286377,
+ "learning_rate": 1.2632418162968789e-05,
+ "loss": 0.2411,
+ "step": 15882
+ },
+ {
+ "epoch": 43.27792915531335,
+ "grad_norm": 19.239208221435547,
+ "learning_rate": 1.2631566783773121e-05,
+ "loss": 0.2096,
+ "step": 15883
+ },
+ {
+ "epoch": 43.28065395095368,
+ "grad_norm": 4.6367716789245605,
+ "learning_rate": 1.2630715384082897e-05,
+ "loss": 0.2933,
+ "step": 15884
+ },
+ {
+ "epoch": 43.283378746594,
+ "grad_norm": 5.596940517425537,
+ "learning_rate": 1.2629863963904745e-05,
+ "loss": 0.1837,
+ "step": 15885
+ },
+ {
+ "epoch": 43.28610354223433,
+ "grad_norm": 5.270818710327148,
+ "learning_rate": 1.2629012523245294e-05,
+ "loss": 0.4278,
+ "step": 15886
+ },
+ {
+ "epoch": 43.28882833787466,
+ "grad_norm": 5.236704349517822,
+ "learning_rate": 1.2628161062111182e-05,
+ "loss": 0.2124,
+ "step": 15887
+ },
+ {
+ "epoch": 43.29155313351499,
+ "grad_norm": 6.127437591552734,
+ "learning_rate": 1.2627309580509034e-05,
+ "loss": 0.2041,
+ "step": 15888
+ },
+ {
+ "epoch": 43.294277929155314,
+ "grad_norm": 4.5770673751831055,
+ "learning_rate": 1.2626458078445487e-05,
+ "loss": 0.1639,
+ "step": 15889
+ },
+ {
+ "epoch": 43.29700272479564,
+ "grad_norm": 5.236861705780029,
+ "learning_rate": 1.2625606555927167e-05,
+ "loss": 0.1547,
+ "step": 15890
+ },
+ {
+ "epoch": 43.299727520435965,
+ "grad_norm": 5.086138725280762,
+ "learning_rate": 1.2624755012960707e-05,
+ "loss": 0.2465,
+ "step": 15891
+ },
+ {
+ "epoch": 43.30245231607629,
+ "grad_norm": 4.756349086761475,
+ "learning_rate": 1.2623903449552741e-05,
+ "loss": 0.1608,
+ "step": 15892
+ },
+ {
+ "epoch": 43.305177111716624,
+ "grad_norm": 5.747576713562012,
+ "learning_rate": 1.2623051865709899e-05,
+ "loss": 0.3202,
+ "step": 15893
+ },
+ {
+ "epoch": 43.30790190735695,
+ "grad_norm": 7.722446918487549,
+ "learning_rate": 1.262220026143881e-05,
+ "loss": 0.1602,
+ "step": 15894
+ },
+ {
+ "epoch": 43.310626702997276,
+ "grad_norm": 13.73774528503418,
+ "learning_rate": 1.2621348636746115e-05,
+ "loss": 0.2676,
+ "step": 15895
+ },
+ {
+ "epoch": 43.3133514986376,
+ "grad_norm": 4.293647766113281,
+ "learning_rate": 1.2620496991638439e-05,
+ "loss": 0.1291,
+ "step": 15896
+ },
+ {
+ "epoch": 43.31607629427793,
+ "grad_norm": 11.641107559204102,
+ "learning_rate": 1.2619645326122416e-05,
+ "loss": 0.2622,
+ "step": 15897
+ },
+ {
+ "epoch": 43.31880108991825,
+ "grad_norm": 5.130149841308594,
+ "learning_rate": 1.261879364020468e-05,
+ "loss": 0.1486,
+ "step": 15898
+ },
+ {
+ "epoch": 43.321525885558586,
+ "grad_norm": 4.847710132598877,
+ "learning_rate": 1.2617941933891867e-05,
+ "loss": 0.3147,
+ "step": 15899
+ },
+ {
+ "epoch": 43.32425068119891,
+ "grad_norm": 4.9436116218566895,
+ "learning_rate": 1.26170902071906e-05,
+ "loss": 0.2143,
+ "step": 15900
+ },
+ {
+ "epoch": 43.32697547683924,
+ "grad_norm": 5.533937931060791,
+ "learning_rate": 1.2616238460107525e-05,
+ "loss": 0.2049,
+ "step": 15901
+ },
+ {
+ "epoch": 43.32970027247956,
+ "grad_norm": 6.411024570465088,
+ "learning_rate": 1.2615386692649263e-05,
+ "loss": 0.1421,
+ "step": 15902
+ },
+ {
+ "epoch": 43.33242506811989,
+ "grad_norm": 4.478221893310547,
+ "learning_rate": 1.2614534904822455e-05,
+ "loss": 0.2364,
+ "step": 15903
+ },
+ {
+ "epoch": 43.335149863760215,
+ "grad_norm": 6.68491268157959,
+ "learning_rate": 1.2613683096633736e-05,
+ "loss": 0.3194,
+ "step": 15904
+ },
+ {
+ "epoch": 43.33787465940055,
+ "grad_norm": 5.500149726867676,
+ "learning_rate": 1.2612831268089736e-05,
+ "loss": 0.1888,
+ "step": 15905
+ },
+ {
+ "epoch": 43.34059945504087,
+ "grad_norm": 5.258341312408447,
+ "learning_rate": 1.261197941919709e-05,
+ "loss": 0.2387,
+ "step": 15906
+ },
+ {
+ "epoch": 43.3433242506812,
+ "grad_norm": 4.661367893218994,
+ "learning_rate": 1.2611127549962432e-05,
+ "loss": 0.1575,
+ "step": 15907
+ },
+ {
+ "epoch": 43.346049046321525,
+ "grad_norm": 4.837214946746826,
+ "learning_rate": 1.2610275660392397e-05,
+ "loss": 0.2816,
+ "step": 15908
+ },
+ {
+ "epoch": 43.34877384196185,
+ "grad_norm": 5.191956520080566,
+ "learning_rate": 1.2609423750493622e-05,
+ "loss": 0.2298,
+ "step": 15909
+ },
+ {
+ "epoch": 43.35149863760218,
+ "grad_norm": 4.816946983337402,
+ "learning_rate": 1.2608571820272734e-05,
+ "loss": 0.2029,
+ "step": 15910
+ },
+ {
+ "epoch": 43.35422343324251,
+ "grad_norm": 5.787227630615234,
+ "learning_rate": 1.2607719869736374e-05,
+ "loss": 0.1945,
+ "step": 15911
+ },
+ {
+ "epoch": 43.356948228882835,
+ "grad_norm": 5.747407913208008,
+ "learning_rate": 1.2606867898891175e-05,
+ "loss": 0.1796,
+ "step": 15912
+ },
+ {
+ "epoch": 43.35967302452316,
+ "grad_norm": 5.252607345581055,
+ "learning_rate": 1.2606015907743777e-05,
+ "loss": 0.1556,
+ "step": 15913
+ },
+ {
+ "epoch": 43.36239782016349,
+ "grad_norm": 5.972566604614258,
+ "learning_rate": 1.2605163896300808e-05,
+ "loss": 0.2113,
+ "step": 15914
+ },
+ {
+ "epoch": 43.36512261580381,
+ "grad_norm": 5.59675407409668,
+ "learning_rate": 1.2604311864568905e-05,
+ "loss": 0.2823,
+ "step": 15915
+ },
+ {
+ "epoch": 43.36784741144414,
+ "grad_norm": 5.3479905128479,
+ "learning_rate": 1.2603459812554708e-05,
+ "loss": 0.1877,
+ "step": 15916
+ },
+ {
+ "epoch": 43.37057220708447,
+ "grad_norm": 5.108469486236572,
+ "learning_rate": 1.260260774026485e-05,
+ "loss": 0.1691,
+ "step": 15917
+ },
+ {
+ "epoch": 43.3732970027248,
+ "grad_norm": 7.5149736404418945,
+ "learning_rate": 1.2601755647705963e-05,
+ "loss": 0.184,
+ "step": 15918
+ },
+ {
+ "epoch": 43.37602179836512,
+ "grad_norm": 4.790966033935547,
+ "learning_rate": 1.260090353488469e-05,
+ "loss": 0.277,
+ "step": 15919
+ },
+ {
+ "epoch": 43.37874659400545,
+ "grad_norm": 5.162489414215088,
+ "learning_rate": 1.2600051401807659e-05,
+ "loss": 0.3124,
+ "step": 15920
+ },
+ {
+ "epoch": 43.381471389645775,
+ "grad_norm": 4.985558032989502,
+ "learning_rate": 1.2599199248481515e-05,
+ "loss": 0.2502,
+ "step": 15921
+ },
+ {
+ "epoch": 43.3841961852861,
+ "grad_norm": 5.302313327789307,
+ "learning_rate": 1.2598347074912891e-05,
+ "loss": 0.2769,
+ "step": 15922
+ },
+ {
+ "epoch": 43.38692098092643,
+ "grad_norm": 4.48428201675415,
+ "learning_rate": 1.2597494881108425e-05,
+ "loss": 0.2012,
+ "step": 15923
+ },
+ {
+ "epoch": 43.38964577656676,
+ "grad_norm": 5.0740132331848145,
+ "learning_rate": 1.259664266707475e-05,
+ "loss": 0.3165,
+ "step": 15924
+ },
+ {
+ "epoch": 43.392370572207085,
+ "grad_norm": 6.1025390625,
+ "learning_rate": 1.2595790432818508e-05,
+ "loss": 0.3137,
+ "step": 15925
+ },
+ {
+ "epoch": 43.39509536784741,
+ "grad_norm": 6.309225082397461,
+ "learning_rate": 1.2594938178346332e-05,
+ "loss": 0.2605,
+ "step": 15926
+ },
+ {
+ "epoch": 43.39782016348774,
+ "grad_norm": 4.591233730316162,
+ "learning_rate": 1.2594085903664861e-05,
+ "loss": 0.2574,
+ "step": 15927
+ },
+ {
+ "epoch": 43.40054495912806,
+ "grad_norm": 5.807793617248535,
+ "learning_rate": 1.2593233608780733e-05,
+ "loss": 0.1706,
+ "step": 15928
+ },
+ {
+ "epoch": 43.403269754768395,
+ "grad_norm": 4.671628475189209,
+ "learning_rate": 1.2592381293700583e-05,
+ "loss": 0.1156,
+ "step": 15929
+ },
+ {
+ "epoch": 43.40599455040872,
+ "grad_norm": 5.2835307121276855,
+ "learning_rate": 1.2591528958431052e-05,
+ "loss": 0.2042,
+ "step": 15930
+ },
+ {
+ "epoch": 43.40871934604905,
+ "grad_norm": 4.173274517059326,
+ "learning_rate": 1.259067660297878e-05,
+ "loss": 0.1545,
+ "step": 15931
+ },
+ {
+ "epoch": 43.41144414168937,
+ "grad_norm": 4.61704683303833,
+ "learning_rate": 1.2589824227350397e-05,
+ "loss": 0.2786,
+ "step": 15932
+ },
+ {
+ "epoch": 43.4141689373297,
+ "grad_norm": 4.443673133850098,
+ "learning_rate": 1.2588971831552553e-05,
+ "loss": 0.2406,
+ "step": 15933
+ },
+ {
+ "epoch": 43.416893732970024,
+ "grad_norm": 5.341704368591309,
+ "learning_rate": 1.2588119415591873e-05,
+ "loss": 0.2189,
+ "step": 15934
+ },
+ {
+ "epoch": 43.41961852861036,
+ "grad_norm": 4.745103359222412,
+ "learning_rate": 1.2587266979475006e-05,
+ "loss": 0.2466,
+ "step": 15935
+ },
+ {
+ "epoch": 43.42234332425068,
+ "grad_norm": 5.30593729019165,
+ "learning_rate": 1.2586414523208586e-05,
+ "loss": 0.2246,
+ "step": 15936
+ },
+ {
+ "epoch": 43.42506811989101,
+ "grad_norm": 4.774023532867432,
+ "learning_rate": 1.2585562046799251e-05,
+ "loss": 0.1179,
+ "step": 15937
+ },
+ {
+ "epoch": 43.427792915531334,
+ "grad_norm": 4.554322719573975,
+ "learning_rate": 1.2584709550253644e-05,
+ "loss": 0.2502,
+ "step": 15938
+ },
+ {
+ "epoch": 43.43051771117166,
+ "grad_norm": 5.701827049255371,
+ "learning_rate": 1.2583857033578401e-05,
+ "loss": 0.3235,
+ "step": 15939
+ },
+ {
+ "epoch": 43.433242506811986,
+ "grad_norm": 6.528021812438965,
+ "learning_rate": 1.2583004496780164e-05,
+ "loss": 0.3034,
+ "step": 15940
+ },
+ {
+ "epoch": 43.43596730245232,
+ "grad_norm": 6.078108310699463,
+ "learning_rate": 1.258215193986557e-05,
+ "loss": 0.1343,
+ "step": 15941
+ },
+ {
+ "epoch": 43.438692098092645,
+ "grad_norm": 5.999648094177246,
+ "learning_rate": 1.2581299362841262e-05,
+ "loss": 0.1692,
+ "step": 15942
+ },
+ {
+ "epoch": 43.44141689373297,
+ "grad_norm": 6.091801166534424,
+ "learning_rate": 1.2580446765713876e-05,
+ "loss": 0.3725,
+ "step": 15943
+ },
+ {
+ "epoch": 43.444141689373296,
+ "grad_norm": 5.250519275665283,
+ "learning_rate": 1.2579594148490054e-05,
+ "loss": 0.1306,
+ "step": 15944
+ },
+ {
+ "epoch": 43.44686648501362,
+ "grad_norm": 4.235337257385254,
+ "learning_rate": 1.2578741511176436e-05,
+ "loss": 0.1967,
+ "step": 15945
+ },
+ {
+ "epoch": 43.44959128065395,
+ "grad_norm": 4.8902435302734375,
+ "learning_rate": 1.257788885377966e-05,
+ "loss": 0.1744,
+ "step": 15946
+ },
+ {
+ "epoch": 43.45231607629428,
+ "grad_norm": 6.23908805847168,
+ "learning_rate": 1.257703617630637e-05,
+ "loss": 0.1973,
+ "step": 15947
+ },
+ {
+ "epoch": 43.45504087193461,
+ "grad_norm": 5.5344648361206055,
+ "learning_rate": 1.2576183478763207e-05,
+ "loss": 0.1486,
+ "step": 15948
+ },
+ {
+ "epoch": 43.45776566757493,
+ "grad_norm": 4.776824474334717,
+ "learning_rate": 1.2575330761156808e-05,
+ "loss": 0.4061,
+ "step": 15949
+ },
+ {
+ "epoch": 43.46049046321526,
+ "grad_norm": 4.633957386016846,
+ "learning_rate": 1.2574478023493817e-05,
+ "loss": 0.2403,
+ "step": 15950
+ },
+ {
+ "epoch": 43.463215258855584,
+ "grad_norm": 3.901925563812256,
+ "learning_rate": 1.2573625265780873e-05,
+ "loss": 0.21,
+ "step": 15951
+ },
+ {
+ "epoch": 43.46594005449591,
+ "grad_norm": 5.508082389831543,
+ "learning_rate": 1.257277248802462e-05,
+ "loss": 0.3442,
+ "step": 15952
+ },
+ {
+ "epoch": 43.46866485013624,
+ "grad_norm": 6.7831926345825195,
+ "learning_rate": 1.2571919690231695e-05,
+ "loss": 0.3998,
+ "step": 15953
+ },
+ {
+ "epoch": 43.47138964577657,
+ "grad_norm": 4.064985275268555,
+ "learning_rate": 1.2571066872408744e-05,
+ "loss": 0.1023,
+ "step": 15954
+ },
+ {
+ "epoch": 43.474114441416894,
+ "grad_norm": 7.114734649658203,
+ "learning_rate": 1.2570214034562404e-05,
+ "loss": 0.245,
+ "step": 15955
+ },
+ {
+ "epoch": 43.47683923705722,
+ "grad_norm": 5.0616278648376465,
+ "learning_rate": 1.2569361176699323e-05,
+ "loss": 0.22,
+ "step": 15956
+ },
+ {
+ "epoch": 43.479564032697546,
+ "grad_norm": 7.711175441741943,
+ "learning_rate": 1.256850829882614e-05,
+ "loss": 0.2321,
+ "step": 15957
+ },
+ {
+ "epoch": 43.48228882833787,
+ "grad_norm": 11.367053031921387,
+ "learning_rate": 1.2567655400949497e-05,
+ "loss": 0.3439,
+ "step": 15958
+ },
+ {
+ "epoch": 43.485013623978205,
+ "grad_norm": 6.908168315887451,
+ "learning_rate": 1.2566802483076033e-05,
+ "loss": 0.198,
+ "step": 15959
+ },
+ {
+ "epoch": 43.48773841961853,
+ "grad_norm": 5.678273677825928,
+ "learning_rate": 1.25659495452124e-05,
+ "loss": 0.3083,
+ "step": 15960
+ },
+ {
+ "epoch": 43.490463215258856,
+ "grad_norm": 4.642317295074463,
+ "learning_rate": 1.256509658736523e-05,
+ "loss": 0.1347,
+ "step": 15961
+ },
+ {
+ "epoch": 43.49318801089918,
+ "grad_norm": 5.812233924865723,
+ "learning_rate": 1.2564243609541172e-05,
+ "loss": 0.1897,
+ "step": 15962
+ },
+ {
+ "epoch": 43.49591280653951,
+ "grad_norm": 5.294683456420898,
+ "learning_rate": 1.2563390611746864e-05,
+ "loss": 0.1106,
+ "step": 15963
+ },
+ {
+ "epoch": 43.49863760217983,
+ "grad_norm": 5.511291027069092,
+ "learning_rate": 1.2562537593988954e-05,
+ "loss": 0.2228,
+ "step": 15964
+ },
+ {
+ "epoch": 43.50136239782017,
+ "grad_norm": 5.468712329864502,
+ "learning_rate": 1.2561684556274085e-05,
+ "loss": 0.2565,
+ "step": 15965
+ },
+ {
+ "epoch": 43.50408719346049,
+ "grad_norm": 6.432379245758057,
+ "learning_rate": 1.25608314986089e-05,
+ "loss": 0.1214,
+ "step": 15966
+ },
+ {
+ "epoch": 43.50681198910082,
+ "grad_norm": 6.043390274047852,
+ "learning_rate": 1.2559978421000039e-05,
+ "loss": 0.1766,
+ "step": 15967
+ },
+ {
+ "epoch": 43.509536784741144,
+ "grad_norm": 4.677197456359863,
+ "learning_rate": 1.2559125323454154e-05,
+ "loss": 0.2536,
+ "step": 15968
+ },
+ {
+ "epoch": 43.51226158038147,
+ "grad_norm": 4.803244113922119,
+ "learning_rate": 1.2558272205977877e-05,
+ "loss": 0.2002,
+ "step": 15969
+ },
+ {
+ "epoch": 43.514986376021795,
+ "grad_norm": 4.047486782073975,
+ "learning_rate": 1.255741906857786e-05,
+ "loss": 0.1019,
+ "step": 15970
+ },
+ {
+ "epoch": 43.51771117166213,
+ "grad_norm": 8.100784301757812,
+ "learning_rate": 1.2556565911260747e-05,
+ "loss": 0.2284,
+ "step": 15971
+ },
+ {
+ "epoch": 43.520435967302454,
+ "grad_norm": 5.012939453125,
+ "learning_rate": 1.2555712734033179e-05,
+ "loss": 0.1698,
+ "step": 15972
+ },
+ {
+ "epoch": 43.52316076294278,
+ "grad_norm": 6.9246931076049805,
+ "learning_rate": 1.2554859536901805e-05,
+ "loss": 0.303,
+ "step": 15973
+ },
+ {
+ "epoch": 43.525885558583106,
+ "grad_norm": 6.250595569610596,
+ "learning_rate": 1.2554006319873265e-05,
+ "loss": 0.1173,
+ "step": 15974
+ },
+ {
+ "epoch": 43.52861035422343,
+ "grad_norm": 4.4001898765563965,
+ "learning_rate": 1.2553153082954206e-05,
+ "loss": 0.265,
+ "step": 15975
+ },
+ {
+ "epoch": 43.53133514986376,
+ "grad_norm": 5.430992603302002,
+ "learning_rate": 1.2552299826151275e-05,
+ "loss": 0.2309,
+ "step": 15976
+ },
+ {
+ "epoch": 43.53405994550409,
+ "grad_norm": 4.987862586975098,
+ "learning_rate": 1.2551446549471114e-05,
+ "loss": 0.3293,
+ "step": 15977
+ },
+ {
+ "epoch": 43.536784741144416,
+ "grad_norm": 6.801769256591797,
+ "learning_rate": 1.2550593252920371e-05,
+ "loss": 0.2247,
+ "step": 15978
+ },
+ {
+ "epoch": 43.53950953678474,
+ "grad_norm": 4.975493907928467,
+ "learning_rate": 1.2549739936505687e-05,
+ "loss": 0.1541,
+ "step": 15979
+ },
+ {
+ "epoch": 43.54223433242507,
+ "grad_norm": 5.002984523773193,
+ "learning_rate": 1.2548886600233709e-05,
+ "loss": 0.1904,
+ "step": 15980
+ },
+ {
+ "epoch": 43.54495912806539,
+ "grad_norm": 4.474903106689453,
+ "learning_rate": 1.2548033244111087e-05,
+ "loss": 0.1213,
+ "step": 15981
+ },
+ {
+ "epoch": 43.54768392370572,
+ "grad_norm": 5.30739164352417,
+ "learning_rate": 1.2547179868144466e-05,
+ "loss": 0.1704,
+ "step": 15982
+ },
+ {
+ "epoch": 43.55040871934605,
+ "grad_norm": 6.663933277130127,
+ "learning_rate": 1.2546326472340486e-05,
+ "loss": 0.1754,
+ "step": 15983
+ },
+ {
+ "epoch": 43.55313351498638,
+ "grad_norm": 4.3429131507873535,
+ "learning_rate": 1.2545473056705801e-05,
+ "loss": 0.133,
+ "step": 15984
+ },
+ {
+ "epoch": 43.555858310626704,
+ "grad_norm": 5.424915313720703,
+ "learning_rate": 1.2544619621247052e-05,
+ "loss": 0.1214,
+ "step": 15985
+ },
+ {
+ "epoch": 43.55858310626703,
+ "grad_norm": 5.305258274078369,
+ "learning_rate": 1.2543766165970887e-05,
+ "loss": 0.1232,
+ "step": 15986
+ },
+ {
+ "epoch": 43.561307901907355,
+ "grad_norm": 4.916006565093994,
+ "learning_rate": 1.2542912690883954e-05,
+ "loss": 0.2455,
+ "step": 15987
+ },
+ {
+ "epoch": 43.56403269754768,
+ "grad_norm": 5.430879592895508,
+ "learning_rate": 1.25420591959929e-05,
+ "loss": 0.2218,
+ "step": 15988
+ },
+ {
+ "epoch": 43.566757493188014,
+ "grad_norm": 4.888143539428711,
+ "learning_rate": 1.2541205681304364e-05,
+ "loss": 0.1677,
+ "step": 15989
+ },
+ {
+ "epoch": 43.56948228882834,
+ "grad_norm": 4.813355445861816,
+ "learning_rate": 1.2540352146825008e-05,
+ "loss": 0.1328,
+ "step": 15990
+ },
+ {
+ "epoch": 43.572207084468666,
+ "grad_norm": 6.177624225616455,
+ "learning_rate": 1.2539498592561468e-05,
+ "loss": 0.216,
+ "step": 15991
+ },
+ {
+ "epoch": 43.57493188010899,
+ "grad_norm": 5.1723432540893555,
+ "learning_rate": 1.2538645018520396e-05,
+ "loss": 0.1481,
+ "step": 15992
+ },
+ {
+ "epoch": 43.57765667574932,
+ "grad_norm": 5.250513553619385,
+ "learning_rate": 1.2537791424708436e-05,
+ "loss": 0.3468,
+ "step": 15993
+ },
+ {
+ "epoch": 43.58038147138964,
+ "grad_norm": 5.463875770568848,
+ "learning_rate": 1.2536937811132242e-05,
+ "loss": 0.1758,
+ "step": 15994
+ },
+ {
+ "epoch": 43.583106267029976,
+ "grad_norm": 5.446907997131348,
+ "learning_rate": 1.2536084177798453e-05,
+ "loss": 0.1342,
+ "step": 15995
+ },
+ {
+ "epoch": 43.5858310626703,
+ "grad_norm": 6.789150238037109,
+ "learning_rate": 1.2535230524713726e-05,
+ "loss": 0.1471,
+ "step": 15996
+ },
+ {
+ "epoch": 43.58855585831063,
+ "grad_norm": 7.316271781921387,
+ "learning_rate": 1.2534376851884702e-05,
+ "loss": 0.27,
+ "step": 15997
+ },
+ {
+ "epoch": 43.59128065395095,
+ "grad_norm": 5.163402080535889,
+ "learning_rate": 1.2533523159318035e-05,
+ "loss": 0.1695,
+ "step": 15998
+ },
+ {
+ "epoch": 43.59400544959128,
+ "grad_norm": 4.516694068908691,
+ "learning_rate": 1.2532669447020369e-05,
+ "loss": 0.1947,
+ "step": 15999
+ },
+ {
+ "epoch": 43.596730245231605,
+ "grad_norm": 6.344399929046631,
+ "learning_rate": 1.2531815714998356e-05,
+ "loss": 0.307,
+ "step": 16000
+ },
+ {
+ "epoch": 43.59945504087194,
+ "grad_norm": 5.544537544250488,
+ "learning_rate": 1.2530961963258643e-05,
+ "loss": 0.1917,
+ "step": 16001
+ },
+ {
+ "epoch": 43.60217983651226,
+ "grad_norm": 7.054203987121582,
+ "learning_rate": 1.2530108191807884e-05,
+ "loss": 0.2518,
+ "step": 16002
+ },
+ {
+ "epoch": 43.60490463215259,
+ "grad_norm": 5.008299350738525,
+ "learning_rate": 1.252925440065272e-05,
+ "loss": 0.1638,
+ "step": 16003
+ },
+ {
+ "epoch": 43.607629427792915,
+ "grad_norm": 5.451460838317871,
+ "learning_rate": 1.2528400589799805e-05,
+ "loss": 0.2308,
+ "step": 16004
+ },
+ {
+ "epoch": 43.61035422343324,
+ "grad_norm": 7.667142868041992,
+ "learning_rate": 1.2527546759255786e-05,
+ "loss": 0.1488,
+ "step": 16005
+ },
+ {
+ "epoch": 43.61307901907357,
+ "grad_norm": 6.472372531890869,
+ "learning_rate": 1.2526692909027314e-05,
+ "loss": 0.2041,
+ "step": 16006
+ },
+ {
+ "epoch": 43.6158038147139,
+ "grad_norm": 4.346190929412842,
+ "learning_rate": 1.252583903912104e-05,
+ "loss": 0.2752,
+ "step": 16007
+ },
+ {
+ "epoch": 43.618528610354225,
+ "grad_norm": 4.9120192527771,
+ "learning_rate": 1.2524985149543616e-05,
+ "loss": 0.3718,
+ "step": 16008
+ },
+ {
+ "epoch": 43.62125340599455,
+ "grad_norm": 4.977303504943848,
+ "learning_rate": 1.2524131240301684e-05,
+ "loss": 0.22,
+ "step": 16009
+ },
+ {
+ "epoch": 43.62397820163488,
+ "grad_norm": 5.490370273590088,
+ "learning_rate": 1.2523277311401903e-05,
+ "loss": 0.2609,
+ "step": 16010
+ },
+ {
+ "epoch": 43.6267029972752,
+ "grad_norm": 9.68083381652832,
+ "learning_rate": 1.2522423362850917e-05,
+ "loss": 0.2579,
+ "step": 16011
+ },
+ {
+ "epoch": 43.62942779291553,
+ "grad_norm": 7.106309413909912,
+ "learning_rate": 1.2521569394655382e-05,
+ "loss": 0.4242,
+ "step": 16012
+ },
+ {
+ "epoch": 43.63215258855586,
+ "grad_norm": 5.843109607696533,
+ "learning_rate": 1.2520715406821942e-05,
+ "loss": 0.19,
+ "step": 16013
+ },
+ {
+ "epoch": 43.63487738419619,
+ "grad_norm": 4.223015785217285,
+ "learning_rate": 1.2519861399357254e-05,
+ "loss": 0.1386,
+ "step": 16014
+ },
+ {
+ "epoch": 43.63760217983651,
+ "grad_norm": 6.382819175720215,
+ "learning_rate": 1.2519007372267964e-05,
+ "loss": 0.291,
+ "step": 16015
+ },
+ {
+ "epoch": 43.64032697547684,
+ "grad_norm": 4.584835529327393,
+ "learning_rate": 1.2518153325560726e-05,
+ "loss": 0.1245,
+ "step": 16016
+ },
+ {
+ "epoch": 43.643051771117165,
+ "grad_norm": 3.7178592681884766,
+ "learning_rate": 1.2517299259242193e-05,
+ "loss": 0.1624,
+ "step": 16017
+ },
+ {
+ "epoch": 43.64577656675749,
+ "grad_norm": 5.389956951141357,
+ "learning_rate": 1.2516445173319013e-05,
+ "loss": 0.236,
+ "step": 16018
+ },
+ {
+ "epoch": 43.64850136239782,
+ "grad_norm": 6.396854400634766,
+ "learning_rate": 1.2515591067797841e-05,
+ "loss": 0.2456,
+ "step": 16019
+ },
+ {
+ "epoch": 43.65122615803815,
+ "grad_norm": 6.409819602966309,
+ "learning_rate": 1.2514736942685326e-05,
+ "loss": 0.2351,
+ "step": 16020
+ },
+ {
+ "epoch": 43.653950953678475,
+ "grad_norm": 4.087258338928223,
+ "learning_rate": 1.251388279798812e-05,
+ "loss": 0.1525,
+ "step": 16021
+ },
+ {
+ "epoch": 43.6566757493188,
+ "grad_norm": 5.1316819190979,
+ "learning_rate": 1.2513028633712875e-05,
+ "loss": 0.2031,
+ "step": 16022
+ },
+ {
+ "epoch": 43.65940054495913,
+ "grad_norm": 7.15573263168335,
+ "learning_rate": 1.2512174449866243e-05,
+ "loss": 0.4549,
+ "step": 16023
+ },
+ {
+ "epoch": 43.66212534059945,
+ "grad_norm": 4.485933780670166,
+ "learning_rate": 1.251132024645488e-05,
+ "loss": 0.2953,
+ "step": 16024
+ },
+ {
+ "epoch": 43.664850136239785,
+ "grad_norm": 4.975935459136963,
+ "learning_rate": 1.2510466023485435e-05,
+ "loss": 0.1809,
+ "step": 16025
+ },
+ {
+ "epoch": 43.66757493188011,
+ "grad_norm": 5.3832688331604,
+ "learning_rate": 1.2509611780964562e-05,
+ "loss": 0.2421,
+ "step": 16026
+ },
+ {
+ "epoch": 43.67029972752044,
+ "grad_norm": 7.378668785095215,
+ "learning_rate": 1.2508757518898911e-05,
+ "loss": 0.2202,
+ "step": 16027
+ },
+ {
+ "epoch": 43.67302452316076,
+ "grad_norm": 5.278179168701172,
+ "learning_rate": 1.2507903237295138e-05,
+ "loss": 0.1807,
+ "step": 16028
+ },
+ {
+ "epoch": 43.67574931880109,
+ "grad_norm": 6.28816032409668,
+ "learning_rate": 1.2507048936159896e-05,
+ "loss": 0.1944,
+ "step": 16029
+ },
+ {
+ "epoch": 43.678474114441414,
+ "grad_norm": 4.760003089904785,
+ "learning_rate": 1.2506194615499836e-05,
+ "loss": 0.2402,
+ "step": 16030
+ },
+ {
+ "epoch": 43.68119891008175,
+ "grad_norm": 6.2029805183410645,
+ "learning_rate": 1.2505340275321613e-05,
+ "loss": 0.2573,
+ "step": 16031
+ },
+ {
+ "epoch": 43.68392370572207,
+ "grad_norm": 4.338624954223633,
+ "learning_rate": 1.2504485915631883e-05,
+ "loss": 0.1321,
+ "step": 16032
+ },
+ {
+ "epoch": 43.6866485013624,
+ "grad_norm": 4.835025310516357,
+ "learning_rate": 1.2503631536437295e-05,
+ "loss": 0.1835,
+ "step": 16033
+ },
+ {
+ "epoch": 43.689373297002724,
+ "grad_norm": 9.827530860900879,
+ "learning_rate": 1.2502777137744507e-05,
+ "loss": 0.2545,
+ "step": 16034
+ },
+ {
+ "epoch": 43.69209809264305,
+ "grad_norm": 5.594376564025879,
+ "learning_rate": 1.250192271956017e-05,
+ "loss": 0.1847,
+ "step": 16035
+ },
+ {
+ "epoch": 43.694822888283376,
+ "grad_norm": 5.1019392013549805,
+ "learning_rate": 1.250106828189094e-05,
+ "loss": 0.175,
+ "step": 16036
+ },
+ {
+ "epoch": 43.69754768392371,
+ "grad_norm": 5.329370021820068,
+ "learning_rate": 1.2500213824743472e-05,
+ "loss": 0.2035,
+ "step": 16037
+ },
+ {
+ "epoch": 43.700272479564035,
+ "grad_norm": 5.356943607330322,
+ "learning_rate": 1.2499359348124418e-05,
+ "loss": 0.1966,
+ "step": 16038
+ },
+ {
+ "epoch": 43.70299727520436,
+ "grad_norm": 5.181354999542236,
+ "learning_rate": 1.2498504852040433e-05,
+ "loss": 0.2862,
+ "step": 16039
+ },
+ {
+ "epoch": 43.705722070844686,
+ "grad_norm": 4.817810535430908,
+ "learning_rate": 1.2497650336498172e-05,
+ "loss": 0.1609,
+ "step": 16040
+ },
+ {
+ "epoch": 43.70844686648501,
+ "grad_norm": 6.273209095001221,
+ "learning_rate": 1.2496795801504291e-05,
+ "loss": 0.1707,
+ "step": 16041
+ },
+ {
+ "epoch": 43.71117166212534,
+ "grad_norm": 4.329726219177246,
+ "learning_rate": 1.2495941247065445e-05,
+ "loss": 0.1393,
+ "step": 16042
+ },
+ {
+ "epoch": 43.71389645776567,
+ "grad_norm": 6.111339092254639,
+ "learning_rate": 1.2495086673188293e-05,
+ "loss": 0.2964,
+ "step": 16043
+ },
+ {
+ "epoch": 43.716621253406,
+ "grad_norm": 4.5158491134643555,
+ "learning_rate": 1.249423207987948e-05,
+ "loss": 0.2061,
+ "step": 16044
+ },
+ {
+ "epoch": 43.71934604904632,
+ "grad_norm": 5.9191083908081055,
+ "learning_rate": 1.249337746714567e-05,
+ "loss": 0.2371,
+ "step": 16045
+ },
+ {
+ "epoch": 43.72207084468665,
+ "grad_norm": 4.54535436630249,
+ "learning_rate": 1.2492522834993519e-05,
+ "loss": 0.2207,
+ "step": 16046
+ },
+ {
+ "epoch": 43.724795640326974,
+ "grad_norm": 4.868076801300049,
+ "learning_rate": 1.2491668183429679e-05,
+ "loss": 0.1785,
+ "step": 16047
+ },
+ {
+ "epoch": 43.7275204359673,
+ "grad_norm": 4.8957977294921875,
+ "learning_rate": 1.2490813512460806e-05,
+ "loss": 0.1964,
+ "step": 16048
+ },
+ {
+ "epoch": 43.73024523160763,
+ "grad_norm": 5.272156715393066,
+ "learning_rate": 1.2489958822093557e-05,
+ "loss": 0.1245,
+ "step": 16049
+ },
+ {
+ "epoch": 43.73297002724796,
+ "grad_norm": 5.2726593017578125,
+ "learning_rate": 1.2489104112334588e-05,
+ "loss": 0.1562,
+ "step": 16050
+ },
+ {
+ "epoch": 43.735694822888284,
+ "grad_norm": 6.89739990234375,
+ "learning_rate": 1.248824938319056e-05,
+ "loss": 0.2311,
+ "step": 16051
+ },
+ {
+ "epoch": 43.73841961852861,
+ "grad_norm": 4.722046852111816,
+ "learning_rate": 1.2487394634668123e-05,
+ "loss": 0.1761,
+ "step": 16052
+ },
+ {
+ "epoch": 43.741144414168936,
+ "grad_norm": 5.488198280334473,
+ "learning_rate": 1.2486539866773941e-05,
+ "loss": 0.2041,
+ "step": 16053
+ },
+ {
+ "epoch": 43.74386920980926,
+ "grad_norm": 5.007774829864502,
+ "learning_rate": 1.2485685079514663e-05,
+ "loss": 0.1779,
+ "step": 16054
+ },
+ {
+ "epoch": 43.746594005449595,
+ "grad_norm": 11.114958763122559,
+ "learning_rate": 1.2484830272896951e-05,
+ "loss": 0.2186,
+ "step": 16055
+ },
+ {
+ "epoch": 43.74931880108992,
+ "grad_norm": 5.780182838439941,
+ "learning_rate": 1.2483975446927459e-05,
+ "loss": 0.2337,
+ "step": 16056
+ },
+ {
+ "epoch": 43.752043596730246,
+ "grad_norm": 6.6061859130859375,
+ "learning_rate": 1.2483120601612847e-05,
+ "loss": 0.2101,
+ "step": 16057
+ },
+ {
+ "epoch": 43.75476839237057,
+ "grad_norm": 6.823513031005859,
+ "learning_rate": 1.2482265736959769e-05,
+ "loss": 0.1509,
+ "step": 16058
+ },
+ {
+ "epoch": 43.7574931880109,
+ "grad_norm": 6.462015151977539,
+ "learning_rate": 1.248141085297489e-05,
+ "loss": 0.2858,
+ "step": 16059
+ },
+ {
+ "epoch": 43.76021798365122,
+ "grad_norm": 4.85947322845459,
+ "learning_rate": 1.2480555949664859e-05,
+ "loss": 0.1335,
+ "step": 16060
+ },
+ {
+ "epoch": 43.762942779291556,
+ "grad_norm": 4.83868932723999,
+ "learning_rate": 1.247970102703634e-05,
+ "loss": 0.2706,
+ "step": 16061
+ },
+ {
+ "epoch": 43.76566757493188,
+ "grad_norm": 6.2221503257751465,
+ "learning_rate": 1.247884608509599e-05,
+ "loss": 0.1767,
+ "step": 16062
+ },
+ {
+ "epoch": 43.76839237057221,
+ "grad_norm": 5.1493988037109375,
+ "learning_rate": 1.2477991123850468e-05,
+ "loss": 0.2175,
+ "step": 16063
+ },
+ {
+ "epoch": 43.771117166212534,
+ "grad_norm": 5.098999500274658,
+ "learning_rate": 1.2477136143306428e-05,
+ "loss": 0.1342,
+ "step": 16064
+ },
+ {
+ "epoch": 43.77384196185286,
+ "grad_norm": 5.399009704589844,
+ "learning_rate": 1.2476281143470535e-05,
+ "loss": 0.1434,
+ "step": 16065
+ },
+ {
+ "epoch": 43.776566757493185,
+ "grad_norm": 7.601125240325928,
+ "learning_rate": 1.2475426124349436e-05,
+ "loss": 0.205,
+ "step": 16066
+ },
+ {
+ "epoch": 43.77929155313352,
+ "grad_norm": 5.856564521789551,
+ "learning_rate": 1.2474571085949807e-05,
+ "loss": 0.2831,
+ "step": 16067
+ },
+ {
+ "epoch": 43.782016348773844,
+ "grad_norm": 5.1694135665893555,
+ "learning_rate": 1.2473716028278292e-05,
+ "loss": 0.5207,
+ "step": 16068
+ },
+ {
+ "epoch": 43.78474114441417,
+ "grad_norm": 4.714412689208984,
+ "learning_rate": 1.2472860951341561e-05,
+ "loss": 0.1497,
+ "step": 16069
+ },
+ {
+ "epoch": 43.787465940054496,
+ "grad_norm": 5.425742149353027,
+ "learning_rate": 1.2472005855146265e-05,
+ "loss": 0.2264,
+ "step": 16070
+ },
+ {
+ "epoch": 43.79019073569482,
+ "grad_norm": 5.301591396331787,
+ "learning_rate": 1.247115073969907e-05,
+ "loss": 0.1359,
+ "step": 16071
+ },
+ {
+ "epoch": 43.79291553133515,
+ "grad_norm": 5.562912940979004,
+ "learning_rate": 1.2470295605006628e-05,
+ "loss": 0.2102,
+ "step": 16072
+ },
+ {
+ "epoch": 43.79564032697548,
+ "grad_norm": 6.005643844604492,
+ "learning_rate": 1.246944045107561e-05,
+ "loss": 0.1778,
+ "step": 16073
+ },
+ {
+ "epoch": 43.798365122615806,
+ "grad_norm": 4.845348358154297,
+ "learning_rate": 1.2468585277912664e-05,
+ "loss": 0.1918,
+ "step": 16074
+ },
+ {
+ "epoch": 43.80108991825613,
+ "grad_norm": 5.073792457580566,
+ "learning_rate": 1.2467730085524454e-05,
+ "loss": 0.1407,
+ "step": 16075
+ },
+ {
+ "epoch": 43.80381471389646,
+ "grad_norm": 5.499170780181885,
+ "learning_rate": 1.2466874873917646e-05,
+ "loss": 0.158,
+ "step": 16076
+ },
+ {
+ "epoch": 43.80653950953678,
+ "grad_norm": 7.507500648498535,
+ "learning_rate": 1.2466019643098895e-05,
+ "loss": 0.1994,
+ "step": 16077
+ },
+ {
+ "epoch": 43.80926430517711,
+ "grad_norm": 4.464300155639648,
+ "learning_rate": 1.2465164393074859e-05,
+ "loss": 0.2694,
+ "step": 16078
+ },
+ {
+ "epoch": 43.81198910081744,
+ "grad_norm": 5.403188228607178,
+ "learning_rate": 1.2464309123852205e-05,
+ "loss": 0.1728,
+ "step": 16079
+ },
+ {
+ "epoch": 43.81471389645777,
+ "grad_norm": 7.665669918060303,
+ "learning_rate": 1.246345383543759e-05,
+ "loss": 0.2252,
+ "step": 16080
+ },
+ {
+ "epoch": 43.817438692098094,
+ "grad_norm": 5.672266960144043,
+ "learning_rate": 1.2462598527837678e-05,
+ "loss": 0.2267,
+ "step": 16081
+ },
+ {
+ "epoch": 43.82016348773842,
+ "grad_norm": 5.895010948181152,
+ "learning_rate": 1.2461743201059124e-05,
+ "loss": 0.2448,
+ "step": 16082
+ },
+ {
+ "epoch": 43.822888283378745,
+ "grad_norm": 7.843247890472412,
+ "learning_rate": 1.2460887855108597e-05,
+ "loss": 0.2243,
+ "step": 16083
+ },
+ {
+ "epoch": 43.82561307901907,
+ "grad_norm": 5.759918212890625,
+ "learning_rate": 1.2460032489992751e-05,
+ "loss": 0.1763,
+ "step": 16084
+ },
+ {
+ "epoch": 43.828337874659404,
+ "grad_norm": 5.617268085479736,
+ "learning_rate": 1.2459177105718251e-05,
+ "loss": 0.1667,
+ "step": 16085
+ },
+ {
+ "epoch": 43.83106267029973,
+ "grad_norm": 4.631982803344727,
+ "learning_rate": 1.2458321702291762e-05,
+ "loss": 0.1943,
+ "step": 16086
+ },
+ {
+ "epoch": 43.833787465940055,
+ "grad_norm": 4.916030406951904,
+ "learning_rate": 1.2457466279719943e-05,
+ "loss": 0.1129,
+ "step": 16087
+ },
+ {
+ "epoch": 43.83651226158038,
+ "grad_norm": 6.239870548248291,
+ "learning_rate": 1.2456610838009454e-05,
+ "loss": 0.2857,
+ "step": 16088
+ },
+ {
+ "epoch": 43.83923705722071,
+ "grad_norm": 6.174760818481445,
+ "learning_rate": 1.2455755377166958e-05,
+ "loss": 0.1576,
+ "step": 16089
+ },
+ {
+ "epoch": 43.84196185286103,
+ "grad_norm": 6.801732063293457,
+ "learning_rate": 1.245489989719912e-05,
+ "loss": 0.1155,
+ "step": 16090
+ },
+ {
+ "epoch": 43.844686648501366,
+ "grad_norm": 5.358292102813721,
+ "learning_rate": 1.2454044398112602e-05,
+ "loss": 0.2784,
+ "step": 16091
+ },
+ {
+ "epoch": 43.84741144414169,
+ "grad_norm": 6.265818119049072,
+ "learning_rate": 1.245318887991406e-05,
+ "loss": 0.1893,
+ "step": 16092
+ },
+ {
+ "epoch": 43.85013623978202,
+ "grad_norm": 4.627772331237793,
+ "learning_rate": 1.2452333342610166e-05,
+ "loss": 0.1819,
+ "step": 16093
+ },
+ {
+ "epoch": 43.85286103542234,
+ "grad_norm": 5.668519496917725,
+ "learning_rate": 1.2451477786207575e-05,
+ "loss": 0.2036,
+ "step": 16094
+ },
+ {
+ "epoch": 43.85558583106267,
+ "grad_norm": 9.2498197555542,
+ "learning_rate": 1.245062221071296e-05,
+ "loss": 0.253,
+ "step": 16095
+ },
+ {
+ "epoch": 43.858310626702995,
+ "grad_norm": 4.812533855438232,
+ "learning_rate": 1.2449766616132973e-05,
+ "loss": 0.2204,
+ "step": 16096
+ },
+ {
+ "epoch": 43.86103542234333,
+ "grad_norm": 5.658326625823975,
+ "learning_rate": 1.2448911002474287e-05,
+ "loss": 0.1572,
+ "step": 16097
+ },
+ {
+ "epoch": 43.86376021798365,
+ "grad_norm": 6.318443298339844,
+ "learning_rate": 1.2448055369743557e-05,
+ "loss": 0.1373,
+ "step": 16098
+ },
+ {
+ "epoch": 43.86648501362398,
+ "grad_norm": 4.787212371826172,
+ "learning_rate": 1.2447199717947451e-05,
+ "loss": 0.1609,
+ "step": 16099
+ },
+ {
+ "epoch": 43.869209809264305,
+ "grad_norm": 5.018313407897949,
+ "learning_rate": 1.2446344047092633e-05,
+ "loss": 0.3412,
+ "step": 16100
+ },
+ {
+ "epoch": 43.87193460490463,
+ "grad_norm": 5.533585071563721,
+ "learning_rate": 1.2445488357185766e-05,
+ "loss": 0.1091,
+ "step": 16101
+ },
+ {
+ "epoch": 43.87465940054496,
+ "grad_norm": 10.251208305358887,
+ "learning_rate": 1.2444632648233517e-05,
+ "loss": 0.2603,
+ "step": 16102
+ },
+ {
+ "epoch": 43.87738419618529,
+ "grad_norm": 6.50205135345459,
+ "learning_rate": 1.2443776920242542e-05,
+ "loss": 0.3353,
+ "step": 16103
+ },
+ {
+ "epoch": 43.880108991825615,
+ "grad_norm": 5.021983623504639,
+ "learning_rate": 1.2442921173219515e-05,
+ "loss": 0.199,
+ "step": 16104
+ },
+ {
+ "epoch": 43.88283378746594,
+ "grad_norm": 7.136135101318359,
+ "learning_rate": 1.2442065407171098e-05,
+ "loss": 0.1986,
+ "step": 16105
+ },
+ {
+ "epoch": 43.88555858310627,
+ "grad_norm": 5.772706985473633,
+ "learning_rate": 1.2441209622103951e-05,
+ "loss": 0.1638,
+ "step": 16106
+ },
+ {
+ "epoch": 43.88828337874659,
+ "grad_norm": 7.06938362121582,
+ "learning_rate": 1.2440353818024744e-05,
+ "loss": 0.2592,
+ "step": 16107
+ },
+ {
+ "epoch": 43.89100817438692,
+ "grad_norm": 5.062612056732178,
+ "learning_rate": 1.243949799494014e-05,
+ "loss": 0.2136,
+ "step": 16108
+ },
+ {
+ "epoch": 43.89373297002725,
+ "grad_norm": 6.993363380432129,
+ "learning_rate": 1.2438642152856802e-05,
+ "loss": 0.2269,
+ "step": 16109
+ },
+ {
+ "epoch": 43.89645776566758,
+ "grad_norm": 7.7213311195373535,
+ "learning_rate": 1.24377862917814e-05,
+ "loss": 0.2116,
+ "step": 16110
+ },
+ {
+ "epoch": 43.8991825613079,
+ "grad_norm": 4.676961898803711,
+ "learning_rate": 1.2436930411720594e-05,
+ "loss": 0.1582,
+ "step": 16111
+ },
+ {
+ "epoch": 43.90190735694823,
+ "grad_norm": 3.7129993438720703,
+ "learning_rate": 1.2436074512681055e-05,
+ "loss": 0.1428,
+ "step": 16112
+ },
+ {
+ "epoch": 43.904632152588555,
+ "grad_norm": 5.535231590270996,
+ "learning_rate": 1.2435218594669445e-05,
+ "loss": 0.1777,
+ "step": 16113
+ },
+ {
+ "epoch": 43.90735694822888,
+ "grad_norm": 5.202457427978516,
+ "learning_rate": 1.2434362657692432e-05,
+ "loss": 0.2078,
+ "step": 16114
+ },
+ {
+ "epoch": 43.91008174386921,
+ "grad_norm": 5.230146884918213,
+ "learning_rate": 1.2433506701756678e-05,
+ "loss": 0.2223,
+ "step": 16115
+ },
+ {
+ "epoch": 43.91280653950954,
+ "grad_norm": 6.026159286499023,
+ "learning_rate": 1.2432650726868854e-05,
+ "loss": 0.3477,
+ "step": 16116
+ },
+ {
+ "epoch": 43.915531335149865,
+ "grad_norm": 6.212592601776123,
+ "learning_rate": 1.2431794733035625e-05,
+ "loss": 0.1644,
+ "step": 16117
+ },
+ {
+ "epoch": 43.91825613079019,
+ "grad_norm": 8.96209716796875,
+ "learning_rate": 1.2430938720263657e-05,
+ "loss": 0.2091,
+ "step": 16118
+ },
+ {
+ "epoch": 43.920980926430516,
+ "grad_norm": 5.667464733123779,
+ "learning_rate": 1.2430082688559616e-05,
+ "loss": 0.2952,
+ "step": 16119
+ },
+ {
+ "epoch": 43.92370572207084,
+ "grad_norm": 5.065408229827881,
+ "learning_rate": 1.242922663793017e-05,
+ "loss": 0.245,
+ "step": 16120
+ },
+ {
+ "epoch": 43.926430517711175,
+ "grad_norm": 6.7920427322387695,
+ "learning_rate": 1.2428370568381982e-05,
+ "loss": 0.2838,
+ "step": 16121
+ },
+ {
+ "epoch": 43.9291553133515,
+ "grad_norm": 5.5842180252075195,
+ "learning_rate": 1.2427514479921725e-05,
+ "loss": 0.1599,
+ "step": 16122
+ },
+ {
+ "epoch": 43.93188010899183,
+ "grad_norm": 6.502938270568848,
+ "learning_rate": 1.2426658372556062e-05,
+ "loss": 0.163,
+ "step": 16123
+ },
+ {
+ "epoch": 43.93460490463215,
+ "grad_norm": 8.820902824401855,
+ "learning_rate": 1.2425802246291664e-05,
+ "loss": 0.2465,
+ "step": 16124
+ },
+ {
+ "epoch": 43.93732970027248,
+ "grad_norm": 5.5153889656066895,
+ "learning_rate": 1.2424946101135193e-05,
+ "loss": 0.1917,
+ "step": 16125
+ },
+ {
+ "epoch": 43.940054495912804,
+ "grad_norm": 7.109150409698486,
+ "learning_rate": 1.2424089937093324e-05,
+ "loss": 0.2391,
+ "step": 16126
+ },
+ {
+ "epoch": 43.94277929155314,
+ "grad_norm": 7.857607841491699,
+ "learning_rate": 1.2423233754172714e-05,
+ "loss": 0.1871,
+ "step": 16127
+ },
+ {
+ "epoch": 43.94550408719346,
+ "grad_norm": 116.6109848022461,
+ "learning_rate": 1.2422377552380045e-05,
+ "loss": 0.2427,
+ "step": 16128
+ },
+ {
+ "epoch": 43.94822888283379,
+ "grad_norm": 6.429569244384766,
+ "learning_rate": 1.2421521331721974e-05,
+ "loss": 0.2248,
+ "step": 16129
+ },
+ {
+ "epoch": 43.950953678474114,
+ "grad_norm": 5.0744781494140625,
+ "learning_rate": 1.2420665092205173e-05,
+ "loss": 0.3101,
+ "step": 16130
+ },
+ {
+ "epoch": 43.95367847411444,
+ "grad_norm": 10.218924522399902,
+ "learning_rate": 1.2419808833836309e-05,
+ "loss": 0.221,
+ "step": 16131
+ },
+ {
+ "epoch": 43.956403269754766,
+ "grad_norm": 9.258928298950195,
+ "learning_rate": 1.2418952556622055e-05,
+ "loss": 0.3065,
+ "step": 16132
+ },
+ {
+ "epoch": 43.95912806539509,
+ "grad_norm": 6.090509414672852,
+ "learning_rate": 1.2418096260569072e-05,
+ "loss": 0.156,
+ "step": 16133
+ },
+ {
+ "epoch": 43.961852861035425,
+ "grad_norm": 6.892738342285156,
+ "learning_rate": 1.2417239945684036e-05,
+ "loss": 0.3133,
+ "step": 16134
+ },
+ {
+ "epoch": 43.96457765667575,
+ "grad_norm": 8.078993797302246,
+ "learning_rate": 1.241638361197361e-05,
+ "loss": 0.3408,
+ "step": 16135
+ },
+ {
+ "epoch": 43.967302452316076,
+ "grad_norm": 14.61220645904541,
+ "learning_rate": 1.2415527259444471e-05,
+ "loss": 0.2736,
+ "step": 16136
+ },
+ {
+ "epoch": 43.9700272479564,
+ "grad_norm": 11.88048267364502,
+ "learning_rate": 1.2414670888103279e-05,
+ "loss": 0.4071,
+ "step": 16137
+ },
+ {
+ "epoch": 43.97275204359673,
+ "grad_norm": 9.614017486572266,
+ "learning_rate": 1.241381449795671e-05,
+ "loss": 0.2885,
+ "step": 16138
+ },
+ {
+ "epoch": 43.97547683923706,
+ "grad_norm": 7.922733306884766,
+ "learning_rate": 1.2412958089011433e-05,
+ "loss": 0.2641,
+ "step": 16139
+ },
+ {
+ "epoch": 43.97820163487739,
+ "grad_norm": 13.481842994689941,
+ "learning_rate": 1.2412101661274114e-05,
+ "loss": 0.3297,
+ "step": 16140
+ },
+ {
+ "epoch": 43.98092643051771,
+ "grad_norm": 9.547430038452148,
+ "learning_rate": 1.2411245214751426e-05,
+ "loss": 0.2846,
+ "step": 16141
+ },
+ {
+ "epoch": 43.98365122615804,
+ "grad_norm": 11.379546165466309,
+ "learning_rate": 1.2410388749450038e-05,
+ "loss": 0.3534,
+ "step": 16142
+ },
+ {
+ "epoch": 43.986376021798364,
+ "grad_norm": 31.17267417907715,
+ "learning_rate": 1.2409532265376618e-05,
+ "loss": 0.3415,
+ "step": 16143
+ },
+ {
+ "epoch": 43.98910081743869,
+ "grad_norm": 10.252547264099121,
+ "learning_rate": 1.2408675762537838e-05,
+ "loss": 0.2567,
+ "step": 16144
+ },
+ {
+ "epoch": 43.991825613079016,
+ "grad_norm": 9.675552368164062,
+ "learning_rate": 1.240781924094037e-05,
+ "loss": 0.3126,
+ "step": 16145
+ },
+ {
+ "epoch": 43.99455040871935,
+ "grad_norm": 15.750492095947266,
+ "learning_rate": 1.2406962700590884e-05,
+ "loss": 0.3246,
+ "step": 16146
+ },
+ {
+ "epoch": 43.997275204359674,
+ "grad_norm": 7.915947437286377,
+ "learning_rate": 1.2406106141496049e-05,
+ "loss": 0.1831,
+ "step": 16147
+ },
+ {
+ "epoch": 44.0,
+ "grad_norm": 7.796821117401123,
+ "learning_rate": 1.2405249563662539e-05,
+ "loss": 0.2965,
+ "step": 16148
+ },
+ {
+ "epoch": 44.002724795640326,
+ "grad_norm": 8.101951599121094,
+ "learning_rate": 1.2404392967097019e-05,
+ "loss": 0.2635,
+ "step": 16149
+ },
+ {
+ "epoch": 44.00544959128065,
+ "grad_norm": 8.145999908447266,
+ "learning_rate": 1.2403536351806167e-05,
+ "loss": 0.2394,
+ "step": 16150
+ },
+ {
+ "epoch": 44.00817438692098,
+ "grad_norm": 8.64932632446289,
+ "learning_rate": 1.2402679717796651e-05,
+ "loss": 0.3574,
+ "step": 16151
+ },
+ {
+ "epoch": 44.01089918256131,
+ "grad_norm": 6.614543437957764,
+ "learning_rate": 1.240182306507514e-05,
+ "loss": 0.361,
+ "step": 16152
+ },
+ {
+ "epoch": 44.013623978201636,
+ "grad_norm": 7.630898952484131,
+ "learning_rate": 1.2400966393648309e-05,
+ "loss": 0.3195,
+ "step": 16153
+ },
+ {
+ "epoch": 44.01634877384196,
+ "grad_norm": 7.651569366455078,
+ "learning_rate": 1.2400109703522831e-05,
+ "loss": 0.2422,
+ "step": 16154
+ },
+ {
+ "epoch": 44.01907356948229,
+ "grad_norm": 5.433675765991211,
+ "learning_rate": 1.2399252994705373e-05,
+ "loss": 0.209,
+ "step": 16155
+ },
+ {
+ "epoch": 44.02179836512261,
+ "grad_norm": 5.823220252990723,
+ "learning_rate": 1.2398396267202615e-05,
+ "loss": 0.1415,
+ "step": 16156
+ },
+ {
+ "epoch": 44.02452316076294,
+ "grad_norm": 7.748629093170166,
+ "learning_rate": 1.239753952102122e-05,
+ "loss": 0.2618,
+ "step": 16157
+ },
+ {
+ "epoch": 44.02724795640327,
+ "grad_norm": 5.98864221572876,
+ "learning_rate": 1.2396682756167866e-05,
+ "loss": 0.3019,
+ "step": 16158
+ },
+ {
+ "epoch": 44.0299727520436,
+ "grad_norm": 5.825252056121826,
+ "learning_rate": 1.2395825972649222e-05,
+ "loss": 0.1885,
+ "step": 16159
+ },
+ {
+ "epoch": 44.032697547683924,
+ "grad_norm": 7.396633148193359,
+ "learning_rate": 1.2394969170471965e-05,
+ "loss": 0.3402,
+ "step": 16160
+ },
+ {
+ "epoch": 44.03542234332425,
+ "grad_norm": 5.753902912139893,
+ "learning_rate": 1.2394112349642761e-05,
+ "loss": 0.1355,
+ "step": 16161
+ },
+ {
+ "epoch": 44.038147138964575,
+ "grad_norm": 5.8221845626831055,
+ "learning_rate": 1.2393255510168292e-05,
+ "loss": 0.2352,
+ "step": 16162
+ },
+ {
+ "epoch": 44.0408719346049,
+ "grad_norm": 7.52283239364624,
+ "learning_rate": 1.2392398652055222e-05,
+ "loss": 0.2686,
+ "step": 16163
+ },
+ {
+ "epoch": 44.043596730245234,
+ "grad_norm": 6.4456467628479,
+ "learning_rate": 1.2391541775310231e-05,
+ "loss": 0.3121,
+ "step": 16164
+ },
+ {
+ "epoch": 44.04632152588556,
+ "grad_norm": 6.80079984664917,
+ "learning_rate": 1.2390684879939989e-05,
+ "loss": 0.4465,
+ "step": 16165
+ },
+ {
+ "epoch": 44.049046321525886,
+ "grad_norm": 5.70070219039917,
+ "learning_rate": 1.238982796595117e-05,
+ "loss": 0.3208,
+ "step": 16166
+ },
+ {
+ "epoch": 44.05177111716621,
+ "grad_norm": 5.9923505783081055,
+ "learning_rate": 1.2388971033350447e-05,
+ "loss": 0.1696,
+ "step": 16167
+ },
+ {
+ "epoch": 44.05449591280654,
+ "grad_norm": 6.572014331817627,
+ "learning_rate": 1.2388114082144495e-05,
+ "loss": 0.2166,
+ "step": 16168
+ },
+ {
+ "epoch": 44.05722070844686,
+ "grad_norm": 6.781308174133301,
+ "learning_rate": 1.2387257112339987e-05,
+ "loss": 0.271,
+ "step": 16169
+ },
+ {
+ "epoch": 44.059945504087196,
+ "grad_norm": 5.984559059143066,
+ "learning_rate": 1.2386400123943597e-05,
+ "loss": 0.3424,
+ "step": 16170
+ },
+ {
+ "epoch": 44.06267029972752,
+ "grad_norm": 6.572991847991943,
+ "learning_rate": 1.2385543116962002e-05,
+ "loss": 0.157,
+ "step": 16171
+ },
+ {
+ "epoch": 44.06539509536785,
+ "grad_norm": 5.872347831726074,
+ "learning_rate": 1.2384686091401874e-05,
+ "loss": 0.1674,
+ "step": 16172
+ },
+ {
+ "epoch": 44.06811989100817,
+ "grad_norm": 5.073558807373047,
+ "learning_rate": 1.2383829047269884e-05,
+ "loss": 0.2827,
+ "step": 16173
+ },
+ {
+ "epoch": 44.0708446866485,
+ "grad_norm": 5.1867170333862305,
+ "learning_rate": 1.2382971984572714e-05,
+ "loss": 0.3451,
+ "step": 16174
+ },
+ {
+ "epoch": 44.073569482288825,
+ "grad_norm": 5.426074028015137,
+ "learning_rate": 1.2382114903317033e-05,
+ "loss": 0.1745,
+ "step": 16175
+ },
+ {
+ "epoch": 44.07629427792916,
+ "grad_norm": 6.267030239105225,
+ "learning_rate": 1.2381257803509518e-05,
+ "loss": 0.3035,
+ "step": 16176
+ },
+ {
+ "epoch": 44.079019073569484,
+ "grad_norm": 8.500021934509277,
+ "learning_rate": 1.2380400685156844e-05,
+ "loss": 0.2106,
+ "step": 16177
+ },
+ {
+ "epoch": 44.08174386920981,
+ "grad_norm": 6.597235679626465,
+ "learning_rate": 1.2379543548265685e-05,
+ "loss": 0.2307,
+ "step": 16178
+ },
+ {
+ "epoch": 44.084468664850135,
+ "grad_norm": 6.0201096534729,
+ "learning_rate": 1.2378686392842718e-05,
+ "loss": 0.2329,
+ "step": 16179
+ },
+ {
+ "epoch": 44.08719346049046,
+ "grad_norm": 5.377299785614014,
+ "learning_rate": 1.2377829218894618e-05,
+ "loss": 0.1459,
+ "step": 16180
+ },
+ {
+ "epoch": 44.08991825613079,
+ "grad_norm": 5.008917331695557,
+ "learning_rate": 1.237697202642806e-05,
+ "loss": 0.2108,
+ "step": 16181
+ },
+ {
+ "epoch": 44.09264305177112,
+ "grad_norm": 6.565011978149414,
+ "learning_rate": 1.2376114815449723e-05,
+ "loss": 0.2874,
+ "step": 16182
+ },
+ {
+ "epoch": 44.095367847411445,
+ "grad_norm": 6.714814186096191,
+ "learning_rate": 1.2375257585966275e-05,
+ "loss": 0.2558,
+ "step": 16183
+ },
+ {
+ "epoch": 44.09809264305177,
+ "grad_norm": 5.044266223907471,
+ "learning_rate": 1.2374400337984404e-05,
+ "loss": 0.3174,
+ "step": 16184
+ },
+ {
+ "epoch": 44.1008174386921,
+ "grad_norm": 7.665246963500977,
+ "learning_rate": 1.2373543071510774e-05,
+ "loss": 0.1517,
+ "step": 16185
+ },
+ {
+ "epoch": 44.10354223433242,
+ "grad_norm": 7.603165149688721,
+ "learning_rate": 1.2372685786552072e-05,
+ "loss": 0.1894,
+ "step": 16186
+ },
+ {
+ "epoch": 44.10626702997275,
+ "grad_norm": 9.16969108581543,
+ "learning_rate": 1.2371828483114964e-05,
+ "loss": 0.1768,
+ "step": 16187
+ },
+ {
+ "epoch": 44.10899182561308,
+ "grad_norm": 6.315141677856445,
+ "learning_rate": 1.2370971161206136e-05,
+ "loss": 0.4095,
+ "step": 16188
+ },
+ {
+ "epoch": 44.11171662125341,
+ "grad_norm": 6.79281759262085,
+ "learning_rate": 1.237011382083226e-05,
+ "loss": 0.1776,
+ "step": 16189
+ },
+ {
+ "epoch": 44.11444141689373,
+ "grad_norm": 5.980787754058838,
+ "learning_rate": 1.2369256462000015e-05,
+ "loss": 0.1793,
+ "step": 16190
+ },
+ {
+ "epoch": 44.11716621253406,
+ "grad_norm": 4.813692569732666,
+ "learning_rate": 1.2368399084716072e-05,
+ "loss": 0.2648,
+ "step": 16191
+ },
+ {
+ "epoch": 44.119891008174385,
+ "grad_norm": 6.074870586395264,
+ "learning_rate": 1.236754168898712e-05,
+ "loss": 0.1811,
+ "step": 16192
+ },
+ {
+ "epoch": 44.12261580381471,
+ "grad_norm": 6.126917839050293,
+ "learning_rate": 1.2366684274819825e-05,
+ "loss": 0.1966,
+ "step": 16193
+ },
+ {
+ "epoch": 44.12534059945504,
+ "grad_norm": 5.153909206390381,
+ "learning_rate": 1.2365826842220872e-05,
+ "loss": 0.1499,
+ "step": 16194
+ },
+ {
+ "epoch": 44.12806539509537,
+ "grad_norm": 5.3130269050598145,
+ "learning_rate": 1.2364969391196933e-05,
+ "loss": 0.1913,
+ "step": 16195
+ },
+ {
+ "epoch": 44.130790190735695,
+ "grad_norm": 6.73169469833374,
+ "learning_rate": 1.2364111921754686e-05,
+ "loss": 0.1729,
+ "step": 16196
+ },
+ {
+ "epoch": 44.13351498637602,
+ "grad_norm": 4.773559093475342,
+ "learning_rate": 1.2363254433900818e-05,
+ "loss": 0.1593,
+ "step": 16197
+ },
+ {
+ "epoch": 44.13623978201635,
+ "grad_norm": 6.7105937004089355,
+ "learning_rate": 1.2362396927641996e-05,
+ "loss": 0.1693,
+ "step": 16198
+ },
+ {
+ "epoch": 44.13896457765667,
+ "grad_norm": 5.667901039123535,
+ "learning_rate": 1.2361539402984905e-05,
+ "loss": 0.2905,
+ "step": 16199
+ },
+ {
+ "epoch": 44.141689373297005,
+ "grad_norm": 5.803109645843506,
+ "learning_rate": 1.2360681859936222e-05,
+ "loss": 0.1897,
+ "step": 16200
+ },
+ {
+ "epoch": 44.14441416893733,
+ "grad_norm": 5.439942836761475,
+ "learning_rate": 1.2359824298502622e-05,
+ "loss": 0.1578,
+ "step": 16201
+ },
+ {
+ "epoch": 44.14713896457766,
+ "grad_norm": 6.289660930633545,
+ "learning_rate": 1.2358966718690786e-05,
+ "loss": 0.2778,
+ "step": 16202
+ },
+ {
+ "epoch": 44.14986376021798,
+ "grad_norm": 4.494592666625977,
+ "learning_rate": 1.2358109120507393e-05,
+ "loss": 0.1301,
+ "step": 16203
+ },
+ {
+ "epoch": 44.15258855585831,
+ "grad_norm": 9.831260681152344,
+ "learning_rate": 1.2357251503959125e-05,
+ "loss": 0.1682,
+ "step": 16204
+ },
+ {
+ "epoch": 44.155313351498634,
+ "grad_norm": 4.6189751625061035,
+ "learning_rate": 1.2356393869052656e-05,
+ "loss": 0.2497,
+ "step": 16205
+ },
+ {
+ "epoch": 44.15803814713897,
+ "grad_norm": 6.3724212646484375,
+ "learning_rate": 1.2355536215794668e-05,
+ "loss": 0.247,
+ "step": 16206
+ },
+ {
+ "epoch": 44.16076294277929,
+ "grad_norm": 6.15195369720459,
+ "learning_rate": 1.235467854419184e-05,
+ "loss": 0.2225,
+ "step": 16207
+ },
+ {
+ "epoch": 44.16348773841962,
+ "grad_norm": 6.59060525894165,
+ "learning_rate": 1.235382085425085e-05,
+ "loss": 0.1894,
+ "step": 16208
+ },
+ {
+ "epoch": 44.166212534059945,
+ "grad_norm": 7.037757396697998,
+ "learning_rate": 1.2352963145978382e-05,
+ "loss": 0.2516,
+ "step": 16209
+ },
+ {
+ "epoch": 44.16893732970027,
+ "grad_norm": 5.91162109375,
+ "learning_rate": 1.235210541938111e-05,
+ "loss": 0.1681,
+ "step": 16210
+ },
+ {
+ "epoch": 44.171662125340596,
+ "grad_norm": 4.856721878051758,
+ "learning_rate": 1.2351247674465719e-05,
+ "loss": 0.2594,
+ "step": 16211
+ },
+ {
+ "epoch": 44.17438692098093,
+ "grad_norm": 6.868969440460205,
+ "learning_rate": 1.2350389911238884e-05,
+ "loss": 0.2111,
+ "step": 16212
+ },
+ {
+ "epoch": 44.177111716621255,
+ "grad_norm": 5.090456962585449,
+ "learning_rate": 1.2349532129707289e-05,
+ "loss": 0.223,
+ "step": 16213
+ },
+ {
+ "epoch": 44.17983651226158,
+ "grad_norm": 5.5267653465271,
+ "learning_rate": 1.2348674329877613e-05,
+ "loss": 0.1978,
+ "step": 16214
+ },
+ {
+ "epoch": 44.182561307901906,
+ "grad_norm": 5.36014986038208,
+ "learning_rate": 1.2347816511756539e-05,
+ "loss": 0.1841,
+ "step": 16215
+ },
+ {
+ "epoch": 44.18528610354223,
+ "grad_norm": 8.039497375488281,
+ "learning_rate": 1.2346958675350742e-05,
+ "loss": 0.2234,
+ "step": 16216
+ },
+ {
+ "epoch": 44.18801089918256,
+ "grad_norm": 5.579095363616943,
+ "learning_rate": 1.234610082066691e-05,
+ "loss": 0.2629,
+ "step": 16217
+ },
+ {
+ "epoch": 44.19073569482289,
+ "grad_norm": 7.914852142333984,
+ "learning_rate": 1.234524294771172e-05,
+ "loss": 0.1971,
+ "step": 16218
+ },
+ {
+ "epoch": 44.19346049046322,
+ "grad_norm": 7.122565746307373,
+ "learning_rate": 1.2344385056491852e-05,
+ "loss": 0.2775,
+ "step": 16219
+ },
+ {
+ "epoch": 44.19618528610354,
+ "grad_norm": 6.786997318267822,
+ "learning_rate": 1.2343527147013988e-05,
+ "loss": 0.2078,
+ "step": 16220
+ },
+ {
+ "epoch": 44.19891008174387,
+ "grad_norm": 5.375175952911377,
+ "learning_rate": 1.234266921928481e-05,
+ "loss": 0.1441,
+ "step": 16221
+ },
+ {
+ "epoch": 44.201634877384194,
+ "grad_norm": 5.61326265335083,
+ "learning_rate": 1.2341811273310999e-05,
+ "loss": 0.2092,
+ "step": 16222
+ },
+ {
+ "epoch": 44.20435967302452,
+ "grad_norm": 6.873278617858887,
+ "learning_rate": 1.234095330909924e-05,
+ "loss": 0.4392,
+ "step": 16223
+ },
+ {
+ "epoch": 44.20708446866485,
+ "grad_norm": 4.88468599319458,
+ "learning_rate": 1.234009532665621e-05,
+ "loss": 0.1497,
+ "step": 16224
+ },
+ {
+ "epoch": 44.20980926430518,
+ "grad_norm": 5.8181352615356445,
+ "learning_rate": 1.2339237325988595e-05,
+ "loss": 0.218,
+ "step": 16225
+ },
+ {
+ "epoch": 44.212534059945504,
+ "grad_norm": 6.216662406921387,
+ "learning_rate": 1.2338379307103072e-05,
+ "loss": 0.1904,
+ "step": 16226
+ },
+ {
+ "epoch": 44.21525885558583,
+ "grad_norm": 4.694410800933838,
+ "learning_rate": 1.233752127000633e-05,
+ "loss": 0.1707,
+ "step": 16227
+ },
+ {
+ "epoch": 44.217983651226156,
+ "grad_norm": 4.57954740524292,
+ "learning_rate": 1.2336663214705045e-05,
+ "loss": 0.1731,
+ "step": 16228
+ },
+ {
+ "epoch": 44.22070844686648,
+ "grad_norm": 9.905463218688965,
+ "learning_rate": 1.2335805141205901e-05,
+ "loss": 0.1608,
+ "step": 16229
+ },
+ {
+ "epoch": 44.223433242506815,
+ "grad_norm": 6.8656005859375,
+ "learning_rate": 1.2334947049515582e-05,
+ "loss": 0.4211,
+ "step": 16230
+ },
+ {
+ "epoch": 44.22615803814714,
+ "grad_norm": 5.616997718811035,
+ "learning_rate": 1.2334088939640772e-05,
+ "loss": 0.1646,
+ "step": 16231
+ },
+ {
+ "epoch": 44.228882833787466,
+ "grad_norm": 8.053744316101074,
+ "learning_rate": 1.233323081158815e-05,
+ "loss": 0.2007,
+ "step": 16232
+ },
+ {
+ "epoch": 44.23160762942779,
+ "grad_norm": 6.566122531890869,
+ "learning_rate": 1.2332372665364406e-05,
+ "loss": 0.263,
+ "step": 16233
+ },
+ {
+ "epoch": 44.23433242506812,
+ "grad_norm": 5.1463165283203125,
+ "learning_rate": 1.2331514500976216e-05,
+ "loss": 0.2473,
+ "step": 16234
+ },
+ {
+ "epoch": 44.237057220708444,
+ "grad_norm": 5.497501850128174,
+ "learning_rate": 1.2330656318430268e-05,
+ "loss": 0.1558,
+ "step": 16235
+ },
+ {
+ "epoch": 44.23978201634878,
+ "grad_norm": 4.741311073303223,
+ "learning_rate": 1.232979811773324e-05,
+ "loss": 0.1728,
+ "step": 16236
+ },
+ {
+ "epoch": 44.2425068119891,
+ "grad_norm": 6.691548824310303,
+ "learning_rate": 1.2328939898891823e-05,
+ "loss": 0.2718,
+ "step": 16237
+ },
+ {
+ "epoch": 44.24523160762943,
+ "grad_norm": 5.722686767578125,
+ "learning_rate": 1.2328081661912692e-05,
+ "loss": 0.3028,
+ "step": 16238
+ },
+ {
+ "epoch": 44.247956403269754,
+ "grad_norm": 6.705719947814941,
+ "learning_rate": 1.2327223406802542e-05,
+ "loss": 0.3498,
+ "step": 16239
+ },
+ {
+ "epoch": 44.25068119891008,
+ "grad_norm": 9.26452922821045,
+ "learning_rate": 1.2326365133568046e-05,
+ "loss": 0.1984,
+ "step": 16240
+ },
+ {
+ "epoch": 44.253405994550405,
+ "grad_norm": 8.045634269714355,
+ "learning_rate": 1.2325506842215897e-05,
+ "loss": 0.3474,
+ "step": 16241
+ },
+ {
+ "epoch": 44.25613079019074,
+ "grad_norm": 4.803380966186523,
+ "learning_rate": 1.2324648532752775e-05,
+ "loss": 0.1735,
+ "step": 16242
+ },
+ {
+ "epoch": 44.258855585831064,
+ "grad_norm": 4.696771621704102,
+ "learning_rate": 1.2323790205185364e-05,
+ "loss": 0.2244,
+ "step": 16243
+ },
+ {
+ "epoch": 44.26158038147139,
+ "grad_norm": 5.288698673248291,
+ "learning_rate": 1.2322931859520349e-05,
+ "loss": 0.1474,
+ "step": 16244
+ },
+ {
+ "epoch": 44.264305177111716,
+ "grad_norm": 6.997115612030029,
+ "learning_rate": 1.2322073495764418e-05,
+ "loss": 0.2016,
+ "step": 16245
+ },
+ {
+ "epoch": 44.26702997275204,
+ "grad_norm": 8.896620750427246,
+ "learning_rate": 1.232121511392425e-05,
+ "loss": 0.1961,
+ "step": 16246
+ },
+ {
+ "epoch": 44.26975476839237,
+ "grad_norm": 5.633690357208252,
+ "learning_rate": 1.2320356714006534e-05,
+ "loss": 0.2289,
+ "step": 16247
+ },
+ {
+ "epoch": 44.2724795640327,
+ "grad_norm": 5.711029052734375,
+ "learning_rate": 1.2319498296017955e-05,
+ "loss": 0.1247,
+ "step": 16248
+ },
+ {
+ "epoch": 44.275204359673026,
+ "grad_norm": 4.915972709655762,
+ "learning_rate": 1.2318639859965198e-05,
+ "loss": 0.1993,
+ "step": 16249
+ },
+ {
+ "epoch": 44.27792915531335,
+ "grad_norm": 5.64224910736084,
+ "learning_rate": 1.231778140585495e-05,
+ "loss": 0.1367,
+ "step": 16250
+ },
+ {
+ "epoch": 44.28065395095368,
+ "grad_norm": 4.77384614944458,
+ "learning_rate": 1.2316922933693893e-05,
+ "loss": 0.2323,
+ "step": 16251
+ },
+ {
+ "epoch": 44.283378746594,
+ "grad_norm": 4.476263046264648,
+ "learning_rate": 1.2316064443488715e-05,
+ "loss": 0.1991,
+ "step": 16252
+ },
+ {
+ "epoch": 44.28610354223433,
+ "grad_norm": 5.16072416305542,
+ "learning_rate": 1.2315205935246103e-05,
+ "loss": 0.4493,
+ "step": 16253
+ },
+ {
+ "epoch": 44.28882833787466,
+ "grad_norm": 6.235977649688721,
+ "learning_rate": 1.2314347408972742e-05,
+ "loss": 0.1392,
+ "step": 16254
+ },
+ {
+ "epoch": 44.29155313351499,
+ "grad_norm": 11.483926773071289,
+ "learning_rate": 1.2313488864675318e-05,
+ "loss": 0.245,
+ "step": 16255
+ },
+ {
+ "epoch": 44.294277929155314,
+ "grad_norm": 4.5253729820251465,
+ "learning_rate": 1.2312630302360513e-05,
+ "loss": 0.1809,
+ "step": 16256
+ },
+ {
+ "epoch": 44.29700272479564,
+ "grad_norm": 5.335109233856201,
+ "learning_rate": 1.2311771722035022e-05,
+ "loss": 0.1643,
+ "step": 16257
+ },
+ {
+ "epoch": 44.299727520435965,
+ "grad_norm": 7.941211700439453,
+ "learning_rate": 1.2310913123705523e-05,
+ "loss": 0.2764,
+ "step": 16258
+ },
+ {
+ "epoch": 44.30245231607629,
+ "grad_norm": 5.2220845222473145,
+ "learning_rate": 1.2310054507378712e-05,
+ "loss": 0.2522,
+ "step": 16259
+ },
+ {
+ "epoch": 44.305177111716624,
+ "grad_norm": 6.244221210479736,
+ "learning_rate": 1.2309195873061269e-05,
+ "loss": 0.2413,
+ "step": 16260
+ },
+ {
+ "epoch": 44.30790190735695,
+ "grad_norm": 5.436784267425537,
+ "learning_rate": 1.2308337220759883e-05,
+ "loss": 0.251,
+ "step": 16261
+ },
+ {
+ "epoch": 44.310626702997276,
+ "grad_norm": 6.853261470794678,
+ "learning_rate": 1.230747855048124e-05,
+ "loss": 0.2238,
+ "step": 16262
+ },
+ {
+ "epoch": 44.3133514986376,
+ "grad_norm": 6.074221134185791,
+ "learning_rate": 1.230661986223203e-05,
+ "loss": 0.3987,
+ "step": 16263
+ },
+ {
+ "epoch": 44.31607629427793,
+ "grad_norm": 5.958846569061279,
+ "learning_rate": 1.2305761156018936e-05,
+ "loss": 0.2845,
+ "step": 16264
+ },
+ {
+ "epoch": 44.31880108991825,
+ "grad_norm": 6.054225444793701,
+ "learning_rate": 1.230490243184865e-05,
+ "loss": 0.2574,
+ "step": 16265
+ },
+ {
+ "epoch": 44.321525885558586,
+ "grad_norm": 5.6045098304748535,
+ "learning_rate": 1.2304043689727859e-05,
+ "loss": 0.2519,
+ "step": 16266
+ },
+ {
+ "epoch": 44.32425068119891,
+ "grad_norm": 6.948996543884277,
+ "learning_rate": 1.2303184929663248e-05,
+ "loss": 0.1045,
+ "step": 16267
+ },
+ {
+ "epoch": 44.32697547683924,
+ "grad_norm": 4.249958038330078,
+ "learning_rate": 1.2302326151661509e-05,
+ "loss": 0.2094,
+ "step": 16268
+ },
+ {
+ "epoch": 44.32970027247956,
+ "grad_norm": 5.515820503234863,
+ "learning_rate": 1.2301467355729327e-05,
+ "loss": 0.3183,
+ "step": 16269
+ },
+ {
+ "epoch": 44.33242506811989,
+ "grad_norm": 6.033924102783203,
+ "learning_rate": 1.2300608541873391e-05,
+ "loss": 0.2324,
+ "step": 16270
+ },
+ {
+ "epoch": 44.335149863760215,
+ "grad_norm": 16.895814895629883,
+ "learning_rate": 1.229974971010039e-05,
+ "loss": 0.2255,
+ "step": 16271
+ },
+ {
+ "epoch": 44.33787465940055,
+ "grad_norm": 5.29602575302124,
+ "learning_rate": 1.2298890860417013e-05,
+ "loss": 0.1508,
+ "step": 16272
+ },
+ {
+ "epoch": 44.34059945504087,
+ "grad_norm": 5.749146938323975,
+ "learning_rate": 1.2298031992829945e-05,
+ "loss": 0.2484,
+ "step": 16273
+ },
+ {
+ "epoch": 44.3433242506812,
+ "grad_norm": 5.419031143188477,
+ "learning_rate": 1.229717310734588e-05,
+ "loss": 0.236,
+ "step": 16274
+ },
+ {
+ "epoch": 44.346049046321525,
+ "grad_norm": 6.744513034820557,
+ "learning_rate": 1.2296314203971505e-05,
+ "loss": 0.1292,
+ "step": 16275
+ },
+ {
+ "epoch": 44.34877384196185,
+ "grad_norm": 5.140876293182373,
+ "learning_rate": 1.2295455282713509e-05,
+ "loss": 0.2218,
+ "step": 16276
+ },
+ {
+ "epoch": 44.35149863760218,
+ "grad_norm": 5.723390579223633,
+ "learning_rate": 1.229459634357858e-05,
+ "loss": 0.3446,
+ "step": 16277
+ },
+ {
+ "epoch": 44.35422343324251,
+ "grad_norm": 4.45698881149292,
+ "learning_rate": 1.229373738657341e-05,
+ "loss": 0.1729,
+ "step": 16278
+ },
+ {
+ "epoch": 44.356948228882835,
+ "grad_norm": 5.501786708831787,
+ "learning_rate": 1.2292878411704688e-05,
+ "loss": 0.1649,
+ "step": 16279
+ },
+ {
+ "epoch": 44.35967302452316,
+ "grad_norm": 5.382435321807861,
+ "learning_rate": 1.2292019418979098e-05,
+ "loss": 0.1078,
+ "step": 16280
+ },
+ {
+ "epoch": 44.36239782016349,
+ "grad_norm": 6.311226844787598,
+ "learning_rate": 1.2291160408403338e-05,
+ "loss": 0.2673,
+ "step": 16281
+ },
+ {
+ "epoch": 44.36512261580381,
+ "grad_norm": 5.9953742027282715,
+ "learning_rate": 1.2290301379984095e-05,
+ "loss": 0.1188,
+ "step": 16282
+ },
+ {
+ "epoch": 44.36784741144414,
+ "grad_norm": 6.1877312660217285,
+ "learning_rate": 1.2289442333728057e-05,
+ "loss": 0.2395,
+ "step": 16283
+ },
+ {
+ "epoch": 44.37057220708447,
+ "grad_norm": 6.551638126373291,
+ "learning_rate": 1.2288583269641917e-05,
+ "loss": 0.1718,
+ "step": 16284
+ },
+ {
+ "epoch": 44.3732970027248,
+ "grad_norm": 5.743000030517578,
+ "learning_rate": 1.2287724187732364e-05,
+ "loss": 0.1979,
+ "step": 16285
+ },
+ {
+ "epoch": 44.37602179836512,
+ "grad_norm": 4.951767921447754,
+ "learning_rate": 1.2286865088006088e-05,
+ "loss": 0.1429,
+ "step": 16286
+ },
+ {
+ "epoch": 44.37874659400545,
+ "grad_norm": 7.207986354827881,
+ "learning_rate": 1.2286005970469779e-05,
+ "loss": 0.1797,
+ "step": 16287
+ },
+ {
+ "epoch": 44.381471389645775,
+ "grad_norm": 5.050862789154053,
+ "learning_rate": 1.2285146835130133e-05,
+ "loss": 0.1633,
+ "step": 16288
+ },
+ {
+ "epoch": 44.3841961852861,
+ "grad_norm": 4.695954322814941,
+ "learning_rate": 1.2284287681993834e-05,
+ "loss": 0.2142,
+ "step": 16289
+ },
+ {
+ "epoch": 44.38692098092643,
+ "grad_norm": 5.752518653869629,
+ "learning_rate": 1.2283428511067574e-05,
+ "loss": 0.2671,
+ "step": 16290
+ },
+ {
+ "epoch": 44.38964577656676,
+ "grad_norm": 4.853794097900391,
+ "learning_rate": 1.228256932235805e-05,
+ "loss": 0.2382,
+ "step": 16291
+ },
+ {
+ "epoch": 44.392370572207085,
+ "grad_norm": 5.388570785522461,
+ "learning_rate": 1.228171011587195e-05,
+ "loss": 0.1693,
+ "step": 16292
+ },
+ {
+ "epoch": 44.39509536784741,
+ "grad_norm": 4.890974998474121,
+ "learning_rate": 1.228085089161596e-05,
+ "loss": 0.2088,
+ "step": 16293
+ },
+ {
+ "epoch": 44.39782016348774,
+ "grad_norm": 4.6638360023498535,
+ "learning_rate": 1.2279991649596784e-05,
+ "loss": 0.2171,
+ "step": 16294
+ },
+ {
+ "epoch": 44.40054495912806,
+ "grad_norm": 5.858438491821289,
+ "learning_rate": 1.22791323898211e-05,
+ "loss": 0.3256,
+ "step": 16295
+ },
+ {
+ "epoch": 44.403269754768395,
+ "grad_norm": 5.6721720695495605,
+ "learning_rate": 1.2278273112295612e-05,
+ "loss": 0.2023,
+ "step": 16296
+ },
+ {
+ "epoch": 44.40599455040872,
+ "grad_norm": 4.828054904937744,
+ "learning_rate": 1.2277413817027003e-05,
+ "loss": 0.2213,
+ "step": 16297
+ },
+ {
+ "epoch": 44.40871934604905,
+ "grad_norm": 4.199804782867432,
+ "learning_rate": 1.2276554504021969e-05,
+ "loss": 0.2457,
+ "step": 16298
+ },
+ {
+ "epoch": 44.41144414168937,
+ "grad_norm": 5.8764142990112305,
+ "learning_rate": 1.22756951732872e-05,
+ "loss": 0.3098,
+ "step": 16299
+ },
+ {
+ "epoch": 44.4141689373297,
+ "grad_norm": 4.359859943389893,
+ "learning_rate": 1.2274835824829392e-05,
+ "loss": 0.1701,
+ "step": 16300
+ },
+ {
+ "epoch": 44.416893732970024,
+ "grad_norm": 16.240520477294922,
+ "learning_rate": 1.2273976458655233e-05,
+ "loss": 0.1604,
+ "step": 16301
+ },
+ {
+ "epoch": 44.41961852861036,
+ "grad_norm": 6.469280242919922,
+ "learning_rate": 1.2273117074771423e-05,
+ "loss": 0.138,
+ "step": 16302
+ },
+ {
+ "epoch": 44.42234332425068,
+ "grad_norm": 3.977710723876953,
+ "learning_rate": 1.2272257673184646e-05,
+ "loss": 0.0885,
+ "step": 16303
+ },
+ {
+ "epoch": 44.42506811989101,
+ "grad_norm": 4.005497455596924,
+ "learning_rate": 1.2271398253901606e-05,
+ "loss": 0.1484,
+ "step": 16304
+ },
+ {
+ "epoch": 44.427792915531334,
+ "grad_norm": 4.929205417633057,
+ "learning_rate": 1.2270538816928982e-05,
+ "loss": 0.2453,
+ "step": 16305
+ },
+ {
+ "epoch": 44.43051771117166,
+ "grad_norm": 5.408425807952881,
+ "learning_rate": 1.226967936227348e-05,
+ "loss": 0.1835,
+ "step": 16306
+ },
+ {
+ "epoch": 44.433242506811986,
+ "grad_norm": 4.860259532928467,
+ "learning_rate": 1.2268819889941784e-05,
+ "loss": 0.2817,
+ "step": 16307
+ },
+ {
+ "epoch": 44.43596730245232,
+ "grad_norm": 5.1819329261779785,
+ "learning_rate": 1.2267960399940595e-05,
+ "loss": 0.1383,
+ "step": 16308
+ },
+ {
+ "epoch": 44.438692098092645,
+ "grad_norm": 6.924758434295654,
+ "learning_rate": 1.2267100892276602e-05,
+ "loss": 0.1461,
+ "step": 16309
+ },
+ {
+ "epoch": 44.44141689373297,
+ "grad_norm": 4.335215091705322,
+ "learning_rate": 1.2266241366956503e-05,
+ "loss": 0.1862,
+ "step": 16310
+ },
+ {
+ "epoch": 44.444141689373296,
+ "grad_norm": 4.81735897064209,
+ "learning_rate": 1.2265381823986984e-05,
+ "loss": 0.1676,
+ "step": 16311
+ },
+ {
+ "epoch": 44.44686648501362,
+ "grad_norm": 4.712780952453613,
+ "learning_rate": 1.2264522263374747e-05,
+ "loss": 0.1684,
+ "step": 16312
+ },
+ {
+ "epoch": 44.44959128065395,
+ "grad_norm": 4.163626194000244,
+ "learning_rate": 1.2263662685126486e-05,
+ "loss": 0.1801,
+ "step": 16313
+ },
+ {
+ "epoch": 44.45231607629428,
+ "grad_norm": 6.2198805809021,
+ "learning_rate": 1.2262803089248889e-05,
+ "loss": 0.1632,
+ "step": 16314
+ },
+ {
+ "epoch": 44.45504087193461,
+ "grad_norm": 6.122025012969971,
+ "learning_rate": 1.2261943475748657e-05,
+ "loss": 0.3163,
+ "step": 16315
+ },
+ {
+ "epoch": 44.45776566757493,
+ "grad_norm": 4.518787384033203,
+ "learning_rate": 1.226108384463248e-05,
+ "loss": 0.1251,
+ "step": 16316
+ },
+ {
+ "epoch": 44.46049046321526,
+ "grad_norm": 5.9850640296936035,
+ "learning_rate": 1.2260224195907053e-05,
+ "loss": 0.2348,
+ "step": 16317
+ },
+ {
+ "epoch": 44.463215258855584,
+ "grad_norm": 5.899969100952148,
+ "learning_rate": 1.2259364529579076e-05,
+ "loss": 0.2406,
+ "step": 16318
+ },
+ {
+ "epoch": 44.46594005449591,
+ "grad_norm": 5.047104358673096,
+ "learning_rate": 1.2258504845655242e-05,
+ "loss": 0.1589,
+ "step": 16319
+ },
+ {
+ "epoch": 44.46866485013624,
+ "grad_norm": 6.053981304168701,
+ "learning_rate": 1.2257645144142244e-05,
+ "loss": 0.2739,
+ "step": 16320
+ },
+ {
+ "epoch": 44.47138964577657,
+ "grad_norm": 6.156033515930176,
+ "learning_rate": 1.2256785425046776e-05,
+ "loss": 0.2014,
+ "step": 16321
+ },
+ {
+ "epoch": 44.474114441416894,
+ "grad_norm": 5.389181137084961,
+ "learning_rate": 1.2255925688375539e-05,
+ "loss": 0.2613,
+ "step": 16322
+ },
+ {
+ "epoch": 44.47683923705722,
+ "grad_norm": 4.212601661682129,
+ "learning_rate": 1.2255065934135222e-05,
+ "loss": 0.2288,
+ "step": 16323
+ },
+ {
+ "epoch": 44.479564032697546,
+ "grad_norm": 5.5055108070373535,
+ "learning_rate": 1.2254206162332523e-05,
+ "loss": 0.1921,
+ "step": 16324
+ },
+ {
+ "epoch": 44.48228882833787,
+ "grad_norm": 4.336231231689453,
+ "learning_rate": 1.2253346372974142e-05,
+ "loss": 0.1337,
+ "step": 16325
+ },
+ {
+ "epoch": 44.485013623978205,
+ "grad_norm": 4.315658092498779,
+ "learning_rate": 1.2252486566066772e-05,
+ "loss": 0.1666,
+ "step": 16326
+ },
+ {
+ "epoch": 44.48773841961853,
+ "grad_norm": 5.385659217834473,
+ "learning_rate": 1.2251626741617106e-05,
+ "loss": 0.1505,
+ "step": 16327
+ },
+ {
+ "epoch": 44.490463215258856,
+ "grad_norm": 5.198558807373047,
+ "learning_rate": 1.225076689963185e-05,
+ "loss": 0.2453,
+ "step": 16328
+ },
+ {
+ "epoch": 44.49318801089918,
+ "grad_norm": 7.6078200340271,
+ "learning_rate": 1.2249907040117688e-05,
+ "loss": 0.1817,
+ "step": 16329
+ },
+ {
+ "epoch": 44.49591280653951,
+ "grad_norm": 7.1719441413879395,
+ "learning_rate": 1.2249047163081325e-05,
+ "loss": 0.1521,
+ "step": 16330
+ },
+ {
+ "epoch": 44.49863760217983,
+ "grad_norm": 4.648802280426025,
+ "learning_rate": 1.2248187268529453e-05,
+ "loss": 0.1992,
+ "step": 16331
+ },
+ {
+ "epoch": 44.50136239782017,
+ "grad_norm": 5.414094924926758,
+ "learning_rate": 1.2247327356468772e-05,
+ "loss": 0.1876,
+ "step": 16332
+ },
+ {
+ "epoch": 44.50408719346049,
+ "grad_norm": 6.786231994628906,
+ "learning_rate": 1.2246467426905978e-05,
+ "loss": 0.3367,
+ "step": 16333
+ },
+ {
+ "epoch": 44.50681198910082,
+ "grad_norm": 7.858244895935059,
+ "learning_rate": 1.2245607479847767e-05,
+ "loss": 0.245,
+ "step": 16334
+ },
+ {
+ "epoch": 44.509536784741144,
+ "grad_norm": 7.821645736694336,
+ "learning_rate": 1.2244747515300839e-05,
+ "loss": 0.1359,
+ "step": 16335
+ },
+ {
+ "epoch": 44.51226158038147,
+ "grad_norm": 11.80642032623291,
+ "learning_rate": 1.224388753327189e-05,
+ "loss": 0.1764,
+ "step": 16336
+ },
+ {
+ "epoch": 44.514986376021795,
+ "grad_norm": 6.316769599914551,
+ "learning_rate": 1.2243027533767614e-05,
+ "loss": 0.175,
+ "step": 16337
+ },
+ {
+ "epoch": 44.51771117166213,
+ "grad_norm": 5.621060371398926,
+ "learning_rate": 1.2242167516794714e-05,
+ "loss": 0.1629,
+ "step": 16338
+ },
+ {
+ "epoch": 44.520435967302454,
+ "grad_norm": 4.951374530792236,
+ "learning_rate": 1.2241307482359885e-05,
+ "loss": 0.2068,
+ "step": 16339
+ },
+ {
+ "epoch": 44.52316076294278,
+ "grad_norm": 5.404215335845947,
+ "learning_rate": 1.2240447430469829e-05,
+ "loss": 0.1461,
+ "step": 16340
+ },
+ {
+ "epoch": 44.525885558583106,
+ "grad_norm": 5.342979431152344,
+ "learning_rate": 1.2239587361131235e-05,
+ "loss": 0.1788,
+ "step": 16341
+ },
+ {
+ "epoch": 44.52861035422343,
+ "grad_norm": 5.920839309692383,
+ "learning_rate": 1.2238727274350808e-05,
+ "loss": 0.2077,
+ "step": 16342
+ },
+ {
+ "epoch": 44.53133514986376,
+ "grad_norm": 4.700316905975342,
+ "learning_rate": 1.2237867170135244e-05,
+ "loss": 0.1705,
+ "step": 16343
+ },
+ {
+ "epoch": 44.53405994550409,
+ "grad_norm": 5.291968822479248,
+ "learning_rate": 1.2237007048491248e-05,
+ "loss": 0.2509,
+ "step": 16344
+ },
+ {
+ "epoch": 44.536784741144416,
+ "grad_norm": 4.686873912811279,
+ "learning_rate": 1.2236146909425508e-05,
+ "loss": 0.246,
+ "step": 16345
+ },
+ {
+ "epoch": 44.53950953678474,
+ "grad_norm": 6.583618640899658,
+ "learning_rate": 1.223528675294473e-05,
+ "loss": 0.253,
+ "step": 16346
+ },
+ {
+ "epoch": 44.54223433242507,
+ "grad_norm": 4.258402347564697,
+ "learning_rate": 1.223442657905561e-05,
+ "loss": 0.2042,
+ "step": 16347
+ },
+ {
+ "epoch": 44.54495912806539,
+ "grad_norm": 5.072122097015381,
+ "learning_rate": 1.2233566387764847e-05,
+ "loss": 0.1084,
+ "step": 16348
+ },
+ {
+ "epoch": 44.54768392370572,
+ "grad_norm": 4.582540512084961,
+ "learning_rate": 1.2232706179079142e-05,
+ "loss": 0.165,
+ "step": 16349
+ },
+ {
+ "epoch": 44.55040871934605,
+ "grad_norm": 5.258549213409424,
+ "learning_rate": 1.2231845953005192e-05,
+ "loss": 0.1454,
+ "step": 16350
+ },
+ {
+ "epoch": 44.55313351498638,
+ "grad_norm": 5.412867546081543,
+ "learning_rate": 1.2230985709549699e-05,
+ "loss": 0.2958,
+ "step": 16351
+ },
+ {
+ "epoch": 44.555858310626704,
+ "grad_norm": 5.269376754760742,
+ "learning_rate": 1.2230125448719358e-05,
+ "loss": 0.3327,
+ "step": 16352
+ },
+ {
+ "epoch": 44.55858310626703,
+ "grad_norm": 5.642248153686523,
+ "learning_rate": 1.2229265170520876e-05,
+ "loss": 0.3118,
+ "step": 16353
+ },
+ {
+ "epoch": 44.561307901907355,
+ "grad_norm": 6.034834384918213,
+ "learning_rate": 1.2228404874960949e-05,
+ "loss": 0.2119,
+ "step": 16354
+ },
+ {
+ "epoch": 44.56403269754768,
+ "grad_norm": 4.387385368347168,
+ "learning_rate": 1.2227544562046272e-05,
+ "loss": 0.1628,
+ "step": 16355
+ },
+ {
+ "epoch": 44.566757493188014,
+ "grad_norm": 7.412023067474365,
+ "learning_rate": 1.2226684231783551e-05,
+ "loss": 0.3198,
+ "step": 16356
+ },
+ {
+ "epoch": 44.56948228882834,
+ "grad_norm": 5.820879936218262,
+ "learning_rate": 1.2225823884179486e-05,
+ "loss": 0.2483,
+ "step": 16357
+ },
+ {
+ "epoch": 44.572207084468666,
+ "grad_norm": 5.885914325714111,
+ "learning_rate": 1.222496351924078e-05,
+ "loss": 0.2217,
+ "step": 16358
+ },
+ {
+ "epoch": 44.57493188010899,
+ "grad_norm": 7.226802349090576,
+ "learning_rate": 1.2224103136974123e-05,
+ "loss": 0.2107,
+ "step": 16359
+ },
+ {
+ "epoch": 44.57765667574932,
+ "grad_norm": 4.522464275360107,
+ "learning_rate": 1.2223242737386225e-05,
+ "loss": 0.1055,
+ "step": 16360
+ },
+ {
+ "epoch": 44.58038147138964,
+ "grad_norm": 4.730563640594482,
+ "learning_rate": 1.2222382320483785e-05,
+ "loss": 0.2857,
+ "step": 16361
+ },
+ {
+ "epoch": 44.583106267029976,
+ "grad_norm": 5.198635101318359,
+ "learning_rate": 1.2221521886273502e-05,
+ "loss": 0.1795,
+ "step": 16362
+ },
+ {
+ "epoch": 44.5858310626703,
+ "grad_norm": 5.904626846313477,
+ "learning_rate": 1.222066143476208e-05,
+ "loss": 0.2273,
+ "step": 16363
+ },
+ {
+ "epoch": 44.58855585831063,
+ "grad_norm": 4.365389823913574,
+ "learning_rate": 1.2219800965956217e-05,
+ "loss": 0.1739,
+ "step": 16364
+ },
+ {
+ "epoch": 44.59128065395095,
+ "grad_norm": 5.098349571228027,
+ "learning_rate": 1.2218940479862613e-05,
+ "loss": 0.2538,
+ "step": 16365
+ },
+ {
+ "epoch": 44.59400544959128,
+ "grad_norm": 5.18057918548584,
+ "learning_rate": 1.2218079976487976e-05,
+ "loss": 0.2011,
+ "step": 16366
+ },
+ {
+ "epoch": 44.596730245231605,
+ "grad_norm": 5.942376613616943,
+ "learning_rate": 1.2217219455839e-05,
+ "loss": 0.2401,
+ "step": 16367
+ },
+ {
+ "epoch": 44.59945504087194,
+ "grad_norm": 5.536251068115234,
+ "learning_rate": 1.221635891792239e-05,
+ "loss": 0.1822,
+ "step": 16368
+ },
+ {
+ "epoch": 44.60217983651226,
+ "grad_norm": 4.777346134185791,
+ "learning_rate": 1.2215498362744853e-05,
+ "loss": 0.2757,
+ "step": 16369
+ },
+ {
+ "epoch": 44.60490463215259,
+ "grad_norm": 6.0716633796691895,
+ "learning_rate": 1.2214637790313081e-05,
+ "loss": 0.5032,
+ "step": 16370
+ },
+ {
+ "epoch": 44.607629427792915,
+ "grad_norm": 4.697019577026367,
+ "learning_rate": 1.2213777200633786e-05,
+ "loss": 0.1395,
+ "step": 16371
+ },
+ {
+ "epoch": 44.61035422343324,
+ "grad_norm": 6.832633972167969,
+ "learning_rate": 1.221291659371366e-05,
+ "loss": 0.1398,
+ "step": 16372
+ },
+ {
+ "epoch": 44.61307901907357,
+ "grad_norm": 4.780966281890869,
+ "learning_rate": 1.2212055969559415e-05,
+ "loss": 0.1528,
+ "step": 16373
+ },
+ {
+ "epoch": 44.6158038147139,
+ "grad_norm": 5.384737491607666,
+ "learning_rate": 1.2211195328177747e-05,
+ "loss": 0.2267,
+ "step": 16374
+ },
+ {
+ "epoch": 44.618528610354225,
+ "grad_norm": 5.076670169830322,
+ "learning_rate": 1.2210334669575362e-05,
+ "loss": 0.1704,
+ "step": 16375
+ },
+ {
+ "epoch": 44.62125340599455,
+ "grad_norm": 4.770692825317383,
+ "learning_rate": 1.2209473993758957e-05,
+ "loss": 0.1446,
+ "step": 16376
+ },
+ {
+ "epoch": 44.62397820163488,
+ "grad_norm": 6.416381359100342,
+ "learning_rate": 1.2208613300735247e-05,
+ "loss": 0.2606,
+ "step": 16377
+ },
+ {
+ "epoch": 44.6267029972752,
+ "grad_norm": 4.535919189453125,
+ "learning_rate": 1.2207752590510924e-05,
+ "loss": 0.3067,
+ "step": 16378
+ },
+ {
+ "epoch": 44.62942779291553,
+ "grad_norm": 5.324057102203369,
+ "learning_rate": 1.2206891863092697e-05,
+ "loss": 0.2079,
+ "step": 16379
+ },
+ {
+ "epoch": 44.63215258855586,
+ "grad_norm": 5.409849643707275,
+ "learning_rate": 1.2206031118487264e-05,
+ "loss": 0.2076,
+ "step": 16380
+ },
+ {
+ "epoch": 44.63487738419619,
+ "grad_norm": 6.793900489807129,
+ "learning_rate": 1.2205170356701337e-05,
+ "loss": 0.162,
+ "step": 16381
+ },
+ {
+ "epoch": 44.63760217983651,
+ "grad_norm": 4.991828441619873,
+ "learning_rate": 1.220430957774161e-05,
+ "loss": 0.212,
+ "step": 16382
+ },
+ {
+ "epoch": 44.64032697547684,
+ "grad_norm": 6.235599040985107,
+ "learning_rate": 1.220344878161479e-05,
+ "loss": 0.2661,
+ "step": 16383
+ },
+ {
+ "epoch": 44.643051771117165,
+ "grad_norm": 4.532994747161865,
+ "learning_rate": 1.2202587968327584e-05,
+ "loss": 0.2122,
+ "step": 16384
+ },
+ {
+ "epoch": 44.64577656675749,
+ "grad_norm": 5.00579833984375,
+ "learning_rate": 1.2201727137886692e-05,
+ "loss": 0.2256,
+ "step": 16385
+ },
+ {
+ "epoch": 44.64850136239782,
+ "grad_norm": 4.9762372970581055,
+ "learning_rate": 1.220086629029882e-05,
+ "loss": 0.348,
+ "step": 16386
+ },
+ {
+ "epoch": 44.65122615803815,
+ "grad_norm": 5.744802474975586,
+ "learning_rate": 1.2200005425570676e-05,
+ "loss": 0.268,
+ "step": 16387
+ },
+ {
+ "epoch": 44.653950953678475,
+ "grad_norm": 4.24283504486084,
+ "learning_rate": 1.2199144543708957e-05,
+ "loss": 0.1737,
+ "step": 16388
+ },
+ {
+ "epoch": 44.6566757493188,
+ "grad_norm": 4.924327850341797,
+ "learning_rate": 1.2198283644720373e-05,
+ "loss": 0.2677,
+ "step": 16389
+ },
+ {
+ "epoch": 44.65940054495913,
+ "grad_norm": 4.337157249450684,
+ "learning_rate": 1.2197422728611624e-05,
+ "loss": 0.3367,
+ "step": 16390
+ },
+ {
+ "epoch": 44.66212534059945,
+ "grad_norm": 5.2622456550598145,
+ "learning_rate": 1.219656179538942e-05,
+ "loss": 0.2184,
+ "step": 16391
+ },
+ {
+ "epoch": 44.664850136239785,
+ "grad_norm": 3.9210143089294434,
+ "learning_rate": 1.2195700845060462e-05,
+ "loss": 0.3047,
+ "step": 16392
+ },
+ {
+ "epoch": 44.66757493188011,
+ "grad_norm": 4.90424108505249,
+ "learning_rate": 1.2194839877631457e-05,
+ "loss": 0.1054,
+ "step": 16393
+ },
+ {
+ "epoch": 44.67029972752044,
+ "grad_norm": 4.5516862869262695,
+ "learning_rate": 1.2193978893109109e-05,
+ "loss": 0.2586,
+ "step": 16394
+ },
+ {
+ "epoch": 44.67302452316076,
+ "grad_norm": 5.143599987030029,
+ "learning_rate": 1.2193117891500126e-05,
+ "loss": 0.258,
+ "step": 16395
+ },
+ {
+ "epoch": 44.67574931880109,
+ "grad_norm": 5.577111721038818,
+ "learning_rate": 1.2192256872811207e-05,
+ "loss": 0.1353,
+ "step": 16396
+ },
+ {
+ "epoch": 44.678474114441414,
+ "grad_norm": 5.602947235107422,
+ "learning_rate": 1.219139583704907e-05,
+ "loss": 0.3288,
+ "step": 16397
+ },
+ {
+ "epoch": 44.68119891008175,
+ "grad_norm": 5.5605082511901855,
+ "learning_rate": 1.2190534784220405e-05,
+ "loss": 0.2506,
+ "step": 16398
+ },
+ {
+ "epoch": 44.68392370572207,
+ "grad_norm": 6.177340507507324,
+ "learning_rate": 1.2189673714331932e-05,
+ "loss": 0.167,
+ "step": 16399
+ },
+ {
+ "epoch": 44.6866485013624,
+ "grad_norm": 4.574554443359375,
+ "learning_rate": 1.2188812627390345e-05,
+ "loss": 0.1967,
+ "step": 16400
+ },
+ {
+ "epoch": 44.689373297002724,
+ "grad_norm": 4.757580757141113,
+ "learning_rate": 1.218795152340236e-05,
+ "loss": 0.183,
+ "step": 16401
+ },
+ {
+ "epoch": 44.69209809264305,
+ "grad_norm": 5.213620185852051,
+ "learning_rate": 1.2187090402374673e-05,
+ "loss": 0.3285,
+ "step": 16402
+ },
+ {
+ "epoch": 44.694822888283376,
+ "grad_norm": 5.771677494049072,
+ "learning_rate": 1.2186229264314e-05,
+ "loss": 0.171,
+ "step": 16403
+ },
+ {
+ "epoch": 44.69754768392371,
+ "grad_norm": 5.553153991699219,
+ "learning_rate": 1.2185368109227044e-05,
+ "loss": 0.3119,
+ "step": 16404
+ },
+ {
+ "epoch": 44.700272479564035,
+ "grad_norm": 4.6227827072143555,
+ "learning_rate": 1.2184506937120513e-05,
+ "loss": 0.1755,
+ "step": 16405
+ },
+ {
+ "epoch": 44.70299727520436,
+ "grad_norm": 4.735884189605713,
+ "learning_rate": 1.2183645748001109e-05,
+ "loss": 0.1804,
+ "step": 16406
+ },
+ {
+ "epoch": 44.705722070844686,
+ "grad_norm": 5.025547981262207,
+ "learning_rate": 1.2182784541875546e-05,
+ "loss": 0.177,
+ "step": 16407
+ },
+ {
+ "epoch": 44.70844686648501,
+ "grad_norm": 8.84172248840332,
+ "learning_rate": 1.2181923318750523e-05,
+ "loss": 0.2655,
+ "step": 16408
+ },
+ {
+ "epoch": 44.71117166212534,
+ "grad_norm": 5.576916694641113,
+ "learning_rate": 1.2181062078632757e-05,
+ "loss": 0.2252,
+ "step": 16409
+ },
+ {
+ "epoch": 44.71389645776567,
+ "grad_norm": 7.395151615142822,
+ "learning_rate": 1.2180200821528942e-05,
+ "loss": 0.2293,
+ "step": 16410
+ },
+ {
+ "epoch": 44.716621253406,
+ "grad_norm": 6.201037883758545,
+ "learning_rate": 1.2179339547445799e-05,
+ "loss": 0.214,
+ "step": 16411
+ },
+ {
+ "epoch": 44.71934604904632,
+ "grad_norm": 4.671193599700928,
+ "learning_rate": 1.2178478256390028e-05,
+ "loss": 0.1127,
+ "step": 16412
+ },
+ {
+ "epoch": 44.72207084468665,
+ "grad_norm": 6.584817409515381,
+ "learning_rate": 1.2177616948368341e-05,
+ "loss": 0.2061,
+ "step": 16413
+ },
+ {
+ "epoch": 44.724795640326974,
+ "grad_norm": 5.561539649963379,
+ "learning_rate": 1.217675562338744e-05,
+ "loss": 0.2798,
+ "step": 16414
+ },
+ {
+ "epoch": 44.7275204359673,
+ "grad_norm": 6.056123733520508,
+ "learning_rate": 1.2175894281454037e-05,
+ "loss": 0.2159,
+ "step": 16415
+ },
+ {
+ "epoch": 44.73024523160763,
+ "grad_norm": 6.623376369476318,
+ "learning_rate": 1.2175032922574839e-05,
+ "loss": 0.262,
+ "step": 16416
+ },
+ {
+ "epoch": 44.73297002724796,
+ "grad_norm": 7.3019537925720215,
+ "learning_rate": 1.2174171546756557e-05,
+ "loss": 0.3738,
+ "step": 16417
+ },
+ {
+ "epoch": 44.735694822888284,
+ "grad_norm": 6.133616924285889,
+ "learning_rate": 1.2173310154005896e-05,
+ "loss": 0.1665,
+ "step": 16418
+ },
+ {
+ "epoch": 44.73841961852861,
+ "grad_norm": 5.614738941192627,
+ "learning_rate": 1.217244874432956e-05,
+ "loss": 0.1658,
+ "step": 16419
+ },
+ {
+ "epoch": 44.741144414168936,
+ "grad_norm": 4.63480806350708,
+ "learning_rate": 1.2171587317734268e-05,
+ "loss": 0.1498,
+ "step": 16420
+ },
+ {
+ "epoch": 44.74386920980926,
+ "grad_norm": 5.289315223693848,
+ "learning_rate": 1.2170725874226725e-05,
+ "loss": 0.2081,
+ "step": 16421
+ },
+ {
+ "epoch": 44.746594005449595,
+ "grad_norm": 4.7408599853515625,
+ "learning_rate": 1.2169864413813637e-05,
+ "loss": 0.1478,
+ "step": 16422
+ },
+ {
+ "epoch": 44.74931880108992,
+ "grad_norm": 6.242374420166016,
+ "learning_rate": 1.2169002936501717e-05,
+ "loss": 0.2716,
+ "step": 16423
+ },
+ {
+ "epoch": 44.752043596730246,
+ "grad_norm": 5.0137434005737305,
+ "learning_rate": 1.216814144229767e-05,
+ "loss": 0.2229,
+ "step": 16424
+ },
+ {
+ "epoch": 44.75476839237057,
+ "grad_norm": 5.0223798751831055,
+ "learning_rate": 1.2167279931208209e-05,
+ "loss": 0.1383,
+ "step": 16425
+ },
+ {
+ "epoch": 44.7574931880109,
+ "grad_norm": 6.727980613708496,
+ "learning_rate": 1.2166418403240038e-05,
+ "loss": 0.1514,
+ "step": 16426
+ },
+ {
+ "epoch": 44.76021798365122,
+ "grad_norm": 7.22456169128418,
+ "learning_rate": 1.2165556858399874e-05,
+ "loss": 0.1984,
+ "step": 16427
+ },
+ {
+ "epoch": 44.762942779291556,
+ "grad_norm": 4.701144695281982,
+ "learning_rate": 1.216469529669442e-05,
+ "loss": 0.2101,
+ "step": 16428
+ },
+ {
+ "epoch": 44.76566757493188,
+ "grad_norm": 5.2383222579956055,
+ "learning_rate": 1.216383371813039e-05,
+ "loss": 0.1126,
+ "step": 16429
+ },
+ {
+ "epoch": 44.76839237057221,
+ "grad_norm": 6.049795627593994,
+ "learning_rate": 1.2162972122714491e-05,
+ "loss": 0.2141,
+ "step": 16430
+ },
+ {
+ "epoch": 44.771117166212534,
+ "grad_norm": 6.866738796234131,
+ "learning_rate": 1.2162110510453437e-05,
+ "loss": 0.2691,
+ "step": 16431
+ },
+ {
+ "epoch": 44.77384196185286,
+ "grad_norm": 6.67152214050293,
+ "learning_rate": 1.2161248881353936e-05,
+ "loss": 0.1846,
+ "step": 16432
+ },
+ {
+ "epoch": 44.776566757493185,
+ "grad_norm": 4.297389984130859,
+ "learning_rate": 1.2160387235422697e-05,
+ "loss": 0.3139,
+ "step": 16433
+ },
+ {
+ "epoch": 44.77929155313352,
+ "grad_norm": 4.853041172027588,
+ "learning_rate": 1.215952557266643e-05,
+ "loss": 0.3744,
+ "step": 16434
+ },
+ {
+ "epoch": 44.782016348773844,
+ "grad_norm": 4.801114559173584,
+ "learning_rate": 1.2158663893091851e-05,
+ "loss": 0.192,
+ "step": 16435
+ },
+ {
+ "epoch": 44.78474114441417,
+ "grad_norm": 3.750229835510254,
+ "learning_rate": 1.2157802196705666e-05,
+ "loss": 0.1018,
+ "step": 16436
+ },
+ {
+ "epoch": 44.787465940054496,
+ "grad_norm": 4.52603006362915,
+ "learning_rate": 1.2156940483514585e-05,
+ "loss": 0.1754,
+ "step": 16437
+ },
+ {
+ "epoch": 44.79019073569482,
+ "grad_norm": 4.756311416625977,
+ "learning_rate": 1.2156078753525325e-05,
+ "loss": 0.1699,
+ "step": 16438
+ },
+ {
+ "epoch": 44.79291553133515,
+ "grad_norm": 5.980393886566162,
+ "learning_rate": 1.2155217006744588e-05,
+ "loss": 0.1904,
+ "step": 16439
+ },
+ {
+ "epoch": 44.79564032697548,
+ "grad_norm": 5.323193073272705,
+ "learning_rate": 1.2154355243179092e-05,
+ "loss": 0.2048,
+ "step": 16440
+ },
+ {
+ "epoch": 44.798365122615806,
+ "grad_norm": 4.5851545333862305,
+ "learning_rate": 1.215349346283555e-05,
+ "loss": 0.1346,
+ "step": 16441
+ },
+ {
+ "epoch": 44.80108991825613,
+ "grad_norm": 4.715217113494873,
+ "learning_rate": 1.2152631665720667e-05,
+ "loss": 0.2542,
+ "step": 16442
+ },
+ {
+ "epoch": 44.80381471389646,
+ "grad_norm": 5.653316974639893,
+ "learning_rate": 1.215176985184116e-05,
+ "loss": 0.134,
+ "step": 16443
+ },
+ {
+ "epoch": 44.80653950953678,
+ "grad_norm": 4.876206874847412,
+ "learning_rate": 1.2150908021203736e-05,
+ "loss": 0.3399,
+ "step": 16444
+ },
+ {
+ "epoch": 44.80926430517711,
+ "grad_norm": 5.213658332824707,
+ "learning_rate": 1.215004617381511e-05,
+ "loss": 0.2188,
+ "step": 16445
+ },
+ {
+ "epoch": 44.81198910081744,
+ "grad_norm": 5.333511829376221,
+ "learning_rate": 1.2149184309681995e-05,
+ "loss": 0.2125,
+ "step": 16446
+ },
+ {
+ "epoch": 44.81471389645777,
+ "grad_norm": 4.946162700653076,
+ "learning_rate": 1.21483224288111e-05,
+ "loss": 0.1501,
+ "step": 16447
+ },
+ {
+ "epoch": 44.817438692098094,
+ "grad_norm": 4.635293960571289,
+ "learning_rate": 1.2147460531209141e-05,
+ "loss": 0.137,
+ "step": 16448
+ },
+ {
+ "epoch": 44.82016348773842,
+ "grad_norm": 4.830501079559326,
+ "learning_rate": 1.2146598616882828e-05,
+ "loss": 0.2062,
+ "step": 16449
+ },
+ {
+ "epoch": 44.822888283378745,
+ "grad_norm": 5.653111457824707,
+ "learning_rate": 1.2145736685838876e-05,
+ "loss": 0.1813,
+ "step": 16450
+ },
+ {
+ "epoch": 44.82561307901907,
+ "grad_norm": 5.251279354095459,
+ "learning_rate": 1.2144874738083992e-05,
+ "loss": 0.261,
+ "step": 16451
+ },
+ {
+ "epoch": 44.828337874659404,
+ "grad_norm": 5.2505388259887695,
+ "learning_rate": 1.2144012773624893e-05,
+ "loss": 0.1934,
+ "step": 16452
+ },
+ {
+ "epoch": 44.83106267029973,
+ "grad_norm": 8.280632019042969,
+ "learning_rate": 1.2143150792468292e-05,
+ "loss": 0.1978,
+ "step": 16453
+ },
+ {
+ "epoch": 44.833787465940055,
+ "grad_norm": 5.335907936096191,
+ "learning_rate": 1.2142288794620903e-05,
+ "loss": 0.1751,
+ "step": 16454
+ },
+ {
+ "epoch": 44.83651226158038,
+ "grad_norm": 5.506390571594238,
+ "learning_rate": 1.2141426780089436e-05,
+ "loss": 0.295,
+ "step": 16455
+ },
+ {
+ "epoch": 44.83923705722071,
+ "grad_norm": 5.114776611328125,
+ "learning_rate": 1.2140564748880608e-05,
+ "loss": 0.2163,
+ "step": 16456
+ },
+ {
+ "epoch": 44.84196185286103,
+ "grad_norm": 5.010404586791992,
+ "learning_rate": 1.213970270100113e-05,
+ "loss": 0.305,
+ "step": 16457
+ },
+ {
+ "epoch": 44.844686648501366,
+ "grad_norm": 6.250791549682617,
+ "learning_rate": 1.2138840636457716e-05,
+ "loss": 0.2335,
+ "step": 16458
+ },
+ {
+ "epoch": 44.84741144414169,
+ "grad_norm": 5.389265060424805,
+ "learning_rate": 1.213797855525708e-05,
+ "loss": 0.2307,
+ "step": 16459
+ },
+ {
+ "epoch": 44.85013623978202,
+ "grad_norm": 5.745802402496338,
+ "learning_rate": 1.2137116457405938e-05,
+ "loss": 0.1863,
+ "step": 16460
+ },
+ {
+ "epoch": 44.85286103542234,
+ "grad_norm": 4.540849208831787,
+ "learning_rate": 1.2136254342910997e-05,
+ "loss": 0.2068,
+ "step": 16461
+ },
+ {
+ "epoch": 44.85558583106267,
+ "grad_norm": 6.162951946258545,
+ "learning_rate": 1.2135392211778978e-05,
+ "loss": 0.2772,
+ "step": 16462
+ },
+ {
+ "epoch": 44.858310626702995,
+ "grad_norm": 5.170132160186768,
+ "learning_rate": 1.2134530064016594e-05,
+ "loss": 0.181,
+ "step": 16463
+ },
+ {
+ "epoch": 44.86103542234333,
+ "grad_norm": 4.901643753051758,
+ "learning_rate": 1.213366789963056e-05,
+ "loss": 0.1205,
+ "step": 16464
+ },
+ {
+ "epoch": 44.86376021798365,
+ "grad_norm": 4.8902363777160645,
+ "learning_rate": 1.2132805718627588e-05,
+ "loss": 0.1484,
+ "step": 16465
+ },
+ {
+ "epoch": 44.86648501362398,
+ "grad_norm": 4.043622016906738,
+ "learning_rate": 1.2131943521014393e-05,
+ "loss": 0.099,
+ "step": 16466
+ },
+ {
+ "epoch": 44.869209809264305,
+ "grad_norm": 5.787082672119141,
+ "learning_rate": 1.213108130679769e-05,
+ "loss": 0.1662,
+ "step": 16467
+ },
+ {
+ "epoch": 44.87193460490463,
+ "grad_norm": 8.555408477783203,
+ "learning_rate": 1.2130219075984195e-05,
+ "loss": 0.2985,
+ "step": 16468
+ },
+ {
+ "epoch": 44.87465940054496,
+ "grad_norm": 4.420747756958008,
+ "learning_rate": 1.2129356828580623e-05,
+ "loss": 0.1179,
+ "step": 16469
+ },
+ {
+ "epoch": 44.87738419618529,
+ "grad_norm": 6.063549518585205,
+ "learning_rate": 1.212849456459369e-05,
+ "loss": 0.4112,
+ "step": 16470
+ },
+ {
+ "epoch": 44.880108991825615,
+ "grad_norm": 5.833211898803711,
+ "learning_rate": 1.2127632284030101e-05,
+ "loss": 0.2814,
+ "step": 16471
+ },
+ {
+ "epoch": 44.88283378746594,
+ "grad_norm": 4.399301528930664,
+ "learning_rate": 1.212676998689659e-05,
+ "loss": 0.1431,
+ "step": 16472
+ },
+ {
+ "epoch": 44.88555858310627,
+ "grad_norm": 5.7322821617126465,
+ "learning_rate": 1.212590767319986e-05,
+ "loss": 0.2417,
+ "step": 16473
+ },
+ {
+ "epoch": 44.88828337874659,
+ "grad_norm": 7.326210021972656,
+ "learning_rate": 1.2125045342946628e-05,
+ "loss": 0.1547,
+ "step": 16474
+ },
+ {
+ "epoch": 44.89100817438692,
+ "grad_norm": 4.27852725982666,
+ "learning_rate": 1.2124182996143615e-05,
+ "loss": 0.1268,
+ "step": 16475
+ },
+ {
+ "epoch": 44.89373297002725,
+ "grad_norm": 5.068663597106934,
+ "learning_rate": 1.2123320632797531e-05,
+ "loss": 0.298,
+ "step": 16476
+ },
+ {
+ "epoch": 44.89645776566758,
+ "grad_norm": 5.224200248718262,
+ "learning_rate": 1.2122458252915093e-05,
+ "loss": 0.1547,
+ "step": 16477
+ },
+ {
+ "epoch": 44.8991825613079,
+ "grad_norm": 5.985930919647217,
+ "learning_rate": 1.2121595856503018e-05,
+ "loss": 0.2009,
+ "step": 16478
+ },
+ {
+ "epoch": 44.90190735694823,
+ "grad_norm": 4.921285152435303,
+ "learning_rate": 1.2120733443568023e-05,
+ "loss": 0.1677,
+ "step": 16479
+ },
+ {
+ "epoch": 44.904632152588555,
+ "grad_norm": 4.74705171585083,
+ "learning_rate": 1.2119871014116827e-05,
+ "loss": 0.1077,
+ "step": 16480
+ },
+ {
+ "epoch": 44.90735694822888,
+ "grad_norm": 4.848055839538574,
+ "learning_rate": 1.211900856815614e-05,
+ "loss": 0.1856,
+ "step": 16481
+ },
+ {
+ "epoch": 44.91008174386921,
+ "grad_norm": 4.837916374206543,
+ "learning_rate": 1.2118146105692687e-05,
+ "loss": 0.1507,
+ "step": 16482
+ },
+ {
+ "epoch": 44.91280653950954,
+ "grad_norm": 7.80957555770874,
+ "learning_rate": 1.2117283626733176e-05,
+ "loss": 0.2266,
+ "step": 16483
+ },
+ {
+ "epoch": 44.915531335149865,
+ "grad_norm": 6.339170932769775,
+ "learning_rate": 1.2116421131284332e-05,
+ "loss": 0.2142,
+ "step": 16484
+ },
+ {
+ "epoch": 44.91825613079019,
+ "grad_norm": 5.276419639587402,
+ "learning_rate": 1.2115558619352866e-05,
+ "loss": 0.1582,
+ "step": 16485
+ },
+ {
+ "epoch": 44.920980926430516,
+ "grad_norm": 4.407070159912109,
+ "learning_rate": 1.2114696090945499e-05,
+ "loss": 0.2064,
+ "step": 16486
+ },
+ {
+ "epoch": 44.92370572207084,
+ "grad_norm": 9.91385269165039,
+ "learning_rate": 1.2113833546068945e-05,
+ "loss": 0.2421,
+ "step": 16487
+ },
+ {
+ "epoch": 44.926430517711175,
+ "grad_norm": 13.311921119689941,
+ "learning_rate": 1.2112970984729924e-05,
+ "loss": 0.2019,
+ "step": 16488
+ },
+ {
+ "epoch": 44.9291553133515,
+ "grad_norm": 6.210605144500732,
+ "learning_rate": 1.2112108406935152e-05,
+ "loss": 0.1967,
+ "step": 16489
+ },
+ {
+ "epoch": 44.93188010899183,
+ "grad_norm": 4.3446574211120605,
+ "learning_rate": 1.211124581269135e-05,
+ "loss": 0.3851,
+ "step": 16490
+ },
+ {
+ "epoch": 44.93460490463215,
+ "grad_norm": 4.927207946777344,
+ "learning_rate": 1.2110383202005234e-05,
+ "loss": 0.1999,
+ "step": 16491
+ },
+ {
+ "epoch": 44.93732970027248,
+ "grad_norm": 5.123676776885986,
+ "learning_rate": 1.2109520574883519e-05,
+ "loss": 0.5084,
+ "step": 16492
+ },
+ {
+ "epoch": 44.940054495912804,
+ "grad_norm": 6.560925006866455,
+ "learning_rate": 1.2108657931332928e-05,
+ "loss": 0.2164,
+ "step": 16493
+ },
+ {
+ "epoch": 44.94277929155314,
+ "grad_norm": 5.3994574546813965,
+ "learning_rate": 1.2107795271360177e-05,
+ "loss": 0.2569,
+ "step": 16494
+ },
+ {
+ "epoch": 44.94550408719346,
+ "grad_norm": 5.85552978515625,
+ "learning_rate": 1.210693259497198e-05,
+ "loss": 0.2926,
+ "step": 16495
+ },
+ {
+ "epoch": 44.94822888283379,
+ "grad_norm": 7.393570423126221,
+ "learning_rate": 1.2106069902175061e-05,
+ "loss": 0.211,
+ "step": 16496
+ },
+ {
+ "epoch": 44.950953678474114,
+ "grad_norm": 6.004249572753906,
+ "learning_rate": 1.210520719297614e-05,
+ "loss": 0.1961,
+ "step": 16497
+ },
+ {
+ "epoch": 44.95367847411444,
+ "grad_norm": 4.975900173187256,
+ "learning_rate": 1.2104344467381934e-05,
+ "loss": 0.1602,
+ "step": 16498
+ },
+ {
+ "epoch": 44.956403269754766,
+ "grad_norm": 5.147679328918457,
+ "learning_rate": 1.2103481725399158e-05,
+ "loss": 0.1848,
+ "step": 16499
+ },
+ {
+ "epoch": 44.95912806539509,
+ "grad_norm": 5.091027736663818,
+ "learning_rate": 1.2102618967034537e-05,
+ "loss": 0.2364,
+ "step": 16500
+ },
+ {
+ "epoch": 44.961852861035425,
+ "grad_norm": 3.759225845336914,
+ "learning_rate": 1.2101756192294785e-05,
+ "loss": 0.2279,
+ "step": 16501
+ },
+ {
+ "epoch": 44.96457765667575,
+ "grad_norm": 5.046459197998047,
+ "learning_rate": 1.2100893401186624e-05,
+ "loss": 0.2177,
+ "step": 16502
+ },
+ {
+ "epoch": 44.967302452316076,
+ "grad_norm": 4.500819206237793,
+ "learning_rate": 1.2100030593716772e-05,
+ "loss": 0.1707,
+ "step": 16503
+ },
+ {
+ "epoch": 44.9700272479564,
+ "grad_norm": 9.605218887329102,
+ "learning_rate": 1.2099167769891952e-05,
+ "loss": 0.2307,
+ "step": 16504
+ },
+ {
+ "epoch": 44.97275204359673,
+ "grad_norm": 28.277524948120117,
+ "learning_rate": 1.2098304929718875e-05,
+ "loss": 0.257,
+ "step": 16505
+ },
+ {
+ "epoch": 44.97547683923706,
+ "grad_norm": 5.641982555389404,
+ "learning_rate": 1.2097442073204272e-05,
+ "loss": 0.1846,
+ "step": 16506
+ },
+ {
+ "epoch": 44.97820163487739,
+ "grad_norm": 5.367890357971191,
+ "learning_rate": 1.2096579200354857e-05,
+ "loss": 0.2236,
+ "step": 16507
+ },
+ {
+ "epoch": 44.98092643051771,
+ "grad_norm": 3.9556329250335693,
+ "learning_rate": 1.209571631117735e-05,
+ "loss": 0.2136,
+ "step": 16508
+ },
+ {
+ "epoch": 44.98365122615804,
+ "grad_norm": 4.4472150802612305,
+ "learning_rate": 1.2094853405678471e-05,
+ "loss": 0.1678,
+ "step": 16509
+ },
+ {
+ "epoch": 44.986376021798364,
+ "grad_norm": 6.31549596786499,
+ "learning_rate": 1.2093990483864944e-05,
+ "loss": 0.1811,
+ "step": 16510
+ },
+ {
+ "epoch": 44.98910081743869,
+ "grad_norm": 6.078292369842529,
+ "learning_rate": 1.2093127545743482e-05,
+ "loss": 0.177,
+ "step": 16511
+ },
+ {
+ "epoch": 44.991825613079016,
+ "grad_norm": 5.6930928230285645,
+ "learning_rate": 1.2092264591320815e-05,
+ "loss": 0.2932,
+ "step": 16512
+ },
+ {
+ "epoch": 44.99455040871935,
+ "grad_norm": 4.938112258911133,
+ "learning_rate": 1.2091401620603656e-05,
+ "loss": 0.1919,
+ "step": 16513
+ },
+ {
+ "epoch": 44.997275204359674,
+ "grad_norm": 6.328670024871826,
+ "learning_rate": 1.2090538633598728e-05,
+ "loss": 0.3275,
+ "step": 16514
+ },
+ {
+ "epoch": 45.0,
+ "grad_norm": 6.109992980957031,
+ "learning_rate": 1.2089675630312755e-05,
+ "loss": 0.1832,
+ "step": 16515
+ },
+ {
+ "epoch": 45.002724795640326,
+ "grad_norm": 5.512378692626953,
+ "learning_rate": 1.2088812610752449e-05,
+ "loss": 0.179,
+ "step": 16516
+ },
+ {
+ "epoch": 45.00544959128065,
+ "grad_norm": 5.3177971839904785,
+ "learning_rate": 1.2087949574924542e-05,
+ "loss": 0.155,
+ "step": 16517
+ },
+ {
+ "epoch": 45.00817438692098,
+ "grad_norm": 4.777791500091553,
+ "learning_rate": 1.2087086522835754e-05,
+ "loss": 0.2024,
+ "step": 16518
+ },
+ {
+ "epoch": 45.01089918256131,
+ "grad_norm": 4.446604251861572,
+ "learning_rate": 1.2086223454492798e-05,
+ "loss": 0.1863,
+ "step": 16519
+ },
+ {
+ "epoch": 45.013623978201636,
+ "grad_norm": 4.505539894104004,
+ "learning_rate": 1.2085360369902405e-05,
+ "loss": 0.2233,
+ "step": 16520
+ },
+ {
+ "epoch": 45.01634877384196,
+ "grad_norm": 6.669691562652588,
+ "learning_rate": 1.208449726907129e-05,
+ "loss": 0.2606,
+ "step": 16521
+ },
+ {
+ "epoch": 45.01907356948229,
+ "grad_norm": 5.373653411865234,
+ "learning_rate": 1.2083634152006178e-05,
+ "loss": 0.3221,
+ "step": 16522
+ },
+ {
+ "epoch": 45.02179836512261,
+ "grad_norm": 5.863643169403076,
+ "learning_rate": 1.208277101871379e-05,
+ "loss": 0.2959,
+ "step": 16523
+ },
+ {
+ "epoch": 45.02452316076294,
+ "grad_norm": 5.832777976989746,
+ "learning_rate": 1.208190786920085e-05,
+ "loss": 0.3932,
+ "step": 16524
+ },
+ {
+ "epoch": 45.02724795640327,
+ "grad_norm": 5.73431396484375,
+ "learning_rate": 1.2081044703474079e-05,
+ "loss": 0.2045,
+ "step": 16525
+ },
+ {
+ "epoch": 45.0299727520436,
+ "grad_norm": 4.735246658325195,
+ "learning_rate": 1.2080181521540195e-05,
+ "loss": 0.3188,
+ "step": 16526
+ },
+ {
+ "epoch": 45.032697547683924,
+ "grad_norm": 6.507968902587891,
+ "learning_rate": 1.2079318323405926e-05,
+ "loss": 0.1391,
+ "step": 16527
+ },
+ {
+ "epoch": 45.03542234332425,
+ "grad_norm": 6.053386211395264,
+ "learning_rate": 1.2078455109077994e-05,
+ "loss": 0.2635,
+ "step": 16528
+ },
+ {
+ "epoch": 45.038147138964575,
+ "grad_norm": 6.033876895904541,
+ "learning_rate": 1.207759187856312e-05,
+ "loss": 0.1196,
+ "step": 16529
+ },
+ {
+ "epoch": 45.0408719346049,
+ "grad_norm": 4.177990913391113,
+ "learning_rate": 1.2076728631868026e-05,
+ "loss": 0.1621,
+ "step": 16530
+ },
+ {
+ "epoch": 45.043596730245234,
+ "grad_norm": 7.85495138168335,
+ "learning_rate": 1.2075865368999437e-05,
+ "loss": 0.1633,
+ "step": 16531
+ },
+ {
+ "epoch": 45.04632152588556,
+ "grad_norm": 4.977965831756592,
+ "learning_rate": 1.2075002089964077e-05,
+ "loss": 0.2815,
+ "step": 16532
+ },
+ {
+ "epoch": 45.049046321525886,
+ "grad_norm": 5.360485076904297,
+ "learning_rate": 1.2074138794768666e-05,
+ "loss": 0.1459,
+ "step": 16533
+ },
+ {
+ "epoch": 45.05177111716621,
+ "grad_norm": 4.5159831047058105,
+ "learning_rate": 1.2073275483419928e-05,
+ "loss": 0.2168,
+ "step": 16534
+ },
+ {
+ "epoch": 45.05449591280654,
+ "grad_norm": 8.731205940246582,
+ "learning_rate": 1.2072412155924589e-05,
+ "loss": 0.2906,
+ "step": 16535
+ },
+ {
+ "epoch": 45.05722070844686,
+ "grad_norm": 4.30543851852417,
+ "learning_rate": 1.207154881228937e-05,
+ "loss": 0.1112,
+ "step": 16536
+ },
+ {
+ "epoch": 45.059945504087196,
+ "grad_norm": 5.078404426574707,
+ "learning_rate": 1.2070685452520996e-05,
+ "loss": 0.2499,
+ "step": 16537
+ },
+ {
+ "epoch": 45.06267029972752,
+ "grad_norm": 4.377470016479492,
+ "learning_rate": 1.206982207662619e-05,
+ "loss": 0.1048,
+ "step": 16538
+ },
+ {
+ "epoch": 45.06539509536785,
+ "grad_norm": 5.7056803703308105,
+ "learning_rate": 1.2068958684611675e-05,
+ "loss": 0.2832,
+ "step": 16539
+ },
+ {
+ "epoch": 45.06811989100817,
+ "grad_norm": 5.156067848205566,
+ "learning_rate": 1.2068095276484177e-05,
+ "loss": 0.1302,
+ "step": 16540
+ },
+ {
+ "epoch": 45.0708446866485,
+ "grad_norm": 7.141348361968994,
+ "learning_rate": 1.2067231852250421e-05,
+ "loss": 0.2455,
+ "step": 16541
+ },
+ {
+ "epoch": 45.073569482288825,
+ "grad_norm": 3.8205201625823975,
+ "learning_rate": 1.206636841191713e-05,
+ "loss": 0.1014,
+ "step": 16542
+ },
+ {
+ "epoch": 45.07629427792916,
+ "grad_norm": 4.64540958404541,
+ "learning_rate": 1.2065504955491028e-05,
+ "loss": 0.1048,
+ "step": 16543
+ },
+ {
+ "epoch": 45.079019073569484,
+ "grad_norm": 5.926222324371338,
+ "learning_rate": 1.2064641482978835e-05,
+ "loss": 0.2379,
+ "step": 16544
+ },
+ {
+ "epoch": 45.08174386920981,
+ "grad_norm": 5.158275604248047,
+ "learning_rate": 1.206377799438729e-05,
+ "loss": 0.2085,
+ "step": 16545
+ },
+ {
+ "epoch": 45.084468664850135,
+ "grad_norm": 15.585972785949707,
+ "learning_rate": 1.20629144897231e-05,
+ "loss": 0.2434,
+ "step": 16546
+ },
+ {
+ "epoch": 45.08719346049046,
+ "grad_norm": 5.83115291595459,
+ "learning_rate": 1.2062050968993002e-05,
+ "loss": 0.1738,
+ "step": 16547
+ },
+ {
+ "epoch": 45.08991825613079,
+ "grad_norm": 7.6292033195495605,
+ "learning_rate": 1.2061187432203716e-05,
+ "loss": 0.2433,
+ "step": 16548
+ },
+ {
+ "epoch": 45.09264305177112,
+ "grad_norm": 8.051736831665039,
+ "learning_rate": 1.206032387936197e-05,
+ "loss": 0.1835,
+ "step": 16549
+ },
+ {
+ "epoch": 45.095367847411445,
+ "grad_norm": 7.657648086547852,
+ "learning_rate": 1.2059460310474486e-05,
+ "loss": 0.1468,
+ "step": 16550
+ },
+ {
+ "epoch": 45.09809264305177,
+ "grad_norm": 7.185408115386963,
+ "learning_rate": 1.2058596725547993e-05,
+ "loss": 0.2395,
+ "step": 16551
+ },
+ {
+ "epoch": 45.1008174386921,
+ "grad_norm": 5.118465900421143,
+ "learning_rate": 1.2057733124589216e-05,
+ "loss": 0.1516,
+ "step": 16552
+ },
+ {
+ "epoch": 45.10354223433242,
+ "grad_norm": 5.896913528442383,
+ "learning_rate": 1.2056869507604878e-05,
+ "loss": 0.2349,
+ "step": 16553
+ },
+ {
+ "epoch": 45.10626702997275,
+ "grad_norm": 7.021651744842529,
+ "learning_rate": 1.2056005874601706e-05,
+ "loss": 0.1852,
+ "step": 16554
+ },
+ {
+ "epoch": 45.10899182561308,
+ "grad_norm": 7.547937393188477,
+ "learning_rate": 1.205514222558643e-05,
+ "loss": 0.1539,
+ "step": 16555
+ },
+ {
+ "epoch": 45.11171662125341,
+ "grad_norm": 5.6526384353637695,
+ "learning_rate": 1.2054278560565768e-05,
+ "loss": 0.1286,
+ "step": 16556
+ },
+ {
+ "epoch": 45.11444141689373,
+ "grad_norm": 4.357674598693848,
+ "learning_rate": 1.2053414879546453e-05,
+ "loss": 0.1671,
+ "step": 16557
+ },
+ {
+ "epoch": 45.11716621253406,
+ "grad_norm": 6.144803047180176,
+ "learning_rate": 1.2052551182535205e-05,
+ "loss": 0.2076,
+ "step": 16558
+ },
+ {
+ "epoch": 45.119891008174385,
+ "grad_norm": 4.0647664070129395,
+ "learning_rate": 1.2051687469538762e-05,
+ "loss": 0.1586,
+ "step": 16559
+ },
+ {
+ "epoch": 45.12261580381471,
+ "grad_norm": 5.348049163818359,
+ "learning_rate": 1.2050823740563838e-05,
+ "loss": 0.2232,
+ "step": 16560
+ },
+ {
+ "epoch": 45.12534059945504,
+ "grad_norm": 4.529613494873047,
+ "learning_rate": 1.2049959995617166e-05,
+ "loss": 0.1346,
+ "step": 16561
+ },
+ {
+ "epoch": 45.12806539509537,
+ "grad_norm": 7.2587151527404785,
+ "learning_rate": 1.2049096234705471e-05,
+ "loss": 0.2626,
+ "step": 16562
+ },
+ {
+ "epoch": 45.130790190735695,
+ "grad_norm": 5.042852401733398,
+ "learning_rate": 1.2048232457835482e-05,
+ "loss": 0.2629,
+ "step": 16563
+ },
+ {
+ "epoch": 45.13351498637602,
+ "grad_norm": 4.998375415802002,
+ "learning_rate": 1.204736866501392e-05,
+ "loss": 0.2243,
+ "step": 16564
+ },
+ {
+ "epoch": 45.13623978201635,
+ "grad_norm": 6.485538959503174,
+ "learning_rate": 1.204650485624752e-05,
+ "loss": 0.2776,
+ "step": 16565
+ },
+ {
+ "epoch": 45.13896457765667,
+ "grad_norm": 4.741646766662598,
+ "learning_rate": 1.2045641031543008e-05,
+ "loss": 0.0986,
+ "step": 16566
+ },
+ {
+ "epoch": 45.141689373297005,
+ "grad_norm": 6.637621879577637,
+ "learning_rate": 1.2044777190907107e-05,
+ "loss": 0.1705,
+ "step": 16567
+ },
+ {
+ "epoch": 45.14441416893733,
+ "grad_norm": 4.802213668823242,
+ "learning_rate": 1.2043913334346546e-05,
+ "loss": 0.1882,
+ "step": 16568
+ },
+ {
+ "epoch": 45.14713896457766,
+ "grad_norm": 6.388574123382568,
+ "learning_rate": 1.2043049461868057e-05,
+ "loss": 0.3225,
+ "step": 16569
+ },
+ {
+ "epoch": 45.14986376021798,
+ "grad_norm": 4.970810413360596,
+ "learning_rate": 1.2042185573478362e-05,
+ "loss": 0.1427,
+ "step": 16570
+ },
+ {
+ "epoch": 45.15258855585831,
+ "grad_norm": 8.400190353393555,
+ "learning_rate": 1.2041321669184194e-05,
+ "loss": 0.4492,
+ "step": 16571
+ },
+ {
+ "epoch": 45.155313351498634,
+ "grad_norm": 5.225356101989746,
+ "learning_rate": 1.2040457748992275e-05,
+ "loss": 0.1226,
+ "step": 16572
+ },
+ {
+ "epoch": 45.15803814713897,
+ "grad_norm": 4.736957550048828,
+ "learning_rate": 1.203959381290934e-05,
+ "loss": 0.2009,
+ "step": 16573
+ },
+ {
+ "epoch": 45.16076294277929,
+ "grad_norm": 4.66796875,
+ "learning_rate": 1.203872986094211e-05,
+ "loss": 0.1301,
+ "step": 16574
+ },
+ {
+ "epoch": 45.16348773841962,
+ "grad_norm": 6.437362194061279,
+ "learning_rate": 1.2037865893097323e-05,
+ "loss": 0.2308,
+ "step": 16575
+ },
+ {
+ "epoch": 45.166212534059945,
+ "grad_norm": 4.844325065612793,
+ "learning_rate": 1.2037001909381699e-05,
+ "loss": 0.1716,
+ "step": 16576
+ },
+ {
+ "epoch": 45.16893732970027,
+ "grad_norm": 5.221934795379639,
+ "learning_rate": 1.203613790980197e-05,
+ "loss": 0.1791,
+ "step": 16577
+ },
+ {
+ "epoch": 45.171662125340596,
+ "grad_norm": 4.624213695526123,
+ "learning_rate": 1.2035273894364863e-05,
+ "loss": 0.1102,
+ "step": 16578
+ },
+ {
+ "epoch": 45.17438692098093,
+ "grad_norm": 4.950865268707275,
+ "learning_rate": 1.203440986307711e-05,
+ "loss": 0.1157,
+ "step": 16579
+ },
+ {
+ "epoch": 45.177111716621255,
+ "grad_norm": 5.598708629608154,
+ "learning_rate": 1.2033545815945438e-05,
+ "loss": 0.2494,
+ "step": 16580
+ },
+ {
+ "epoch": 45.17983651226158,
+ "grad_norm": 4.302317142486572,
+ "learning_rate": 1.2032681752976578e-05,
+ "loss": 0.0961,
+ "step": 16581
+ },
+ {
+ "epoch": 45.182561307901906,
+ "grad_norm": 4.7786946296691895,
+ "learning_rate": 1.2031817674177255e-05,
+ "loss": 0.1896,
+ "step": 16582
+ },
+ {
+ "epoch": 45.18528610354223,
+ "grad_norm": 4.99862003326416,
+ "learning_rate": 1.2030953579554203e-05,
+ "loss": 0.1549,
+ "step": 16583
+ },
+ {
+ "epoch": 45.18801089918256,
+ "grad_norm": 5.704895973205566,
+ "learning_rate": 1.203008946911415e-05,
+ "loss": 0.2137,
+ "step": 16584
+ },
+ {
+ "epoch": 45.19073569482289,
+ "grad_norm": 4.31999397277832,
+ "learning_rate": 1.2029225342863826e-05,
+ "loss": 0.1605,
+ "step": 16585
+ },
+ {
+ "epoch": 45.19346049046322,
+ "grad_norm": 3.9720940589904785,
+ "learning_rate": 1.202836120080996e-05,
+ "loss": 0.1321,
+ "step": 16586
+ },
+ {
+ "epoch": 45.19618528610354,
+ "grad_norm": 5.717876434326172,
+ "learning_rate": 1.2027497042959281e-05,
+ "loss": 0.1545,
+ "step": 16587
+ },
+ {
+ "epoch": 45.19891008174387,
+ "grad_norm": 7.608456134796143,
+ "learning_rate": 1.2026632869318522e-05,
+ "loss": 0.1343,
+ "step": 16588
+ },
+ {
+ "epoch": 45.201634877384194,
+ "grad_norm": 5.579301357269287,
+ "learning_rate": 1.2025768679894412e-05,
+ "loss": 0.2828,
+ "step": 16589
+ },
+ {
+ "epoch": 45.20435967302452,
+ "grad_norm": 4.252120494842529,
+ "learning_rate": 1.2024904474693679e-05,
+ "loss": 0.1783,
+ "step": 16590
+ },
+ {
+ "epoch": 45.20708446866485,
+ "grad_norm": 6.057271480560303,
+ "learning_rate": 1.2024040253723054e-05,
+ "loss": 0.2513,
+ "step": 16591
+ },
+ {
+ "epoch": 45.20980926430518,
+ "grad_norm": 4.746553421020508,
+ "learning_rate": 1.2023176016989272e-05,
+ "loss": 0.1571,
+ "step": 16592
+ },
+ {
+ "epoch": 45.212534059945504,
+ "grad_norm": 5.150763511657715,
+ "learning_rate": 1.2022311764499057e-05,
+ "loss": 0.1441,
+ "step": 16593
+ },
+ {
+ "epoch": 45.21525885558583,
+ "grad_norm": 4.989012241363525,
+ "learning_rate": 1.2021447496259145e-05,
+ "loss": 0.1555,
+ "step": 16594
+ },
+ {
+ "epoch": 45.217983651226156,
+ "grad_norm": 5.327992916107178,
+ "learning_rate": 1.2020583212276267e-05,
+ "loss": 0.171,
+ "step": 16595
+ },
+ {
+ "epoch": 45.22070844686648,
+ "grad_norm": 7.940482139587402,
+ "learning_rate": 1.2019718912557148e-05,
+ "loss": 0.1578,
+ "step": 16596
+ },
+ {
+ "epoch": 45.223433242506815,
+ "grad_norm": 5.864681243896484,
+ "learning_rate": 1.2018854597108524e-05,
+ "loss": 0.2566,
+ "step": 16597
+ },
+ {
+ "epoch": 45.22615803814714,
+ "grad_norm": 6.923911094665527,
+ "learning_rate": 1.2017990265937127e-05,
+ "loss": 0.3066,
+ "step": 16598
+ },
+ {
+ "epoch": 45.228882833787466,
+ "grad_norm": 6.041567802429199,
+ "learning_rate": 1.2017125919049688e-05,
+ "loss": 0.1343,
+ "step": 16599
+ },
+ {
+ "epoch": 45.23160762942779,
+ "grad_norm": 6.406617164611816,
+ "learning_rate": 1.2016261556452933e-05,
+ "loss": 0.2468,
+ "step": 16600
+ },
+ {
+ "epoch": 45.23433242506812,
+ "grad_norm": 5.396008014678955,
+ "learning_rate": 1.2015397178153601e-05,
+ "loss": 0.3443,
+ "step": 16601
+ },
+ {
+ "epoch": 45.237057220708444,
+ "grad_norm": 5.214319705963135,
+ "learning_rate": 1.2014532784158419e-05,
+ "loss": 0.1919,
+ "step": 16602
+ },
+ {
+ "epoch": 45.23978201634878,
+ "grad_norm": 5.351510047912598,
+ "learning_rate": 1.201366837447412e-05,
+ "loss": 0.2486,
+ "step": 16603
+ },
+ {
+ "epoch": 45.2425068119891,
+ "grad_norm": 4.136556148529053,
+ "learning_rate": 1.2012803949107437e-05,
+ "loss": 0.1294,
+ "step": 16604
+ },
+ {
+ "epoch": 45.24523160762943,
+ "grad_norm": 7.471392631530762,
+ "learning_rate": 1.2011939508065105e-05,
+ "loss": 0.1367,
+ "step": 16605
+ },
+ {
+ "epoch": 45.247956403269754,
+ "grad_norm": 5.440866947174072,
+ "learning_rate": 1.2011075051353848e-05,
+ "loss": 0.16,
+ "step": 16606
+ },
+ {
+ "epoch": 45.25068119891008,
+ "grad_norm": 4.633749008178711,
+ "learning_rate": 1.2010210578980407e-05,
+ "loss": 0.2055,
+ "step": 16607
+ },
+ {
+ "epoch": 45.253405994550405,
+ "grad_norm": 7.459175109863281,
+ "learning_rate": 1.2009346090951507e-05,
+ "loss": 0.2332,
+ "step": 16608
+ },
+ {
+ "epoch": 45.25613079019074,
+ "grad_norm": 9.547760009765625,
+ "learning_rate": 1.2008481587273889e-05,
+ "loss": 0.1956,
+ "step": 16609
+ },
+ {
+ "epoch": 45.258855585831064,
+ "grad_norm": 4.923254013061523,
+ "learning_rate": 1.2007617067954279e-05,
+ "loss": 0.1647,
+ "step": 16610
+ },
+ {
+ "epoch": 45.26158038147139,
+ "grad_norm": 5.788157939910889,
+ "learning_rate": 1.2006752532999408e-05,
+ "loss": 0.1401,
+ "step": 16611
+ },
+ {
+ "epoch": 45.264305177111716,
+ "grad_norm": 10.717264175415039,
+ "learning_rate": 1.2005887982416018e-05,
+ "loss": 0.2287,
+ "step": 16612
+ },
+ {
+ "epoch": 45.26702997275204,
+ "grad_norm": 5.1473612785339355,
+ "learning_rate": 1.2005023416210835e-05,
+ "loss": 0.2368,
+ "step": 16613
+ },
+ {
+ "epoch": 45.26975476839237,
+ "grad_norm": 6.619595050811768,
+ "learning_rate": 1.2004158834390594e-05,
+ "loss": 0.1329,
+ "step": 16614
+ },
+ {
+ "epoch": 45.2724795640327,
+ "grad_norm": 3.5936288833618164,
+ "learning_rate": 1.2003294236962028e-05,
+ "loss": 0.3637,
+ "step": 16615
+ },
+ {
+ "epoch": 45.275204359673026,
+ "grad_norm": 4.85862398147583,
+ "learning_rate": 1.2002429623931874e-05,
+ "loss": 0.2879,
+ "step": 16616
+ },
+ {
+ "epoch": 45.27792915531335,
+ "grad_norm": 4.307836532592773,
+ "learning_rate": 1.2001564995306858e-05,
+ "loss": 0.1005,
+ "step": 16617
+ },
+ {
+ "epoch": 45.28065395095368,
+ "grad_norm": 5.3064727783203125,
+ "learning_rate": 1.2000700351093722e-05,
+ "loss": 0.303,
+ "step": 16618
+ },
+ {
+ "epoch": 45.283378746594,
+ "grad_norm": 4.527190208435059,
+ "learning_rate": 1.1999835691299193e-05,
+ "loss": 0.2161,
+ "step": 16619
+ },
+ {
+ "epoch": 45.28610354223433,
+ "grad_norm": 5.368263244628906,
+ "learning_rate": 1.1998971015930012e-05,
+ "loss": 0.135,
+ "step": 16620
+ },
+ {
+ "epoch": 45.28882833787466,
+ "grad_norm": 4.358409404754639,
+ "learning_rate": 1.1998106324992906e-05,
+ "loss": 0.2364,
+ "step": 16621
+ },
+ {
+ "epoch": 45.29155313351499,
+ "grad_norm": 4.781009674072266,
+ "learning_rate": 1.1997241618494613e-05,
+ "loss": 0.1104,
+ "step": 16622
+ },
+ {
+ "epoch": 45.294277929155314,
+ "grad_norm": 5.457147121429443,
+ "learning_rate": 1.1996376896441867e-05,
+ "loss": 0.0939,
+ "step": 16623
+ },
+ {
+ "epoch": 45.29700272479564,
+ "grad_norm": 5.586886405944824,
+ "learning_rate": 1.1995512158841402e-05,
+ "loss": 0.2515,
+ "step": 16624
+ },
+ {
+ "epoch": 45.299727520435965,
+ "grad_norm": 5.703341007232666,
+ "learning_rate": 1.1994647405699951e-05,
+ "loss": 0.2366,
+ "step": 16625
+ },
+ {
+ "epoch": 45.30245231607629,
+ "grad_norm": 5.6486921310424805,
+ "learning_rate": 1.1993782637024251e-05,
+ "loss": 0.2428,
+ "step": 16626
+ },
+ {
+ "epoch": 45.305177111716624,
+ "grad_norm": 5.216177940368652,
+ "learning_rate": 1.1992917852821035e-05,
+ "loss": 0.1912,
+ "step": 16627
+ },
+ {
+ "epoch": 45.30790190735695,
+ "grad_norm": 6.801618576049805,
+ "learning_rate": 1.1992053053097041e-05,
+ "loss": 0.1223,
+ "step": 16628
+ },
+ {
+ "epoch": 45.310626702997276,
+ "grad_norm": 6.861721038818359,
+ "learning_rate": 1.1991188237859e-05,
+ "loss": 0.3119,
+ "step": 16629
+ },
+ {
+ "epoch": 45.3133514986376,
+ "grad_norm": 6.232369899749756,
+ "learning_rate": 1.199032340711365e-05,
+ "loss": 0.2049,
+ "step": 16630
+ },
+ {
+ "epoch": 45.31607629427793,
+ "grad_norm": 5.272371768951416,
+ "learning_rate": 1.1989458560867726e-05,
+ "loss": 0.1973,
+ "step": 16631
+ },
+ {
+ "epoch": 45.31880108991825,
+ "grad_norm": 5.843293190002441,
+ "learning_rate": 1.1988593699127964e-05,
+ "loss": 0.1102,
+ "step": 16632
+ },
+ {
+ "epoch": 45.321525885558586,
+ "grad_norm": 4.8091535568237305,
+ "learning_rate": 1.1987728821901094e-05,
+ "loss": 0.1321,
+ "step": 16633
+ },
+ {
+ "epoch": 45.32425068119891,
+ "grad_norm": 5.556960105895996,
+ "learning_rate": 1.198686392919386e-05,
+ "loss": 0.2355,
+ "step": 16634
+ },
+ {
+ "epoch": 45.32697547683924,
+ "grad_norm": 4.6954426765441895,
+ "learning_rate": 1.198599902101299e-05,
+ "loss": 0.2318,
+ "step": 16635
+ },
+ {
+ "epoch": 45.32970027247956,
+ "grad_norm": 11.321298599243164,
+ "learning_rate": 1.1985134097365227e-05,
+ "loss": 0.2587,
+ "step": 16636
+ },
+ {
+ "epoch": 45.33242506811989,
+ "grad_norm": 7.810074806213379,
+ "learning_rate": 1.1984269158257303e-05,
+ "loss": 0.1495,
+ "step": 16637
+ },
+ {
+ "epoch": 45.335149863760215,
+ "grad_norm": 5.643194198608398,
+ "learning_rate": 1.1983404203695954e-05,
+ "loss": 0.2431,
+ "step": 16638
+ },
+ {
+ "epoch": 45.33787465940055,
+ "grad_norm": 4.987616539001465,
+ "learning_rate": 1.1982539233687916e-05,
+ "loss": 0.1606,
+ "step": 16639
+ },
+ {
+ "epoch": 45.34059945504087,
+ "grad_norm": 6.060144424438477,
+ "learning_rate": 1.1981674248239927e-05,
+ "loss": 0.2073,
+ "step": 16640
+ },
+ {
+ "epoch": 45.3433242506812,
+ "grad_norm": 11.028332710266113,
+ "learning_rate": 1.1980809247358722e-05,
+ "loss": 0.181,
+ "step": 16641
+ },
+ {
+ "epoch": 45.346049046321525,
+ "grad_norm": 4.551525115966797,
+ "learning_rate": 1.197994423105104e-05,
+ "loss": 0.3275,
+ "step": 16642
+ },
+ {
+ "epoch": 45.34877384196185,
+ "grad_norm": 4.677279949188232,
+ "learning_rate": 1.1979079199323613e-05,
+ "loss": 0.1158,
+ "step": 16643
+ },
+ {
+ "epoch": 45.35149863760218,
+ "grad_norm": 15.127598762512207,
+ "learning_rate": 1.1978214152183186e-05,
+ "loss": 0.1336,
+ "step": 16644
+ },
+ {
+ "epoch": 45.35422343324251,
+ "grad_norm": 5.0481648445129395,
+ "learning_rate": 1.1977349089636484e-05,
+ "loss": 0.2007,
+ "step": 16645
+ },
+ {
+ "epoch": 45.356948228882835,
+ "grad_norm": 8.24364185333252,
+ "learning_rate": 1.1976484011690257e-05,
+ "loss": 0.2051,
+ "step": 16646
+ },
+ {
+ "epoch": 45.35967302452316,
+ "grad_norm": 4.717498779296875,
+ "learning_rate": 1.1975618918351234e-05,
+ "loss": 0.1411,
+ "step": 16647
+ },
+ {
+ "epoch": 45.36239782016349,
+ "grad_norm": 9.359580039978027,
+ "learning_rate": 1.1974753809626157e-05,
+ "loss": 0.2377,
+ "step": 16648
+ },
+ {
+ "epoch": 45.36512261580381,
+ "grad_norm": 3.6303634643554688,
+ "learning_rate": 1.1973888685521755e-05,
+ "loss": 0.1616,
+ "step": 16649
+ },
+ {
+ "epoch": 45.36784741144414,
+ "grad_norm": 6.411387920379639,
+ "learning_rate": 1.1973023546044777e-05,
+ "loss": 0.1923,
+ "step": 16650
+ },
+ {
+ "epoch": 45.37057220708447,
+ "grad_norm": 5.722949504852295,
+ "learning_rate": 1.1972158391201949e-05,
+ "loss": 0.119,
+ "step": 16651
+ },
+ {
+ "epoch": 45.3732970027248,
+ "grad_norm": 5.816916465759277,
+ "learning_rate": 1.197129322100002e-05,
+ "loss": 0.2458,
+ "step": 16652
+ },
+ {
+ "epoch": 45.37602179836512,
+ "grad_norm": 6.132981777191162,
+ "learning_rate": 1.197042803544572e-05,
+ "loss": 0.195,
+ "step": 16653
+ },
+ {
+ "epoch": 45.37874659400545,
+ "grad_norm": 6.963262557983398,
+ "learning_rate": 1.1969562834545794e-05,
+ "loss": 0.3227,
+ "step": 16654
+ },
+ {
+ "epoch": 45.381471389645775,
+ "grad_norm": 5.772555351257324,
+ "learning_rate": 1.1968697618306973e-05,
+ "loss": 0.223,
+ "step": 16655
+ },
+ {
+ "epoch": 45.3841961852861,
+ "grad_norm": 4.3310546875,
+ "learning_rate": 1.1967832386736001e-05,
+ "loss": 0.2026,
+ "step": 16656
+ },
+ {
+ "epoch": 45.38692098092643,
+ "grad_norm": 4.356783866882324,
+ "learning_rate": 1.1966967139839609e-05,
+ "loss": 0.3471,
+ "step": 16657
+ },
+ {
+ "epoch": 45.38964577656676,
+ "grad_norm": 5.222243785858154,
+ "learning_rate": 1.1966101877624545e-05,
+ "loss": 0.136,
+ "step": 16658
+ },
+ {
+ "epoch": 45.392370572207085,
+ "grad_norm": 30.365690231323242,
+ "learning_rate": 1.1965236600097541e-05,
+ "loss": 0.3697,
+ "step": 16659
+ },
+ {
+ "epoch": 45.39509536784741,
+ "grad_norm": 7.362423419952393,
+ "learning_rate": 1.1964371307265334e-05,
+ "loss": 0.3103,
+ "step": 16660
+ },
+ {
+ "epoch": 45.39782016348774,
+ "grad_norm": 41.33028793334961,
+ "learning_rate": 1.196350599913467e-05,
+ "loss": 0.3573,
+ "step": 16661
+ },
+ {
+ "epoch": 45.40054495912806,
+ "grad_norm": 5.660735607147217,
+ "learning_rate": 1.1962640675712284e-05,
+ "loss": 0.1426,
+ "step": 16662
+ },
+ {
+ "epoch": 45.403269754768395,
+ "grad_norm": 5.834871292114258,
+ "learning_rate": 1.1961775337004916e-05,
+ "loss": 0.2839,
+ "step": 16663
+ },
+ {
+ "epoch": 45.40599455040872,
+ "grad_norm": 6.210115909576416,
+ "learning_rate": 1.1960909983019307e-05,
+ "loss": 0.141,
+ "step": 16664
+ },
+ {
+ "epoch": 45.40871934604905,
+ "grad_norm": 5.948051452636719,
+ "learning_rate": 1.1960044613762189e-05,
+ "loss": 0.1444,
+ "step": 16665
+ },
+ {
+ "epoch": 45.41144414168937,
+ "grad_norm": 5.73265266418457,
+ "learning_rate": 1.1959179229240312e-05,
+ "loss": 0.1241,
+ "step": 16666
+ },
+ {
+ "epoch": 45.4141689373297,
+ "grad_norm": 5.090624809265137,
+ "learning_rate": 1.1958313829460406e-05,
+ "loss": 0.1477,
+ "step": 16667
+ },
+ {
+ "epoch": 45.416893732970024,
+ "grad_norm": 6.242894649505615,
+ "learning_rate": 1.1957448414429218e-05,
+ "loss": 0.1256,
+ "step": 16668
+ },
+ {
+ "epoch": 45.41961852861036,
+ "grad_norm": 13.589362144470215,
+ "learning_rate": 1.1956582984153479e-05,
+ "loss": 0.1658,
+ "step": 16669
+ },
+ {
+ "epoch": 45.42234332425068,
+ "grad_norm": 5.8010406494140625,
+ "learning_rate": 1.1955717538639941e-05,
+ "loss": 0.2329,
+ "step": 16670
+ },
+ {
+ "epoch": 45.42506811989101,
+ "grad_norm": 5.109614372253418,
+ "learning_rate": 1.1954852077895335e-05,
+ "loss": 0.1757,
+ "step": 16671
+ },
+ {
+ "epoch": 45.427792915531334,
+ "grad_norm": 4.750753879547119,
+ "learning_rate": 1.1953986601926406e-05,
+ "loss": 0.155,
+ "step": 16672
+ },
+ {
+ "epoch": 45.43051771117166,
+ "grad_norm": 8.827396392822266,
+ "learning_rate": 1.195312111073989e-05,
+ "loss": 0.197,
+ "step": 16673
+ },
+ {
+ "epoch": 45.433242506811986,
+ "grad_norm": 6.231132507324219,
+ "learning_rate": 1.195225560434253e-05,
+ "loss": 0.1877,
+ "step": 16674
+ },
+ {
+ "epoch": 45.43596730245232,
+ "grad_norm": 6.299057483673096,
+ "learning_rate": 1.1951390082741068e-05,
+ "loss": 0.2544,
+ "step": 16675
+ },
+ {
+ "epoch": 45.438692098092645,
+ "grad_norm": 5.301882743835449,
+ "learning_rate": 1.1950524545942241e-05,
+ "loss": 0.2188,
+ "step": 16676
+ },
+ {
+ "epoch": 45.44141689373297,
+ "grad_norm": 5.3790106773376465,
+ "learning_rate": 1.1949658993952793e-05,
+ "loss": 0.1404,
+ "step": 16677
+ },
+ {
+ "epoch": 45.444141689373296,
+ "grad_norm": 8.645112991333008,
+ "learning_rate": 1.1948793426779462e-05,
+ "loss": 0.2259,
+ "step": 16678
+ },
+ {
+ "epoch": 45.44686648501362,
+ "grad_norm": 8.512444496154785,
+ "learning_rate": 1.194792784442899e-05,
+ "loss": 0.1794,
+ "step": 16679
+ },
+ {
+ "epoch": 45.44959128065395,
+ "grad_norm": 5.109349250793457,
+ "learning_rate": 1.1947062246908121e-05,
+ "loss": 0.1572,
+ "step": 16680
+ },
+ {
+ "epoch": 45.45231607629428,
+ "grad_norm": 5.574517250061035,
+ "learning_rate": 1.1946196634223592e-05,
+ "loss": 0.1516,
+ "step": 16681
+ },
+ {
+ "epoch": 45.45504087193461,
+ "grad_norm": 8.244447708129883,
+ "learning_rate": 1.1945331006382148e-05,
+ "loss": 0.1866,
+ "step": 16682
+ },
+ {
+ "epoch": 45.45776566757493,
+ "grad_norm": 6.59032678604126,
+ "learning_rate": 1.1944465363390527e-05,
+ "loss": 0.1877,
+ "step": 16683
+ },
+ {
+ "epoch": 45.46049046321526,
+ "grad_norm": 6.2295050621032715,
+ "learning_rate": 1.1943599705255476e-05,
+ "loss": 0.176,
+ "step": 16684
+ },
+ {
+ "epoch": 45.463215258855584,
+ "grad_norm": 26.40064239501953,
+ "learning_rate": 1.1942734031983727e-05,
+ "loss": 0.3238,
+ "step": 16685
+ },
+ {
+ "epoch": 45.46594005449591,
+ "grad_norm": 6.458420276641846,
+ "learning_rate": 1.1941868343582031e-05,
+ "loss": 0.2262,
+ "step": 16686
+ },
+ {
+ "epoch": 45.46866485013624,
+ "grad_norm": 5.881272315979004,
+ "learning_rate": 1.1941002640057126e-05,
+ "loss": 0.1857,
+ "step": 16687
+ },
+ {
+ "epoch": 45.47138964577657,
+ "grad_norm": 9.554805755615234,
+ "learning_rate": 1.1940136921415757e-05,
+ "loss": 0.2529,
+ "step": 16688
+ },
+ {
+ "epoch": 45.474114441416894,
+ "grad_norm": 6.610429286956787,
+ "learning_rate": 1.1939271187664664e-05,
+ "loss": 0.1741,
+ "step": 16689
+ },
+ {
+ "epoch": 45.47683923705722,
+ "grad_norm": 6.144949436187744,
+ "learning_rate": 1.1938405438810588e-05,
+ "loss": 0.1192,
+ "step": 16690
+ },
+ {
+ "epoch": 45.479564032697546,
+ "grad_norm": 6.75967264175415,
+ "learning_rate": 1.193753967486027e-05,
+ "loss": 0.2601,
+ "step": 16691
+ },
+ {
+ "epoch": 45.48228882833787,
+ "grad_norm": 7.9903717041015625,
+ "learning_rate": 1.1936673895820461e-05,
+ "loss": 0.2191,
+ "step": 16692
+ },
+ {
+ "epoch": 45.485013623978205,
+ "grad_norm": 6.284823894500732,
+ "learning_rate": 1.1935808101697895e-05,
+ "loss": 0.1932,
+ "step": 16693
+ },
+ {
+ "epoch": 45.48773841961853,
+ "grad_norm": 6.077003479003906,
+ "learning_rate": 1.1934942292499316e-05,
+ "loss": 0.1526,
+ "step": 16694
+ },
+ {
+ "epoch": 45.490463215258856,
+ "grad_norm": 6.023370742797852,
+ "learning_rate": 1.1934076468231472e-05,
+ "loss": 0.2062,
+ "step": 16695
+ },
+ {
+ "epoch": 45.49318801089918,
+ "grad_norm": 6.809840202331543,
+ "learning_rate": 1.1933210628901101e-05,
+ "loss": 0.2429,
+ "step": 16696
+ },
+ {
+ "epoch": 45.49591280653951,
+ "grad_norm": 9.45288372039795,
+ "learning_rate": 1.193234477451495e-05,
+ "loss": 0.1293,
+ "step": 16697
+ },
+ {
+ "epoch": 45.49863760217983,
+ "grad_norm": 5.4122395515441895,
+ "learning_rate": 1.1931478905079758e-05,
+ "loss": 0.1945,
+ "step": 16698
+ },
+ {
+ "epoch": 45.50136239782017,
+ "grad_norm": 4.952850818634033,
+ "learning_rate": 1.1930613020602273e-05,
+ "loss": 0.1848,
+ "step": 16699
+ },
+ {
+ "epoch": 45.50408719346049,
+ "grad_norm": 8.232172012329102,
+ "learning_rate": 1.1929747121089232e-05,
+ "loss": 0.2203,
+ "step": 16700
+ },
+ {
+ "epoch": 45.50681198910082,
+ "grad_norm": 5.5052900314331055,
+ "learning_rate": 1.1928881206547385e-05,
+ "loss": 0.1445,
+ "step": 16701
+ },
+ {
+ "epoch": 45.509536784741144,
+ "grad_norm": 6.1682820320129395,
+ "learning_rate": 1.1928015276983473e-05,
+ "loss": 0.1938,
+ "step": 16702
+ },
+ {
+ "epoch": 45.51226158038147,
+ "grad_norm": 6.207098007202148,
+ "learning_rate": 1.192714933240424e-05,
+ "loss": 0.2524,
+ "step": 16703
+ },
+ {
+ "epoch": 45.514986376021795,
+ "grad_norm": 4.526002407073975,
+ "learning_rate": 1.192628337281643e-05,
+ "loss": 0.1458,
+ "step": 16704
+ },
+ {
+ "epoch": 45.51771117166213,
+ "grad_norm": 9.20603084564209,
+ "learning_rate": 1.1925417398226786e-05,
+ "loss": 0.3266,
+ "step": 16705
+ },
+ {
+ "epoch": 45.520435967302454,
+ "grad_norm": 4.8588337898254395,
+ "learning_rate": 1.1924551408642054e-05,
+ "loss": 0.1795,
+ "step": 16706
+ },
+ {
+ "epoch": 45.52316076294278,
+ "grad_norm": 11.087041854858398,
+ "learning_rate": 1.1923685404068978e-05,
+ "loss": 0.0995,
+ "step": 16707
+ },
+ {
+ "epoch": 45.525885558583106,
+ "grad_norm": 7.632423400878906,
+ "learning_rate": 1.1922819384514302e-05,
+ "loss": 0.1736,
+ "step": 16708
+ },
+ {
+ "epoch": 45.52861035422343,
+ "grad_norm": 4.280725002288818,
+ "learning_rate": 1.1921953349984771e-05,
+ "loss": 0.2495,
+ "step": 16709
+ },
+ {
+ "epoch": 45.53133514986376,
+ "grad_norm": 4.482978343963623,
+ "learning_rate": 1.1921087300487128e-05,
+ "loss": 0.1411,
+ "step": 16710
+ },
+ {
+ "epoch": 45.53405994550409,
+ "grad_norm": 5.198719024658203,
+ "learning_rate": 1.1920221236028122e-05,
+ "loss": 0.2058,
+ "step": 16711
+ },
+ {
+ "epoch": 45.536784741144416,
+ "grad_norm": 6.219206809997559,
+ "learning_rate": 1.1919355156614488e-05,
+ "loss": 0.2802,
+ "step": 16712
+ },
+ {
+ "epoch": 45.53950953678474,
+ "grad_norm": 8.376551628112793,
+ "learning_rate": 1.1918489062252982e-05,
+ "loss": 0.3149,
+ "step": 16713
+ },
+ {
+ "epoch": 45.54223433242507,
+ "grad_norm": 5.516513824462891,
+ "learning_rate": 1.1917622952950346e-05,
+ "loss": 0.1148,
+ "step": 16714
+ },
+ {
+ "epoch": 45.54495912806539,
+ "grad_norm": 5.855601787567139,
+ "learning_rate": 1.1916756828713326e-05,
+ "loss": 0.1591,
+ "step": 16715
+ },
+ {
+ "epoch": 45.54768392370572,
+ "grad_norm": 6.673274517059326,
+ "learning_rate": 1.191589068954866e-05,
+ "loss": 0.225,
+ "step": 16716
+ },
+ {
+ "epoch": 45.55040871934605,
+ "grad_norm": 5.49294376373291,
+ "learning_rate": 1.1915024535463102e-05,
+ "loss": 0.1777,
+ "step": 16717
+ },
+ {
+ "epoch": 45.55313351498638,
+ "grad_norm": 5.714776515960693,
+ "learning_rate": 1.1914158366463392e-05,
+ "loss": 0.1862,
+ "step": 16718
+ },
+ {
+ "epoch": 45.555858310626704,
+ "grad_norm": 7.998096942901611,
+ "learning_rate": 1.1913292182556284e-05,
+ "loss": 0.1626,
+ "step": 16719
+ },
+ {
+ "epoch": 45.55858310626703,
+ "grad_norm": 4.941965103149414,
+ "learning_rate": 1.191242598374851e-05,
+ "loss": 0.2365,
+ "step": 16720
+ },
+ {
+ "epoch": 45.561307901907355,
+ "grad_norm": 11.13440227508545,
+ "learning_rate": 1.191155977004683e-05,
+ "loss": 0.2244,
+ "step": 16721
+ },
+ {
+ "epoch": 45.56403269754768,
+ "grad_norm": 5.3765034675598145,
+ "learning_rate": 1.1910693541457983e-05,
+ "loss": 0.1614,
+ "step": 16722
+ },
+ {
+ "epoch": 45.566757493188014,
+ "grad_norm": 4.9884467124938965,
+ "learning_rate": 1.1909827297988716e-05,
+ "loss": 0.1526,
+ "step": 16723
+ },
+ {
+ "epoch": 45.56948228882834,
+ "grad_norm": 5.218952655792236,
+ "learning_rate": 1.1908961039645774e-05,
+ "loss": 0.283,
+ "step": 16724
+ },
+ {
+ "epoch": 45.572207084468666,
+ "grad_norm": 5.10790491104126,
+ "learning_rate": 1.1908094766435906e-05,
+ "loss": 0.2459,
+ "step": 16725
+ },
+ {
+ "epoch": 45.57493188010899,
+ "grad_norm": 7.868581295013428,
+ "learning_rate": 1.190722847836586e-05,
+ "loss": 0.286,
+ "step": 16726
+ },
+ {
+ "epoch": 45.57765667574932,
+ "grad_norm": 7.350738525390625,
+ "learning_rate": 1.1906362175442376e-05,
+ "loss": 0.2108,
+ "step": 16727
+ },
+ {
+ "epoch": 45.58038147138964,
+ "grad_norm": 6.340230464935303,
+ "learning_rate": 1.1905495857672207e-05,
+ "loss": 0.1519,
+ "step": 16728
+ },
+ {
+ "epoch": 45.583106267029976,
+ "grad_norm": 5.222556114196777,
+ "learning_rate": 1.1904629525062094e-05,
+ "loss": 0.1501,
+ "step": 16729
+ },
+ {
+ "epoch": 45.5858310626703,
+ "grad_norm": 6.270688056945801,
+ "learning_rate": 1.190376317761879e-05,
+ "loss": 0.3152,
+ "step": 16730
+ },
+ {
+ "epoch": 45.58855585831063,
+ "grad_norm": 5.900198459625244,
+ "learning_rate": 1.1902896815349041e-05,
+ "loss": 0.31,
+ "step": 16731
+ },
+ {
+ "epoch": 45.59128065395095,
+ "grad_norm": 6.09793758392334,
+ "learning_rate": 1.1902030438259593e-05,
+ "loss": 0.3577,
+ "step": 16732
+ },
+ {
+ "epoch": 45.59400544959128,
+ "grad_norm": 6.048053741455078,
+ "learning_rate": 1.1901164046357192e-05,
+ "loss": 0.2992,
+ "step": 16733
+ },
+ {
+ "epoch": 45.596730245231605,
+ "grad_norm": 4.888824939727783,
+ "learning_rate": 1.1900297639648586e-05,
+ "loss": 0.231,
+ "step": 16734
+ },
+ {
+ "epoch": 45.59945504087194,
+ "grad_norm": 6.400858402252197,
+ "learning_rate": 1.1899431218140525e-05,
+ "loss": 0.1601,
+ "step": 16735
+ },
+ {
+ "epoch": 45.60217983651226,
+ "grad_norm": 8.345768928527832,
+ "learning_rate": 1.1898564781839752e-05,
+ "loss": 0.2145,
+ "step": 16736
+ },
+ {
+ "epoch": 45.60490463215259,
+ "grad_norm": 5.117101669311523,
+ "learning_rate": 1.1897698330753017e-05,
+ "loss": 0.2896,
+ "step": 16737
+ },
+ {
+ "epoch": 45.607629427792915,
+ "grad_norm": 5.829264163970947,
+ "learning_rate": 1.1896831864887071e-05,
+ "loss": 0.1202,
+ "step": 16738
+ },
+ {
+ "epoch": 45.61035422343324,
+ "grad_norm": 5.072994709014893,
+ "learning_rate": 1.189596538424866e-05,
+ "loss": 0.135,
+ "step": 16739
+ },
+ {
+ "epoch": 45.61307901907357,
+ "grad_norm": 5.669522762298584,
+ "learning_rate": 1.189509888884453e-05,
+ "loss": 0.2648,
+ "step": 16740
+ },
+ {
+ "epoch": 45.6158038147139,
+ "grad_norm": 6.418872356414795,
+ "learning_rate": 1.1894232378681432e-05,
+ "loss": 0.1324,
+ "step": 16741
+ },
+ {
+ "epoch": 45.618528610354225,
+ "grad_norm": 5.721817493438721,
+ "learning_rate": 1.1893365853766112e-05,
+ "loss": 0.1504,
+ "step": 16742
+ },
+ {
+ "epoch": 45.62125340599455,
+ "grad_norm": 4.870094299316406,
+ "learning_rate": 1.1892499314105322e-05,
+ "loss": 0.1526,
+ "step": 16743
+ },
+ {
+ "epoch": 45.62397820163488,
+ "grad_norm": 4.316743850708008,
+ "learning_rate": 1.1891632759705806e-05,
+ "loss": 0.2196,
+ "step": 16744
+ },
+ {
+ "epoch": 45.6267029972752,
+ "grad_norm": 5.4886698722839355,
+ "learning_rate": 1.1890766190574317e-05,
+ "loss": 0.2826,
+ "step": 16745
+ },
+ {
+ "epoch": 45.62942779291553,
+ "grad_norm": 5.585188388824463,
+ "learning_rate": 1.1889899606717596e-05,
+ "loss": 0.24,
+ "step": 16746
+ },
+ {
+ "epoch": 45.63215258855586,
+ "grad_norm": 5.05691385269165,
+ "learning_rate": 1.1889033008142405e-05,
+ "loss": 0.1792,
+ "step": 16747
+ },
+ {
+ "epoch": 45.63487738419619,
+ "grad_norm": 4.477142810821533,
+ "learning_rate": 1.188816639485548e-05,
+ "loss": 0.1701,
+ "step": 16748
+ },
+ {
+ "epoch": 45.63760217983651,
+ "grad_norm": 5.6869215965271,
+ "learning_rate": 1.188729976686358e-05,
+ "loss": 0.3177,
+ "step": 16749
+ },
+ {
+ "epoch": 45.64032697547684,
+ "grad_norm": 4.94856595993042,
+ "learning_rate": 1.1886433124173448e-05,
+ "loss": 0.1924,
+ "step": 16750
+ },
+ {
+ "epoch": 45.643051771117165,
+ "grad_norm": 6.606828689575195,
+ "learning_rate": 1.1885566466791838e-05,
+ "loss": 0.1509,
+ "step": 16751
+ },
+ {
+ "epoch": 45.64577656675749,
+ "grad_norm": 6.61343240737915,
+ "learning_rate": 1.1884699794725494e-05,
+ "loss": 0.2013,
+ "step": 16752
+ },
+ {
+ "epoch": 45.64850136239782,
+ "grad_norm": 5.412893772125244,
+ "learning_rate": 1.1883833107981173e-05,
+ "loss": 0.1584,
+ "step": 16753
+ },
+ {
+ "epoch": 45.65122615803815,
+ "grad_norm": 6.0776047706604,
+ "learning_rate": 1.1882966406565615e-05,
+ "loss": 0.2973,
+ "step": 16754
+ },
+ {
+ "epoch": 45.653950953678475,
+ "grad_norm": 6.073796272277832,
+ "learning_rate": 1.1882099690485578e-05,
+ "loss": 0.1985,
+ "step": 16755
+ },
+ {
+ "epoch": 45.6566757493188,
+ "grad_norm": 20.35211944580078,
+ "learning_rate": 1.1881232959747808e-05,
+ "loss": 0.1966,
+ "step": 16756
+ },
+ {
+ "epoch": 45.65940054495913,
+ "grad_norm": 5.905616760253906,
+ "learning_rate": 1.1880366214359058e-05,
+ "loss": 0.1485,
+ "step": 16757
+ },
+ {
+ "epoch": 45.66212534059945,
+ "grad_norm": 4.573220252990723,
+ "learning_rate": 1.1879499454326075e-05,
+ "loss": 0.0844,
+ "step": 16758
+ },
+ {
+ "epoch": 45.664850136239785,
+ "grad_norm": 5.227389812469482,
+ "learning_rate": 1.1878632679655613e-05,
+ "loss": 0.1249,
+ "step": 16759
+ },
+ {
+ "epoch": 45.66757493188011,
+ "grad_norm": 4.984939098358154,
+ "learning_rate": 1.1877765890354416e-05,
+ "loss": 0.0953,
+ "step": 16760
+ },
+ {
+ "epoch": 45.67029972752044,
+ "grad_norm": 6.445440769195557,
+ "learning_rate": 1.1876899086429243e-05,
+ "loss": 0.2402,
+ "step": 16761
+ },
+ {
+ "epoch": 45.67302452316076,
+ "grad_norm": 6.42676305770874,
+ "learning_rate": 1.1876032267886836e-05,
+ "loss": 0.21,
+ "step": 16762
+ },
+ {
+ "epoch": 45.67574931880109,
+ "grad_norm": 4.938652515411377,
+ "learning_rate": 1.1875165434733953e-05,
+ "loss": 0.2568,
+ "step": 16763
+ },
+ {
+ "epoch": 45.678474114441414,
+ "grad_norm": 5.695641994476318,
+ "learning_rate": 1.1874298586977343e-05,
+ "loss": 0.2105,
+ "step": 16764
+ },
+ {
+ "epoch": 45.68119891008175,
+ "grad_norm": 20.347829818725586,
+ "learning_rate": 1.1873431724623754e-05,
+ "loss": 0.2006,
+ "step": 16765
+ },
+ {
+ "epoch": 45.68392370572207,
+ "grad_norm": 4.463924407958984,
+ "learning_rate": 1.1872564847679937e-05,
+ "loss": 0.122,
+ "step": 16766
+ },
+ {
+ "epoch": 45.6866485013624,
+ "grad_norm": 5.034438133239746,
+ "learning_rate": 1.187169795615265e-05,
+ "loss": 0.3651,
+ "step": 16767
+ },
+ {
+ "epoch": 45.689373297002724,
+ "grad_norm": 6.706033229827881,
+ "learning_rate": 1.1870831050048637e-05,
+ "loss": 0.1983,
+ "step": 16768
+ },
+ {
+ "epoch": 45.69209809264305,
+ "grad_norm": 5.6929826736450195,
+ "learning_rate": 1.1869964129374653e-05,
+ "loss": 0.1591,
+ "step": 16769
+ },
+ {
+ "epoch": 45.694822888283376,
+ "grad_norm": 27.811521530151367,
+ "learning_rate": 1.1869097194137447e-05,
+ "loss": 0.1832,
+ "step": 16770
+ },
+ {
+ "epoch": 45.69754768392371,
+ "grad_norm": 4.503742218017578,
+ "learning_rate": 1.1868230244343772e-05,
+ "loss": 0.1942,
+ "step": 16771
+ },
+ {
+ "epoch": 45.700272479564035,
+ "grad_norm": 4.524623870849609,
+ "learning_rate": 1.1867363280000381e-05,
+ "loss": 0.1455,
+ "step": 16772
+ },
+ {
+ "epoch": 45.70299727520436,
+ "grad_norm": 10.254136085510254,
+ "learning_rate": 1.1866496301114024e-05,
+ "loss": 0.224,
+ "step": 16773
+ },
+ {
+ "epoch": 45.705722070844686,
+ "grad_norm": 5.565359115600586,
+ "learning_rate": 1.1865629307691457e-05,
+ "loss": 0.1702,
+ "step": 16774
+ },
+ {
+ "epoch": 45.70844686648501,
+ "grad_norm": 5.79984712600708,
+ "learning_rate": 1.1864762299739425e-05,
+ "loss": 0.195,
+ "step": 16775
+ },
+ {
+ "epoch": 45.71117166212534,
+ "grad_norm": 11.521369934082031,
+ "learning_rate": 1.1863895277264685e-05,
+ "loss": 0.2612,
+ "step": 16776
+ },
+ {
+ "epoch": 45.71389645776567,
+ "grad_norm": 4.3823676109313965,
+ "learning_rate": 1.186302824027399e-05,
+ "loss": 0.277,
+ "step": 16777
+ },
+ {
+ "epoch": 45.716621253406,
+ "grad_norm": 5.321345806121826,
+ "learning_rate": 1.186216118877409e-05,
+ "loss": 0.2387,
+ "step": 16778
+ },
+ {
+ "epoch": 45.71934604904632,
+ "grad_norm": 4.756073474884033,
+ "learning_rate": 1.186129412277174e-05,
+ "loss": 0.181,
+ "step": 16779
+ },
+ {
+ "epoch": 45.72207084468665,
+ "grad_norm": 5.8166399002075195,
+ "learning_rate": 1.186042704227369e-05,
+ "loss": 0.197,
+ "step": 16780
+ },
+ {
+ "epoch": 45.724795640326974,
+ "grad_norm": 6.273514270782471,
+ "learning_rate": 1.1859559947286695e-05,
+ "loss": 0.2122,
+ "step": 16781
+ },
+ {
+ "epoch": 45.7275204359673,
+ "grad_norm": 9.926748275756836,
+ "learning_rate": 1.1858692837817507e-05,
+ "loss": 0.2679,
+ "step": 16782
+ },
+ {
+ "epoch": 45.73024523160763,
+ "grad_norm": 5.106124401092529,
+ "learning_rate": 1.1857825713872877e-05,
+ "loss": 0.2026,
+ "step": 16783
+ },
+ {
+ "epoch": 45.73297002724796,
+ "grad_norm": 7.10134744644165,
+ "learning_rate": 1.1856958575459563e-05,
+ "loss": 0.2331,
+ "step": 16784
+ },
+ {
+ "epoch": 45.735694822888284,
+ "grad_norm": 5.939577102661133,
+ "learning_rate": 1.1856091422584312e-05,
+ "loss": 0.2202,
+ "step": 16785
+ },
+ {
+ "epoch": 45.73841961852861,
+ "grad_norm": 9.432857513427734,
+ "learning_rate": 1.1855224255253885e-05,
+ "loss": 0.1826,
+ "step": 16786
+ },
+ {
+ "epoch": 45.741144414168936,
+ "grad_norm": 5.389590263366699,
+ "learning_rate": 1.185435707347503e-05,
+ "loss": 0.1651,
+ "step": 16787
+ },
+ {
+ "epoch": 45.74386920980926,
+ "grad_norm": 5.081847190856934,
+ "learning_rate": 1.1853489877254498e-05,
+ "loss": 0.1582,
+ "step": 16788
+ },
+ {
+ "epoch": 45.746594005449595,
+ "grad_norm": 6.348358631134033,
+ "learning_rate": 1.1852622666599047e-05,
+ "loss": 0.2016,
+ "step": 16789
+ },
+ {
+ "epoch": 45.74931880108992,
+ "grad_norm": 5.817598342895508,
+ "learning_rate": 1.1851755441515435e-05,
+ "loss": 0.2261,
+ "step": 16790
+ },
+ {
+ "epoch": 45.752043596730246,
+ "grad_norm": 5.8689165115356445,
+ "learning_rate": 1.1850888202010408e-05,
+ "loss": 0.1593,
+ "step": 16791
+ },
+ {
+ "epoch": 45.75476839237057,
+ "grad_norm": 4.214691638946533,
+ "learning_rate": 1.1850020948090725e-05,
+ "loss": 0.1659,
+ "step": 16792
+ },
+ {
+ "epoch": 45.7574931880109,
+ "grad_norm": 5.222210884094238,
+ "learning_rate": 1.1849153679763137e-05,
+ "loss": 0.1364,
+ "step": 16793
+ },
+ {
+ "epoch": 45.76021798365122,
+ "grad_norm": 5.477433204650879,
+ "learning_rate": 1.1848286397034402e-05,
+ "loss": 0.1772,
+ "step": 16794
+ },
+ {
+ "epoch": 45.762942779291556,
+ "grad_norm": 5.0489020347595215,
+ "learning_rate": 1.1847419099911268e-05,
+ "loss": 0.2861,
+ "step": 16795
+ },
+ {
+ "epoch": 45.76566757493188,
+ "grad_norm": 8.0861234664917,
+ "learning_rate": 1.1846551788400497e-05,
+ "loss": 0.2905,
+ "step": 16796
+ },
+ {
+ "epoch": 45.76839237057221,
+ "grad_norm": 6.275272369384766,
+ "learning_rate": 1.1845684462508838e-05,
+ "loss": 0.2019,
+ "step": 16797
+ },
+ {
+ "epoch": 45.771117166212534,
+ "grad_norm": 9.220664978027344,
+ "learning_rate": 1.1844817122243047e-05,
+ "loss": 0.1202,
+ "step": 16798
+ },
+ {
+ "epoch": 45.77384196185286,
+ "grad_norm": 6.362813472747803,
+ "learning_rate": 1.1843949767609879e-05,
+ "loss": 0.2262,
+ "step": 16799
+ },
+ {
+ "epoch": 45.776566757493185,
+ "grad_norm": 5.926329135894775,
+ "learning_rate": 1.1843082398616095e-05,
+ "loss": 0.3897,
+ "step": 16800
+ },
+ {
+ "epoch": 45.77929155313352,
+ "grad_norm": 6.0297698974609375,
+ "learning_rate": 1.1842215015268439e-05,
+ "loss": 0.1284,
+ "step": 16801
+ },
+ {
+ "epoch": 45.782016348773844,
+ "grad_norm": 5.359635353088379,
+ "learning_rate": 1.1841347617573675e-05,
+ "loss": 0.1297,
+ "step": 16802
+ },
+ {
+ "epoch": 45.78474114441417,
+ "grad_norm": 5.568722724914551,
+ "learning_rate": 1.1840480205538553e-05,
+ "loss": 0.2027,
+ "step": 16803
+ },
+ {
+ "epoch": 45.787465940054496,
+ "grad_norm": 8.326163291931152,
+ "learning_rate": 1.1839612779169833e-05,
+ "loss": 0.1984,
+ "step": 16804
+ },
+ {
+ "epoch": 45.79019073569482,
+ "grad_norm": 5.921015739440918,
+ "learning_rate": 1.1838745338474266e-05,
+ "loss": 0.4049,
+ "step": 16805
+ },
+ {
+ "epoch": 45.79291553133515,
+ "grad_norm": 12.31640338897705,
+ "learning_rate": 1.183787788345861e-05,
+ "loss": 0.1637,
+ "step": 16806
+ },
+ {
+ "epoch": 45.79564032697548,
+ "grad_norm": 5.65764045715332,
+ "learning_rate": 1.1837010414129617e-05,
+ "loss": 0.2375,
+ "step": 16807
+ },
+ {
+ "epoch": 45.798365122615806,
+ "grad_norm": 4.975269794464111,
+ "learning_rate": 1.1836142930494053e-05,
+ "loss": 0.1195,
+ "step": 16808
+ },
+ {
+ "epoch": 45.80108991825613,
+ "grad_norm": 5.65529727935791,
+ "learning_rate": 1.1835275432558659e-05,
+ "loss": 0.1931,
+ "step": 16809
+ },
+ {
+ "epoch": 45.80381471389646,
+ "grad_norm": 8.044857025146484,
+ "learning_rate": 1.1834407920330207e-05,
+ "loss": 0.2065,
+ "step": 16810
+ },
+ {
+ "epoch": 45.80653950953678,
+ "grad_norm": 5.580800533294678,
+ "learning_rate": 1.1833540393815438e-05,
+ "loss": 0.3629,
+ "step": 16811
+ },
+ {
+ "epoch": 45.80926430517711,
+ "grad_norm": 4.198930263519287,
+ "learning_rate": 1.183267285302112e-05,
+ "loss": 0.258,
+ "step": 16812
+ },
+ {
+ "epoch": 45.81198910081744,
+ "grad_norm": 7.045481204986572,
+ "learning_rate": 1.1831805297954001e-05,
+ "loss": 0.1241,
+ "step": 16813
+ },
+ {
+ "epoch": 45.81471389645777,
+ "grad_norm": 6.636136054992676,
+ "learning_rate": 1.1830937728620847e-05,
+ "loss": 0.2276,
+ "step": 16814
+ },
+ {
+ "epoch": 45.817438692098094,
+ "grad_norm": 5.757200241088867,
+ "learning_rate": 1.1830070145028404e-05,
+ "loss": 0.1356,
+ "step": 16815
+ },
+ {
+ "epoch": 45.82016348773842,
+ "grad_norm": 5.463143348693848,
+ "learning_rate": 1.1829202547183434e-05,
+ "loss": 0.1717,
+ "step": 16816
+ },
+ {
+ "epoch": 45.822888283378745,
+ "grad_norm": 5.030807971954346,
+ "learning_rate": 1.1828334935092694e-05,
+ "loss": 0.1357,
+ "step": 16817
+ },
+ {
+ "epoch": 45.82561307901907,
+ "grad_norm": 9.538846969604492,
+ "learning_rate": 1.1827467308762943e-05,
+ "loss": 0.1935,
+ "step": 16818
+ },
+ {
+ "epoch": 45.828337874659404,
+ "grad_norm": 5.1914963722229,
+ "learning_rate": 1.1826599668200931e-05,
+ "loss": 0.2146,
+ "step": 16819
+ },
+ {
+ "epoch": 45.83106267029973,
+ "grad_norm": 6.6925458908081055,
+ "learning_rate": 1.1825732013413424e-05,
+ "loss": 0.286,
+ "step": 16820
+ },
+ {
+ "epoch": 45.833787465940055,
+ "grad_norm": 4.862399101257324,
+ "learning_rate": 1.1824864344407172e-05,
+ "loss": 0.117,
+ "step": 16821
+ },
+ {
+ "epoch": 45.83651226158038,
+ "grad_norm": 5.300833225250244,
+ "learning_rate": 1.1823996661188936e-05,
+ "loss": 0.2113,
+ "step": 16822
+ },
+ {
+ "epoch": 45.83923705722071,
+ "grad_norm": 5.468568801879883,
+ "learning_rate": 1.1823128963765472e-05,
+ "loss": 0.1965,
+ "step": 16823
+ },
+ {
+ "epoch": 45.84196185286103,
+ "grad_norm": 7.542404651641846,
+ "learning_rate": 1.1822261252143538e-05,
+ "loss": 0.1763,
+ "step": 16824
+ },
+ {
+ "epoch": 45.844686648501366,
+ "grad_norm": 5.1153459548950195,
+ "learning_rate": 1.1821393526329894e-05,
+ "loss": 0.1416,
+ "step": 16825
+ },
+ {
+ "epoch": 45.84741144414169,
+ "grad_norm": 7.301416397094727,
+ "learning_rate": 1.1820525786331296e-05,
+ "loss": 0.128,
+ "step": 16826
+ },
+ {
+ "epoch": 45.85013623978202,
+ "grad_norm": 4.820608615875244,
+ "learning_rate": 1.18196580321545e-05,
+ "loss": 0.1388,
+ "step": 16827
+ },
+ {
+ "epoch": 45.85286103542234,
+ "grad_norm": 5.057580947875977,
+ "learning_rate": 1.1818790263806265e-05,
+ "loss": 0.1096,
+ "step": 16828
+ },
+ {
+ "epoch": 45.85558583106267,
+ "grad_norm": 5.905057907104492,
+ "learning_rate": 1.1817922481293351e-05,
+ "loss": 0.1954,
+ "step": 16829
+ },
+ {
+ "epoch": 45.858310626702995,
+ "grad_norm": 6.665063381195068,
+ "learning_rate": 1.1817054684622518e-05,
+ "loss": 0.2183,
+ "step": 16830
+ },
+ {
+ "epoch": 45.86103542234333,
+ "grad_norm": 5.462371349334717,
+ "learning_rate": 1.1816186873800519e-05,
+ "loss": 0.2193,
+ "step": 16831
+ },
+ {
+ "epoch": 45.86376021798365,
+ "grad_norm": 6.108532905578613,
+ "learning_rate": 1.1815319048834113e-05,
+ "loss": 0.3233,
+ "step": 16832
+ },
+ {
+ "epoch": 45.86648501362398,
+ "grad_norm": 4.892570495605469,
+ "learning_rate": 1.1814451209730062e-05,
+ "loss": 0.1703,
+ "step": 16833
+ },
+ {
+ "epoch": 45.869209809264305,
+ "grad_norm": 4.645022869110107,
+ "learning_rate": 1.1813583356495126e-05,
+ "loss": 0.1634,
+ "step": 16834
+ },
+ {
+ "epoch": 45.87193460490463,
+ "grad_norm": 5.6142578125,
+ "learning_rate": 1.1812715489136059e-05,
+ "loss": 0.1651,
+ "step": 16835
+ },
+ {
+ "epoch": 45.87465940054496,
+ "grad_norm": 4.635265350341797,
+ "learning_rate": 1.1811847607659623e-05,
+ "loss": 0.292,
+ "step": 16836
+ },
+ {
+ "epoch": 45.87738419618529,
+ "grad_norm": 5.443964004516602,
+ "learning_rate": 1.1810979712072577e-05,
+ "loss": 0.3624,
+ "step": 16837
+ },
+ {
+ "epoch": 45.880108991825615,
+ "grad_norm": 6.793909072875977,
+ "learning_rate": 1.1810111802381679e-05,
+ "loss": 0.2163,
+ "step": 16838
+ },
+ {
+ "epoch": 45.88283378746594,
+ "grad_norm": 4.849037170410156,
+ "learning_rate": 1.1809243878593686e-05,
+ "loss": 0.2381,
+ "step": 16839
+ },
+ {
+ "epoch": 45.88555858310627,
+ "grad_norm": 5.565073013305664,
+ "learning_rate": 1.1808375940715362e-05,
+ "loss": 0.1832,
+ "step": 16840
+ },
+ {
+ "epoch": 45.88828337874659,
+ "grad_norm": 6.433823108673096,
+ "learning_rate": 1.1807507988753461e-05,
+ "loss": 0.133,
+ "step": 16841
+ },
+ {
+ "epoch": 45.89100817438692,
+ "grad_norm": 5.564578533172607,
+ "learning_rate": 1.180664002271475e-05,
+ "loss": 0.1701,
+ "step": 16842
+ },
+ {
+ "epoch": 45.89373297002725,
+ "grad_norm": 5.624913215637207,
+ "learning_rate": 1.1805772042605982e-05,
+ "loss": 0.1648,
+ "step": 16843
+ },
+ {
+ "epoch": 45.89645776566758,
+ "grad_norm": 5.615039348602295,
+ "learning_rate": 1.1804904048433925e-05,
+ "loss": 0.1364,
+ "step": 16844
+ },
+ {
+ "epoch": 45.8991825613079,
+ "grad_norm": 4.709343910217285,
+ "learning_rate": 1.1804036040205326e-05,
+ "loss": 0.1999,
+ "step": 16845
+ },
+ {
+ "epoch": 45.90190735694823,
+ "grad_norm": 7.4266557693481445,
+ "learning_rate": 1.1803168017926958e-05,
+ "loss": 0.1916,
+ "step": 16846
+ },
+ {
+ "epoch": 45.904632152588555,
+ "grad_norm": 7.247400283813477,
+ "learning_rate": 1.1802299981605572e-05,
+ "loss": 0.1903,
+ "step": 16847
+ },
+ {
+ "epoch": 45.90735694822888,
+ "grad_norm": 5.782771587371826,
+ "learning_rate": 1.1801431931247936e-05,
+ "loss": 0.1388,
+ "step": 16848
+ },
+ {
+ "epoch": 45.91008174386921,
+ "grad_norm": 6.266892910003662,
+ "learning_rate": 1.1800563866860802e-05,
+ "loss": 0.181,
+ "step": 16849
+ },
+ {
+ "epoch": 45.91280653950954,
+ "grad_norm": 5.285679817199707,
+ "learning_rate": 1.1799695788450933e-05,
+ "loss": 0.1858,
+ "step": 16850
+ },
+ {
+ "epoch": 45.915531335149865,
+ "grad_norm": 7.338531017303467,
+ "learning_rate": 1.1798827696025094e-05,
+ "loss": 0.2153,
+ "step": 16851
+ },
+ {
+ "epoch": 45.91825613079019,
+ "grad_norm": 8.412606239318848,
+ "learning_rate": 1.1797959589590042e-05,
+ "loss": 0.2985,
+ "step": 16852
+ },
+ {
+ "epoch": 45.920980926430516,
+ "grad_norm": 7.390754222869873,
+ "learning_rate": 1.179709146915254e-05,
+ "loss": 0.1792,
+ "step": 16853
+ },
+ {
+ "epoch": 45.92370572207084,
+ "grad_norm": 6.709893226623535,
+ "learning_rate": 1.1796223334719347e-05,
+ "loss": 0.357,
+ "step": 16854
+ },
+ {
+ "epoch": 45.926430517711175,
+ "grad_norm": 5.400599479675293,
+ "learning_rate": 1.1795355186297223e-05,
+ "loss": 0.1779,
+ "step": 16855
+ },
+ {
+ "epoch": 45.9291553133515,
+ "grad_norm": 6.281462669372559,
+ "learning_rate": 1.1794487023892934e-05,
+ "loss": 0.1422,
+ "step": 16856
+ },
+ {
+ "epoch": 45.93188010899183,
+ "grad_norm": 5.297862529754639,
+ "learning_rate": 1.1793618847513235e-05,
+ "loss": 0.1678,
+ "step": 16857
+ },
+ {
+ "epoch": 45.93460490463215,
+ "grad_norm": 5.953853607177734,
+ "learning_rate": 1.179275065716489e-05,
+ "loss": 0.2998,
+ "step": 16858
+ },
+ {
+ "epoch": 45.93732970027248,
+ "grad_norm": 5.778013706207275,
+ "learning_rate": 1.1791882452854661e-05,
+ "loss": 0.2167,
+ "step": 16859
+ },
+ {
+ "epoch": 45.940054495912804,
+ "grad_norm": 5.81217622756958,
+ "learning_rate": 1.1791014234589308e-05,
+ "loss": 0.2295,
+ "step": 16860
+ },
+ {
+ "epoch": 45.94277929155314,
+ "grad_norm": 5.243221759796143,
+ "learning_rate": 1.1790146002375597e-05,
+ "loss": 0.2875,
+ "step": 16861
+ },
+ {
+ "epoch": 45.94550408719346,
+ "grad_norm": 5.780571460723877,
+ "learning_rate": 1.1789277756220283e-05,
+ "loss": 0.1198,
+ "step": 16862
+ },
+ {
+ "epoch": 45.94822888283379,
+ "grad_norm": 8.66849136352539,
+ "learning_rate": 1.1788409496130133e-05,
+ "loss": 0.1437,
+ "step": 16863
+ },
+ {
+ "epoch": 45.950953678474114,
+ "grad_norm": 5.675642013549805,
+ "learning_rate": 1.178754122211191e-05,
+ "loss": 0.2999,
+ "step": 16864
+ },
+ {
+ "epoch": 45.95367847411444,
+ "grad_norm": 6.454855442047119,
+ "learning_rate": 1.178667293417237e-05,
+ "loss": 0.2019,
+ "step": 16865
+ },
+ {
+ "epoch": 45.956403269754766,
+ "grad_norm": 48.437015533447266,
+ "learning_rate": 1.1785804632318278e-05,
+ "loss": 0.106,
+ "step": 16866
+ },
+ {
+ "epoch": 45.95912806539509,
+ "grad_norm": 5.250528812408447,
+ "learning_rate": 1.1784936316556399e-05,
+ "loss": 0.1671,
+ "step": 16867
+ },
+ {
+ "epoch": 45.961852861035425,
+ "grad_norm": 4.772067546844482,
+ "learning_rate": 1.1784067986893492e-05,
+ "loss": 0.1622,
+ "step": 16868
+ },
+ {
+ "epoch": 45.96457765667575,
+ "grad_norm": 17.530364990234375,
+ "learning_rate": 1.1783199643336324e-05,
+ "loss": 0.1622,
+ "step": 16869
+ },
+ {
+ "epoch": 45.967302452316076,
+ "grad_norm": 6.608857154846191,
+ "learning_rate": 1.1782331285891654e-05,
+ "loss": 0.3674,
+ "step": 16870
+ },
+ {
+ "epoch": 45.9700272479564,
+ "grad_norm": 4.463240623474121,
+ "learning_rate": 1.1781462914566244e-05,
+ "loss": 0.1687,
+ "step": 16871
+ },
+ {
+ "epoch": 45.97275204359673,
+ "grad_norm": 5.558890342712402,
+ "learning_rate": 1.1780594529366856e-05,
+ "loss": 0.1276,
+ "step": 16872
+ },
+ {
+ "epoch": 45.97547683923706,
+ "grad_norm": 6.251444339752197,
+ "learning_rate": 1.177972613030026e-05,
+ "loss": 0.2368,
+ "step": 16873
+ },
+ {
+ "epoch": 45.97820163487739,
+ "grad_norm": 7.094636917114258,
+ "learning_rate": 1.1778857717373208e-05,
+ "loss": 0.2958,
+ "step": 16874
+ },
+ {
+ "epoch": 45.98092643051771,
+ "grad_norm": 4.030132293701172,
+ "learning_rate": 1.1777989290592474e-05,
+ "loss": 0.083,
+ "step": 16875
+ },
+ {
+ "epoch": 45.98365122615804,
+ "grad_norm": 4.525312423706055,
+ "learning_rate": 1.1777120849964814e-05,
+ "loss": 0.1293,
+ "step": 16876
+ },
+ {
+ "epoch": 45.986376021798364,
+ "grad_norm": 6.200839042663574,
+ "learning_rate": 1.1776252395496996e-05,
+ "loss": 0.2395,
+ "step": 16877
+ },
+ {
+ "epoch": 45.98910081743869,
+ "grad_norm": 12.559029579162598,
+ "learning_rate": 1.177538392719578e-05,
+ "loss": 0.3794,
+ "step": 16878
+ },
+ {
+ "epoch": 45.991825613079016,
+ "grad_norm": 5.862802505493164,
+ "learning_rate": 1.1774515445067933e-05,
+ "loss": 0.1498,
+ "step": 16879
+ },
+ {
+ "epoch": 45.99455040871935,
+ "grad_norm": 6.752175331115723,
+ "learning_rate": 1.1773646949120217e-05,
+ "loss": 0.2217,
+ "step": 16880
+ },
+ {
+ "epoch": 45.997275204359674,
+ "grad_norm": 7.321381092071533,
+ "learning_rate": 1.1772778439359393e-05,
+ "loss": 0.1709,
+ "step": 16881
+ },
+ {
+ "epoch": 46.0,
+ "grad_norm": 5.0732526779174805,
+ "learning_rate": 1.177190991579223e-05,
+ "loss": 0.1394,
+ "step": 16882
+ },
+ {
+ "epoch": 46.002724795640326,
+ "grad_norm": 5.083871364593506,
+ "learning_rate": 1.177104137842549e-05,
+ "loss": 0.1157,
+ "step": 16883
+ },
+ {
+ "epoch": 46.00544959128065,
+ "grad_norm": 4.938205718994141,
+ "learning_rate": 1.177017282726593e-05,
+ "loss": 0.1703,
+ "step": 16884
+ },
+ {
+ "epoch": 46.00817438692098,
+ "grad_norm": 4.9734673500061035,
+ "learning_rate": 1.1769304262320329e-05,
+ "loss": 0.2418,
+ "step": 16885
+ },
+ {
+ "epoch": 46.01089918256131,
+ "grad_norm": 4.630497932434082,
+ "learning_rate": 1.1768435683595441e-05,
+ "loss": 0.1616,
+ "step": 16886
+ },
+ {
+ "epoch": 46.013623978201636,
+ "grad_norm": 6.0803680419921875,
+ "learning_rate": 1.1767567091098033e-05,
+ "loss": 0.1457,
+ "step": 16887
+ },
+ {
+ "epoch": 46.01634877384196,
+ "grad_norm": 14.960121154785156,
+ "learning_rate": 1.1766698484834869e-05,
+ "loss": 0.1541,
+ "step": 16888
+ },
+ {
+ "epoch": 46.01907356948229,
+ "grad_norm": 7.334306240081787,
+ "learning_rate": 1.1765829864812714e-05,
+ "loss": 0.3031,
+ "step": 16889
+ },
+ {
+ "epoch": 46.02179836512261,
+ "grad_norm": 5.870535373687744,
+ "learning_rate": 1.1764961231038331e-05,
+ "loss": 0.197,
+ "step": 16890
+ },
+ {
+ "epoch": 46.02452316076294,
+ "grad_norm": 4.6464056968688965,
+ "learning_rate": 1.1764092583518491e-05,
+ "loss": 0.1464,
+ "step": 16891
+ },
+ {
+ "epoch": 46.02724795640327,
+ "grad_norm": 5.883876323699951,
+ "learning_rate": 1.176322392225995e-05,
+ "loss": 0.1725,
+ "step": 16892
+ },
+ {
+ "epoch": 46.0299727520436,
+ "grad_norm": 5.208800315856934,
+ "learning_rate": 1.1762355247269481e-05,
+ "loss": 0.3002,
+ "step": 16893
+ },
+ {
+ "epoch": 46.032697547683924,
+ "grad_norm": 5.147244930267334,
+ "learning_rate": 1.1761486558553843e-05,
+ "loss": 0.2334,
+ "step": 16894
+ },
+ {
+ "epoch": 46.03542234332425,
+ "grad_norm": 5.42535924911499,
+ "learning_rate": 1.1760617856119809e-05,
+ "loss": 0.224,
+ "step": 16895
+ },
+ {
+ "epoch": 46.038147138964575,
+ "grad_norm": 4.2400946617126465,
+ "learning_rate": 1.1759749139974137e-05,
+ "loss": 0.2851,
+ "step": 16896
+ },
+ {
+ "epoch": 46.0408719346049,
+ "grad_norm": 4.644554615020752,
+ "learning_rate": 1.1758880410123596e-05,
+ "loss": 0.1312,
+ "step": 16897
+ },
+ {
+ "epoch": 46.043596730245234,
+ "grad_norm": 4.072249889373779,
+ "learning_rate": 1.175801166657495e-05,
+ "loss": 0.1893,
+ "step": 16898
+ },
+ {
+ "epoch": 46.04632152588556,
+ "grad_norm": 5.934253215789795,
+ "learning_rate": 1.175714290933497e-05,
+ "loss": 0.2545,
+ "step": 16899
+ },
+ {
+ "epoch": 46.049046321525886,
+ "grad_norm": 6.599236011505127,
+ "learning_rate": 1.175627413841041e-05,
+ "loss": 0.2178,
+ "step": 16900
+ },
+ {
+ "epoch": 46.05177111716621,
+ "grad_norm": 7.527964115142822,
+ "learning_rate": 1.1755405353808047e-05,
+ "loss": 0.1436,
+ "step": 16901
+ },
+ {
+ "epoch": 46.05449591280654,
+ "grad_norm": 7.0813212394714355,
+ "learning_rate": 1.1754536555534643e-05,
+ "loss": 0.1468,
+ "step": 16902
+ },
+ {
+ "epoch": 46.05722070844686,
+ "grad_norm": 4.541636943817139,
+ "learning_rate": 1.1753667743596969e-05,
+ "loss": 0.1627,
+ "step": 16903
+ },
+ {
+ "epoch": 46.059945504087196,
+ "grad_norm": 5.095037460327148,
+ "learning_rate": 1.1752798918001782e-05,
+ "loss": 0.2652,
+ "step": 16904
+ },
+ {
+ "epoch": 46.06267029972752,
+ "grad_norm": 5.75819206237793,
+ "learning_rate": 1.1751930078755858e-05,
+ "loss": 0.1549,
+ "step": 16905
+ },
+ {
+ "epoch": 46.06539509536785,
+ "grad_norm": 6.596327781677246,
+ "learning_rate": 1.1751061225865953e-05,
+ "loss": 0.1703,
+ "step": 16906
+ },
+ {
+ "epoch": 46.06811989100817,
+ "grad_norm": 5.354146480560303,
+ "learning_rate": 1.1750192359338845e-05,
+ "loss": 0.2491,
+ "step": 16907
+ },
+ {
+ "epoch": 46.0708446866485,
+ "grad_norm": 4.3368754386901855,
+ "learning_rate": 1.1749323479181291e-05,
+ "loss": 0.2098,
+ "step": 16908
+ },
+ {
+ "epoch": 46.073569482288825,
+ "grad_norm": 4.405524730682373,
+ "learning_rate": 1.1748454585400064e-05,
+ "loss": 0.113,
+ "step": 16909
+ },
+ {
+ "epoch": 46.07629427792916,
+ "grad_norm": 5.045307636260986,
+ "learning_rate": 1.1747585678001929e-05,
+ "loss": 0.2091,
+ "step": 16910
+ },
+ {
+ "epoch": 46.079019073569484,
+ "grad_norm": 5.209238052368164,
+ "learning_rate": 1.1746716756993654e-05,
+ "loss": 0.2337,
+ "step": 16911
+ },
+ {
+ "epoch": 46.08174386920981,
+ "grad_norm": 4.878576278686523,
+ "learning_rate": 1.1745847822382004e-05,
+ "loss": 0.11,
+ "step": 16912
+ },
+ {
+ "epoch": 46.084468664850135,
+ "grad_norm": 6.489706516265869,
+ "learning_rate": 1.174497887417375e-05,
+ "loss": 0.2975,
+ "step": 16913
+ },
+ {
+ "epoch": 46.08719346049046,
+ "grad_norm": 5.230531692504883,
+ "learning_rate": 1.1744109912375652e-05,
+ "loss": 0.267,
+ "step": 16914
+ },
+ {
+ "epoch": 46.08991825613079,
+ "grad_norm": 4.458773136138916,
+ "learning_rate": 1.1743240936994484e-05,
+ "loss": 0.106,
+ "step": 16915
+ },
+ {
+ "epoch": 46.09264305177112,
+ "grad_norm": 3.952570915222168,
+ "learning_rate": 1.1742371948037012e-05,
+ "loss": 0.1326,
+ "step": 16916
+ },
+ {
+ "epoch": 46.095367847411445,
+ "grad_norm": 3.6904971599578857,
+ "learning_rate": 1.1741502945510005e-05,
+ "loss": 0.1023,
+ "step": 16917
+ },
+ {
+ "epoch": 46.09809264305177,
+ "grad_norm": 4.737332344055176,
+ "learning_rate": 1.1740633929420225e-05,
+ "loss": 0.1231,
+ "step": 16918
+ },
+ {
+ "epoch": 46.1008174386921,
+ "grad_norm": 5.266089916229248,
+ "learning_rate": 1.1739764899774447e-05,
+ "loss": 0.1163,
+ "step": 16919
+ },
+ {
+ "epoch": 46.10354223433242,
+ "grad_norm": 5.249556064605713,
+ "learning_rate": 1.1738895856579436e-05,
+ "loss": 0.203,
+ "step": 16920
+ },
+ {
+ "epoch": 46.10626702997275,
+ "grad_norm": 5.134702682495117,
+ "learning_rate": 1.173802679984196e-05,
+ "loss": 0.1029,
+ "step": 16921
+ },
+ {
+ "epoch": 46.10899182561308,
+ "grad_norm": 5.852989196777344,
+ "learning_rate": 1.1737157729568787e-05,
+ "loss": 0.1935,
+ "step": 16922
+ },
+ {
+ "epoch": 46.11171662125341,
+ "grad_norm": 12.089111328125,
+ "learning_rate": 1.1736288645766684e-05,
+ "loss": 0.1376,
+ "step": 16923
+ },
+ {
+ "epoch": 46.11444141689373,
+ "grad_norm": 5.578044891357422,
+ "learning_rate": 1.1735419548442422e-05,
+ "loss": 0.2012,
+ "step": 16924
+ },
+ {
+ "epoch": 46.11716621253406,
+ "grad_norm": 7.164999008178711,
+ "learning_rate": 1.173455043760277e-05,
+ "loss": 0.156,
+ "step": 16925
+ },
+ {
+ "epoch": 46.119891008174385,
+ "grad_norm": 5.309410572052002,
+ "learning_rate": 1.1733681313254492e-05,
+ "loss": 0.2188,
+ "step": 16926
+ },
+ {
+ "epoch": 46.12261580381471,
+ "grad_norm": 6.488722324371338,
+ "learning_rate": 1.1732812175404362e-05,
+ "loss": 0.2034,
+ "step": 16927
+ },
+ {
+ "epoch": 46.12534059945504,
+ "grad_norm": 4.2620391845703125,
+ "learning_rate": 1.1731943024059145e-05,
+ "loss": 0.1984,
+ "step": 16928
+ },
+ {
+ "epoch": 46.12806539509537,
+ "grad_norm": 5.6828742027282715,
+ "learning_rate": 1.1731073859225612e-05,
+ "loss": 0.2205,
+ "step": 16929
+ },
+ {
+ "epoch": 46.130790190735695,
+ "grad_norm": 7.540266990661621,
+ "learning_rate": 1.173020468091053e-05,
+ "loss": 0.2739,
+ "step": 16930
+ },
+ {
+ "epoch": 46.13351498637602,
+ "grad_norm": 4.928872108459473,
+ "learning_rate": 1.1729335489120675e-05,
+ "loss": 0.1258,
+ "step": 16931
+ },
+ {
+ "epoch": 46.13623978201635,
+ "grad_norm": 4.395156383514404,
+ "learning_rate": 1.1728466283862806e-05,
+ "loss": 0.0999,
+ "step": 16932
+ },
+ {
+ "epoch": 46.13896457765667,
+ "grad_norm": 4.242887496948242,
+ "learning_rate": 1.1727597065143699e-05,
+ "loss": 0.2232,
+ "step": 16933
+ },
+ {
+ "epoch": 46.141689373297005,
+ "grad_norm": 5.286397457122803,
+ "learning_rate": 1.1726727832970121e-05,
+ "loss": 0.1928,
+ "step": 16934
+ },
+ {
+ "epoch": 46.14441416893733,
+ "grad_norm": 5.503414154052734,
+ "learning_rate": 1.1725858587348842e-05,
+ "loss": 0.2134,
+ "step": 16935
+ },
+ {
+ "epoch": 46.14713896457766,
+ "grad_norm": 5.316442966461182,
+ "learning_rate": 1.1724989328286633e-05,
+ "loss": 0.1651,
+ "step": 16936
+ },
+ {
+ "epoch": 46.14986376021798,
+ "grad_norm": 3.8543577194213867,
+ "learning_rate": 1.172412005579026e-05,
+ "loss": 0.1191,
+ "step": 16937
+ },
+ {
+ "epoch": 46.15258855585831,
+ "grad_norm": 6.987120151519775,
+ "learning_rate": 1.1723250769866499e-05,
+ "loss": 0.1891,
+ "step": 16938
+ },
+ {
+ "epoch": 46.155313351498634,
+ "grad_norm": 4.610313892364502,
+ "learning_rate": 1.1722381470522116e-05,
+ "loss": 0.1173,
+ "step": 16939
+ },
+ {
+ "epoch": 46.15803814713897,
+ "grad_norm": 5.001042366027832,
+ "learning_rate": 1.1721512157763878e-05,
+ "loss": 0.151,
+ "step": 16940
+ },
+ {
+ "epoch": 46.16076294277929,
+ "grad_norm": 5.889011859893799,
+ "learning_rate": 1.1720642831598563e-05,
+ "loss": 0.2553,
+ "step": 16941
+ },
+ {
+ "epoch": 46.16348773841962,
+ "grad_norm": 4.743194103240967,
+ "learning_rate": 1.1719773492032933e-05,
+ "loss": 0.2292,
+ "step": 16942
+ },
+ {
+ "epoch": 46.166212534059945,
+ "grad_norm": 4.329124927520752,
+ "learning_rate": 1.1718904139073765e-05,
+ "loss": 0.107,
+ "step": 16943
+ },
+ {
+ "epoch": 46.16893732970027,
+ "grad_norm": 4.750197887420654,
+ "learning_rate": 1.1718034772727827e-05,
+ "loss": 0.1749,
+ "step": 16944
+ },
+ {
+ "epoch": 46.171662125340596,
+ "grad_norm": 5.156228065490723,
+ "learning_rate": 1.1717165393001888e-05,
+ "loss": 0.1928,
+ "step": 16945
+ },
+ {
+ "epoch": 46.17438692098093,
+ "grad_norm": 4.277947902679443,
+ "learning_rate": 1.1716295999902722e-05,
+ "loss": 0.1296,
+ "step": 16946
+ },
+ {
+ "epoch": 46.177111716621255,
+ "grad_norm": 6.750779151916504,
+ "learning_rate": 1.1715426593437096e-05,
+ "loss": 0.2778,
+ "step": 16947
+ },
+ {
+ "epoch": 46.17983651226158,
+ "grad_norm": 9.903641700744629,
+ "learning_rate": 1.1714557173611785e-05,
+ "loss": 0.2106,
+ "step": 16948
+ },
+ {
+ "epoch": 46.182561307901906,
+ "grad_norm": 4.747694492340088,
+ "learning_rate": 1.1713687740433557e-05,
+ "loss": 0.1006,
+ "step": 16949
+ },
+ {
+ "epoch": 46.18528610354223,
+ "grad_norm": 4.483840465545654,
+ "learning_rate": 1.1712818293909182e-05,
+ "loss": 0.2431,
+ "step": 16950
+ },
+ {
+ "epoch": 46.18801089918256,
+ "grad_norm": 6.454843521118164,
+ "learning_rate": 1.1711948834045437e-05,
+ "loss": 0.2097,
+ "step": 16951
+ },
+ {
+ "epoch": 46.19073569482289,
+ "grad_norm": 5.715302467346191,
+ "learning_rate": 1.1711079360849086e-05,
+ "loss": 0.1199,
+ "step": 16952
+ },
+ {
+ "epoch": 46.19346049046322,
+ "grad_norm": 5.379823207855225,
+ "learning_rate": 1.1710209874326905e-05,
+ "loss": 0.2381,
+ "step": 16953
+ },
+ {
+ "epoch": 46.19618528610354,
+ "grad_norm": 4.871223449707031,
+ "learning_rate": 1.1709340374485667e-05,
+ "loss": 0.1482,
+ "step": 16954
+ },
+ {
+ "epoch": 46.19891008174387,
+ "grad_norm": 5.154715538024902,
+ "learning_rate": 1.170847086133214e-05,
+ "loss": 0.2239,
+ "step": 16955
+ },
+ {
+ "epoch": 46.201634877384194,
+ "grad_norm": 7.11883020401001,
+ "learning_rate": 1.1707601334873097e-05,
+ "loss": 0.1468,
+ "step": 16956
+ },
+ {
+ "epoch": 46.20435967302452,
+ "grad_norm": 5.708817481994629,
+ "learning_rate": 1.1706731795115309e-05,
+ "loss": 0.2822,
+ "step": 16957
+ },
+ {
+ "epoch": 46.20708446866485,
+ "grad_norm": 5.6825971603393555,
+ "learning_rate": 1.1705862242065549e-05,
+ "loss": 0.2883,
+ "step": 16958
+ },
+ {
+ "epoch": 46.20980926430518,
+ "grad_norm": 6.1116766929626465,
+ "learning_rate": 1.1704992675730588e-05,
+ "loss": 0.2028,
+ "step": 16959
+ },
+ {
+ "epoch": 46.212534059945504,
+ "grad_norm": 4.810726642608643,
+ "learning_rate": 1.17041230961172e-05,
+ "loss": 0.181,
+ "step": 16960
+ },
+ {
+ "epoch": 46.21525885558583,
+ "grad_norm": 4.37108850479126,
+ "learning_rate": 1.1703253503232152e-05,
+ "loss": 0.1972,
+ "step": 16961
+ },
+ {
+ "epoch": 46.217983651226156,
+ "grad_norm": 6.069670677185059,
+ "learning_rate": 1.1702383897082229e-05,
+ "loss": 0.1389,
+ "step": 16962
+ },
+ {
+ "epoch": 46.22070844686648,
+ "grad_norm": 4.703593730926514,
+ "learning_rate": 1.1701514277674186e-05,
+ "loss": 0.4329,
+ "step": 16963
+ },
+ {
+ "epoch": 46.223433242506815,
+ "grad_norm": 5.444170951843262,
+ "learning_rate": 1.1700644645014812e-05,
+ "loss": 0.1443,
+ "step": 16964
+ },
+ {
+ "epoch": 46.22615803814714,
+ "grad_norm": 5.546870231628418,
+ "learning_rate": 1.1699774999110867e-05,
+ "loss": 0.1891,
+ "step": 16965
+ },
+ {
+ "epoch": 46.228882833787466,
+ "grad_norm": 4.24921178817749,
+ "learning_rate": 1.1698905339969133e-05,
+ "loss": 0.3073,
+ "step": 16966
+ },
+ {
+ "epoch": 46.23160762942779,
+ "grad_norm": 5.065343856811523,
+ "learning_rate": 1.1698035667596378e-05,
+ "loss": 0.1351,
+ "step": 16967
+ },
+ {
+ "epoch": 46.23433242506812,
+ "grad_norm": 5.259772300720215,
+ "learning_rate": 1.1697165981999375e-05,
+ "loss": 0.2985,
+ "step": 16968
+ },
+ {
+ "epoch": 46.237057220708444,
+ "grad_norm": 12.561153411865234,
+ "learning_rate": 1.1696296283184896e-05,
+ "loss": 0.2392,
+ "step": 16969
+ },
+ {
+ "epoch": 46.23978201634878,
+ "grad_norm": 6.302806854248047,
+ "learning_rate": 1.1695426571159718e-05,
+ "loss": 0.2354,
+ "step": 16970
+ },
+ {
+ "epoch": 46.2425068119891,
+ "grad_norm": 6.131228446960449,
+ "learning_rate": 1.1694556845930611e-05,
+ "loss": 0.2924,
+ "step": 16971
+ },
+ {
+ "epoch": 46.24523160762943,
+ "grad_norm": 4.117089748382568,
+ "learning_rate": 1.1693687107504352e-05,
+ "loss": 0.1476,
+ "step": 16972
+ },
+ {
+ "epoch": 46.247956403269754,
+ "grad_norm": 4.978460311889648,
+ "learning_rate": 1.169281735588771e-05,
+ "loss": 0.1621,
+ "step": 16973
+ },
+ {
+ "epoch": 46.25068119891008,
+ "grad_norm": 7.9032721519470215,
+ "learning_rate": 1.1691947591087464e-05,
+ "loss": 0.1782,
+ "step": 16974
+ },
+ {
+ "epoch": 46.253405994550405,
+ "grad_norm": 5.891063213348389,
+ "learning_rate": 1.1691077813110383e-05,
+ "loss": 0.1756,
+ "step": 16975
+ },
+ {
+ "epoch": 46.25613079019074,
+ "grad_norm": 5.366761207580566,
+ "learning_rate": 1.1690208021963243e-05,
+ "loss": 0.4038,
+ "step": 16976
+ },
+ {
+ "epoch": 46.258855585831064,
+ "grad_norm": 5.27750825881958,
+ "learning_rate": 1.1689338217652818e-05,
+ "loss": 0.1177,
+ "step": 16977
+ },
+ {
+ "epoch": 46.26158038147139,
+ "grad_norm": 5.0216288566589355,
+ "learning_rate": 1.1688468400185877e-05,
+ "loss": 0.3339,
+ "step": 16978
+ },
+ {
+ "epoch": 46.264305177111716,
+ "grad_norm": 4.817869663238525,
+ "learning_rate": 1.16875985695692e-05,
+ "loss": 0.0802,
+ "step": 16979
+ },
+ {
+ "epoch": 46.26702997275204,
+ "grad_norm": 5.414669513702393,
+ "learning_rate": 1.1686728725809564e-05,
+ "loss": 0.1339,
+ "step": 16980
+ },
+ {
+ "epoch": 46.26975476839237,
+ "grad_norm": 5.407716274261475,
+ "learning_rate": 1.1685858868913736e-05,
+ "loss": 0.2522,
+ "step": 16981
+ },
+ {
+ "epoch": 46.2724795640327,
+ "grad_norm": 4.433934688568115,
+ "learning_rate": 1.1684988998888494e-05,
+ "loss": 0.2352,
+ "step": 16982
+ },
+ {
+ "epoch": 46.275204359673026,
+ "grad_norm": 4.624395370483398,
+ "learning_rate": 1.168411911574061e-05,
+ "loss": 0.238,
+ "step": 16983
+ },
+ {
+ "epoch": 46.27792915531335,
+ "grad_norm": 5.083333492279053,
+ "learning_rate": 1.1683249219476864e-05,
+ "loss": 0.1794,
+ "step": 16984
+ },
+ {
+ "epoch": 46.28065395095368,
+ "grad_norm": 5.640879154205322,
+ "learning_rate": 1.1682379310104023e-05,
+ "loss": 0.1328,
+ "step": 16985
+ },
+ {
+ "epoch": 46.283378746594,
+ "grad_norm": 7.7753424644470215,
+ "learning_rate": 1.1681509387628871e-05,
+ "loss": 0.1967,
+ "step": 16986
+ },
+ {
+ "epoch": 46.28610354223433,
+ "grad_norm": 6.597271919250488,
+ "learning_rate": 1.1680639452058172e-05,
+ "loss": 0.3071,
+ "step": 16987
+ },
+ {
+ "epoch": 46.28882833787466,
+ "grad_norm": 4.760594844818115,
+ "learning_rate": 1.1679769503398712e-05,
+ "loss": 0.226,
+ "step": 16988
+ },
+ {
+ "epoch": 46.29155313351499,
+ "grad_norm": 4.12913179397583,
+ "learning_rate": 1.1678899541657258e-05,
+ "loss": 0.1955,
+ "step": 16989
+ },
+ {
+ "epoch": 46.294277929155314,
+ "grad_norm": 5.745121002197266,
+ "learning_rate": 1.1678029566840593e-05,
+ "loss": 0.1848,
+ "step": 16990
+ },
+ {
+ "epoch": 46.29700272479564,
+ "grad_norm": 8.40665054321289,
+ "learning_rate": 1.1677159578955481e-05,
+ "loss": 0.1738,
+ "step": 16991
+ },
+ {
+ "epoch": 46.299727520435965,
+ "grad_norm": 8.361091613769531,
+ "learning_rate": 1.167628957800871e-05,
+ "loss": 0.321,
+ "step": 16992
+ },
+ {
+ "epoch": 46.30245231607629,
+ "grad_norm": 7.860576152801514,
+ "learning_rate": 1.1675419564007046e-05,
+ "loss": 0.1078,
+ "step": 16993
+ },
+ {
+ "epoch": 46.305177111716624,
+ "grad_norm": 5.239068508148193,
+ "learning_rate": 1.167454953695727e-05,
+ "loss": 0.1725,
+ "step": 16994
+ },
+ {
+ "epoch": 46.30790190735695,
+ "grad_norm": 5.734799861907959,
+ "learning_rate": 1.1673679496866155e-05,
+ "loss": 0.0986,
+ "step": 16995
+ },
+ {
+ "epoch": 46.310626702997276,
+ "grad_norm": 12.02059268951416,
+ "learning_rate": 1.167280944374048e-05,
+ "loss": 0.1673,
+ "step": 16996
+ },
+ {
+ "epoch": 46.3133514986376,
+ "grad_norm": 6.198795795440674,
+ "learning_rate": 1.1671939377587018e-05,
+ "loss": 0.1999,
+ "step": 16997
+ },
+ {
+ "epoch": 46.31607629427793,
+ "grad_norm": 6.111451625823975,
+ "learning_rate": 1.1671069298412548e-05,
+ "loss": 0.1847,
+ "step": 16998
+ },
+ {
+ "epoch": 46.31880108991825,
+ "grad_norm": 7.072170734405518,
+ "learning_rate": 1.167019920622384e-05,
+ "loss": 0.1806,
+ "step": 16999
+ },
+ {
+ "epoch": 46.321525885558586,
+ "grad_norm": 6.404435634613037,
+ "learning_rate": 1.1669329101027677e-05,
+ "loss": 0.1762,
+ "step": 17000
+ },
+ {
+ "epoch": 46.32425068119891,
+ "grad_norm": 5.490909576416016,
+ "learning_rate": 1.166845898283083e-05,
+ "loss": 0.2574,
+ "step": 17001
+ },
+ {
+ "epoch": 46.32697547683924,
+ "grad_norm": 4.518784523010254,
+ "learning_rate": 1.1667588851640084e-05,
+ "loss": 0.1352,
+ "step": 17002
+ },
+ {
+ "epoch": 46.32970027247956,
+ "grad_norm": 5.648974895477295,
+ "learning_rate": 1.1666718707462203e-05,
+ "loss": 0.1929,
+ "step": 17003
+ },
+ {
+ "epoch": 46.33242506811989,
+ "grad_norm": 4.958102703094482,
+ "learning_rate": 1.1665848550303972e-05,
+ "loss": 0.2085,
+ "step": 17004
+ },
+ {
+ "epoch": 46.335149863760215,
+ "grad_norm": 5.627400875091553,
+ "learning_rate": 1.1664978380172167e-05,
+ "loss": 0.1024,
+ "step": 17005
+ },
+ {
+ "epoch": 46.33787465940055,
+ "grad_norm": 4.282506465911865,
+ "learning_rate": 1.1664108197073566e-05,
+ "loss": 0.1202,
+ "step": 17006
+ },
+ {
+ "epoch": 46.34059945504087,
+ "grad_norm": 14.788066864013672,
+ "learning_rate": 1.166323800101494e-05,
+ "loss": 0.1317,
+ "step": 17007
+ },
+ {
+ "epoch": 46.3433242506812,
+ "grad_norm": 13.455382347106934,
+ "learning_rate": 1.1662367792003075e-05,
+ "loss": 0.1522,
+ "step": 17008
+ },
+ {
+ "epoch": 46.346049046321525,
+ "grad_norm": 4.96815299987793,
+ "learning_rate": 1.1661497570044737e-05,
+ "loss": 0.1612,
+ "step": 17009
+ },
+ {
+ "epoch": 46.34877384196185,
+ "grad_norm": 7.081682205200195,
+ "learning_rate": 1.1660627335146714e-05,
+ "loss": 0.2652,
+ "step": 17010
+ },
+ {
+ "epoch": 46.35149863760218,
+ "grad_norm": 4.942091941833496,
+ "learning_rate": 1.1659757087315777e-05,
+ "loss": 0.1928,
+ "step": 17011
+ },
+ {
+ "epoch": 46.35422343324251,
+ "grad_norm": 5.042135715484619,
+ "learning_rate": 1.1658886826558709e-05,
+ "loss": 0.266,
+ "step": 17012
+ },
+ {
+ "epoch": 46.356948228882835,
+ "grad_norm": 6.583928108215332,
+ "learning_rate": 1.1658016552882279e-05,
+ "loss": 0.2129,
+ "step": 17013
+ },
+ {
+ "epoch": 46.35967302452316,
+ "grad_norm": 5.138932228088379,
+ "learning_rate": 1.1657146266293269e-05,
+ "loss": 0.1226,
+ "step": 17014
+ },
+ {
+ "epoch": 46.36239782016349,
+ "grad_norm": 5.067035675048828,
+ "learning_rate": 1.1656275966798458e-05,
+ "loss": 0.1469,
+ "step": 17015
+ },
+ {
+ "epoch": 46.36512261580381,
+ "grad_norm": 6.44582986831665,
+ "learning_rate": 1.1655405654404625e-05,
+ "loss": 0.3677,
+ "step": 17016
+ },
+ {
+ "epoch": 46.36784741144414,
+ "grad_norm": 5.958681106567383,
+ "learning_rate": 1.1654535329118545e-05,
+ "loss": 0.1352,
+ "step": 17017
+ },
+ {
+ "epoch": 46.37057220708447,
+ "grad_norm": 5.4483819007873535,
+ "learning_rate": 1.1653664990947e-05,
+ "loss": 0.1605,
+ "step": 17018
+ },
+ {
+ "epoch": 46.3732970027248,
+ "grad_norm": 5.049631595611572,
+ "learning_rate": 1.165279463989676e-05,
+ "loss": 0.2097,
+ "step": 17019
+ },
+ {
+ "epoch": 46.37602179836512,
+ "grad_norm": 6.19951868057251,
+ "learning_rate": 1.1651924275974613e-05,
+ "loss": 0.1634,
+ "step": 17020
+ },
+ {
+ "epoch": 46.37874659400545,
+ "grad_norm": 5.297245979309082,
+ "learning_rate": 1.165105389918733e-05,
+ "loss": 0.1602,
+ "step": 17021
+ },
+ {
+ "epoch": 46.381471389645775,
+ "grad_norm": 5.394540309906006,
+ "learning_rate": 1.1650183509541693e-05,
+ "loss": 0.1449,
+ "step": 17022
+ },
+ {
+ "epoch": 46.3841961852861,
+ "grad_norm": 4.56392765045166,
+ "learning_rate": 1.1649313107044483e-05,
+ "loss": 0.1062,
+ "step": 17023
+ },
+ {
+ "epoch": 46.38692098092643,
+ "grad_norm": 4.668919086456299,
+ "learning_rate": 1.164844269170247e-05,
+ "loss": 0.1717,
+ "step": 17024
+ },
+ {
+ "epoch": 46.38964577656676,
+ "grad_norm": 5.602856636047363,
+ "learning_rate": 1.1647572263522445e-05,
+ "loss": 0.1638,
+ "step": 17025
+ },
+ {
+ "epoch": 46.392370572207085,
+ "grad_norm": 5.524237155914307,
+ "learning_rate": 1.1646701822511173e-05,
+ "loss": 0.1851,
+ "step": 17026
+ },
+ {
+ "epoch": 46.39509536784741,
+ "grad_norm": 9.044189453125,
+ "learning_rate": 1.1645831368675445e-05,
+ "loss": 0.1613,
+ "step": 17027
+ },
+ {
+ "epoch": 46.39782016348774,
+ "grad_norm": 5.674327373504639,
+ "learning_rate": 1.1644960902022033e-05,
+ "loss": 0.1425,
+ "step": 17028
+ },
+ {
+ "epoch": 46.40054495912806,
+ "grad_norm": 4.188699245452881,
+ "learning_rate": 1.1644090422557719e-05,
+ "loss": 0.2439,
+ "step": 17029
+ },
+ {
+ "epoch": 46.403269754768395,
+ "grad_norm": 5.922665119171143,
+ "learning_rate": 1.1643219930289282e-05,
+ "loss": 0.1247,
+ "step": 17030
+ },
+ {
+ "epoch": 46.40599455040872,
+ "grad_norm": 6.207821846008301,
+ "learning_rate": 1.1642349425223502e-05,
+ "loss": 0.1871,
+ "step": 17031
+ },
+ {
+ "epoch": 46.40871934604905,
+ "grad_norm": 5.177120685577393,
+ "learning_rate": 1.1641478907367157e-05,
+ "loss": 0.1719,
+ "step": 17032
+ },
+ {
+ "epoch": 46.41144414168937,
+ "grad_norm": 7.872409820556641,
+ "learning_rate": 1.1640608376727028e-05,
+ "loss": 0.0984,
+ "step": 17033
+ },
+ {
+ "epoch": 46.4141689373297,
+ "grad_norm": 5.78146505355835,
+ "learning_rate": 1.163973783330989e-05,
+ "loss": 0.1353,
+ "step": 17034
+ },
+ {
+ "epoch": 46.416893732970024,
+ "grad_norm": 4.18654727935791,
+ "learning_rate": 1.1638867277122532e-05,
+ "loss": 0.1558,
+ "step": 17035
+ },
+ {
+ "epoch": 46.41961852861036,
+ "grad_norm": 5.658872127532959,
+ "learning_rate": 1.1637996708171725e-05,
+ "loss": 0.1506,
+ "step": 17036
+ },
+ {
+ "epoch": 46.42234332425068,
+ "grad_norm": 4.325180530548096,
+ "learning_rate": 1.163712612646425e-05,
+ "loss": 0.2835,
+ "step": 17037
+ },
+ {
+ "epoch": 46.42506811989101,
+ "grad_norm": 6.2680277824401855,
+ "learning_rate": 1.1636255532006892e-05,
+ "loss": 0.1261,
+ "step": 17038
+ },
+ {
+ "epoch": 46.427792915531334,
+ "grad_norm": 5.596966743469238,
+ "learning_rate": 1.163538492480643e-05,
+ "loss": 0.1306,
+ "step": 17039
+ },
+ {
+ "epoch": 46.43051771117166,
+ "grad_norm": 7.976938724517822,
+ "learning_rate": 1.1634514304869641e-05,
+ "loss": 0.2746,
+ "step": 17040
+ },
+ {
+ "epoch": 46.433242506811986,
+ "grad_norm": 4.647032737731934,
+ "learning_rate": 1.163364367220331e-05,
+ "loss": 0.1492,
+ "step": 17041
+ },
+ {
+ "epoch": 46.43596730245232,
+ "grad_norm": 4.698653221130371,
+ "learning_rate": 1.1632773026814213e-05,
+ "loss": 0.2278,
+ "step": 17042
+ },
+ {
+ "epoch": 46.438692098092645,
+ "grad_norm": 6.693230628967285,
+ "learning_rate": 1.1631902368709132e-05,
+ "loss": 0.1462,
+ "step": 17043
+ },
+ {
+ "epoch": 46.44141689373297,
+ "grad_norm": 5.366065502166748,
+ "learning_rate": 1.1631031697894846e-05,
+ "loss": 0.1761,
+ "step": 17044
+ },
+ {
+ "epoch": 46.444141689373296,
+ "grad_norm": 5.929636001586914,
+ "learning_rate": 1.1630161014378141e-05,
+ "loss": 0.1365,
+ "step": 17045
+ },
+ {
+ "epoch": 46.44686648501362,
+ "grad_norm": 9.201284408569336,
+ "learning_rate": 1.1629290318165792e-05,
+ "loss": 0.1515,
+ "step": 17046
+ },
+ {
+ "epoch": 46.44959128065395,
+ "grad_norm": 6.123513221740723,
+ "learning_rate": 1.1628419609264582e-05,
+ "loss": 0.2385,
+ "step": 17047
+ },
+ {
+ "epoch": 46.45231607629428,
+ "grad_norm": 5.181742191314697,
+ "learning_rate": 1.1627548887681292e-05,
+ "loss": 0.113,
+ "step": 17048
+ },
+ {
+ "epoch": 46.45504087193461,
+ "grad_norm": 5.155125141143799,
+ "learning_rate": 1.1626678153422708e-05,
+ "loss": 0.2259,
+ "step": 17049
+ },
+ {
+ "epoch": 46.45776566757493,
+ "grad_norm": 5.5835371017456055,
+ "learning_rate": 1.1625807406495605e-05,
+ "loss": 0.1088,
+ "step": 17050
+ },
+ {
+ "epoch": 46.46049046321526,
+ "grad_norm": 5.033536434173584,
+ "learning_rate": 1.1624936646906766e-05,
+ "loss": 0.1226,
+ "step": 17051
+ },
+ {
+ "epoch": 46.463215258855584,
+ "grad_norm": 4.7039618492126465,
+ "learning_rate": 1.1624065874662971e-05,
+ "loss": 0.0793,
+ "step": 17052
+ },
+ {
+ "epoch": 46.46594005449591,
+ "grad_norm": 5.142733097076416,
+ "learning_rate": 1.1623195089771005e-05,
+ "loss": 0.2472,
+ "step": 17053
+ },
+ {
+ "epoch": 46.46866485013624,
+ "grad_norm": 4.57804012298584,
+ "learning_rate": 1.1622324292237645e-05,
+ "loss": 0.1567,
+ "step": 17054
+ },
+ {
+ "epoch": 46.47138964577657,
+ "grad_norm": 5.453049182891846,
+ "learning_rate": 1.162145348206968e-05,
+ "loss": 0.2081,
+ "step": 17055
+ },
+ {
+ "epoch": 46.474114441416894,
+ "grad_norm": 7.133620738983154,
+ "learning_rate": 1.1620582659273882e-05,
+ "loss": 0.1425,
+ "step": 17056
+ },
+ {
+ "epoch": 46.47683923705722,
+ "grad_norm": 5.547028541564941,
+ "learning_rate": 1.1619711823857045e-05,
+ "loss": 0.1772,
+ "step": 17057
+ },
+ {
+ "epoch": 46.479564032697546,
+ "grad_norm": 5.2422919273376465,
+ "learning_rate": 1.161884097582594e-05,
+ "loss": 0.1627,
+ "step": 17058
+ },
+ {
+ "epoch": 46.48228882833787,
+ "grad_norm": 4.932727813720703,
+ "learning_rate": 1.1617970115187356e-05,
+ "loss": 0.1214,
+ "step": 17059
+ },
+ {
+ "epoch": 46.485013623978205,
+ "grad_norm": 4.722919464111328,
+ "learning_rate": 1.1617099241948072e-05,
+ "loss": 0.1622,
+ "step": 17060
+ },
+ {
+ "epoch": 46.48773841961853,
+ "grad_norm": 4.650905132293701,
+ "learning_rate": 1.1616228356114871e-05,
+ "loss": 0.1286,
+ "step": 17061
+ },
+ {
+ "epoch": 46.490463215258856,
+ "grad_norm": 6.387599468231201,
+ "learning_rate": 1.1615357457694534e-05,
+ "loss": 0.1863,
+ "step": 17062
+ },
+ {
+ "epoch": 46.49318801089918,
+ "grad_norm": 6.3198113441467285,
+ "learning_rate": 1.1614486546693848e-05,
+ "loss": 0.2276,
+ "step": 17063
+ },
+ {
+ "epoch": 46.49591280653951,
+ "grad_norm": 13.79389762878418,
+ "learning_rate": 1.1613615623119587e-05,
+ "loss": 0.1833,
+ "step": 17064
+ },
+ {
+ "epoch": 46.49863760217983,
+ "grad_norm": 5.718416690826416,
+ "learning_rate": 1.1612744686978545e-05,
+ "loss": 0.3176,
+ "step": 17065
+ },
+ {
+ "epoch": 46.50136239782017,
+ "grad_norm": 4.466360569000244,
+ "learning_rate": 1.1611873738277499e-05,
+ "loss": 0.1387,
+ "step": 17066
+ },
+ {
+ "epoch": 46.50408719346049,
+ "grad_norm": 16.300098419189453,
+ "learning_rate": 1.1611002777023233e-05,
+ "loss": 0.2676,
+ "step": 17067
+ },
+ {
+ "epoch": 46.50681198910082,
+ "grad_norm": 6.630517482757568,
+ "learning_rate": 1.1610131803222527e-05,
+ "loss": 0.1631,
+ "step": 17068
+ },
+ {
+ "epoch": 46.509536784741144,
+ "grad_norm": 6.6345977783203125,
+ "learning_rate": 1.1609260816882167e-05,
+ "loss": 0.1563,
+ "step": 17069
+ },
+ {
+ "epoch": 46.51226158038147,
+ "grad_norm": 6.348479747772217,
+ "learning_rate": 1.1608389818008933e-05,
+ "loss": 0.2277,
+ "step": 17070
+ },
+ {
+ "epoch": 46.514986376021795,
+ "grad_norm": 6.026793003082275,
+ "learning_rate": 1.1607518806609614e-05,
+ "loss": 0.1413,
+ "step": 17071
+ },
+ {
+ "epoch": 46.51771117166213,
+ "grad_norm": 5.881906509399414,
+ "learning_rate": 1.160664778269099e-05,
+ "loss": 0.2329,
+ "step": 17072
+ },
+ {
+ "epoch": 46.520435967302454,
+ "grad_norm": 5.612852573394775,
+ "learning_rate": 1.1605776746259844e-05,
+ "loss": 0.2504,
+ "step": 17073
+ },
+ {
+ "epoch": 46.52316076294278,
+ "grad_norm": 6.368758201599121,
+ "learning_rate": 1.1604905697322959e-05,
+ "loss": 0.2357,
+ "step": 17074
+ },
+ {
+ "epoch": 46.525885558583106,
+ "grad_norm": 4.724337100982666,
+ "learning_rate": 1.1604034635887123e-05,
+ "loss": 0.1575,
+ "step": 17075
+ },
+ {
+ "epoch": 46.52861035422343,
+ "grad_norm": 6.717184543609619,
+ "learning_rate": 1.1603163561959114e-05,
+ "loss": 0.2689,
+ "step": 17076
+ },
+ {
+ "epoch": 46.53133514986376,
+ "grad_norm": 5.42552375793457,
+ "learning_rate": 1.1602292475545722e-05,
+ "loss": 0.1152,
+ "step": 17077
+ },
+ {
+ "epoch": 46.53405994550409,
+ "grad_norm": 6.456541538238525,
+ "learning_rate": 1.1601421376653725e-05,
+ "loss": 0.2662,
+ "step": 17078
+ },
+ {
+ "epoch": 46.536784741144416,
+ "grad_norm": 7.436701774597168,
+ "learning_rate": 1.1600550265289913e-05,
+ "loss": 0.2448,
+ "step": 17079
+ },
+ {
+ "epoch": 46.53950953678474,
+ "grad_norm": 6.276247024536133,
+ "learning_rate": 1.1599679141461064e-05,
+ "loss": 0.1249,
+ "step": 17080
+ },
+ {
+ "epoch": 46.54223433242507,
+ "grad_norm": 5.149324893951416,
+ "learning_rate": 1.1598808005173967e-05,
+ "loss": 0.2059,
+ "step": 17081
+ },
+ {
+ "epoch": 46.54495912806539,
+ "grad_norm": 5.121246814727783,
+ "learning_rate": 1.15979368564354e-05,
+ "loss": 0.1415,
+ "step": 17082
+ },
+ {
+ "epoch": 46.54768392370572,
+ "grad_norm": 3.952131509780884,
+ "learning_rate": 1.1597065695252158e-05,
+ "loss": 0.1029,
+ "step": 17083
+ },
+ {
+ "epoch": 46.55040871934605,
+ "grad_norm": 5.1012282371521,
+ "learning_rate": 1.1596194521631018e-05,
+ "loss": 0.1665,
+ "step": 17084
+ },
+ {
+ "epoch": 46.55313351498638,
+ "grad_norm": 4.166836738586426,
+ "learning_rate": 1.159532333557877e-05,
+ "loss": 0.0947,
+ "step": 17085
+ },
+ {
+ "epoch": 46.555858310626704,
+ "grad_norm": 5.417153835296631,
+ "learning_rate": 1.159445213710219e-05,
+ "loss": 0.144,
+ "step": 17086
+ },
+ {
+ "epoch": 46.55858310626703,
+ "grad_norm": 4.658019065856934,
+ "learning_rate": 1.159358092620807e-05,
+ "loss": 0.1058,
+ "step": 17087
+ },
+ {
+ "epoch": 46.561307901907355,
+ "grad_norm": 6.91645622253418,
+ "learning_rate": 1.1592709702903193e-05,
+ "loss": 0.1344,
+ "step": 17088
+ },
+ {
+ "epoch": 46.56403269754768,
+ "grad_norm": 6.4773406982421875,
+ "learning_rate": 1.1591838467194345e-05,
+ "loss": 0.238,
+ "step": 17089
+ },
+ {
+ "epoch": 46.566757493188014,
+ "grad_norm": 5.077652454376221,
+ "learning_rate": 1.1590967219088305e-05,
+ "loss": 0.2961,
+ "step": 17090
+ },
+ {
+ "epoch": 46.56948228882834,
+ "grad_norm": 7.711599349975586,
+ "learning_rate": 1.159009595859187e-05,
+ "loss": 0.2155,
+ "step": 17091
+ },
+ {
+ "epoch": 46.572207084468666,
+ "grad_norm": 5.8498430252075195,
+ "learning_rate": 1.1589224685711816e-05,
+ "loss": 0.1707,
+ "step": 17092
+ },
+ {
+ "epoch": 46.57493188010899,
+ "grad_norm": 7.059077739715576,
+ "learning_rate": 1.1588353400454933e-05,
+ "loss": 0.1457,
+ "step": 17093
+ },
+ {
+ "epoch": 46.57765667574932,
+ "grad_norm": 4.909677028656006,
+ "learning_rate": 1.1587482102828002e-05,
+ "loss": 0.2807,
+ "step": 17094
+ },
+ {
+ "epoch": 46.58038147138964,
+ "grad_norm": 5.569499492645264,
+ "learning_rate": 1.1586610792837813e-05,
+ "loss": 0.3366,
+ "step": 17095
+ },
+ {
+ "epoch": 46.583106267029976,
+ "grad_norm": 4.240732669830322,
+ "learning_rate": 1.158573947049115e-05,
+ "loss": 0.147,
+ "step": 17096
+ },
+ {
+ "epoch": 46.5858310626703,
+ "grad_norm": 5.880338668823242,
+ "learning_rate": 1.1584868135794801e-05,
+ "loss": 0.256,
+ "step": 17097
+ },
+ {
+ "epoch": 46.58855585831063,
+ "grad_norm": 5.3914875984191895,
+ "learning_rate": 1.1583996788755548e-05,
+ "loss": 0.1347,
+ "step": 17098
+ },
+ {
+ "epoch": 46.59128065395095,
+ "grad_norm": 7.002774715423584,
+ "learning_rate": 1.1583125429380177e-05,
+ "loss": 0.1488,
+ "step": 17099
+ },
+ {
+ "epoch": 46.59400544959128,
+ "grad_norm": 4.866771697998047,
+ "learning_rate": 1.1582254057675481e-05,
+ "loss": 0.1221,
+ "step": 17100
+ },
+ {
+ "epoch": 46.596730245231605,
+ "grad_norm": 5.560983657836914,
+ "learning_rate": 1.1581382673648238e-05,
+ "loss": 0.2322,
+ "step": 17101
+ },
+ {
+ "epoch": 46.59945504087194,
+ "grad_norm": 5.6942620277404785,
+ "learning_rate": 1.1580511277305238e-05,
+ "loss": 0.1264,
+ "step": 17102
+ },
+ {
+ "epoch": 46.60217983651226,
+ "grad_norm": 5.447231769561768,
+ "learning_rate": 1.1579639868653267e-05,
+ "loss": 0.1602,
+ "step": 17103
+ },
+ {
+ "epoch": 46.60490463215259,
+ "grad_norm": 5.0954179763793945,
+ "learning_rate": 1.1578768447699111e-05,
+ "loss": 0.2193,
+ "step": 17104
+ },
+ {
+ "epoch": 46.607629427792915,
+ "grad_norm": 4.641750812530518,
+ "learning_rate": 1.1577897014449562e-05,
+ "loss": 0.1765,
+ "step": 17105
+ },
+ {
+ "epoch": 46.61035422343324,
+ "grad_norm": 4.832330226898193,
+ "learning_rate": 1.1577025568911395e-05,
+ "loss": 0.1841,
+ "step": 17106
+ },
+ {
+ "epoch": 46.61307901907357,
+ "grad_norm": 5.537833213806152,
+ "learning_rate": 1.1576154111091407e-05,
+ "loss": 0.257,
+ "step": 17107
+ },
+ {
+ "epoch": 46.6158038147139,
+ "grad_norm": 7.282318115234375,
+ "learning_rate": 1.157528264099638e-05,
+ "loss": 0.2022,
+ "step": 17108
+ },
+ {
+ "epoch": 46.618528610354225,
+ "grad_norm": 9.270844459533691,
+ "learning_rate": 1.1574411158633105e-05,
+ "loss": 0.2586,
+ "step": 17109
+ },
+ {
+ "epoch": 46.62125340599455,
+ "grad_norm": 5.545162677764893,
+ "learning_rate": 1.1573539664008367e-05,
+ "loss": 0.1764,
+ "step": 17110
+ },
+ {
+ "epoch": 46.62397820163488,
+ "grad_norm": 4.650853633880615,
+ "learning_rate": 1.157266815712895e-05,
+ "loss": 0.0835,
+ "step": 17111
+ },
+ {
+ "epoch": 46.6267029972752,
+ "grad_norm": 6.177081108093262,
+ "learning_rate": 1.1571796638001644e-05,
+ "loss": 0.1656,
+ "step": 17112
+ },
+ {
+ "epoch": 46.62942779291553,
+ "grad_norm": 6.224137306213379,
+ "learning_rate": 1.1570925106633237e-05,
+ "loss": 0.1861,
+ "step": 17113
+ },
+ {
+ "epoch": 46.63215258855586,
+ "grad_norm": 7.899147987365723,
+ "learning_rate": 1.1570053563030516e-05,
+ "loss": 0.1234,
+ "step": 17114
+ },
+ {
+ "epoch": 46.63487738419619,
+ "grad_norm": 4.292054176330566,
+ "learning_rate": 1.156918200720027e-05,
+ "loss": 0.1391,
+ "step": 17115
+ },
+ {
+ "epoch": 46.63760217983651,
+ "grad_norm": 6.130233287811279,
+ "learning_rate": 1.1568310439149281e-05,
+ "loss": 0.1378,
+ "step": 17116
+ },
+ {
+ "epoch": 46.64032697547684,
+ "grad_norm": 5.36210823059082,
+ "learning_rate": 1.1567438858884344e-05,
+ "loss": 0.2174,
+ "step": 17117
+ },
+ {
+ "epoch": 46.643051771117165,
+ "grad_norm": 4.932548999786377,
+ "learning_rate": 1.1566567266412243e-05,
+ "loss": 0.2543,
+ "step": 17118
+ },
+ {
+ "epoch": 46.64577656675749,
+ "grad_norm": 10.372445106506348,
+ "learning_rate": 1.1565695661739767e-05,
+ "loss": 0.2312,
+ "step": 17119
+ },
+ {
+ "epoch": 46.64850136239782,
+ "grad_norm": 6.825093746185303,
+ "learning_rate": 1.1564824044873704e-05,
+ "loss": 0.1279,
+ "step": 17120
+ },
+ {
+ "epoch": 46.65122615803815,
+ "grad_norm": 6.031970500946045,
+ "learning_rate": 1.156395241582084e-05,
+ "loss": 0.1711,
+ "step": 17121
+ },
+ {
+ "epoch": 46.653950953678475,
+ "grad_norm": 4.9874162673950195,
+ "learning_rate": 1.1563080774587967e-05,
+ "loss": 0.1428,
+ "step": 17122
+ },
+ {
+ "epoch": 46.6566757493188,
+ "grad_norm": 5.995129585266113,
+ "learning_rate": 1.1562209121181869e-05,
+ "loss": 0.1624,
+ "step": 17123
+ },
+ {
+ "epoch": 46.65940054495913,
+ "grad_norm": 4.370136737823486,
+ "learning_rate": 1.1561337455609336e-05,
+ "loss": 0.1771,
+ "step": 17124
+ },
+ {
+ "epoch": 46.66212534059945,
+ "grad_norm": 5.784974575042725,
+ "learning_rate": 1.1560465777877159e-05,
+ "loss": 0.3389,
+ "step": 17125
+ },
+ {
+ "epoch": 46.664850136239785,
+ "grad_norm": 5.641836643218994,
+ "learning_rate": 1.1559594087992126e-05,
+ "loss": 0.1953,
+ "step": 17126
+ },
+ {
+ "epoch": 46.66757493188011,
+ "grad_norm": 4.9505839347839355,
+ "learning_rate": 1.1558722385961022e-05,
+ "loss": 0.1016,
+ "step": 17127
+ },
+ {
+ "epoch": 46.67029972752044,
+ "grad_norm": 6.375181198120117,
+ "learning_rate": 1.1557850671790638e-05,
+ "loss": 0.4016,
+ "step": 17128
+ },
+ {
+ "epoch": 46.67302452316076,
+ "grad_norm": 6.434603214263916,
+ "learning_rate": 1.1556978945487764e-05,
+ "loss": 0.2028,
+ "step": 17129
+ },
+ {
+ "epoch": 46.67574931880109,
+ "grad_norm": 5.105738162994385,
+ "learning_rate": 1.1556107207059191e-05,
+ "loss": 0.1713,
+ "step": 17130
+ },
+ {
+ "epoch": 46.678474114441414,
+ "grad_norm": 6.207189083099365,
+ "learning_rate": 1.15552354565117e-05,
+ "loss": 0.2828,
+ "step": 17131
+ },
+ {
+ "epoch": 46.68119891008175,
+ "grad_norm": 5.005661487579346,
+ "learning_rate": 1.1554363693852088e-05,
+ "loss": 0.3001,
+ "step": 17132
+ },
+ {
+ "epoch": 46.68392370572207,
+ "grad_norm": 4.64664888381958,
+ "learning_rate": 1.155349191908714e-05,
+ "loss": 0.1309,
+ "step": 17133
+ },
+ {
+ "epoch": 46.6866485013624,
+ "grad_norm": 5.883870601654053,
+ "learning_rate": 1.1552620132223649e-05,
+ "loss": 0.1508,
+ "step": 17134
+ },
+ {
+ "epoch": 46.689373297002724,
+ "grad_norm": 6.420288562774658,
+ "learning_rate": 1.1551748333268402e-05,
+ "loss": 0.1644,
+ "step": 17135
+ },
+ {
+ "epoch": 46.69209809264305,
+ "grad_norm": 7.443354606628418,
+ "learning_rate": 1.155087652222819e-05,
+ "loss": 0.2949,
+ "step": 17136
+ },
+ {
+ "epoch": 46.694822888283376,
+ "grad_norm": 4.831696510314941,
+ "learning_rate": 1.1550004699109797e-05,
+ "loss": 0.1808,
+ "step": 17137
+ },
+ {
+ "epoch": 46.69754768392371,
+ "grad_norm": 5.709593772888184,
+ "learning_rate": 1.1549132863920023e-05,
+ "loss": 0.2093,
+ "step": 17138
+ },
+ {
+ "epoch": 46.700272479564035,
+ "grad_norm": 4.546253204345703,
+ "learning_rate": 1.154826101666565e-05,
+ "loss": 0.1078,
+ "step": 17139
+ },
+ {
+ "epoch": 46.70299727520436,
+ "grad_norm": 6.26744270324707,
+ "learning_rate": 1.154738915735347e-05,
+ "loss": 0.2678,
+ "step": 17140
+ },
+ {
+ "epoch": 46.705722070844686,
+ "grad_norm": 4.443904399871826,
+ "learning_rate": 1.1546517285990272e-05,
+ "loss": 0.1163,
+ "step": 17141
+ },
+ {
+ "epoch": 46.70844686648501,
+ "grad_norm": 6.217555522918701,
+ "learning_rate": 1.1545645402582845e-05,
+ "loss": 0.2317,
+ "step": 17142
+ },
+ {
+ "epoch": 46.71117166212534,
+ "grad_norm": 5.766835689544678,
+ "learning_rate": 1.1544773507137985e-05,
+ "loss": 0.1799,
+ "step": 17143
+ },
+ {
+ "epoch": 46.71389645776567,
+ "grad_norm": 5.947284698486328,
+ "learning_rate": 1.1543901599662476e-05,
+ "loss": 0.1737,
+ "step": 17144
+ },
+ {
+ "epoch": 46.716621253406,
+ "grad_norm": 5.5444254875183105,
+ "learning_rate": 1.1543029680163114e-05,
+ "loss": 0.1088,
+ "step": 17145
+ },
+ {
+ "epoch": 46.71934604904632,
+ "grad_norm": 5.982610702514648,
+ "learning_rate": 1.1542157748646687e-05,
+ "loss": 0.1342,
+ "step": 17146
+ },
+ {
+ "epoch": 46.72207084468665,
+ "grad_norm": 5.010898113250732,
+ "learning_rate": 1.1541285805119981e-05,
+ "loss": 0.2159,
+ "step": 17147
+ },
+ {
+ "epoch": 46.724795640326974,
+ "grad_norm": 5.242317199707031,
+ "learning_rate": 1.1540413849589795e-05,
+ "loss": 0.2223,
+ "step": 17148
+ },
+ {
+ "epoch": 46.7275204359673,
+ "grad_norm": 5.874389171600342,
+ "learning_rate": 1.1539541882062912e-05,
+ "loss": 0.1629,
+ "step": 17149
+ },
+ {
+ "epoch": 46.73024523160763,
+ "grad_norm": 5.2313151359558105,
+ "learning_rate": 1.1538669902546128e-05,
+ "loss": 0.1995,
+ "step": 17150
+ },
+ {
+ "epoch": 46.73297002724796,
+ "grad_norm": 4.858578681945801,
+ "learning_rate": 1.153779791104623e-05,
+ "loss": 0.2223,
+ "step": 17151
+ },
+ {
+ "epoch": 46.735694822888284,
+ "grad_norm": 6.7911601066589355,
+ "learning_rate": 1.1536925907570017e-05,
+ "loss": 0.1924,
+ "step": 17152
+ },
+ {
+ "epoch": 46.73841961852861,
+ "grad_norm": 5.80068302154541,
+ "learning_rate": 1.1536053892124271e-05,
+ "loss": 0.1387,
+ "step": 17153
+ },
+ {
+ "epoch": 46.741144414168936,
+ "grad_norm": 6.854654788970947,
+ "learning_rate": 1.1535181864715787e-05,
+ "loss": 0.2084,
+ "step": 17154
+ },
+ {
+ "epoch": 46.74386920980926,
+ "grad_norm": 6.12240743637085,
+ "learning_rate": 1.1534309825351355e-05,
+ "loss": 0.1462,
+ "step": 17155
+ },
+ {
+ "epoch": 46.746594005449595,
+ "grad_norm": 4.873581409454346,
+ "learning_rate": 1.153343777403777e-05,
+ "loss": 0.2224,
+ "step": 17156
+ },
+ {
+ "epoch": 46.74931880108992,
+ "grad_norm": 4.991065502166748,
+ "learning_rate": 1.153256571078182e-05,
+ "loss": 0.3822,
+ "step": 17157
+ },
+ {
+ "epoch": 46.752043596730246,
+ "grad_norm": 5.345722198486328,
+ "learning_rate": 1.1531693635590297e-05,
+ "loss": 0.1559,
+ "step": 17158
+ },
+ {
+ "epoch": 46.75476839237057,
+ "grad_norm": 4.802318096160889,
+ "learning_rate": 1.153082154846999e-05,
+ "loss": 0.0878,
+ "step": 17159
+ },
+ {
+ "epoch": 46.7574931880109,
+ "grad_norm": 16.177759170532227,
+ "learning_rate": 1.15299494494277e-05,
+ "loss": 0.1817,
+ "step": 17160
+ },
+ {
+ "epoch": 46.76021798365122,
+ "grad_norm": 5.017428874969482,
+ "learning_rate": 1.152907733847021e-05,
+ "loss": 0.1373,
+ "step": 17161
+ },
+ {
+ "epoch": 46.762942779291556,
+ "grad_norm": 4.417322635650635,
+ "learning_rate": 1.1528205215604315e-05,
+ "loss": 0.1326,
+ "step": 17162
+ },
+ {
+ "epoch": 46.76566757493188,
+ "grad_norm": 5.657163143157959,
+ "learning_rate": 1.1527333080836807e-05,
+ "loss": 0.2708,
+ "step": 17163
+ },
+ {
+ "epoch": 46.76839237057221,
+ "grad_norm": 6.762208461761475,
+ "learning_rate": 1.152646093417448e-05,
+ "loss": 0.1091,
+ "step": 17164
+ },
+ {
+ "epoch": 46.771117166212534,
+ "grad_norm": 7.414045333862305,
+ "learning_rate": 1.1525588775624122e-05,
+ "loss": 0.1453,
+ "step": 17165
+ },
+ {
+ "epoch": 46.77384196185286,
+ "grad_norm": 4.256861209869385,
+ "learning_rate": 1.1524716605192527e-05,
+ "loss": 0.1232,
+ "step": 17166
+ },
+ {
+ "epoch": 46.776566757493185,
+ "grad_norm": 6.971860885620117,
+ "learning_rate": 1.152384442288649e-05,
+ "loss": 0.131,
+ "step": 17167
+ },
+ {
+ "epoch": 46.77929155313352,
+ "grad_norm": 5.602042198181152,
+ "learning_rate": 1.1522972228712799e-05,
+ "loss": 0.1672,
+ "step": 17168
+ },
+ {
+ "epoch": 46.782016348773844,
+ "grad_norm": 5.54409122467041,
+ "learning_rate": 1.1522100022678251e-05,
+ "loss": 0.2248,
+ "step": 17169
+ },
+ {
+ "epoch": 46.78474114441417,
+ "grad_norm": 4.696835994720459,
+ "learning_rate": 1.1521227804789638e-05,
+ "loss": 0.3056,
+ "step": 17170
+ },
+ {
+ "epoch": 46.787465940054496,
+ "grad_norm": 10.720602035522461,
+ "learning_rate": 1.1520355575053752e-05,
+ "loss": 0.2274,
+ "step": 17171
+ },
+ {
+ "epoch": 46.79019073569482,
+ "grad_norm": 5.531253337860107,
+ "learning_rate": 1.1519483333477385e-05,
+ "loss": 0.1606,
+ "step": 17172
+ },
+ {
+ "epoch": 46.79291553133515,
+ "grad_norm": 5.234531879425049,
+ "learning_rate": 1.151861108006733e-05,
+ "loss": 0.201,
+ "step": 17173
+ },
+ {
+ "epoch": 46.79564032697548,
+ "grad_norm": 7.15482759475708,
+ "learning_rate": 1.1517738814830383e-05,
+ "loss": 0.1566,
+ "step": 17174
+ },
+ {
+ "epoch": 46.798365122615806,
+ "grad_norm": 8.959362983703613,
+ "learning_rate": 1.1516866537773332e-05,
+ "loss": 0.2745,
+ "step": 17175
+ },
+ {
+ "epoch": 46.80108991825613,
+ "grad_norm": 11.96219539642334,
+ "learning_rate": 1.1515994248902976e-05,
+ "loss": 0.2502,
+ "step": 17176
+ },
+ {
+ "epoch": 46.80381471389646,
+ "grad_norm": 4.936633110046387,
+ "learning_rate": 1.1515121948226102e-05,
+ "loss": 0.1515,
+ "step": 17177
+ },
+ {
+ "epoch": 46.80653950953678,
+ "grad_norm": 6.5064568519592285,
+ "learning_rate": 1.1514249635749511e-05,
+ "loss": 0.2102,
+ "step": 17178
+ },
+ {
+ "epoch": 46.80926430517711,
+ "grad_norm": 7.871065139770508,
+ "learning_rate": 1.1513377311479989e-05,
+ "loss": 0.1696,
+ "step": 17179
+ },
+ {
+ "epoch": 46.81198910081744,
+ "grad_norm": 5.331688404083252,
+ "learning_rate": 1.1512504975424338e-05,
+ "loss": 0.1754,
+ "step": 17180
+ },
+ {
+ "epoch": 46.81471389645777,
+ "grad_norm": 5.36503791809082,
+ "learning_rate": 1.1511632627589343e-05,
+ "loss": 0.1506,
+ "step": 17181
+ },
+ {
+ "epoch": 46.817438692098094,
+ "grad_norm": 4.530533790588379,
+ "learning_rate": 1.1510760267981803e-05,
+ "loss": 0.4418,
+ "step": 17182
+ },
+ {
+ "epoch": 46.82016348773842,
+ "grad_norm": 4.749527931213379,
+ "learning_rate": 1.1509887896608509e-05,
+ "loss": 0.1638,
+ "step": 17183
+ },
+ {
+ "epoch": 46.822888283378745,
+ "grad_norm": 5.135331153869629,
+ "learning_rate": 1.150901551347626e-05,
+ "loss": 0.208,
+ "step": 17184
+ },
+ {
+ "epoch": 46.82561307901907,
+ "grad_norm": 6.572135925292969,
+ "learning_rate": 1.1508143118591843e-05,
+ "loss": 0.2513,
+ "step": 17185
+ },
+ {
+ "epoch": 46.828337874659404,
+ "grad_norm": 5.860957622528076,
+ "learning_rate": 1.1507270711962057e-05,
+ "loss": 0.2179,
+ "step": 17186
+ },
+ {
+ "epoch": 46.83106267029973,
+ "grad_norm": 4.241574764251709,
+ "learning_rate": 1.1506398293593697e-05,
+ "loss": 0.1535,
+ "step": 17187
+ },
+ {
+ "epoch": 46.833787465940055,
+ "grad_norm": 5.161186695098877,
+ "learning_rate": 1.1505525863493554e-05,
+ "loss": 0.1632,
+ "step": 17188
+ },
+ {
+ "epoch": 46.83651226158038,
+ "grad_norm": 5.187852382659912,
+ "learning_rate": 1.1504653421668424e-05,
+ "loss": 0.2404,
+ "step": 17189
+ },
+ {
+ "epoch": 46.83923705722071,
+ "grad_norm": 5.943875312805176,
+ "learning_rate": 1.1503780968125105e-05,
+ "loss": 0.2124,
+ "step": 17190
+ },
+ {
+ "epoch": 46.84196185286103,
+ "grad_norm": 8.500675201416016,
+ "learning_rate": 1.1502908502870382e-05,
+ "loss": 0.3095,
+ "step": 17191
+ },
+ {
+ "epoch": 46.844686648501366,
+ "grad_norm": 5.175501346588135,
+ "learning_rate": 1.1502036025911061e-05,
+ "loss": 0.1518,
+ "step": 17192
+ },
+ {
+ "epoch": 46.84741144414169,
+ "grad_norm": 6.077765941619873,
+ "learning_rate": 1.150116353725393e-05,
+ "loss": 0.148,
+ "step": 17193
+ },
+ {
+ "epoch": 46.85013623978202,
+ "grad_norm": 5.665741443634033,
+ "learning_rate": 1.1500291036905784e-05,
+ "loss": 0.1457,
+ "step": 17194
+ },
+ {
+ "epoch": 46.85286103542234,
+ "grad_norm": 5.57317590713501,
+ "learning_rate": 1.1499418524873422e-05,
+ "loss": 0.3059,
+ "step": 17195
+ },
+ {
+ "epoch": 46.85558583106267,
+ "grad_norm": 6.533044338226318,
+ "learning_rate": 1.1498546001163638e-05,
+ "loss": 0.1403,
+ "step": 17196
+ },
+ {
+ "epoch": 46.858310626702995,
+ "grad_norm": 6.13126802444458,
+ "learning_rate": 1.1497673465783224e-05,
+ "loss": 0.2343,
+ "step": 17197
+ },
+ {
+ "epoch": 46.86103542234333,
+ "grad_norm": 5.1407060623168945,
+ "learning_rate": 1.1496800918738977e-05,
+ "loss": 0.1411,
+ "step": 17198
+ },
+ {
+ "epoch": 46.86376021798365,
+ "grad_norm": 8.173460960388184,
+ "learning_rate": 1.1495928360037691e-05,
+ "loss": 0.3423,
+ "step": 17199
+ },
+ {
+ "epoch": 46.86648501362398,
+ "grad_norm": 55.221885681152344,
+ "learning_rate": 1.1495055789686167e-05,
+ "loss": 0.2487,
+ "step": 17200
+ },
+ {
+ "epoch": 46.869209809264305,
+ "grad_norm": 7.013250827789307,
+ "learning_rate": 1.1494183207691194e-05,
+ "loss": 0.2019,
+ "step": 17201
+ },
+ {
+ "epoch": 46.87193460490463,
+ "grad_norm": 6.132880687713623,
+ "learning_rate": 1.149331061405957e-05,
+ "loss": 0.3039,
+ "step": 17202
+ },
+ {
+ "epoch": 46.87465940054496,
+ "grad_norm": 5.015172481536865,
+ "learning_rate": 1.1492438008798093e-05,
+ "loss": 0.2782,
+ "step": 17203
+ },
+ {
+ "epoch": 46.87738419618529,
+ "grad_norm": 6.557510852813721,
+ "learning_rate": 1.1491565391913555e-05,
+ "loss": 0.2694,
+ "step": 17204
+ },
+ {
+ "epoch": 46.880108991825615,
+ "grad_norm": 5.464590549468994,
+ "learning_rate": 1.1490692763412757e-05,
+ "loss": 0.439,
+ "step": 17205
+ },
+ {
+ "epoch": 46.88283378746594,
+ "grad_norm": 6.250936985015869,
+ "learning_rate": 1.1489820123302487e-05,
+ "loss": 0.1631,
+ "step": 17206
+ },
+ {
+ "epoch": 46.88555858310627,
+ "grad_norm": 5.934758186340332,
+ "learning_rate": 1.148894747158955e-05,
+ "loss": 0.186,
+ "step": 17207
+ },
+ {
+ "epoch": 46.88828337874659,
+ "grad_norm": 6.300573825836182,
+ "learning_rate": 1.1488074808280736e-05,
+ "loss": 0.2138,
+ "step": 17208
+ },
+ {
+ "epoch": 46.89100817438692,
+ "grad_norm": 4.808372497558594,
+ "learning_rate": 1.1487202133382844e-05,
+ "loss": 0.1864,
+ "step": 17209
+ },
+ {
+ "epoch": 46.89373297002725,
+ "grad_norm": 6.009509086608887,
+ "learning_rate": 1.1486329446902669e-05,
+ "loss": 0.1864,
+ "step": 17210
+ },
+ {
+ "epoch": 46.89645776566758,
+ "grad_norm": 5.693976402282715,
+ "learning_rate": 1.1485456748847006e-05,
+ "loss": 0.2315,
+ "step": 17211
+ },
+ {
+ "epoch": 46.8991825613079,
+ "grad_norm": 5.321122646331787,
+ "learning_rate": 1.1484584039222655e-05,
+ "loss": 0.313,
+ "step": 17212
+ },
+ {
+ "epoch": 46.90190735694823,
+ "grad_norm": 5.934122085571289,
+ "learning_rate": 1.1483711318036414e-05,
+ "loss": 0.1433,
+ "step": 17213
+ },
+ {
+ "epoch": 46.904632152588555,
+ "grad_norm": 5.832672119140625,
+ "learning_rate": 1.1482838585295076e-05,
+ "loss": 0.156,
+ "step": 17214
+ },
+ {
+ "epoch": 46.90735694822888,
+ "grad_norm": 6.689321041107178,
+ "learning_rate": 1.1481965841005438e-05,
+ "loss": 0.2502,
+ "step": 17215
+ },
+ {
+ "epoch": 46.91008174386921,
+ "grad_norm": 6.460909843444824,
+ "learning_rate": 1.1481093085174298e-05,
+ "loss": 0.2513,
+ "step": 17216
+ },
+ {
+ "epoch": 46.91280653950954,
+ "grad_norm": 6.603307247161865,
+ "learning_rate": 1.1480220317808453e-05,
+ "loss": 0.3076,
+ "step": 17217
+ },
+ {
+ "epoch": 46.915531335149865,
+ "grad_norm": 7.377344131469727,
+ "learning_rate": 1.1479347538914698e-05,
+ "loss": 0.2427,
+ "step": 17218
+ },
+ {
+ "epoch": 46.91825613079019,
+ "grad_norm": 4.96650505065918,
+ "learning_rate": 1.1478474748499833e-05,
+ "loss": 0.1482,
+ "step": 17219
+ },
+ {
+ "epoch": 46.920980926430516,
+ "grad_norm": 6.873035907745361,
+ "learning_rate": 1.1477601946570651e-05,
+ "loss": 0.2652,
+ "step": 17220
+ },
+ {
+ "epoch": 46.92370572207084,
+ "grad_norm": 5.6309309005737305,
+ "learning_rate": 1.147672913313396e-05,
+ "loss": 0.185,
+ "step": 17221
+ },
+ {
+ "epoch": 46.926430517711175,
+ "grad_norm": 5.095126152038574,
+ "learning_rate": 1.1475856308196544e-05,
+ "loss": 0.204,
+ "step": 17222
+ },
+ {
+ "epoch": 46.9291553133515,
+ "grad_norm": 6.1172966957092285,
+ "learning_rate": 1.1474983471765211e-05,
+ "loss": 0.2061,
+ "step": 17223
+ },
+ {
+ "epoch": 46.93188010899183,
+ "grad_norm": 8.968783378601074,
+ "learning_rate": 1.147411062384675e-05,
+ "loss": 0.258,
+ "step": 17224
+ },
+ {
+ "epoch": 46.93460490463215,
+ "grad_norm": 8.455772399902344,
+ "learning_rate": 1.1473237764447967e-05,
+ "loss": 0.1856,
+ "step": 17225
+ },
+ {
+ "epoch": 46.93732970027248,
+ "grad_norm": 5.343738555908203,
+ "learning_rate": 1.1472364893575651e-05,
+ "loss": 0.1199,
+ "step": 17226
+ },
+ {
+ "epoch": 46.940054495912804,
+ "grad_norm": 5.777643203735352,
+ "learning_rate": 1.1471492011236609e-05,
+ "loss": 0.2207,
+ "step": 17227
+ },
+ {
+ "epoch": 46.94277929155314,
+ "grad_norm": 6.920644283294678,
+ "learning_rate": 1.1470619117437629e-05,
+ "loss": 0.2204,
+ "step": 17228
+ },
+ {
+ "epoch": 46.94550408719346,
+ "grad_norm": 7.075724124908447,
+ "learning_rate": 1.146974621218552e-05,
+ "loss": 0.2559,
+ "step": 17229
+ },
+ {
+ "epoch": 46.94822888283379,
+ "grad_norm": 6.458963871002197,
+ "learning_rate": 1.1468873295487073e-05,
+ "loss": 0.2609,
+ "step": 17230
+ },
+ {
+ "epoch": 46.950953678474114,
+ "grad_norm": 8.322772979736328,
+ "learning_rate": 1.1468000367349088e-05,
+ "loss": 0.1818,
+ "step": 17231
+ },
+ {
+ "epoch": 46.95367847411444,
+ "grad_norm": 5.9607672691345215,
+ "learning_rate": 1.1467127427778364e-05,
+ "loss": 0.1233,
+ "step": 17232
+ },
+ {
+ "epoch": 46.956403269754766,
+ "grad_norm": 4.860105991363525,
+ "learning_rate": 1.14662544767817e-05,
+ "loss": 0.2093,
+ "step": 17233
+ },
+ {
+ "epoch": 46.95912806539509,
+ "grad_norm": 9.473416328430176,
+ "learning_rate": 1.146538151436589e-05,
+ "loss": 0.1582,
+ "step": 17234
+ },
+ {
+ "epoch": 46.961852861035425,
+ "grad_norm": 13.880687713623047,
+ "learning_rate": 1.1464508540537738e-05,
+ "loss": 0.2226,
+ "step": 17235
+ },
+ {
+ "epoch": 46.96457765667575,
+ "grad_norm": 4.40953254699707,
+ "learning_rate": 1.1463635555304038e-05,
+ "loss": 0.1368,
+ "step": 17236
+ },
+ {
+ "epoch": 46.967302452316076,
+ "grad_norm": 5.262019157409668,
+ "learning_rate": 1.1462762558671594e-05,
+ "loss": 0.1339,
+ "step": 17237
+ },
+ {
+ "epoch": 46.9700272479564,
+ "grad_norm": 4.952602386474609,
+ "learning_rate": 1.14618895506472e-05,
+ "loss": 0.239,
+ "step": 17238
+ },
+ {
+ "epoch": 46.97275204359673,
+ "grad_norm": 6.291650772094727,
+ "learning_rate": 1.1461016531237661e-05,
+ "loss": 0.138,
+ "step": 17239
+ },
+ {
+ "epoch": 46.97547683923706,
+ "grad_norm": 4.404817581176758,
+ "learning_rate": 1.1460143500449769e-05,
+ "loss": 0.3566,
+ "step": 17240
+ },
+ {
+ "epoch": 46.97820163487739,
+ "grad_norm": 6.670058250427246,
+ "learning_rate": 1.145927045829033e-05,
+ "loss": 0.2422,
+ "step": 17241
+ },
+ {
+ "epoch": 46.98092643051771,
+ "grad_norm": 3.762319564819336,
+ "learning_rate": 1.1458397404766138e-05,
+ "loss": 0.1222,
+ "step": 17242
+ },
+ {
+ "epoch": 46.98365122615804,
+ "grad_norm": 5.879096508026123,
+ "learning_rate": 1.1457524339883994e-05,
+ "loss": 0.2251,
+ "step": 17243
+ },
+ {
+ "epoch": 46.986376021798364,
+ "grad_norm": 5.028500556945801,
+ "learning_rate": 1.1456651263650695e-05,
+ "loss": 0.1746,
+ "step": 17244
+ },
+ {
+ "epoch": 46.98910081743869,
+ "grad_norm": 4.749955177307129,
+ "learning_rate": 1.1455778176073045e-05,
+ "loss": 0.1785,
+ "step": 17245
+ },
+ {
+ "epoch": 46.991825613079016,
+ "grad_norm": 5.498077869415283,
+ "learning_rate": 1.1454905077157839e-05,
+ "loss": 0.123,
+ "step": 17246
+ },
+ {
+ "epoch": 46.99455040871935,
+ "grad_norm": 4.786930561065674,
+ "learning_rate": 1.1454031966911883e-05,
+ "loss": 0.1777,
+ "step": 17247
+ },
+ {
+ "epoch": 46.997275204359674,
+ "grad_norm": 5.84864616394043,
+ "learning_rate": 1.1453158845341969e-05,
+ "loss": 0.1277,
+ "step": 17248
+ },
+ {
+ "epoch": 47.0,
+ "grad_norm": 4.433199882507324,
+ "learning_rate": 1.1452285712454905e-05,
+ "loss": 0.0942,
+ "step": 17249
+ },
+ {
+ "epoch": 47.002724795640326,
+ "grad_norm": 5.735518932342529,
+ "learning_rate": 1.1451412568257484e-05,
+ "loss": 0.1767,
+ "step": 17250
+ },
+ {
+ "epoch": 47.00544959128065,
+ "grad_norm": 4.625182151794434,
+ "learning_rate": 1.1450539412756509e-05,
+ "loss": 0.1015,
+ "step": 17251
+ },
+ {
+ "epoch": 47.00817438692098,
+ "grad_norm": 18.605335235595703,
+ "learning_rate": 1.144966624595878e-05,
+ "loss": 0.1508,
+ "step": 17252
+ },
+ {
+ "epoch": 47.01089918256131,
+ "grad_norm": 6.5579142570495605,
+ "learning_rate": 1.1448793067871095e-05,
+ "loss": 0.1519,
+ "step": 17253
+ },
+ {
+ "epoch": 47.013623978201636,
+ "grad_norm": 6.73146390914917,
+ "learning_rate": 1.1447919878500255e-05,
+ "loss": 0.1431,
+ "step": 17254
+ },
+ {
+ "epoch": 47.01634877384196,
+ "grad_norm": 10.806292533874512,
+ "learning_rate": 1.1447046677853066e-05,
+ "loss": 0.3581,
+ "step": 17255
+ },
+ {
+ "epoch": 47.01907356948229,
+ "grad_norm": 7.758955478668213,
+ "learning_rate": 1.1446173465936322e-05,
+ "loss": 0.2293,
+ "step": 17256
+ },
+ {
+ "epoch": 47.02179836512261,
+ "grad_norm": 5.246854305267334,
+ "learning_rate": 1.1445300242756827e-05,
+ "loss": 0.1232,
+ "step": 17257
+ },
+ {
+ "epoch": 47.02452316076294,
+ "grad_norm": 4.2169389724731445,
+ "learning_rate": 1.144442700832138e-05,
+ "loss": 0.1807,
+ "step": 17258
+ },
+ {
+ "epoch": 47.02724795640327,
+ "grad_norm": 5.507205486297607,
+ "learning_rate": 1.1443553762636781e-05,
+ "loss": 0.1362,
+ "step": 17259
+ },
+ {
+ "epoch": 47.0299727520436,
+ "grad_norm": 6.601847171783447,
+ "learning_rate": 1.1442680505709832e-05,
+ "loss": 0.1526,
+ "step": 17260
+ },
+ {
+ "epoch": 47.032697547683924,
+ "grad_norm": 4.276211738586426,
+ "learning_rate": 1.1441807237547336e-05,
+ "loss": 0.1558,
+ "step": 17261
+ },
+ {
+ "epoch": 47.03542234332425,
+ "grad_norm": 4.014583110809326,
+ "learning_rate": 1.1440933958156087e-05,
+ "loss": 0.1796,
+ "step": 17262
+ },
+ {
+ "epoch": 47.038147138964575,
+ "grad_norm": 9.991283416748047,
+ "learning_rate": 1.1440060667542891e-05,
+ "loss": 0.1512,
+ "step": 17263
+ },
+ {
+ "epoch": 47.0408719346049,
+ "grad_norm": 4.610074520111084,
+ "learning_rate": 1.143918736571455e-05,
+ "loss": 0.1224,
+ "step": 17264
+ },
+ {
+ "epoch": 47.043596730245234,
+ "grad_norm": 5.848897457122803,
+ "learning_rate": 1.1438314052677865e-05,
+ "loss": 0.1876,
+ "step": 17265
+ },
+ {
+ "epoch": 47.04632152588556,
+ "grad_norm": 6.770817756652832,
+ "learning_rate": 1.1437440728439637e-05,
+ "loss": 0.1305,
+ "step": 17266
+ },
+ {
+ "epoch": 47.049046321525886,
+ "grad_norm": 7.044491291046143,
+ "learning_rate": 1.1436567393006668e-05,
+ "loss": 0.204,
+ "step": 17267
+ },
+ {
+ "epoch": 47.05177111716621,
+ "grad_norm": 5.467977046966553,
+ "learning_rate": 1.1435694046385755e-05,
+ "loss": 0.1817,
+ "step": 17268
+ },
+ {
+ "epoch": 47.05449591280654,
+ "grad_norm": 5.026775360107422,
+ "learning_rate": 1.1434820688583706e-05,
+ "loss": 0.1329,
+ "step": 17269
+ },
+ {
+ "epoch": 47.05722070844686,
+ "grad_norm": 6.125763416290283,
+ "learning_rate": 1.1433947319607318e-05,
+ "loss": 0.1733,
+ "step": 17270
+ },
+ {
+ "epoch": 47.059945504087196,
+ "grad_norm": 6.257920742034912,
+ "learning_rate": 1.1433073939463393e-05,
+ "loss": 0.152,
+ "step": 17271
+ },
+ {
+ "epoch": 47.06267029972752,
+ "grad_norm": 7.099124908447266,
+ "learning_rate": 1.1432200548158738e-05,
+ "loss": 0.2168,
+ "step": 17272
+ },
+ {
+ "epoch": 47.06539509536785,
+ "grad_norm": 6.816453456878662,
+ "learning_rate": 1.1431327145700149e-05,
+ "loss": 0.2618,
+ "step": 17273
+ },
+ {
+ "epoch": 47.06811989100817,
+ "grad_norm": 5.101950168609619,
+ "learning_rate": 1.143045373209443e-05,
+ "loss": 0.1437,
+ "step": 17274
+ },
+ {
+ "epoch": 47.0708446866485,
+ "grad_norm": 17.04148292541504,
+ "learning_rate": 1.1429580307348385e-05,
+ "loss": 0.1967,
+ "step": 17275
+ },
+ {
+ "epoch": 47.073569482288825,
+ "grad_norm": 5.364077091217041,
+ "learning_rate": 1.142870687146881e-05,
+ "loss": 0.1554,
+ "step": 17276
+ },
+ {
+ "epoch": 47.07629427792916,
+ "grad_norm": 6.201749324798584,
+ "learning_rate": 1.1427833424462517e-05,
+ "loss": 0.19,
+ "step": 17277
+ },
+ {
+ "epoch": 47.079019073569484,
+ "grad_norm": 5.364887714385986,
+ "learning_rate": 1.1426959966336302e-05,
+ "loss": 0.2224,
+ "step": 17278
+ },
+ {
+ "epoch": 47.08174386920981,
+ "grad_norm": 7.636233806610107,
+ "learning_rate": 1.1426086497096966e-05,
+ "loss": 0.1855,
+ "step": 17279
+ },
+ {
+ "epoch": 47.084468664850135,
+ "grad_norm": 5.564447402954102,
+ "learning_rate": 1.1425213016751317e-05,
+ "loss": 0.1315,
+ "step": 17280
+ },
+ {
+ "epoch": 47.08719346049046,
+ "grad_norm": 4.97089958190918,
+ "learning_rate": 1.1424339525306154e-05,
+ "loss": 0.1413,
+ "step": 17281
+ },
+ {
+ "epoch": 47.08991825613079,
+ "grad_norm": 4.3761091232299805,
+ "learning_rate": 1.1423466022768283e-05,
+ "loss": 0.1186,
+ "step": 17282
+ },
+ {
+ "epoch": 47.09264305177112,
+ "grad_norm": 15.600180625915527,
+ "learning_rate": 1.14225925091445e-05,
+ "loss": 0.2701,
+ "step": 17283
+ },
+ {
+ "epoch": 47.095367847411445,
+ "grad_norm": 5.563814640045166,
+ "learning_rate": 1.1421718984441617e-05,
+ "loss": 0.2928,
+ "step": 17284
+ },
+ {
+ "epoch": 47.09809264305177,
+ "grad_norm": 6.132524490356445,
+ "learning_rate": 1.1420845448666429e-05,
+ "loss": 0.3414,
+ "step": 17285
+ },
+ {
+ "epoch": 47.1008174386921,
+ "grad_norm": 4.493549346923828,
+ "learning_rate": 1.1419971901825743e-05,
+ "loss": 0.2024,
+ "step": 17286
+ },
+ {
+ "epoch": 47.10354223433242,
+ "grad_norm": 11.406949043273926,
+ "learning_rate": 1.1419098343926363e-05,
+ "loss": 0.2807,
+ "step": 17287
+ },
+ {
+ "epoch": 47.10626702997275,
+ "grad_norm": 15.65683364868164,
+ "learning_rate": 1.1418224774975088e-05,
+ "loss": 0.1355,
+ "step": 17288
+ },
+ {
+ "epoch": 47.10899182561308,
+ "grad_norm": 6.96215295791626,
+ "learning_rate": 1.1417351194978725e-05,
+ "loss": 0.316,
+ "step": 17289
+ },
+ {
+ "epoch": 47.11171662125341,
+ "grad_norm": 8.716181755065918,
+ "learning_rate": 1.1416477603944078e-05,
+ "loss": 0.17,
+ "step": 17290
+ },
+ {
+ "epoch": 47.11444141689373,
+ "grad_norm": 5.2091217041015625,
+ "learning_rate": 1.1415604001877949e-05,
+ "loss": 0.2232,
+ "step": 17291
+ },
+ {
+ "epoch": 47.11716621253406,
+ "grad_norm": 11.852521896362305,
+ "learning_rate": 1.1414730388787143e-05,
+ "loss": 0.1593,
+ "step": 17292
+ },
+ {
+ "epoch": 47.119891008174385,
+ "grad_norm": 6.9596757888793945,
+ "learning_rate": 1.1413856764678459e-05,
+ "loss": 0.1775,
+ "step": 17293
+ },
+ {
+ "epoch": 47.12261580381471,
+ "grad_norm": 4.772704601287842,
+ "learning_rate": 1.1412983129558706e-05,
+ "loss": 0.2445,
+ "step": 17294
+ },
+ {
+ "epoch": 47.12534059945504,
+ "grad_norm": 6.12083625793457,
+ "learning_rate": 1.1412109483434683e-05,
+ "loss": 0.1868,
+ "step": 17295
+ },
+ {
+ "epoch": 47.12806539509537,
+ "grad_norm": 6.204431533813477,
+ "learning_rate": 1.1411235826313201e-05,
+ "loss": 0.2229,
+ "step": 17296
+ },
+ {
+ "epoch": 47.130790190735695,
+ "grad_norm": 5.632849216461182,
+ "learning_rate": 1.1410362158201054e-05,
+ "loss": 0.3334,
+ "step": 17297
+ },
+ {
+ "epoch": 47.13351498637602,
+ "grad_norm": 8.755095481872559,
+ "learning_rate": 1.1409488479105058e-05,
+ "loss": 0.1777,
+ "step": 17298
+ },
+ {
+ "epoch": 47.13623978201635,
+ "grad_norm": 4.300026893615723,
+ "learning_rate": 1.1408614789032007e-05,
+ "loss": 0.1565,
+ "step": 17299
+ },
+ {
+ "epoch": 47.13896457765667,
+ "grad_norm": 5.8478803634643555,
+ "learning_rate": 1.1407741087988713e-05,
+ "loss": 0.1355,
+ "step": 17300
+ },
+ {
+ "epoch": 47.141689373297005,
+ "grad_norm": 9.44076919555664,
+ "learning_rate": 1.1406867375981975e-05,
+ "loss": 0.2481,
+ "step": 17301
+ },
+ {
+ "epoch": 47.14441416893733,
+ "grad_norm": 5.266812801361084,
+ "learning_rate": 1.1405993653018599e-05,
+ "loss": 0.1623,
+ "step": 17302
+ },
+ {
+ "epoch": 47.14713896457766,
+ "grad_norm": 4.535799026489258,
+ "learning_rate": 1.1405119919105387e-05,
+ "loss": 0.1985,
+ "step": 17303
+ },
+ {
+ "epoch": 47.14986376021798,
+ "grad_norm": 6.18609094619751,
+ "learning_rate": 1.1404246174249152e-05,
+ "loss": 0.1531,
+ "step": 17304
+ },
+ {
+ "epoch": 47.15258855585831,
+ "grad_norm": 4.408097743988037,
+ "learning_rate": 1.1403372418456687e-05,
+ "loss": 0.2456,
+ "step": 17305
+ },
+ {
+ "epoch": 47.155313351498634,
+ "grad_norm": 5.561338901519775,
+ "learning_rate": 1.1402498651734806e-05,
+ "loss": 0.1267,
+ "step": 17306
+ },
+ {
+ "epoch": 47.15803814713897,
+ "grad_norm": 5.082563877105713,
+ "learning_rate": 1.1401624874090309e-05,
+ "loss": 0.1825,
+ "step": 17307
+ },
+ {
+ "epoch": 47.16076294277929,
+ "grad_norm": 5.351593494415283,
+ "learning_rate": 1.1400751085530006e-05,
+ "loss": 0.1378,
+ "step": 17308
+ },
+ {
+ "epoch": 47.16348773841962,
+ "grad_norm": 8.034741401672363,
+ "learning_rate": 1.1399877286060695e-05,
+ "loss": 0.1617,
+ "step": 17309
+ },
+ {
+ "epoch": 47.166212534059945,
+ "grad_norm": 10.069036483764648,
+ "learning_rate": 1.1399003475689187e-05,
+ "loss": 0.125,
+ "step": 17310
+ },
+ {
+ "epoch": 47.16893732970027,
+ "grad_norm": 4.9894490242004395,
+ "learning_rate": 1.1398129654422284e-05,
+ "loss": 0.2234,
+ "step": 17311
+ },
+ {
+ "epoch": 47.171662125340596,
+ "grad_norm": 5.806913375854492,
+ "learning_rate": 1.1397255822266794e-05,
+ "loss": 0.1104,
+ "step": 17312
+ },
+ {
+ "epoch": 47.17438692098093,
+ "grad_norm": 13.047809600830078,
+ "learning_rate": 1.1396381979229518e-05,
+ "loss": 0.2257,
+ "step": 17313
+ },
+ {
+ "epoch": 47.177111716621255,
+ "grad_norm": 6.9155168533325195,
+ "learning_rate": 1.1395508125317266e-05,
+ "loss": 0.1387,
+ "step": 17314
+ },
+ {
+ "epoch": 47.17983651226158,
+ "grad_norm": 4.971002578735352,
+ "learning_rate": 1.1394634260536839e-05,
+ "loss": 0.1436,
+ "step": 17315
+ },
+ {
+ "epoch": 47.182561307901906,
+ "grad_norm": 14.82128620147705,
+ "learning_rate": 1.1393760384895047e-05,
+ "loss": 0.1135,
+ "step": 17316
+ },
+ {
+ "epoch": 47.18528610354223,
+ "grad_norm": 6.719625949859619,
+ "learning_rate": 1.1392886498398695e-05,
+ "loss": 0.1841,
+ "step": 17317
+ },
+ {
+ "epoch": 47.18801089918256,
+ "grad_norm": 4.952080249786377,
+ "learning_rate": 1.1392012601054588e-05,
+ "loss": 0.1434,
+ "step": 17318
+ },
+ {
+ "epoch": 47.19073569482289,
+ "grad_norm": 5.241774082183838,
+ "learning_rate": 1.1391138692869528e-05,
+ "loss": 0.1313,
+ "step": 17319
+ },
+ {
+ "epoch": 47.19346049046322,
+ "grad_norm": 5.519021987915039,
+ "learning_rate": 1.1390264773850329e-05,
+ "loss": 0.1473,
+ "step": 17320
+ },
+ {
+ "epoch": 47.19618528610354,
+ "grad_norm": 10.155780792236328,
+ "learning_rate": 1.1389390844003789e-05,
+ "loss": 0.199,
+ "step": 17321
+ },
+ {
+ "epoch": 47.19891008174387,
+ "grad_norm": 7.600268840789795,
+ "learning_rate": 1.138851690333672e-05,
+ "loss": 0.2099,
+ "step": 17322
+ },
+ {
+ "epoch": 47.201634877384194,
+ "grad_norm": 5.401339530944824,
+ "learning_rate": 1.1387642951855925e-05,
+ "loss": 0.2131,
+ "step": 17323
+ },
+ {
+ "epoch": 47.20435967302452,
+ "grad_norm": 5.1407365798950195,
+ "learning_rate": 1.1386768989568213e-05,
+ "loss": 0.1204,
+ "step": 17324
+ },
+ {
+ "epoch": 47.20708446866485,
+ "grad_norm": 7.2260422706604,
+ "learning_rate": 1.1385895016480387e-05,
+ "loss": 0.1996,
+ "step": 17325
+ },
+ {
+ "epoch": 47.20980926430518,
+ "grad_norm": 8.958779335021973,
+ "learning_rate": 1.1385021032599257e-05,
+ "loss": 0.1553,
+ "step": 17326
+ },
+ {
+ "epoch": 47.212534059945504,
+ "grad_norm": 4.629421710968018,
+ "learning_rate": 1.1384147037931625e-05,
+ "loss": 0.0848,
+ "step": 17327
+ },
+ {
+ "epoch": 47.21525885558583,
+ "grad_norm": 7.2963128089904785,
+ "learning_rate": 1.1383273032484302e-05,
+ "loss": 0.2914,
+ "step": 17328
+ },
+ {
+ "epoch": 47.217983651226156,
+ "grad_norm": 8.382322311401367,
+ "learning_rate": 1.1382399016264093e-05,
+ "loss": 0.1498,
+ "step": 17329
+ },
+ {
+ "epoch": 47.22070844686648,
+ "grad_norm": 4.128012657165527,
+ "learning_rate": 1.1381524989277807e-05,
+ "loss": 0.2148,
+ "step": 17330
+ },
+ {
+ "epoch": 47.223433242506815,
+ "grad_norm": 4.981644630432129,
+ "learning_rate": 1.1380650951532243e-05,
+ "loss": 0.1136,
+ "step": 17331
+ },
+ {
+ "epoch": 47.22615803814714,
+ "grad_norm": 5.655073165893555,
+ "learning_rate": 1.137977690303422e-05,
+ "loss": 0.393,
+ "step": 17332
+ },
+ {
+ "epoch": 47.228882833787466,
+ "grad_norm": 4.699531078338623,
+ "learning_rate": 1.1378902843790538e-05,
+ "loss": 0.3039,
+ "step": 17333
+ },
+ {
+ "epoch": 47.23160762942779,
+ "grad_norm": 6.343612194061279,
+ "learning_rate": 1.1378028773808003e-05,
+ "loss": 0.1774,
+ "step": 17334
+ },
+ {
+ "epoch": 47.23433242506812,
+ "grad_norm": 5.021273136138916,
+ "learning_rate": 1.1377154693093426e-05,
+ "loss": 0.0888,
+ "step": 17335
+ },
+ {
+ "epoch": 47.237057220708444,
+ "grad_norm": 4.948480129241943,
+ "learning_rate": 1.1376280601653613e-05,
+ "loss": 0.1255,
+ "step": 17336
+ },
+ {
+ "epoch": 47.23978201634878,
+ "grad_norm": 5.859848976135254,
+ "learning_rate": 1.1375406499495367e-05,
+ "loss": 0.3579,
+ "step": 17337
+ },
+ {
+ "epoch": 47.2425068119891,
+ "grad_norm": 7.666250705718994,
+ "learning_rate": 1.1374532386625506e-05,
+ "loss": 0.1589,
+ "step": 17338
+ },
+ {
+ "epoch": 47.24523160762943,
+ "grad_norm": 7.62019157409668,
+ "learning_rate": 1.1373658263050824e-05,
+ "loss": 0.2307,
+ "step": 17339
+ },
+ {
+ "epoch": 47.247956403269754,
+ "grad_norm": 7.805665969848633,
+ "learning_rate": 1.1372784128778138e-05,
+ "loss": 0.274,
+ "step": 17340
+ },
+ {
+ "epoch": 47.25068119891008,
+ "grad_norm": 5.220042705535889,
+ "learning_rate": 1.1371909983814253e-05,
+ "loss": 0.2284,
+ "step": 17341
+ },
+ {
+ "epoch": 47.253405994550405,
+ "grad_norm": 5.222188949584961,
+ "learning_rate": 1.1371035828165979e-05,
+ "loss": 0.2258,
+ "step": 17342
+ },
+ {
+ "epoch": 47.25613079019074,
+ "grad_norm": 4.879983425140381,
+ "learning_rate": 1.1370161661840122e-05,
+ "loss": 0.2649,
+ "step": 17343
+ },
+ {
+ "epoch": 47.258855585831064,
+ "grad_norm": 4.29693603515625,
+ "learning_rate": 1.136928748484349e-05,
+ "loss": 0.2224,
+ "step": 17344
+ },
+ {
+ "epoch": 47.26158038147139,
+ "grad_norm": 6.894303321838379,
+ "learning_rate": 1.1368413297182892e-05,
+ "loss": 0.2061,
+ "step": 17345
+ },
+ {
+ "epoch": 47.264305177111716,
+ "grad_norm": 4.151698589324951,
+ "learning_rate": 1.1367539098865134e-05,
+ "loss": 0.1359,
+ "step": 17346
+ },
+ {
+ "epoch": 47.26702997275204,
+ "grad_norm": 7.282924175262451,
+ "learning_rate": 1.1366664889897025e-05,
+ "loss": 0.1911,
+ "step": 17347
+ },
+ {
+ "epoch": 47.26975476839237,
+ "grad_norm": 11.262412071228027,
+ "learning_rate": 1.1365790670285372e-05,
+ "loss": 0.2117,
+ "step": 17348
+ },
+ {
+ "epoch": 47.2724795640327,
+ "grad_norm": 5.026998519897461,
+ "learning_rate": 1.136491644003699e-05,
+ "loss": 0.127,
+ "step": 17349
+ },
+ {
+ "epoch": 47.275204359673026,
+ "grad_norm": 4.999397277832031,
+ "learning_rate": 1.1364042199158681e-05,
+ "loss": 0.134,
+ "step": 17350
+ },
+ {
+ "epoch": 47.27792915531335,
+ "grad_norm": 5.330348491668701,
+ "learning_rate": 1.1363167947657252e-05,
+ "loss": 0.1223,
+ "step": 17351
+ },
+ {
+ "epoch": 47.28065395095368,
+ "grad_norm": 5.6617865562438965,
+ "learning_rate": 1.1362293685539518e-05,
+ "loss": 0.1256,
+ "step": 17352
+ },
+ {
+ "epoch": 47.283378746594,
+ "grad_norm": 6.341552257537842,
+ "learning_rate": 1.1361419412812284e-05,
+ "loss": 0.1729,
+ "step": 17353
+ },
+ {
+ "epoch": 47.28610354223433,
+ "grad_norm": 6.309276580810547,
+ "learning_rate": 1.1360545129482361e-05,
+ "loss": 0.2233,
+ "step": 17354
+ },
+ {
+ "epoch": 47.28882833787466,
+ "grad_norm": 4.976595401763916,
+ "learning_rate": 1.1359670835556554e-05,
+ "loss": 0.1524,
+ "step": 17355
+ },
+ {
+ "epoch": 47.29155313351499,
+ "grad_norm": 4.946108341217041,
+ "learning_rate": 1.1358796531041676e-05,
+ "loss": 0.1253,
+ "step": 17356
+ },
+ {
+ "epoch": 47.294277929155314,
+ "grad_norm": 5.250059604644775,
+ "learning_rate": 1.1357922215944533e-05,
+ "loss": 0.123,
+ "step": 17357
+ },
+ {
+ "epoch": 47.29700272479564,
+ "grad_norm": 9.978639602661133,
+ "learning_rate": 1.1357047890271935e-05,
+ "loss": 0.3298,
+ "step": 17358
+ },
+ {
+ "epoch": 47.299727520435965,
+ "grad_norm": 5.052424907684326,
+ "learning_rate": 1.1356173554030692e-05,
+ "loss": 0.113,
+ "step": 17359
+ },
+ {
+ "epoch": 47.30245231607629,
+ "grad_norm": 7.464874744415283,
+ "learning_rate": 1.1355299207227612e-05,
+ "loss": 0.2352,
+ "step": 17360
+ },
+ {
+ "epoch": 47.305177111716624,
+ "grad_norm": 7.263399600982666,
+ "learning_rate": 1.135442484986951e-05,
+ "loss": 0.1648,
+ "step": 17361
+ },
+ {
+ "epoch": 47.30790190735695,
+ "grad_norm": 8.095212936401367,
+ "learning_rate": 1.1353550481963188e-05,
+ "loss": 0.1867,
+ "step": 17362
+ },
+ {
+ "epoch": 47.310626702997276,
+ "grad_norm": 6.417571544647217,
+ "learning_rate": 1.1352676103515456e-05,
+ "loss": 0.1455,
+ "step": 17363
+ },
+ {
+ "epoch": 47.3133514986376,
+ "grad_norm": 15.318137168884277,
+ "learning_rate": 1.135180171453313e-05,
+ "loss": 0.226,
+ "step": 17364
+ },
+ {
+ "epoch": 47.31607629427793,
+ "grad_norm": 4.018860340118408,
+ "learning_rate": 1.1350927315023012e-05,
+ "loss": 0.1905,
+ "step": 17365
+ },
+ {
+ "epoch": 47.31880108991825,
+ "grad_norm": 4.7360968589782715,
+ "learning_rate": 1.1350052904991917e-05,
+ "loss": 0.2281,
+ "step": 17366
+ },
+ {
+ "epoch": 47.321525885558586,
+ "grad_norm": 6.059764862060547,
+ "learning_rate": 1.1349178484446655e-05,
+ "loss": 0.2661,
+ "step": 17367
+ },
+ {
+ "epoch": 47.32425068119891,
+ "grad_norm": 5.604198455810547,
+ "learning_rate": 1.1348304053394032e-05,
+ "loss": 0.1767,
+ "step": 17368
+ },
+ {
+ "epoch": 47.32697547683924,
+ "grad_norm": 4.785433292388916,
+ "learning_rate": 1.1347429611840863e-05,
+ "loss": 0.1619,
+ "step": 17369
+ },
+ {
+ "epoch": 47.32970027247956,
+ "grad_norm": 6.601691246032715,
+ "learning_rate": 1.1346555159793956e-05,
+ "loss": 0.4151,
+ "step": 17370
+ },
+ {
+ "epoch": 47.33242506811989,
+ "grad_norm": 8.255234718322754,
+ "learning_rate": 1.134568069726012e-05,
+ "loss": 0.1947,
+ "step": 17371
+ },
+ {
+ "epoch": 47.335149863760215,
+ "grad_norm": 4.329376697540283,
+ "learning_rate": 1.1344806224246164e-05,
+ "loss": 0.0924,
+ "step": 17372
+ },
+ {
+ "epoch": 47.33787465940055,
+ "grad_norm": 7.335381984710693,
+ "learning_rate": 1.13439317407589e-05,
+ "loss": 0.2743,
+ "step": 17373
+ },
+ {
+ "epoch": 47.34059945504087,
+ "grad_norm": 5.078884601593018,
+ "learning_rate": 1.134305724680514e-05,
+ "loss": 0.1332,
+ "step": 17374
+ },
+ {
+ "epoch": 47.3433242506812,
+ "grad_norm": 5.090694427490234,
+ "learning_rate": 1.1342182742391693e-05,
+ "loss": 0.2632,
+ "step": 17375
+ },
+ {
+ "epoch": 47.346049046321525,
+ "grad_norm": 7.320001125335693,
+ "learning_rate": 1.1341308227525372e-05,
+ "loss": 0.1552,
+ "step": 17376
+ },
+ {
+ "epoch": 47.34877384196185,
+ "grad_norm": 8.654484748840332,
+ "learning_rate": 1.1340433702212986e-05,
+ "loss": 0.2031,
+ "step": 17377
+ },
+ {
+ "epoch": 47.35149863760218,
+ "grad_norm": 4.913638114929199,
+ "learning_rate": 1.1339559166461343e-05,
+ "loss": 0.2018,
+ "step": 17378
+ },
+ {
+ "epoch": 47.35422343324251,
+ "grad_norm": 5.031498432159424,
+ "learning_rate": 1.1338684620277259e-05,
+ "loss": 0.1499,
+ "step": 17379
+ },
+ {
+ "epoch": 47.356948228882835,
+ "grad_norm": 5.879524230957031,
+ "learning_rate": 1.1337810063667539e-05,
+ "loss": 0.1839,
+ "step": 17380
+ },
+ {
+ "epoch": 47.35967302452316,
+ "grad_norm": 6.057834148406982,
+ "learning_rate": 1.1336935496639e-05,
+ "loss": 0.2018,
+ "step": 17381
+ },
+ {
+ "epoch": 47.36239782016349,
+ "grad_norm": 5.919984817504883,
+ "learning_rate": 1.1336060919198449e-05,
+ "loss": 0.1179,
+ "step": 17382
+ },
+ {
+ "epoch": 47.36512261580381,
+ "grad_norm": 5.599321365356445,
+ "learning_rate": 1.1335186331352697e-05,
+ "loss": 0.0937,
+ "step": 17383
+ },
+ {
+ "epoch": 47.36784741144414,
+ "grad_norm": 5.7660369873046875,
+ "learning_rate": 1.1334311733108558e-05,
+ "loss": 0.1562,
+ "step": 17384
+ },
+ {
+ "epoch": 47.37057220708447,
+ "grad_norm": 5.741179466247559,
+ "learning_rate": 1.1333437124472844e-05,
+ "loss": 0.1245,
+ "step": 17385
+ },
+ {
+ "epoch": 47.3732970027248,
+ "grad_norm": 6.793684005737305,
+ "learning_rate": 1.1332562505452363e-05,
+ "loss": 0.2028,
+ "step": 17386
+ },
+ {
+ "epoch": 47.37602179836512,
+ "grad_norm": 6.103033542633057,
+ "learning_rate": 1.1331687876053929e-05,
+ "loss": 0.1651,
+ "step": 17387
+ },
+ {
+ "epoch": 47.37874659400545,
+ "grad_norm": 7.7717719078063965,
+ "learning_rate": 1.1330813236284353e-05,
+ "loss": 0.1776,
+ "step": 17388
+ },
+ {
+ "epoch": 47.381471389645775,
+ "grad_norm": 6.243279933929443,
+ "learning_rate": 1.1329938586150445e-05,
+ "loss": 0.2212,
+ "step": 17389
+ },
+ {
+ "epoch": 47.3841961852861,
+ "grad_norm": 6.319809436798096,
+ "learning_rate": 1.1329063925659018e-05,
+ "loss": 0.1883,
+ "step": 17390
+ },
+ {
+ "epoch": 47.38692098092643,
+ "grad_norm": 7.187377452850342,
+ "learning_rate": 1.1328189254816883e-05,
+ "loss": 0.1503,
+ "step": 17391
+ },
+ {
+ "epoch": 47.38964577656676,
+ "grad_norm": 4.905011177062988,
+ "learning_rate": 1.1327314573630855e-05,
+ "loss": 0.1894,
+ "step": 17392
+ },
+ {
+ "epoch": 47.392370572207085,
+ "grad_norm": 7.594850540161133,
+ "learning_rate": 1.1326439882107745e-05,
+ "loss": 0.2032,
+ "step": 17393
+ },
+ {
+ "epoch": 47.39509536784741,
+ "grad_norm": 4.616300106048584,
+ "learning_rate": 1.132556518025436e-05,
+ "loss": 0.2928,
+ "step": 17394
+ },
+ {
+ "epoch": 47.39782016348774,
+ "grad_norm": 6.146267414093018,
+ "learning_rate": 1.132469046807752e-05,
+ "loss": 0.1833,
+ "step": 17395
+ },
+ {
+ "epoch": 47.40054495912806,
+ "grad_norm": 6.339707851409912,
+ "learning_rate": 1.132381574558403e-05,
+ "loss": 0.2174,
+ "step": 17396
+ },
+ {
+ "epoch": 47.403269754768395,
+ "grad_norm": 6.550048828125,
+ "learning_rate": 1.1322941012780707e-05,
+ "loss": 0.2267,
+ "step": 17397
+ },
+ {
+ "epoch": 47.40599455040872,
+ "grad_norm": 6.415716171264648,
+ "learning_rate": 1.1322066269674364e-05,
+ "loss": 0.183,
+ "step": 17398
+ },
+ {
+ "epoch": 47.40871934604905,
+ "grad_norm": 4.894993782043457,
+ "learning_rate": 1.132119151627181e-05,
+ "loss": 0.1251,
+ "step": 17399
+ },
+ {
+ "epoch": 47.41144414168937,
+ "grad_norm": 7.787525653839111,
+ "learning_rate": 1.1320316752579854e-05,
+ "loss": 0.1692,
+ "step": 17400
+ },
+ {
+ "epoch": 47.4141689373297,
+ "grad_norm": 4.8304443359375,
+ "learning_rate": 1.1319441978605319e-05,
+ "loss": 0.3152,
+ "step": 17401
+ },
+ {
+ "epoch": 47.416893732970024,
+ "grad_norm": 5.751040935516357,
+ "learning_rate": 1.131856719435501e-05,
+ "loss": 0.1759,
+ "step": 17402
+ },
+ {
+ "epoch": 47.41961852861036,
+ "grad_norm": 4.539827346801758,
+ "learning_rate": 1.1317692399835746e-05,
+ "loss": 0.3914,
+ "step": 17403
+ },
+ {
+ "epoch": 47.42234332425068,
+ "grad_norm": 5.309699058532715,
+ "learning_rate": 1.1316817595054333e-05,
+ "loss": 0.1444,
+ "step": 17404
+ },
+ {
+ "epoch": 47.42506811989101,
+ "grad_norm": 5.834379196166992,
+ "learning_rate": 1.1315942780017589e-05,
+ "loss": 0.2961,
+ "step": 17405
+ },
+ {
+ "epoch": 47.427792915531334,
+ "grad_norm": 6.645628929138184,
+ "learning_rate": 1.1315067954732322e-05,
+ "loss": 0.4054,
+ "step": 17406
+ },
+ {
+ "epoch": 47.43051771117166,
+ "grad_norm": 5.270048141479492,
+ "learning_rate": 1.131419311920535e-05,
+ "loss": 0.1968,
+ "step": 17407
+ },
+ {
+ "epoch": 47.433242506811986,
+ "grad_norm": 10.516953468322754,
+ "learning_rate": 1.131331827344348e-05,
+ "loss": 0.3111,
+ "step": 17408
+ },
+ {
+ "epoch": 47.43596730245232,
+ "grad_norm": 4.475905895233154,
+ "learning_rate": 1.1312443417453535e-05,
+ "loss": 0.0942,
+ "step": 17409
+ },
+ {
+ "epoch": 47.438692098092645,
+ "grad_norm": 5.827042579650879,
+ "learning_rate": 1.131156855124232e-05,
+ "loss": 0.2352,
+ "step": 17410
+ },
+ {
+ "epoch": 47.44141689373297,
+ "grad_norm": 5.595770835876465,
+ "learning_rate": 1.1310693674816655e-05,
+ "loss": 0.2271,
+ "step": 17411
+ },
+ {
+ "epoch": 47.444141689373296,
+ "grad_norm": 4.498119831085205,
+ "learning_rate": 1.1309818788183347e-05,
+ "loss": 0.1723,
+ "step": 17412
+ },
+ {
+ "epoch": 47.44686648501362,
+ "grad_norm": 5.491279602050781,
+ "learning_rate": 1.1308943891349213e-05,
+ "loss": 0.1805,
+ "step": 17413
+ },
+ {
+ "epoch": 47.44959128065395,
+ "grad_norm": 5.263021469116211,
+ "learning_rate": 1.1308068984321066e-05,
+ "loss": 0.1742,
+ "step": 17414
+ },
+ {
+ "epoch": 47.45231607629428,
+ "grad_norm": 5.425411224365234,
+ "learning_rate": 1.130719406710572e-05,
+ "loss": 0.133,
+ "step": 17415
+ },
+ {
+ "epoch": 47.45504087193461,
+ "grad_norm": 4.812409400939941,
+ "learning_rate": 1.130631913970999e-05,
+ "loss": 0.2897,
+ "step": 17416
+ },
+ {
+ "epoch": 47.45776566757493,
+ "grad_norm": 4.713386535644531,
+ "learning_rate": 1.1305444202140685e-05,
+ "loss": 0.2036,
+ "step": 17417
+ },
+ {
+ "epoch": 47.46049046321526,
+ "grad_norm": 5.480905532836914,
+ "learning_rate": 1.1304569254404623e-05,
+ "loss": 0.1172,
+ "step": 17418
+ },
+ {
+ "epoch": 47.463215258855584,
+ "grad_norm": 8.589835166931152,
+ "learning_rate": 1.130369429650862e-05,
+ "loss": 0.1477,
+ "step": 17419
+ },
+ {
+ "epoch": 47.46594005449591,
+ "grad_norm": 6.506086349487305,
+ "learning_rate": 1.1302819328459487e-05,
+ "loss": 0.2017,
+ "step": 17420
+ },
+ {
+ "epoch": 47.46866485013624,
+ "grad_norm": 6.886260032653809,
+ "learning_rate": 1.130194435026404e-05,
+ "loss": 0.2262,
+ "step": 17421
+ },
+ {
+ "epoch": 47.47138964577657,
+ "grad_norm": 5.667884349822998,
+ "learning_rate": 1.1301069361929092e-05,
+ "loss": 0.126,
+ "step": 17422
+ },
+ {
+ "epoch": 47.474114441416894,
+ "grad_norm": 4.748784065246582,
+ "learning_rate": 1.1300194363461456e-05,
+ "loss": 0.1147,
+ "step": 17423
+ },
+ {
+ "epoch": 47.47683923705722,
+ "grad_norm": 6.0897722244262695,
+ "learning_rate": 1.129931935486795e-05,
+ "loss": 0.1983,
+ "step": 17424
+ },
+ {
+ "epoch": 47.479564032697546,
+ "grad_norm": 6.235533237457275,
+ "learning_rate": 1.1298444336155388e-05,
+ "loss": 0.1375,
+ "step": 17425
+ },
+ {
+ "epoch": 47.48228882833787,
+ "grad_norm": 5.98510217666626,
+ "learning_rate": 1.1297569307330576e-05,
+ "loss": 0.1994,
+ "step": 17426
+ },
+ {
+ "epoch": 47.485013623978205,
+ "grad_norm": 5.428730487823486,
+ "learning_rate": 1.1296694268400343e-05,
+ "loss": 0.1193,
+ "step": 17427
+ },
+ {
+ "epoch": 47.48773841961853,
+ "grad_norm": 5.673888683319092,
+ "learning_rate": 1.1295819219371494e-05,
+ "loss": 0.2798,
+ "step": 17428
+ },
+ {
+ "epoch": 47.490463215258856,
+ "grad_norm": 12.204548835754395,
+ "learning_rate": 1.1294944160250849e-05,
+ "loss": 0.3595,
+ "step": 17429
+ },
+ {
+ "epoch": 47.49318801089918,
+ "grad_norm": 5.644983291625977,
+ "learning_rate": 1.129406909104522e-05,
+ "loss": 0.1491,
+ "step": 17430
+ },
+ {
+ "epoch": 47.49591280653951,
+ "grad_norm": 7.090771675109863,
+ "learning_rate": 1.1293194011761421e-05,
+ "loss": 0.2103,
+ "step": 17431
+ },
+ {
+ "epoch": 47.49863760217983,
+ "grad_norm": 5.9541916847229,
+ "learning_rate": 1.1292318922406268e-05,
+ "loss": 0.1831,
+ "step": 17432
+ },
+ {
+ "epoch": 47.50136239782017,
+ "grad_norm": 4.507806777954102,
+ "learning_rate": 1.129144382298658e-05,
+ "loss": 0.1984,
+ "step": 17433
+ },
+ {
+ "epoch": 47.50408719346049,
+ "grad_norm": 5.049549102783203,
+ "learning_rate": 1.1290568713509166e-05,
+ "loss": 0.209,
+ "step": 17434
+ },
+ {
+ "epoch": 47.50681198910082,
+ "grad_norm": 5.580391883850098,
+ "learning_rate": 1.1289693593980843e-05,
+ "loss": 0.1354,
+ "step": 17435
+ },
+ {
+ "epoch": 47.509536784741144,
+ "grad_norm": 10.421479225158691,
+ "learning_rate": 1.1288818464408433e-05,
+ "loss": 0.1727,
+ "step": 17436
+ },
+ {
+ "epoch": 47.51226158038147,
+ "grad_norm": 10.88788890838623,
+ "learning_rate": 1.1287943324798744e-05,
+ "loss": 0.1282,
+ "step": 17437
+ },
+ {
+ "epoch": 47.514986376021795,
+ "grad_norm": 5.003871440887451,
+ "learning_rate": 1.1287068175158594e-05,
+ "loss": 0.1301,
+ "step": 17438
+ },
+ {
+ "epoch": 47.51771117166213,
+ "grad_norm": 5.405365943908691,
+ "learning_rate": 1.1286193015494797e-05,
+ "loss": 0.4263,
+ "step": 17439
+ },
+ {
+ "epoch": 47.520435967302454,
+ "grad_norm": 5.518341064453125,
+ "learning_rate": 1.128531784581417e-05,
+ "loss": 0.1235,
+ "step": 17440
+ },
+ {
+ "epoch": 47.52316076294278,
+ "grad_norm": 5.502331733703613,
+ "learning_rate": 1.1284442666123532e-05,
+ "loss": 0.126,
+ "step": 17441
+ },
+ {
+ "epoch": 47.525885558583106,
+ "grad_norm": 6.106025218963623,
+ "learning_rate": 1.1283567476429693e-05,
+ "loss": 0.123,
+ "step": 17442
+ },
+ {
+ "epoch": 47.52861035422343,
+ "grad_norm": 5.299657344818115,
+ "learning_rate": 1.1282692276739473e-05,
+ "loss": 0.1493,
+ "step": 17443
+ },
+ {
+ "epoch": 47.53133514986376,
+ "grad_norm": 6.045785903930664,
+ "learning_rate": 1.1281817067059689e-05,
+ "loss": 0.1349,
+ "step": 17444
+ },
+ {
+ "epoch": 47.53405994550409,
+ "grad_norm": 5.7348527908325195,
+ "learning_rate": 1.128094184739715e-05,
+ "loss": 0.1582,
+ "step": 17445
+ },
+ {
+ "epoch": 47.536784741144416,
+ "grad_norm": 4.512693405151367,
+ "learning_rate": 1.128006661775868e-05,
+ "loss": 0.1694,
+ "step": 17446
+ },
+ {
+ "epoch": 47.53950953678474,
+ "grad_norm": 6.702103137969971,
+ "learning_rate": 1.1279191378151094e-05,
+ "loss": 0.1433,
+ "step": 17447
+ },
+ {
+ "epoch": 47.54223433242507,
+ "grad_norm": 6.371593475341797,
+ "learning_rate": 1.1278316128581205e-05,
+ "loss": 0.3932,
+ "step": 17448
+ },
+ {
+ "epoch": 47.54495912806539,
+ "grad_norm": 5.314506530761719,
+ "learning_rate": 1.1277440869055829e-05,
+ "loss": 0.1245,
+ "step": 17449
+ },
+ {
+ "epoch": 47.54768392370572,
+ "grad_norm": 8.911656379699707,
+ "learning_rate": 1.1276565599581786e-05,
+ "loss": 0.2033,
+ "step": 17450
+ },
+ {
+ "epoch": 47.55040871934605,
+ "grad_norm": 4.4906005859375,
+ "learning_rate": 1.1275690320165891e-05,
+ "loss": 0.169,
+ "step": 17451
+ },
+ {
+ "epoch": 47.55313351498638,
+ "grad_norm": 5.4205474853515625,
+ "learning_rate": 1.1274815030814962e-05,
+ "loss": 0.1658,
+ "step": 17452
+ },
+ {
+ "epoch": 47.555858310626704,
+ "grad_norm": 5.942286014556885,
+ "learning_rate": 1.1273939731535814e-05,
+ "loss": 0.2132,
+ "step": 17453
+ },
+ {
+ "epoch": 47.55858310626703,
+ "grad_norm": 5.758001804351807,
+ "learning_rate": 1.1273064422335266e-05,
+ "loss": 0.1875,
+ "step": 17454
+ },
+ {
+ "epoch": 47.561307901907355,
+ "grad_norm": 5.243936538696289,
+ "learning_rate": 1.127218910322013e-05,
+ "loss": 0.1523,
+ "step": 17455
+ },
+ {
+ "epoch": 47.56403269754768,
+ "grad_norm": 9.450494766235352,
+ "learning_rate": 1.127131377419723e-05,
+ "loss": 0.1725,
+ "step": 17456
+ },
+ {
+ "epoch": 47.566757493188014,
+ "grad_norm": 6.759274482727051,
+ "learning_rate": 1.1270438435273376e-05,
+ "loss": 0.3017,
+ "step": 17457
+ },
+ {
+ "epoch": 47.56948228882834,
+ "grad_norm": 6.860689163208008,
+ "learning_rate": 1.1269563086455393e-05,
+ "loss": 0.1928,
+ "step": 17458
+ },
+ {
+ "epoch": 47.572207084468666,
+ "grad_norm": 8.381548881530762,
+ "learning_rate": 1.126868772775009e-05,
+ "loss": 0.1584,
+ "step": 17459
+ },
+ {
+ "epoch": 47.57493188010899,
+ "grad_norm": 8.353500366210938,
+ "learning_rate": 1.1267812359164286e-05,
+ "loss": 0.1151,
+ "step": 17460
+ },
+ {
+ "epoch": 47.57765667574932,
+ "grad_norm": 10.234742164611816,
+ "learning_rate": 1.1266936980704801e-05,
+ "loss": 0.1353,
+ "step": 17461
+ },
+ {
+ "epoch": 47.58038147138964,
+ "grad_norm": 5.291065692901611,
+ "learning_rate": 1.1266061592378455e-05,
+ "loss": 0.2135,
+ "step": 17462
+ },
+ {
+ "epoch": 47.583106267029976,
+ "grad_norm": 8.350508689880371,
+ "learning_rate": 1.1265186194192058e-05,
+ "loss": 0.117,
+ "step": 17463
+ },
+ {
+ "epoch": 47.5858310626703,
+ "grad_norm": 6.17387580871582,
+ "learning_rate": 1.1264310786152434e-05,
+ "loss": 0.1594,
+ "step": 17464
+ },
+ {
+ "epoch": 47.58855585831063,
+ "grad_norm": 5.931378364562988,
+ "learning_rate": 1.1263435368266397e-05,
+ "loss": 0.147,
+ "step": 17465
+ },
+ {
+ "epoch": 47.59128065395095,
+ "grad_norm": 6.011143684387207,
+ "learning_rate": 1.1262559940540769e-05,
+ "loss": 0.3531,
+ "step": 17466
+ },
+ {
+ "epoch": 47.59400544959128,
+ "grad_norm": 6.663870811462402,
+ "learning_rate": 1.1261684502982363e-05,
+ "loss": 0.1823,
+ "step": 17467
+ },
+ {
+ "epoch": 47.596730245231605,
+ "grad_norm": 5.473087310791016,
+ "learning_rate": 1.1260809055597996e-05,
+ "loss": 0.3148,
+ "step": 17468
+ },
+ {
+ "epoch": 47.59945504087194,
+ "grad_norm": 5.8604416847229,
+ "learning_rate": 1.125993359839449e-05,
+ "loss": 0.1427,
+ "step": 17469
+ },
+ {
+ "epoch": 47.60217983651226,
+ "grad_norm": 5.006176471710205,
+ "learning_rate": 1.1259058131378665e-05,
+ "loss": 0.1764,
+ "step": 17470
+ },
+ {
+ "epoch": 47.60490463215259,
+ "grad_norm": 6.329784393310547,
+ "learning_rate": 1.125818265455733e-05,
+ "loss": 0.1748,
+ "step": 17471
+ },
+ {
+ "epoch": 47.607629427792915,
+ "grad_norm": 5.836141109466553,
+ "learning_rate": 1.1257307167937315e-05,
+ "loss": 0.2063,
+ "step": 17472
+ },
+ {
+ "epoch": 47.61035422343324,
+ "grad_norm": 5.373903274536133,
+ "learning_rate": 1.1256431671525428e-05,
+ "loss": 0.1913,
+ "step": 17473
+ },
+ {
+ "epoch": 47.61307901907357,
+ "grad_norm": 6.745926380157471,
+ "learning_rate": 1.1255556165328494e-05,
+ "loss": 0.2,
+ "step": 17474
+ },
+ {
+ "epoch": 47.6158038147139,
+ "grad_norm": 4.685171127319336,
+ "learning_rate": 1.125468064935333e-05,
+ "loss": 0.099,
+ "step": 17475
+ },
+ {
+ "epoch": 47.618528610354225,
+ "grad_norm": 4.967680931091309,
+ "learning_rate": 1.1253805123606752e-05,
+ "loss": 0.1854,
+ "step": 17476
+ },
+ {
+ "epoch": 47.62125340599455,
+ "grad_norm": 6.480405330657959,
+ "learning_rate": 1.1252929588095576e-05,
+ "loss": 0.116,
+ "step": 17477
+ },
+ {
+ "epoch": 47.62397820163488,
+ "grad_norm": 7.122380256652832,
+ "learning_rate": 1.1252054042826627e-05,
+ "loss": 0.2554,
+ "step": 17478
+ },
+ {
+ "epoch": 47.6267029972752,
+ "grad_norm": 6.015350341796875,
+ "learning_rate": 1.1251178487806725e-05,
+ "loss": 0.2606,
+ "step": 17479
+ },
+ {
+ "epoch": 47.62942779291553,
+ "grad_norm": 6.103729724884033,
+ "learning_rate": 1.1250302923042684e-05,
+ "loss": 0.131,
+ "step": 17480
+ },
+ {
+ "epoch": 47.63215258855586,
+ "grad_norm": 4.799370765686035,
+ "learning_rate": 1.1249427348541322e-05,
+ "loss": 0.1053,
+ "step": 17481
+ },
+ {
+ "epoch": 47.63487738419619,
+ "grad_norm": 4.938962936401367,
+ "learning_rate": 1.124855176430946e-05,
+ "loss": 0.0967,
+ "step": 17482
+ },
+ {
+ "epoch": 47.63760217983651,
+ "grad_norm": 5.413734436035156,
+ "learning_rate": 1.1247676170353918e-05,
+ "loss": 0.1881,
+ "step": 17483
+ },
+ {
+ "epoch": 47.64032697547684,
+ "grad_norm": 6.096156597137451,
+ "learning_rate": 1.1246800566681517e-05,
+ "loss": 0.1828,
+ "step": 17484
+ },
+ {
+ "epoch": 47.643051771117165,
+ "grad_norm": 4.924108028411865,
+ "learning_rate": 1.124592495329907e-05,
+ "loss": 0.2259,
+ "step": 17485
+ },
+ {
+ "epoch": 47.64577656675749,
+ "grad_norm": 5.234230041503906,
+ "learning_rate": 1.1245049330213398e-05,
+ "loss": 0.1552,
+ "step": 17486
+ },
+ {
+ "epoch": 47.64850136239782,
+ "grad_norm": 4.4490275382995605,
+ "learning_rate": 1.1244173697431324e-05,
+ "loss": 0.2035,
+ "step": 17487
+ },
+ {
+ "epoch": 47.65122615803815,
+ "grad_norm": 5.975407600402832,
+ "learning_rate": 1.1243298054959666e-05,
+ "loss": 0.2455,
+ "step": 17488
+ },
+ {
+ "epoch": 47.653950953678475,
+ "grad_norm": 6.0566205978393555,
+ "learning_rate": 1.1242422402805242e-05,
+ "loss": 0.2092,
+ "step": 17489
+ },
+ {
+ "epoch": 47.6566757493188,
+ "grad_norm": 5.6127729415893555,
+ "learning_rate": 1.1241546740974874e-05,
+ "loss": 0.1373,
+ "step": 17490
+ },
+ {
+ "epoch": 47.65940054495913,
+ "grad_norm": 5.423619270324707,
+ "learning_rate": 1.1240671069475377e-05,
+ "loss": 0.2289,
+ "step": 17491
+ },
+ {
+ "epoch": 47.66212534059945,
+ "grad_norm": 5.537922382354736,
+ "learning_rate": 1.1239795388313578e-05,
+ "loss": 0.1996,
+ "step": 17492
+ },
+ {
+ "epoch": 47.664850136239785,
+ "grad_norm": 5.652258396148682,
+ "learning_rate": 1.1238919697496287e-05,
+ "loss": 0.2054,
+ "step": 17493
+ },
+ {
+ "epoch": 47.66757493188011,
+ "grad_norm": 4.688675880432129,
+ "learning_rate": 1.123804399703033e-05,
+ "loss": 0.1739,
+ "step": 17494
+ },
+ {
+ "epoch": 47.67029972752044,
+ "grad_norm": 4.451544284820557,
+ "learning_rate": 1.1237168286922528e-05,
+ "loss": 0.1129,
+ "step": 17495
+ },
+ {
+ "epoch": 47.67302452316076,
+ "grad_norm": 15.768667221069336,
+ "learning_rate": 1.1236292567179702e-05,
+ "loss": 0.2325,
+ "step": 17496
+ },
+ {
+ "epoch": 47.67574931880109,
+ "grad_norm": 4.785447597503662,
+ "learning_rate": 1.1235416837808663e-05,
+ "loss": 0.137,
+ "step": 17497
+ },
+ {
+ "epoch": 47.678474114441414,
+ "grad_norm": 4.1190996170043945,
+ "learning_rate": 1.1234541098816244e-05,
+ "loss": 0.1097,
+ "step": 17498
+ },
+ {
+ "epoch": 47.68119891008175,
+ "grad_norm": 6.4247822761535645,
+ "learning_rate": 1.1233665350209253e-05,
+ "loss": 0.1627,
+ "step": 17499
+ },
+ {
+ "epoch": 47.68392370572207,
+ "grad_norm": 5.705071926116943,
+ "learning_rate": 1.123278959199452e-05,
+ "loss": 0.1465,
+ "step": 17500
+ },
+ {
+ "epoch": 47.6866485013624,
+ "grad_norm": 5.82485818862915,
+ "learning_rate": 1.1231913824178859e-05,
+ "loss": 0.1548,
+ "step": 17501
+ },
+ {
+ "epoch": 47.689373297002724,
+ "grad_norm": 4.3881964683532715,
+ "learning_rate": 1.1231038046769094e-05,
+ "loss": 0.1803,
+ "step": 17502
+ },
+ {
+ "epoch": 47.69209809264305,
+ "grad_norm": 5.945643424987793,
+ "learning_rate": 1.1230162259772041e-05,
+ "loss": 0.196,
+ "step": 17503
+ },
+ {
+ "epoch": 47.694822888283376,
+ "grad_norm": 5.282832145690918,
+ "learning_rate": 1.1229286463194529e-05,
+ "loss": 0.1717,
+ "step": 17504
+ },
+ {
+ "epoch": 47.69754768392371,
+ "grad_norm": 5.0459113121032715,
+ "learning_rate": 1.1228410657043369e-05,
+ "loss": 0.1257,
+ "step": 17505
+ },
+ {
+ "epoch": 47.700272479564035,
+ "grad_norm": 5.307849884033203,
+ "learning_rate": 1.1227534841325392e-05,
+ "loss": 0.1627,
+ "step": 17506
+ },
+ {
+ "epoch": 47.70299727520436,
+ "grad_norm": 4.829582214355469,
+ "learning_rate": 1.1226659016047408e-05,
+ "loss": 0.203,
+ "step": 17507
+ },
+ {
+ "epoch": 47.705722070844686,
+ "grad_norm": 5.935482501983643,
+ "learning_rate": 1.1225783181216245e-05,
+ "loss": 0.2103,
+ "step": 17508
+ },
+ {
+ "epoch": 47.70844686648501,
+ "grad_norm": 5.641786098480225,
+ "learning_rate": 1.1224907336838722e-05,
+ "loss": 0.3269,
+ "step": 17509
+ },
+ {
+ "epoch": 47.71117166212534,
+ "grad_norm": 5.684382438659668,
+ "learning_rate": 1.1224031482921662e-05,
+ "loss": 0.1154,
+ "step": 17510
+ },
+ {
+ "epoch": 47.71389645776567,
+ "grad_norm": 14.90807819366455,
+ "learning_rate": 1.122315561947188e-05,
+ "loss": 0.1667,
+ "step": 17511
+ },
+ {
+ "epoch": 47.716621253406,
+ "grad_norm": 4.395716190338135,
+ "learning_rate": 1.1222279746496203e-05,
+ "loss": 0.107,
+ "step": 17512
+ },
+ {
+ "epoch": 47.71934604904632,
+ "grad_norm": 4.7664008140563965,
+ "learning_rate": 1.1221403864001452e-05,
+ "loss": 0.2012,
+ "step": 17513
+ },
+ {
+ "epoch": 47.72207084468665,
+ "grad_norm": 5.558382034301758,
+ "learning_rate": 1.1220527971994447e-05,
+ "loss": 0.2555,
+ "step": 17514
+ },
+ {
+ "epoch": 47.724795640326974,
+ "grad_norm": 4.383884906768799,
+ "learning_rate": 1.1219652070482007e-05,
+ "loss": 0.1831,
+ "step": 17515
+ },
+ {
+ "epoch": 47.7275204359673,
+ "grad_norm": 4.921212673187256,
+ "learning_rate": 1.1218776159470962e-05,
+ "loss": 0.1973,
+ "step": 17516
+ },
+ {
+ "epoch": 47.73024523160763,
+ "grad_norm": 7.012421607971191,
+ "learning_rate": 1.121790023896812e-05,
+ "loss": 0.3093,
+ "step": 17517
+ },
+ {
+ "epoch": 47.73297002724796,
+ "grad_norm": 3.847579002380371,
+ "learning_rate": 1.1217024308980316e-05,
+ "loss": 0.0867,
+ "step": 17518
+ },
+ {
+ "epoch": 47.735694822888284,
+ "grad_norm": 5.985230922698975,
+ "learning_rate": 1.1216148369514361e-05,
+ "loss": 0.2108,
+ "step": 17519
+ },
+ {
+ "epoch": 47.73841961852861,
+ "grad_norm": 4.878545761108398,
+ "learning_rate": 1.1215272420577084e-05,
+ "loss": 0.1246,
+ "step": 17520
+ },
+ {
+ "epoch": 47.741144414168936,
+ "grad_norm": 5.384594440460205,
+ "learning_rate": 1.1214396462175306e-05,
+ "loss": 0.2503,
+ "step": 17521
+ },
+ {
+ "epoch": 47.74386920980926,
+ "grad_norm": 4.4147748947143555,
+ "learning_rate": 1.1213520494315844e-05,
+ "loss": 0.1209,
+ "step": 17522
+ },
+ {
+ "epoch": 47.746594005449595,
+ "grad_norm": 5.7944512367248535,
+ "learning_rate": 1.1212644517005527e-05,
+ "loss": 0.1086,
+ "step": 17523
+ },
+ {
+ "epoch": 47.74931880108992,
+ "grad_norm": 4.662676811218262,
+ "learning_rate": 1.121176853025117e-05,
+ "loss": 0.1195,
+ "step": 17524
+ },
+ {
+ "epoch": 47.752043596730246,
+ "grad_norm": 7.815180778503418,
+ "learning_rate": 1.1210892534059599e-05,
+ "loss": 0.2545,
+ "step": 17525
+ },
+ {
+ "epoch": 47.75476839237057,
+ "grad_norm": 9.577667236328125,
+ "learning_rate": 1.121001652843764e-05,
+ "loss": 0.2967,
+ "step": 17526
+ },
+ {
+ "epoch": 47.7574931880109,
+ "grad_norm": 4.301311492919922,
+ "learning_rate": 1.1209140513392108e-05,
+ "loss": 0.2221,
+ "step": 17527
+ },
+ {
+ "epoch": 47.76021798365122,
+ "grad_norm": 6.129922389984131,
+ "learning_rate": 1.120826448892983e-05,
+ "loss": 0.3099,
+ "step": 17528
+ },
+ {
+ "epoch": 47.762942779291556,
+ "grad_norm": 4.257871627807617,
+ "learning_rate": 1.1207388455057623e-05,
+ "loss": 0.1592,
+ "step": 17529
+ },
+ {
+ "epoch": 47.76566757493188,
+ "grad_norm": 5.939739227294922,
+ "learning_rate": 1.1206512411782318e-05,
+ "loss": 0.2376,
+ "step": 17530
+ },
+ {
+ "epoch": 47.76839237057221,
+ "grad_norm": 6.521246910095215,
+ "learning_rate": 1.1205636359110733e-05,
+ "loss": 0.1876,
+ "step": 17531
+ },
+ {
+ "epoch": 47.771117166212534,
+ "grad_norm": 5.632286548614502,
+ "learning_rate": 1.1204760297049688e-05,
+ "loss": 0.2123,
+ "step": 17532
+ },
+ {
+ "epoch": 47.77384196185286,
+ "grad_norm": 6.878013610839844,
+ "learning_rate": 1.1203884225606012e-05,
+ "loss": 0.1777,
+ "step": 17533
+ },
+ {
+ "epoch": 47.776566757493185,
+ "grad_norm": 6.377793312072754,
+ "learning_rate": 1.1203008144786523e-05,
+ "loss": 0.1919,
+ "step": 17534
+ },
+ {
+ "epoch": 47.77929155313352,
+ "grad_norm": 5.528269290924072,
+ "learning_rate": 1.1202132054598045e-05,
+ "loss": 0.1104,
+ "step": 17535
+ },
+ {
+ "epoch": 47.782016348773844,
+ "grad_norm": 8.225494384765625,
+ "learning_rate": 1.1201255955047401e-05,
+ "loss": 0.1152,
+ "step": 17536
+ },
+ {
+ "epoch": 47.78474114441417,
+ "grad_norm": 6.01784086227417,
+ "learning_rate": 1.1200379846141414e-05,
+ "loss": 0.1954,
+ "step": 17537
+ },
+ {
+ "epoch": 47.787465940054496,
+ "grad_norm": 7.055092811584473,
+ "learning_rate": 1.1199503727886906e-05,
+ "loss": 0.1979,
+ "step": 17538
+ },
+ {
+ "epoch": 47.79019073569482,
+ "grad_norm": 5.262936592102051,
+ "learning_rate": 1.1198627600290705e-05,
+ "loss": 0.2109,
+ "step": 17539
+ },
+ {
+ "epoch": 47.79291553133515,
+ "grad_norm": 4.87378454208374,
+ "learning_rate": 1.119775146335963e-05,
+ "loss": 0.1322,
+ "step": 17540
+ },
+ {
+ "epoch": 47.79564032697548,
+ "grad_norm": 10.3624906539917,
+ "learning_rate": 1.1196875317100507e-05,
+ "loss": 0.308,
+ "step": 17541
+ },
+ {
+ "epoch": 47.798365122615806,
+ "grad_norm": 5.652101039886475,
+ "learning_rate": 1.1195999161520152e-05,
+ "loss": 0.2001,
+ "step": 17542
+ },
+ {
+ "epoch": 47.80108991825613,
+ "grad_norm": 8.375594139099121,
+ "learning_rate": 1.1195122996625399e-05,
+ "loss": 0.1048,
+ "step": 17543
+ },
+ {
+ "epoch": 47.80381471389646,
+ "grad_norm": 4.651740550994873,
+ "learning_rate": 1.1194246822423063e-05,
+ "loss": 0.1327,
+ "step": 17544
+ },
+ {
+ "epoch": 47.80653950953678,
+ "grad_norm": 4.437902450561523,
+ "learning_rate": 1.1193370638919976e-05,
+ "loss": 0.199,
+ "step": 17545
+ },
+ {
+ "epoch": 47.80926430517711,
+ "grad_norm": 25.399202346801758,
+ "learning_rate": 1.119249444612295e-05,
+ "loss": 0.2416,
+ "step": 17546
+ },
+ {
+ "epoch": 47.81198910081744,
+ "grad_norm": 7.21932315826416,
+ "learning_rate": 1.119161824403882e-05,
+ "loss": 0.2107,
+ "step": 17547
+ },
+ {
+ "epoch": 47.81471389645777,
+ "grad_norm": 5.15492057800293,
+ "learning_rate": 1.1190742032674404e-05,
+ "loss": 0.1763,
+ "step": 17548
+ },
+ {
+ "epoch": 47.817438692098094,
+ "grad_norm": 4.759138584136963,
+ "learning_rate": 1.118986581203653e-05,
+ "loss": 0.2657,
+ "step": 17549
+ },
+ {
+ "epoch": 47.82016348773842,
+ "grad_norm": 4.424410343170166,
+ "learning_rate": 1.1188989582132016e-05,
+ "loss": 0.1495,
+ "step": 17550
+ },
+ {
+ "epoch": 47.822888283378745,
+ "grad_norm": 5.128902912139893,
+ "learning_rate": 1.1188113342967692e-05,
+ "loss": 0.25,
+ "step": 17551
+ },
+ {
+ "epoch": 47.82561307901907,
+ "grad_norm": 6.951042175292969,
+ "learning_rate": 1.1187237094550378e-05,
+ "loss": 0.1469,
+ "step": 17552
+ },
+ {
+ "epoch": 47.828337874659404,
+ "grad_norm": 5.308253288269043,
+ "learning_rate": 1.1186360836886903e-05,
+ "loss": 0.1671,
+ "step": 17553
+ },
+ {
+ "epoch": 47.83106267029973,
+ "grad_norm": 5.095129489898682,
+ "learning_rate": 1.1185484569984082e-05,
+ "loss": 0.1024,
+ "step": 17554
+ },
+ {
+ "epoch": 47.833787465940055,
+ "grad_norm": 5.261958599090576,
+ "learning_rate": 1.1184608293848748e-05,
+ "loss": 0.1865,
+ "step": 17555
+ },
+ {
+ "epoch": 47.83651226158038,
+ "grad_norm": 6.035133361816406,
+ "learning_rate": 1.1183732008487723e-05,
+ "loss": 0.1757,
+ "step": 17556
+ },
+ {
+ "epoch": 47.83923705722071,
+ "grad_norm": 5.6396565437316895,
+ "learning_rate": 1.1182855713907831e-05,
+ "loss": 0.1738,
+ "step": 17557
+ },
+ {
+ "epoch": 47.84196185286103,
+ "grad_norm": 8.060161590576172,
+ "learning_rate": 1.1181979410115897e-05,
+ "loss": 0.2106,
+ "step": 17558
+ },
+ {
+ "epoch": 47.844686648501366,
+ "grad_norm": 10.053136825561523,
+ "learning_rate": 1.1181103097118748e-05,
+ "loss": 0.1968,
+ "step": 17559
+ },
+ {
+ "epoch": 47.84741144414169,
+ "grad_norm": 5.771396160125732,
+ "learning_rate": 1.1180226774923204e-05,
+ "loss": 0.2558,
+ "step": 17560
+ },
+ {
+ "epoch": 47.85013623978202,
+ "grad_norm": 7.158561706542969,
+ "learning_rate": 1.1179350443536092e-05,
+ "loss": 0.2619,
+ "step": 17561
+ },
+ {
+ "epoch": 47.85286103542234,
+ "grad_norm": 7.704658508300781,
+ "learning_rate": 1.1178474102964236e-05,
+ "loss": 0.196,
+ "step": 17562
+ },
+ {
+ "epoch": 47.85558583106267,
+ "grad_norm": 5.428753852844238,
+ "learning_rate": 1.117759775321446e-05,
+ "loss": 0.1781,
+ "step": 17563
+ },
+ {
+ "epoch": 47.858310626702995,
+ "grad_norm": 4.305299282073975,
+ "learning_rate": 1.1176721394293593e-05,
+ "loss": 0.1271,
+ "step": 17564
+ },
+ {
+ "epoch": 47.86103542234333,
+ "grad_norm": 7.138521194458008,
+ "learning_rate": 1.1175845026208458e-05,
+ "loss": 0.2738,
+ "step": 17565
+ },
+ {
+ "epoch": 47.86376021798365,
+ "grad_norm": 6.107406139373779,
+ "learning_rate": 1.1174968648965878e-05,
+ "loss": 0.1829,
+ "step": 17566
+ },
+ {
+ "epoch": 47.86648501362398,
+ "grad_norm": 5.503721714019775,
+ "learning_rate": 1.1174092262572682e-05,
+ "loss": 0.2099,
+ "step": 17567
+ },
+ {
+ "epoch": 47.869209809264305,
+ "grad_norm": 5.220943450927734,
+ "learning_rate": 1.1173215867035692e-05,
+ "loss": 0.0943,
+ "step": 17568
+ },
+ {
+ "epoch": 47.87193460490463,
+ "grad_norm": 9.411043167114258,
+ "learning_rate": 1.1172339462361735e-05,
+ "loss": 0.1556,
+ "step": 17569
+ },
+ {
+ "epoch": 47.87465940054496,
+ "grad_norm": 5.23283576965332,
+ "learning_rate": 1.1171463048557636e-05,
+ "loss": 0.1575,
+ "step": 17570
+ },
+ {
+ "epoch": 47.87738419618529,
+ "grad_norm": 4.6045026779174805,
+ "learning_rate": 1.117058662563022e-05,
+ "loss": 0.1449,
+ "step": 17571
+ },
+ {
+ "epoch": 47.880108991825615,
+ "grad_norm": 4.9127678871154785,
+ "learning_rate": 1.1169710193586312e-05,
+ "loss": 0.1686,
+ "step": 17572
+ },
+ {
+ "epoch": 47.88283378746594,
+ "grad_norm": 5.103357791900635,
+ "learning_rate": 1.1168833752432739e-05,
+ "loss": 0.1299,
+ "step": 17573
+ },
+ {
+ "epoch": 47.88555858310627,
+ "grad_norm": 6.955219745635986,
+ "learning_rate": 1.1167957302176327e-05,
+ "loss": 0.167,
+ "step": 17574
+ },
+ {
+ "epoch": 47.88828337874659,
+ "grad_norm": 5.665987491607666,
+ "learning_rate": 1.1167080842823904e-05,
+ "loss": 0.2096,
+ "step": 17575
+ },
+ {
+ "epoch": 47.89100817438692,
+ "grad_norm": 5.6638054847717285,
+ "learning_rate": 1.1166204374382287e-05,
+ "loss": 0.2489,
+ "step": 17576
+ },
+ {
+ "epoch": 47.89373297002725,
+ "grad_norm": 4.14143705368042,
+ "learning_rate": 1.1165327896858314e-05,
+ "loss": 0.2216,
+ "step": 17577
+ },
+ {
+ "epoch": 47.89645776566758,
+ "grad_norm": 5.11337947845459,
+ "learning_rate": 1.1164451410258801e-05,
+ "loss": 0.285,
+ "step": 17578
+ },
+ {
+ "epoch": 47.8991825613079,
+ "grad_norm": 5.634405136108398,
+ "learning_rate": 1.116357491459058e-05,
+ "loss": 0.163,
+ "step": 17579
+ },
+ {
+ "epoch": 47.90190735694823,
+ "grad_norm": 4.708236217498779,
+ "learning_rate": 1.1162698409860471e-05,
+ "loss": 0.2005,
+ "step": 17580
+ },
+ {
+ "epoch": 47.904632152588555,
+ "grad_norm": 13.555902481079102,
+ "learning_rate": 1.1161821896075309e-05,
+ "loss": 0.1329,
+ "step": 17581
+ },
+ {
+ "epoch": 47.90735694822888,
+ "grad_norm": 3.5687427520751953,
+ "learning_rate": 1.1160945373241914e-05,
+ "loss": 0.1467,
+ "step": 17582
+ },
+ {
+ "epoch": 47.91008174386921,
+ "grad_norm": 6.148223876953125,
+ "learning_rate": 1.1160068841367113e-05,
+ "loss": 0.1637,
+ "step": 17583
+ },
+ {
+ "epoch": 47.91280653950954,
+ "grad_norm": 5.446135520935059,
+ "learning_rate": 1.1159192300457733e-05,
+ "loss": 0.1921,
+ "step": 17584
+ },
+ {
+ "epoch": 47.915531335149865,
+ "grad_norm": 3.317143678665161,
+ "learning_rate": 1.1158315750520603e-05,
+ "loss": 0.1658,
+ "step": 17585
+ },
+ {
+ "epoch": 47.91825613079019,
+ "grad_norm": 8.444612503051758,
+ "learning_rate": 1.1157439191562545e-05,
+ "loss": 0.1204,
+ "step": 17586
+ },
+ {
+ "epoch": 47.920980926430516,
+ "grad_norm": 4.2756547927856445,
+ "learning_rate": 1.1156562623590391e-05,
+ "loss": 0.2194,
+ "step": 17587
+ },
+ {
+ "epoch": 47.92370572207084,
+ "grad_norm": 5.209869861602783,
+ "learning_rate": 1.1155686046610958e-05,
+ "loss": 0.1105,
+ "step": 17588
+ },
+ {
+ "epoch": 47.926430517711175,
+ "grad_norm": 4.758162975311279,
+ "learning_rate": 1.1154809460631084e-05,
+ "loss": 0.1089,
+ "step": 17589
+ },
+ {
+ "epoch": 47.9291553133515,
+ "grad_norm": 5.233775615692139,
+ "learning_rate": 1.1153932865657588e-05,
+ "loss": 0.111,
+ "step": 17590
+ },
+ {
+ "epoch": 47.93188010899183,
+ "grad_norm": 5.705069065093994,
+ "learning_rate": 1.1153056261697303e-05,
+ "loss": 0.3223,
+ "step": 17591
+ },
+ {
+ "epoch": 47.93460490463215,
+ "grad_norm": 6.418481826782227,
+ "learning_rate": 1.1152179648757053e-05,
+ "loss": 0.1835,
+ "step": 17592
+ },
+ {
+ "epoch": 47.93732970027248,
+ "grad_norm": 6.488126754760742,
+ "learning_rate": 1.1151303026843664e-05,
+ "loss": 0.2548,
+ "step": 17593
+ },
+ {
+ "epoch": 47.940054495912804,
+ "grad_norm": 4.554354667663574,
+ "learning_rate": 1.1150426395963964e-05,
+ "loss": 0.1249,
+ "step": 17594
+ },
+ {
+ "epoch": 47.94277929155314,
+ "grad_norm": 5.311594486236572,
+ "learning_rate": 1.1149549756124782e-05,
+ "loss": 0.1586,
+ "step": 17595
+ },
+ {
+ "epoch": 47.94550408719346,
+ "grad_norm": 6.385234355926514,
+ "learning_rate": 1.1148673107332942e-05,
+ "loss": 0.1875,
+ "step": 17596
+ },
+ {
+ "epoch": 47.94822888283379,
+ "grad_norm": 4.108850479125977,
+ "learning_rate": 1.1147796449595274e-05,
+ "loss": 0.2056,
+ "step": 17597
+ },
+ {
+ "epoch": 47.950953678474114,
+ "grad_norm": 5.044709205627441,
+ "learning_rate": 1.1146919782918601e-05,
+ "loss": 0.1718,
+ "step": 17598
+ },
+ {
+ "epoch": 47.95367847411444,
+ "grad_norm": 4.59542989730835,
+ "learning_rate": 1.1146043107309754e-05,
+ "loss": 0.1536,
+ "step": 17599
+ },
+ {
+ "epoch": 47.956403269754766,
+ "grad_norm": 11.871831893920898,
+ "learning_rate": 1.1145166422775562e-05,
+ "loss": 0.2989,
+ "step": 17600
+ },
+ {
+ "epoch": 47.95912806539509,
+ "grad_norm": 4.525768280029297,
+ "learning_rate": 1.1144289729322853e-05,
+ "loss": 0.2321,
+ "step": 17601
+ },
+ {
+ "epoch": 47.961852861035425,
+ "grad_norm": 5.020235061645508,
+ "learning_rate": 1.1143413026958448e-05,
+ "loss": 0.1179,
+ "step": 17602
+ },
+ {
+ "epoch": 47.96457765667575,
+ "grad_norm": 6.464372634887695,
+ "learning_rate": 1.1142536315689183e-05,
+ "loss": 0.2007,
+ "step": 17603
+ },
+ {
+ "epoch": 47.967302452316076,
+ "grad_norm": 4.812226295471191,
+ "learning_rate": 1.1141659595521879e-05,
+ "loss": 0.1165,
+ "step": 17604
+ },
+ {
+ "epoch": 47.9700272479564,
+ "grad_norm": 5.447220325469971,
+ "learning_rate": 1.1140782866463369e-05,
+ "loss": 0.1425,
+ "step": 17605
+ },
+ {
+ "epoch": 47.97275204359673,
+ "grad_norm": 5.454530239105225,
+ "learning_rate": 1.1139906128520476e-05,
+ "loss": 0.2015,
+ "step": 17606
+ },
+ {
+ "epoch": 47.97547683923706,
+ "grad_norm": 6.178712368011475,
+ "learning_rate": 1.1139029381700033e-05,
+ "loss": 0.1644,
+ "step": 17607
+ },
+ {
+ "epoch": 47.97820163487739,
+ "grad_norm": 4.985306739807129,
+ "learning_rate": 1.1138152626008864e-05,
+ "loss": 0.2515,
+ "step": 17608
+ },
+ {
+ "epoch": 47.98092643051771,
+ "grad_norm": 5.267483234405518,
+ "learning_rate": 1.1137275861453801e-05,
+ "loss": 0.1962,
+ "step": 17609
+ },
+ {
+ "epoch": 47.98365122615804,
+ "grad_norm": 7.079397201538086,
+ "learning_rate": 1.113639908804167e-05,
+ "loss": 0.1802,
+ "step": 17610
+ },
+ {
+ "epoch": 47.986376021798364,
+ "grad_norm": 4.777469158172607,
+ "learning_rate": 1.1135522305779298e-05,
+ "loss": 0.1946,
+ "step": 17611
+ },
+ {
+ "epoch": 47.98910081743869,
+ "grad_norm": 5.747976303100586,
+ "learning_rate": 1.1134645514673514e-05,
+ "loss": 0.4596,
+ "step": 17612
+ },
+ {
+ "epoch": 47.991825613079016,
+ "grad_norm": 5.1898698806762695,
+ "learning_rate": 1.1133768714731152e-05,
+ "loss": 0.094,
+ "step": 17613
+ },
+ {
+ "epoch": 47.99455040871935,
+ "grad_norm": 4.5456390380859375,
+ "learning_rate": 1.113289190595903e-05,
+ "loss": 0.1426,
+ "step": 17614
+ },
+ {
+ "epoch": 47.997275204359674,
+ "grad_norm": 4.944077968597412,
+ "learning_rate": 1.1132015088363985e-05,
+ "loss": 0.2636,
+ "step": 17615
+ },
+ {
+ "epoch": 48.0,
+ "grad_norm": 5.0380401611328125,
+ "learning_rate": 1.1131138261952845e-05,
+ "loss": 0.1395,
+ "step": 17616
+ },
+ {
+ "epoch": 48.002724795640326,
+ "grad_norm": 23.600337982177734,
+ "learning_rate": 1.1130261426732433e-05,
+ "loss": 0.2574,
+ "step": 17617
+ },
+ {
+ "epoch": 48.00544959128065,
+ "grad_norm": 4.308071613311768,
+ "learning_rate": 1.1129384582709584e-05,
+ "loss": 0.2789,
+ "step": 17618
+ },
+ {
+ "epoch": 48.00817438692098,
+ "grad_norm": 5.865283012390137,
+ "learning_rate": 1.1128507729891123e-05,
+ "loss": 0.1063,
+ "step": 17619
+ },
+ {
+ "epoch": 48.01089918256131,
+ "grad_norm": 6.204005718231201,
+ "learning_rate": 1.1127630868283881e-05,
+ "loss": 0.224,
+ "step": 17620
+ },
+ {
+ "epoch": 48.013623978201636,
+ "grad_norm": 7.709722518920898,
+ "learning_rate": 1.1126753997894683e-05,
+ "loss": 0.3526,
+ "step": 17621
+ },
+ {
+ "epoch": 48.01634877384196,
+ "grad_norm": 4.147298336029053,
+ "learning_rate": 1.1125877118730363e-05,
+ "loss": 0.1381,
+ "step": 17622
+ },
+ {
+ "epoch": 48.01907356948229,
+ "grad_norm": 3.798046350479126,
+ "learning_rate": 1.112500023079775e-05,
+ "loss": 0.2069,
+ "step": 17623
+ },
+ {
+ "epoch": 48.02179836512261,
+ "grad_norm": 5.765188694000244,
+ "learning_rate": 1.1124123334103671e-05,
+ "loss": 0.1226,
+ "step": 17624
+ },
+ {
+ "epoch": 48.02452316076294,
+ "grad_norm": 4.516467094421387,
+ "learning_rate": 1.1123246428654953e-05,
+ "loss": 0.1196,
+ "step": 17625
+ },
+ {
+ "epoch": 48.02724795640327,
+ "grad_norm": 5.7083845138549805,
+ "learning_rate": 1.1122369514458431e-05,
+ "loss": 0.2256,
+ "step": 17626
+ },
+ {
+ "epoch": 48.0299727520436,
+ "grad_norm": 4.721480369567871,
+ "learning_rate": 1.112149259152093e-05,
+ "loss": 0.0924,
+ "step": 17627
+ },
+ {
+ "epoch": 48.032697547683924,
+ "grad_norm": 6.462025165557861,
+ "learning_rate": 1.112061565984928e-05,
+ "loss": 0.1297,
+ "step": 17628
+ },
+ {
+ "epoch": 48.03542234332425,
+ "grad_norm": 4.309183597564697,
+ "learning_rate": 1.1119738719450312e-05,
+ "loss": 0.2081,
+ "step": 17629
+ },
+ {
+ "epoch": 48.038147138964575,
+ "grad_norm": 6.586560249328613,
+ "learning_rate": 1.1118861770330857e-05,
+ "loss": 0.1908,
+ "step": 17630
+ },
+ {
+ "epoch": 48.0408719346049,
+ "grad_norm": 4.4471659660339355,
+ "learning_rate": 1.1117984812497739e-05,
+ "loss": 0.1516,
+ "step": 17631
+ },
+ {
+ "epoch": 48.043596730245234,
+ "grad_norm": 4.485964775085449,
+ "learning_rate": 1.1117107845957793e-05,
+ "loss": 0.1233,
+ "step": 17632
+ },
+ {
+ "epoch": 48.04632152588556,
+ "grad_norm": 6.085051536560059,
+ "learning_rate": 1.1116230870717846e-05,
+ "loss": 0.2802,
+ "step": 17633
+ },
+ {
+ "epoch": 48.049046321525886,
+ "grad_norm": 7.2233991622924805,
+ "learning_rate": 1.1115353886784732e-05,
+ "loss": 0.2454,
+ "step": 17634
+ },
+ {
+ "epoch": 48.05177111716621,
+ "grad_norm": 4.020181179046631,
+ "learning_rate": 1.1114476894165273e-05,
+ "loss": 0.2004,
+ "step": 17635
+ },
+ {
+ "epoch": 48.05449591280654,
+ "grad_norm": 4.400680065155029,
+ "learning_rate": 1.1113599892866309e-05,
+ "loss": 0.0985,
+ "step": 17636
+ },
+ {
+ "epoch": 48.05722070844686,
+ "grad_norm": 4.079622268676758,
+ "learning_rate": 1.1112722882894662e-05,
+ "loss": 0.1791,
+ "step": 17637
+ },
+ {
+ "epoch": 48.059945504087196,
+ "grad_norm": 4.532163143157959,
+ "learning_rate": 1.1111845864257166e-05,
+ "loss": 0.1177,
+ "step": 17638
+ },
+ {
+ "epoch": 48.06267029972752,
+ "grad_norm": 5.875760555267334,
+ "learning_rate": 1.111096883696065e-05,
+ "loss": 0.2561,
+ "step": 17639
+ },
+ {
+ "epoch": 48.06539509536785,
+ "grad_norm": 4.709860324859619,
+ "learning_rate": 1.1110091801011944e-05,
+ "loss": 0.1643,
+ "step": 17640
+ },
+ {
+ "epoch": 48.06811989100817,
+ "grad_norm": 6.544802188873291,
+ "learning_rate": 1.1109214756417876e-05,
+ "loss": 0.1373,
+ "step": 17641
+ },
+ {
+ "epoch": 48.0708446866485,
+ "grad_norm": 3.946495532989502,
+ "learning_rate": 1.1108337703185283e-05,
+ "loss": 0.2344,
+ "step": 17642
+ },
+ {
+ "epoch": 48.073569482288825,
+ "grad_norm": 3.775704860687256,
+ "learning_rate": 1.1107460641320991e-05,
+ "loss": 0.1107,
+ "step": 17643
+ },
+ {
+ "epoch": 48.07629427792916,
+ "grad_norm": 5.911627769470215,
+ "learning_rate": 1.110658357083183e-05,
+ "loss": 0.1627,
+ "step": 17644
+ },
+ {
+ "epoch": 48.079019073569484,
+ "grad_norm": 5.471261501312256,
+ "learning_rate": 1.1105706491724633e-05,
+ "loss": 0.3694,
+ "step": 17645
+ },
+ {
+ "epoch": 48.08174386920981,
+ "grad_norm": 4.470165729522705,
+ "learning_rate": 1.110482940400623e-05,
+ "loss": 0.1108,
+ "step": 17646
+ },
+ {
+ "epoch": 48.084468664850135,
+ "grad_norm": 4.8588786125183105,
+ "learning_rate": 1.110395230768345e-05,
+ "loss": 0.1053,
+ "step": 17647
+ },
+ {
+ "epoch": 48.08719346049046,
+ "grad_norm": 7.981325149536133,
+ "learning_rate": 1.1103075202763125e-05,
+ "loss": 0.2082,
+ "step": 17648
+ },
+ {
+ "epoch": 48.08991825613079,
+ "grad_norm": 5.377898693084717,
+ "learning_rate": 1.1102198089252083e-05,
+ "loss": 0.1289,
+ "step": 17649
+ },
+ {
+ "epoch": 48.09264305177112,
+ "grad_norm": 4.502743244171143,
+ "learning_rate": 1.1101320967157164e-05,
+ "loss": 0.3021,
+ "step": 17650
+ },
+ {
+ "epoch": 48.095367847411445,
+ "grad_norm": 3.802295446395874,
+ "learning_rate": 1.1100443836485187e-05,
+ "loss": 0.0957,
+ "step": 17651
+ },
+ {
+ "epoch": 48.09809264305177,
+ "grad_norm": 5.665125846862793,
+ "learning_rate": 1.1099566697242992e-05,
+ "loss": 0.1497,
+ "step": 17652
+ },
+ {
+ "epoch": 48.1008174386921,
+ "grad_norm": 4.261890888214111,
+ "learning_rate": 1.1098689549437406e-05,
+ "loss": 0.137,
+ "step": 17653
+ },
+ {
+ "epoch": 48.10354223433242,
+ "grad_norm": 5.558714389801025,
+ "learning_rate": 1.1097812393075262e-05,
+ "loss": 0.2521,
+ "step": 17654
+ },
+ {
+ "epoch": 48.10626702997275,
+ "grad_norm": 4.837158203125,
+ "learning_rate": 1.1096935228163387e-05,
+ "loss": 0.0972,
+ "step": 17655
+ },
+ {
+ "epoch": 48.10899182561308,
+ "grad_norm": 5.561313629150391,
+ "learning_rate": 1.1096058054708624e-05,
+ "loss": 0.2004,
+ "step": 17656
+ },
+ {
+ "epoch": 48.11171662125341,
+ "grad_norm": 6.110978126525879,
+ "learning_rate": 1.1095180872717789e-05,
+ "loss": 0.2212,
+ "step": 17657
+ },
+ {
+ "epoch": 48.11444141689373,
+ "grad_norm": 4.91227388381958,
+ "learning_rate": 1.109430368219772e-05,
+ "loss": 0.1553,
+ "step": 17658
+ },
+ {
+ "epoch": 48.11716621253406,
+ "grad_norm": 5.304751873016357,
+ "learning_rate": 1.109342648315525e-05,
+ "loss": 0.0942,
+ "step": 17659
+ },
+ {
+ "epoch": 48.119891008174385,
+ "grad_norm": 6.523604869842529,
+ "learning_rate": 1.1092549275597213e-05,
+ "loss": 0.2844,
+ "step": 17660
+ },
+ {
+ "epoch": 48.12261580381471,
+ "grad_norm": 4.470745086669922,
+ "learning_rate": 1.1091672059530434e-05,
+ "loss": 0.1423,
+ "step": 17661
+ },
+ {
+ "epoch": 48.12534059945504,
+ "grad_norm": 4.966081142425537,
+ "learning_rate": 1.1090794834961751e-05,
+ "loss": 0.2176,
+ "step": 17662
+ },
+ {
+ "epoch": 48.12806539509537,
+ "grad_norm": 4.370601177215576,
+ "learning_rate": 1.108991760189799e-05,
+ "loss": 0.1076,
+ "step": 17663
+ },
+ {
+ "epoch": 48.130790190735695,
+ "grad_norm": 4.971834182739258,
+ "learning_rate": 1.1089040360345991e-05,
+ "loss": 0.1852,
+ "step": 17664
+ },
+ {
+ "epoch": 48.13351498637602,
+ "grad_norm": 3.0083553791046143,
+ "learning_rate": 1.1088163110312576e-05,
+ "loss": 0.1391,
+ "step": 17665
+ },
+ {
+ "epoch": 48.13623978201635,
+ "grad_norm": 5.607665538787842,
+ "learning_rate": 1.108728585180458e-05,
+ "loss": 0.3079,
+ "step": 17666
+ },
+ {
+ "epoch": 48.13896457765667,
+ "grad_norm": 4.5860595703125,
+ "learning_rate": 1.1086408584828841e-05,
+ "loss": 0.1729,
+ "step": 17667
+ },
+ {
+ "epoch": 48.141689373297005,
+ "grad_norm": 6.232942581176758,
+ "learning_rate": 1.1085531309392186e-05,
+ "loss": 0.086,
+ "step": 17668
+ },
+ {
+ "epoch": 48.14441416893733,
+ "grad_norm": 5.38991641998291,
+ "learning_rate": 1.1084654025501446e-05,
+ "loss": 0.1033,
+ "step": 17669
+ },
+ {
+ "epoch": 48.14713896457766,
+ "grad_norm": 4.217653751373291,
+ "learning_rate": 1.1083776733163459e-05,
+ "loss": 0.12,
+ "step": 17670
+ },
+ {
+ "epoch": 48.14986376021798,
+ "grad_norm": 3.475024938583374,
+ "learning_rate": 1.108289943238505e-05,
+ "loss": 0.1121,
+ "step": 17671
+ },
+ {
+ "epoch": 48.15258855585831,
+ "grad_norm": 4.399120807647705,
+ "learning_rate": 1.108202212317306e-05,
+ "loss": 0.1247,
+ "step": 17672
+ },
+ {
+ "epoch": 48.155313351498634,
+ "grad_norm": 5.111778736114502,
+ "learning_rate": 1.1081144805534311e-05,
+ "loss": 0.2277,
+ "step": 17673
+ },
+ {
+ "epoch": 48.15803814713897,
+ "grad_norm": 5.794163227081299,
+ "learning_rate": 1.1080267479475644e-05,
+ "loss": 0.2108,
+ "step": 17674
+ },
+ {
+ "epoch": 48.16076294277929,
+ "grad_norm": 5.117379665374756,
+ "learning_rate": 1.1079390145003886e-05,
+ "loss": 0.124,
+ "step": 17675
+ },
+ {
+ "epoch": 48.16348773841962,
+ "grad_norm": 4.971923351287842,
+ "learning_rate": 1.1078512802125876e-05,
+ "loss": 0.2581,
+ "step": 17676
+ },
+ {
+ "epoch": 48.166212534059945,
+ "grad_norm": 4.8347368240356445,
+ "learning_rate": 1.1077635450848439e-05,
+ "loss": 0.169,
+ "step": 17677
+ },
+ {
+ "epoch": 48.16893732970027,
+ "grad_norm": 4.8003249168396,
+ "learning_rate": 1.1076758091178417e-05,
+ "loss": 0.2206,
+ "step": 17678
+ },
+ {
+ "epoch": 48.171662125340596,
+ "grad_norm": 4.9459004402160645,
+ "learning_rate": 1.1075880723122632e-05,
+ "loss": 0.1044,
+ "step": 17679
+ },
+ {
+ "epoch": 48.17438692098093,
+ "grad_norm": 4.366501331329346,
+ "learning_rate": 1.1075003346687927e-05,
+ "loss": 0.1245,
+ "step": 17680
+ },
+ {
+ "epoch": 48.177111716621255,
+ "grad_norm": 5.24885368347168,
+ "learning_rate": 1.1074125961881128e-05,
+ "loss": 0.3014,
+ "step": 17681
+ },
+ {
+ "epoch": 48.17983651226158,
+ "grad_norm": 4.298219203948975,
+ "learning_rate": 1.1073248568709073e-05,
+ "loss": 0.1314,
+ "step": 17682
+ },
+ {
+ "epoch": 48.182561307901906,
+ "grad_norm": 4.7655439376831055,
+ "learning_rate": 1.1072371167178591e-05,
+ "loss": 0.2176,
+ "step": 17683
+ },
+ {
+ "epoch": 48.18528610354223,
+ "grad_norm": 4.6595845222473145,
+ "learning_rate": 1.1071493757296515e-05,
+ "loss": 0.1591,
+ "step": 17684
+ },
+ {
+ "epoch": 48.18801089918256,
+ "grad_norm": 5.491793632507324,
+ "learning_rate": 1.1070616339069683e-05,
+ "loss": 0.3436,
+ "step": 17685
+ },
+ {
+ "epoch": 48.19073569482289,
+ "grad_norm": 3.7247369289398193,
+ "learning_rate": 1.1069738912504924e-05,
+ "loss": 0.0642,
+ "step": 17686
+ },
+ {
+ "epoch": 48.19346049046322,
+ "grad_norm": 4.61937952041626,
+ "learning_rate": 1.1068861477609072e-05,
+ "loss": 0.1947,
+ "step": 17687
+ },
+ {
+ "epoch": 48.19618528610354,
+ "grad_norm": 5.518864154815674,
+ "learning_rate": 1.1067984034388963e-05,
+ "loss": 0.1409,
+ "step": 17688
+ },
+ {
+ "epoch": 48.19891008174387,
+ "grad_norm": 4.456373691558838,
+ "learning_rate": 1.1067106582851427e-05,
+ "loss": 0.1544,
+ "step": 17689
+ },
+ {
+ "epoch": 48.201634877384194,
+ "grad_norm": 6.588265419006348,
+ "learning_rate": 1.1066229123003302e-05,
+ "loss": 0.2329,
+ "step": 17690
+ },
+ {
+ "epoch": 48.20435967302452,
+ "grad_norm": 4.4196457862854,
+ "learning_rate": 1.1065351654851417e-05,
+ "loss": 0.115,
+ "step": 17691
+ },
+ {
+ "epoch": 48.20708446866485,
+ "grad_norm": 8.519316673278809,
+ "learning_rate": 1.1064474178402607e-05,
+ "loss": 0.2761,
+ "step": 17692
+ },
+ {
+ "epoch": 48.20980926430518,
+ "grad_norm": 4.9979963302612305,
+ "learning_rate": 1.106359669366371e-05,
+ "loss": 0.1371,
+ "step": 17693
+ },
+ {
+ "epoch": 48.212534059945504,
+ "grad_norm": 4.272399425506592,
+ "learning_rate": 1.1062719200641551e-05,
+ "loss": 0.191,
+ "step": 17694
+ },
+ {
+ "epoch": 48.21525885558583,
+ "grad_norm": 3.858732223510742,
+ "learning_rate": 1.1061841699342975e-05,
+ "loss": 0.1189,
+ "step": 17695
+ },
+ {
+ "epoch": 48.217983651226156,
+ "grad_norm": 4.810211181640625,
+ "learning_rate": 1.1060964189774804e-05,
+ "loss": 0.0938,
+ "step": 17696
+ },
+ {
+ "epoch": 48.22070844686648,
+ "grad_norm": 4.097233772277832,
+ "learning_rate": 1.106008667194388e-05,
+ "loss": 0.1729,
+ "step": 17697
+ },
+ {
+ "epoch": 48.223433242506815,
+ "grad_norm": 5.586561679840088,
+ "learning_rate": 1.1059209145857038e-05,
+ "loss": 0.1512,
+ "step": 17698
+ },
+ {
+ "epoch": 48.22615803814714,
+ "grad_norm": 5.138467311859131,
+ "learning_rate": 1.1058331611521105e-05,
+ "loss": 0.1904,
+ "step": 17699
+ },
+ {
+ "epoch": 48.228882833787466,
+ "grad_norm": 7.284699440002441,
+ "learning_rate": 1.1057454068942923e-05,
+ "loss": 0.1239,
+ "step": 17700
+ },
+ {
+ "epoch": 48.23160762942779,
+ "grad_norm": 4.594121932983398,
+ "learning_rate": 1.105657651812932e-05,
+ "loss": 0.2418,
+ "step": 17701
+ },
+ {
+ "epoch": 48.23433242506812,
+ "grad_norm": 5.351985454559326,
+ "learning_rate": 1.1055698959087133e-05,
+ "loss": 0.0924,
+ "step": 17702
+ },
+ {
+ "epoch": 48.237057220708444,
+ "grad_norm": 3.99371600151062,
+ "learning_rate": 1.10548213918232e-05,
+ "loss": 0.0705,
+ "step": 17703
+ },
+ {
+ "epoch": 48.23978201634878,
+ "grad_norm": 4.211036205291748,
+ "learning_rate": 1.1053943816344348e-05,
+ "loss": 0.3535,
+ "step": 17704
+ },
+ {
+ "epoch": 48.2425068119891,
+ "grad_norm": 5.788252830505371,
+ "learning_rate": 1.1053066232657419e-05,
+ "loss": 0.1866,
+ "step": 17705
+ },
+ {
+ "epoch": 48.24523160762943,
+ "grad_norm": 4.31191349029541,
+ "learning_rate": 1.1052188640769242e-05,
+ "loss": 0.1199,
+ "step": 17706
+ },
+ {
+ "epoch": 48.247956403269754,
+ "grad_norm": 4.442556381225586,
+ "learning_rate": 1.1051311040686654e-05,
+ "loss": 0.2192,
+ "step": 17707
+ },
+ {
+ "epoch": 48.25068119891008,
+ "grad_norm": 4.344634056091309,
+ "learning_rate": 1.105043343241649e-05,
+ "loss": 0.1389,
+ "step": 17708
+ },
+ {
+ "epoch": 48.253405994550405,
+ "grad_norm": 6.456859111785889,
+ "learning_rate": 1.1049555815965583e-05,
+ "loss": 0.2467,
+ "step": 17709
+ },
+ {
+ "epoch": 48.25613079019074,
+ "grad_norm": 4.2649993896484375,
+ "learning_rate": 1.1048678191340766e-05,
+ "loss": 0.1074,
+ "step": 17710
+ },
+ {
+ "epoch": 48.258855585831064,
+ "grad_norm": 6.091101169586182,
+ "learning_rate": 1.1047800558548885e-05,
+ "loss": 0.3346,
+ "step": 17711
+ },
+ {
+ "epoch": 48.26158038147139,
+ "grad_norm": 5.986828804016113,
+ "learning_rate": 1.1046922917596761e-05,
+ "loss": 0.2379,
+ "step": 17712
+ },
+ {
+ "epoch": 48.264305177111716,
+ "grad_norm": 3.8978688716888428,
+ "learning_rate": 1.1046045268491237e-05,
+ "loss": 0.1309,
+ "step": 17713
+ },
+ {
+ "epoch": 48.26702997275204,
+ "grad_norm": 13.23773193359375,
+ "learning_rate": 1.1045167611239145e-05,
+ "loss": 0.2822,
+ "step": 17714
+ },
+ {
+ "epoch": 48.26975476839237,
+ "grad_norm": 4.466581344604492,
+ "learning_rate": 1.1044289945847325e-05,
+ "loss": 0.1192,
+ "step": 17715
+ },
+ {
+ "epoch": 48.2724795640327,
+ "grad_norm": 4.531101226806641,
+ "learning_rate": 1.1043412272322605e-05,
+ "loss": 0.3405,
+ "step": 17716
+ },
+ {
+ "epoch": 48.275204359673026,
+ "grad_norm": 3.8679039478302,
+ "learning_rate": 1.1042534590671825e-05,
+ "loss": 0.2082,
+ "step": 17717
+ },
+ {
+ "epoch": 48.27792915531335,
+ "grad_norm": 4.445958614349365,
+ "learning_rate": 1.1041656900901816e-05,
+ "loss": 0.2833,
+ "step": 17718
+ },
+ {
+ "epoch": 48.28065395095368,
+ "grad_norm": 4.962905406951904,
+ "learning_rate": 1.104077920301942e-05,
+ "loss": 0.1478,
+ "step": 17719
+ },
+ {
+ "epoch": 48.283378746594,
+ "grad_norm": 5.9054951667785645,
+ "learning_rate": 1.1039901497031466e-05,
+ "loss": 0.1653,
+ "step": 17720
+ },
+ {
+ "epoch": 48.28610354223433,
+ "grad_norm": 5.974760055541992,
+ "learning_rate": 1.1039023782944798e-05,
+ "loss": 0.0797,
+ "step": 17721
+ },
+ {
+ "epoch": 48.28882833787466,
+ "grad_norm": 6.065160274505615,
+ "learning_rate": 1.1038146060766241e-05,
+ "loss": 0.1601,
+ "step": 17722
+ },
+ {
+ "epoch": 48.29155313351499,
+ "grad_norm": 5.21046781539917,
+ "learning_rate": 1.103726833050264e-05,
+ "loss": 0.2534,
+ "step": 17723
+ },
+ {
+ "epoch": 48.294277929155314,
+ "grad_norm": 5.575509548187256,
+ "learning_rate": 1.1036390592160824e-05,
+ "loss": 0.2999,
+ "step": 17724
+ },
+ {
+ "epoch": 48.29700272479564,
+ "grad_norm": 4.694852828979492,
+ "learning_rate": 1.1035512845747633e-05,
+ "loss": 0.3159,
+ "step": 17725
+ },
+ {
+ "epoch": 48.299727520435965,
+ "grad_norm": 5.344362735748291,
+ "learning_rate": 1.1034635091269899e-05,
+ "loss": 0.1761,
+ "step": 17726
+ },
+ {
+ "epoch": 48.30245231607629,
+ "grad_norm": 4.941341400146484,
+ "learning_rate": 1.1033757328734461e-05,
+ "loss": 0.2184,
+ "step": 17727
+ },
+ {
+ "epoch": 48.305177111716624,
+ "grad_norm": 3.8010690212249756,
+ "learning_rate": 1.1032879558148152e-05,
+ "loss": 0.1603,
+ "step": 17728
+ },
+ {
+ "epoch": 48.30790190735695,
+ "grad_norm": 4.248983383178711,
+ "learning_rate": 1.1032001779517816e-05,
+ "loss": 0.2535,
+ "step": 17729
+ },
+ {
+ "epoch": 48.310626702997276,
+ "grad_norm": 6.031062126159668,
+ "learning_rate": 1.1031123992850279e-05,
+ "loss": 0.117,
+ "step": 17730
+ },
+ {
+ "epoch": 48.3133514986376,
+ "grad_norm": 3.9195001125335693,
+ "learning_rate": 1.1030246198152386e-05,
+ "loss": 0.0703,
+ "step": 17731
+ },
+ {
+ "epoch": 48.31607629427793,
+ "grad_norm": 4.528135776519775,
+ "learning_rate": 1.1029368395430964e-05,
+ "loss": 0.0937,
+ "step": 17732
+ },
+ {
+ "epoch": 48.31880108991825,
+ "grad_norm": 5.599699974060059,
+ "learning_rate": 1.1028490584692856e-05,
+ "loss": 0.1284,
+ "step": 17733
+ },
+ {
+ "epoch": 48.321525885558586,
+ "grad_norm": 4.686074733734131,
+ "learning_rate": 1.1027612765944895e-05,
+ "loss": 0.1411,
+ "step": 17734
+ },
+ {
+ "epoch": 48.32425068119891,
+ "grad_norm": 5.885397434234619,
+ "learning_rate": 1.102673493919392e-05,
+ "loss": 0.1282,
+ "step": 17735
+ },
+ {
+ "epoch": 48.32697547683924,
+ "grad_norm": 4.175334930419922,
+ "learning_rate": 1.1025857104446765e-05,
+ "loss": 0.1643,
+ "step": 17736
+ },
+ {
+ "epoch": 48.32970027247956,
+ "grad_norm": 6.086652755737305,
+ "learning_rate": 1.1024979261710271e-05,
+ "loss": 0.1401,
+ "step": 17737
+ },
+ {
+ "epoch": 48.33242506811989,
+ "grad_norm": 6.760055065155029,
+ "learning_rate": 1.1024101410991268e-05,
+ "loss": 0.1443,
+ "step": 17738
+ },
+ {
+ "epoch": 48.335149863760215,
+ "grad_norm": 4.661835670471191,
+ "learning_rate": 1.1023223552296601e-05,
+ "loss": 0.3518,
+ "step": 17739
+ },
+ {
+ "epoch": 48.33787465940055,
+ "grad_norm": 5.910048961639404,
+ "learning_rate": 1.1022345685633095e-05,
+ "loss": 0.1884,
+ "step": 17740
+ },
+ {
+ "epoch": 48.34059945504087,
+ "grad_norm": 4.59259557723999,
+ "learning_rate": 1.10214678110076e-05,
+ "loss": 0.1301,
+ "step": 17741
+ },
+ {
+ "epoch": 48.3433242506812,
+ "grad_norm": 4.3317341804504395,
+ "learning_rate": 1.1020589928426944e-05,
+ "loss": 0.1671,
+ "step": 17742
+ },
+ {
+ "epoch": 48.346049046321525,
+ "grad_norm": 4.421215534210205,
+ "learning_rate": 1.1019712037897967e-05,
+ "loss": 0.2242,
+ "step": 17743
+ },
+ {
+ "epoch": 48.34877384196185,
+ "grad_norm": 4.629679203033447,
+ "learning_rate": 1.1018834139427503e-05,
+ "loss": 0.1191,
+ "step": 17744
+ },
+ {
+ "epoch": 48.35149863760218,
+ "grad_norm": 3.6511409282684326,
+ "learning_rate": 1.1017956233022394e-05,
+ "loss": 0.0969,
+ "step": 17745
+ },
+ {
+ "epoch": 48.35422343324251,
+ "grad_norm": 4.725893020629883,
+ "learning_rate": 1.1017078318689473e-05,
+ "loss": 0.1221,
+ "step": 17746
+ },
+ {
+ "epoch": 48.356948228882835,
+ "grad_norm": 4.646679401397705,
+ "learning_rate": 1.1016200396435581e-05,
+ "loss": 0.1594,
+ "step": 17747
+ },
+ {
+ "epoch": 48.35967302452316,
+ "grad_norm": 4.431085586547852,
+ "learning_rate": 1.1015322466267552e-05,
+ "loss": 0.165,
+ "step": 17748
+ },
+ {
+ "epoch": 48.36239782016349,
+ "grad_norm": 6.013887882232666,
+ "learning_rate": 1.1014444528192225e-05,
+ "loss": 0.2449,
+ "step": 17749
+ },
+ {
+ "epoch": 48.36512261580381,
+ "grad_norm": 4.200595378875732,
+ "learning_rate": 1.1013566582216436e-05,
+ "loss": 0.0898,
+ "step": 17750
+ },
+ {
+ "epoch": 48.36784741144414,
+ "grad_norm": 5.01737117767334,
+ "learning_rate": 1.1012688628347024e-05,
+ "loss": 0.0877,
+ "step": 17751
+ },
+ {
+ "epoch": 48.37057220708447,
+ "grad_norm": 4.337869167327881,
+ "learning_rate": 1.1011810666590824e-05,
+ "loss": 0.1086,
+ "step": 17752
+ },
+ {
+ "epoch": 48.3732970027248,
+ "grad_norm": 4.994279861450195,
+ "learning_rate": 1.1010932696954675e-05,
+ "loss": 0.1671,
+ "step": 17753
+ },
+ {
+ "epoch": 48.37602179836512,
+ "grad_norm": 3.789541721343994,
+ "learning_rate": 1.1010054719445414e-05,
+ "loss": 0.224,
+ "step": 17754
+ },
+ {
+ "epoch": 48.37874659400545,
+ "grad_norm": 5.507375240325928,
+ "learning_rate": 1.1009176734069881e-05,
+ "loss": 0.2105,
+ "step": 17755
+ },
+ {
+ "epoch": 48.381471389645775,
+ "grad_norm": 4.9275126457214355,
+ "learning_rate": 1.1008298740834911e-05,
+ "loss": 0.1468,
+ "step": 17756
+ },
+ {
+ "epoch": 48.3841961852861,
+ "grad_norm": 5.050284385681152,
+ "learning_rate": 1.1007420739747345e-05,
+ "loss": 0.2736,
+ "step": 17757
+ },
+ {
+ "epoch": 48.38692098092643,
+ "grad_norm": 6.128137111663818,
+ "learning_rate": 1.1006542730814017e-05,
+ "loss": 0.1295,
+ "step": 17758
+ },
+ {
+ "epoch": 48.38964577656676,
+ "grad_norm": 4.414264678955078,
+ "learning_rate": 1.1005664714041768e-05,
+ "loss": 0.2319,
+ "step": 17759
+ },
+ {
+ "epoch": 48.392370572207085,
+ "grad_norm": 4.139552116394043,
+ "learning_rate": 1.1004786689437433e-05,
+ "loss": 0.191,
+ "step": 17760
+ },
+ {
+ "epoch": 48.39509536784741,
+ "grad_norm": 5.218533039093018,
+ "learning_rate": 1.1003908657007851e-05,
+ "loss": 0.1057,
+ "step": 17761
+ },
+ {
+ "epoch": 48.39782016348774,
+ "grad_norm": 5.753410339355469,
+ "learning_rate": 1.100303061675986e-05,
+ "loss": 0.1035,
+ "step": 17762
+ },
+ {
+ "epoch": 48.40054495912806,
+ "grad_norm": 4.692521095275879,
+ "learning_rate": 1.1002152568700302e-05,
+ "loss": 0.1673,
+ "step": 17763
+ },
+ {
+ "epoch": 48.403269754768395,
+ "grad_norm": 4.142365455627441,
+ "learning_rate": 1.1001274512836011e-05,
+ "loss": 0.1165,
+ "step": 17764
+ },
+ {
+ "epoch": 48.40599455040872,
+ "grad_norm": 5.406883239746094,
+ "learning_rate": 1.1000396449173826e-05,
+ "loss": 0.314,
+ "step": 17765
+ },
+ {
+ "epoch": 48.40871934604905,
+ "grad_norm": 4.213931083679199,
+ "learning_rate": 1.0999518377720587e-05,
+ "loss": 0.1259,
+ "step": 17766
+ },
+ {
+ "epoch": 48.41144414168937,
+ "grad_norm": 4.824357986450195,
+ "learning_rate": 1.099864029848313e-05,
+ "loss": 0.1755,
+ "step": 17767
+ },
+ {
+ "epoch": 48.4141689373297,
+ "grad_norm": 4.123696804046631,
+ "learning_rate": 1.0997762211468292e-05,
+ "loss": 0.2553,
+ "step": 17768
+ },
+ {
+ "epoch": 48.416893732970024,
+ "grad_norm": 8.818885803222656,
+ "learning_rate": 1.0996884116682918e-05,
+ "loss": 0.2187,
+ "step": 17769
+ },
+ {
+ "epoch": 48.41961852861036,
+ "grad_norm": 4.484251499176025,
+ "learning_rate": 1.099600601413384e-05,
+ "loss": 0.1441,
+ "step": 17770
+ },
+ {
+ "epoch": 48.42234332425068,
+ "grad_norm": 4.239068031311035,
+ "learning_rate": 1.09951279038279e-05,
+ "loss": 0.223,
+ "step": 17771
+ },
+ {
+ "epoch": 48.42506811989101,
+ "grad_norm": 4.117552280426025,
+ "learning_rate": 1.0994249785771938e-05,
+ "loss": 0.2856,
+ "step": 17772
+ },
+ {
+ "epoch": 48.427792915531334,
+ "grad_norm": 6.538234233856201,
+ "learning_rate": 1.0993371659972786e-05,
+ "loss": 0.2195,
+ "step": 17773
+ },
+ {
+ "epoch": 48.43051771117166,
+ "grad_norm": 3.74076509475708,
+ "learning_rate": 1.0992493526437288e-05,
+ "loss": 0.1529,
+ "step": 17774
+ },
+ {
+ "epoch": 48.433242506811986,
+ "grad_norm": 4.483790874481201,
+ "learning_rate": 1.0991615385172288e-05,
+ "loss": 0.1295,
+ "step": 17775
+ },
+ {
+ "epoch": 48.43596730245232,
+ "grad_norm": 4.919607639312744,
+ "learning_rate": 1.0990737236184615e-05,
+ "loss": 0.1698,
+ "step": 17776
+ },
+ {
+ "epoch": 48.438692098092645,
+ "grad_norm": 5.5300140380859375,
+ "learning_rate": 1.0989859079481114e-05,
+ "loss": 0.1996,
+ "step": 17777
+ },
+ {
+ "epoch": 48.44141689373297,
+ "grad_norm": 8.211633682250977,
+ "learning_rate": 1.098898091506862e-05,
+ "loss": 0.1651,
+ "step": 17778
+ },
+ {
+ "epoch": 48.444141689373296,
+ "grad_norm": 5.996046543121338,
+ "learning_rate": 1.0988102742953975e-05,
+ "loss": 0.2726,
+ "step": 17779
+ },
+ {
+ "epoch": 48.44686648501362,
+ "grad_norm": 4.44057035446167,
+ "learning_rate": 1.0987224563144018e-05,
+ "loss": 0.0924,
+ "step": 17780
+ },
+ {
+ "epoch": 48.44959128065395,
+ "grad_norm": 5.444934844970703,
+ "learning_rate": 1.098634637564559e-05,
+ "loss": 0.1428,
+ "step": 17781
+ },
+ {
+ "epoch": 48.45231607629428,
+ "grad_norm": 3.993893623352051,
+ "learning_rate": 1.0985468180465525e-05,
+ "loss": 0.1146,
+ "step": 17782
+ },
+ {
+ "epoch": 48.45504087193461,
+ "grad_norm": 4.247274875640869,
+ "learning_rate": 1.0984589977610669e-05,
+ "loss": 0.195,
+ "step": 17783
+ },
+ {
+ "epoch": 48.45776566757493,
+ "grad_norm": 4.251191139221191,
+ "learning_rate": 1.0983711767087856e-05,
+ "loss": 0.1395,
+ "step": 17784
+ },
+ {
+ "epoch": 48.46049046321526,
+ "grad_norm": 4.462006092071533,
+ "learning_rate": 1.0982833548903926e-05,
+ "loss": 0.1132,
+ "step": 17785
+ },
+ {
+ "epoch": 48.463215258855584,
+ "grad_norm": 3.7238845825195312,
+ "learning_rate": 1.0981955323065723e-05,
+ "loss": 0.1435,
+ "step": 17786
+ },
+ {
+ "epoch": 48.46594005449591,
+ "grad_norm": 4.878916263580322,
+ "learning_rate": 1.098107708958008e-05,
+ "loss": 0.2097,
+ "step": 17787
+ },
+ {
+ "epoch": 48.46866485013624,
+ "grad_norm": 5.452115058898926,
+ "learning_rate": 1.0980198848453843e-05,
+ "loss": 0.1718,
+ "step": 17788
+ },
+ {
+ "epoch": 48.47138964577657,
+ "grad_norm": 4.800817966461182,
+ "learning_rate": 1.0979320599693848e-05,
+ "loss": 0.1466,
+ "step": 17789
+ },
+ {
+ "epoch": 48.474114441416894,
+ "grad_norm": 3.7360053062438965,
+ "learning_rate": 1.0978442343306936e-05,
+ "loss": 0.2216,
+ "step": 17790
+ },
+ {
+ "epoch": 48.47683923705722,
+ "grad_norm": 3.831552505493164,
+ "learning_rate": 1.0977564079299946e-05,
+ "loss": 0.1302,
+ "step": 17791
+ },
+ {
+ "epoch": 48.479564032697546,
+ "grad_norm": 3.7697205543518066,
+ "learning_rate": 1.0976685807679719e-05,
+ "loss": 0.2297,
+ "step": 17792
+ },
+ {
+ "epoch": 48.48228882833787,
+ "grad_norm": 6.190758228302002,
+ "learning_rate": 1.0975807528453093e-05,
+ "loss": 0.1273,
+ "step": 17793
+ },
+ {
+ "epoch": 48.485013623978205,
+ "grad_norm": 4.133101940155029,
+ "learning_rate": 1.0974929241626912e-05,
+ "loss": 0.2018,
+ "step": 17794
+ },
+ {
+ "epoch": 48.48773841961853,
+ "grad_norm": 5.943972110748291,
+ "learning_rate": 1.0974050947208012e-05,
+ "loss": 0.1339,
+ "step": 17795
+ },
+ {
+ "epoch": 48.490463215258856,
+ "grad_norm": 7.384430408477783,
+ "learning_rate": 1.0973172645203235e-05,
+ "loss": 0.1288,
+ "step": 17796
+ },
+ {
+ "epoch": 48.49318801089918,
+ "grad_norm": 4.5868377685546875,
+ "learning_rate": 1.0972294335619418e-05,
+ "loss": 0.0871,
+ "step": 17797
+ },
+ {
+ "epoch": 48.49591280653951,
+ "grad_norm": 4.389998912811279,
+ "learning_rate": 1.0971416018463406e-05,
+ "loss": 0.1223,
+ "step": 17798
+ },
+ {
+ "epoch": 48.49863760217983,
+ "grad_norm": 3.918980598449707,
+ "learning_rate": 1.0970537693742038e-05,
+ "loss": 0.2619,
+ "step": 17799
+ },
+ {
+ "epoch": 48.50136239782017,
+ "grad_norm": 4.901152610778809,
+ "learning_rate": 1.0969659361462153e-05,
+ "loss": 0.1312,
+ "step": 17800
+ },
+ {
+ "epoch": 48.50408719346049,
+ "grad_norm": 4.2105865478515625,
+ "learning_rate": 1.0968781021630593e-05,
+ "loss": 0.198,
+ "step": 17801
+ },
+ {
+ "epoch": 48.50681198910082,
+ "grad_norm": 6.870593070983887,
+ "learning_rate": 1.0967902674254199e-05,
+ "loss": 0.1419,
+ "step": 17802
+ },
+ {
+ "epoch": 48.509536784741144,
+ "grad_norm": 4.70383358001709,
+ "learning_rate": 1.0967024319339806e-05,
+ "loss": 0.1556,
+ "step": 17803
+ },
+ {
+ "epoch": 48.51226158038147,
+ "grad_norm": 4.624796390533447,
+ "learning_rate": 1.0966145956894259e-05,
+ "loss": 0.1064,
+ "step": 17804
+ },
+ {
+ "epoch": 48.514986376021795,
+ "grad_norm": 5.43842077255249,
+ "learning_rate": 1.0965267586924399e-05,
+ "loss": 0.2489,
+ "step": 17805
+ },
+ {
+ "epoch": 48.51771117166213,
+ "grad_norm": 4.296053886413574,
+ "learning_rate": 1.096438920943707e-05,
+ "loss": 0.219,
+ "step": 17806
+ },
+ {
+ "epoch": 48.520435967302454,
+ "grad_norm": 3.50492000579834,
+ "learning_rate": 1.0963510824439102e-05,
+ "loss": 0.1002,
+ "step": 17807
+ },
+ {
+ "epoch": 48.52316076294278,
+ "grad_norm": 5.498265266418457,
+ "learning_rate": 1.096263243193735e-05,
+ "loss": 0.1517,
+ "step": 17808
+ },
+ {
+ "epoch": 48.525885558583106,
+ "grad_norm": 4.727783203125,
+ "learning_rate": 1.0961754031938643e-05,
+ "loss": 0.2114,
+ "step": 17809
+ },
+ {
+ "epoch": 48.52861035422343,
+ "grad_norm": 5.354934215545654,
+ "learning_rate": 1.096087562444983e-05,
+ "loss": 0.1706,
+ "step": 17810
+ },
+ {
+ "epoch": 48.53133514986376,
+ "grad_norm": 4.985727787017822,
+ "learning_rate": 1.0959997209477747e-05,
+ "loss": 0.1196,
+ "step": 17811
+ },
+ {
+ "epoch": 48.53405994550409,
+ "grad_norm": 4.712111473083496,
+ "learning_rate": 1.0959118787029236e-05,
+ "loss": 0.1507,
+ "step": 17812
+ },
+ {
+ "epoch": 48.536784741144416,
+ "grad_norm": 6.8252058029174805,
+ "learning_rate": 1.0958240357111136e-05,
+ "loss": 0.2059,
+ "step": 17813
+ },
+ {
+ "epoch": 48.53950953678474,
+ "grad_norm": 4.87732458114624,
+ "learning_rate": 1.0957361919730293e-05,
+ "loss": 0.1522,
+ "step": 17814
+ },
+ {
+ "epoch": 48.54223433242507,
+ "grad_norm": 3.610193967819214,
+ "learning_rate": 1.095648347489355e-05,
+ "loss": 0.1651,
+ "step": 17815
+ },
+ {
+ "epoch": 48.54495912806539,
+ "grad_norm": 5.8085551261901855,
+ "learning_rate": 1.095560502260774e-05,
+ "loss": 0.127,
+ "step": 17816
+ },
+ {
+ "epoch": 48.54768392370572,
+ "grad_norm": 3.7117836475372314,
+ "learning_rate": 1.0954726562879709e-05,
+ "loss": 0.0835,
+ "step": 17817
+ },
+ {
+ "epoch": 48.55040871934605,
+ "grad_norm": 3.1796491146087646,
+ "learning_rate": 1.0953848095716302e-05,
+ "loss": 0.0797,
+ "step": 17818
+ },
+ {
+ "epoch": 48.55313351498638,
+ "grad_norm": 4.152004241943359,
+ "learning_rate": 1.0952969621124354e-05,
+ "loss": 0.1352,
+ "step": 17819
+ },
+ {
+ "epoch": 48.555858310626704,
+ "grad_norm": 7.578192710876465,
+ "learning_rate": 1.095209113911071e-05,
+ "loss": 0.2625,
+ "step": 17820
+ },
+ {
+ "epoch": 48.55858310626703,
+ "grad_norm": 4.083261013031006,
+ "learning_rate": 1.0951212649682208e-05,
+ "loss": 0.0693,
+ "step": 17821
+ },
+ {
+ "epoch": 48.561307901907355,
+ "grad_norm": 4.408059120178223,
+ "learning_rate": 1.0950334152845697e-05,
+ "loss": 0.2066,
+ "step": 17822
+ },
+ {
+ "epoch": 48.56403269754768,
+ "grad_norm": 5.4838547706604,
+ "learning_rate": 1.094945564860801e-05,
+ "loss": 0.138,
+ "step": 17823
+ },
+ {
+ "epoch": 48.566757493188014,
+ "grad_norm": 4.158769607543945,
+ "learning_rate": 1.0948577136975998e-05,
+ "loss": 0.2052,
+ "step": 17824
+ },
+ {
+ "epoch": 48.56948228882834,
+ "grad_norm": 6.033012866973877,
+ "learning_rate": 1.0947698617956493e-05,
+ "loss": 0.1823,
+ "step": 17825
+ },
+ {
+ "epoch": 48.572207084468666,
+ "grad_norm": 4.139128684997559,
+ "learning_rate": 1.0946820091556345e-05,
+ "loss": 0.2572,
+ "step": 17826
+ },
+ {
+ "epoch": 48.57493188010899,
+ "grad_norm": 4.893764495849609,
+ "learning_rate": 1.0945941557782389e-05,
+ "loss": 0.1458,
+ "step": 17827
+ },
+ {
+ "epoch": 48.57765667574932,
+ "grad_norm": 4.853830337524414,
+ "learning_rate": 1.0945063016641475e-05,
+ "loss": 0.1359,
+ "step": 17828
+ },
+ {
+ "epoch": 48.58038147138964,
+ "grad_norm": 4.356120586395264,
+ "learning_rate": 1.0944184468140438e-05,
+ "loss": 0.2207,
+ "step": 17829
+ },
+ {
+ "epoch": 48.583106267029976,
+ "grad_norm": 4.447303295135498,
+ "learning_rate": 1.0943305912286122e-05,
+ "loss": 0.218,
+ "step": 17830
+ },
+ {
+ "epoch": 48.5858310626703,
+ "grad_norm": 4.7632246017456055,
+ "learning_rate": 1.0942427349085369e-05,
+ "loss": 0.1986,
+ "step": 17831
+ },
+ {
+ "epoch": 48.58855585831063,
+ "grad_norm": 5.0486860275268555,
+ "learning_rate": 1.0941548778545026e-05,
+ "loss": 0.2096,
+ "step": 17832
+ },
+ {
+ "epoch": 48.59128065395095,
+ "grad_norm": 4.926656246185303,
+ "learning_rate": 1.0940670200671927e-05,
+ "loss": 0.1386,
+ "step": 17833
+ },
+ {
+ "epoch": 48.59400544959128,
+ "grad_norm": 6.114628791809082,
+ "learning_rate": 1.0939791615472925e-05,
+ "loss": 0.1548,
+ "step": 17834
+ },
+ {
+ "epoch": 48.596730245231605,
+ "grad_norm": 4.695802211761475,
+ "learning_rate": 1.093891302295485e-05,
+ "loss": 0.131,
+ "step": 17835
+ },
+ {
+ "epoch": 48.59945504087194,
+ "grad_norm": 4.727912902832031,
+ "learning_rate": 1.0938034423124556e-05,
+ "loss": 0.2326,
+ "step": 17836
+ },
+ {
+ "epoch": 48.60217983651226,
+ "grad_norm": 5.18319845199585,
+ "learning_rate": 1.0937155815988876e-05,
+ "loss": 0.135,
+ "step": 17837
+ },
+ {
+ "epoch": 48.60490463215259,
+ "grad_norm": 4.774102210998535,
+ "learning_rate": 1.0936277201554659e-05,
+ "loss": 0.1554,
+ "step": 17838
+ },
+ {
+ "epoch": 48.607629427792915,
+ "grad_norm": 4.480764389038086,
+ "learning_rate": 1.093539857982874e-05,
+ "loss": 0.0951,
+ "step": 17839
+ },
+ {
+ "epoch": 48.61035422343324,
+ "grad_norm": 5.493941307067871,
+ "learning_rate": 1.0934519950817975e-05,
+ "loss": 0.145,
+ "step": 17840
+ },
+ {
+ "epoch": 48.61307901907357,
+ "grad_norm": 12.467942237854004,
+ "learning_rate": 1.0933641314529194e-05,
+ "loss": 0.1568,
+ "step": 17841
+ },
+ {
+ "epoch": 48.6158038147139,
+ "grad_norm": 4.472496509552002,
+ "learning_rate": 1.0932762670969245e-05,
+ "loss": 0.3599,
+ "step": 17842
+ },
+ {
+ "epoch": 48.618528610354225,
+ "grad_norm": 4.142789840698242,
+ "learning_rate": 1.093188402014497e-05,
+ "loss": 0.1164,
+ "step": 17843
+ },
+ {
+ "epoch": 48.62125340599455,
+ "grad_norm": 11.64066219329834,
+ "learning_rate": 1.0931005362063215e-05,
+ "loss": 0.0925,
+ "step": 17844
+ },
+ {
+ "epoch": 48.62397820163488,
+ "grad_norm": 4.357254505157471,
+ "learning_rate": 1.0930126696730817e-05,
+ "loss": 0.1776,
+ "step": 17845
+ },
+ {
+ "epoch": 48.6267029972752,
+ "grad_norm": 4.873206615447998,
+ "learning_rate": 1.0929248024154623e-05,
+ "loss": 0.114,
+ "step": 17846
+ },
+ {
+ "epoch": 48.62942779291553,
+ "grad_norm": 3.566783905029297,
+ "learning_rate": 1.0928369344341475e-05,
+ "loss": 0.0887,
+ "step": 17847
+ },
+ {
+ "epoch": 48.63215258855586,
+ "grad_norm": 4.783731460571289,
+ "learning_rate": 1.0927490657298217e-05,
+ "loss": 0.3098,
+ "step": 17848
+ },
+ {
+ "epoch": 48.63487738419619,
+ "grad_norm": 9.20406436920166,
+ "learning_rate": 1.092661196303169e-05,
+ "loss": 0.1396,
+ "step": 17849
+ },
+ {
+ "epoch": 48.63760217983651,
+ "grad_norm": 5.053576469421387,
+ "learning_rate": 1.092573326154874e-05,
+ "loss": 0.1924,
+ "step": 17850
+ },
+ {
+ "epoch": 48.64032697547684,
+ "grad_norm": 6.097115516662598,
+ "learning_rate": 1.092485455285621e-05,
+ "loss": 0.188,
+ "step": 17851
+ },
+ {
+ "epoch": 48.643051771117165,
+ "grad_norm": 4.562507629394531,
+ "learning_rate": 1.0923975836960945e-05,
+ "loss": 0.1523,
+ "step": 17852
+ },
+ {
+ "epoch": 48.64577656675749,
+ "grad_norm": 5.5145063400268555,
+ "learning_rate": 1.092309711386978e-05,
+ "loss": 0.2023,
+ "step": 17853
+ },
+ {
+ "epoch": 48.64850136239782,
+ "grad_norm": 3.9514994621276855,
+ "learning_rate": 1.0922218383589571e-05,
+ "loss": 0.147,
+ "step": 17854
+ },
+ {
+ "epoch": 48.65122615803815,
+ "grad_norm": 4.680118083953857,
+ "learning_rate": 1.0921339646127149e-05,
+ "loss": 0.2202,
+ "step": 17855
+ },
+ {
+ "epoch": 48.653950953678475,
+ "grad_norm": 5.517587184906006,
+ "learning_rate": 1.0920460901489367e-05,
+ "loss": 0.2085,
+ "step": 17856
+ },
+ {
+ "epoch": 48.6566757493188,
+ "grad_norm": 4.694092750549316,
+ "learning_rate": 1.0919582149683063e-05,
+ "loss": 0.1227,
+ "step": 17857
+ },
+ {
+ "epoch": 48.65940054495913,
+ "grad_norm": 4.772033214569092,
+ "learning_rate": 1.0918703390715085e-05,
+ "loss": 0.1051,
+ "step": 17858
+ },
+ {
+ "epoch": 48.66212534059945,
+ "grad_norm": 4.644705772399902,
+ "learning_rate": 1.0917824624592275e-05,
+ "loss": 0.1581,
+ "step": 17859
+ },
+ {
+ "epoch": 48.664850136239785,
+ "grad_norm": 8.996315956115723,
+ "learning_rate": 1.0916945851321472e-05,
+ "loss": 0.137,
+ "step": 17860
+ },
+ {
+ "epoch": 48.66757493188011,
+ "grad_norm": 3.949974775314331,
+ "learning_rate": 1.0916067070909526e-05,
+ "loss": 0.2643,
+ "step": 17861
+ },
+ {
+ "epoch": 48.67029972752044,
+ "grad_norm": 5.861550807952881,
+ "learning_rate": 1.0915188283363282e-05,
+ "loss": 0.2017,
+ "step": 17862
+ },
+ {
+ "epoch": 48.67302452316076,
+ "grad_norm": 5.690976142883301,
+ "learning_rate": 1.0914309488689578e-05,
+ "loss": 0.2188,
+ "step": 17863
+ },
+ {
+ "epoch": 48.67574931880109,
+ "grad_norm": 4.927664279937744,
+ "learning_rate": 1.0913430686895261e-05,
+ "loss": 0.0955,
+ "step": 17864
+ },
+ {
+ "epoch": 48.678474114441414,
+ "grad_norm": 4.175412654876709,
+ "learning_rate": 1.0912551877987179e-05,
+ "loss": 0.1394,
+ "step": 17865
+ },
+ {
+ "epoch": 48.68119891008175,
+ "grad_norm": 7.90694522857666,
+ "learning_rate": 1.0911673061972168e-05,
+ "loss": 0.3055,
+ "step": 17866
+ },
+ {
+ "epoch": 48.68392370572207,
+ "grad_norm": 5.071043968200684,
+ "learning_rate": 1.0910794238857082e-05,
+ "loss": 0.2462,
+ "step": 17867
+ },
+ {
+ "epoch": 48.6866485013624,
+ "grad_norm": 3.9485936164855957,
+ "learning_rate": 1.0909915408648755e-05,
+ "loss": 0.1552,
+ "step": 17868
+ },
+ {
+ "epoch": 48.689373297002724,
+ "grad_norm": 4.367345809936523,
+ "learning_rate": 1.0909036571354037e-05,
+ "loss": 0.0789,
+ "step": 17869
+ },
+ {
+ "epoch": 48.69209809264305,
+ "grad_norm": 6.0083417892456055,
+ "learning_rate": 1.0908157726979772e-05,
+ "loss": 0.2444,
+ "step": 17870
+ },
+ {
+ "epoch": 48.694822888283376,
+ "grad_norm": 4.69628381729126,
+ "learning_rate": 1.0907278875532805e-05,
+ "loss": 0.2709,
+ "step": 17871
+ },
+ {
+ "epoch": 48.69754768392371,
+ "grad_norm": 5.077993392944336,
+ "learning_rate": 1.0906400017019976e-05,
+ "loss": 0.1828,
+ "step": 17872
+ },
+ {
+ "epoch": 48.700272479564035,
+ "grad_norm": 8.109603881835938,
+ "learning_rate": 1.0905521151448132e-05,
+ "loss": 0.194,
+ "step": 17873
+ },
+ {
+ "epoch": 48.70299727520436,
+ "grad_norm": 4.917482852935791,
+ "learning_rate": 1.0904642278824122e-05,
+ "loss": 0.1781,
+ "step": 17874
+ },
+ {
+ "epoch": 48.705722070844686,
+ "grad_norm": 7.983536243438721,
+ "learning_rate": 1.0903763399154787e-05,
+ "loss": 0.1718,
+ "step": 17875
+ },
+ {
+ "epoch": 48.70844686648501,
+ "grad_norm": 4.195606708526611,
+ "learning_rate": 1.0902884512446972e-05,
+ "loss": 0.1059,
+ "step": 17876
+ },
+ {
+ "epoch": 48.71117166212534,
+ "grad_norm": 4.410258769989014,
+ "learning_rate": 1.090200561870752e-05,
+ "loss": 0.1021,
+ "step": 17877
+ },
+ {
+ "epoch": 48.71389645776567,
+ "grad_norm": 4.368112087249756,
+ "learning_rate": 1.0901126717943277e-05,
+ "loss": 0.1574,
+ "step": 17878
+ },
+ {
+ "epoch": 48.716621253406,
+ "grad_norm": 3.8354806900024414,
+ "learning_rate": 1.0900247810161091e-05,
+ "loss": 0.1346,
+ "step": 17879
+ },
+ {
+ "epoch": 48.71934604904632,
+ "grad_norm": 3.4195239543914795,
+ "learning_rate": 1.0899368895367802e-05,
+ "loss": 0.1244,
+ "step": 17880
+ },
+ {
+ "epoch": 48.72207084468665,
+ "grad_norm": 4.415281295776367,
+ "learning_rate": 1.0898489973570256e-05,
+ "loss": 0.1332,
+ "step": 17881
+ },
+ {
+ "epoch": 48.724795640326974,
+ "grad_norm": 6.313999652862549,
+ "learning_rate": 1.0897611044775299e-05,
+ "loss": 0.155,
+ "step": 17882
+ },
+ {
+ "epoch": 48.7275204359673,
+ "grad_norm": 5.8819804191589355,
+ "learning_rate": 1.0896732108989775e-05,
+ "loss": 0.1077,
+ "step": 17883
+ },
+ {
+ "epoch": 48.73024523160763,
+ "grad_norm": 5.503526210784912,
+ "learning_rate": 1.0895853166220534e-05,
+ "loss": 0.1199,
+ "step": 17884
+ },
+ {
+ "epoch": 48.73297002724796,
+ "grad_norm": 5.5648369789123535,
+ "learning_rate": 1.0894974216474415e-05,
+ "loss": 0.1902,
+ "step": 17885
+ },
+ {
+ "epoch": 48.735694822888284,
+ "grad_norm": 6.182637691497803,
+ "learning_rate": 1.0894095259758267e-05,
+ "loss": 0.1331,
+ "step": 17886
+ },
+ {
+ "epoch": 48.73841961852861,
+ "grad_norm": 5.193334579467773,
+ "learning_rate": 1.0893216296078932e-05,
+ "loss": 0.2414,
+ "step": 17887
+ },
+ {
+ "epoch": 48.741144414168936,
+ "grad_norm": 4.44490909576416,
+ "learning_rate": 1.0892337325443259e-05,
+ "loss": 0.2874,
+ "step": 17888
+ },
+ {
+ "epoch": 48.74386920980926,
+ "grad_norm": 4.241389274597168,
+ "learning_rate": 1.089145834785809e-05,
+ "loss": 0.2356,
+ "step": 17889
+ },
+ {
+ "epoch": 48.746594005449595,
+ "grad_norm": 4.388084888458252,
+ "learning_rate": 1.0890579363330271e-05,
+ "loss": 0.1595,
+ "step": 17890
+ },
+ {
+ "epoch": 48.74931880108992,
+ "grad_norm": 5.427707672119141,
+ "learning_rate": 1.0889700371866651e-05,
+ "loss": 0.4053,
+ "step": 17891
+ },
+ {
+ "epoch": 48.752043596730246,
+ "grad_norm": 4.970544815063477,
+ "learning_rate": 1.0888821373474073e-05,
+ "loss": 0.1579,
+ "step": 17892
+ },
+ {
+ "epoch": 48.75476839237057,
+ "grad_norm": 3.7840118408203125,
+ "learning_rate": 1.0887942368159384e-05,
+ "loss": 0.1369,
+ "step": 17893
+ },
+ {
+ "epoch": 48.7574931880109,
+ "grad_norm": 4.346770763397217,
+ "learning_rate": 1.0887063355929426e-05,
+ "loss": 0.0802,
+ "step": 17894
+ },
+ {
+ "epoch": 48.76021798365122,
+ "grad_norm": 4.558623313903809,
+ "learning_rate": 1.0886184336791047e-05,
+ "loss": 0.2136,
+ "step": 17895
+ },
+ {
+ "epoch": 48.762942779291556,
+ "grad_norm": 4.797070026397705,
+ "learning_rate": 1.0885305310751095e-05,
+ "loss": 0.0827,
+ "step": 17896
+ },
+ {
+ "epoch": 48.76566757493188,
+ "grad_norm": 4.973506450653076,
+ "learning_rate": 1.0884426277816413e-05,
+ "loss": 0.1287,
+ "step": 17897
+ },
+ {
+ "epoch": 48.76839237057221,
+ "grad_norm": 5.083658218383789,
+ "learning_rate": 1.0883547237993846e-05,
+ "loss": 0.2286,
+ "step": 17898
+ },
+ {
+ "epoch": 48.771117166212534,
+ "grad_norm": 5.547389507293701,
+ "learning_rate": 1.0882668191290242e-05,
+ "loss": 0.2499,
+ "step": 17899
+ },
+ {
+ "epoch": 48.77384196185286,
+ "grad_norm": 4.125782012939453,
+ "learning_rate": 1.0881789137712446e-05,
+ "loss": 0.1324,
+ "step": 17900
+ },
+ {
+ "epoch": 48.776566757493185,
+ "grad_norm": 4.395590782165527,
+ "learning_rate": 1.0880910077267308e-05,
+ "loss": 0.1084,
+ "step": 17901
+ },
+ {
+ "epoch": 48.77929155313352,
+ "grad_norm": 4.682062149047852,
+ "learning_rate": 1.0880031009961667e-05,
+ "loss": 0.2002,
+ "step": 17902
+ },
+ {
+ "epoch": 48.782016348773844,
+ "grad_norm": 4.319581508636475,
+ "learning_rate": 1.0879151935802376e-05,
+ "loss": 0.1735,
+ "step": 17903
+ },
+ {
+ "epoch": 48.78474114441417,
+ "grad_norm": 4.89421272277832,
+ "learning_rate": 1.0878272854796274e-05,
+ "loss": 0.2112,
+ "step": 17904
+ },
+ {
+ "epoch": 48.787465940054496,
+ "grad_norm": 3.7251944541931152,
+ "learning_rate": 1.0877393766950217e-05,
+ "loss": 0.0972,
+ "step": 17905
+ },
+ {
+ "epoch": 48.79019073569482,
+ "grad_norm": 4.159662246704102,
+ "learning_rate": 1.0876514672271041e-05,
+ "loss": 0.1897,
+ "step": 17906
+ },
+ {
+ "epoch": 48.79291553133515,
+ "grad_norm": 5.107697486877441,
+ "learning_rate": 1.0875635570765596e-05,
+ "loss": 0.3254,
+ "step": 17907
+ },
+ {
+ "epoch": 48.79564032697548,
+ "grad_norm": 4.411425590515137,
+ "learning_rate": 1.0874756462440732e-05,
+ "loss": 0.1898,
+ "step": 17908
+ },
+ {
+ "epoch": 48.798365122615806,
+ "grad_norm": 3.6324493885040283,
+ "learning_rate": 1.0873877347303295e-05,
+ "loss": 0.1586,
+ "step": 17909
+ },
+ {
+ "epoch": 48.80108991825613,
+ "grad_norm": 5.099329948425293,
+ "learning_rate": 1.0872998225360126e-05,
+ "loss": 0.1069,
+ "step": 17910
+ },
+ {
+ "epoch": 48.80381471389646,
+ "grad_norm": 4.622508525848389,
+ "learning_rate": 1.0872119096618074e-05,
+ "loss": 0.1519,
+ "step": 17911
+ },
+ {
+ "epoch": 48.80653950953678,
+ "grad_norm": 5.181702136993408,
+ "learning_rate": 1.0871239961083987e-05,
+ "loss": 0.1398,
+ "step": 17912
+ },
+ {
+ "epoch": 48.80926430517711,
+ "grad_norm": 3.86995792388916,
+ "learning_rate": 1.0870360818764716e-05,
+ "loss": 0.1343,
+ "step": 17913
+ },
+ {
+ "epoch": 48.81198910081744,
+ "grad_norm": 4.519218444824219,
+ "learning_rate": 1.0869481669667097e-05,
+ "loss": 0.1195,
+ "step": 17914
+ },
+ {
+ "epoch": 48.81471389645777,
+ "grad_norm": 7.27349853515625,
+ "learning_rate": 1.0868602513797989e-05,
+ "loss": 0.2016,
+ "step": 17915
+ },
+ {
+ "epoch": 48.817438692098094,
+ "grad_norm": 3.614105701446533,
+ "learning_rate": 1.0867723351164223e-05,
+ "loss": 0.2255,
+ "step": 17916
+ },
+ {
+ "epoch": 48.82016348773842,
+ "grad_norm": 4.0133442878723145,
+ "learning_rate": 1.0866844181772662e-05,
+ "loss": 0.1782,
+ "step": 17917
+ },
+ {
+ "epoch": 48.822888283378745,
+ "grad_norm": 4.203430652618408,
+ "learning_rate": 1.0865965005630147e-05,
+ "loss": 0.1177,
+ "step": 17918
+ },
+ {
+ "epoch": 48.82561307901907,
+ "grad_norm": 4.711203575134277,
+ "learning_rate": 1.0865085822743521e-05,
+ "loss": 0.1313,
+ "step": 17919
+ },
+ {
+ "epoch": 48.828337874659404,
+ "grad_norm": 6.362487316131592,
+ "learning_rate": 1.0864206633119637e-05,
+ "loss": 0.3236,
+ "step": 17920
+ },
+ {
+ "epoch": 48.83106267029973,
+ "grad_norm": 4.486247539520264,
+ "learning_rate": 1.0863327436765342e-05,
+ "loss": 0.211,
+ "step": 17921
+ },
+ {
+ "epoch": 48.833787465940055,
+ "grad_norm": 5.597450256347656,
+ "learning_rate": 1.0862448233687475e-05,
+ "loss": 0.1327,
+ "step": 17922
+ },
+ {
+ "epoch": 48.83651226158038,
+ "grad_norm": 5.655049800872803,
+ "learning_rate": 1.0861569023892893e-05,
+ "loss": 0.139,
+ "step": 17923
+ },
+ {
+ "epoch": 48.83923705722071,
+ "grad_norm": 4.612045764923096,
+ "learning_rate": 1.0860689807388437e-05,
+ "loss": 0.1858,
+ "step": 17924
+ },
+ {
+ "epoch": 48.84196185286103,
+ "grad_norm": 6.127689838409424,
+ "learning_rate": 1.0859810584180956e-05,
+ "loss": 0.207,
+ "step": 17925
+ },
+ {
+ "epoch": 48.844686648501366,
+ "grad_norm": 4.130288600921631,
+ "learning_rate": 1.0858931354277299e-05,
+ "loss": 0.1206,
+ "step": 17926
+ },
+ {
+ "epoch": 48.84741144414169,
+ "grad_norm": 4.735872268676758,
+ "learning_rate": 1.0858052117684312e-05,
+ "loss": 0.1348,
+ "step": 17927
+ },
+ {
+ "epoch": 48.85013623978202,
+ "grad_norm": 4.604114532470703,
+ "learning_rate": 1.0857172874408844e-05,
+ "loss": 0.2167,
+ "step": 17928
+ },
+ {
+ "epoch": 48.85286103542234,
+ "grad_norm": 4.775600910186768,
+ "learning_rate": 1.0856293624457741e-05,
+ "loss": 0.3827,
+ "step": 17929
+ },
+ {
+ "epoch": 48.85558583106267,
+ "grad_norm": 3.6267833709716797,
+ "learning_rate": 1.0855414367837848e-05,
+ "loss": 0.0815,
+ "step": 17930
+ },
+ {
+ "epoch": 48.858310626702995,
+ "grad_norm": 4.787769317626953,
+ "learning_rate": 1.0854535104556019e-05,
+ "loss": 0.0944,
+ "step": 17931
+ },
+ {
+ "epoch": 48.86103542234333,
+ "grad_norm": 5.059425354003906,
+ "learning_rate": 1.0853655834619096e-05,
+ "loss": 0.1597,
+ "step": 17932
+ },
+ {
+ "epoch": 48.86376021798365,
+ "grad_norm": 4.373810768127441,
+ "learning_rate": 1.0852776558033928e-05,
+ "loss": 0.1992,
+ "step": 17933
+ },
+ {
+ "epoch": 48.86648501362398,
+ "grad_norm": 8.81373405456543,
+ "learning_rate": 1.0851897274807368e-05,
+ "loss": 0.2454,
+ "step": 17934
+ },
+ {
+ "epoch": 48.869209809264305,
+ "grad_norm": 4.95613431930542,
+ "learning_rate": 1.0851017984946255e-05,
+ "loss": 0.1094,
+ "step": 17935
+ },
+ {
+ "epoch": 48.87193460490463,
+ "grad_norm": 4.967520713806152,
+ "learning_rate": 1.0850138688457441e-05,
+ "loss": 0.1375,
+ "step": 17936
+ },
+ {
+ "epoch": 48.87465940054496,
+ "grad_norm": 6.082039833068848,
+ "learning_rate": 1.0849259385347779e-05,
+ "loss": 0.2957,
+ "step": 17937
+ },
+ {
+ "epoch": 48.87738419618529,
+ "grad_norm": 4.3331685066223145,
+ "learning_rate": 1.0848380075624107e-05,
+ "loss": 0.2389,
+ "step": 17938
+ },
+ {
+ "epoch": 48.880108991825615,
+ "grad_norm": 6.027491092681885,
+ "learning_rate": 1.0847500759293284e-05,
+ "loss": 0.1063,
+ "step": 17939
+ },
+ {
+ "epoch": 48.88283378746594,
+ "grad_norm": 3.9232709407806396,
+ "learning_rate": 1.0846621436362146e-05,
+ "loss": 0.1005,
+ "step": 17940
+ },
+ {
+ "epoch": 48.88555858310627,
+ "grad_norm": 3.850847005844116,
+ "learning_rate": 1.0845742106837553e-05,
+ "loss": 0.1297,
+ "step": 17941
+ },
+ {
+ "epoch": 48.88828337874659,
+ "grad_norm": 8.043157577514648,
+ "learning_rate": 1.0844862770726344e-05,
+ "loss": 0.1501,
+ "step": 17942
+ },
+ {
+ "epoch": 48.89100817438692,
+ "grad_norm": 4.68732213973999,
+ "learning_rate": 1.0843983428035372e-05,
+ "loss": 0.1081,
+ "step": 17943
+ },
+ {
+ "epoch": 48.89373297002725,
+ "grad_norm": 4.118488311767578,
+ "learning_rate": 1.0843104078771485e-05,
+ "loss": 0.0933,
+ "step": 17944
+ },
+ {
+ "epoch": 48.89645776566758,
+ "grad_norm": 4.96099853515625,
+ "learning_rate": 1.0842224722941528e-05,
+ "loss": 0.0891,
+ "step": 17945
+ },
+ {
+ "epoch": 48.8991825613079,
+ "grad_norm": 5.396556854248047,
+ "learning_rate": 1.0841345360552356e-05,
+ "loss": 0.174,
+ "step": 17946
+ },
+ {
+ "epoch": 48.90190735694823,
+ "grad_norm": 4.59935998916626,
+ "learning_rate": 1.084046599161081e-05,
+ "loss": 0.0983,
+ "step": 17947
+ },
+ {
+ "epoch": 48.904632152588555,
+ "grad_norm": 5.52337121963501,
+ "learning_rate": 1.0839586616123743e-05,
+ "loss": 0.2061,
+ "step": 17948
+ },
+ {
+ "epoch": 48.90735694822888,
+ "grad_norm": 4.852114677429199,
+ "learning_rate": 1.0838707234098003e-05,
+ "loss": 0.1496,
+ "step": 17949
+ },
+ {
+ "epoch": 48.91008174386921,
+ "grad_norm": 5.507870197296143,
+ "learning_rate": 1.0837827845540438e-05,
+ "loss": 0.1866,
+ "step": 17950
+ },
+ {
+ "epoch": 48.91280653950954,
+ "grad_norm": 6.330488681793213,
+ "learning_rate": 1.0836948450457894e-05,
+ "loss": 0.1924,
+ "step": 17951
+ },
+ {
+ "epoch": 48.915531335149865,
+ "grad_norm": 4.366691589355469,
+ "learning_rate": 1.0836069048857228e-05,
+ "loss": 0.1955,
+ "step": 17952
+ },
+ {
+ "epoch": 48.91825613079019,
+ "grad_norm": 5.374604225158691,
+ "learning_rate": 1.0835189640745279e-05,
+ "loss": 0.1514,
+ "step": 17953
+ },
+ {
+ "epoch": 48.920980926430516,
+ "grad_norm": 4.547908306121826,
+ "learning_rate": 1.08343102261289e-05,
+ "loss": 0.2376,
+ "step": 17954
+ },
+ {
+ "epoch": 48.92370572207084,
+ "grad_norm": 4.376667022705078,
+ "learning_rate": 1.0833430805014942e-05,
+ "loss": 0.0857,
+ "step": 17955
+ },
+ {
+ "epoch": 48.926430517711175,
+ "grad_norm": 4.054291725158691,
+ "learning_rate": 1.0832551377410252e-05,
+ "loss": 0.2339,
+ "step": 17956
+ },
+ {
+ "epoch": 48.9291553133515,
+ "grad_norm": 8.085643768310547,
+ "learning_rate": 1.0831671943321675e-05,
+ "loss": 0.1084,
+ "step": 17957
+ },
+ {
+ "epoch": 48.93188010899183,
+ "grad_norm": 7.077549457550049,
+ "learning_rate": 1.0830792502756067e-05,
+ "loss": 0.1158,
+ "step": 17958
+ },
+ {
+ "epoch": 48.93460490463215,
+ "grad_norm": 4.296553611755371,
+ "learning_rate": 1.0829913055720268e-05,
+ "loss": 0.1128,
+ "step": 17959
+ },
+ {
+ "epoch": 48.93732970027248,
+ "grad_norm": 6.046850204467773,
+ "learning_rate": 1.082903360222114e-05,
+ "loss": 0.2121,
+ "step": 17960
+ },
+ {
+ "epoch": 48.940054495912804,
+ "grad_norm": 4.763850212097168,
+ "learning_rate": 1.0828154142265521e-05,
+ "loss": 0.2364,
+ "step": 17961
+ },
+ {
+ "epoch": 48.94277929155314,
+ "grad_norm": 4.865629196166992,
+ "learning_rate": 1.0827274675860266e-05,
+ "loss": 0.1177,
+ "step": 17962
+ },
+ {
+ "epoch": 48.94550408719346,
+ "grad_norm": 3.9033432006835938,
+ "learning_rate": 1.0826395203012223e-05,
+ "loss": 0.0955,
+ "step": 17963
+ },
+ {
+ "epoch": 48.94822888283379,
+ "grad_norm": 4.03185510635376,
+ "learning_rate": 1.0825515723728241e-05,
+ "loss": 0.1818,
+ "step": 17964
+ },
+ {
+ "epoch": 48.950953678474114,
+ "grad_norm": 6.728121757507324,
+ "learning_rate": 1.0824636238015167e-05,
+ "loss": 0.2241,
+ "step": 17965
+ },
+ {
+ "epoch": 48.95367847411444,
+ "grad_norm": 4.339187145233154,
+ "learning_rate": 1.0823756745879853e-05,
+ "loss": 0.1173,
+ "step": 17966
+ },
+ {
+ "epoch": 48.956403269754766,
+ "grad_norm": 4.03483247756958,
+ "learning_rate": 1.0822877247329148e-05,
+ "loss": 0.1961,
+ "step": 17967
+ },
+ {
+ "epoch": 48.95912806539509,
+ "grad_norm": 6.427977561950684,
+ "learning_rate": 1.0821997742369901e-05,
+ "loss": 0.1114,
+ "step": 17968
+ },
+ {
+ "epoch": 48.961852861035425,
+ "grad_norm": 5.688981533050537,
+ "learning_rate": 1.0821118231008963e-05,
+ "loss": 0.1795,
+ "step": 17969
+ },
+ {
+ "epoch": 48.96457765667575,
+ "grad_norm": 3.970400094985962,
+ "learning_rate": 1.0820238713253184e-05,
+ "loss": 0.0742,
+ "step": 17970
+ },
+ {
+ "epoch": 48.967302452316076,
+ "grad_norm": 4.422605991363525,
+ "learning_rate": 1.0819359189109409e-05,
+ "loss": 0.2069,
+ "step": 17971
+ },
+ {
+ "epoch": 48.9700272479564,
+ "grad_norm": 5.416562557220459,
+ "learning_rate": 1.0818479658584495e-05,
+ "loss": 0.1225,
+ "step": 17972
+ },
+ {
+ "epoch": 48.97275204359673,
+ "grad_norm": 4.591360092163086,
+ "learning_rate": 1.0817600121685283e-05,
+ "loss": 0.1456,
+ "step": 17973
+ },
+ {
+ "epoch": 48.97547683923706,
+ "grad_norm": 5.2208099365234375,
+ "learning_rate": 1.0816720578418634e-05,
+ "loss": 0.1883,
+ "step": 17974
+ },
+ {
+ "epoch": 48.97820163487739,
+ "grad_norm": 4.898530006408691,
+ "learning_rate": 1.0815841028791385e-05,
+ "loss": 0.117,
+ "step": 17975
+ },
+ {
+ "epoch": 48.98092643051771,
+ "grad_norm": 4.976808547973633,
+ "learning_rate": 1.0814961472810395e-05,
+ "loss": 0.1436,
+ "step": 17976
+ },
+ {
+ "epoch": 48.98365122615804,
+ "grad_norm": 5.774075508117676,
+ "learning_rate": 1.081408191048251e-05,
+ "loss": 0.1706,
+ "step": 17977
+ },
+ {
+ "epoch": 48.986376021798364,
+ "grad_norm": 6.600642681121826,
+ "learning_rate": 1.0813202341814583e-05,
+ "loss": 0.1776,
+ "step": 17978
+ },
+ {
+ "epoch": 48.98910081743869,
+ "grad_norm": 6.6657185554504395,
+ "learning_rate": 1.081232276681346e-05,
+ "loss": 0.2789,
+ "step": 17979
+ },
+ {
+ "epoch": 48.991825613079016,
+ "grad_norm": 3.7275452613830566,
+ "learning_rate": 1.0811443185485998e-05,
+ "loss": 0.12,
+ "step": 17980
+ },
+ {
+ "epoch": 48.99455040871935,
+ "grad_norm": 4.625736236572266,
+ "learning_rate": 1.0810563597839039e-05,
+ "loss": 0.2359,
+ "step": 17981
+ },
+ {
+ "epoch": 48.997275204359674,
+ "grad_norm": 4.443175792694092,
+ "learning_rate": 1.0809684003879438e-05,
+ "loss": 0.1874,
+ "step": 17982
+ },
+ {
+ "epoch": 49.0,
+ "grad_norm": 5.10296106338501,
+ "learning_rate": 1.0808804403614044e-05,
+ "loss": 0.1693,
+ "step": 17983
+ },
+ {
+ "epoch": 49.002724795640326,
+ "grad_norm": 4.369555950164795,
+ "learning_rate": 1.0807924797049707e-05,
+ "loss": 0.3171,
+ "step": 17984
+ },
+ {
+ "epoch": 49.00544959128065,
+ "grad_norm": 4.7278056144714355,
+ "learning_rate": 1.0807045184193274e-05,
+ "loss": 0.2289,
+ "step": 17985
+ },
+ {
+ "epoch": 49.00817438692098,
+ "grad_norm": 4.353641986846924,
+ "learning_rate": 1.0806165565051606e-05,
+ "loss": 0.1017,
+ "step": 17986
+ },
+ {
+ "epoch": 49.01089918256131,
+ "grad_norm": 4.177628517150879,
+ "learning_rate": 1.0805285939631543e-05,
+ "loss": 0.2429,
+ "step": 17987
+ },
+ {
+ "epoch": 49.013623978201636,
+ "grad_norm": 4.302578449249268,
+ "learning_rate": 1.0804406307939938e-05,
+ "loss": 0.2183,
+ "step": 17988
+ },
+ {
+ "epoch": 49.01634877384196,
+ "grad_norm": 4.035937786102295,
+ "learning_rate": 1.0803526669983644e-05,
+ "loss": 0.1412,
+ "step": 17989
+ },
+ {
+ "epoch": 49.01907356948229,
+ "grad_norm": 4.200725078582764,
+ "learning_rate": 1.0802647025769511e-05,
+ "loss": 0.2043,
+ "step": 17990
+ },
+ {
+ "epoch": 49.02179836512261,
+ "grad_norm": 5.639614582061768,
+ "learning_rate": 1.0801767375304388e-05,
+ "loss": 0.3566,
+ "step": 17991
+ },
+ {
+ "epoch": 49.02452316076294,
+ "grad_norm": 4.2248945236206055,
+ "learning_rate": 1.0800887718595127e-05,
+ "loss": 0.1866,
+ "step": 17992
+ },
+ {
+ "epoch": 49.02724795640327,
+ "grad_norm": 4.550290584564209,
+ "learning_rate": 1.0800008055648574e-05,
+ "loss": 0.1476,
+ "step": 17993
+ },
+ {
+ "epoch": 49.0299727520436,
+ "grad_norm": 5.263301849365234,
+ "learning_rate": 1.0799128386471589e-05,
+ "loss": 0.1947,
+ "step": 17994
+ },
+ {
+ "epoch": 49.032697547683924,
+ "grad_norm": 5.180984020233154,
+ "learning_rate": 1.0798248711071016e-05,
+ "loss": 0.2674,
+ "step": 17995
+ },
+ {
+ "epoch": 49.03542234332425,
+ "grad_norm": 5.652591228485107,
+ "learning_rate": 1.0797369029453708e-05,
+ "loss": 0.1565,
+ "step": 17996
+ },
+ {
+ "epoch": 49.038147138964575,
+ "grad_norm": 8.383416175842285,
+ "learning_rate": 1.0796489341626515e-05,
+ "loss": 0.1568,
+ "step": 17997
+ },
+ {
+ "epoch": 49.0408719346049,
+ "grad_norm": 4.705984592437744,
+ "learning_rate": 1.0795609647596292e-05,
+ "loss": 0.2035,
+ "step": 17998
+ },
+ {
+ "epoch": 49.043596730245234,
+ "grad_norm": 4.038379669189453,
+ "learning_rate": 1.0794729947369881e-05,
+ "loss": 0.1252,
+ "step": 17999
+ },
+ {
+ "epoch": 49.04632152588556,
+ "grad_norm": 3.832319974899292,
+ "learning_rate": 1.0793850240954145e-05,
+ "loss": 0.0876,
+ "step": 18000
+ },
+ {
+ "epoch": 49.049046321525886,
+ "grad_norm": 4.551717758178711,
+ "learning_rate": 1.0792970528355925e-05,
+ "loss": 0.2588,
+ "step": 18001
+ },
+ {
+ "epoch": 49.05177111716621,
+ "grad_norm": 5.047624111175537,
+ "learning_rate": 1.0792090809582077e-05,
+ "loss": 0.1498,
+ "step": 18002
+ },
+ {
+ "epoch": 49.05449591280654,
+ "grad_norm": 3.703632354736328,
+ "learning_rate": 1.0791211084639448e-05,
+ "loss": 0.073,
+ "step": 18003
+ },
+ {
+ "epoch": 49.05722070844686,
+ "grad_norm": 4.088559150695801,
+ "learning_rate": 1.0790331353534898e-05,
+ "loss": 0.1275,
+ "step": 18004
+ },
+ {
+ "epoch": 49.059945504087196,
+ "grad_norm": 4.196995258331299,
+ "learning_rate": 1.0789451616275268e-05,
+ "loss": 0.1185,
+ "step": 18005
+ },
+ {
+ "epoch": 49.06267029972752,
+ "grad_norm": 4.991589546203613,
+ "learning_rate": 1.078857187286742e-05,
+ "loss": 0.1148,
+ "step": 18006
+ },
+ {
+ "epoch": 49.06539509536785,
+ "grad_norm": 4.610150337219238,
+ "learning_rate": 1.0787692123318193e-05,
+ "loss": 0.1873,
+ "step": 18007
+ },
+ {
+ "epoch": 49.06811989100817,
+ "grad_norm": 3.9155521392822266,
+ "learning_rate": 1.0786812367634452e-05,
+ "loss": 0.0902,
+ "step": 18008
+ },
+ {
+ "epoch": 49.0708446866485,
+ "grad_norm": 5.252546310424805,
+ "learning_rate": 1.0785932605823035e-05,
+ "loss": 0.1207,
+ "step": 18009
+ },
+ {
+ "epoch": 49.073569482288825,
+ "grad_norm": 8.474834442138672,
+ "learning_rate": 1.0785052837890805e-05,
+ "loss": 0.1332,
+ "step": 18010
+ },
+ {
+ "epoch": 49.07629427792916,
+ "grad_norm": 5.846328258514404,
+ "learning_rate": 1.0784173063844606e-05,
+ "loss": 0.2301,
+ "step": 18011
+ },
+ {
+ "epoch": 49.079019073569484,
+ "grad_norm": 5.642576217651367,
+ "learning_rate": 1.0783293283691292e-05,
+ "loss": 0.1465,
+ "step": 18012
+ },
+ {
+ "epoch": 49.08174386920981,
+ "grad_norm": 3.442023992538452,
+ "learning_rate": 1.0782413497437716e-05,
+ "loss": 0.1454,
+ "step": 18013
+ },
+ {
+ "epoch": 49.084468664850135,
+ "grad_norm": 3.6676108837127686,
+ "learning_rate": 1.078153370509073e-05,
+ "loss": 0.0996,
+ "step": 18014
+ },
+ {
+ "epoch": 49.08719346049046,
+ "grad_norm": 3.262950897216797,
+ "learning_rate": 1.0780653906657183e-05,
+ "loss": 0.0632,
+ "step": 18015
+ },
+ {
+ "epoch": 49.08991825613079,
+ "grad_norm": 7.376670837402344,
+ "learning_rate": 1.0779774102143932e-05,
+ "loss": 0.1095,
+ "step": 18016
+ },
+ {
+ "epoch": 49.09264305177112,
+ "grad_norm": 4.342564582824707,
+ "learning_rate": 1.0778894291557822e-05,
+ "loss": 0.1534,
+ "step": 18017
+ },
+ {
+ "epoch": 49.095367847411445,
+ "grad_norm": 3.993922233581543,
+ "learning_rate": 1.077801447490571e-05,
+ "loss": 0.0923,
+ "step": 18018
+ },
+ {
+ "epoch": 49.09809264305177,
+ "grad_norm": 4.462991714477539,
+ "learning_rate": 1.0777134652194444e-05,
+ "loss": 0.1785,
+ "step": 18019
+ },
+ {
+ "epoch": 49.1008174386921,
+ "grad_norm": 3.691136360168457,
+ "learning_rate": 1.077625482343088e-05,
+ "loss": 0.1676,
+ "step": 18020
+ },
+ {
+ "epoch": 49.10354223433242,
+ "grad_norm": 4.868034839630127,
+ "learning_rate": 1.077537498862187e-05,
+ "loss": 0.2172,
+ "step": 18021
+ },
+ {
+ "epoch": 49.10626702997275,
+ "grad_norm": 4.317085266113281,
+ "learning_rate": 1.077449514777426e-05,
+ "loss": 0.107,
+ "step": 18022
+ },
+ {
+ "epoch": 49.10899182561308,
+ "grad_norm": 4.479748725891113,
+ "learning_rate": 1.0773615300894908e-05,
+ "loss": 0.2292,
+ "step": 18023
+ },
+ {
+ "epoch": 49.11171662125341,
+ "grad_norm": 4.770779609680176,
+ "learning_rate": 1.0772735447990669e-05,
+ "loss": 0.0942,
+ "step": 18024
+ },
+ {
+ "epoch": 49.11444141689373,
+ "grad_norm": 4.341066837310791,
+ "learning_rate": 1.0771855589068387e-05,
+ "loss": 0.152,
+ "step": 18025
+ },
+ {
+ "epoch": 49.11716621253406,
+ "grad_norm": 4.202481269836426,
+ "learning_rate": 1.0770975724134922e-05,
+ "loss": 0.137,
+ "step": 18026
+ },
+ {
+ "epoch": 49.119891008174385,
+ "grad_norm": 4.304060935974121,
+ "learning_rate": 1.077009585319712e-05,
+ "loss": 0.0935,
+ "step": 18027
+ },
+ {
+ "epoch": 49.12261580381471,
+ "grad_norm": 4.502399444580078,
+ "learning_rate": 1.0769215976261838e-05,
+ "loss": 0.157,
+ "step": 18028
+ },
+ {
+ "epoch": 49.12534059945504,
+ "grad_norm": 3.793384313583374,
+ "learning_rate": 1.0768336093335928e-05,
+ "loss": 0.0881,
+ "step": 18029
+ },
+ {
+ "epoch": 49.12806539509537,
+ "grad_norm": 5.380351543426514,
+ "learning_rate": 1.0767456204426236e-05,
+ "loss": 0.1699,
+ "step": 18030
+ },
+ {
+ "epoch": 49.130790190735695,
+ "grad_norm": 3.9379515647888184,
+ "learning_rate": 1.0766576309539624e-05,
+ "loss": 0.086,
+ "step": 18031
+ },
+ {
+ "epoch": 49.13351498637602,
+ "grad_norm": 4.494139194488525,
+ "learning_rate": 1.076569640868294e-05,
+ "loss": 0.1696,
+ "step": 18032
+ },
+ {
+ "epoch": 49.13623978201635,
+ "grad_norm": 4.4707932472229,
+ "learning_rate": 1.0764816501863038e-05,
+ "loss": 0.1769,
+ "step": 18033
+ },
+ {
+ "epoch": 49.13896457765667,
+ "grad_norm": 3.2799689769744873,
+ "learning_rate": 1.0763936589086765e-05,
+ "loss": 0.1579,
+ "step": 18034
+ },
+ {
+ "epoch": 49.141689373297005,
+ "grad_norm": 4.310459136962891,
+ "learning_rate": 1.0763056670360983e-05,
+ "loss": 0.1066,
+ "step": 18035
+ },
+ {
+ "epoch": 49.14441416893733,
+ "grad_norm": 7.240693092346191,
+ "learning_rate": 1.0762176745692536e-05,
+ "loss": 0.2024,
+ "step": 18036
+ },
+ {
+ "epoch": 49.14713896457766,
+ "grad_norm": 5.299901485443115,
+ "learning_rate": 1.0761296815088286e-05,
+ "loss": 0.2777,
+ "step": 18037
+ },
+ {
+ "epoch": 49.14986376021798,
+ "grad_norm": 5.850484371185303,
+ "learning_rate": 1.0760416878555078e-05,
+ "loss": 0.2594,
+ "step": 18038
+ },
+ {
+ "epoch": 49.15258855585831,
+ "grad_norm": 4.424598693847656,
+ "learning_rate": 1.075953693609977e-05,
+ "loss": 0.1136,
+ "step": 18039
+ },
+ {
+ "epoch": 49.155313351498634,
+ "grad_norm": 4.08601188659668,
+ "learning_rate": 1.075865698772921e-05,
+ "loss": 0.2056,
+ "step": 18040
+ },
+ {
+ "epoch": 49.15803814713897,
+ "grad_norm": 5.298847675323486,
+ "learning_rate": 1.0757777033450257e-05,
+ "loss": 0.1508,
+ "step": 18041
+ },
+ {
+ "epoch": 49.16076294277929,
+ "grad_norm": 3.9473395347595215,
+ "learning_rate": 1.0756897073269758e-05,
+ "loss": 0.0882,
+ "step": 18042
+ },
+ {
+ "epoch": 49.16348773841962,
+ "grad_norm": 3.3817026615142822,
+ "learning_rate": 1.0756017107194569e-05,
+ "loss": 0.0952,
+ "step": 18043
+ },
+ {
+ "epoch": 49.166212534059945,
+ "grad_norm": 4.317387104034424,
+ "learning_rate": 1.0755137135231544e-05,
+ "loss": 0.2264,
+ "step": 18044
+ },
+ {
+ "epoch": 49.16893732970027,
+ "grad_norm": 5.175841331481934,
+ "learning_rate": 1.0754257157387536e-05,
+ "loss": 0.3095,
+ "step": 18045
+ },
+ {
+ "epoch": 49.171662125340596,
+ "grad_norm": 5.526827335357666,
+ "learning_rate": 1.0753377173669394e-05,
+ "loss": 0.1276,
+ "step": 18046
+ },
+ {
+ "epoch": 49.17438692098093,
+ "grad_norm": 5.604735851287842,
+ "learning_rate": 1.075249718408398e-05,
+ "loss": 0.197,
+ "step": 18047
+ },
+ {
+ "epoch": 49.177111716621255,
+ "grad_norm": 4.368131160736084,
+ "learning_rate": 1.075161718863814e-05,
+ "loss": 0.1844,
+ "step": 18048
+ },
+ {
+ "epoch": 49.17983651226158,
+ "grad_norm": 4.580317974090576,
+ "learning_rate": 1.0750737187338729e-05,
+ "loss": 0.1741,
+ "step": 18049
+ },
+ {
+ "epoch": 49.182561307901906,
+ "grad_norm": 4.791848659515381,
+ "learning_rate": 1.0749857180192603e-05,
+ "loss": 0.1884,
+ "step": 18050
+ },
+ {
+ "epoch": 49.18528610354223,
+ "grad_norm": 4.375580310821533,
+ "learning_rate": 1.0748977167206611e-05,
+ "loss": 0.1462,
+ "step": 18051
+ },
+ {
+ "epoch": 49.18801089918256,
+ "grad_norm": 3.8808562755584717,
+ "learning_rate": 1.0748097148387609e-05,
+ "loss": 0.1322,
+ "step": 18052
+ },
+ {
+ "epoch": 49.19073569482289,
+ "grad_norm": 4.329455375671387,
+ "learning_rate": 1.0747217123742453e-05,
+ "loss": 0.1538,
+ "step": 18053
+ },
+ {
+ "epoch": 49.19346049046322,
+ "grad_norm": 7.597806930541992,
+ "learning_rate": 1.0746337093277987e-05,
+ "loss": 0.3893,
+ "step": 18054
+ },
+ {
+ "epoch": 49.19618528610354,
+ "grad_norm": 5.23726749420166,
+ "learning_rate": 1.0745457057001079e-05,
+ "loss": 0.0787,
+ "step": 18055
+ },
+ {
+ "epoch": 49.19891008174387,
+ "grad_norm": 4.245670795440674,
+ "learning_rate": 1.0744577014918574e-05,
+ "loss": 0.2025,
+ "step": 18056
+ },
+ {
+ "epoch": 49.201634877384194,
+ "grad_norm": 4.973139762878418,
+ "learning_rate": 1.0743696967037327e-05,
+ "loss": 0.2124,
+ "step": 18057
+ },
+ {
+ "epoch": 49.20435967302452,
+ "grad_norm": 5.1174187660217285,
+ "learning_rate": 1.074281691336419e-05,
+ "loss": 0.2098,
+ "step": 18058
+ },
+ {
+ "epoch": 49.20708446866485,
+ "grad_norm": 4.663021564483643,
+ "learning_rate": 1.0741936853906023e-05,
+ "loss": 0.1087,
+ "step": 18059
+ },
+ {
+ "epoch": 49.20980926430518,
+ "grad_norm": 3.7342076301574707,
+ "learning_rate": 1.0741056788669671e-05,
+ "loss": 0.2342,
+ "step": 18060
+ },
+ {
+ "epoch": 49.212534059945504,
+ "grad_norm": 4.790356159210205,
+ "learning_rate": 1.0740176717661997e-05,
+ "loss": 0.1091,
+ "step": 18061
+ },
+ {
+ "epoch": 49.21525885558583,
+ "grad_norm": 5.599277496337891,
+ "learning_rate": 1.0739296640889844e-05,
+ "loss": 0.222,
+ "step": 18062
+ },
+ {
+ "epoch": 49.217983651226156,
+ "grad_norm": 4.795881271362305,
+ "learning_rate": 1.073841655836008e-05,
+ "loss": 0.302,
+ "step": 18063
+ },
+ {
+ "epoch": 49.22070844686648,
+ "grad_norm": 4.898931980133057,
+ "learning_rate": 1.0737536470079545e-05,
+ "loss": 0.2092,
+ "step": 18064
+ },
+ {
+ "epoch": 49.223433242506815,
+ "grad_norm": 4.329406261444092,
+ "learning_rate": 1.0736656376055106e-05,
+ "loss": 0.0806,
+ "step": 18065
+ },
+ {
+ "epoch": 49.22615803814714,
+ "grad_norm": 4.139956474304199,
+ "learning_rate": 1.0735776276293605e-05,
+ "loss": 0.2472,
+ "step": 18066
+ },
+ {
+ "epoch": 49.228882833787466,
+ "grad_norm": 7.229269027709961,
+ "learning_rate": 1.0734896170801907e-05,
+ "loss": 0.1951,
+ "step": 18067
+ },
+ {
+ "epoch": 49.23160762942779,
+ "grad_norm": 3.936602830886841,
+ "learning_rate": 1.0734016059586858e-05,
+ "loss": 0.0831,
+ "step": 18068
+ },
+ {
+ "epoch": 49.23433242506812,
+ "grad_norm": 5.162415504455566,
+ "learning_rate": 1.0733135942655318e-05,
+ "loss": 0.2105,
+ "step": 18069
+ },
+ {
+ "epoch": 49.237057220708444,
+ "grad_norm": 5.241152286529541,
+ "learning_rate": 1.0732255820014137e-05,
+ "loss": 0.1564,
+ "step": 18070
+ },
+ {
+ "epoch": 49.23978201634878,
+ "grad_norm": 3.9510488510131836,
+ "learning_rate": 1.073137569167017e-05,
+ "loss": 0.3114,
+ "step": 18071
+ },
+ {
+ "epoch": 49.2425068119891,
+ "grad_norm": 4.706510543823242,
+ "learning_rate": 1.0730495557630275e-05,
+ "loss": 0.0815,
+ "step": 18072
+ },
+ {
+ "epoch": 49.24523160762943,
+ "grad_norm": 5.237221717834473,
+ "learning_rate": 1.0729615417901305e-05,
+ "loss": 0.3302,
+ "step": 18073
+ },
+ {
+ "epoch": 49.247956403269754,
+ "grad_norm": 4.733431339263916,
+ "learning_rate": 1.072873527249011e-05,
+ "loss": 0.2856,
+ "step": 18074
+ },
+ {
+ "epoch": 49.25068119891008,
+ "grad_norm": 6.3101043701171875,
+ "learning_rate": 1.0727855121403551e-05,
+ "loss": 0.165,
+ "step": 18075
+ },
+ {
+ "epoch": 49.253405994550405,
+ "grad_norm": 3.8238027095794678,
+ "learning_rate": 1.0726974964648478e-05,
+ "loss": 0.1038,
+ "step": 18076
+ },
+ {
+ "epoch": 49.25613079019074,
+ "grad_norm": 6.8419084548950195,
+ "learning_rate": 1.072609480223175e-05,
+ "loss": 0.1189,
+ "step": 18077
+ },
+ {
+ "epoch": 49.258855585831064,
+ "grad_norm": 4.807248592376709,
+ "learning_rate": 1.0725214634160217e-05,
+ "loss": 0.099,
+ "step": 18078
+ },
+ {
+ "epoch": 49.26158038147139,
+ "grad_norm": 3.048029661178589,
+ "learning_rate": 1.0724334460440735e-05,
+ "loss": 0.1367,
+ "step": 18079
+ },
+ {
+ "epoch": 49.264305177111716,
+ "grad_norm": 4.009759426116943,
+ "learning_rate": 1.0723454281080161e-05,
+ "loss": 0.1014,
+ "step": 18080
+ },
+ {
+ "epoch": 49.26702997275204,
+ "grad_norm": 6.9584126472473145,
+ "learning_rate": 1.072257409608535e-05,
+ "loss": 0.1801,
+ "step": 18081
+ },
+ {
+ "epoch": 49.26975476839237,
+ "grad_norm": 3.863007068634033,
+ "learning_rate": 1.072169390546315e-05,
+ "loss": 0.0648,
+ "step": 18082
+ },
+ {
+ "epoch": 49.2724795640327,
+ "grad_norm": 8.388815879821777,
+ "learning_rate": 1.0720813709220427e-05,
+ "loss": 0.1313,
+ "step": 18083
+ },
+ {
+ "epoch": 49.275204359673026,
+ "grad_norm": 4.568418502807617,
+ "learning_rate": 1.0719933507364027e-05,
+ "loss": 0.145,
+ "step": 18084
+ },
+ {
+ "epoch": 49.27792915531335,
+ "grad_norm": 3.9196252822875977,
+ "learning_rate": 1.071905329990081e-05,
+ "loss": 0.1087,
+ "step": 18085
+ },
+ {
+ "epoch": 49.28065395095368,
+ "grad_norm": 4.317632675170898,
+ "learning_rate": 1.0718173086837626e-05,
+ "loss": 0.1917,
+ "step": 18086
+ },
+ {
+ "epoch": 49.283378746594,
+ "grad_norm": 6.338841915130615,
+ "learning_rate": 1.0717292868181335e-05,
+ "loss": 0.1705,
+ "step": 18087
+ },
+ {
+ "epoch": 49.28610354223433,
+ "grad_norm": 4.756075859069824,
+ "learning_rate": 1.0716412643938788e-05,
+ "loss": 0.396,
+ "step": 18088
+ },
+ {
+ "epoch": 49.28882833787466,
+ "grad_norm": 4.442616939544678,
+ "learning_rate": 1.0715532414116844e-05,
+ "loss": 0.1386,
+ "step": 18089
+ },
+ {
+ "epoch": 49.29155313351499,
+ "grad_norm": 4.1272783279418945,
+ "learning_rate": 1.0714652178722357e-05,
+ "loss": 0.0948,
+ "step": 18090
+ },
+ {
+ "epoch": 49.294277929155314,
+ "grad_norm": 4.293083667755127,
+ "learning_rate": 1.0713771937762183e-05,
+ "loss": 0.0735,
+ "step": 18091
+ },
+ {
+ "epoch": 49.29700272479564,
+ "grad_norm": 6.48081636428833,
+ "learning_rate": 1.0712891691243174e-05,
+ "loss": 0.148,
+ "step": 18092
+ },
+ {
+ "epoch": 49.299727520435965,
+ "grad_norm": 5.072357177734375,
+ "learning_rate": 1.0712011439172189e-05,
+ "loss": 0.2161,
+ "step": 18093
+ },
+ {
+ "epoch": 49.30245231607629,
+ "grad_norm": 5.972768783569336,
+ "learning_rate": 1.071113118155608e-05,
+ "loss": 0.2425,
+ "step": 18094
+ },
+ {
+ "epoch": 49.305177111716624,
+ "grad_norm": 4.665791034698486,
+ "learning_rate": 1.0710250918401709e-05,
+ "loss": 0.1129,
+ "step": 18095
+ },
+ {
+ "epoch": 49.30790190735695,
+ "grad_norm": 5.621108531951904,
+ "learning_rate": 1.070937064971592e-05,
+ "loss": 0.1445,
+ "step": 18096
+ },
+ {
+ "epoch": 49.310626702997276,
+ "grad_norm": 5.065195560455322,
+ "learning_rate": 1.0708490375505577e-05,
+ "loss": 0.1042,
+ "step": 18097
+ },
+ {
+ "epoch": 49.3133514986376,
+ "grad_norm": 5.798933506011963,
+ "learning_rate": 1.0707610095777534e-05,
+ "loss": 0.1124,
+ "step": 18098
+ },
+ {
+ "epoch": 49.31607629427793,
+ "grad_norm": 3.935114622116089,
+ "learning_rate": 1.070672981053865e-05,
+ "loss": 0.1385,
+ "step": 18099
+ },
+ {
+ "epoch": 49.31880108991825,
+ "grad_norm": 4.582058906555176,
+ "learning_rate": 1.0705849519795772e-05,
+ "loss": 0.1604,
+ "step": 18100
+ },
+ {
+ "epoch": 49.321525885558586,
+ "grad_norm": 4.798512935638428,
+ "learning_rate": 1.0704969223555766e-05,
+ "loss": 0.0866,
+ "step": 18101
+ },
+ {
+ "epoch": 49.32425068119891,
+ "grad_norm": 3.550732135772705,
+ "learning_rate": 1.0704088921825477e-05,
+ "loss": 0.0992,
+ "step": 18102
+ },
+ {
+ "epoch": 49.32697547683924,
+ "grad_norm": 3.969743490219116,
+ "learning_rate": 1.0703208614611772e-05,
+ "loss": 0.127,
+ "step": 18103
+ },
+ {
+ "epoch": 49.32970027247956,
+ "grad_norm": 5.467886924743652,
+ "learning_rate": 1.0702328301921495e-05,
+ "loss": 0.1953,
+ "step": 18104
+ },
+ {
+ "epoch": 49.33242506811989,
+ "grad_norm": 4.552988052368164,
+ "learning_rate": 1.0701447983761508e-05,
+ "loss": 0.2266,
+ "step": 18105
+ },
+ {
+ "epoch": 49.335149863760215,
+ "grad_norm": 4.883590221405029,
+ "learning_rate": 1.0700567660138672e-05,
+ "loss": 0.1233,
+ "step": 18106
+ },
+ {
+ "epoch": 49.33787465940055,
+ "grad_norm": 7.797180652618408,
+ "learning_rate": 1.0699687331059834e-05,
+ "loss": 0.234,
+ "step": 18107
+ },
+ {
+ "epoch": 49.34059945504087,
+ "grad_norm": 4.586651802062988,
+ "learning_rate": 1.0698806996531855e-05,
+ "loss": 0.1167,
+ "step": 18108
+ },
+ {
+ "epoch": 49.3433242506812,
+ "grad_norm": 4.137990474700928,
+ "learning_rate": 1.0697926656561588e-05,
+ "loss": 0.2158,
+ "step": 18109
+ },
+ {
+ "epoch": 49.346049046321525,
+ "grad_norm": 4.418461322784424,
+ "learning_rate": 1.069704631115589e-05,
+ "loss": 0.1901,
+ "step": 18110
+ },
+ {
+ "epoch": 49.34877384196185,
+ "grad_norm": 5.157928943634033,
+ "learning_rate": 1.069616596032162e-05,
+ "loss": 0.2292,
+ "step": 18111
+ },
+ {
+ "epoch": 49.35149863760218,
+ "grad_norm": 3.745630979537964,
+ "learning_rate": 1.069528560406563e-05,
+ "loss": 0.2967,
+ "step": 18112
+ },
+ {
+ "epoch": 49.35422343324251,
+ "grad_norm": 9.908339500427246,
+ "learning_rate": 1.069440524239478e-05,
+ "loss": 0.1697,
+ "step": 18113
+ },
+ {
+ "epoch": 49.356948228882835,
+ "grad_norm": 4.503567218780518,
+ "learning_rate": 1.0693524875315924e-05,
+ "loss": 0.1747,
+ "step": 18114
+ },
+ {
+ "epoch": 49.35967302452316,
+ "grad_norm": 4.296820163726807,
+ "learning_rate": 1.0692644502835915e-05,
+ "loss": 0.0885,
+ "step": 18115
+ },
+ {
+ "epoch": 49.36239782016349,
+ "grad_norm": 3.2776989936828613,
+ "learning_rate": 1.0691764124961618e-05,
+ "loss": 0.2318,
+ "step": 18116
+ },
+ {
+ "epoch": 49.36512261580381,
+ "grad_norm": 5.114651679992676,
+ "learning_rate": 1.0690883741699882e-05,
+ "loss": 0.2653,
+ "step": 18117
+ },
+ {
+ "epoch": 49.36784741144414,
+ "grad_norm": 8.092615127563477,
+ "learning_rate": 1.0690003353057567e-05,
+ "loss": 0.0964,
+ "step": 18118
+ },
+ {
+ "epoch": 49.37057220708447,
+ "grad_norm": 4.071983337402344,
+ "learning_rate": 1.0689122959041524e-05,
+ "loss": 0.3459,
+ "step": 18119
+ },
+ {
+ "epoch": 49.3732970027248,
+ "grad_norm": 4.370309829711914,
+ "learning_rate": 1.068824255965862e-05,
+ "loss": 0.2297,
+ "step": 18120
+ },
+ {
+ "epoch": 49.37602179836512,
+ "grad_norm": 4.2969207763671875,
+ "learning_rate": 1.0687362154915699e-05,
+ "loss": 0.1268,
+ "step": 18121
+ },
+ {
+ "epoch": 49.37874659400545,
+ "grad_norm": 4.603678226470947,
+ "learning_rate": 1.0686481744819626e-05,
+ "loss": 0.1205,
+ "step": 18122
+ },
+ {
+ "epoch": 49.381471389645775,
+ "grad_norm": 4.215365886688232,
+ "learning_rate": 1.0685601329377255e-05,
+ "loss": 0.2,
+ "step": 18123
+ },
+ {
+ "epoch": 49.3841961852861,
+ "grad_norm": 4.711794376373291,
+ "learning_rate": 1.0684720908595445e-05,
+ "loss": 0.2561,
+ "step": 18124
+ },
+ {
+ "epoch": 49.38692098092643,
+ "grad_norm": 4.6763691902160645,
+ "learning_rate": 1.0683840482481046e-05,
+ "loss": 0.184,
+ "step": 18125
+ },
+ {
+ "epoch": 49.38964577656676,
+ "grad_norm": 5.492859840393066,
+ "learning_rate": 1.0682960051040924e-05,
+ "loss": 0.143,
+ "step": 18126
+ },
+ {
+ "epoch": 49.392370572207085,
+ "grad_norm": 5.027314186096191,
+ "learning_rate": 1.068207961428193e-05,
+ "loss": 0.1715,
+ "step": 18127
+ },
+ {
+ "epoch": 49.39509536784741,
+ "grad_norm": 3.5511410236358643,
+ "learning_rate": 1.0681199172210923e-05,
+ "loss": 0.106,
+ "step": 18128
+ },
+ {
+ "epoch": 49.39782016348774,
+ "grad_norm": 5.608665466308594,
+ "learning_rate": 1.0680318724834758e-05,
+ "loss": 0.2715,
+ "step": 18129
+ },
+ {
+ "epoch": 49.40054495912806,
+ "grad_norm": 5.252490997314453,
+ "learning_rate": 1.0679438272160292e-05,
+ "loss": 0.1136,
+ "step": 18130
+ },
+ {
+ "epoch": 49.403269754768395,
+ "grad_norm": 16.229663848876953,
+ "learning_rate": 1.067855781419438e-05,
+ "loss": 0.251,
+ "step": 18131
+ },
+ {
+ "epoch": 49.40599455040872,
+ "grad_norm": 4.906930446624756,
+ "learning_rate": 1.0677677350943885e-05,
+ "loss": 0.1255,
+ "step": 18132
+ },
+ {
+ "epoch": 49.40871934604905,
+ "grad_norm": 4.8139777183532715,
+ "learning_rate": 1.0676796882415658e-05,
+ "loss": 0.0892,
+ "step": 18133
+ },
+ {
+ "epoch": 49.41144414168937,
+ "grad_norm": 4.291130065917969,
+ "learning_rate": 1.0675916408616562e-05,
+ "loss": 0.1425,
+ "step": 18134
+ },
+ {
+ "epoch": 49.4141689373297,
+ "grad_norm": 5.100659370422363,
+ "learning_rate": 1.0675035929553448e-05,
+ "loss": 0.1028,
+ "step": 18135
+ },
+ {
+ "epoch": 49.416893732970024,
+ "grad_norm": 6.584331035614014,
+ "learning_rate": 1.0674155445233179e-05,
+ "loss": 0.1488,
+ "step": 18136
+ },
+ {
+ "epoch": 49.41961852861036,
+ "grad_norm": 6.058783531188965,
+ "learning_rate": 1.0673274955662604e-05,
+ "loss": 0.1697,
+ "step": 18137
+ },
+ {
+ "epoch": 49.42234332425068,
+ "grad_norm": 4.610739231109619,
+ "learning_rate": 1.067239446084859e-05,
+ "loss": 0.2024,
+ "step": 18138
+ },
+ {
+ "epoch": 49.42506811989101,
+ "grad_norm": 5.838510036468506,
+ "learning_rate": 1.0671513960797988e-05,
+ "loss": 0.1562,
+ "step": 18139
+ },
+ {
+ "epoch": 49.427792915531334,
+ "grad_norm": 3.6795663833618164,
+ "learning_rate": 1.0670633455517656e-05,
+ "loss": 0.1504,
+ "step": 18140
+ },
+ {
+ "epoch": 49.43051771117166,
+ "grad_norm": 3.164093255996704,
+ "learning_rate": 1.0669752945014452e-05,
+ "loss": 0.0783,
+ "step": 18141
+ },
+ {
+ "epoch": 49.433242506811986,
+ "grad_norm": 4.077607154846191,
+ "learning_rate": 1.0668872429295236e-05,
+ "loss": 0.1422,
+ "step": 18142
+ },
+ {
+ "epoch": 49.43596730245232,
+ "grad_norm": 3.4083364009857178,
+ "learning_rate": 1.0667991908366861e-05,
+ "loss": 0.0929,
+ "step": 18143
+ },
+ {
+ "epoch": 49.438692098092645,
+ "grad_norm": 3.873018980026245,
+ "learning_rate": 1.0667111382236187e-05,
+ "loss": 0.1183,
+ "step": 18144
+ },
+ {
+ "epoch": 49.44141689373297,
+ "grad_norm": 4.201215744018555,
+ "learning_rate": 1.0666230850910071e-05,
+ "loss": 0.1714,
+ "step": 18145
+ },
+ {
+ "epoch": 49.444141689373296,
+ "grad_norm": 4.790209770202637,
+ "learning_rate": 1.0665350314395373e-05,
+ "loss": 0.1645,
+ "step": 18146
+ },
+ {
+ "epoch": 49.44686648501362,
+ "grad_norm": 4.523641586303711,
+ "learning_rate": 1.0664469772698945e-05,
+ "loss": 0.0816,
+ "step": 18147
+ },
+ {
+ "epoch": 49.44959128065395,
+ "grad_norm": 5.0345258712768555,
+ "learning_rate": 1.0663589225827648e-05,
+ "loss": 0.1731,
+ "step": 18148
+ },
+ {
+ "epoch": 49.45231607629428,
+ "grad_norm": 3.8730554580688477,
+ "learning_rate": 1.066270867378834e-05,
+ "loss": 0.1498,
+ "step": 18149
+ },
+ {
+ "epoch": 49.45504087193461,
+ "grad_norm": 4.271957874298096,
+ "learning_rate": 1.0661828116587878e-05,
+ "loss": 0.1517,
+ "step": 18150
+ },
+ {
+ "epoch": 49.45776566757493,
+ "grad_norm": 8.417770385742188,
+ "learning_rate": 1.066094755423312e-05,
+ "loss": 0.0968,
+ "step": 18151
+ },
+ {
+ "epoch": 49.46049046321526,
+ "grad_norm": 4.589767932891846,
+ "learning_rate": 1.0660066986730925e-05,
+ "loss": 0.2009,
+ "step": 18152
+ },
+ {
+ "epoch": 49.463215258855584,
+ "grad_norm": 5.2906413078308105,
+ "learning_rate": 1.0659186414088148e-05,
+ "loss": 0.1702,
+ "step": 18153
+ },
+ {
+ "epoch": 49.46594005449591,
+ "grad_norm": 5.601592063903809,
+ "learning_rate": 1.0658305836311651e-05,
+ "loss": 0.1856,
+ "step": 18154
+ },
+ {
+ "epoch": 49.46866485013624,
+ "grad_norm": 6.945178031921387,
+ "learning_rate": 1.0657425253408287e-05,
+ "loss": 0.2302,
+ "step": 18155
+ },
+ {
+ "epoch": 49.47138964577657,
+ "grad_norm": 4.493739128112793,
+ "learning_rate": 1.0656544665384918e-05,
+ "loss": 0.0931,
+ "step": 18156
+ },
+ {
+ "epoch": 49.474114441416894,
+ "grad_norm": 7.880306720733643,
+ "learning_rate": 1.0655664072248395e-05,
+ "loss": 0.0797,
+ "step": 18157
+ },
+ {
+ "epoch": 49.47683923705722,
+ "grad_norm": 4.8007707595825195,
+ "learning_rate": 1.0654783474005587e-05,
+ "loss": 0.1721,
+ "step": 18158
+ },
+ {
+ "epoch": 49.479564032697546,
+ "grad_norm": 6.430230617523193,
+ "learning_rate": 1.0653902870663344e-05,
+ "loss": 0.0995,
+ "step": 18159
+ },
+ {
+ "epoch": 49.48228882833787,
+ "grad_norm": 4.005404472351074,
+ "learning_rate": 1.0653022262228527e-05,
+ "loss": 0.2804,
+ "step": 18160
+ },
+ {
+ "epoch": 49.485013623978205,
+ "grad_norm": 6.052149772644043,
+ "learning_rate": 1.0652141648707994e-05,
+ "loss": 0.2013,
+ "step": 18161
+ },
+ {
+ "epoch": 49.48773841961853,
+ "grad_norm": 4.363229751586914,
+ "learning_rate": 1.0651261030108603e-05,
+ "loss": 0.1064,
+ "step": 18162
+ },
+ {
+ "epoch": 49.490463215258856,
+ "grad_norm": 4.8147759437561035,
+ "learning_rate": 1.065038040643721e-05,
+ "loss": 0.1154,
+ "step": 18163
+ },
+ {
+ "epoch": 49.49318801089918,
+ "grad_norm": 6.709095478057861,
+ "learning_rate": 1.064949977770068e-05,
+ "loss": 0.2924,
+ "step": 18164
+ },
+ {
+ "epoch": 49.49591280653951,
+ "grad_norm": 4.5668840408325195,
+ "learning_rate": 1.064861914390586e-05,
+ "loss": 0.0771,
+ "step": 18165
+ },
+ {
+ "epoch": 49.49863760217983,
+ "grad_norm": 4.888486862182617,
+ "learning_rate": 1.064773850505962e-05,
+ "loss": 0.2727,
+ "step": 18166
+ },
+ {
+ "epoch": 49.50136239782017,
+ "grad_norm": 5.187841892242432,
+ "learning_rate": 1.0646857861168811e-05,
+ "loss": 0.2116,
+ "step": 18167
+ },
+ {
+ "epoch": 49.50408719346049,
+ "grad_norm": 4.599339485168457,
+ "learning_rate": 1.0645977212240297e-05,
+ "loss": 0.207,
+ "step": 18168
+ },
+ {
+ "epoch": 49.50681198910082,
+ "grad_norm": 4.81515645980835,
+ "learning_rate": 1.064509655828093e-05,
+ "loss": 0.2151,
+ "step": 18169
+ },
+ {
+ "epoch": 49.509536784741144,
+ "grad_norm": 4.856693744659424,
+ "learning_rate": 1.0644215899297574e-05,
+ "loss": 0.2136,
+ "step": 18170
+ },
+ {
+ "epoch": 49.51226158038147,
+ "grad_norm": 4.939047813415527,
+ "learning_rate": 1.0643335235297084e-05,
+ "loss": 0.0968,
+ "step": 18171
+ },
+ {
+ "epoch": 49.514986376021795,
+ "grad_norm": 6.327423095703125,
+ "learning_rate": 1.0642454566286319e-05,
+ "loss": 0.2723,
+ "step": 18172
+ },
+ {
+ "epoch": 49.51771117166213,
+ "grad_norm": 5.196204662322998,
+ "learning_rate": 1.064157389227214e-05,
+ "loss": 0.2142,
+ "step": 18173
+ },
+ {
+ "epoch": 49.520435967302454,
+ "grad_norm": 5.256061553955078,
+ "learning_rate": 1.0640693213261404e-05,
+ "loss": 0.1198,
+ "step": 18174
+ },
+ {
+ "epoch": 49.52316076294278,
+ "grad_norm": 3.857426404953003,
+ "learning_rate": 1.0639812529260967e-05,
+ "loss": 0.0641,
+ "step": 18175
+ },
+ {
+ "epoch": 49.525885558583106,
+ "grad_norm": 5.198551654815674,
+ "learning_rate": 1.0638931840277696e-05,
+ "loss": 0.1856,
+ "step": 18176
+ },
+ {
+ "epoch": 49.52861035422343,
+ "grad_norm": 4.237199306488037,
+ "learning_rate": 1.063805114631844e-05,
+ "loss": 0.166,
+ "step": 18177
+ },
+ {
+ "epoch": 49.53133514986376,
+ "grad_norm": 3.5271968841552734,
+ "learning_rate": 1.0637170447390063e-05,
+ "loss": 0.065,
+ "step": 18178
+ },
+ {
+ "epoch": 49.53405994550409,
+ "grad_norm": 3.8488316535949707,
+ "learning_rate": 1.0636289743499424e-05,
+ "loss": 0.1502,
+ "step": 18179
+ },
+ {
+ "epoch": 49.536784741144416,
+ "grad_norm": 12.370738983154297,
+ "learning_rate": 1.0635409034653383e-05,
+ "loss": 0.1002,
+ "step": 18180
+ },
+ {
+ "epoch": 49.53950953678474,
+ "grad_norm": 6.158624649047852,
+ "learning_rate": 1.0634528320858792e-05,
+ "loss": 0.1541,
+ "step": 18181
+ },
+ {
+ "epoch": 49.54223433242507,
+ "grad_norm": 4.370608806610107,
+ "learning_rate": 1.0633647602122521e-05,
+ "loss": 0.0896,
+ "step": 18182
+ },
+ {
+ "epoch": 49.54495912806539,
+ "grad_norm": 4.981345176696777,
+ "learning_rate": 1.0632766878451416e-05,
+ "loss": 0.2075,
+ "step": 18183
+ },
+ {
+ "epoch": 49.54768392370572,
+ "grad_norm": 8.145125389099121,
+ "learning_rate": 1.0631886149852347e-05,
+ "loss": 0.1988,
+ "step": 18184
+ },
+ {
+ "epoch": 49.55040871934605,
+ "grad_norm": 12.380273818969727,
+ "learning_rate": 1.0631005416332168e-05,
+ "loss": 0.1242,
+ "step": 18185
+ },
+ {
+ "epoch": 49.55313351498638,
+ "grad_norm": 4.580547332763672,
+ "learning_rate": 1.063012467789774e-05,
+ "loss": 0.2128,
+ "step": 18186
+ },
+ {
+ "epoch": 49.555858310626704,
+ "grad_norm": 6.241352558135986,
+ "learning_rate": 1.0629243934555919e-05,
+ "loss": 0.1936,
+ "step": 18187
+ },
+ {
+ "epoch": 49.55858310626703,
+ "grad_norm": 4.160164833068848,
+ "learning_rate": 1.062836318631357e-05,
+ "loss": 0.1873,
+ "step": 18188
+ },
+ {
+ "epoch": 49.561307901907355,
+ "grad_norm": 6.1277995109558105,
+ "learning_rate": 1.0627482433177547e-05,
+ "loss": 0.3317,
+ "step": 18189
+ },
+ {
+ "epoch": 49.56403269754768,
+ "grad_norm": 4.253282070159912,
+ "learning_rate": 1.0626601675154713e-05,
+ "loss": 0.1541,
+ "step": 18190
+ },
+ {
+ "epoch": 49.566757493188014,
+ "grad_norm": 4.2864766120910645,
+ "learning_rate": 1.0625720912251923e-05,
+ "loss": 0.1371,
+ "step": 18191
+ },
+ {
+ "epoch": 49.56948228882834,
+ "grad_norm": 9.15553092956543,
+ "learning_rate": 1.0624840144476036e-05,
+ "loss": 0.1497,
+ "step": 18192
+ },
+ {
+ "epoch": 49.572207084468666,
+ "grad_norm": 5.953794479370117,
+ "learning_rate": 1.0623959371833918e-05,
+ "loss": 0.1323,
+ "step": 18193
+ },
+ {
+ "epoch": 49.57493188010899,
+ "grad_norm": 6.5279459953308105,
+ "learning_rate": 1.0623078594332424e-05,
+ "loss": 0.1452,
+ "step": 18194
+ },
+ {
+ "epoch": 49.57765667574932,
+ "grad_norm": 9.369184494018555,
+ "learning_rate": 1.0622197811978414e-05,
+ "loss": 0.1026,
+ "step": 18195
+ },
+ {
+ "epoch": 49.58038147138964,
+ "grad_norm": 4.457242012023926,
+ "learning_rate": 1.0621317024778747e-05,
+ "loss": 0.2238,
+ "step": 18196
+ },
+ {
+ "epoch": 49.583106267029976,
+ "grad_norm": 8.569912910461426,
+ "learning_rate": 1.062043623274028e-05,
+ "loss": 0.1649,
+ "step": 18197
+ },
+ {
+ "epoch": 49.5858310626703,
+ "grad_norm": 4.9559736251831055,
+ "learning_rate": 1.0619555435869881e-05,
+ "loss": 0.0911,
+ "step": 18198
+ },
+ {
+ "epoch": 49.58855585831063,
+ "grad_norm": 4.798398017883301,
+ "learning_rate": 1.0618674634174402e-05,
+ "loss": 0.1421,
+ "step": 18199
+ },
+ {
+ "epoch": 49.59128065395095,
+ "grad_norm": 5.347679615020752,
+ "learning_rate": 1.0617793827660703e-05,
+ "loss": 0.1805,
+ "step": 18200
+ },
+ {
+ "epoch": 49.59400544959128,
+ "grad_norm": 3.8213841915130615,
+ "learning_rate": 1.0616913016335648e-05,
+ "loss": 0.0836,
+ "step": 18201
+ },
+ {
+ "epoch": 49.596730245231605,
+ "grad_norm": 5.150428295135498,
+ "learning_rate": 1.0616032200206094e-05,
+ "loss": 0.1916,
+ "step": 18202
+ },
+ {
+ "epoch": 49.59945504087194,
+ "grad_norm": 4.489078521728516,
+ "learning_rate": 1.0615151379278901e-05,
+ "loss": 0.1812,
+ "step": 18203
+ },
+ {
+ "epoch": 49.60217983651226,
+ "grad_norm": 4.463815689086914,
+ "learning_rate": 1.0614270553560928e-05,
+ "loss": 0.0996,
+ "step": 18204
+ },
+ {
+ "epoch": 49.60490463215259,
+ "grad_norm": 9.333776473999023,
+ "learning_rate": 1.0613389723059037e-05,
+ "loss": 0.1649,
+ "step": 18205
+ },
+ {
+ "epoch": 49.607629427792915,
+ "grad_norm": 3.7884669303894043,
+ "learning_rate": 1.0612508887780085e-05,
+ "loss": 0.1649,
+ "step": 18206
+ },
+ {
+ "epoch": 49.61035422343324,
+ "grad_norm": 4.525467872619629,
+ "learning_rate": 1.0611628047730935e-05,
+ "loss": 0.1861,
+ "step": 18207
+ },
+ {
+ "epoch": 49.61307901907357,
+ "grad_norm": 7.235852241516113,
+ "learning_rate": 1.0610747202918442e-05,
+ "loss": 0.13,
+ "step": 18208
+ },
+ {
+ "epoch": 49.6158038147139,
+ "grad_norm": 9.90200138092041,
+ "learning_rate": 1.0609866353349474e-05,
+ "loss": 0.1544,
+ "step": 18209
+ },
+ {
+ "epoch": 49.618528610354225,
+ "grad_norm": 4.8709869384765625,
+ "learning_rate": 1.0608985499030884e-05,
+ "loss": 0.0988,
+ "step": 18210
+ },
+ {
+ "epoch": 49.62125340599455,
+ "grad_norm": 6.361578941345215,
+ "learning_rate": 1.0608104639969535e-05,
+ "loss": 0.1463,
+ "step": 18211
+ },
+ {
+ "epoch": 49.62397820163488,
+ "grad_norm": 6.684064865112305,
+ "learning_rate": 1.0607223776172287e-05,
+ "loss": 0.2931,
+ "step": 18212
+ },
+ {
+ "epoch": 49.6267029972752,
+ "grad_norm": 4.376237869262695,
+ "learning_rate": 1.0606342907645998e-05,
+ "loss": 0.1451,
+ "step": 18213
+ },
+ {
+ "epoch": 49.62942779291553,
+ "grad_norm": 5.746951580047607,
+ "learning_rate": 1.0605462034397532e-05,
+ "loss": 0.16,
+ "step": 18214
+ },
+ {
+ "epoch": 49.63215258855586,
+ "grad_norm": 4.049665927886963,
+ "learning_rate": 1.060458115643375e-05,
+ "loss": 0.2061,
+ "step": 18215
+ },
+ {
+ "epoch": 49.63487738419619,
+ "grad_norm": 5.825301170349121,
+ "learning_rate": 1.0603700273761504e-05,
+ "loss": 0.1265,
+ "step": 18216
+ },
+ {
+ "epoch": 49.63760217983651,
+ "grad_norm": 3.50651478767395,
+ "learning_rate": 1.060281938638766e-05,
+ "loss": 0.0803,
+ "step": 18217
+ },
+ {
+ "epoch": 49.64032697547684,
+ "grad_norm": 3.667231559753418,
+ "learning_rate": 1.060193849431908e-05,
+ "loss": 0.1276,
+ "step": 18218
+ },
+ {
+ "epoch": 49.643051771117165,
+ "grad_norm": 4.3791327476501465,
+ "learning_rate": 1.0601057597562623e-05,
+ "loss": 0.2172,
+ "step": 18219
+ },
+ {
+ "epoch": 49.64577656675749,
+ "grad_norm": 5.698973178863525,
+ "learning_rate": 1.0600176696125146e-05,
+ "loss": 0.1031,
+ "step": 18220
+ },
+ {
+ "epoch": 49.64850136239782,
+ "grad_norm": 7.409605979919434,
+ "learning_rate": 1.0599295790013515e-05,
+ "loss": 0.1568,
+ "step": 18221
+ },
+ {
+ "epoch": 49.65122615803815,
+ "grad_norm": 5.001932144165039,
+ "learning_rate": 1.0598414879234587e-05,
+ "loss": 0.2364,
+ "step": 18222
+ },
+ {
+ "epoch": 49.653950953678475,
+ "grad_norm": 4.489975929260254,
+ "learning_rate": 1.0597533963795223e-05,
+ "loss": 0.093,
+ "step": 18223
+ },
+ {
+ "epoch": 49.6566757493188,
+ "grad_norm": 6.3259596824646,
+ "learning_rate": 1.0596653043702283e-05,
+ "loss": 0.1477,
+ "step": 18224
+ },
+ {
+ "epoch": 49.65940054495913,
+ "grad_norm": 7.116461277008057,
+ "learning_rate": 1.0595772118962631e-05,
+ "loss": 0.3108,
+ "step": 18225
+ },
+ {
+ "epoch": 49.66212534059945,
+ "grad_norm": 4.958671569824219,
+ "learning_rate": 1.0594891189583119e-05,
+ "loss": 0.0998,
+ "step": 18226
+ },
+ {
+ "epoch": 49.664850136239785,
+ "grad_norm": 15.675604820251465,
+ "learning_rate": 1.059401025557062e-05,
+ "loss": 0.1984,
+ "step": 18227
+ },
+ {
+ "epoch": 49.66757493188011,
+ "grad_norm": 6.726870536804199,
+ "learning_rate": 1.0593129316931985e-05,
+ "loss": 0.1522,
+ "step": 18228
+ },
+ {
+ "epoch": 49.67029972752044,
+ "grad_norm": 5.004068374633789,
+ "learning_rate": 1.0592248373674078e-05,
+ "loss": 0.2209,
+ "step": 18229
+ },
+ {
+ "epoch": 49.67302452316076,
+ "grad_norm": 4.550838470458984,
+ "learning_rate": 1.059136742580376e-05,
+ "loss": 0.0881,
+ "step": 18230
+ },
+ {
+ "epoch": 49.67574931880109,
+ "grad_norm": 4.816982746124268,
+ "learning_rate": 1.0590486473327894e-05,
+ "loss": 0.1794,
+ "step": 18231
+ },
+ {
+ "epoch": 49.678474114441414,
+ "grad_norm": 5.47058629989624,
+ "learning_rate": 1.0589605516253333e-05,
+ "loss": 0.2464,
+ "step": 18232
+ },
+ {
+ "epoch": 49.68119891008175,
+ "grad_norm": 6.425475120544434,
+ "learning_rate": 1.058872455458695e-05,
+ "loss": 0.1028,
+ "step": 18233
+ },
+ {
+ "epoch": 49.68392370572207,
+ "grad_norm": 5.621904373168945,
+ "learning_rate": 1.0587843588335592e-05,
+ "loss": 0.2819,
+ "step": 18234
+ },
+ {
+ "epoch": 49.6866485013624,
+ "grad_norm": 4.362329959869385,
+ "learning_rate": 1.058696261750613e-05,
+ "loss": 0.1758,
+ "step": 18235
+ },
+ {
+ "epoch": 49.689373297002724,
+ "grad_norm": 6.487398147583008,
+ "learning_rate": 1.0586081642105423e-05,
+ "loss": 0.2571,
+ "step": 18236
+ },
+ {
+ "epoch": 49.69209809264305,
+ "grad_norm": 5.748312473297119,
+ "learning_rate": 1.0585200662140334e-05,
+ "loss": 0.3426,
+ "step": 18237
+ },
+ {
+ "epoch": 49.694822888283376,
+ "grad_norm": 4.671896934509277,
+ "learning_rate": 1.0584319677617716e-05,
+ "loss": 0.1777,
+ "step": 18238
+ },
+ {
+ "epoch": 49.69754768392371,
+ "grad_norm": 4.370096206665039,
+ "learning_rate": 1.0583438688544438e-05,
+ "loss": 0.1786,
+ "step": 18239
+ },
+ {
+ "epoch": 49.700272479564035,
+ "grad_norm": 4.892489433288574,
+ "learning_rate": 1.0582557694927356e-05,
+ "loss": 0.139,
+ "step": 18240
+ },
+ {
+ "epoch": 49.70299727520436,
+ "grad_norm": 4.985652923583984,
+ "learning_rate": 1.0581676696773336e-05,
+ "loss": 0.3533,
+ "step": 18241
+ },
+ {
+ "epoch": 49.705722070844686,
+ "grad_norm": 7.21626615524292,
+ "learning_rate": 1.0580795694089234e-05,
+ "loss": 0.1689,
+ "step": 18242
+ },
+ {
+ "epoch": 49.70844686648501,
+ "grad_norm": 3.7203969955444336,
+ "learning_rate": 1.0579914686881914e-05,
+ "loss": 0.0635,
+ "step": 18243
+ },
+ {
+ "epoch": 49.71117166212534,
+ "grad_norm": 4.61190128326416,
+ "learning_rate": 1.0579033675158236e-05,
+ "loss": 0.1296,
+ "step": 18244
+ },
+ {
+ "epoch": 49.71389645776567,
+ "grad_norm": 4.63526725769043,
+ "learning_rate": 1.0578152658925066e-05,
+ "loss": 0.2572,
+ "step": 18245
+ },
+ {
+ "epoch": 49.716621253406,
+ "grad_norm": 5.661147117614746,
+ "learning_rate": 1.0577271638189261e-05,
+ "loss": 0.2119,
+ "step": 18246
+ },
+ {
+ "epoch": 49.71934604904632,
+ "grad_norm": 5.838468074798584,
+ "learning_rate": 1.0576390612957683e-05,
+ "loss": 0.1644,
+ "step": 18247
+ },
+ {
+ "epoch": 49.72207084468665,
+ "grad_norm": 4.0203962326049805,
+ "learning_rate": 1.057550958323719e-05,
+ "loss": 0.0692,
+ "step": 18248
+ },
+ {
+ "epoch": 49.724795640326974,
+ "grad_norm": 5.284526824951172,
+ "learning_rate": 1.0574628549034653e-05,
+ "loss": 0.1809,
+ "step": 18249
+ },
+ {
+ "epoch": 49.7275204359673,
+ "grad_norm": 5.219470024108887,
+ "learning_rate": 1.0573747510356923e-05,
+ "loss": 0.1761,
+ "step": 18250
+ },
+ {
+ "epoch": 49.73024523160763,
+ "grad_norm": 4.994770526885986,
+ "learning_rate": 1.0572866467210865e-05,
+ "loss": 0.157,
+ "step": 18251
+ },
+ {
+ "epoch": 49.73297002724796,
+ "grad_norm": 6.430014610290527,
+ "learning_rate": 1.0571985419603343e-05,
+ "loss": 0.259,
+ "step": 18252
+ },
+ {
+ "epoch": 49.735694822888284,
+ "grad_norm": 6.348018646240234,
+ "learning_rate": 1.0571104367541218e-05,
+ "loss": 0.2008,
+ "step": 18253
+ },
+ {
+ "epoch": 49.73841961852861,
+ "grad_norm": 4.19774866104126,
+ "learning_rate": 1.0570223311031349e-05,
+ "loss": 0.1261,
+ "step": 18254
+ },
+ {
+ "epoch": 49.741144414168936,
+ "grad_norm": 4.381269931793213,
+ "learning_rate": 1.0569342250080601e-05,
+ "loss": 0.0822,
+ "step": 18255
+ },
+ {
+ "epoch": 49.74386920980926,
+ "grad_norm": 5.628778457641602,
+ "learning_rate": 1.0568461184695833e-05,
+ "loss": 0.2369,
+ "step": 18256
+ },
+ {
+ "epoch": 49.746594005449595,
+ "grad_norm": 5.383265495300293,
+ "learning_rate": 1.056758011488391e-05,
+ "loss": 0.2278,
+ "step": 18257
+ },
+ {
+ "epoch": 49.74931880108992,
+ "grad_norm": 4.400010108947754,
+ "learning_rate": 1.0566699040651687e-05,
+ "loss": 0.1128,
+ "step": 18258
+ },
+ {
+ "epoch": 49.752043596730246,
+ "grad_norm": 6.867877006530762,
+ "learning_rate": 1.0565817962006033e-05,
+ "loss": 0.2063,
+ "step": 18259
+ },
+ {
+ "epoch": 49.75476839237057,
+ "grad_norm": 3.7297110557556152,
+ "learning_rate": 1.0564936878953804e-05,
+ "loss": 0.1872,
+ "step": 18260
+ },
+ {
+ "epoch": 49.7574931880109,
+ "grad_norm": 6.1977858543396,
+ "learning_rate": 1.0564055791501867e-05,
+ "loss": 0.2369,
+ "step": 18261
+ },
+ {
+ "epoch": 49.76021798365122,
+ "grad_norm": 5.163815975189209,
+ "learning_rate": 1.056317469965708e-05,
+ "loss": 0.1626,
+ "step": 18262
+ },
+ {
+ "epoch": 49.762942779291556,
+ "grad_norm": 4.913216590881348,
+ "learning_rate": 1.0562293603426309e-05,
+ "loss": 0.1421,
+ "step": 18263
+ },
+ {
+ "epoch": 49.76566757493188,
+ "grad_norm": 4.714107513427734,
+ "learning_rate": 1.0561412502816411e-05,
+ "loss": 0.1879,
+ "step": 18264
+ },
+ {
+ "epoch": 49.76839237057221,
+ "grad_norm": 5.038058757781982,
+ "learning_rate": 1.0560531397834253e-05,
+ "loss": 0.2115,
+ "step": 18265
+ },
+ {
+ "epoch": 49.771117166212534,
+ "grad_norm": 13.269697189331055,
+ "learning_rate": 1.055965028848669e-05,
+ "loss": 0.1234,
+ "step": 18266
+ },
+ {
+ "epoch": 49.77384196185286,
+ "grad_norm": 4.1821699142456055,
+ "learning_rate": 1.0558769174780595e-05,
+ "loss": 0.0749,
+ "step": 18267
+ },
+ {
+ "epoch": 49.776566757493185,
+ "grad_norm": 6.874485969543457,
+ "learning_rate": 1.055788805672282e-05,
+ "loss": 0.2055,
+ "step": 18268
+ },
+ {
+ "epoch": 49.77929155313352,
+ "grad_norm": 4.795389175415039,
+ "learning_rate": 1.0557006934320232e-05,
+ "loss": 0.1236,
+ "step": 18269
+ },
+ {
+ "epoch": 49.782016348773844,
+ "grad_norm": 13.366247177124023,
+ "learning_rate": 1.0556125807579691e-05,
+ "loss": 0.2072,
+ "step": 18270
+ },
+ {
+ "epoch": 49.78474114441417,
+ "grad_norm": 3.8460803031921387,
+ "learning_rate": 1.0555244676508058e-05,
+ "loss": 0.0697,
+ "step": 18271
+ },
+ {
+ "epoch": 49.787465940054496,
+ "grad_norm": 4.661848545074463,
+ "learning_rate": 1.05543635411122e-05,
+ "loss": 0.1132,
+ "step": 18272
+ },
+ {
+ "epoch": 49.79019073569482,
+ "grad_norm": 11.662322998046875,
+ "learning_rate": 1.0553482401398979e-05,
+ "loss": 0.1519,
+ "step": 18273
+ },
+ {
+ "epoch": 49.79291553133515,
+ "grad_norm": 7.327706336975098,
+ "learning_rate": 1.055260125737525e-05,
+ "loss": 0.0829,
+ "step": 18274
+ },
+ {
+ "epoch": 49.79564032697548,
+ "grad_norm": 6.02321195602417,
+ "learning_rate": 1.0551720109047883e-05,
+ "loss": 0.1618,
+ "step": 18275
+ },
+ {
+ "epoch": 49.798365122615806,
+ "grad_norm": 5.443646430969238,
+ "learning_rate": 1.0550838956423737e-05,
+ "loss": 0.0948,
+ "step": 18276
+ },
+ {
+ "epoch": 49.80108991825613,
+ "grad_norm": 4.680039405822754,
+ "learning_rate": 1.0549957799509674e-05,
+ "loss": 0.2436,
+ "step": 18277
+ },
+ {
+ "epoch": 49.80381471389646,
+ "grad_norm": 4.676031589508057,
+ "learning_rate": 1.0549076638312558e-05,
+ "loss": 0.28,
+ "step": 18278
+ },
+ {
+ "epoch": 49.80653950953678,
+ "grad_norm": 4.422796249389648,
+ "learning_rate": 1.0548195472839251e-05,
+ "loss": 0.2487,
+ "step": 18279
+ },
+ {
+ "epoch": 49.80926430517711,
+ "grad_norm": 6.870621204376221,
+ "learning_rate": 1.0547314303096617e-05,
+ "loss": 0.116,
+ "step": 18280
+ },
+ {
+ "epoch": 49.81198910081744,
+ "grad_norm": 5.2428154945373535,
+ "learning_rate": 1.0546433129091514e-05,
+ "loss": 0.1182,
+ "step": 18281
+ },
+ {
+ "epoch": 49.81471389645777,
+ "grad_norm": 4.760616779327393,
+ "learning_rate": 1.0545551950830808e-05,
+ "loss": 0.1925,
+ "step": 18282
+ },
+ {
+ "epoch": 49.817438692098094,
+ "grad_norm": 5.274930000305176,
+ "learning_rate": 1.054467076832136e-05,
+ "loss": 0.1249,
+ "step": 18283
+ },
+ {
+ "epoch": 49.82016348773842,
+ "grad_norm": 4.147454738616943,
+ "learning_rate": 1.0543789581570037e-05,
+ "loss": 0.097,
+ "step": 18284
+ },
+ {
+ "epoch": 49.822888283378745,
+ "grad_norm": 4.724230766296387,
+ "learning_rate": 1.0542908390583694e-05,
+ "loss": 0.1272,
+ "step": 18285
+ },
+ {
+ "epoch": 49.82561307901907,
+ "grad_norm": 3.691598653793335,
+ "learning_rate": 1.0542027195369202e-05,
+ "loss": 0.1959,
+ "step": 18286
+ },
+ {
+ "epoch": 49.828337874659404,
+ "grad_norm": 4.603728771209717,
+ "learning_rate": 1.0541145995933416e-05,
+ "loss": 0.124,
+ "step": 18287
+ },
+ {
+ "epoch": 49.83106267029973,
+ "grad_norm": 5.445811748504639,
+ "learning_rate": 1.0540264792283205e-05,
+ "loss": 0.0962,
+ "step": 18288
+ },
+ {
+ "epoch": 49.833787465940055,
+ "grad_norm": 3.8996129035949707,
+ "learning_rate": 1.0539383584425428e-05,
+ "loss": 0.1087,
+ "step": 18289
+ },
+ {
+ "epoch": 49.83651226158038,
+ "grad_norm": 5.699887752532959,
+ "learning_rate": 1.053850237236695e-05,
+ "loss": 0.1406,
+ "step": 18290
+ },
+ {
+ "epoch": 49.83923705722071,
+ "grad_norm": 6.749419212341309,
+ "learning_rate": 1.0537621156114633e-05,
+ "loss": 0.2279,
+ "step": 18291
+ },
+ {
+ "epoch": 49.84196185286103,
+ "grad_norm": 12.689628601074219,
+ "learning_rate": 1.053673993567534e-05,
+ "loss": 0.15,
+ "step": 18292
+ },
+ {
+ "epoch": 49.844686648501366,
+ "grad_norm": 5.9806742668151855,
+ "learning_rate": 1.0535858711055931e-05,
+ "loss": 0.2104,
+ "step": 18293
+ },
+ {
+ "epoch": 49.84741144414169,
+ "grad_norm": 4.2488017082214355,
+ "learning_rate": 1.0534977482263274e-05,
+ "loss": 0.1174,
+ "step": 18294
+ },
+ {
+ "epoch": 49.85013623978202,
+ "grad_norm": 4.2461771965026855,
+ "learning_rate": 1.0534096249304226e-05,
+ "loss": 0.1724,
+ "step": 18295
+ },
+ {
+ "epoch": 49.85286103542234,
+ "grad_norm": 4.024528503417969,
+ "learning_rate": 1.0533215012185659e-05,
+ "loss": 0.2053,
+ "step": 18296
+ },
+ {
+ "epoch": 49.85558583106267,
+ "grad_norm": 4.433617115020752,
+ "learning_rate": 1.0532333770914427e-05,
+ "loss": 0.1113,
+ "step": 18297
+ },
+ {
+ "epoch": 49.858310626702995,
+ "grad_norm": 3.990469455718994,
+ "learning_rate": 1.0531452525497398e-05,
+ "loss": 0.1112,
+ "step": 18298
+ },
+ {
+ "epoch": 49.86103542234333,
+ "grad_norm": 5.256641387939453,
+ "learning_rate": 1.0530571275941433e-05,
+ "loss": 0.1691,
+ "step": 18299
+ },
+ {
+ "epoch": 49.86376021798365,
+ "grad_norm": 4.690814971923828,
+ "learning_rate": 1.0529690022253398e-05,
+ "loss": 0.1937,
+ "step": 18300
+ },
+ {
+ "epoch": 49.86648501362398,
+ "grad_norm": 4.61068868637085,
+ "learning_rate": 1.0528808764440152e-05,
+ "loss": 0.1708,
+ "step": 18301
+ },
+ {
+ "epoch": 49.869209809264305,
+ "grad_norm": 5.555260181427002,
+ "learning_rate": 1.052792750250856e-05,
+ "loss": 0.2876,
+ "step": 18302
+ },
+ {
+ "epoch": 49.87193460490463,
+ "grad_norm": 23.923898696899414,
+ "learning_rate": 1.0527046236465485e-05,
+ "loss": 0.2312,
+ "step": 18303
+ },
+ {
+ "epoch": 49.87465940054496,
+ "grad_norm": 4.177738189697266,
+ "learning_rate": 1.0526164966317796e-05,
+ "loss": 0.219,
+ "step": 18304
+ },
+ {
+ "epoch": 49.87738419618529,
+ "grad_norm": 5.994362831115723,
+ "learning_rate": 1.0525283692072346e-05,
+ "loss": 0.1716,
+ "step": 18305
+ },
+ {
+ "epoch": 49.880108991825615,
+ "grad_norm": 5.897968769073486,
+ "learning_rate": 1.0524402413736005e-05,
+ "loss": 0.1874,
+ "step": 18306
+ },
+ {
+ "epoch": 49.88283378746594,
+ "grad_norm": 9.682744026184082,
+ "learning_rate": 1.0523521131315636e-05,
+ "loss": 0.1946,
+ "step": 18307
+ },
+ {
+ "epoch": 49.88555858310627,
+ "grad_norm": 4.334563732147217,
+ "learning_rate": 1.0522639844818102e-05,
+ "loss": 0.1312,
+ "step": 18308
+ },
+ {
+ "epoch": 49.88828337874659,
+ "grad_norm": 4.382263660430908,
+ "learning_rate": 1.0521758554250263e-05,
+ "loss": 0.1112,
+ "step": 18309
+ },
+ {
+ "epoch": 49.89100817438692,
+ "grad_norm": 3.9178307056427,
+ "learning_rate": 1.0520877259618986e-05,
+ "loss": 0.0924,
+ "step": 18310
+ },
+ {
+ "epoch": 49.89373297002725,
+ "grad_norm": 4.639375686645508,
+ "learning_rate": 1.0519995960931136e-05,
+ "loss": 0.1725,
+ "step": 18311
+ },
+ {
+ "epoch": 49.89645776566758,
+ "grad_norm": 4.992181777954102,
+ "learning_rate": 1.051911465819357e-05,
+ "loss": 0.1519,
+ "step": 18312
+ },
+ {
+ "epoch": 49.8991825613079,
+ "grad_norm": 6.2513275146484375,
+ "learning_rate": 1.0518233351413155e-05,
+ "loss": 0.0841,
+ "step": 18313
+ },
+ {
+ "epoch": 49.90190735694823,
+ "grad_norm": 4.794405937194824,
+ "learning_rate": 1.0517352040596762e-05,
+ "loss": 0.3198,
+ "step": 18314
+ },
+ {
+ "epoch": 49.904632152588555,
+ "grad_norm": 4.1200032234191895,
+ "learning_rate": 1.0516470725751242e-05,
+ "loss": 0.1155,
+ "step": 18315
+ },
+ {
+ "epoch": 49.90735694822888,
+ "grad_norm": 5.223155975341797,
+ "learning_rate": 1.0515589406883469e-05,
+ "loss": 0.1609,
+ "step": 18316
+ },
+ {
+ "epoch": 49.91008174386921,
+ "grad_norm": 4.886833667755127,
+ "learning_rate": 1.05147080840003e-05,
+ "loss": 0.3186,
+ "step": 18317
+ },
+ {
+ "epoch": 49.91280653950954,
+ "grad_norm": 5.794650077819824,
+ "learning_rate": 1.0513826757108603e-05,
+ "loss": 0.0866,
+ "step": 18318
+ },
+ {
+ "epoch": 49.915531335149865,
+ "grad_norm": 4.465744972229004,
+ "learning_rate": 1.0512945426215234e-05,
+ "loss": 0.1001,
+ "step": 18319
+ },
+ {
+ "epoch": 49.91825613079019,
+ "grad_norm": 9.17824935913086,
+ "learning_rate": 1.0512064091327067e-05,
+ "loss": 0.0945,
+ "step": 18320
+ },
+ {
+ "epoch": 49.920980926430516,
+ "grad_norm": 6.776849746704102,
+ "learning_rate": 1.0511182752450959e-05,
+ "loss": 0.1981,
+ "step": 18321
+ },
+ {
+ "epoch": 49.92370572207084,
+ "grad_norm": 5.3896098136901855,
+ "learning_rate": 1.0510301409593779e-05,
+ "loss": 0.1399,
+ "step": 18322
+ },
+ {
+ "epoch": 49.926430517711175,
+ "grad_norm": 3.8560609817504883,
+ "learning_rate": 1.0509420062762388e-05,
+ "loss": 0.1679,
+ "step": 18323
+ },
+ {
+ "epoch": 49.9291553133515,
+ "grad_norm": 5.350097179412842,
+ "learning_rate": 1.0508538711963649e-05,
+ "loss": 0.2121,
+ "step": 18324
+ },
+ {
+ "epoch": 49.93188010899183,
+ "grad_norm": 4.888600826263428,
+ "learning_rate": 1.0507657357204426e-05,
+ "loss": 0.1259,
+ "step": 18325
+ },
+ {
+ "epoch": 49.93460490463215,
+ "grad_norm": 3.7617251873016357,
+ "learning_rate": 1.0506775998491587e-05,
+ "loss": 0.1737,
+ "step": 18326
+ },
+ {
+ "epoch": 49.93732970027248,
+ "grad_norm": 5.460902214050293,
+ "learning_rate": 1.050589463583199e-05,
+ "loss": 0.1618,
+ "step": 18327
+ },
+ {
+ "epoch": 49.940054495912804,
+ "grad_norm": 7.914155960083008,
+ "learning_rate": 1.0505013269232503e-05,
+ "loss": 0.2932,
+ "step": 18328
+ },
+ {
+ "epoch": 49.94277929155314,
+ "grad_norm": 6.479796886444092,
+ "learning_rate": 1.0504131898699985e-05,
+ "loss": 0.119,
+ "step": 18329
+ },
+ {
+ "epoch": 49.94550408719346,
+ "grad_norm": 4.8925628662109375,
+ "learning_rate": 1.0503250524241308e-05,
+ "loss": 0.2076,
+ "step": 18330
+ },
+ {
+ "epoch": 49.94822888283379,
+ "grad_norm": 4.879620552062988,
+ "learning_rate": 1.0502369145863332e-05,
+ "loss": 0.1089,
+ "step": 18331
+ },
+ {
+ "epoch": 49.950953678474114,
+ "grad_norm": 5.510569095611572,
+ "learning_rate": 1.0501487763572921e-05,
+ "loss": 0.1811,
+ "step": 18332
+ },
+ {
+ "epoch": 49.95367847411444,
+ "grad_norm": 5.198431968688965,
+ "learning_rate": 1.0500606377376938e-05,
+ "loss": 0.2939,
+ "step": 18333
+ },
+ {
+ "epoch": 49.956403269754766,
+ "grad_norm": 5.519257545471191,
+ "learning_rate": 1.0499724987282251e-05,
+ "loss": 0.1253,
+ "step": 18334
+ },
+ {
+ "epoch": 49.95912806539509,
+ "grad_norm": 4.976462364196777,
+ "learning_rate": 1.049884359329572e-05,
+ "loss": 0.2019,
+ "step": 18335
+ },
+ {
+ "epoch": 49.961852861035425,
+ "grad_norm": 4.999112606048584,
+ "learning_rate": 1.0497962195424214e-05,
+ "loss": 0.1197,
+ "step": 18336
+ },
+ {
+ "epoch": 49.96457765667575,
+ "grad_norm": 4.481200218200684,
+ "learning_rate": 1.049708079367459e-05,
+ "loss": 0.082,
+ "step": 18337
+ },
+ {
+ "epoch": 49.967302452316076,
+ "grad_norm": 5.327234268188477,
+ "learning_rate": 1.0496199388053718e-05,
+ "loss": 0.1496,
+ "step": 18338
+ },
+ {
+ "epoch": 49.9700272479564,
+ "grad_norm": 5.957428455352783,
+ "learning_rate": 1.0495317978568462e-05,
+ "loss": 0.1545,
+ "step": 18339
+ },
+ {
+ "epoch": 49.97275204359673,
+ "grad_norm": 4.346925735473633,
+ "learning_rate": 1.0494436565225688e-05,
+ "loss": 0.1513,
+ "step": 18340
+ },
+ {
+ "epoch": 49.97547683923706,
+ "grad_norm": 4.060068607330322,
+ "learning_rate": 1.0493555148032253e-05,
+ "loss": 0.1498,
+ "step": 18341
+ },
+ {
+ "epoch": 49.97820163487739,
+ "grad_norm": 6.395273685455322,
+ "learning_rate": 1.0492673726995031e-05,
+ "loss": 0.2749,
+ "step": 18342
+ },
+ {
+ "epoch": 49.98092643051771,
+ "grad_norm": 7.144204139709473,
+ "learning_rate": 1.0491792302120879e-05,
+ "loss": 0.1537,
+ "step": 18343
+ },
+ {
+ "epoch": 49.98365122615804,
+ "grad_norm": 4.112253665924072,
+ "learning_rate": 1.0490910873416667e-05,
+ "loss": 0.1762,
+ "step": 18344
+ },
+ {
+ "epoch": 49.986376021798364,
+ "grad_norm": 5.929678916931152,
+ "learning_rate": 1.0490029440889254e-05,
+ "loss": 0.1125,
+ "step": 18345
+ },
+ {
+ "epoch": 49.98910081743869,
+ "grad_norm": 5.074626445770264,
+ "learning_rate": 1.0489148004545506e-05,
+ "loss": 0.1712,
+ "step": 18346
+ },
+ {
+ "epoch": 49.991825613079016,
+ "grad_norm": 5.8632612228393555,
+ "learning_rate": 1.0488266564392293e-05,
+ "loss": 0.1416,
+ "step": 18347
+ },
+ {
+ "epoch": 49.99455040871935,
+ "grad_norm": 4.237979888916016,
+ "learning_rate": 1.0487385120436475e-05,
+ "loss": 0.177,
+ "step": 18348
+ },
+ {
+ "epoch": 49.997275204359674,
+ "grad_norm": 5.096149444580078,
+ "learning_rate": 1.0486503672684915e-05,
+ "loss": 0.1208,
+ "step": 18349
+ },
+ {
+ "epoch": 50.0,
+ "grad_norm": 5.351661205291748,
+ "learning_rate": 1.0485622221144485e-05,
+ "loss": 0.175,
+ "step": 18350
+ },
+ {
+ "epoch": 50.002724795640326,
+ "grad_norm": 4.498886585235596,
+ "learning_rate": 1.048474076582204e-05,
+ "loss": 0.1241,
+ "step": 18351
+ },
+ {
+ "epoch": 50.00544959128065,
+ "grad_norm": 4.655673503875732,
+ "learning_rate": 1.0483859306724451e-05,
+ "loss": 0.2254,
+ "step": 18352
+ },
+ {
+ "epoch": 50.00817438692098,
+ "grad_norm": 4.227473735809326,
+ "learning_rate": 1.0482977843858581e-05,
+ "loss": 0.2683,
+ "step": 18353
+ },
+ {
+ "epoch": 50.01089918256131,
+ "grad_norm": 9.067605018615723,
+ "learning_rate": 1.0482096377231297e-05,
+ "loss": 0.1116,
+ "step": 18354
+ },
+ {
+ "epoch": 50.013623978201636,
+ "grad_norm": 5.1989874839782715,
+ "learning_rate": 1.0481214906849459e-05,
+ "loss": 0.1028,
+ "step": 18355
+ },
+ {
+ "epoch": 50.01634877384196,
+ "grad_norm": 3.9210336208343506,
+ "learning_rate": 1.0480333432719936e-05,
+ "loss": 0.1528,
+ "step": 18356
+ },
+ {
+ "epoch": 50.01907356948229,
+ "grad_norm": 4.288864612579346,
+ "learning_rate": 1.0479451954849594e-05,
+ "loss": 0.2224,
+ "step": 18357
+ },
+ {
+ "epoch": 50.02179836512261,
+ "grad_norm": 3.425851345062256,
+ "learning_rate": 1.0478570473245293e-05,
+ "loss": 0.0959,
+ "step": 18358
+ },
+ {
+ "epoch": 50.02452316076294,
+ "grad_norm": 5.149254322052002,
+ "learning_rate": 1.0477688987913898e-05,
+ "loss": 0.0959,
+ "step": 18359
+ },
+ {
+ "epoch": 50.02724795640327,
+ "grad_norm": 4.205198287963867,
+ "learning_rate": 1.0476807498862282e-05,
+ "loss": 0.0985,
+ "step": 18360
+ },
+ {
+ "epoch": 50.0299727520436,
+ "grad_norm": 4.834911823272705,
+ "learning_rate": 1.04759260060973e-05,
+ "loss": 0.192,
+ "step": 18361
+ },
+ {
+ "epoch": 50.032697547683924,
+ "grad_norm": 3.771606683731079,
+ "learning_rate": 1.0475044509625827e-05,
+ "loss": 0.0944,
+ "step": 18362
+ },
+ {
+ "epoch": 50.03542234332425,
+ "grad_norm": 5.029878616333008,
+ "learning_rate": 1.0474163009454718e-05,
+ "loss": 0.0996,
+ "step": 18363
+ },
+ {
+ "epoch": 50.038147138964575,
+ "grad_norm": 3.8827707767486572,
+ "learning_rate": 1.0473281505590844e-05,
+ "loss": 0.0865,
+ "step": 18364
+ },
+ {
+ "epoch": 50.0408719346049,
+ "grad_norm": 4.6911773681640625,
+ "learning_rate": 1.047239999804107e-05,
+ "loss": 0.1315,
+ "step": 18365
+ },
+ {
+ "epoch": 50.043596730245234,
+ "grad_norm": 9.542468070983887,
+ "learning_rate": 1.0471518486812258e-05,
+ "loss": 0.2691,
+ "step": 18366
+ },
+ {
+ "epoch": 50.04632152588556,
+ "grad_norm": 5.197531700134277,
+ "learning_rate": 1.0470636971911277e-05,
+ "loss": 0.2597,
+ "step": 18367
+ },
+ {
+ "epoch": 50.049046321525886,
+ "grad_norm": 4.857045650482178,
+ "learning_rate": 1.0469755453344989e-05,
+ "loss": 0.1893,
+ "step": 18368
+ },
+ {
+ "epoch": 50.05177111716621,
+ "grad_norm": 4.129888534545898,
+ "learning_rate": 1.0468873931120263e-05,
+ "loss": 0.1494,
+ "step": 18369
+ },
+ {
+ "epoch": 50.05449591280654,
+ "grad_norm": 5.007657527923584,
+ "learning_rate": 1.0467992405243959e-05,
+ "loss": 0.2078,
+ "step": 18370
+ },
+ {
+ "epoch": 50.05722070844686,
+ "grad_norm": 4.791961193084717,
+ "learning_rate": 1.0467110875722945e-05,
+ "loss": 0.1493,
+ "step": 18371
+ },
+ {
+ "epoch": 50.059945504087196,
+ "grad_norm": 4.589936256408691,
+ "learning_rate": 1.0466229342564087e-05,
+ "loss": 0.1173,
+ "step": 18372
+ },
+ {
+ "epoch": 50.06267029972752,
+ "grad_norm": 4.196911811828613,
+ "learning_rate": 1.0465347805774253e-05,
+ "loss": 0.1584,
+ "step": 18373
+ },
+ {
+ "epoch": 50.06539509536785,
+ "grad_norm": 4.869670867919922,
+ "learning_rate": 1.0464466265360303e-05,
+ "loss": 0.2005,
+ "step": 18374
+ },
+ {
+ "epoch": 50.06811989100817,
+ "grad_norm": 3.5600781440734863,
+ "learning_rate": 1.0463584721329105e-05,
+ "loss": 0.2594,
+ "step": 18375
+ },
+ {
+ "epoch": 50.0708446866485,
+ "grad_norm": 4.4433979988098145,
+ "learning_rate": 1.0462703173687523e-05,
+ "loss": 0.229,
+ "step": 18376
+ },
+ {
+ "epoch": 50.073569482288825,
+ "grad_norm": 4.804118633270264,
+ "learning_rate": 1.0461821622442425e-05,
+ "loss": 0.2624,
+ "step": 18377
+ },
+ {
+ "epoch": 50.07629427792916,
+ "grad_norm": 4.39185094833374,
+ "learning_rate": 1.0460940067600676e-05,
+ "loss": 0.0922,
+ "step": 18378
+ },
+ {
+ "epoch": 50.079019073569484,
+ "grad_norm": 6.641062259674072,
+ "learning_rate": 1.046005850916914e-05,
+ "loss": 0.09,
+ "step": 18379
+ },
+ {
+ "epoch": 50.08174386920981,
+ "grad_norm": 4.962137699127197,
+ "learning_rate": 1.0459176947154682e-05,
+ "loss": 0.1016,
+ "step": 18380
+ },
+ {
+ "epoch": 50.084468664850135,
+ "grad_norm": 5.6916279792785645,
+ "learning_rate": 1.0458295381564168e-05,
+ "loss": 0.1782,
+ "step": 18381
+ },
+ {
+ "epoch": 50.08719346049046,
+ "grad_norm": 3.9860925674438477,
+ "learning_rate": 1.0457413812404461e-05,
+ "loss": 0.2467,
+ "step": 18382
+ },
+ {
+ "epoch": 50.08991825613079,
+ "grad_norm": 9.179952621459961,
+ "learning_rate": 1.0456532239682438e-05,
+ "loss": 0.1843,
+ "step": 18383
+ },
+ {
+ "epoch": 50.09264305177112,
+ "grad_norm": 4.272060394287109,
+ "learning_rate": 1.0455650663404953e-05,
+ "loss": 0.1184,
+ "step": 18384
+ },
+ {
+ "epoch": 50.095367847411445,
+ "grad_norm": 5.147090911865234,
+ "learning_rate": 1.0454769083578876e-05,
+ "loss": 0.1671,
+ "step": 18385
+ },
+ {
+ "epoch": 50.09809264305177,
+ "grad_norm": 4.8225836753845215,
+ "learning_rate": 1.0453887500211068e-05,
+ "loss": 0.0667,
+ "step": 18386
+ },
+ {
+ "epoch": 50.1008174386921,
+ "grad_norm": 4.201931476593018,
+ "learning_rate": 1.0453005913308405e-05,
+ "loss": 0.099,
+ "step": 18387
+ },
+ {
+ "epoch": 50.10354223433242,
+ "grad_norm": 5.505147457122803,
+ "learning_rate": 1.0452124322877741e-05,
+ "loss": 0.0965,
+ "step": 18388
+ },
+ {
+ "epoch": 50.10626702997275,
+ "grad_norm": 6.157524108886719,
+ "learning_rate": 1.045124272892595e-05,
+ "loss": 0.2204,
+ "step": 18389
+ },
+ {
+ "epoch": 50.10899182561308,
+ "grad_norm": 4.28139066696167,
+ "learning_rate": 1.0450361131459894e-05,
+ "loss": 0.2364,
+ "step": 18390
+ },
+ {
+ "epoch": 50.11171662125341,
+ "grad_norm": 5.012563228607178,
+ "learning_rate": 1.0449479530486441e-05,
+ "loss": 0.1196,
+ "step": 18391
+ },
+ {
+ "epoch": 50.11444141689373,
+ "grad_norm": 4.472416877746582,
+ "learning_rate": 1.0448597926012456e-05,
+ "loss": 0.2205,
+ "step": 18392
+ },
+ {
+ "epoch": 50.11716621253406,
+ "grad_norm": 5.370371341705322,
+ "learning_rate": 1.0447716318044807e-05,
+ "loss": 0.1321,
+ "step": 18393
+ },
+ {
+ "epoch": 50.119891008174385,
+ "grad_norm": 6.545853137969971,
+ "learning_rate": 1.0446834706590354e-05,
+ "loss": 0.0559,
+ "step": 18394
+ },
+ {
+ "epoch": 50.12261580381471,
+ "grad_norm": 5.600507736206055,
+ "learning_rate": 1.044595309165597e-05,
+ "loss": 0.1398,
+ "step": 18395
+ },
+ {
+ "epoch": 50.12534059945504,
+ "grad_norm": 6.128230094909668,
+ "learning_rate": 1.0445071473248514e-05,
+ "loss": 0.145,
+ "step": 18396
+ },
+ {
+ "epoch": 50.12806539509537,
+ "grad_norm": 4.690159797668457,
+ "learning_rate": 1.0444189851374857e-05,
+ "loss": 0.2394,
+ "step": 18397
+ },
+ {
+ "epoch": 50.130790190735695,
+ "grad_norm": 4.9555487632751465,
+ "learning_rate": 1.0443308226041862e-05,
+ "loss": 0.1515,
+ "step": 18398
+ },
+ {
+ "epoch": 50.13351498637602,
+ "grad_norm": 4.733140468597412,
+ "learning_rate": 1.04424265972564e-05,
+ "loss": 0.1177,
+ "step": 18399
+ },
+ {
+ "epoch": 50.13623978201635,
+ "grad_norm": 4.880582332611084,
+ "learning_rate": 1.0441544965025332e-05,
+ "loss": 0.1291,
+ "step": 18400
+ },
+ {
+ "epoch": 50.13896457765667,
+ "grad_norm": 3.9399352073669434,
+ "learning_rate": 1.044066332935553e-05,
+ "loss": 0.0717,
+ "step": 18401
+ },
+ {
+ "epoch": 50.141689373297005,
+ "grad_norm": 7.9581708908081055,
+ "learning_rate": 1.0439781690253851e-05,
+ "loss": 0.1258,
+ "step": 18402
+ },
+ {
+ "epoch": 50.14441416893733,
+ "grad_norm": 5.133094787597656,
+ "learning_rate": 1.043890004772717e-05,
+ "loss": 0.0825,
+ "step": 18403
+ },
+ {
+ "epoch": 50.14713896457766,
+ "grad_norm": 3.9729957580566406,
+ "learning_rate": 1.0438018401782347e-05,
+ "loss": 0.1867,
+ "step": 18404
+ },
+ {
+ "epoch": 50.14986376021798,
+ "grad_norm": 3.989093542098999,
+ "learning_rate": 1.0437136752426254e-05,
+ "loss": 0.2117,
+ "step": 18405
+ },
+ {
+ "epoch": 50.15258855585831,
+ "grad_norm": 4.257974624633789,
+ "learning_rate": 1.0436255099665746e-05,
+ "loss": 0.2167,
+ "step": 18406
+ },
+ {
+ "epoch": 50.155313351498634,
+ "grad_norm": 4.502657413482666,
+ "learning_rate": 1.0435373443507706e-05,
+ "loss": 0.1782,
+ "step": 18407
+ },
+ {
+ "epoch": 50.15803814713897,
+ "grad_norm": 5.227933406829834,
+ "learning_rate": 1.0434491783958986e-05,
+ "loss": 0.1995,
+ "step": 18408
+ },
+ {
+ "epoch": 50.16076294277929,
+ "grad_norm": 9.845762252807617,
+ "learning_rate": 1.0433610121026463e-05,
+ "loss": 0.1165,
+ "step": 18409
+ },
+ {
+ "epoch": 50.16348773841962,
+ "grad_norm": 4.153945446014404,
+ "learning_rate": 1.0432728454716996e-05,
+ "loss": 0.1055,
+ "step": 18410
+ },
+ {
+ "epoch": 50.166212534059945,
+ "grad_norm": 5.337934970855713,
+ "learning_rate": 1.0431846785037454e-05,
+ "loss": 0.2107,
+ "step": 18411
+ },
+ {
+ "epoch": 50.16893732970027,
+ "grad_norm": 4.0061750411987305,
+ "learning_rate": 1.0430965111994701e-05,
+ "loss": 0.091,
+ "step": 18412
+ },
+ {
+ "epoch": 50.171662125340596,
+ "grad_norm": 67.78372192382812,
+ "learning_rate": 1.0430083435595611e-05,
+ "loss": 0.1771,
+ "step": 18413
+ },
+ {
+ "epoch": 50.17438692098093,
+ "grad_norm": 4.743940830230713,
+ "learning_rate": 1.0429201755847041e-05,
+ "loss": 0.0999,
+ "step": 18414
+ },
+ {
+ "epoch": 50.177111716621255,
+ "grad_norm": 4.93541145324707,
+ "learning_rate": 1.042832007275586e-05,
+ "loss": 0.1944,
+ "step": 18415
+ },
+ {
+ "epoch": 50.17983651226158,
+ "grad_norm": 5.489130020141602,
+ "learning_rate": 1.0427438386328936e-05,
+ "loss": 0.1787,
+ "step": 18416
+ },
+ {
+ "epoch": 50.182561307901906,
+ "grad_norm": 4.149992942810059,
+ "learning_rate": 1.042655669657314e-05,
+ "loss": 0.1445,
+ "step": 18417
+ },
+ {
+ "epoch": 50.18528610354223,
+ "grad_norm": 5.850244045257568,
+ "learning_rate": 1.0425675003495333e-05,
+ "loss": 0.0969,
+ "step": 18418
+ },
+ {
+ "epoch": 50.18801089918256,
+ "grad_norm": 5.269390106201172,
+ "learning_rate": 1.0424793307102381e-05,
+ "loss": 0.1114,
+ "step": 18419
+ },
+ {
+ "epoch": 50.19073569482289,
+ "grad_norm": 7.50940465927124,
+ "learning_rate": 1.0423911607401152e-05,
+ "loss": 0.2189,
+ "step": 18420
+ },
+ {
+ "epoch": 50.19346049046322,
+ "grad_norm": 5.363705635070801,
+ "learning_rate": 1.0423029904398515e-05,
+ "loss": 0.1729,
+ "step": 18421
+ },
+ {
+ "epoch": 50.19618528610354,
+ "grad_norm": 5.508678436279297,
+ "learning_rate": 1.0422148198101334e-05,
+ "loss": 0.1864,
+ "step": 18422
+ },
+ {
+ "epoch": 50.19891008174387,
+ "grad_norm": 8.772170066833496,
+ "learning_rate": 1.0421266488516478e-05,
+ "loss": 0.3508,
+ "step": 18423
+ },
+ {
+ "epoch": 50.201634877384194,
+ "grad_norm": 6.351077079772949,
+ "learning_rate": 1.0420384775650806e-05,
+ "loss": 0.1513,
+ "step": 18424
+ },
+ {
+ "epoch": 50.20435967302452,
+ "grad_norm": 8.251812934875488,
+ "learning_rate": 1.0419503059511197e-05,
+ "loss": 0.1293,
+ "step": 18425
+ },
+ {
+ "epoch": 50.20708446866485,
+ "grad_norm": 4.953874111175537,
+ "learning_rate": 1.0418621340104509e-05,
+ "loss": 0.1023,
+ "step": 18426
+ },
+ {
+ "epoch": 50.20980926430518,
+ "grad_norm": 4.948370456695557,
+ "learning_rate": 1.0417739617437615e-05,
+ "loss": 0.117,
+ "step": 18427
+ },
+ {
+ "epoch": 50.212534059945504,
+ "grad_norm": 6.658825397491455,
+ "learning_rate": 1.0416857891517374e-05,
+ "loss": 0.1379,
+ "step": 18428
+ },
+ {
+ "epoch": 50.21525885558583,
+ "grad_norm": 5.551758289337158,
+ "learning_rate": 1.041597616235066e-05,
+ "loss": 0.1382,
+ "step": 18429
+ },
+ {
+ "epoch": 50.217983651226156,
+ "grad_norm": 6.4018683433532715,
+ "learning_rate": 1.0415094429944334e-05,
+ "loss": 0.2777,
+ "step": 18430
+ },
+ {
+ "epoch": 50.22070844686648,
+ "grad_norm": 6.368010997772217,
+ "learning_rate": 1.041421269430527e-05,
+ "loss": 0.1227,
+ "step": 18431
+ },
+ {
+ "epoch": 50.223433242506815,
+ "grad_norm": 7.071566581726074,
+ "learning_rate": 1.0413330955440328e-05,
+ "loss": 0.1889,
+ "step": 18432
+ },
+ {
+ "epoch": 50.22615803814714,
+ "grad_norm": 4.986183166503906,
+ "learning_rate": 1.0412449213356377e-05,
+ "loss": 0.1167,
+ "step": 18433
+ },
+ {
+ "epoch": 50.228882833787466,
+ "grad_norm": 6.3849029541015625,
+ "learning_rate": 1.0411567468060288e-05,
+ "loss": 0.2268,
+ "step": 18434
+ },
+ {
+ "epoch": 50.23160762942779,
+ "grad_norm": 7.67453145980835,
+ "learning_rate": 1.0410685719558921e-05,
+ "loss": 0.0973,
+ "step": 18435
+ },
+ {
+ "epoch": 50.23433242506812,
+ "grad_norm": 11.306721687316895,
+ "learning_rate": 1.040980396785915e-05,
+ "loss": 0.1166,
+ "step": 18436
+ },
+ {
+ "epoch": 50.237057220708444,
+ "grad_norm": 5.158883094787598,
+ "learning_rate": 1.0408922212967839e-05,
+ "loss": 0.1354,
+ "step": 18437
+ },
+ {
+ "epoch": 50.23978201634878,
+ "grad_norm": 5.250732898712158,
+ "learning_rate": 1.0408040454891852e-05,
+ "loss": 0.095,
+ "step": 18438
+ },
+ {
+ "epoch": 50.2425068119891,
+ "grad_norm": 5.08771276473999,
+ "learning_rate": 1.0407158693638065e-05,
+ "loss": 0.2626,
+ "step": 18439
+ },
+ {
+ "epoch": 50.24523160762943,
+ "grad_norm": 6.133188724517822,
+ "learning_rate": 1.0406276929213332e-05,
+ "loss": 0.2383,
+ "step": 18440
+ },
+ {
+ "epoch": 50.247956403269754,
+ "grad_norm": 9.72242259979248,
+ "learning_rate": 1.040539516162453e-05,
+ "loss": 0.1978,
+ "step": 18441
+ },
+ {
+ "epoch": 50.25068119891008,
+ "grad_norm": 7.685892581939697,
+ "learning_rate": 1.0404513390878526e-05,
+ "loss": 0.1966,
+ "step": 18442
+ },
+ {
+ "epoch": 50.253405994550405,
+ "grad_norm": 23.41997718811035,
+ "learning_rate": 1.0403631616982181e-05,
+ "loss": 0.2018,
+ "step": 18443
+ },
+ {
+ "epoch": 50.25613079019074,
+ "grad_norm": 18.337629318237305,
+ "learning_rate": 1.040274983994237e-05,
+ "loss": 0.1876,
+ "step": 18444
+ },
+ {
+ "epoch": 50.258855585831064,
+ "grad_norm": 6.652121543884277,
+ "learning_rate": 1.0401868059765952e-05,
+ "loss": 0.1405,
+ "step": 18445
+ },
+ {
+ "epoch": 50.26158038147139,
+ "grad_norm": 6.964537143707275,
+ "learning_rate": 1.04009862764598e-05,
+ "loss": 0.25,
+ "step": 18446
+ },
+ {
+ "epoch": 50.264305177111716,
+ "grad_norm": 7.468809604644775,
+ "learning_rate": 1.0400104490030781e-05,
+ "loss": 0.311,
+ "step": 18447
+ },
+ {
+ "epoch": 50.26702997275204,
+ "grad_norm": 8.93313217163086,
+ "learning_rate": 1.039922270048576e-05,
+ "loss": 0.1644,
+ "step": 18448
+ },
+ {
+ "epoch": 50.26975476839237,
+ "grad_norm": 5.838148593902588,
+ "learning_rate": 1.0398340907831603e-05,
+ "loss": 0.1412,
+ "step": 18449
+ },
+ {
+ "epoch": 50.2724795640327,
+ "grad_norm": 15.795492172241211,
+ "learning_rate": 1.0397459112075186e-05,
+ "loss": 0.1476,
+ "step": 18450
+ },
+ {
+ "epoch": 50.275204359673026,
+ "grad_norm": 7.08922815322876,
+ "learning_rate": 1.0396577313223367e-05,
+ "loss": 0.1622,
+ "step": 18451
+ },
+ {
+ "epoch": 50.27792915531335,
+ "grad_norm": 6.640037536621094,
+ "learning_rate": 1.0395695511283015e-05,
+ "loss": 0.1612,
+ "step": 18452
+ },
+ {
+ "epoch": 50.28065395095368,
+ "grad_norm": 6.648226261138916,
+ "learning_rate": 1.0394813706261e-05,
+ "loss": 0.0946,
+ "step": 18453
+ },
+ {
+ "epoch": 50.283378746594,
+ "grad_norm": 5.4601593017578125,
+ "learning_rate": 1.0393931898164191e-05,
+ "loss": 0.1922,
+ "step": 18454
+ },
+ {
+ "epoch": 50.28610354223433,
+ "grad_norm": 16.282859802246094,
+ "learning_rate": 1.039305008699945e-05,
+ "loss": 0.1048,
+ "step": 18455
+ },
+ {
+ "epoch": 50.28882833787466,
+ "grad_norm": 7.032933235168457,
+ "learning_rate": 1.0392168272773651e-05,
+ "loss": 0.1855,
+ "step": 18456
+ },
+ {
+ "epoch": 50.29155313351499,
+ "grad_norm": 7.576723575592041,
+ "learning_rate": 1.0391286455493655e-05,
+ "loss": 0.2885,
+ "step": 18457
+ },
+ {
+ "epoch": 50.294277929155314,
+ "grad_norm": 6.466182708740234,
+ "learning_rate": 1.0390404635166331e-05,
+ "loss": 0.1541,
+ "step": 18458
+ },
+ {
+ "epoch": 50.29700272479564,
+ "grad_norm": 5.537355422973633,
+ "learning_rate": 1.0389522811798551e-05,
+ "loss": 0.1611,
+ "step": 18459
+ },
+ {
+ "epoch": 50.299727520435965,
+ "grad_norm": 7.105430603027344,
+ "learning_rate": 1.038864098539718e-05,
+ "loss": 0.134,
+ "step": 18460
+ },
+ {
+ "epoch": 50.30245231607629,
+ "grad_norm": 5.081597328186035,
+ "learning_rate": 1.0387759155969085e-05,
+ "loss": 0.2542,
+ "step": 18461
+ },
+ {
+ "epoch": 50.305177111716624,
+ "grad_norm": 5.218195915222168,
+ "learning_rate": 1.0386877323521137e-05,
+ "loss": 0.1787,
+ "step": 18462
+ },
+ {
+ "epoch": 50.30790190735695,
+ "grad_norm": 6.520836353302002,
+ "learning_rate": 1.0385995488060196e-05,
+ "loss": 0.1189,
+ "step": 18463
+ },
+ {
+ "epoch": 50.310626702997276,
+ "grad_norm": 5.77503776550293,
+ "learning_rate": 1.0385113649593137e-05,
+ "loss": 0.2085,
+ "step": 18464
+ },
+ {
+ "epoch": 50.3133514986376,
+ "grad_norm": 4.978865146636963,
+ "learning_rate": 1.0384231808126826e-05,
+ "loss": 0.3342,
+ "step": 18465
+ },
+ {
+ "epoch": 50.31607629427793,
+ "grad_norm": 5.38184928894043,
+ "learning_rate": 1.038334996366813e-05,
+ "loss": 0.1617,
+ "step": 18466
+ },
+ {
+ "epoch": 50.31880108991825,
+ "grad_norm": 5.251583099365234,
+ "learning_rate": 1.0382468116223912e-05,
+ "loss": 0.243,
+ "step": 18467
+ },
+ {
+ "epoch": 50.321525885558586,
+ "grad_norm": 5.05536413192749,
+ "learning_rate": 1.0381586265801049e-05,
+ "loss": 0.302,
+ "step": 18468
+ },
+ {
+ "epoch": 50.32425068119891,
+ "grad_norm": 4.584299564361572,
+ "learning_rate": 1.0380704412406405e-05,
+ "loss": 0.109,
+ "step": 18469
+ },
+ {
+ "epoch": 50.32697547683924,
+ "grad_norm": 4.566288471221924,
+ "learning_rate": 1.0379822556046845e-05,
+ "loss": 0.2359,
+ "step": 18470
+ },
+ {
+ "epoch": 50.32970027247956,
+ "grad_norm": 5.151820659637451,
+ "learning_rate": 1.037894069672924e-05,
+ "loss": 0.2084,
+ "step": 18471
+ },
+ {
+ "epoch": 50.33242506811989,
+ "grad_norm": 6.798867225646973,
+ "learning_rate": 1.037805883446046e-05,
+ "loss": 0.1276,
+ "step": 18472
+ },
+ {
+ "epoch": 50.335149863760215,
+ "grad_norm": 4.876811981201172,
+ "learning_rate": 1.0377176969247366e-05,
+ "loss": 0.1242,
+ "step": 18473
+ },
+ {
+ "epoch": 50.33787465940055,
+ "grad_norm": 5.204194068908691,
+ "learning_rate": 1.0376295101096834e-05,
+ "loss": 0.1834,
+ "step": 18474
+ },
+ {
+ "epoch": 50.34059945504087,
+ "grad_norm": 7.647690773010254,
+ "learning_rate": 1.037541323001572e-05,
+ "loss": 0.1279,
+ "step": 18475
+ },
+ {
+ "epoch": 50.3433242506812,
+ "grad_norm": 6.199369430541992,
+ "learning_rate": 1.0374531356010909e-05,
+ "loss": 0.1893,
+ "step": 18476
+ },
+ {
+ "epoch": 50.346049046321525,
+ "grad_norm": 4.2011189460754395,
+ "learning_rate": 1.0373649479089254e-05,
+ "loss": 0.1199,
+ "step": 18477
+ },
+ {
+ "epoch": 50.34877384196185,
+ "grad_norm": 7.538383483886719,
+ "learning_rate": 1.0372767599257631e-05,
+ "loss": 0.1437,
+ "step": 18478
+ },
+ {
+ "epoch": 50.35149863760218,
+ "grad_norm": 4.226534843444824,
+ "learning_rate": 1.0371885716522904e-05,
+ "loss": 0.1227,
+ "step": 18479
+ },
+ {
+ "epoch": 50.35422343324251,
+ "grad_norm": 5.861737251281738,
+ "learning_rate": 1.0371003830891948e-05,
+ "loss": 0.1451,
+ "step": 18480
+ },
+ {
+ "epoch": 50.356948228882835,
+ "grad_norm": 7.6636762619018555,
+ "learning_rate": 1.0370121942371623e-05,
+ "loss": 0.1809,
+ "step": 18481
+ },
+ {
+ "epoch": 50.35967302452316,
+ "grad_norm": 6.123965263366699,
+ "learning_rate": 1.0369240050968802e-05,
+ "loss": 0.1501,
+ "step": 18482
+ },
+ {
+ "epoch": 50.36239782016349,
+ "grad_norm": 5.685791015625,
+ "learning_rate": 1.0368358156690345e-05,
+ "loss": 0.1547,
+ "step": 18483
+ },
+ {
+ "epoch": 50.36512261580381,
+ "grad_norm": 5.073871612548828,
+ "learning_rate": 1.0367476259543133e-05,
+ "loss": 0.1027,
+ "step": 18484
+ },
+ {
+ "epoch": 50.36784741144414,
+ "grad_norm": 7.540602684020996,
+ "learning_rate": 1.0366594359534024e-05,
+ "loss": 0.1327,
+ "step": 18485
+ },
+ {
+ "epoch": 50.37057220708447,
+ "grad_norm": 5.798464298248291,
+ "learning_rate": 1.0365712456669891e-05,
+ "loss": 0.145,
+ "step": 18486
+ },
+ {
+ "epoch": 50.3732970027248,
+ "grad_norm": 4.602923393249512,
+ "learning_rate": 1.0364830550957603e-05,
+ "loss": 0.1547,
+ "step": 18487
+ },
+ {
+ "epoch": 50.37602179836512,
+ "grad_norm": 7.460385322570801,
+ "learning_rate": 1.0363948642404025e-05,
+ "loss": 0.1556,
+ "step": 18488
+ },
+ {
+ "epoch": 50.37874659400545,
+ "grad_norm": 5.966169834136963,
+ "learning_rate": 1.0363066731016026e-05,
+ "loss": 0.3613,
+ "step": 18489
+ },
+ {
+ "epoch": 50.381471389645775,
+ "grad_norm": 6.093320369720459,
+ "learning_rate": 1.0362184816800478e-05,
+ "loss": 0.1202,
+ "step": 18490
+ },
+ {
+ "epoch": 50.3841961852861,
+ "grad_norm": 5.022852420806885,
+ "learning_rate": 1.0361302899764242e-05,
+ "loss": 0.199,
+ "step": 18491
+ },
+ {
+ "epoch": 50.38692098092643,
+ "grad_norm": 6.382558822631836,
+ "learning_rate": 1.0360420979914192e-05,
+ "loss": 0.1699,
+ "step": 18492
+ },
+ {
+ "epoch": 50.38964577656676,
+ "grad_norm": 4.964744567871094,
+ "learning_rate": 1.0359539057257196e-05,
+ "loss": 0.283,
+ "step": 18493
+ },
+ {
+ "epoch": 50.392370572207085,
+ "grad_norm": 7.423490047454834,
+ "learning_rate": 1.0358657131800123e-05,
+ "loss": 0.1443,
+ "step": 18494
+ },
+ {
+ "epoch": 50.39509536784741,
+ "grad_norm": 4.478601932525635,
+ "learning_rate": 1.0357775203549836e-05,
+ "loss": 0.2648,
+ "step": 18495
+ },
+ {
+ "epoch": 50.39782016348774,
+ "grad_norm": 5.2288818359375,
+ "learning_rate": 1.0356893272513211e-05,
+ "loss": 0.1324,
+ "step": 18496
+ },
+ {
+ "epoch": 50.40054495912806,
+ "grad_norm": 3.6058640480041504,
+ "learning_rate": 1.0356011338697109e-05,
+ "loss": 0.0967,
+ "step": 18497
+ },
+ {
+ "epoch": 50.403269754768395,
+ "grad_norm": 6.091643810272217,
+ "learning_rate": 1.0355129402108407e-05,
+ "loss": 0.1614,
+ "step": 18498
+ },
+ {
+ "epoch": 50.40599455040872,
+ "grad_norm": 5.402215003967285,
+ "learning_rate": 1.0354247462753964e-05,
+ "loss": 0.1089,
+ "step": 18499
+ },
+ {
+ "epoch": 50.40871934604905,
+ "grad_norm": 5.242166996002197,
+ "learning_rate": 1.0353365520640657e-05,
+ "loss": 0.1504,
+ "step": 18500
+ },
+ {
+ "epoch": 50.41144414168937,
+ "grad_norm": 6.618157386779785,
+ "learning_rate": 1.0352483575775345e-05,
+ "loss": 0.0943,
+ "step": 18501
+ },
+ {
+ "epoch": 50.4141689373297,
+ "grad_norm": 6.022257328033447,
+ "learning_rate": 1.0351601628164906e-05,
+ "loss": 0.1216,
+ "step": 18502
+ },
+ {
+ "epoch": 50.416893732970024,
+ "grad_norm": 5.579530239105225,
+ "learning_rate": 1.0350719677816206e-05,
+ "loss": 0.091,
+ "step": 18503
+ },
+ {
+ "epoch": 50.41961852861036,
+ "grad_norm": 5.442110061645508,
+ "learning_rate": 1.0349837724736111e-05,
+ "loss": 0.2021,
+ "step": 18504
+ },
+ {
+ "epoch": 50.42234332425068,
+ "grad_norm": 6.488962173461914,
+ "learning_rate": 1.034895576893149e-05,
+ "loss": 0.1867,
+ "step": 18505
+ },
+ {
+ "epoch": 50.42506811989101,
+ "grad_norm": 13.680377960205078,
+ "learning_rate": 1.0348073810409216e-05,
+ "loss": 0.2782,
+ "step": 18506
+ },
+ {
+ "epoch": 50.427792915531334,
+ "grad_norm": 3.9911866188049316,
+ "learning_rate": 1.0347191849176151e-05,
+ "loss": 0.0757,
+ "step": 18507
+ },
+ {
+ "epoch": 50.43051771117166,
+ "grad_norm": 5.4325714111328125,
+ "learning_rate": 1.034630988523917e-05,
+ "loss": 0.1251,
+ "step": 18508
+ },
+ {
+ "epoch": 50.433242506811986,
+ "grad_norm": 4.3573384284973145,
+ "learning_rate": 1.0345427918605136e-05,
+ "loss": 0.0782,
+ "step": 18509
+ },
+ {
+ "epoch": 50.43596730245232,
+ "grad_norm": 3.7895023822784424,
+ "learning_rate": 1.034454594928092e-05,
+ "loss": 0.0818,
+ "step": 18510
+ },
+ {
+ "epoch": 50.438692098092645,
+ "grad_norm": 5.045506954193115,
+ "learning_rate": 1.0343663977273393e-05,
+ "loss": 0.0791,
+ "step": 18511
+ },
+ {
+ "epoch": 50.44141689373297,
+ "grad_norm": 5.500280857086182,
+ "learning_rate": 1.0342782002589421e-05,
+ "loss": 0.2222,
+ "step": 18512
+ },
+ {
+ "epoch": 50.444141689373296,
+ "grad_norm": 4.472443103790283,
+ "learning_rate": 1.0341900025235876e-05,
+ "loss": 0.1824,
+ "step": 18513
+ },
+ {
+ "epoch": 50.44686648501362,
+ "grad_norm": 5.784664630889893,
+ "learning_rate": 1.0341018045219624e-05,
+ "loss": 0.1524,
+ "step": 18514
+ },
+ {
+ "epoch": 50.44959128065395,
+ "grad_norm": 5.076463222503662,
+ "learning_rate": 1.0340136062547531e-05,
+ "loss": 0.2144,
+ "step": 18515
+ },
+ {
+ "epoch": 50.45231607629428,
+ "grad_norm": 5.553852081298828,
+ "learning_rate": 1.0339254077226474e-05,
+ "loss": 0.2322,
+ "step": 18516
+ },
+ {
+ "epoch": 50.45504087193461,
+ "grad_norm": 5.4261698722839355,
+ "learning_rate": 1.0338372089263316e-05,
+ "loss": 0.2037,
+ "step": 18517
+ },
+ {
+ "epoch": 50.45776566757493,
+ "grad_norm": 20.90692901611328,
+ "learning_rate": 1.0337490098664923e-05,
+ "loss": 0.1938,
+ "step": 18518
+ },
+ {
+ "epoch": 50.46049046321526,
+ "grad_norm": 7.544172763824463,
+ "learning_rate": 1.0336608105438172e-05,
+ "loss": 0.2766,
+ "step": 18519
+ },
+ {
+ "epoch": 50.463215258855584,
+ "grad_norm": 4.8083977699279785,
+ "learning_rate": 1.0335726109589927e-05,
+ "loss": 0.1645,
+ "step": 18520
+ },
+ {
+ "epoch": 50.46594005449591,
+ "grad_norm": 5.119318008422852,
+ "learning_rate": 1.0334844111127058e-05,
+ "loss": 0.1378,
+ "step": 18521
+ },
+ {
+ "epoch": 50.46866485013624,
+ "grad_norm": 13.963621139526367,
+ "learning_rate": 1.0333962110056435e-05,
+ "loss": 0.1564,
+ "step": 18522
+ },
+ {
+ "epoch": 50.47138964577657,
+ "grad_norm": 5.176802635192871,
+ "learning_rate": 1.0333080106384922e-05,
+ "loss": 0.1489,
+ "step": 18523
+ },
+ {
+ "epoch": 50.474114441416894,
+ "grad_norm": 6.25013542175293,
+ "learning_rate": 1.0332198100119398e-05,
+ "loss": 0.1352,
+ "step": 18524
+ },
+ {
+ "epoch": 50.47683923705722,
+ "grad_norm": 4.3459320068359375,
+ "learning_rate": 1.033131609126672e-05,
+ "loss": 0.1453,
+ "step": 18525
+ },
+ {
+ "epoch": 50.479564032697546,
+ "grad_norm": 5.281796455383301,
+ "learning_rate": 1.0330434079833767e-05,
+ "loss": 0.2247,
+ "step": 18526
+ },
+ {
+ "epoch": 50.48228882833787,
+ "grad_norm": 5.650903224945068,
+ "learning_rate": 1.0329552065827402e-05,
+ "loss": 0.1086,
+ "step": 18527
+ },
+ {
+ "epoch": 50.485013623978205,
+ "grad_norm": 5.897468090057373,
+ "learning_rate": 1.0328670049254494e-05,
+ "loss": 0.1713,
+ "step": 18528
+ },
+ {
+ "epoch": 50.48773841961853,
+ "grad_norm": 5.536411285400391,
+ "learning_rate": 1.032778803012192e-05,
+ "loss": 0.1332,
+ "step": 18529
+ },
+ {
+ "epoch": 50.490463215258856,
+ "grad_norm": 4.596107482910156,
+ "learning_rate": 1.0326906008436537e-05,
+ "loss": 0.1164,
+ "step": 18530
+ },
+ {
+ "epoch": 50.49318801089918,
+ "grad_norm": 12.462303161621094,
+ "learning_rate": 1.0326023984205224e-05,
+ "loss": 0.2555,
+ "step": 18531
+ },
+ {
+ "epoch": 50.49591280653951,
+ "grad_norm": 4.766989707946777,
+ "learning_rate": 1.0325141957434848e-05,
+ "loss": 0.103,
+ "step": 18532
+ },
+ {
+ "epoch": 50.49863760217983,
+ "grad_norm": 5.915868759155273,
+ "learning_rate": 1.0324259928132273e-05,
+ "loss": 0.2964,
+ "step": 18533
+ },
+ {
+ "epoch": 50.50136239782017,
+ "grad_norm": 4.585247993469238,
+ "learning_rate": 1.0323377896304377e-05,
+ "loss": 0.1374,
+ "step": 18534
+ },
+ {
+ "epoch": 50.50408719346049,
+ "grad_norm": 6.821434497833252,
+ "learning_rate": 1.032249586195802e-05,
+ "loss": 0.2504,
+ "step": 18535
+ },
+ {
+ "epoch": 50.50681198910082,
+ "grad_norm": 4.72754430770874,
+ "learning_rate": 1.0321613825100076e-05,
+ "loss": 0.1451,
+ "step": 18536
+ },
+ {
+ "epoch": 50.509536784741144,
+ "grad_norm": 4.41359806060791,
+ "learning_rate": 1.0320731785737417e-05,
+ "loss": 0.2929,
+ "step": 18537
+ },
+ {
+ "epoch": 50.51226158038147,
+ "grad_norm": 5.099160671234131,
+ "learning_rate": 1.0319849743876904e-05,
+ "loss": 0.1279,
+ "step": 18538
+ },
+ {
+ "epoch": 50.514986376021795,
+ "grad_norm": 4.279083728790283,
+ "learning_rate": 1.0318967699525418e-05,
+ "loss": 0.0831,
+ "step": 18539
+ },
+ {
+ "epoch": 50.51771117166213,
+ "grad_norm": 3.7065377235412598,
+ "learning_rate": 1.0318085652689817e-05,
+ "loss": 0.2047,
+ "step": 18540
+ },
+ {
+ "epoch": 50.520435967302454,
+ "grad_norm": 5.958557605743408,
+ "learning_rate": 1.0317203603376978e-05,
+ "loss": 0.1109,
+ "step": 18541
+ },
+ {
+ "epoch": 50.52316076294278,
+ "grad_norm": 5.407521724700928,
+ "learning_rate": 1.0316321551593765e-05,
+ "loss": 0.1997,
+ "step": 18542
+ },
+ {
+ "epoch": 50.525885558583106,
+ "grad_norm": 4.932890892028809,
+ "learning_rate": 1.0315439497347053e-05,
+ "loss": 0.092,
+ "step": 18543
+ },
+ {
+ "epoch": 50.52861035422343,
+ "grad_norm": 5.787096977233887,
+ "learning_rate": 1.0314557440643704e-05,
+ "loss": 0.2025,
+ "step": 18544
+ },
+ {
+ "epoch": 50.53133514986376,
+ "grad_norm": 5.552667617797852,
+ "learning_rate": 1.0313675381490596e-05,
+ "loss": 0.2368,
+ "step": 18545
+ },
+ {
+ "epoch": 50.53405994550409,
+ "grad_norm": 4.171079158782959,
+ "learning_rate": 1.031279331989459e-05,
+ "loss": 0.1034,
+ "step": 18546
+ },
+ {
+ "epoch": 50.536784741144416,
+ "grad_norm": 4.297781467437744,
+ "learning_rate": 1.0311911255862563e-05,
+ "loss": 0.0874,
+ "step": 18547
+ },
+ {
+ "epoch": 50.53950953678474,
+ "grad_norm": 6.7232441902160645,
+ "learning_rate": 1.0311029189401381e-05,
+ "loss": 0.2101,
+ "step": 18548
+ },
+ {
+ "epoch": 50.54223433242507,
+ "grad_norm": 4.8784589767456055,
+ "learning_rate": 1.0310147120517914e-05,
+ "loss": 0.3153,
+ "step": 18549
+ },
+ {
+ "epoch": 50.54495912806539,
+ "grad_norm": 6.15592622756958,
+ "learning_rate": 1.030926504921903e-05,
+ "loss": 0.2002,
+ "step": 18550
+ },
+ {
+ "epoch": 50.54768392370572,
+ "grad_norm": 15.851859092712402,
+ "learning_rate": 1.0308382975511601e-05,
+ "loss": 0.1726,
+ "step": 18551
+ },
+ {
+ "epoch": 50.55040871934605,
+ "grad_norm": 7.502651691436768,
+ "learning_rate": 1.0307500899402493e-05,
+ "loss": 0.364,
+ "step": 18552
+ },
+ {
+ "epoch": 50.55313351498638,
+ "grad_norm": 4.7100396156311035,
+ "learning_rate": 1.0306618820898579e-05,
+ "loss": 0.1076,
+ "step": 18553
+ },
+ {
+ "epoch": 50.555858310626704,
+ "grad_norm": 6.022217750549316,
+ "learning_rate": 1.0305736740006726e-05,
+ "loss": 0.1563,
+ "step": 18554
+ },
+ {
+ "epoch": 50.55858310626703,
+ "grad_norm": 8.388520240783691,
+ "learning_rate": 1.0304854656733808e-05,
+ "loss": 0.1141,
+ "step": 18555
+ },
+ {
+ "epoch": 50.561307901907355,
+ "grad_norm": 5.04994535446167,
+ "learning_rate": 1.0303972571086691e-05,
+ "loss": 0.1208,
+ "step": 18556
+ },
+ {
+ "epoch": 50.56403269754768,
+ "grad_norm": 6.984668254852295,
+ "learning_rate": 1.0303090483072247e-05,
+ "loss": 0.1762,
+ "step": 18557
+ },
+ {
+ "epoch": 50.566757493188014,
+ "grad_norm": 4.813941955566406,
+ "learning_rate": 1.0302208392697339e-05,
+ "loss": 0.0937,
+ "step": 18558
+ },
+ {
+ "epoch": 50.56948228882834,
+ "grad_norm": 5.3015875816345215,
+ "learning_rate": 1.0301326299968848e-05,
+ "loss": 0.1246,
+ "step": 18559
+ },
+ {
+ "epoch": 50.572207084468666,
+ "grad_norm": 7.070939064025879,
+ "learning_rate": 1.0300444204893634e-05,
+ "loss": 0.2059,
+ "step": 18560
+ },
+ {
+ "epoch": 50.57493188010899,
+ "grad_norm": 4.208089351654053,
+ "learning_rate": 1.0299562107478569e-05,
+ "loss": 0.0784,
+ "step": 18561
+ },
+ {
+ "epoch": 50.57765667574932,
+ "grad_norm": 5.170956134796143,
+ "learning_rate": 1.0298680007730525e-05,
+ "loss": 0.2942,
+ "step": 18562
+ },
+ {
+ "epoch": 50.58038147138964,
+ "grad_norm": 4.3384575843811035,
+ "learning_rate": 1.029779790565637e-05,
+ "loss": 0.2176,
+ "step": 18563
+ },
+ {
+ "epoch": 50.583106267029976,
+ "grad_norm": 4.105449199676514,
+ "learning_rate": 1.0296915801262977e-05,
+ "loss": 0.0632,
+ "step": 18564
+ },
+ {
+ "epoch": 50.5858310626703,
+ "grad_norm": 5.115097999572754,
+ "learning_rate": 1.0296033694557213e-05,
+ "loss": 0.1507,
+ "step": 18565
+ },
+ {
+ "epoch": 50.58855585831063,
+ "grad_norm": 5.516662120819092,
+ "learning_rate": 1.0295151585545947e-05,
+ "loss": 0.1112,
+ "step": 18566
+ },
+ {
+ "epoch": 50.59128065395095,
+ "grad_norm": 4.84885311126709,
+ "learning_rate": 1.029426947423605e-05,
+ "loss": 0.1101,
+ "step": 18567
+ },
+ {
+ "epoch": 50.59400544959128,
+ "grad_norm": 4.946444988250732,
+ "learning_rate": 1.029338736063439e-05,
+ "loss": 0.0787,
+ "step": 18568
+ },
+ {
+ "epoch": 50.596730245231605,
+ "grad_norm": 4.045813083648682,
+ "learning_rate": 1.0292505244747843e-05,
+ "loss": 0.1009,
+ "step": 18569
+ },
+ {
+ "epoch": 50.59945504087194,
+ "grad_norm": 6.580115795135498,
+ "learning_rate": 1.0291623126583268e-05,
+ "loss": 0.1581,
+ "step": 18570
+ },
+ {
+ "epoch": 50.60217983651226,
+ "grad_norm": 4.543004512786865,
+ "learning_rate": 1.0290741006147548e-05,
+ "loss": 0.0934,
+ "step": 18571
+ },
+ {
+ "epoch": 50.60490463215259,
+ "grad_norm": 5.4109368324279785,
+ "learning_rate": 1.0289858883447544e-05,
+ "loss": 0.2124,
+ "step": 18572
+ },
+ {
+ "epoch": 50.607629427792915,
+ "grad_norm": 10.45888900756836,
+ "learning_rate": 1.0288976758490129e-05,
+ "loss": 0.1781,
+ "step": 18573
+ },
+ {
+ "epoch": 50.61035422343324,
+ "grad_norm": 5.362655162811279,
+ "learning_rate": 1.028809463128217e-05,
+ "loss": 0.1545,
+ "step": 18574
+ },
+ {
+ "epoch": 50.61307901907357,
+ "grad_norm": 7.316466331481934,
+ "learning_rate": 1.0287212501830543e-05,
+ "loss": 0.2022,
+ "step": 18575
+ },
+ {
+ "epoch": 50.6158038147139,
+ "grad_norm": 3.898688316345215,
+ "learning_rate": 1.0286330370142111e-05,
+ "loss": 0.0998,
+ "step": 18576
+ },
+ {
+ "epoch": 50.618528610354225,
+ "grad_norm": 3.980304479598999,
+ "learning_rate": 1.028544823622375e-05,
+ "loss": 0.1586,
+ "step": 18577
+ },
+ {
+ "epoch": 50.62125340599455,
+ "grad_norm": 4.505300998687744,
+ "learning_rate": 1.0284566100082323e-05,
+ "loss": 0.2628,
+ "step": 18578
+ },
+ {
+ "epoch": 50.62397820163488,
+ "grad_norm": 5.694802284240723,
+ "learning_rate": 1.0283683961724708e-05,
+ "loss": 0.1341,
+ "step": 18579
+ },
+ {
+ "epoch": 50.6267029972752,
+ "grad_norm": 3.978081464767456,
+ "learning_rate": 1.0282801821157768e-05,
+ "loss": 0.154,
+ "step": 18580
+ },
+ {
+ "epoch": 50.62942779291553,
+ "grad_norm": 4.474717617034912,
+ "learning_rate": 1.0281919678388382e-05,
+ "loss": 0.2082,
+ "step": 18581
+ },
+ {
+ "epoch": 50.63215258855586,
+ "grad_norm": 8.891847610473633,
+ "learning_rate": 1.028103753342341e-05,
+ "loss": 0.1251,
+ "step": 18582
+ },
+ {
+ "epoch": 50.63487738419619,
+ "grad_norm": 7.032039165496826,
+ "learning_rate": 1.028015538626973e-05,
+ "loss": 0.2065,
+ "step": 18583
+ },
+ {
+ "epoch": 50.63760217983651,
+ "grad_norm": 9.012201309204102,
+ "learning_rate": 1.0279273236934207e-05,
+ "loss": 0.1921,
+ "step": 18584
+ },
+ {
+ "epoch": 50.64032697547684,
+ "grad_norm": 4.566155433654785,
+ "learning_rate": 1.0278391085423715e-05,
+ "loss": 0.1126,
+ "step": 18585
+ },
+ {
+ "epoch": 50.643051771117165,
+ "grad_norm": 5.303219795227051,
+ "learning_rate": 1.0277508931745119e-05,
+ "loss": 0.2254,
+ "step": 18586
+ },
+ {
+ "epoch": 50.64577656675749,
+ "grad_norm": 4.0097832679748535,
+ "learning_rate": 1.0276626775905294e-05,
+ "loss": 0.2024,
+ "step": 18587
+ },
+ {
+ "epoch": 50.64850136239782,
+ "grad_norm": 4.792849540710449,
+ "learning_rate": 1.0275744617911107e-05,
+ "loss": 0.2083,
+ "step": 18588
+ },
+ {
+ "epoch": 50.65122615803815,
+ "grad_norm": 4.081125259399414,
+ "learning_rate": 1.0274862457769432e-05,
+ "loss": 0.1437,
+ "step": 18589
+ },
+ {
+ "epoch": 50.653950953678475,
+ "grad_norm": 5.231274127960205,
+ "learning_rate": 1.0273980295487136e-05,
+ "loss": 0.1261,
+ "step": 18590
+ },
+ {
+ "epoch": 50.6566757493188,
+ "grad_norm": 5.771617412567139,
+ "learning_rate": 1.027309813107109e-05,
+ "loss": 0.1846,
+ "step": 18591
+ },
+ {
+ "epoch": 50.65940054495913,
+ "grad_norm": 5.414749622344971,
+ "learning_rate": 1.0272215964528168e-05,
+ "loss": 0.1033,
+ "step": 18592
+ },
+ {
+ "epoch": 50.66212534059945,
+ "grad_norm": 5.166776180267334,
+ "learning_rate": 1.0271333795865233e-05,
+ "loss": 0.1527,
+ "step": 18593
+ },
+ {
+ "epoch": 50.664850136239785,
+ "grad_norm": 5.49155330657959,
+ "learning_rate": 1.027045162508916e-05,
+ "loss": 0.1975,
+ "step": 18594
+ },
+ {
+ "epoch": 50.66757493188011,
+ "grad_norm": 4.783842086791992,
+ "learning_rate": 1.026956945220682e-05,
+ "loss": 0.1186,
+ "step": 18595
+ },
+ {
+ "epoch": 50.67029972752044,
+ "grad_norm": 8.354765892028809,
+ "learning_rate": 1.026868727722508e-05,
+ "loss": 0.1232,
+ "step": 18596
+ },
+ {
+ "epoch": 50.67302452316076,
+ "grad_norm": 5.419940948486328,
+ "learning_rate": 1.0267805100150811e-05,
+ "loss": 0.2251,
+ "step": 18597
+ },
+ {
+ "epoch": 50.67574931880109,
+ "grad_norm": 3.7597742080688477,
+ "learning_rate": 1.0266922920990885e-05,
+ "loss": 0.0977,
+ "step": 18598
+ },
+ {
+ "epoch": 50.678474114441414,
+ "grad_norm": 5.967283248901367,
+ "learning_rate": 1.0266040739752175e-05,
+ "loss": 0.2887,
+ "step": 18599
+ },
+ {
+ "epoch": 50.68119891008175,
+ "grad_norm": 5.507992744445801,
+ "learning_rate": 1.0265158556441543e-05,
+ "loss": 0.1203,
+ "step": 18600
+ },
+ {
+ "epoch": 50.68392370572207,
+ "grad_norm": 7.205935955047607,
+ "learning_rate": 1.0264276371065871e-05,
+ "loss": 0.1477,
+ "step": 18601
+ },
+ {
+ "epoch": 50.6866485013624,
+ "grad_norm": 6.18890380859375,
+ "learning_rate": 1.026339418363202e-05,
+ "loss": 0.1459,
+ "step": 18602
+ },
+ {
+ "epoch": 50.689373297002724,
+ "grad_norm": 7.717989444732666,
+ "learning_rate": 1.0262511994146862e-05,
+ "loss": 0.1926,
+ "step": 18603
+ },
+ {
+ "epoch": 50.69209809264305,
+ "grad_norm": 5.477873802185059,
+ "learning_rate": 1.026162980261727e-05,
+ "loss": 0.2208,
+ "step": 18604
+ },
+ {
+ "epoch": 50.694822888283376,
+ "grad_norm": 5.5274271965026855,
+ "learning_rate": 1.0260747609050115e-05,
+ "loss": 0.0972,
+ "step": 18605
+ },
+ {
+ "epoch": 50.69754768392371,
+ "grad_norm": 5.3758673667907715,
+ "learning_rate": 1.0259865413452266e-05,
+ "loss": 0.1111,
+ "step": 18606
+ },
+ {
+ "epoch": 50.700272479564035,
+ "grad_norm": 5.199080467224121,
+ "learning_rate": 1.0258983215830591e-05,
+ "loss": 0.189,
+ "step": 18607
+ },
+ {
+ "epoch": 50.70299727520436,
+ "grad_norm": 7.787143230438232,
+ "learning_rate": 1.0258101016191963e-05,
+ "loss": 0.3012,
+ "step": 18608
+ },
+ {
+ "epoch": 50.705722070844686,
+ "grad_norm": 4.525249004364014,
+ "learning_rate": 1.0257218814543257e-05,
+ "loss": 0.1977,
+ "step": 18609
+ },
+ {
+ "epoch": 50.70844686648501,
+ "grad_norm": 4.9005913734436035,
+ "learning_rate": 1.0256336610891336e-05,
+ "loss": 0.0966,
+ "step": 18610
+ },
+ {
+ "epoch": 50.71117166212534,
+ "grad_norm": 4.556335926055908,
+ "learning_rate": 1.0255454405243076e-05,
+ "loss": 0.1,
+ "step": 18611
+ },
+ {
+ "epoch": 50.71389645776567,
+ "grad_norm": 7.69804048538208,
+ "learning_rate": 1.0254572197605341e-05,
+ "loss": 0.1512,
+ "step": 18612
+ },
+ {
+ "epoch": 50.716621253406,
+ "grad_norm": 8.30517578125,
+ "learning_rate": 1.0253689987985008e-05,
+ "loss": 0.0957,
+ "step": 18613
+ },
+ {
+ "epoch": 50.71934604904632,
+ "grad_norm": 6.534460067749023,
+ "learning_rate": 1.0252807776388946e-05,
+ "loss": 0.1291,
+ "step": 18614
+ },
+ {
+ "epoch": 50.72207084468665,
+ "grad_norm": 5.42502498626709,
+ "learning_rate": 1.0251925562824026e-05,
+ "loss": 0.1425,
+ "step": 18615
+ },
+ {
+ "epoch": 50.724795640326974,
+ "grad_norm": 4.998002052307129,
+ "learning_rate": 1.0251043347297118e-05,
+ "loss": 0.0969,
+ "step": 18616
+ },
+ {
+ "epoch": 50.7275204359673,
+ "grad_norm": 9.392294883728027,
+ "learning_rate": 1.0250161129815091e-05,
+ "loss": 0.1188,
+ "step": 18617
+ },
+ {
+ "epoch": 50.73024523160763,
+ "grad_norm": 6.346102714538574,
+ "learning_rate": 1.0249278910384817e-05,
+ "loss": 0.213,
+ "step": 18618
+ },
+ {
+ "epoch": 50.73297002724796,
+ "grad_norm": 4.94590950012207,
+ "learning_rate": 1.0248396689013166e-05,
+ "loss": 0.1149,
+ "step": 18619
+ },
+ {
+ "epoch": 50.735694822888284,
+ "grad_norm": 5.284358501434326,
+ "learning_rate": 1.0247514465707012e-05,
+ "loss": 0.0735,
+ "step": 18620
+ },
+ {
+ "epoch": 50.73841961852861,
+ "grad_norm": 11.247912406921387,
+ "learning_rate": 1.024663224047322e-05,
+ "loss": 0.1569,
+ "step": 18621
+ },
+ {
+ "epoch": 50.741144414168936,
+ "grad_norm": 5.320253849029541,
+ "learning_rate": 1.0245750013318669e-05,
+ "loss": 0.1623,
+ "step": 18622
+ },
+ {
+ "epoch": 50.74386920980926,
+ "grad_norm": 6.120570659637451,
+ "learning_rate": 1.024486778425022e-05,
+ "loss": 0.2398,
+ "step": 18623
+ },
+ {
+ "epoch": 50.746594005449595,
+ "grad_norm": 5.824092388153076,
+ "learning_rate": 1.0243985553274753e-05,
+ "loss": 0.1296,
+ "step": 18624
+ },
+ {
+ "epoch": 50.74931880108992,
+ "grad_norm": 6.964953422546387,
+ "learning_rate": 1.024310332039913e-05,
+ "loss": 0.1353,
+ "step": 18625
+ },
+ {
+ "epoch": 50.752043596730246,
+ "grad_norm": 7.604491710662842,
+ "learning_rate": 1.024222108563023e-05,
+ "loss": 0.1786,
+ "step": 18626
+ },
+ {
+ "epoch": 50.75476839237057,
+ "grad_norm": 6.910664081573486,
+ "learning_rate": 1.0241338848974918e-05,
+ "loss": 0.2086,
+ "step": 18627
+ },
+ {
+ "epoch": 50.7574931880109,
+ "grad_norm": 5.907593727111816,
+ "learning_rate": 1.0240456610440068e-05,
+ "loss": 0.3074,
+ "step": 18628
+ },
+ {
+ "epoch": 50.76021798365122,
+ "grad_norm": 5.974182605743408,
+ "learning_rate": 1.0239574370032548e-05,
+ "loss": 0.1979,
+ "step": 18629
+ },
+ {
+ "epoch": 50.762942779291556,
+ "grad_norm": 5.4504289627075195,
+ "learning_rate": 1.0238692127759232e-05,
+ "loss": 0.1797,
+ "step": 18630
+ },
+ {
+ "epoch": 50.76566757493188,
+ "grad_norm": 14.588968276977539,
+ "learning_rate": 1.0237809883626986e-05,
+ "loss": 0.149,
+ "step": 18631
+ },
+ {
+ "epoch": 50.76839237057221,
+ "grad_norm": 15.98033332824707,
+ "learning_rate": 1.0236927637642688e-05,
+ "loss": 0.238,
+ "step": 18632
+ },
+ {
+ "epoch": 50.771117166212534,
+ "grad_norm": 4.419747829437256,
+ "learning_rate": 1.0236045389813203e-05,
+ "loss": 0.2188,
+ "step": 18633
+ },
+ {
+ "epoch": 50.77384196185286,
+ "grad_norm": 6.706301689147949,
+ "learning_rate": 1.0235163140145408e-05,
+ "loss": 0.3224,
+ "step": 18634
+ },
+ {
+ "epoch": 50.776566757493185,
+ "grad_norm": 6.188803672790527,
+ "learning_rate": 1.0234280888646166e-05,
+ "loss": 0.0994,
+ "step": 18635
+ },
+ {
+ "epoch": 50.77929155313352,
+ "grad_norm": 7.780112266540527,
+ "learning_rate": 1.0233398635322353e-05,
+ "loss": 0.1531,
+ "step": 18636
+ },
+ {
+ "epoch": 50.782016348773844,
+ "grad_norm": 5.561610698699951,
+ "learning_rate": 1.023251638018084e-05,
+ "loss": 0.1296,
+ "step": 18637
+ },
+ {
+ "epoch": 50.78474114441417,
+ "grad_norm": 4.837251663208008,
+ "learning_rate": 1.0231634123228498e-05,
+ "loss": 0.0933,
+ "step": 18638
+ },
+ {
+ "epoch": 50.787465940054496,
+ "grad_norm": 3.9444570541381836,
+ "learning_rate": 1.023075186447219e-05,
+ "loss": 0.1079,
+ "step": 18639
+ },
+ {
+ "epoch": 50.79019073569482,
+ "grad_norm": 6.445371627807617,
+ "learning_rate": 1.0229869603918801e-05,
+ "loss": 0.2153,
+ "step": 18640
+ },
+ {
+ "epoch": 50.79291553133515,
+ "grad_norm": 6.34771203994751,
+ "learning_rate": 1.0228987341575192e-05,
+ "loss": 0.1475,
+ "step": 18641
+ },
+ {
+ "epoch": 50.79564032697548,
+ "grad_norm": 8.866080284118652,
+ "learning_rate": 1.0228105077448239e-05,
+ "loss": 0.1518,
+ "step": 18642
+ },
+ {
+ "epoch": 50.798365122615806,
+ "grad_norm": 5.695035457611084,
+ "learning_rate": 1.0227222811544807e-05,
+ "loss": 0.1191,
+ "step": 18643
+ },
+ {
+ "epoch": 50.80108991825613,
+ "grad_norm": 5.830082416534424,
+ "learning_rate": 1.0226340543871778e-05,
+ "loss": 0.2573,
+ "step": 18644
+ },
+ {
+ "epoch": 50.80381471389646,
+ "grad_norm": 4.047380447387695,
+ "learning_rate": 1.0225458274436011e-05,
+ "loss": 0.1415,
+ "step": 18645
+ },
+ {
+ "epoch": 50.80653950953678,
+ "grad_norm": 7.31242561340332,
+ "learning_rate": 1.0224576003244385e-05,
+ "loss": 0.2494,
+ "step": 18646
+ },
+ {
+ "epoch": 50.80926430517711,
+ "grad_norm": 4.944585800170898,
+ "learning_rate": 1.0223693730303761e-05,
+ "loss": 0.2513,
+ "step": 18647
+ },
+ {
+ "epoch": 50.81198910081744,
+ "grad_norm": 4.9357733726501465,
+ "learning_rate": 1.0222811455621025e-05,
+ "loss": 0.392,
+ "step": 18648
+ },
+ {
+ "epoch": 50.81471389645777,
+ "grad_norm": 6.6110029220581055,
+ "learning_rate": 1.0221929179203038e-05,
+ "loss": 0.1249,
+ "step": 18649
+ },
+ {
+ "epoch": 50.817438692098094,
+ "grad_norm": 6.397737979888916,
+ "learning_rate": 1.0221046901056675e-05,
+ "loss": 0.1245,
+ "step": 18650
+ },
+ {
+ "epoch": 50.82016348773842,
+ "grad_norm": 5.183709144592285,
+ "learning_rate": 1.0220164621188804e-05,
+ "loss": 0.1974,
+ "step": 18651
+ },
+ {
+ "epoch": 50.822888283378745,
+ "grad_norm": 5.553018569946289,
+ "learning_rate": 1.02192823396063e-05,
+ "loss": 0.2481,
+ "step": 18652
+ },
+ {
+ "epoch": 50.82561307901907,
+ "grad_norm": 4.401885986328125,
+ "learning_rate": 1.0218400056316031e-05,
+ "loss": 0.1696,
+ "step": 18653
+ },
+ {
+ "epoch": 50.828337874659404,
+ "grad_norm": 3.9832563400268555,
+ "learning_rate": 1.0217517771324871e-05,
+ "loss": 0.3923,
+ "step": 18654
+ },
+ {
+ "epoch": 50.83106267029973,
+ "grad_norm": 4.639732837677002,
+ "learning_rate": 1.0216635484639688e-05,
+ "loss": 0.177,
+ "step": 18655
+ },
+ {
+ "epoch": 50.833787465940055,
+ "grad_norm": 4.781457901000977,
+ "learning_rate": 1.0215753196267352e-05,
+ "loss": 0.1861,
+ "step": 18656
+ },
+ {
+ "epoch": 50.83651226158038,
+ "grad_norm": 4.005565643310547,
+ "learning_rate": 1.021487090621474e-05,
+ "loss": 0.0803,
+ "step": 18657
+ },
+ {
+ "epoch": 50.83923705722071,
+ "grad_norm": 5.11945915222168,
+ "learning_rate": 1.0213988614488721e-05,
+ "loss": 0.1536,
+ "step": 18658
+ },
+ {
+ "epoch": 50.84196185286103,
+ "grad_norm": 4.560452938079834,
+ "learning_rate": 1.0213106321096164e-05,
+ "loss": 0.2326,
+ "step": 18659
+ },
+ {
+ "epoch": 50.844686648501366,
+ "grad_norm": 6.021965026855469,
+ "learning_rate": 1.0212224026043945e-05,
+ "loss": 0.1181,
+ "step": 18660
+ },
+ {
+ "epoch": 50.84741144414169,
+ "grad_norm": 3.8789072036743164,
+ "learning_rate": 1.0211341729338928e-05,
+ "loss": 0.1204,
+ "step": 18661
+ },
+ {
+ "epoch": 50.85013623978202,
+ "grad_norm": 5.305844783782959,
+ "learning_rate": 1.0210459430987993e-05,
+ "loss": 0.1091,
+ "step": 18662
+ },
+ {
+ "epoch": 50.85286103542234,
+ "grad_norm": 4.129421234130859,
+ "learning_rate": 1.0209577130998002e-05,
+ "loss": 0.1939,
+ "step": 18663
+ },
+ {
+ "epoch": 50.85558583106267,
+ "grad_norm": 5.56313943862915,
+ "learning_rate": 1.0208694829375834e-05,
+ "loss": 0.1791,
+ "step": 18664
+ },
+ {
+ "epoch": 50.858310626702995,
+ "grad_norm": 4.692027568817139,
+ "learning_rate": 1.0207812526128356e-05,
+ "loss": 0.1208,
+ "step": 18665
+ },
+ {
+ "epoch": 50.86103542234333,
+ "grad_norm": 5.1737961769104,
+ "learning_rate": 1.020693022126244e-05,
+ "loss": 0.1212,
+ "step": 18666
+ },
+ {
+ "epoch": 50.86376021798365,
+ "grad_norm": 6.0052361488342285,
+ "learning_rate": 1.020604791478496e-05,
+ "loss": 0.2019,
+ "step": 18667
+ },
+ {
+ "epoch": 50.86648501362398,
+ "grad_norm": 5.494925498962402,
+ "learning_rate": 1.0205165606702784e-05,
+ "loss": 0.2635,
+ "step": 18668
+ },
+ {
+ "epoch": 50.869209809264305,
+ "grad_norm": 7.216293811798096,
+ "learning_rate": 1.0204283297022786e-05,
+ "loss": 0.1622,
+ "step": 18669
+ },
+ {
+ "epoch": 50.87193460490463,
+ "grad_norm": 5.883440017700195,
+ "learning_rate": 1.0203400985751838e-05,
+ "loss": 0.292,
+ "step": 18670
+ },
+ {
+ "epoch": 50.87465940054496,
+ "grad_norm": 5.328831195831299,
+ "learning_rate": 1.0202518672896806e-05,
+ "loss": 0.1097,
+ "step": 18671
+ },
+ {
+ "epoch": 50.87738419618529,
+ "grad_norm": 5.100024223327637,
+ "learning_rate": 1.0201636358464568e-05,
+ "loss": 0.276,
+ "step": 18672
+ },
+ {
+ "epoch": 50.880108991825615,
+ "grad_norm": 3.971789598464966,
+ "learning_rate": 1.0200754042461988e-05,
+ "loss": 0.1783,
+ "step": 18673
+ },
+ {
+ "epoch": 50.88283378746594,
+ "grad_norm": 4.622824668884277,
+ "learning_rate": 1.0199871724895947e-05,
+ "loss": 0.153,
+ "step": 18674
+ },
+ {
+ "epoch": 50.88555858310627,
+ "grad_norm": 24.071992874145508,
+ "learning_rate": 1.0198989405773307e-05,
+ "loss": 0.1639,
+ "step": 18675
+ },
+ {
+ "epoch": 50.88828337874659,
+ "grad_norm": 5.242025375366211,
+ "learning_rate": 1.019810708510095e-05,
+ "loss": 0.1633,
+ "step": 18676
+ },
+ {
+ "epoch": 50.89100817438692,
+ "grad_norm": 4.857852935791016,
+ "learning_rate": 1.0197224762885735e-05,
+ "loss": 0.1911,
+ "step": 18677
+ },
+ {
+ "epoch": 50.89373297002725,
+ "grad_norm": 5.67581844329834,
+ "learning_rate": 1.0196342439134546e-05,
+ "loss": 0.3513,
+ "step": 18678
+ },
+ {
+ "epoch": 50.89645776566758,
+ "grad_norm": 6.3713274002075195,
+ "learning_rate": 1.0195460113854243e-05,
+ "loss": 0.1237,
+ "step": 18679
+ },
+ {
+ "epoch": 50.8991825613079,
+ "grad_norm": 5.207911491394043,
+ "learning_rate": 1.0194577787051708e-05,
+ "loss": 0.1406,
+ "step": 18680
+ },
+ {
+ "epoch": 50.90190735694823,
+ "grad_norm": 8.377357482910156,
+ "learning_rate": 1.0193695458733803e-05,
+ "loss": 0.1182,
+ "step": 18681
+ },
+ {
+ "epoch": 50.904632152588555,
+ "grad_norm": 4.9795708656311035,
+ "learning_rate": 1.0192813128907404e-05,
+ "loss": 0.3101,
+ "step": 18682
+ },
+ {
+ "epoch": 50.90735694822888,
+ "grad_norm": 6.144087314605713,
+ "learning_rate": 1.0191930797579386e-05,
+ "loss": 0.148,
+ "step": 18683
+ },
+ {
+ "epoch": 50.91008174386921,
+ "grad_norm": 5.1268439292907715,
+ "learning_rate": 1.0191048464756615e-05,
+ "loss": 0.1114,
+ "step": 18684
+ },
+ {
+ "epoch": 50.91280653950954,
+ "grad_norm": 4.573668479919434,
+ "learning_rate": 1.0190166130445964e-05,
+ "loss": 0.0848,
+ "step": 18685
+ },
+ {
+ "epoch": 50.915531335149865,
+ "grad_norm": 4.333711624145508,
+ "learning_rate": 1.0189283794654308e-05,
+ "loss": 0.1864,
+ "step": 18686
+ },
+ {
+ "epoch": 50.91825613079019,
+ "grad_norm": 6.886716842651367,
+ "learning_rate": 1.0188401457388513e-05,
+ "loss": 0.1345,
+ "step": 18687
+ },
+ {
+ "epoch": 50.920980926430516,
+ "grad_norm": 4.428810119628906,
+ "learning_rate": 1.0187519118655456e-05,
+ "loss": 0.1554,
+ "step": 18688
+ },
+ {
+ "epoch": 50.92370572207084,
+ "grad_norm": 4.6712141036987305,
+ "learning_rate": 1.0186636778462002e-05,
+ "loss": 0.0946,
+ "step": 18689
+ },
+ {
+ "epoch": 50.926430517711175,
+ "grad_norm": 5.9868035316467285,
+ "learning_rate": 1.0185754436815029e-05,
+ "loss": 0.135,
+ "step": 18690
+ },
+ {
+ "epoch": 50.9291553133515,
+ "grad_norm": 5.404600620269775,
+ "learning_rate": 1.018487209372141e-05,
+ "loss": 0.2366,
+ "step": 18691
+ },
+ {
+ "epoch": 50.93188010899183,
+ "grad_norm": 8.686942100524902,
+ "learning_rate": 1.0183989749188009e-05,
+ "loss": 0.1878,
+ "step": 18692
+ },
+ {
+ "epoch": 50.93460490463215,
+ "grad_norm": 9.665703773498535,
+ "learning_rate": 1.0183107403221703e-05,
+ "loss": 0.151,
+ "step": 18693
+ },
+ {
+ "epoch": 50.93732970027248,
+ "grad_norm": 5.4269890785217285,
+ "learning_rate": 1.0182225055829362e-05,
+ "loss": 0.2427,
+ "step": 18694
+ },
+ {
+ "epoch": 50.940054495912804,
+ "grad_norm": 52.33797073364258,
+ "learning_rate": 1.0181342707017859e-05,
+ "loss": 0.0847,
+ "step": 18695
+ },
+ {
+ "epoch": 50.94277929155314,
+ "grad_norm": 6.4972310066223145,
+ "learning_rate": 1.0180460356794065e-05,
+ "loss": 0.2136,
+ "step": 18696
+ },
+ {
+ "epoch": 50.94550408719346,
+ "grad_norm": 9.618993759155273,
+ "learning_rate": 1.017957800516485e-05,
+ "loss": 0.2531,
+ "step": 18697
+ },
+ {
+ "epoch": 50.94822888283379,
+ "grad_norm": 8.187857627868652,
+ "learning_rate": 1.0178695652137088e-05,
+ "loss": 0.2706,
+ "step": 18698
+ },
+ {
+ "epoch": 50.950953678474114,
+ "grad_norm": 6.918089866638184,
+ "learning_rate": 1.0177813297717649e-05,
+ "loss": 0.1428,
+ "step": 18699
+ },
+ {
+ "epoch": 50.95367847411444,
+ "grad_norm": 6.106166839599609,
+ "learning_rate": 1.0176930941913405e-05,
+ "loss": 0.2265,
+ "step": 18700
+ },
+ {
+ "epoch": 50.956403269754766,
+ "grad_norm": 5.025012016296387,
+ "learning_rate": 1.0176048584731233e-05,
+ "loss": 0.1294,
+ "step": 18701
+ },
+ {
+ "epoch": 50.95912806539509,
+ "grad_norm": 5.337967395782471,
+ "learning_rate": 1.0175166226177998e-05,
+ "loss": 0.1372,
+ "step": 18702
+ },
+ {
+ "epoch": 50.961852861035425,
+ "grad_norm": 4.797581195831299,
+ "learning_rate": 1.0174283866260575e-05,
+ "loss": 0.1651,
+ "step": 18703
+ },
+ {
+ "epoch": 50.96457765667575,
+ "grad_norm": 5.887904167175293,
+ "learning_rate": 1.0173401504985831e-05,
+ "loss": 0.2833,
+ "step": 18704
+ },
+ {
+ "epoch": 50.967302452316076,
+ "grad_norm": 6.55267333984375,
+ "learning_rate": 1.0172519142360646e-05,
+ "loss": 0.1519,
+ "step": 18705
+ },
+ {
+ "epoch": 50.9700272479564,
+ "grad_norm": 6.467425346374512,
+ "learning_rate": 1.0171636778391885e-05,
+ "loss": 0.1798,
+ "step": 18706
+ },
+ {
+ "epoch": 50.97275204359673,
+ "grad_norm": 5.7684526443481445,
+ "learning_rate": 1.0170754413086422e-05,
+ "loss": 0.1561,
+ "step": 18707
+ },
+ {
+ "epoch": 50.97547683923706,
+ "grad_norm": 11.755709648132324,
+ "learning_rate": 1.016987204645113e-05,
+ "loss": 0.2787,
+ "step": 18708
+ },
+ {
+ "epoch": 50.97820163487739,
+ "grad_norm": 5.804837703704834,
+ "learning_rate": 1.016898967849288e-05,
+ "loss": 0.1966,
+ "step": 18709
+ },
+ {
+ "epoch": 50.98092643051771,
+ "grad_norm": 4.074558258056641,
+ "learning_rate": 1.0168107309218545e-05,
+ "loss": 0.1037,
+ "step": 18710
+ },
+ {
+ "epoch": 50.98365122615804,
+ "grad_norm": 6.014253616333008,
+ "learning_rate": 1.0167224938634994e-05,
+ "loss": 0.22,
+ "step": 18711
+ },
+ {
+ "epoch": 50.986376021798364,
+ "grad_norm": 5.788711071014404,
+ "learning_rate": 1.01663425667491e-05,
+ "loss": 0.2037,
+ "step": 18712
+ },
+ {
+ "epoch": 50.98910081743869,
+ "grad_norm": 5.540937900543213,
+ "learning_rate": 1.016546019356774e-05,
+ "loss": 0.1178,
+ "step": 18713
+ },
+ {
+ "epoch": 50.991825613079016,
+ "grad_norm": 6.734719753265381,
+ "learning_rate": 1.0164577819097777e-05,
+ "loss": 0.2364,
+ "step": 18714
+ },
+ {
+ "epoch": 50.99455040871935,
+ "grad_norm": 7.610739231109619,
+ "learning_rate": 1.016369544334609e-05,
+ "loss": 0.1228,
+ "step": 18715
+ },
+ {
+ "epoch": 50.997275204359674,
+ "grad_norm": 5.655003070831299,
+ "learning_rate": 1.0162813066319542e-05,
+ "loss": 0.1497,
+ "step": 18716
+ },
+ {
+ "epoch": 51.0,
+ "grad_norm": 5.585046768188477,
+ "learning_rate": 1.0161930688025018e-05,
+ "loss": 0.1662,
+ "step": 18717
+ },
+ {
+ "epoch": 51.002724795640326,
+ "grad_norm": 11.332860946655273,
+ "learning_rate": 1.0161048308469378e-05,
+ "loss": 0.2005,
+ "step": 18718
+ },
+ {
+ "epoch": 51.00544959128065,
+ "grad_norm": 17.428442001342773,
+ "learning_rate": 1.0160165927659502e-05,
+ "loss": 0.1392,
+ "step": 18719
+ },
+ {
+ "epoch": 51.00817438692098,
+ "grad_norm": 5.3399658203125,
+ "learning_rate": 1.015928354560226e-05,
+ "loss": 0.2174,
+ "step": 18720
+ },
+ {
+ "epoch": 51.01089918256131,
+ "grad_norm": 4.200045585632324,
+ "learning_rate": 1.0158401162304522e-05,
+ "loss": 0.3348,
+ "step": 18721
+ },
+ {
+ "epoch": 51.013623978201636,
+ "grad_norm": 4.7197675704956055,
+ "learning_rate": 1.0157518777773159e-05,
+ "loss": 0.0845,
+ "step": 18722
+ },
+ {
+ "epoch": 51.01634877384196,
+ "grad_norm": 5.308382511138916,
+ "learning_rate": 1.0156636392015046e-05,
+ "loss": 0.2566,
+ "step": 18723
+ },
+ {
+ "epoch": 51.01907356948229,
+ "grad_norm": 4.911110877990723,
+ "learning_rate": 1.0155754005037054e-05,
+ "loss": 0.1306,
+ "step": 18724
+ },
+ {
+ "epoch": 51.02179836512261,
+ "grad_norm": 6.263029098510742,
+ "learning_rate": 1.015487161684605e-05,
+ "loss": 0.2966,
+ "step": 18725
+ },
+ {
+ "epoch": 51.02452316076294,
+ "grad_norm": 4.92348051071167,
+ "learning_rate": 1.0153989227448917e-05,
+ "loss": 0.1635,
+ "step": 18726
+ },
+ {
+ "epoch": 51.02724795640327,
+ "grad_norm": 5.831380844116211,
+ "learning_rate": 1.015310683685252e-05,
+ "loss": 0.0931,
+ "step": 18727
+ },
+ {
+ "epoch": 51.0299727520436,
+ "grad_norm": 12.072651863098145,
+ "learning_rate": 1.015222444506373e-05,
+ "loss": 0.1893,
+ "step": 18728
+ },
+ {
+ "epoch": 51.032697547683924,
+ "grad_norm": 11.225703239440918,
+ "learning_rate": 1.0151342052089423e-05,
+ "loss": 0.2093,
+ "step": 18729
+ },
+ {
+ "epoch": 51.03542234332425,
+ "grad_norm": 7.203643798828125,
+ "learning_rate": 1.0150459657936469e-05,
+ "loss": 0.1521,
+ "step": 18730
+ },
+ {
+ "epoch": 51.038147138964575,
+ "grad_norm": 5.221952438354492,
+ "learning_rate": 1.0149577262611739e-05,
+ "loss": 0.117,
+ "step": 18731
+ },
+ {
+ "epoch": 51.0408719346049,
+ "grad_norm": 4.445789337158203,
+ "learning_rate": 1.0148694866122107e-05,
+ "loss": 0.1751,
+ "step": 18732
+ },
+ {
+ "epoch": 51.043596730245234,
+ "grad_norm": 6.010112285614014,
+ "learning_rate": 1.014781246847444e-05,
+ "loss": 0.1888,
+ "step": 18733
+ },
+ {
+ "epoch": 51.04632152588556,
+ "grad_norm": 4.826539039611816,
+ "learning_rate": 1.0146930069675617e-05,
+ "loss": 0.0933,
+ "step": 18734
+ },
+ {
+ "epoch": 51.049046321525886,
+ "grad_norm": 4.85269021987915,
+ "learning_rate": 1.014604766973251e-05,
+ "loss": 0.0985,
+ "step": 18735
+ },
+ {
+ "epoch": 51.05177111716621,
+ "grad_norm": 6.659588813781738,
+ "learning_rate": 1.0145165268651985e-05,
+ "loss": 0.1496,
+ "step": 18736
+ },
+ {
+ "epoch": 51.05449591280654,
+ "grad_norm": 4.729734420776367,
+ "learning_rate": 1.014428286644092e-05,
+ "loss": 0.1488,
+ "step": 18737
+ },
+ {
+ "epoch": 51.05722070844686,
+ "grad_norm": 5.822243690490723,
+ "learning_rate": 1.0143400463106184e-05,
+ "loss": 0.1028,
+ "step": 18738
+ },
+ {
+ "epoch": 51.059945504087196,
+ "grad_norm": 5.308828830718994,
+ "learning_rate": 1.0142518058654649e-05,
+ "loss": 0.0896,
+ "step": 18739
+ },
+ {
+ "epoch": 51.06267029972752,
+ "grad_norm": 5.010536193847656,
+ "learning_rate": 1.0141635653093187e-05,
+ "loss": 0.1237,
+ "step": 18740
+ },
+ {
+ "epoch": 51.06539509536785,
+ "grad_norm": 5.888706684112549,
+ "learning_rate": 1.0140753246428674e-05,
+ "loss": 0.1296,
+ "step": 18741
+ },
+ {
+ "epoch": 51.06811989100817,
+ "grad_norm": 40.01289749145508,
+ "learning_rate": 1.0139870838667976e-05,
+ "loss": 0.2059,
+ "step": 18742
+ },
+ {
+ "epoch": 51.0708446866485,
+ "grad_norm": 4.776760578155518,
+ "learning_rate": 1.0138988429817971e-05,
+ "loss": 0.1722,
+ "step": 18743
+ },
+ {
+ "epoch": 51.073569482288825,
+ "grad_norm": 9.24162483215332,
+ "learning_rate": 1.0138106019885525e-05,
+ "loss": 0.185,
+ "step": 18744
+ },
+ {
+ "epoch": 51.07629427792916,
+ "grad_norm": 4.977770805358887,
+ "learning_rate": 1.0137223608877518e-05,
+ "loss": 0.2341,
+ "step": 18745
+ },
+ {
+ "epoch": 51.079019073569484,
+ "grad_norm": 6.066573619842529,
+ "learning_rate": 1.0136341196800816e-05,
+ "loss": 0.1852,
+ "step": 18746
+ },
+ {
+ "epoch": 51.08174386920981,
+ "grad_norm": 5.879281997680664,
+ "learning_rate": 1.0135458783662296e-05,
+ "loss": 0.143,
+ "step": 18747
+ },
+ {
+ "epoch": 51.084468664850135,
+ "grad_norm": 4.567464828491211,
+ "learning_rate": 1.0134576369468823e-05,
+ "loss": 0.0869,
+ "step": 18748
+ },
+ {
+ "epoch": 51.08719346049046,
+ "grad_norm": 7.318799018859863,
+ "learning_rate": 1.0133693954227278e-05,
+ "loss": 0.1819,
+ "step": 18749
+ },
+ {
+ "epoch": 51.08991825613079,
+ "grad_norm": 9.434854507446289,
+ "learning_rate": 1.0132811537944522e-05,
+ "loss": 0.1568,
+ "step": 18750
+ },
+ {
+ "epoch": 51.09264305177112,
+ "grad_norm": 4.460082054138184,
+ "learning_rate": 1.0131929120627439e-05,
+ "loss": 0.1595,
+ "step": 18751
+ },
+ {
+ "epoch": 51.095367847411445,
+ "grad_norm": 4.987976551055908,
+ "learning_rate": 1.0131046702282893e-05,
+ "loss": 0.086,
+ "step": 18752
+ },
+ {
+ "epoch": 51.09809264305177,
+ "grad_norm": 4.004764556884766,
+ "learning_rate": 1.0130164282917764e-05,
+ "loss": 0.2204,
+ "step": 18753
+ },
+ {
+ "epoch": 51.1008174386921,
+ "grad_norm": 5.967334747314453,
+ "learning_rate": 1.0129281862538918e-05,
+ "loss": 0.2305,
+ "step": 18754
+ },
+ {
+ "epoch": 51.10354223433242,
+ "grad_norm": 4.764896392822266,
+ "learning_rate": 1.012839944115323e-05,
+ "loss": 0.129,
+ "step": 18755
+ },
+ {
+ "epoch": 51.10626702997275,
+ "grad_norm": 7.496785640716553,
+ "learning_rate": 1.0127517018767569e-05,
+ "loss": 0.0907,
+ "step": 18756
+ },
+ {
+ "epoch": 51.10899182561308,
+ "grad_norm": 3.6667022705078125,
+ "learning_rate": 1.0126634595388812e-05,
+ "loss": 0.1383,
+ "step": 18757
+ },
+ {
+ "epoch": 51.11171662125341,
+ "grad_norm": 10.265843391418457,
+ "learning_rate": 1.0125752171023825e-05,
+ "loss": 0.2072,
+ "step": 18758
+ },
+ {
+ "epoch": 51.11444141689373,
+ "grad_norm": 5.989264011383057,
+ "learning_rate": 1.0124869745679486e-05,
+ "loss": 0.1543,
+ "step": 18759
+ },
+ {
+ "epoch": 51.11716621253406,
+ "grad_norm": 8.33877944946289,
+ "learning_rate": 1.0123987319362668e-05,
+ "loss": 0.1829,
+ "step": 18760
+ },
+ {
+ "epoch": 51.119891008174385,
+ "grad_norm": 5.455020427703857,
+ "learning_rate": 1.0123104892080237e-05,
+ "loss": 0.1301,
+ "step": 18761
+ },
+ {
+ "epoch": 51.12261580381471,
+ "grad_norm": 4.6251726150512695,
+ "learning_rate": 1.012222246383907e-05,
+ "loss": 0.1591,
+ "step": 18762
+ },
+ {
+ "epoch": 51.12534059945504,
+ "grad_norm": 5.778083324432373,
+ "learning_rate": 1.0121340034646041e-05,
+ "loss": 0.1534,
+ "step": 18763
+ },
+ {
+ "epoch": 51.12806539509537,
+ "grad_norm": 6.038066864013672,
+ "learning_rate": 1.0120457604508019e-05,
+ "loss": 0.1822,
+ "step": 18764
+ },
+ {
+ "epoch": 51.130790190735695,
+ "grad_norm": 6.604792594909668,
+ "learning_rate": 1.0119575173431877e-05,
+ "loss": 0.1728,
+ "step": 18765
+ },
+ {
+ "epoch": 51.13351498637602,
+ "grad_norm": 6.406408309936523,
+ "learning_rate": 1.0118692741424485e-05,
+ "loss": 0.1196,
+ "step": 18766
+ },
+ {
+ "epoch": 51.13623978201635,
+ "grad_norm": 6.284243583679199,
+ "learning_rate": 1.0117810308492719e-05,
+ "loss": 0.2791,
+ "step": 18767
+ },
+ {
+ "epoch": 51.13896457765667,
+ "grad_norm": 5.192579746246338,
+ "learning_rate": 1.011692787464345e-05,
+ "loss": 0.0937,
+ "step": 18768
+ },
+ {
+ "epoch": 51.141689373297005,
+ "grad_norm": 5.316946029663086,
+ "learning_rate": 1.011604543988355e-05,
+ "loss": 0.0972,
+ "step": 18769
+ },
+ {
+ "epoch": 51.14441416893733,
+ "grad_norm": 4.363719940185547,
+ "learning_rate": 1.0115163004219894e-05,
+ "loss": 0.166,
+ "step": 18770
+ },
+ {
+ "epoch": 51.14713896457766,
+ "grad_norm": 5.205626010894775,
+ "learning_rate": 1.011428056765935e-05,
+ "loss": 0.1089,
+ "step": 18771
+ },
+ {
+ "epoch": 51.14986376021798,
+ "grad_norm": 6.125519275665283,
+ "learning_rate": 1.0113398130208791e-05,
+ "loss": 0.1815,
+ "step": 18772
+ },
+ {
+ "epoch": 51.15258855585831,
+ "grad_norm": 6.656401634216309,
+ "learning_rate": 1.0112515691875095e-05,
+ "loss": 0.1347,
+ "step": 18773
+ },
+ {
+ "epoch": 51.155313351498634,
+ "grad_norm": 5.416975021362305,
+ "learning_rate": 1.0111633252665129e-05,
+ "loss": 0.2934,
+ "step": 18774
+ },
+ {
+ "epoch": 51.15803814713897,
+ "grad_norm": 79.0899658203125,
+ "learning_rate": 1.0110750812585767e-05,
+ "loss": 0.2813,
+ "step": 18775
+ },
+ {
+ "epoch": 51.16076294277929,
+ "grad_norm": 5.5814642906188965,
+ "learning_rate": 1.010986837164388e-05,
+ "loss": 0.2162,
+ "step": 18776
+ },
+ {
+ "epoch": 51.16348773841962,
+ "grad_norm": 9.727604866027832,
+ "learning_rate": 1.0108985929846342e-05,
+ "loss": 0.1799,
+ "step": 18777
+ },
+ {
+ "epoch": 51.166212534059945,
+ "grad_norm": 6.37643575668335,
+ "learning_rate": 1.0108103487200028e-05,
+ "loss": 0.1972,
+ "step": 18778
+ },
+ {
+ "epoch": 51.16893732970027,
+ "grad_norm": 5.157503604888916,
+ "learning_rate": 1.0107221043711804e-05,
+ "loss": 0.1791,
+ "step": 18779
+ },
+ {
+ "epoch": 51.171662125340596,
+ "grad_norm": 5.511967658996582,
+ "learning_rate": 1.0106338599388548e-05,
+ "loss": 0.2906,
+ "step": 18780
+ },
+ {
+ "epoch": 51.17438692098093,
+ "grad_norm": 5.359907150268555,
+ "learning_rate": 1.010545615423713e-05,
+ "loss": 0.2688,
+ "step": 18781
+ },
+ {
+ "epoch": 51.177111716621255,
+ "grad_norm": 8.087959289550781,
+ "learning_rate": 1.010457370826442e-05,
+ "loss": 0.18,
+ "step": 18782
+ },
+ {
+ "epoch": 51.17983651226158,
+ "grad_norm": 5.236056804656982,
+ "learning_rate": 1.0103691261477297e-05,
+ "loss": 0.1554,
+ "step": 18783
+ },
+ {
+ "epoch": 51.182561307901906,
+ "grad_norm": 7.0774993896484375,
+ "learning_rate": 1.0102808813882627e-05,
+ "loss": 0.1399,
+ "step": 18784
+ },
+ {
+ "epoch": 51.18528610354223,
+ "grad_norm": 5.047219753265381,
+ "learning_rate": 1.0101926365487287e-05,
+ "loss": 0.1951,
+ "step": 18785
+ },
+ {
+ "epoch": 51.18801089918256,
+ "grad_norm": 19.370012283325195,
+ "learning_rate": 1.0101043916298148e-05,
+ "loss": 0.1911,
+ "step": 18786
+ },
+ {
+ "epoch": 51.19073569482289,
+ "grad_norm": 7.3546271324157715,
+ "learning_rate": 1.0100161466322082e-05,
+ "loss": 0.1905,
+ "step": 18787
+ },
+ {
+ "epoch": 51.19346049046322,
+ "grad_norm": 5.489282608032227,
+ "learning_rate": 1.0099279015565961e-05,
+ "loss": 0.161,
+ "step": 18788
+ },
+ {
+ "epoch": 51.19618528610354,
+ "grad_norm": 5.209650993347168,
+ "learning_rate": 1.0098396564036658e-05,
+ "loss": 0.1584,
+ "step": 18789
+ },
+ {
+ "epoch": 51.19891008174387,
+ "grad_norm": 6.183939456939697,
+ "learning_rate": 1.0097514111741048e-05,
+ "loss": 0.1404,
+ "step": 18790
+ },
+ {
+ "epoch": 51.201634877384194,
+ "grad_norm": 7.37171745300293,
+ "learning_rate": 1.0096631658686e-05,
+ "loss": 0.2906,
+ "step": 18791
+ },
+ {
+ "epoch": 51.20435967302452,
+ "grad_norm": 7.757916450500488,
+ "learning_rate": 1.009574920487839e-05,
+ "loss": 0.2218,
+ "step": 18792
+ },
+ {
+ "epoch": 51.20708446866485,
+ "grad_norm": 5.5463175773620605,
+ "learning_rate": 1.009486675032508e-05,
+ "loss": 0.1096,
+ "step": 18793
+ },
+ {
+ "epoch": 51.20980926430518,
+ "grad_norm": 6.708303928375244,
+ "learning_rate": 1.009398429503296e-05,
+ "loss": 0.1681,
+ "step": 18794
+ },
+ {
+ "epoch": 51.212534059945504,
+ "grad_norm": 9.129183769226074,
+ "learning_rate": 1.0093101839008888e-05,
+ "loss": 0.2122,
+ "step": 18795
+ },
+ {
+ "epoch": 51.21525885558583,
+ "grad_norm": 4.936119079589844,
+ "learning_rate": 1.0092219382259745e-05,
+ "loss": 0.2291,
+ "step": 18796
+ },
+ {
+ "epoch": 51.217983651226156,
+ "grad_norm": 6.745718479156494,
+ "learning_rate": 1.00913369247924e-05,
+ "loss": 0.1609,
+ "step": 18797
+ },
+ {
+ "epoch": 51.22070844686648,
+ "grad_norm": 8.815296173095703,
+ "learning_rate": 1.0090454466613724e-05,
+ "loss": 0.127,
+ "step": 18798
+ },
+ {
+ "epoch": 51.223433242506815,
+ "grad_norm": 5.680782318115234,
+ "learning_rate": 1.0089572007730593e-05,
+ "loss": 0.3213,
+ "step": 18799
+ },
+ {
+ "epoch": 51.22615803814714,
+ "grad_norm": 6.469271183013916,
+ "learning_rate": 1.0088689548149878e-05,
+ "loss": 0.1957,
+ "step": 18800
+ },
+ {
+ "epoch": 51.228882833787466,
+ "grad_norm": 6.46415901184082,
+ "learning_rate": 1.008780708787845e-05,
+ "loss": 0.1899,
+ "step": 18801
+ },
+ {
+ "epoch": 51.23160762942779,
+ "grad_norm": 6.101480484008789,
+ "learning_rate": 1.0086924626923185e-05,
+ "loss": 0.187,
+ "step": 18802
+ },
+ {
+ "epoch": 51.23433242506812,
+ "grad_norm": 4.842905044555664,
+ "learning_rate": 1.0086042165290952e-05,
+ "loss": 0.1832,
+ "step": 18803
+ },
+ {
+ "epoch": 51.237057220708444,
+ "grad_norm": 4.603719711303711,
+ "learning_rate": 1.0085159702988627e-05,
+ "loss": 0.2,
+ "step": 18804
+ },
+ {
+ "epoch": 51.23978201634878,
+ "grad_norm": 4.809569358825684,
+ "learning_rate": 1.0084277240023082e-05,
+ "loss": 0.1505,
+ "step": 18805
+ },
+ {
+ "epoch": 51.2425068119891,
+ "grad_norm": 4.232131004333496,
+ "learning_rate": 1.0083394776401188e-05,
+ "loss": 0.1742,
+ "step": 18806
+ },
+ {
+ "epoch": 51.24523160762943,
+ "grad_norm": 4.67697811126709,
+ "learning_rate": 1.0082512312129815e-05,
+ "loss": 0.2456,
+ "step": 18807
+ },
+ {
+ "epoch": 51.247956403269754,
+ "grad_norm": 4.75968599319458,
+ "learning_rate": 1.0081629847215843e-05,
+ "loss": 0.0844,
+ "step": 18808
+ },
+ {
+ "epoch": 51.25068119891008,
+ "grad_norm": 4.272505760192871,
+ "learning_rate": 1.0080747381666138e-05,
+ "loss": 0.1488,
+ "step": 18809
+ },
+ {
+ "epoch": 51.253405994550405,
+ "grad_norm": 5.496559143066406,
+ "learning_rate": 1.0079864915487576e-05,
+ "loss": 0.1714,
+ "step": 18810
+ },
+ {
+ "epoch": 51.25613079019074,
+ "grad_norm": 4.785799026489258,
+ "learning_rate": 1.0078982448687027e-05,
+ "loss": 0.1613,
+ "step": 18811
+ },
+ {
+ "epoch": 51.258855585831064,
+ "grad_norm": 6.205319881439209,
+ "learning_rate": 1.0078099981271367e-05,
+ "loss": 0.3415,
+ "step": 18812
+ },
+ {
+ "epoch": 51.26158038147139,
+ "grad_norm": 8.09691333770752,
+ "learning_rate": 1.0077217513247465e-05,
+ "loss": 0.1214,
+ "step": 18813
+ },
+ {
+ "epoch": 51.264305177111716,
+ "grad_norm": 5.109775543212891,
+ "learning_rate": 1.0076335044622198e-05,
+ "loss": 0.1111,
+ "step": 18814
+ },
+ {
+ "epoch": 51.26702997275204,
+ "grad_norm": 7.009300708770752,
+ "learning_rate": 1.0075452575402433e-05,
+ "loss": 0.1186,
+ "step": 18815
+ },
+ {
+ "epoch": 51.26975476839237,
+ "grad_norm": 6.143910884857178,
+ "learning_rate": 1.007457010559505e-05,
+ "loss": 0.1601,
+ "step": 18816
+ },
+ {
+ "epoch": 51.2724795640327,
+ "grad_norm": 10.16909408569336,
+ "learning_rate": 1.0073687635206915e-05,
+ "loss": 0.2043,
+ "step": 18817
+ },
+ {
+ "epoch": 51.275204359673026,
+ "grad_norm": 4.602548122406006,
+ "learning_rate": 1.0072805164244903e-05,
+ "loss": 0.1435,
+ "step": 18818
+ },
+ {
+ "epoch": 51.27792915531335,
+ "grad_norm": 8.02277660369873,
+ "learning_rate": 1.0071922692715885e-05,
+ "loss": 0.1631,
+ "step": 18819
+ },
+ {
+ "epoch": 51.28065395095368,
+ "grad_norm": 5.542445182800293,
+ "learning_rate": 1.0071040220626738e-05,
+ "loss": 0.1126,
+ "step": 18820
+ },
+ {
+ "epoch": 51.283378746594,
+ "grad_norm": 51.237945556640625,
+ "learning_rate": 1.0070157747984331e-05,
+ "loss": 0.2363,
+ "step": 18821
+ },
+ {
+ "epoch": 51.28610354223433,
+ "grad_norm": 4.691830158233643,
+ "learning_rate": 1.006927527479554e-05,
+ "loss": 0.2623,
+ "step": 18822
+ },
+ {
+ "epoch": 51.28882833787466,
+ "grad_norm": 5.037574291229248,
+ "learning_rate": 1.0068392801067232e-05,
+ "loss": 0.1498,
+ "step": 18823
+ },
+ {
+ "epoch": 51.29155313351499,
+ "grad_norm": 7.60037088394165,
+ "learning_rate": 1.0067510326806284e-05,
+ "loss": 0.2092,
+ "step": 18824
+ },
+ {
+ "epoch": 51.294277929155314,
+ "grad_norm": 4.125919818878174,
+ "learning_rate": 1.0066627852019567e-05,
+ "loss": 0.2363,
+ "step": 18825
+ },
+ {
+ "epoch": 51.29700272479564,
+ "grad_norm": 4.860090255737305,
+ "learning_rate": 1.0065745376713958e-05,
+ "loss": 0.1537,
+ "step": 18826
+ },
+ {
+ "epoch": 51.299727520435965,
+ "grad_norm": 6.538519859313965,
+ "learning_rate": 1.0064862900896323e-05,
+ "loss": 0.153,
+ "step": 18827
+ },
+ {
+ "epoch": 51.30245231607629,
+ "grad_norm": 6.630890369415283,
+ "learning_rate": 1.0063980424573538e-05,
+ "loss": 0.1448,
+ "step": 18828
+ },
+ {
+ "epoch": 51.305177111716624,
+ "grad_norm": 4.957268238067627,
+ "learning_rate": 1.0063097947752477e-05,
+ "loss": 0.1503,
+ "step": 18829
+ },
+ {
+ "epoch": 51.30790190735695,
+ "grad_norm": 5.636377334594727,
+ "learning_rate": 1.0062215470440011e-05,
+ "loss": 0.1475,
+ "step": 18830
+ },
+ {
+ "epoch": 51.310626702997276,
+ "grad_norm": 7.311302185058594,
+ "learning_rate": 1.006133299264301e-05,
+ "loss": 0.1904,
+ "step": 18831
+ },
+ {
+ "epoch": 51.3133514986376,
+ "grad_norm": 10.37523365020752,
+ "learning_rate": 1.0060450514368355e-05,
+ "loss": 0.11,
+ "step": 18832
+ },
+ {
+ "epoch": 51.31607629427793,
+ "grad_norm": 4.774973392486572,
+ "learning_rate": 1.005956803562291e-05,
+ "loss": 0.1609,
+ "step": 18833
+ },
+ {
+ "epoch": 51.31880108991825,
+ "grad_norm": 5.141545295715332,
+ "learning_rate": 1.005868555641355e-05,
+ "loss": 0.1307,
+ "step": 18834
+ },
+ {
+ "epoch": 51.321525885558586,
+ "grad_norm": 5.759461402893066,
+ "learning_rate": 1.005780307674715e-05,
+ "loss": 0.4502,
+ "step": 18835
+ },
+ {
+ "epoch": 51.32425068119891,
+ "grad_norm": 5.119438648223877,
+ "learning_rate": 1.0056920596630582e-05,
+ "loss": 0.1453,
+ "step": 18836
+ },
+ {
+ "epoch": 51.32697547683924,
+ "grad_norm": 6.693476676940918,
+ "learning_rate": 1.0056038116070716e-05,
+ "loss": 0.1693,
+ "step": 18837
+ },
+ {
+ "epoch": 51.32970027247956,
+ "grad_norm": 6.895663261413574,
+ "learning_rate": 1.005515563507443e-05,
+ "loss": 0.1509,
+ "step": 18838
+ },
+ {
+ "epoch": 51.33242506811989,
+ "grad_norm": 11.935626983642578,
+ "learning_rate": 1.0054273153648591e-05,
+ "loss": 0.1915,
+ "step": 18839
+ },
+ {
+ "epoch": 51.335149863760215,
+ "grad_norm": 5.337900638580322,
+ "learning_rate": 1.005339067180008e-05,
+ "loss": 0.178,
+ "step": 18840
+ },
+ {
+ "epoch": 51.33787465940055,
+ "grad_norm": 5.646678447723389,
+ "learning_rate": 1.0052508189535758e-05,
+ "loss": 0.1078,
+ "step": 18841
+ },
+ {
+ "epoch": 51.34059945504087,
+ "grad_norm": 5.215188980102539,
+ "learning_rate": 1.0051625706862507e-05,
+ "loss": 0.101,
+ "step": 18842
+ },
+ {
+ "epoch": 51.3433242506812,
+ "grad_norm": 4.767889976501465,
+ "learning_rate": 1.0050743223787193e-05,
+ "loss": 0.1725,
+ "step": 18843
+ },
+ {
+ "epoch": 51.346049046321525,
+ "grad_norm": 6.254324436187744,
+ "learning_rate": 1.0049860740316697e-05,
+ "loss": 0.1405,
+ "step": 18844
+ },
+ {
+ "epoch": 51.34877384196185,
+ "grad_norm": 5.112353801727295,
+ "learning_rate": 1.0048978256457885e-05,
+ "loss": 0.1337,
+ "step": 18845
+ },
+ {
+ "epoch": 51.35149863760218,
+ "grad_norm": 4.851981163024902,
+ "learning_rate": 1.004809577221763e-05,
+ "loss": 0.1956,
+ "step": 18846
+ },
+ {
+ "epoch": 51.35422343324251,
+ "grad_norm": 4.096112251281738,
+ "learning_rate": 1.0047213287602809e-05,
+ "loss": 0.0883,
+ "step": 18847
+ },
+ {
+ "epoch": 51.356948228882835,
+ "grad_norm": 5.8044586181640625,
+ "learning_rate": 1.0046330802620292e-05,
+ "loss": 0.093,
+ "step": 18848
+ },
+ {
+ "epoch": 51.35967302452316,
+ "grad_norm": 5.176109790802002,
+ "learning_rate": 1.0045448317276951e-05,
+ "loss": 0.1221,
+ "step": 18849
+ },
+ {
+ "epoch": 51.36239782016349,
+ "grad_norm": 5.2995781898498535,
+ "learning_rate": 1.0044565831579664e-05,
+ "loss": 0.1443,
+ "step": 18850
+ },
+ {
+ "epoch": 51.36512261580381,
+ "grad_norm": 6.7969536781311035,
+ "learning_rate": 1.0043683345535295e-05,
+ "loss": 0.0691,
+ "step": 18851
+ },
+ {
+ "epoch": 51.36784741144414,
+ "grad_norm": 4.332256317138672,
+ "learning_rate": 1.0042800859150726e-05,
+ "loss": 0.1539,
+ "step": 18852
+ },
+ {
+ "epoch": 51.37057220708447,
+ "grad_norm": 4.30204963684082,
+ "learning_rate": 1.0041918372432822e-05,
+ "loss": 0.1867,
+ "step": 18853
+ },
+ {
+ "epoch": 51.3732970027248,
+ "grad_norm": 5.851512432098389,
+ "learning_rate": 1.004103588538846e-05,
+ "loss": 0.2439,
+ "step": 18854
+ },
+ {
+ "epoch": 51.37602179836512,
+ "grad_norm": 5.3317084312438965,
+ "learning_rate": 1.0040153398024513e-05,
+ "loss": 0.1674,
+ "step": 18855
+ },
+ {
+ "epoch": 51.37874659400545,
+ "grad_norm": 4.1724534034729,
+ "learning_rate": 1.0039270910347849e-05,
+ "loss": 0.1919,
+ "step": 18856
+ },
+ {
+ "epoch": 51.381471389645775,
+ "grad_norm": 6.053035259246826,
+ "learning_rate": 1.0038388422365348e-05,
+ "loss": 0.107,
+ "step": 18857
+ },
+ {
+ "epoch": 51.3841961852861,
+ "grad_norm": 5.427990913391113,
+ "learning_rate": 1.0037505934083877e-05,
+ "loss": 0.1115,
+ "step": 18858
+ },
+ {
+ "epoch": 51.38692098092643,
+ "grad_norm": 6.375370025634766,
+ "learning_rate": 1.0036623445510312e-05,
+ "loss": 0.1364,
+ "step": 18859
+ },
+ {
+ "epoch": 51.38964577656676,
+ "grad_norm": 4.085097789764404,
+ "learning_rate": 1.0035740956651527e-05,
+ "loss": 0.2076,
+ "step": 18860
+ },
+ {
+ "epoch": 51.392370572207085,
+ "grad_norm": 7.361934661865234,
+ "learning_rate": 1.0034858467514388e-05,
+ "loss": 0.167,
+ "step": 18861
+ },
+ {
+ "epoch": 51.39509536784741,
+ "grad_norm": 5.714624881744385,
+ "learning_rate": 1.0033975978105774e-05,
+ "loss": 0.1235,
+ "step": 18862
+ },
+ {
+ "epoch": 51.39782016348774,
+ "grad_norm": 4.752364635467529,
+ "learning_rate": 1.003309348843256e-05,
+ "loss": 0.1219,
+ "step": 18863
+ },
+ {
+ "epoch": 51.40054495912806,
+ "grad_norm": 5.669373035430908,
+ "learning_rate": 1.0032210998501611e-05,
+ "loss": 0.1629,
+ "step": 18864
+ },
+ {
+ "epoch": 51.403269754768395,
+ "grad_norm": 9.528609275817871,
+ "learning_rate": 1.0031328508319805e-05,
+ "loss": 0.1717,
+ "step": 18865
+ },
+ {
+ "epoch": 51.40599455040872,
+ "grad_norm": 4.603137969970703,
+ "learning_rate": 1.0030446017894014e-05,
+ "loss": 0.078,
+ "step": 18866
+ },
+ {
+ "epoch": 51.40871934604905,
+ "grad_norm": 5.248652458190918,
+ "learning_rate": 1.002956352723111e-05,
+ "loss": 0.2607,
+ "step": 18867
+ },
+ {
+ "epoch": 51.41144414168937,
+ "grad_norm": 5.387473106384277,
+ "learning_rate": 1.0028681036337963e-05,
+ "loss": 0.1365,
+ "step": 18868
+ },
+ {
+ "epoch": 51.4141689373297,
+ "grad_norm": 4.097549915313721,
+ "learning_rate": 1.0027798545221453e-05,
+ "loss": 0.1656,
+ "step": 18869
+ },
+ {
+ "epoch": 51.416893732970024,
+ "grad_norm": 4.61376953125,
+ "learning_rate": 1.0026916053888449e-05,
+ "loss": 0.1086,
+ "step": 18870
+ },
+ {
+ "epoch": 51.41961852861036,
+ "grad_norm": 4.5222930908203125,
+ "learning_rate": 1.0026033562345821e-05,
+ "loss": 0.1723,
+ "step": 18871
+ },
+ {
+ "epoch": 51.42234332425068,
+ "grad_norm": 5.318976402282715,
+ "learning_rate": 1.0025151070600445e-05,
+ "loss": 0.1462,
+ "step": 18872
+ },
+ {
+ "epoch": 51.42506811989101,
+ "grad_norm": 4.539977073669434,
+ "learning_rate": 1.0024268578659195e-05,
+ "loss": 0.0965,
+ "step": 18873
+ },
+ {
+ "epoch": 51.427792915531334,
+ "grad_norm": 4.928645610809326,
+ "learning_rate": 1.0023386086528942e-05,
+ "loss": 0.1979,
+ "step": 18874
+ },
+ {
+ "epoch": 51.43051771117166,
+ "grad_norm": 5.497778415679932,
+ "learning_rate": 1.0022503594216558e-05,
+ "loss": 0.1126,
+ "step": 18875
+ },
+ {
+ "epoch": 51.433242506811986,
+ "grad_norm": 7.102056503295898,
+ "learning_rate": 1.0021621101728916e-05,
+ "loss": 0.2033,
+ "step": 18876
+ },
+ {
+ "epoch": 51.43596730245232,
+ "grad_norm": 5.455347537994385,
+ "learning_rate": 1.002073860907289e-05,
+ "loss": 0.1587,
+ "step": 18877
+ },
+ {
+ "epoch": 51.438692098092645,
+ "grad_norm": 5.075624465942383,
+ "learning_rate": 1.0019856116255353e-05,
+ "loss": 0.1917,
+ "step": 18878
+ },
+ {
+ "epoch": 51.44141689373297,
+ "grad_norm": 7.048523902893066,
+ "learning_rate": 1.0018973623283177e-05,
+ "loss": 0.1951,
+ "step": 18879
+ },
+ {
+ "epoch": 51.444141689373296,
+ "grad_norm": 4.175597667694092,
+ "learning_rate": 1.0018091130163235e-05,
+ "loss": 0.16,
+ "step": 18880
+ },
+ {
+ "epoch": 51.44686648501362,
+ "grad_norm": 4.40514612197876,
+ "learning_rate": 1.0017208636902401e-05,
+ "loss": 0.0847,
+ "step": 18881
+ },
+ {
+ "epoch": 51.44959128065395,
+ "grad_norm": 6.212416648864746,
+ "learning_rate": 1.0016326143507544e-05,
+ "loss": 0.288,
+ "step": 18882
+ },
+ {
+ "epoch": 51.45231607629428,
+ "grad_norm": 5.558211803436279,
+ "learning_rate": 1.0015443649985542e-05,
+ "loss": 0.131,
+ "step": 18883
+ },
+ {
+ "epoch": 51.45504087193461,
+ "grad_norm": 4.054054260253906,
+ "learning_rate": 1.0014561156343263e-05,
+ "loss": 0.1175,
+ "step": 18884
+ },
+ {
+ "epoch": 51.45776566757493,
+ "grad_norm": 5.712672710418701,
+ "learning_rate": 1.0013678662587584e-05,
+ "loss": 0.1595,
+ "step": 18885
+ },
+ {
+ "epoch": 51.46049046321526,
+ "grad_norm": 5.684453964233398,
+ "learning_rate": 1.0012796168725376e-05,
+ "loss": 0.2425,
+ "step": 18886
+ },
+ {
+ "epoch": 51.463215258855584,
+ "grad_norm": 4.908958911895752,
+ "learning_rate": 1.0011913674763514e-05,
+ "loss": 0.1607,
+ "step": 18887
+ },
+ {
+ "epoch": 51.46594005449591,
+ "grad_norm": 5.546113967895508,
+ "learning_rate": 1.0011031180708861e-05,
+ "loss": 0.1102,
+ "step": 18888
+ },
+ {
+ "epoch": 51.46866485013624,
+ "grad_norm": 4.123659133911133,
+ "learning_rate": 1.0010148686568304e-05,
+ "loss": 0.0927,
+ "step": 18889
+ },
+ {
+ "epoch": 51.47138964577657,
+ "grad_norm": 5.6722540855407715,
+ "learning_rate": 1.0009266192348708e-05,
+ "loss": 0.2096,
+ "step": 18890
+ },
+ {
+ "epoch": 51.474114441416894,
+ "grad_norm": 4.974035739898682,
+ "learning_rate": 1.0008383698056949e-05,
+ "loss": 0.1766,
+ "step": 18891
+ },
+ {
+ "epoch": 51.47683923705722,
+ "grad_norm": 5.52852201461792,
+ "learning_rate": 1.0007501203699894e-05,
+ "loss": 0.1583,
+ "step": 18892
+ },
+ {
+ "epoch": 51.479564032697546,
+ "grad_norm": 5.028327465057373,
+ "learning_rate": 1.0006618709284424e-05,
+ "loss": 0.1769,
+ "step": 18893
+ },
+ {
+ "epoch": 51.48228882833787,
+ "grad_norm": 4.124752044677734,
+ "learning_rate": 1.0005736214817405e-05,
+ "loss": 0.1034,
+ "step": 18894
+ },
+ {
+ "epoch": 51.485013623978205,
+ "grad_norm": 5.628269672393799,
+ "learning_rate": 1.0004853720305717e-05,
+ "loss": 0.1655,
+ "step": 18895
+ },
+ {
+ "epoch": 51.48773841961853,
+ "grad_norm": 5.227619171142578,
+ "learning_rate": 1.0003971225756222e-05,
+ "loss": 0.1572,
+ "step": 18896
+ },
+ {
+ "epoch": 51.490463215258856,
+ "grad_norm": 4.5399909019470215,
+ "learning_rate": 1.00030887311758e-05,
+ "loss": 0.107,
+ "step": 18897
+ },
+ {
+ "epoch": 51.49318801089918,
+ "grad_norm": 4.212165832519531,
+ "learning_rate": 1.0002206236571325e-05,
+ "loss": 0.1536,
+ "step": 18898
+ },
+ {
+ "epoch": 51.49591280653951,
+ "grad_norm": 4.753115177154541,
+ "learning_rate": 1.0001323741949669e-05,
+ "loss": 0.1167,
+ "step": 18899
+ },
+ {
+ "epoch": 51.49863760217983,
+ "grad_norm": 4.665989875793457,
+ "learning_rate": 1.0000441247317702e-05,
+ "loss": 0.1029,
+ "step": 18900
+ },
+ {
+ "epoch": 51.50136239782017,
+ "grad_norm": 4.497897624969482,
+ "learning_rate": 9.9995587526823e-06,
+ "loss": 0.0884,
+ "step": 18901
+ },
+ {
+ "epoch": 51.50408719346049,
+ "grad_norm": 5.178405284881592,
+ "learning_rate": 9.998676258050331e-06,
+ "loss": 0.0727,
+ "step": 18902
+ },
+ {
+ "epoch": 51.50681198910082,
+ "grad_norm": 5.843135833740234,
+ "learning_rate": 9.997793763428676e-06,
+ "loss": 0.2678,
+ "step": 18903
+ },
+ {
+ "epoch": 51.509536784741144,
+ "grad_norm": 4.736177444458008,
+ "learning_rate": 9.9969112688242e-06,
+ "loss": 0.1993,
+ "step": 18904
+ },
+ {
+ "epoch": 51.51226158038147,
+ "grad_norm": 5.294179916381836,
+ "learning_rate": 9.996028774243781e-06,
+ "loss": 0.1534,
+ "step": 18905
+ },
+ {
+ "epoch": 51.514986376021795,
+ "grad_norm": 4.487862586975098,
+ "learning_rate": 9.995146279694288e-06,
+ "loss": 0.2374,
+ "step": 18906
+ },
+ {
+ "epoch": 51.51771117166213,
+ "grad_norm": 4.244534015655518,
+ "learning_rate": 9.994263785182597e-06,
+ "loss": 0.127,
+ "step": 18907
+ },
+ {
+ "epoch": 51.520435967302454,
+ "grad_norm": 4.889786243438721,
+ "learning_rate": 9.993381290715578e-06,
+ "loss": 0.1465,
+ "step": 18908
+ },
+ {
+ "epoch": 51.52316076294278,
+ "grad_norm": 5.3072662353515625,
+ "learning_rate": 9.992498796300108e-06,
+ "loss": 0.1057,
+ "step": 18909
+ },
+ {
+ "epoch": 51.525885558583106,
+ "grad_norm": 6.529801368713379,
+ "learning_rate": 9.991616301943054e-06,
+ "loss": 0.221,
+ "step": 18910
+ },
+ {
+ "epoch": 51.52861035422343,
+ "grad_norm": 3.673734426498413,
+ "learning_rate": 9.990733807651295e-06,
+ "loss": 0.0801,
+ "step": 18911
+ },
+ {
+ "epoch": 51.53133514986376,
+ "grad_norm": 6.3138203620910645,
+ "learning_rate": 9.989851313431698e-06,
+ "loss": 0.2169,
+ "step": 18912
+ },
+ {
+ "epoch": 51.53405994550409,
+ "grad_norm": 3.917548179626465,
+ "learning_rate": 9.98896881929114e-06,
+ "loss": 0.1764,
+ "step": 18913
+ },
+ {
+ "epoch": 51.536784741144416,
+ "grad_norm": 5.814704418182373,
+ "learning_rate": 9.988086325236493e-06,
+ "loss": 0.1834,
+ "step": 18914
+ },
+ {
+ "epoch": 51.53950953678474,
+ "grad_norm": 4.445235252380371,
+ "learning_rate": 9.987203831274629e-06,
+ "loss": 0.2559,
+ "step": 18915
+ },
+ {
+ "epoch": 51.54223433242507,
+ "grad_norm": 4.93685245513916,
+ "learning_rate": 9.98632133741242e-06,
+ "loss": 0.2249,
+ "step": 18916
+ },
+ {
+ "epoch": 51.54495912806539,
+ "grad_norm": 4.567865371704102,
+ "learning_rate": 9.985438843656742e-06,
+ "loss": 0.0841,
+ "step": 18917
+ },
+ {
+ "epoch": 51.54768392370572,
+ "grad_norm": 4.291372776031494,
+ "learning_rate": 9.98455635001446e-06,
+ "loss": 0.2191,
+ "step": 18918
+ },
+ {
+ "epoch": 51.55040871934605,
+ "grad_norm": 5.775290012359619,
+ "learning_rate": 9.983673856492457e-06,
+ "loss": 0.2156,
+ "step": 18919
+ },
+ {
+ "epoch": 51.55313351498638,
+ "grad_norm": 4.890861511230469,
+ "learning_rate": 9.982791363097602e-06,
+ "loss": 0.2356,
+ "step": 18920
+ },
+ {
+ "epoch": 51.555858310626704,
+ "grad_norm": 4.549856662750244,
+ "learning_rate": 9.981908869836767e-06,
+ "loss": 0.1903,
+ "step": 18921
+ },
+ {
+ "epoch": 51.55858310626703,
+ "grad_norm": 4.9609246253967285,
+ "learning_rate": 9.981026376716823e-06,
+ "loss": 0.2612,
+ "step": 18922
+ },
+ {
+ "epoch": 51.561307901907355,
+ "grad_norm": 4.6248393058776855,
+ "learning_rate": 9.98014388374465e-06,
+ "loss": 0.2277,
+ "step": 18923
+ },
+ {
+ "epoch": 51.56403269754768,
+ "grad_norm": 5.297659397125244,
+ "learning_rate": 9.97926139092711e-06,
+ "loss": 0.2539,
+ "step": 18924
+ },
+ {
+ "epoch": 51.566757493188014,
+ "grad_norm": 4.408740520477295,
+ "learning_rate": 9.978378898271087e-06,
+ "loss": 0.112,
+ "step": 18925
+ },
+ {
+ "epoch": 51.56948228882834,
+ "grad_norm": 5.680944442749023,
+ "learning_rate": 9.977496405783444e-06,
+ "loss": 0.1101,
+ "step": 18926
+ },
+ {
+ "epoch": 51.572207084468666,
+ "grad_norm": 4.534115314483643,
+ "learning_rate": 9.976613913471063e-06,
+ "loss": 0.2115,
+ "step": 18927
+ },
+ {
+ "epoch": 51.57493188010899,
+ "grad_norm": 4.632035732269287,
+ "learning_rate": 9.975731421340807e-06,
+ "loss": 0.1009,
+ "step": 18928
+ },
+ {
+ "epoch": 51.57765667574932,
+ "grad_norm": 3.959153175354004,
+ "learning_rate": 9.974848929399557e-06,
+ "loss": 0.3635,
+ "step": 18929
+ },
+ {
+ "epoch": 51.58038147138964,
+ "grad_norm": 4.5949177742004395,
+ "learning_rate": 9.973966437654182e-06,
+ "loss": 0.12,
+ "step": 18930
+ },
+ {
+ "epoch": 51.583106267029976,
+ "grad_norm": 4.820900917053223,
+ "learning_rate": 9.973083946111556e-06,
+ "loss": 0.2106,
+ "step": 18931
+ },
+ {
+ "epoch": 51.5858310626703,
+ "grad_norm": 4.429122447967529,
+ "learning_rate": 9.97220145477855e-06,
+ "loss": 0.1239,
+ "step": 18932
+ },
+ {
+ "epoch": 51.58855585831063,
+ "grad_norm": 4.48766565322876,
+ "learning_rate": 9.971318963662042e-06,
+ "loss": 0.1423,
+ "step": 18933
+ },
+ {
+ "epoch": 51.59128065395095,
+ "grad_norm": 4.9005126953125,
+ "learning_rate": 9.970436472768895e-06,
+ "loss": 0.1009,
+ "step": 18934
+ },
+ {
+ "epoch": 51.59400544959128,
+ "grad_norm": 3.8744966983795166,
+ "learning_rate": 9.969553982105988e-06,
+ "loss": 0.2056,
+ "step": 18935
+ },
+ {
+ "epoch": 51.596730245231605,
+ "grad_norm": 4.15589714050293,
+ "learning_rate": 9.968671491680197e-06,
+ "loss": 0.0911,
+ "step": 18936
+ },
+ {
+ "epoch": 51.59945504087194,
+ "grad_norm": 3.719292640686035,
+ "learning_rate": 9.96778900149839e-06,
+ "loss": 0.1378,
+ "step": 18937
+ },
+ {
+ "epoch": 51.60217983651226,
+ "grad_norm": 4.779216289520264,
+ "learning_rate": 9.966906511567443e-06,
+ "loss": 0.2018,
+ "step": 18938
+ },
+ {
+ "epoch": 51.60490463215259,
+ "grad_norm": 5.980700969696045,
+ "learning_rate": 9.966024021894226e-06,
+ "loss": 0.1083,
+ "step": 18939
+ },
+ {
+ "epoch": 51.607629427792915,
+ "grad_norm": 5.108234882354736,
+ "learning_rate": 9.965141532485613e-06,
+ "loss": 0.1925,
+ "step": 18940
+ },
+ {
+ "epoch": 51.61035422343324,
+ "grad_norm": 4.135683536529541,
+ "learning_rate": 9.964259043348476e-06,
+ "loss": 0.1219,
+ "step": 18941
+ },
+ {
+ "epoch": 51.61307901907357,
+ "grad_norm": 3.197345495223999,
+ "learning_rate": 9.963376554489691e-06,
+ "loss": 0.0701,
+ "step": 18942
+ },
+ {
+ "epoch": 51.6158038147139,
+ "grad_norm": 4.442191123962402,
+ "learning_rate": 9.962494065916124e-06,
+ "loss": 0.1184,
+ "step": 18943
+ },
+ {
+ "epoch": 51.618528610354225,
+ "grad_norm": 3.397578239440918,
+ "learning_rate": 9.961611577634655e-06,
+ "loss": 0.0821,
+ "step": 18944
+ },
+ {
+ "epoch": 51.62125340599455,
+ "grad_norm": 5.611720085144043,
+ "learning_rate": 9.960729089652153e-06,
+ "loss": 0.1397,
+ "step": 18945
+ },
+ {
+ "epoch": 51.62397820163488,
+ "grad_norm": 5.228200912475586,
+ "learning_rate": 9.95984660197549e-06,
+ "loss": 0.1119,
+ "step": 18946
+ },
+ {
+ "epoch": 51.6267029972752,
+ "grad_norm": 4.0746660232543945,
+ "learning_rate": 9.958964114611544e-06,
+ "loss": 0.3339,
+ "step": 18947
+ },
+ {
+ "epoch": 51.62942779291553,
+ "grad_norm": 4.019106388092041,
+ "learning_rate": 9.958081627567182e-06,
+ "loss": 0.0726,
+ "step": 18948
+ },
+ {
+ "epoch": 51.63215258855586,
+ "grad_norm": 5.064167022705078,
+ "learning_rate": 9.95719914084928e-06,
+ "loss": 0.0893,
+ "step": 18949
+ },
+ {
+ "epoch": 51.63487738419619,
+ "grad_norm": 5.4382805824279785,
+ "learning_rate": 9.956316654464706e-06,
+ "loss": 0.0875,
+ "step": 18950
+ },
+ {
+ "epoch": 51.63760217983651,
+ "grad_norm": 5.484139442443848,
+ "learning_rate": 9.95543416842034e-06,
+ "loss": 0.2185,
+ "step": 18951
+ },
+ {
+ "epoch": 51.64032697547684,
+ "grad_norm": 6.450892925262451,
+ "learning_rate": 9.95455168272305e-06,
+ "loss": 0.3215,
+ "step": 18952
+ },
+ {
+ "epoch": 51.643051771117165,
+ "grad_norm": 4.3288421630859375,
+ "learning_rate": 9.953669197379708e-06,
+ "loss": 0.1527,
+ "step": 18953
+ },
+ {
+ "epoch": 51.64577656675749,
+ "grad_norm": 4.621757507324219,
+ "learning_rate": 9.952786712397191e-06,
+ "loss": 0.1524,
+ "step": 18954
+ },
+ {
+ "epoch": 51.64850136239782,
+ "grad_norm": 5.470773220062256,
+ "learning_rate": 9.95190422778237e-06,
+ "loss": 0.1019,
+ "step": 18955
+ },
+ {
+ "epoch": 51.65122615803815,
+ "grad_norm": 4.634878635406494,
+ "learning_rate": 9.951021743542119e-06,
+ "loss": 0.1514,
+ "step": 18956
+ },
+ {
+ "epoch": 51.653950953678475,
+ "grad_norm": 4.923651218414307,
+ "learning_rate": 9.950139259683305e-06,
+ "loss": 0.2577,
+ "step": 18957
+ },
+ {
+ "epoch": 51.6566757493188,
+ "grad_norm": 4.08267879486084,
+ "learning_rate": 9.949256776212808e-06,
+ "loss": 0.1605,
+ "step": 18958
+ },
+ {
+ "epoch": 51.65940054495913,
+ "grad_norm": 6.271906852722168,
+ "learning_rate": 9.948374293137496e-06,
+ "loss": 0.152,
+ "step": 18959
+ },
+ {
+ "epoch": 51.66212534059945,
+ "grad_norm": 4.404917240142822,
+ "learning_rate": 9.947491810464246e-06,
+ "loss": 0.2029,
+ "step": 18960
+ },
+ {
+ "epoch": 51.664850136239785,
+ "grad_norm": 4.689579963684082,
+ "learning_rate": 9.946609328199926e-06,
+ "loss": 0.092,
+ "step": 18961
+ },
+ {
+ "epoch": 51.66757493188011,
+ "grad_norm": 5.952474594116211,
+ "learning_rate": 9.94572684635141e-06,
+ "loss": 0.1792,
+ "step": 18962
+ },
+ {
+ "epoch": 51.67029972752044,
+ "grad_norm": 5.2045722007751465,
+ "learning_rate": 9.944844364925574e-06,
+ "loss": 0.295,
+ "step": 18963
+ },
+ {
+ "epoch": 51.67302452316076,
+ "grad_norm": 6.426792144775391,
+ "learning_rate": 9.943961883929287e-06,
+ "loss": 0.2517,
+ "step": 18964
+ },
+ {
+ "epoch": 51.67574931880109,
+ "grad_norm": 4.43955135345459,
+ "learning_rate": 9.943079403369423e-06,
+ "loss": 0.1677,
+ "step": 18965
+ },
+ {
+ "epoch": 51.678474114441414,
+ "grad_norm": 4.113171577453613,
+ "learning_rate": 9.942196923252855e-06,
+ "loss": 0.1186,
+ "step": 18966
+ },
+ {
+ "epoch": 51.68119891008175,
+ "grad_norm": 3.726844549179077,
+ "learning_rate": 9.941314443586454e-06,
+ "loss": 0.1156,
+ "step": 18967
+ },
+ {
+ "epoch": 51.68392370572207,
+ "grad_norm": 4.087982654571533,
+ "learning_rate": 9.940431964377094e-06,
+ "loss": 0.1668,
+ "step": 18968
+ },
+ {
+ "epoch": 51.6866485013624,
+ "grad_norm": 5.609523773193359,
+ "learning_rate": 9.93954948563165e-06,
+ "loss": 0.1342,
+ "step": 18969
+ },
+ {
+ "epoch": 51.689373297002724,
+ "grad_norm": 4.390143871307373,
+ "learning_rate": 9.938667007356991e-06,
+ "loss": 0.1868,
+ "step": 18970
+ },
+ {
+ "epoch": 51.69209809264305,
+ "grad_norm": 8.819103240966797,
+ "learning_rate": 9.93778452955999e-06,
+ "loss": 0.1333,
+ "step": 18971
+ },
+ {
+ "epoch": 51.694822888283376,
+ "grad_norm": 4.704899311065674,
+ "learning_rate": 9.936902052247525e-06,
+ "loss": 0.0866,
+ "step": 18972
+ },
+ {
+ "epoch": 51.69754768392371,
+ "grad_norm": 2.8743555545806885,
+ "learning_rate": 9.936019575426462e-06,
+ "loss": 0.0636,
+ "step": 18973
+ },
+ {
+ "epoch": 51.700272479564035,
+ "grad_norm": 6.211526393890381,
+ "learning_rate": 9.935137099103678e-06,
+ "loss": 0.2033,
+ "step": 18974
+ },
+ {
+ "epoch": 51.70299727520436,
+ "grad_norm": 4.9399871826171875,
+ "learning_rate": 9.934254623286043e-06,
+ "loss": 0.1494,
+ "step": 18975
+ },
+ {
+ "epoch": 51.705722070844686,
+ "grad_norm": 4.001533031463623,
+ "learning_rate": 9.933372147980434e-06,
+ "loss": 0.2128,
+ "step": 18976
+ },
+ {
+ "epoch": 51.70844686648501,
+ "grad_norm": 4.183261871337891,
+ "learning_rate": 9.932489673193718e-06,
+ "loss": 0.1497,
+ "step": 18977
+ },
+ {
+ "epoch": 51.71117166212534,
+ "grad_norm": 4.518909454345703,
+ "learning_rate": 9.931607198932771e-06,
+ "loss": 0.1536,
+ "step": 18978
+ },
+ {
+ "epoch": 51.71389645776567,
+ "grad_norm": 4.9194488525390625,
+ "learning_rate": 9.930724725204463e-06,
+ "loss": 0.1351,
+ "step": 18979
+ },
+ {
+ "epoch": 51.716621253406,
+ "grad_norm": 4.825377941131592,
+ "learning_rate": 9.929842252015672e-06,
+ "loss": 0.1188,
+ "step": 18980
+ },
+ {
+ "epoch": 51.71934604904632,
+ "grad_norm": 6.563079833984375,
+ "learning_rate": 9.928959779373265e-06,
+ "loss": 0.1064,
+ "step": 18981
+ },
+ {
+ "epoch": 51.72207084468665,
+ "grad_norm": 4.544953346252441,
+ "learning_rate": 9.928077307284118e-06,
+ "loss": 0.2616,
+ "step": 18982
+ },
+ {
+ "epoch": 51.724795640326974,
+ "grad_norm": 4.771892547607422,
+ "learning_rate": 9.9271948357551e-06,
+ "loss": 0.1276,
+ "step": 18983
+ },
+ {
+ "epoch": 51.7275204359673,
+ "grad_norm": 6.476113319396973,
+ "learning_rate": 9.92631236479309e-06,
+ "loss": 0.2689,
+ "step": 18984
+ },
+ {
+ "epoch": 51.73024523160763,
+ "grad_norm": 5.970198154449463,
+ "learning_rate": 9.925429894404955e-06,
+ "loss": 0.285,
+ "step": 18985
+ },
+ {
+ "epoch": 51.73297002724796,
+ "grad_norm": 4.367156505584717,
+ "learning_rate": 9.92454742459757e-06,
+ "loss": 0.1528,
+ "step": 18986
+ },
+ {
+ "epoch": 51.735694822888284,
+ "grad_norm": 5.05354118347168,
+ "learning_rate": 9.923664955377802e-06,
+ "loss": 0.1256,
+ "step": 18987
+ },
+ {
+ "epoch": 51.73841961852861,
+ "grad_norm": 4.834817886352539,
+ "learning_rate": 9.922782486752537e-06,
+ "loss": 0.1377,
+ "step": 18988
+ },
+ {
+ "epoch": 51.741144414168936,
+ "grad_norm": 3.8790314197540283,
+ "learning_rate": 9.921900018728634e-06,
+ "loss": 0.2363,
+ "step": 18989
+ },
+ {
+ "epoch": 51.74386920980926,
+ "grad_norm": 4.6017560958862305,
+ "learning_rate": 9.921017551312975e-06,
+ "loss": 0.213,
+ "step": 18990
+ },
+ {
+ "epoch": 51.746594005449595,
+ "grad_norm": 11.591754913330078,
+ "learning_rate": 9.920135084512425e-06,
+ "loss": 0.1818,
+ "step": 18991
+ },
+ {
+ "epoch": 51.74931880108992,
+ "grad_norm": 6.721871376037598,
+ "learning_rate": 9.919252618333864e-06,
+ "loss": 0.1454,
+ "step": 18992
+ },
+ {
+ "epoch": 51.752043596730246,
+ "grad_norm": 5.192331314086914,
+ "learning_rate": 9.918370152784158e-06,
+ "loss": 0.113,
+ "step": 18993
+ },
+ {
+ "epoch": 51.75476839237057,
+ "grad_norm": 4.748659610748291,
+ "learning_rate": 9.917487687870187e-06,
+ "loss": 0.1944,
+ "step": 18994
+ },
+ {
+ "epoch": 51.7574931880109,
+ "grad_norm": 5.543908596038818,
+ "learning_rate": 9.916605223598815e-06,
+ "loss": 0.1583,
+ "step": 18995
+ },
+ {
+ "epoch": 51.76021798365122,
+ "grad_norm": 4.537134170532227,
+ "learning_rate": 9.915722759976923e-06,
+ "loss": 0.1149,
+ "step": 18996
+ },
+ {
+ "epoch": 51.762942779291556,
+ "grad_norm": 5.6749677658081055,
+ "learning_rate": 9.914840297011376e-06,
+ "loss": 0.1267,
+ "step": 18997
+ },
+ {
+ "epoch": 51.76566757493188,
+ "grad_norm": 4.887343406677246,
+ "learning_rate": 9.913957834709051e-06,
+ "loss": 0.2384,
+ "step": 18998
+ },
+ {
+ "epoch": 51.76839237057221,
+ "grad_norm": 4.104245662689209,
+ "learning_rate": 9.913075373076819e-06,
+ "loss": 0.1162,
+ "step": 18999
+ },
+ {
+ "epoch": 51.771117166212534,
+ "grad_norm": 4.365303039550781,
+ "learning_rate": 9.912192912121554e-06,
+ "loss": 0.1506,
+ "step": 19000
+ },
+ {
+ "epoch": 51.77384196185286,
+ "grad_norm": 3.8478541374206543,
+ "learning_rate": 9.911310451850127e-06,
+ "loss": 0.0982,
+ "step": 19001
+ },
+ {
+ "epoch": 51.776566757493185,
+ "grad_norm": 5.014444828033447,
+ "learning_rate": 9.910427992269414e-06,
+ "loss": 0.2771,
+ "step": 19002
+ },
+ {
+ "epoch": 51.77929155313352,
+ "grad_norm": 4.454366683959961,
+ "learning_rate": 9.909545533386281e-06,
+ "loss": 0.2987,
+ "step": 19003
+ },
+ {
+ "epoch": 51.782016348773844,
+ "grad_norm": 3.6813745498657227,
+ "learning_rate": 9.908663075207602e-06,
+ "loss": 0.1858,
+ "step": 19004
+ },
+ {
+ "epoch": 51.78474114441417,
+ "grad_norm": 7.667509078979492,
+ "learning_rate": 9.907780617740258e-06,
+ "loss": 0.1968,
+ "step": 19005
+ },
+ {
+ "epoch": 51.787465940054496,
+ "grad_norm": 4.544261932373047,
+ "learning_rate": 9.906898160991113e-06,
+ "loss": 0.1412,
+ "step": 19006
+ },
+ {
+ "epoch": 51.79019073569482,
+ "grad_norm": 4.070530414581299,
+ "learning_rate": 9.906015704967044e-06,
+ "loss": 0.1038,
+ "step": 19007
+ },
+ {
+ "epoch": 51.79291553133515,
+ "grad_norm": 4.835860729217529,
+ "learning_rate": 9.90513324967492e-06,
+ "loss": 0.2113,
+ "step": 19008
+ },
+ {
+ "epoch": 51.79564032697548,
+ "grad_norm": 7.1134033203125,
+ "learning_rate": 9.904250795121614e-06,
+ "loss": 0.3214,
+ "step": 19009
+ },
+ {
+ "epoch": 51.798365122615806,
+ "grad_norm": 5.900073051452637,
+ "learning_rate": 9.903368341314003e-06,
+ "loss": 0.11,
+ "step": 19010
+ },
+ {
+ "epoch": 51.80108991825613,
+ "grad_norm": 5.206643104553223,
+ "learning_rate": 9.902485888258953e-06,
+ "loss": 0.1453,
+ "step": 19011
+ },
+ {
+ "epoch": 51.80381471389646,
+ "grad_norm": 5.340708255767822,
+ "learning_rate": 9.901603435963343e-06,
+ "loss": 0.0987,
+ "step": 19012
+ },
+ {
+ "epoch": 51.80653950953678,
+ "grad_norm": 5.448592662811279,
+ "learning_rate": 9.90072098443404e-06,
+ "loss": 0.1181,
+ "step": 19013
+ },
+ {
+ "epoch": 51.80926430517711,
+ "grad_norm": 5.2505011558532715,
+ "learning_rate": 9.899838533677922e-06,
+ "loss": 0.0873,
+ "step": 19014
+ },
+ {
+ "epoch": 51.81198910081744,
+ "grad_norm": 4.6900739669799805,
+ "learning_rate": 9.898956083701854e-06,
+ "loss": 0.1025,
+ "step": 19015
+ },
+ {
+ "epoch": 51.81471389645777,
+ "grad_norm": 7.396714687347412,
+ "learning_rate": 9.898073634512717e-06,
+ "loss": 0.0938,
+ "step": 19016
+ },
+ {
+ "epoch": 51.817438692098094,
+ "grad_norm": 4.672626972198486,
+ "learning_rate": 9.897191186117375e-06,
+ "loss": 0.2453,
+ "step": 19017
+ },
+ {
+ "epoch": 51.82016348773842,
+ "grad_norm": 4.7493720054626465,
+ "learning_rate": 9.896308738522708e-06,
+ "loss": 0.1075,
+ "step": 19018
+ },
+ {
+ "epoch": 51.822888283378745,
+ "grad_norm": 4.544273853302002,
+ "learning_rate": 9.895426291735582e-06,
+ "loss": 0.3212,
+ "step": 19019
+ },
+ {
+ "epoch": 51.82561307901907,
+ "grad_norm": 4.8066792488098145,
+ "learning_rate": 9.894543845762876e-06,
+ "loss": 0.158,
+ "step": 19020
+ },
+ {
+ "epoch": 51.828337874659404,
+ "grad_norm": 4.690978527069092,
+ "learning_rate": 9.893661400611456e-06,
+ "loss": 0.1431,
+ "step": 19021
+ },
+ {
+ "epoch": 51.83106267029973,
+ "grad_norm": 5.638887882232666,
+ "learning_rate": 9.892778956288198e-06,
+ "loss": 0.1434,
+ "step": 19022
+ },
+ {
+ "epoch": 51.833787465940055,
+ "grad_norm": 5.1739068031311035,
+ "learning_rate": 9.891896512799975e-06,
+ "loss": 0.2879,
+ "step": 19023
+ },
+ {
+ "epoch": 51.83651226158038,
+ "grad_norm": 7.537215232849121,
+ "learning_rate": 9.891014070153658e-06,
+ "loss": 0.1211,
+ "step": 19024
+ },
+ {
+ "epoch": 51.83923705722071,
+ "grad_norm": 6.0180535316467285,
+ "learning_rate": 9.890131628356122e-06,
+ "loss": 0.1376,
+ "step": 19025
+ },
+ {
+ "epoch": 51.84196185286103,
+ "grad_norm": 4.283379077911377,
+ "learning_rate": 9.889249187414235e-06,
+ "loss": 0.0915,
+ "step": 19026
+ },
+ {
+ "epoch": 51.844686648501366,
+ "grad_norm": 5.555041790008545,
+ "learning_rate": 9.888366747334873e-06,
+ "loss": 0.1199,
+ "step": 19027
+ },
+ {
+ "epoch": 51.84741144414169,
+ "grad_norm": 4.932379722595215,
+ "learning_rate": 9.887484308124907e-06,
+ "loss": 0.1198,
+ "step": 19028
+ },
+ {
+ "epoch": 51.85013623978202,
+ "grad_norm": 4.495264530181885,
+ "learning_rate": 9.88660186979121e-06,
+ "loss": 0.188,
+ "step": 19029
+ },
+ {
+ "epoch": 51.85286103542234,
+ "grad_norm": 6.212512493133545,
+ "learning_rate": 9.885719432340652e-06,
+ "loss": 0.2284,
+ "step": 19030
+ },
+ {
+ "epoch": 51.85558583106267,
+ "grad_norm": 4.427855491638184,
+ "learning_rate": 9.884836995780109e-06,
+ "loss": 0.2725,
+ "step": 19031
+ },
+ {
+ "epoch": 51.858310626702995,
+ "grad_norm": 4.954310417175293,
+ "learning_rate": 9.883954560116452e-06,
+ "loss": 0.1135,
+ "step": 19032
+ },
+ {
+ "epoch": 51.86103542234333,
+ "grad_norm": 4.122082233428955,
+ "learning_rate": 9.883072125356552e-06,
+ "loss": 0.0942,
+ "step": 19033
+ },
+ {
+ "epoch": 51.86376021798365,
+ "grad_norm": 3.8311758041381836,
+ "learning_rate": 9.882189691507285e-06,
+ "loss": 0.1667,
+ "step": 19034
+ },
+ {
+ "epoch": 51.86648501362398,
+ "grad_norm": 5.232621669769287,
+ "learning_rate": 9.881307258575519e-06,
+ "loss": 0.1082,
+ "step": 19035
+ },
+ {
+ "epoch": 51.869209809264305,
+ "grad_norm": 5.181174278259277,
+ "learning_rate": 9.880424826568128e-06,
+ "loss": 0.1105,
+ "step": 19036
+ },
+ {
+ "epoch": 51.87193460490463,
+ "grad_norm": 6.016700267791748,
+ "learning_rate": 9.879542395491984e-06,
+ "loss": 0.1191,
+ "step": 19037
+ },
+ {
+ "epoch": 51.87465940054496,
+ "grad_norm": 5.201912879943848,
+ "learning_rate": 9.878659965353964e-06,
+ "loss": 0.1178,
+ "step": 19038
+ },
+ {
+ "epoch": 51.87738419618529,
+ "grad_norm": 6.831856727600098,
+ "learning_rate": 9.87777753616093e-06,
+ "loss": 0.1596,
+ "step": 19039
+ },
+ {
+ "epoch": 51.880108991825615,
+ "grad_norm": 4.478147029876709,
+ "learning_rate": 9.876895107919761e-06,
+ "loss": 0.1235,
+ "step": 19040
+ },
+ {
+ "epoch": 51.88283378746594,
+ "grad_norm": 5.386390686035156,
+ "learning_rate": 9.876012680637334e-06,
+ "loss": 0.14,
+ "step": 19041
+ },
+ {
+ "epoch": 51.88555858310627,
+ "grad_norm": 6.98453426361084,
+ "learning_rate": 9.875130254320513e-06,
+ "loss": 0.1128,
+ "step": 19042
+ },
+ {
+ "epoch": 51.88828337874659,
+ "grad_norm": 13.316817283630371,
+ "learning_rate": 9.874247828976176e-06,
+ "loss": 0.2634,
+ "step": 19043
+ },
+ {
+ "epoch": 51.89100817438692,
+ "grad_norm": 4.4534759521484375,
+ "learning_rate": 9.87336540461119e-06,
+ "loss": 0.2525,
+ "step": 19044
+ },
+ {
+ "epoch": 51.89373297002725,
+ "grad_norm": 4.711284160614014,
+ "learning_rate": 9.872482981232434e-06,
+ "loss": 0.1092,
+ "step": 19045
+ },
+ {
+ "epoch": 51.89645776566758,
+ "grad_norm": 4.004992961883545,
+ "learning_rate": 9.871600558846772e-06,
+ "loss": 0.2462,
+ "step": 19046
+ },
+ {
+ "epoch": 51.8991825613079,
+ "grad_norm": 6.234788417816162,
+ "learning_rate": 9.870718137461085e-06,
+ "loss": 0.1602,
+ "step": 19047
+ },
+ {
+ "epoch": 51.90190735694823,
+ "grad_norm": 4.16002893447876,
+ "learning_rate": 9.869835717082237e-06,
+ "loss": 0.1424,
+ "step": 19048
+ },
+ {
+ "epoch": 51.904632152588555,
+ "grad_norm": 5.75315523147583,
+ "learning_rate": 9.868953297717108e-06,
+ "loss": 0.1034,
+ "step": 19049
+ },
+ {
+ "epoch": 51.90735694822888,
+ "grad_norm": 5.9653239250183105,
+ "learning_rate": 9.868070879372563e-06,
+ "loss": 0.1137,
+ "step": 19050
+ },
+ {
+ "epoch": 51.91008174386921,
+ "grad_norm": 4.411348819732666,
+ "learning_rate": 9.867188462055482e-06,
+ "loss": 0.1898,
+ "step": 19051
+ },
+ {
+ "epoch": 51.91280653950954,
+ "grad_norm": 5.087191104888916,
+ "learning_rate": 9.86630604577273e-06,
+ "loss": 0.1411,
+ "step": 19052
+ },
+ {
+ "epoch": 51.915531335149865,
+ "grad_norm": 7.6265788078308105,
+ "learning_rate": 9.865423630531182e-06,
+ "loss": 0.0907,
+ "step": 19053
+ },
+ {
+ "epoch": 51.91825613079019,
+ "grad_norm": 4.868733882904053,
+ "learning_rate": 9.86454121633771e-06,
+ "loss": 0.1693,
+ "step": 19054
+ },
+ {
+ "epoch": 51.920980926430516,
+ "grad_norm": 4.471322536468506,
+ "learning_rate": 9.863658803199187e-06,
+ "loss": 0.1086,
+ "step": 19055
+ },
+ {
+ "epoch": 51.92370572207084,
+ "grad_norm": 3.931206226348877,
+ "learning_rate": 9.862776391122482e-06,
+ "loss": 0.1117,
+ "step": 19056
+ },
+ {
+ "epoch": 51.926430517711175,
+ "grad_norm": 4.475884914398193,
+ "learning_rate": 9.861893980114475e-06,
+ "loss": 0.0922,
+ "step": 19057
+ },
+ {
+ "epoch": 51.9291553133515,
+ "grad_norm": 5.323555946350098,
+ "learning_rate": 9.86101157018203e-06,
+ "loss": 0.1027,
+ "step": 19058
+ },
+ {
+ "epoch": 51.93188010899183,
+ "grad_norm": 4.618867874145508,
+ "learning_rate": 9.860129161332026e-06,
+ "loss": 0.2802,
+ "step": 19059
+ },
+ {
+ "epoch": 51.93460490463215,
+ "grad_norm": 5.137905597686768,
+ "learning_rate": 9.859246753571328e-06,
+ "loss": 0.1069,
+ "step": 19060
+ },
+ {
+ "epoch": 51.93732970027248,
+ "grad_norm": 5.134658336639404,
+ "learning_rate": 9.858364346906814e-06,
+ "loss": 0.1496,
+ "step": 19061
+ },
+ {
+ "epoch": 51.940054495912804,
+ "grad_norm": 5.088315010070801,
+ "learning_rate": 9.857481941345354e-06,
+ "loss": 0.1792,
+ "step": 19062
+ },
+ {
+ "epoch": 51.94277929155314,
+ "grad_norm": 4.330304145812988,
+ "learning_rate": 9.856599536893821e-06,
+ "loss": 0.1337,
+ "step": 19063
+ },
+ {
+ "epoch": 51.94550408719346,
+ "grad_norm": 4.265829563140869,
+ "learning_rate": 9.855717133559082e-06,
+ "loss": 0.3549,
+ "step": 19064
+ },
+ {
+ "epoch": 51.94822888283379,
+ "grad_norm": 5.327817440032959,
+ "learning_rate": 9.854834731348017e-06,
+ "loss": 0.1134,
+ "step": 19065
+ },
+ {
+ "epoch": 51.950953678474114,
+ "grad_norm": 4.612740993499756,
+ "learning_rate": 9.853952330267494e-06,
+ "loss": 0.1141,
+ "step": 19066
+ },
+ {
+ "epoch": 51.95367847411444,
+ "grad_norm": 5.05368709564209,
+ "learning_rate": 9.853069930324386e-06,
+ "loss": 0.1647,
+ "step": 19067
+ },
+ {
+ "epoch": 51.956403269754766,
+ "grad_norm": 8.820033073425293,
+ "learning_rate": 9.852187531525563e-06,
+ "loss": 0.2022,
+ "step": 19068
+ },
+ {
+ "epoch": 51.95912806539509,
+ "grad_norm": 7.538532733917236,
+ "learning_rate": 9.8513051338779e-06,
+ "loss": 0.1246,
+ "step": 19069
+ },
+ {
+ "epoch": 51.961852861035425,
+ "grad_norm": 9.275288581848145,
+ "learning_rate": 9.850422737388266e-06,
+ "loss": 0.1403,
+ "step": 19070
+ },
+ {
+ "epoch": 51.96457765667575,
+ "grad_norm": 4.492852210998535,
+ "learning_rate": 9.849540342063538e-06,
+ "loss": 0.0984,
+ "step": 19071
+ },
+ {
+ "epoch": 51.967302452316076,
+ "grad_norm": 5.652397632598877,
+ "learning_rate": 9.848657947910582e-06,
+ "loss": 0.2101,
+ "step": 19072
+ },
+ {
+ "epoch": 51.9700272479564,
+ "grad_norm": 4.326151371002197,
+ "learning_rate": 9.84777555493627e-06,
+ "loss": 0.3379,
+ "step": 19073
+ },
+ {
+ "epoch": 51.97275204359673,
+ "grad_norm": 7.145446300506592,
+ "learning_rate": 9.84689316314748e-06,
+ "loss": 0.1147,
+ "step": 19074
+ },
+ {
+ "epoch": 51.97547683923706,
+ "grad_norm": 5.152425765991211,
+ "learning_rate": 9.846010772551083e-06,
+ "loss": 0.1434,
+ "step": 19075
+ },
+ {
+ "epoch": 51.97820163487739,
+ "grad_norm": 4.132455825805664,
+ "learning_rate": 9.845128383153948e-06,
+ "loss": 0.1292,
+ "step": 19076
+ },
+ {
+ "epoch": 51.98092643051771,
+ "grad_norm": 5.042201995849609,
+ "learning_rate": 9.84424599496295e-06,
+ "loss": 0.2215,
+ "step": 19077
+ },
+ {
+ "epoch": 51.98365122615804,
+ "grad_norm": 4.171875476837158,
+ "learning_rate": 9.843363607984957e-06,
+ "loss": 0.1582,
+ "step": 19078
+ },
+ {
+ "epoch": 51.986376021798364,
+ "grad_norm": 5.28590726852417,
+ "learning_rate": 9.842481222226845e-06,
+ "loss": 0.1508,
+ "step": 19079
+ },
+ {
+ "epoch": 51.98910081743869,
+ "grad_norm": 5.6133198738098145,
+ "learning_rate": 9.841598837695482e-06,
+ "loss": 0.1724,
+ "step": 19080
+ },
+ {
+ "epoch": 51.991825613079016,
+ "grad_norm": 4.963491439819336,
+ "learning_rate": 9.840716454397746e-06,
+ "loss": 0.1653,
+ "step": 19081
+ },
+ {
+ "epoch": 51.99455040871935,
+ "grad_norm": 5.135807991027832,
+ "learning_rate": 9.8398340723405e-06,
+ "loss": 0.1413,
+ "step": 19082
+ },
+ {
+ "epoch": 51.997275204359674,
+ "grad_norm": 5.180513858795166,
+ "learning_rate": 9.838951691530625e-06,
+ "loss": 0.1247,
+ "step": 19083
+ },
+ {
+ "epoch": 52.0,
+ "grad_norm": 3.206604242324829,
+ "learning_rate": 9.838069311974986e-06,
+ "loss": 0.0588,
+ "step": 19084
+ },
+ {
+ "epoch": 52.002724795640326,
+ "grad_norm": 5.357468605041504,
+ "learning_rate": 9.837186933680462e-06,
+ "loss": 0.1203,
+ "step": 19085
+ },
+ {
+ "epoch": 52.00544959128065,
+ "grad_norm": 4.185212135314941,
+ "learning_rate": 9.836304556653916e-06,
+ "loss": 0.1916,
+ "step": 19086
+ },
+ {
+ "epoch": 52.00817438692098,
+ "grad_norm": 5.570226192474365,
+ "learning_rate": 9.835422180902228e-06,
+ "loss": 0.1843,
+ "step": 19087
+ },
+ {
+ "epoch": 52.01089918256131,
+ "grad_norm": 4.808948040008545,
+ "learning_rate": 9.834539806432267e-06,
+ "loss": 0.1085,
+ "step": 19088
+ },
+ {
+ "epoch": 52.013623978201636,
+ "grad_norm": 4.601601600646973,
+ "learning_rate": 9.833657433250904e-06,
+ "loss": 0.1868,
+ "step": 19089
+ },
+ {
+ "epoch": 52.01634877384196,
+ "grad_norm": 7.2745361328125,
+ "learning_rate": 9.832775061365008e-06,
+ "loss": 0.0949,
+ "step": 19090
+ },
+ {
+ "epoch": 52.01907356948229,
+ "grad_norm": 4.245944976806641,
+ "learning_rate": 9.831892690781457e-06,
+ "loss": 0.1617,
+ "step": 19091
+ },
+ {
+ "epoch": 52.02179836512261,
+ "grad_norm": 3.1831865310668945,
+ "learning_rate": 9.831010321507122e-06,
+ "loss": 0.1959,
+ "step": 19092
+ },
+ {
+ "epoch": 52.02452316076294,
+ "grad_norm": 4.060930252075195,
+ "learning_rate": 9.830127953548872e-06,
+ "loss": 0.0862,
+ "step": 19093
+ },
+ {
+ "epoch": 52.02724795640327,
+ "grad_norm": 4.801197528839111,
+ "learning_rate": 9.82924558691358e-06,
+ "loss": 0.1185,
+ "step": 19094
+ },
+ {
+ "epoch": 52.0299727520436,
+ "grad_norm": 6.656748294830322,
+ "learning_rate": 9.828363221608118e-06,
+ "loss": 0.0909,
+ "step": 19095
+ },
+ {
+ "epoch": 52.032697547683924,
+ "grad_norm": 6.821707725524902,
+ "learning_rate": 9.827480857639357e-06,
+ "loss": 0.161,
+ "step": 19096
+ },
+ {
+ "epoch": 52.03542234332425,
+ "grad_norm": 3.8699491024017334,
+ "learning_rate": 9.826598495014172e-06,
+ "loss": 0.1075,
+ "step": 19097
+ },
+ {
+ "epoch": 52.038147138964575,
+ "grad_norm": 3.5079822540283203,
+ "learning_rate": 9.82571613373943e-06,
+ "loss": 0.1131,
+ "step": 19098
+ },
+ {
+ "epoch": 52.0408719346049,
+ "grad_norm": 3.8385355472564697,
+ "learning_rate": 9.824833773822006e-06,
+ "loss": 0.2495,
+ "step": 19099
+ },
+ {
+ "epoch": 52.043596730245234,
+ "grad_norm": 6.233022212982178,
+ "learning_rate": 9.82395141526877e-06,
+ "loss": 0.1038,
+ "step": 19100
+ },
+ {
+ "epoch": 52.04632152588556,
+ "grad_norm": 5.880666255950928,
+ "learning_rate": 9.823069058086597e-06,
+ "loss": 0.1858,
+ "step": 19101
+ },
+ {
+ "epoch": 52.049046321525886,
+ "grad_norm": 5.460610389709473,
+ "learning_rate": 9.822186702282354e-06,
+ "loss": 0.2856,
+ "step": 19102
+ },
+ {
+ "epoch": 52.05177111716621,
+ "grad_norm": 4.017082214355469,
+ "learning_rate": 9.821304347862917e-06,
+ "loss": 0.1405,
+ "step": 19103
+ },
+ {
+ "epoch": 52.05449591280654,
+ "grad_norm": 7.076798915863037,
+ "learning_rate": 9.820421994835154e-06,
+ "loss": 0.2079,
+ "step": 19104
+ },
+ {
+ "epoch": 52.05722070844686,
+ "grad_norm": 4.44091272354126,
+ "learning_rate": 9.81953964320594e-06,
+ "loss": 0.0803,
+ "step": 19105
+ },
+ {
+ "epoch": 52.059945504087196,
+ "grad_norm": 5.3109564781188965,
+ "learning_rate": 9.818657292982146e-06,
+ "loss": 0.1039,
+ "step": 19106
+ },
+ {
+ "epoch": 52.06267029972752,
+ "grad_norm": 4.658829689025879,
+ "learning_rate": 9.817774944170638e-06,
+ "loss": 0.1626,
+ "step": 19107
+ },
+ {
+ "epoch": 52.06539509536785,
+ "grad_norm": 4.813467502593994,
+ "learning_rate": 9.816892596778299e-06,
+ "loss": 0.1605,
+ "step": 19108
+ },
+ {
+ "epoch": 52.06811989100817,
+ "grad_norm": 4.176400184631348,
+ "learning_rate": 9.816010250811993e-06,
+ "loss": 0.2054,
+ "step": 19109
+ },
+ {
+ "epoch": 52.0708446866485,
+ "grad_norm": 8.531670570373535,
+ "learning_rate": 9.815127906278595e-06,
+ "loss": 0.2266,
+ "step": 19110
+ },
+ {
+ "epoch": 52.073569482288825,
+ "grad_norm": 4.211588382720947,
+ "learning_rate": 9.814245563184971e-06,
+ "loss": 0.2232,
+ "step": 19111
+ },
+ {
+ "epoch": 52.07629427792916,
+ "grad_norm": 4.5949387550354,
+ "learning_rate": 9.813363221538e-06,
+ "loss": 0.1642,
+ "step": 19112
+ },
+ {
+ "epoch": 52.079019073569484,
+ "grad_norm": 4.175572872161865,
+ "learning_rate": 9.812480881344548e-06,
+ "loss": 0.1366,
+ "step": 19113
+ },
+ {
+ "epoch": 52.08174386920981,
+ "grad_norm": 3.458845615386963,
+ "learning_rate": 9.811598542611492e-06,
+ "loss": 0.1829,
+ "step": 19114
+ },
+ {
+ "epoch": 52.084468664850135,
+ "grad_norm": 4.565491676330566,
+ "learning_rate": 9.810716205345695e-06,
+ "loss": 0.2216,
+ "step": 19115
+ },
+ {
+ "epoch": 52.08719346049046,
+ "grad_norm": 4.427910804748535,
+ "learning_rate": 9.80983386955404e-06,
+ "loss": 0.1551,
+ "step": 19116
+ },
+ {
+ "epoch": 52.08991825613079,
+ "grad_norm": 4.134413719177246,
+ "learning_rate": 9.808951535243389e-06,
+ "loss": 0.2118,
+ "step": 19117
+ },
+ {
+ "epoch": 52.09264305177112,
+ "grad_norm": 4.23202657699585,
+ "learning_rate": 9.808069202420617e-06,
+ "loss": 0.1259,
+ "step": 19118
+ },
+ {
+ "epoch": 52.095367847411445,
+ "grad_norm": 3.89436936378479,
+ "learning_rate": 9.8071868710926e-06,
+ "loss": 0.2316,
+ "step": 19119
+ },
+ {
+ "epoch": 52.09809264305177,
+ "grad_norm": 5.763807773590088,
+ "learning_rate": 9.8063045412662e-06,
+ "loss": 0.1645,
+ "step": 19120
+ },
+ {
+ "epoch": 52.1008174386921,
+ "grad_norm": 4.004239082336426,
+ "learning_rate": 9.805422212948297e-06,
+ "loss": 0.0766,
+ "step": 19121
+ },
+ {
+ "epoch": 52.10354223433242,
+ "grad_norm": 3.9072365760803223,
+ "learning_rate": 9.80453988614576e-06,
+ "loss": 0.1027,
+ "step": 19122
+ },
+ {
+ "epoch": 52.10626702997275,
+ "grad_norm": 4.546239852905273,
+ "learning_rate": 9.80365756086546e-06,
+ "loss": 0.2511,
+ "step": 19123
+ },
+ {
+ "epoch": 52.10899182561308,
+ "grad_norm": 3.611271858215332,
+ "learning_rate": 9.802775237114267e-06,
+ "loss": 0.0702,
+ "step": 19124
+ },
+ {
+ "epoch": 52.11171662125341,
+ "grad_norm": 4.813879489898682,
+ "learning_rate": 9.801892914899051e-06,
+ "loss": 0.1756,
+ "step": 19125
+ },
+ {
+ "epoch": 52.11444141689373,
+ "grad_norm": 3.95748233795166,
+ "learning_rate": 9.801010594226691e-06,
+ "loss": 0.1067,
+ "step": 19126
+ },
+ {
+ "epoch": 52.11716621253406,
+ "grad_norm": 3.612278461456299,
+ "learning_rate": 9.800128275104054e-06,
+ "loss": 0.0726,
+ "step": 19127
+ },
+ {
+ "epoch": 52.119891008174385,
+ "grad_norm": 3.7307493686676025,
+ "learning_rate": 9.799245957538013e-06,
+ "loss": 0.0693,
+ "step": 19128
+ },
+ {
+ "epoch": 52.12261580381471,
+ "grad_norm": 4.682528972625732,
+ "learning_rate": 9.798363641535434e-06,
+ "loss": 0.1538,
+ "step": 19129
+ },
+ {
+ "epoch": 52.12534059945504,
+ "grad_norm": 4.460844039916992,
+ "learning_rate": 9.797481327103196e-06,
+ "loss": 0.1456,
+ "step": 19130
+ },
+ {
+ "epoch": 52.12806539509537,
+ "grad_norm": 4.052233695983887,
+ "learning_rate": 9.796599014248164e-06,
+ "loss": 0.0777,
+ "step": 19131
+ },
+ {
+ "epoch": 52.130790190735695,
+ "grad_norm": 6.026838779449463,
+ "learning_rate": 9.795716702977216e-06,
+ "loss": 0.0797,
+ "step": 19132
+ },
+ {
+ "epoch": 52.13351498637602,
+ "grad_norm": 4.016129016876221,
+ "learning_rate": 9.794834393297217e-06,
+ "loss": 0.1709,
+ "step": 19133
+ },
+ {
+ "epoch": 52.13623978201635,
+ "grad_norm": 3.1839075088500977,
+ "learning_rate": 9.793952085215043e-06,
+ "loss": 0.0997,
+ "step": 19134
+ },
+ {
+ "epoch": 52.13896457765667,
+ "grad_norm": 5.489106178283691,
+ "learning_rate": 9.793069778737561e-06,
+ "loss": 0.2695,
+ "step": 19135
+ },
+ {
+ "epoch": 52.141689373297005,
+ "grad_norm": 4.77548885345459,
+ "learning_rate": 9.792187473871648e-06,
+ "loss": 0.3013,
+ "step": 19136
+ },
+ {
+ "epoch": 52.14441416893733,
+ "grad_norm": 4.23523473739624,
+ "learning_rate": 9.79130517062417e-06,
+ "loss": 0.1891,
+ "step": 19137
+ },
+ {
+ "epoch": 52.14713896457766,
+ "grad_norm": 4.312173366546631,
+ "learning_rate": 9.790422869002003e-06,
+ "loss": 0.1265,
+ "step": 19138
+ },
+ {
+ "epoch": 52.14986376021798,
+ "grad_norm": 5.366184711456299,
+ "learning_rate": 9.789540569012012e-06,
+ "loss": 0.0827,
+ "step": 19139
+ },
+ {
+ "epoch": 52.15258855585831,
+ "grad_norm": 6.901341915130615,
+ "learning_rate": 9.788658270661076e-06,
+ "loss": 0.1,
+ "step": 19140
+ },
+ {
+ "epoch": 52.155313351498634,
+ "grad_norm": 4.667526721954346,
+ "learning_rate": 9.78777597395606e-06,
+ "loss": 0.1889,
+ "step": 19141
+ },
+ {
+ "epoch": 52.15803814713897,
+ "grad_norm": 5.528557777404785,
+ "learning_rate": 9.786893678903835e-06,
+ "loss": 0.1324,
+ "step": 19142
+ },
+ {
+ "epoch": 52.16076294277929,
+ "grad_norm": 3.8147330284118652,
+ "learning_rate": 9.786011385511279e-06,
+ "loss": 0.0893,
+ "step": 19143
+ },
+ {
+ "epoch": 52.16348773841962,
+ "grad_norm": 3.9426429271698,
+ "learning_rate": 9.78512909378526e-06,
+ "loss": 0.0894,
+ "step": 19144
+ },
+ {
+ "epoch": 52.166212534059945,
+ "grad_norm": 4.193362236022949,
+ "learning_rate": 9.784246803732648e-06,
+ "loss": 0.1798,
+ "step": 19145
+ },
+ {
+ "epoch": 52.16893732970027,
+ "grad_norm": 3.5375497341156006,
+ "learning_rate": 9.783364515360315e-06,
+ "loss": 0.1651,
+ "step": 19146
+ },
+ {
+ "epoch": 52.171662125340596,
+ "grad_norm": 10.843406677246094,
+ "learning_rate": 9.782482228675132e-06,
+ "loss": 0.3171,
+ "step": 19147
+ },
+ {
+ "epoch": 52.17438692098093,
+ "grad_norm": 4.114462852478027,
+ "learning_rate": 9.781599943683972e-06,
+ "loss": 0.1131,
+ "step": 19148
+ },
+ {
+ "epoch": 52.177111716621255,
+ "grad_norm": 4.447324752807617,
+ "learning_rate": 9.780717660393702e-06,
+ "loss": 0.2078,
+ "step": 19149
+ },
+ {
+ "epoch": 52.17983651226158,
+ "grad_norm": 15.412213325500488,
+ "learning_rate": 9.7798353788112e-06,
+ "loss": 0.1368,
+ "step": 19150
+ },
+ {
+ "epoch": 52.182561307901906,
+ "grad_norm": 4.740209102630615,
+ "learning_rate": 9.778953098943329e-06,
+ "loss": 0.164,
+ "step": 19151
+ },
+ {
+ "epoch": 52.18528610354223,
+ "grad_norm": 4.917448997497559,
+ "learning_rate": 9.778070820796966e-06,
+ "loss": 0.1054,
+ "step": 19152
+ },
+ {
+ "epoch": 52.18801089918256,
+ "grad_norm": 4.078722953796387,
+ "learning_rate": 9.777188544378979e-06,
+ "loss": 0.2942,
+ "step": 19153
+ },
+ {
+ "epoch": 52.19073569482289,
+ "grad_norm": 7.165360927581787,
+ "learning_rate": 9.77630626969624e-06,
+ "loss": 0.1162,
+ "step": 19154
+ },
+ {
+ "epoch": 52.19346049046322,
+ "grad_norm": 6.1595258712768555,
+ "learning_rate": 9.775423996755622e-06,
+ "loss": 0.1511,
+ "step": 19155
+ },
+ {
+ "epoch": 52.19618528610354,
+ "grad_norm": 4.429165363311768,
+ "learning_rate": 9.774541725563996e-06,
+ "loss": 0.0787,
+ "step": 19156
+ },
+ {
+ "epoch": 52.19891008174387,
+ "grad_norm": 4.14840841293335,
+ "learning_rate": 9.773659456128229e-06,
+ "loss": 0.1928,
+ "step": 19157
+ },
+ {
+ "epoch": 52.201634877384194,
+ "grad_norm": 4.104926109313965,
+ "learning_rate": 9.772777188455196e-06,
+ "loss": 0.0826,
+ "step": 19158
+ },
+ {
+ "epoch": 52.20435967302452,
+ "grad_norm": 6.021915435791016,
+ "learning_rate": 9.771894922551763e-06,
+ "loss": 0.2946,
+ "step": 19159
+ },
+ {
+ "epoch": 52.20708446866485,
+ "grad_norm": 3.799884557723999,
+ "learning_rate": 9.771012658424808e-06,
+ "loss": 0.0798,
+ "step": 19160
+ },
+ {
+ "epoch": 52.20980926430518,
+ "grad_norm": 3.756002187728882,
+ "learning_rate": 9.7701303960812e-06,
+ "loss": 0.1701,
+ "step": 19161
+ },
+ {
+ "epoch": 52.212534059945504,
+ "grad_norm": 4.617569923400879,
+ "learning_rate": 9.76924813552781e-06,
+ "loss": 0.1818,
+ "step": 19162
+ },
+ {
+ "epoch": 52.21525885558583,
+ "grad_norm": 4.105844497680664,
+ "learning_rate": 9.768365876771505e-06,
+ "loss": 0.1153,
+ "step": 19163
+ },
+ {
+ "epoch": 52.217983651226156,
+ "grad_norm": 4.216437816619873,
+ "learning_rate": 9.767483619819164e-06,
+ "loss": 0.1544,
+ "step": 19164
+ },
+ {
+ "epoch": 52.22070844686648,
+ "grad_norm": 5.39052152633667,
+ "learning_rate": 9.766601364677648e-06,
+ "loss": 0.1662,
+ "step": 19165
+ },
+ {
+ "epoch": 52.223433242506815,
+ "grad_norm": 4.8423895835876465,
+ "learning_rate": 9.765719111353837e-06,
+ "loss": 0.3015,
+ "step": 19166
+ },
+ {
+ "epoch": 52.22615803814714,
+ "grad_norm": 4.74192476272583,
+ "learning_rate": 9.764836859854595e-06,
+ "loss": 0.2087,
+ "step": 19167
+ },
+ {
+ "epoch": 52.228882833787466,
+ "grad_norm": 5.739588260650635,
+ "learning_rate": 9.763954610186798e-06,
+ "loss": 0.104,
+ "step": 19168
+ },
+ {
+ "epoch": 52.23160762942779,
+ "grad_norm": 6.070648670196533,
+ "learning_rate": 9.763072362357315e-06,
+ "loss": 0.1366,
+ "step": 19169
+ },
+ {
+ "epoch": 52.23433242506812,
+ "grad_norm": 4.204780101776123,
+ "learning_rate": 9.762190116373017e-06,
+ "loss": 0.2565,
+ "step": 19170
+ },
+ {
+ "epoch": 52.237057220708444,
+ "grad_norm": 4.189395427703857,
+ "learning_rate": 9.761307872240773e-06,
+ "loss": 0.1398,
+ "step": 19171
+ },
+ {
+ "epoch": 52.23978201634878,
+ "grad_norm": 3.492771625518799,
+ "learning_rate": 9.760425629967457e-06,
+ "loss": 0.1139,
+ "step": 19172
+ },
+ {
+ "epoch": 52.2425068119891,
+ "grad_norm": 4.4667840003967285,
+ "learning_rate": 9.759543389559937e-06,
+ "loss": 0.0829,
+ "step": 19173
+ },
+ {
+ "epoch": 52.24523160762943,
+ "grad_norm": 4.1979522705078125,
+ "learning_rate": 9.758661151025087e-06,
+ "loss": 0.0752,
+ "step": 19174
+ },
+ {
+ "epoch": 52.247956403269754,
+ "grad_norm": 4.452780246734619,
+ "learning_rate": 9.757778914369774e-06,
+ "loss": 0.092,
+ "step": 19175
+ },
+ {
+ "epoch": 52.25068119891008,
+ "grad_norm": 5.760451793670654,
+ "learning_rate": 9.75689667960087e-06,
+ "loss": 0.1678,
+ "step": 19176
+ },
+ {
+ "epoch": 52.253405994550405,
+ "grad_norm": 4.483896255493164,
+ "learning_rate": 9.75601444672525e-06,
+ "loss": 0.1453,
+ "step": 19177
+ },
+ {
+ "epoch": 52.25613079019074,
+ "grad_norm": 4.075677394866943,
+ "learning_rate": 9.75513221574978e-06,
+ "loss": 0.1116,
+ "step": 19178
+ },
+ {
+ "epoch": 52.258855585831064,
+ "grad_norm": 3.575446367263794,
+ "learning_rate": 9.754249986681334e-06,
+ "loss": 0.065,
+ "step": 19179
+ },
+ {
+ "epoch": 52.26158038147139,
+ "grad_norm": 4.823285102844238,
+ "learning_rate": 9.75336775952678e-06,
+ "loss": 0.164,
+ "step": 19180
+ },
+ {
+ "epoch": 52.264305177111716,
+ "grad_norm": 4.425245761871338,
+ "learning_rate": 9.752485534292992e-06,
+ "loss": 0.0766,
+ "step": 19181
+ },
+ {
+ "epoch": 52.26702997275204,
+ "grad_norm": 5.054012298583984,
+ "learning_rate": 9.751603310986835e-06,
+ "loss": 0.1827,
+ "step": 19182
+ },
+ {
+ "epoch": 52.26975476839237,
+ "grad_norm": 3.997870922088623,
+ "learning_rate": 9.750721089615185e-06,
+ "loss": 0.0808,
+ "step": 19183
+ },
+ {
+ "epoch": 52.2724795640327,
+ "grad_norm": 3.9631030559539795,
+ "learning_rate": 9.749838870184914e-06,
+ "loss": 0.1113,
+ "step": 19184
+ },
+ {
+ "epoch": 52.275204359673026,
+ "grad_norm": 4.400388240814209,
+ "learning_rate": 9.748956652702885e-06,
+ "loss": 0.1463,
+ "step": 19185
+ },
+ {
+ "epoch": 52.27792915531335,
+ "grad_norm": 4.180642127990723,
+ "learning_rate": 9.748074437175979e-06,
+ "loss": 0.3338,
+ "step": 19186
+ },
+ {
+ "epoch": 52.28065395095368,
+ "grad_norm": 3.2455155849456787,
+ "learning_rate": 9.747192223611055e-06,
+ "loss": 0.1908,
+ "step": 19187
+ },
+ {
+ "epoch": 52.283378746594,
+ "grad_norm": 6.889337062835693,
+ "learning_rate": 9.746310012014996e-06,
+ "loss": 0.1829,
+ "step": 19188
+ },
+ {
+ "epoch": 52.28610354223433,
+ "grad_norm": 4.764960289001465,
+ "learning_rate": 9.745427802394662e-06,
+ "loss": 0.2042,
+ "step": 19189
+ },
+ {
+ "epoch": 52.28882833787466,
+ "grad_norm": 3.8126718997955322,
+ "learning_rate": 9.74454559475693e-06,
+ "loss": 0.0861,
+ "step": 19190
+ },
+ {
+ "epoch": 52.29155313351499,
+ "grad_norm": 3.9455277919769287,
+ "learning_rate": 9.743663389108667e-06,
+ "loss": 0.093,
+ "step": 19191
+ },
+ {
+ "epoch": 52.294277929155314,
+ "grad_norm": 4.232730388641357,
+ "learning_rate": 9.742781185456748e-06,
+ "loss": 0.2172,
+ "step": 19192
+ },
+ {
+ "epoch": 52.29700272479564,
+ "grad_norm": 11.808323860168457,
+ "learning_rate": 9.74189898380804e-06,
+ "loss": 0.0975,
+ "step": 19193
+ },
+ {
+ "epoch": 52.299727520435965,
+ "grad_norm": 4.863210201263428,
+ "learning_rate": 9.741016784169409e-06,
+ "loss": 0.1337,
+ "step": 19194
+ },
+ {
+ "epoch": 52.30245231607629,
+ "grad_norm": 4.657174587249756,
+ "learning_rate": 9.740134586547737e-06,
+ "loss": 0.1553,
+ "step": 19195
+ },
+ {
+ "epoch": 52.305177111716624,
+ "grad_norm": 2.96730899810791,
+ "learning_rate": 9.739252390949887e-06,
+ "loss": 0.2061,
+ "step": 19196
+ },
+ {
+ "epoch": 52.30790190735695,
+ "grad_norm": 4.627375602722168,
+ "learning_rate": 9.738370197382732e-06,
+ "loss": 0.1023,
+ "step": 19197
+ },
+ {
+ "epoch": 52.310626702997276,
+ "grad_norm": 3.875765562057495,
+ "learning_rate": 9.73748800585314e-06,
+ "loss": 0.0961,
+ "step": 19198
+ },
+ {
+ "epoch": 52.3133514986376,
+ "grad_norm": 4.1032915115356445,
+ "learning_rate": 9.736605816367984e-06,
+ "loss": 0.1447,
+ "step": 19199
+ },
+ {
+ "epoch": 52.31607629427793,
+ "grad_norm": 4.122752666473389,
+ "learning_rate": 9.735723628934132e-06,
+ "loss": 0.0795,
+ "step": 19200
+ },
+ {
+ "epoch": 52.31880108991825,
+ "grad_norm": 4.321817874908447,
+ "learning_rate": 9.73484144355846e-06,
+ "loss": 0.332,
+ "step": 19201
+ },
+ {
+ "epoch": 52.321525885558586,
+ "grad_norm": 4.540710926055908,
+ "learning_rate": 9.733959260247829e-06,
+ "loss": 0.1718,
+ "step": 19202
+ },
+ {
+ "epoch": 52.32425068119891,
+ "grad_norm": 4.2653937339782715,
+ "learning_rate": 9.733077079009118e-06,
+ "loss": 0.1837,
+ "step": 19203
+ },
+ {
+ "epoch": 52.32697547683924,
+ "grad_norm": 3.323207378387451,
+ "learning_rate": 9.732194899849192e-06,
+ "loss": 0.1834,
+ "step": 19204
+ },
+ {
+ "epoch": 52.32970027247956,
+ "grad_norm": 3.735625982284546,
+ "learning_rate": 9.731312722774924e-06,
+ "loss": 0.1162,
+ "step": 19205
+ },
+ {
+ "epoch": 52.33242506811989,
+ "grad_norm": 9.254440307617188,
+ "learning_rate": 9.730430547793186e-06,
+ "loss": 0.1432,
+ "step": 19206
+ },
+ {
+ "epoch": 52.335149863760215,
+ "grad_norm": 4.414444923400879,
+ "learning_rate": 9.729548374910843e-06,
+ "loss": 0.2507,
+ "step": 19207
+ },
+ {
+ "epoch": 52.33787465940055,
+ "grad_norm": 4.62446403503418,
+ "learning_rate": 9.728666204134772e-06,
+ "loss": 0.1977,
+ "step": 19208
+ },
+ {
+ "epoch": 52.34059945504087,
+ "grad_norm": 4.216208457946777,
+ "learning_rate": 9.727784035471837e-06,
+ "loss": 0.1967,
+ "step": 19209
+ },
+ {
+ "epoch": 52.3433242506812,
+ "grad_norm": 3.2713513374328613,
+ "learning_rate": 9.726901868928913e-06,
+ "loss": 0.1025,
+ "step": 19210
+ },
+ {
+ "epoch": 52.346049046321525,
+ "grad_norm": 3.672574281692505,
+ "learning_rate": 9.726019704512864e-06,
+ "loss": 0.0612,
+ "step": 19211
+ },
+ {
+ "epoch": 52.34877384196185,
+ "grad_norm": 4.518486976623535,
+ "learning_rate": 9.725137542230568e-06,
+ "loss": 0.2087,
+ "step": 19212
+ },
+ {
+ "epoch": 52.35149863760218,
+ "grad_norm": 4.896111011505127,
+ "learning_rate": 9.724255382088895e-06,
+ "loss": 0.2777,
+ "step": 19213
+ },
+ {
+ "epoch": 52.35422343324251,
+ "grad_norm": 4.063868999481201,
+ "learning_rate": 9.723373224094708e-06,
+ "loss": 0.1814,
+ "step": 19214
+ },
+ {
+ "epoch": 52.356948228882835,
+ "grad_norm": 4.255677223205566,
+ "learning_rate": 9.722491068254883e-06,
+ "loss": 0.1455,
+ "step": 19215
+ },
+ {
+ "epoch": 52.35967302452316,
+ "grad_norm": 4.90528678894043,
+ "learning_rate": 9.721608914576288e-06,
+ "loss": 0.102,
+ "step": 19216
+ },
+ {
+ "epoch": 52.36239782016349,
+ "grad_norm": 4.571956157684326,
+ "learning_rate": 9.720726763065795e-06,
+ "loss": 0.2026,
+ "step": 19217
+ },
+ {
+ "epoch": 52.36512261580381,
+ "grad_norm": 4.2854108810424805,
+ "learning_rate": 9.719844613730273e-06,
+ "loss": 0.16,
+ "step": 19218
+ },
+ {
+ "epoch": 52.36784741144414,
+ "grad_norm": 3.9086852073669434,
+ "learning_rate": 9.718962466576592e-06,
+ "loss": 0.1718,
+ "step": 19219
+ },
+ {
+ "epoch": 52.37057220708447,
+ "grad_norm": 5.214824199676514,
+ "learning_rate": 9.71808032161162e-06,
+ "loss": 0.1705,
+ "step": 19220
+ },
+ {
+ "epoch": 52.3732970027248,
+ "grad_norm": 3.797212839126587,
+ "learning_rate": 9.717198178842234e-06,
+ "loss": 0.2025,
+ "step": 19221
+ },
+ {
+ "epoch": 52.37602179836512,
+ "grad_norm": 4.190108776092529,
+ "learning_rate": 9.716316038275295e-06,
+ "loss": 0.082,
+ "step": 19222
+ },
+ {
+ "epoch": 52.37874659400545,
+ "grad_norm": 4.681421279907227,
+ "learning_rate": 9.715433899917682e-06,
+ "loss": 0.2673,
+ "step": 19223
+ },
+ {
+ "epoch": 52.381471389645775,
+ "grad_norm": 5.3838324546813965,
+ "learning_rate": 9.714551763776255e-06,
+ "loss": 0.1939,
+ "step": 19224
+ },
+ {
+ "epoch": 52.3841961852861,
+ "grad_norm": 4.088294506072998,
+ "learning_rate": 9.713669629857894e-06,
+ "loss": 0.1051,
+ "step": 19225
+ },
+ {
+ "epoch": 52.38692098092643,
+ "grad_norm": 3.0899713039398193,
+ "learning_rate": 9.712787498169462e-06,
+ "loss": 0.0621,
+ "step": 19226
+ },
+ {
+ "epoch": 52.38964577656676,
+ "grad_norm": 4.062369346618652,
+ "learning_rate": 9.711905368717834e-06,
+ "loss": 0.1527,
+ "step": 19227
+ },
+ {
+ "epoch": 52.392370572207085,
+ "grad_norm": 4.366440773010254,
+ "learning_rate": 9.711023241509873e-06,
+ "loss": 0.0976,
+ "step": 19228
+ },
+ {
+ "epoch": 52.39509536784741,
+ "grad_norm": 5.699102401733398,
+ "learning_rate": 9.710141116552458e-06,
+ "loss": 0.1762,
+ "step": 19229
+ },
+ {
+ "epoch": 52.39782016348774,
+ "grad_norm": 6.592490196228027,
+ "learning_rate": 9.709258993852453e-06,
+ "loss": 0.1911,
+ "step": 19230
+ },
+ {
+ "epoch": 52.40054495912806,
+ "grad_norm": 5.691075801849365,
+ "learning_rate": 9.708376873416732e-06,
+ "loss": 0.1322,
+ "step": 19231
+ },
+ {
+ "epoch": 52.403269754768395,
+ "grad_norm": 5.219867706298828,
+ "learning_rate": 9.70749475525216e-06,
+ "loss": 0.169,
+ "step": 19232
+ },
+ {
+ "epoch": 52.40599455040872,
+ "grad_norm": 4.067953586578369,
+ "learning_rate": 9.706612639365613e-06,
+ "loss": 0.164,
+ "step": 19233
+ },
+ {
+ "epoch": 52.40871934604905,
+ "grad_norm": 3.9165313243865967,
+ "learning_rate": 9.705730525763951e-06,
+ "loss": 0.1286,
+ "step": 19234
+ },
+ {
+ "epoch": 52.41144414168937,
+ "grad_norm": 3.8384532928466797,
+ "learning_rate": 9.704848414454057e-06,
+ "loss": 0.1876,
+ "step": 19235
+ },
+ {
+ "epoch": 52.4141689373297,
+ "grad_norm": 3.8974759578704834,
+ "learning_rate": 9.70396630544279e-06,
+ "loss": 0.1039,
+ "step": 19236
+ },
+ {
+ "epoch": 52.416893732970024,
+ "grad_norm": 4.8549580574035645,
+ "learning_rate": 9.703084198737028e-06,
+ "loss": 0.1575,
+ "step": 19237
+ },
+ {
+ "epoch": 52.41961852861036,
+ "grad_norm": 4.355259418487549,
+ "learning_rate": 9.702202094343631e-06,
+ "loss": 0.1488,
+ "step": 19238
+ },
+ {
+ "epoch": 52.42234332425068,
+ "grad_norm": 3.9184348583221436,
+ "learning_rate": 9.701319992269479e-06,
+ "loss": 0.0948,
+ "step": 19239
+ },
+ {
+ "epoch": 52.42506811989101,
+ "grad_norm": 4.7135725021362305,
+ "learning_rate": 9.700437892521434e-06,
+ "loss": 0.236,
+ "step": 19240
+ },
+ {
+ "epoch": 52.427792915531334,
+ "grad_norm": 3.2412667274475098,
+ "learning_rate": 9.699555795106373e-06,
+ "loss": 0.0877,
+ "step": 19241
+ },
+ {
+ "epoch": 52.43051771117166,
+ "grad_norm": 4.784268379211426,
+ "learning_rate": 9.698673700031159e-06,
+ "loss": 0.0706,
+ "step": 19242
+ },
+ {
+ "epoch": 52.433242506811986,
+ "grad_norm": 4.160239219665527,
+ "learning_rate": 9.697791607302665e-06,
+ "loss": 0.0824,
+ "step": 19243
+ },
+ {
+ "epoch": 52.43596730245232,
+ "grad_norm": 4.861740589141846,
+ "learning_rate": 9.69690951692776e-06,
+ "loss": 0.179,
+ "step": 19244
+ },
+ {
+ "epoch": 52.438692098092645,
+ "grad_norm": 5.323450565338135,
+ "learning_rate": 9.69602742891331e-06,
+ "loss": 0.1943,
+ "step": 19245
+ },
+ {
+ "epoch": 52.44141689373297,
+ "grad_norm": 5.598095417022705,
+ "learning_rate": 9.695145343266195e-06,
+ "loss": 0.146,
+ "step": 19246
+ },
+ {
+ "epoch": 52.444141689373296,
+ "grad_norm": 4.833616256713867,
+ "learning_rate": 9.694263259993274e-06,
+ "loss": 0.0836,
+ "step": 19247
+ },
+ {
+ "epoch": 52.44686648501362,
+ "grad_norm": 3.781280517578125,
+ "learning_rate": 9.693381179101423e-06,
+ "loss": 0.0723,
+ "step": 19248
+ },
+ {
+ "epoch": 52.44959128065395,
+ "grad_norm": 9.509787559509277,
+ "learning_rate": 9.69249910059751e-06,
+ "loss": 0.1396,
+ "step": 19249
+ },
+ {
+ "epoch": 52.45231607629428,
+ "grad_norm": 4.508984565734863,
+ "learning_rate": 9.691617024488402e-06,
+ "loss": 0.073,
+ "step": 19250
+ },
+ {
+ "epoch": 52.45504087193461,
+ "grad_norm": 5.343342304229736,
+ "learning_rate": 9.690734950780973e-06,
+ "loss": 0.1266,
+ "step": 19251
+ },
+ {
+ "epoch": 52.45776566757493,
+ "grad_norm": 4.149517059326172,
+ "learning_rate": 9.689852879482089e-06,
+ "loss": 0.0921,
+ "step": 19252
+ },
+ {
+ "epoch": 52.46049046321526,
+ "grad_norm": 5.513681888580322,
+ "learning_rate": 9.688970810598622e-06,
+ "loss": 0.1791,
+ "step": 19253
+ },
+ {
+ "epoch": 52.463215258855584,
+ "grad_norm": 3.3647594451904297,
+ "learning_rate": 9.688088744137438e-06,
+ "loss": 0.1007,
+ "step": 19254
+ },
+ {
+ "epoch": 52.46594005449591,
+ "grad_norm": 3.7131452560424805,
+ "learning_rate": 9.687206680105412e-06,
+ "loss": 0.0605,
+ "step": 19255
+ },
+ {
+ "epoch": 52.46866485013624,
+ "grad_norm": 4.058668613433838,
+ "learning_rate": 9.686324618509409e-06,
+ "loss": 0.0623,
+ "step": 19256
+ },
+ {
+ "epoch": 52.47138964577657,
+ "grad_norm": 5.368107795715332,
+ "learning_rate": 9.6854425593563e-06,
+ "loss": 0.0909,
+ "step": 19257
+ },
+ {
+ "epoch": 52.474114441416894,
+ "grad_norm": 4.719025611877441,
+ "learning_rate": 9.684560502652952e-06,
+ "loss": 0.1163,
+ "step": 19258
+ },
+ {
+ "epoch": 52.47683923705722,
+ "grad_norm": 3.9193098545074463,
+ "learning_rate": 9.68367844840624e-06,
+ "loss": 0.157,
+ "step": 19259
+ },
+ {
+ "epoch": 52.479564032697546,
+ "grad_norm": 4.803292751312256,
+ "learning_rate": 9.682796396623027e-06,
+ "loss": 0.1858,
+ "step": 19260
+ },
+ {
+ "epoch": 52.48228882833787,
+ "grad_norm": 3.553367853164673,
+ "learning_rate": 9.681914347310188e-06,
+ "loss": 0.0781,
+ "step": 19261
+ },
+ {
+ "epoch": 52.485013623978205,
+ "grad_norm": 6.250884532928467,
+ "learning_rate": 9.681032300474586e-06,
+ "loss": 0.1178,
+ "step": 19262
+ },
+ {
+ "epoch": 52.48773841961853,
+ "grad_norm": 4.706630229949951,
+ "learning_rate": 9.680150256123096e-06,
+ "loss": 0.1932,
+ "step": 19263
+ },
+ {
+ "epoch": 52.490463215258856,
+ "grad_norm": 5.85382080078125,
+ "learning_rate": 9.679268214262588e-06,
+ "loss": 0.1317,
+ "step": 19264
+ },
+ {
+ "epoch": 52.49318801089918,
+ "grad_norm": 5.139765739440918,
+ "learning_rate": 9.678386174899925e-06,
+ "loss": 0.1764,
+ "step": 19265
+ },
+ {
+ "epoch": 52.49591280653951,
+ "grad_norm": 4.154210567474365,
+ "learning_rate": 9.677504138041984e-06,
+ "loss": 0.0861,
+ "step": 19266
+ },
+ {
+ "epoch": 52.49863760217983,
+ "grad_norm": 4.736916542053223,
+ "learning_rate": 9.676622103695628e-06,
+ "loss": 0.1052,
+ "step": 19267
+ },
+ {
+ "epoch": 52.50136239782017,
+ "grad_norm": 3.8731517791748047,
+ "learning_rate": 9.675740071867729e-06,
+ "loss": 0.2096,
+ "step": 19268
+ },
+ {
+ "epoch": 52.50408719346049,
+ "grad_norm": 5.190960884094238,
+ "learning_rate": 9.674858042565157e-06,
+ "loss": 0.1572,
+ "step": 19269
+ },
+ {
+ "epoch": 52.50681198910082,
+ "grad_norm": 5.408673286437988,
+ "learning_rate": 9.673976015794778e-06,
+ "loss": 0.1133,
+ "step": 19270
+ },
+ {
+ "epoch": 52.509536784741144,
+ "grad_norm": 4.685727596282959,
+ "learning_rate": 9.673093991563466e-06,
+ "loss": 0.1489,
+ "step": 19271
+ },
+ {
+ "epoch": 52.51226158038147,
+ "grad_norm": 5.208731651306152,
+ "learning_rate": 9.672211969878085e-06,
+ "loss": 0.2998,
+ "step": 19272
+ },
+ {
+ "epoch": 52.514986376021795,
+ "grad_norm": 4.553671360015869,
+ "learning_rate": 9.671329950745509e-06,
+ "loss": 0.3697,
+ "step": 19273
+ },
+ {
+ "epoch": 52.51771117166213,
+ "grad_norm": 5.830882549285889,
+ "learning_rate": 9.670447934172602e-06,
+ "loss": 0.1832,
+ "step": 19274
+ },
+ {
+ "epoch": 52.520435967302454,
+ "grad_norm": 4.45698356628418,
+ "learning_rate": 9.669565920166238e-06,
+ "loss": 0.1636,
+ "step": 19275
+ },
+ {
+ "epoch": 52.52316076294278,
+ "grad_norm": 4.683032989501953,
+ "learning_rate": 9.668683908733283e-06,
+ "loss": 0.1836,
+ "step": 19276
+ },
+ {
+ "epoch": 52.525885558583106,
+ "grad_norm": 6.098485946655273,
+ "learning_rate": 9.667801899880609e-06,
+ "loss": 0.1793,
+ "step": 19277
+ },
+ {
+ "epoch": 52.52861035422343,
+ "grad_norm": 3.737724781036377,
+ "learning_rate": 9.66691989361508e-06,
+ "loss": 0.1247,
+ "step": 19278
+ },
+ {
+ "epoch": 52.53133514986376,
+ "grad_norm": 3.9942116737365723,
+ "learning_rate": 9.66603788994357e-06,
+ "loss": 0.1259,
+ "step": 19279
+ },
+ {
+ "epoch": 52.53405994550409,
+ "grad_norm": 4.8618035316467285,
+ "learning_rate": 9.665155888872943e-06,
+ "loss": 0.1133,
+ "step": 19280
+ },
+ {
+ "epoch": 52.536784741144416,
+ "grad_norm": 4.010344982147217,
+ "learning_rate": 9.664273890410073e-06,
+ "loss": 0.1095,
+ "step": 19281
+ },
+ {
+ "epoch": 52.53950953678474,
+ "grad_norm": 4.521393775939941,
+ "learning_rate": 9.66339189456183e-06,
+ "loss": 0.1318,
+ "step": 19282
+ },
+ {
+ "epoch": 52.54223433242507,
+ "grad_norm": 5.568043231964111,
+ "learning_rate": 9.662509901335077e-06,
+ "loss": 0.1339,
+ "step": 19283
+ },
+ {
+ "epoch": 52.54495912806539,
+ "grad_norm": 7.71300745010376,
+ "learning_rate": 9.661627910736689e-06,
+ "loss": 0.1413,
+ "step": 19284
+ },
+ {
+ "epoch": 52.54768392370572,
+ "grad_norm": 4.08627986907959,
+ "learning_rate": 9.660745922773529e-06,
+ "loss": 0.0931,
+ "step": 19285
+ },
+ {
+ "epoch": 52.55040871934605,
+ "grad_norm": 4.967341423034668,
+ "learning_rate": 9.65986393745247e-06,
+ "loss": 0.1998,
+ "step": 19286
+ },
+ {
+ "epoch": 52.55313351498638,
+ "grad_norm": 4.925725936889648,
+ "learning_rate": 9.65898195478038e-06,
+ "loss": 0.1094,
+ "step": 19287
+ },
+ {
+ "epoch": 52.555858310626704,
+ "grad_norm": 4.59002685546875,
+ "learning_rate": 9.658099974764129e-06,
+ "loss": 0.085,
+ "step": 19288
+ },
+ {
+ "epoch": 52.55858310626703,
+ "grad_norm": 5.515731334686279,
+ "learning_rate": 9.65721799741058e-06,
+ "loss": 0.2105,
+ "step": 19289
+ },
+ {
+ "epoch": 52.561307901907355,
+ "grad_norm": 4.188617706298828,
+ "learning_rate": 9.656336022726612e-06,
+ "loss": 0.076,
+ "step": 19290
+ },
+ {
+ "epoch": 52.56403269754768,
+ "grad_norm": 4.015984535217285,
+ "learning_rate": 9.655454050719081e-06,
+ "loss": 0.14,
+ "step": 19291
+ },
+ {
+ "epoch": 52.566757493188014,
+ "grad_norm": 3.490887403488159,
+ "learning_rate": 9.654572081394868e-06,
+ "loss": 0.068,
+ "step": 19292
+ },
+ {
+ "epoch": 52.56948228882834,
+ "grad_norm": 4.456308364868164,
+ "learning_rate": 9.653690114760835e-06,
+ "loss": 0.0687,
+ "step": 19293
+ },
+ {
+ "epoch": 52.572207084468666,
+ "grad_norm": 5.373715400695801,
+ "learning_rate": 9.65280815082385e-06,
+ "loss": 0.2611,
+ "step": 19294
+ },
+ {
+ "epoch": 52.57493188010899,
+ "grad_norm": 4.22686767578125,
+ "learning_rate": 9.65192618959079e-06,
+ "loss": 0.2667,
+ "step": 19295
+ },
+ {
+ "epoch": 52.57765667574932,
+ "grad_norm": 4.848435401916504,
+ "learning_rate": 9.651044231068513e-06,
+ "loss": 0.116,
+ "step": 19296
+ },
+ {
+ "epoch": 52.58038147138964,
+ "grad_norm": 5.875431537628174,
+ "learning_rate": 9.650162275263889e-06,
+ "loss": 0.2575,
+ "step": 19297
+ },
+ {
+ "epoch": 52.583106267029976,
+ "grad_norm": 5.266987323760986,
+ "learning_rate": 9.649280322183796e-06,
+ "loss": 0.099,
+ "step": 19298
+ },
+ {
+ "epoch": 52.5858310626703,
+ "grad_norm": 3.639037609100342,
+ "learning_rate": 9.648398371835094e-06,
+ "loss": 0.1616,
+ "step": 19299
+ },
+ {
+ "epoch": 52.58855585831063,
+ "grad_norm": 4.050128936767578,
+ "learning_rate": 9.647516424224655e-06,
+ "loss": 0.3132,
+ "step": 19300
+ },
+ {
+ "epoch": 52.59128065395095,
+ "grad_norm": 3.4647326469421387,
+ "learning_rate": 9.646634479359346e-06,
+ "loss": 0.0794,
+ "step": 19301
+ },
+ {
+ "epoch": 52.59400544959128,
+ "grad_norm": 5.349648952484131,
+ "learning_rate": 9.645752537246038e-06,
+ "loss": 0.1169,
+ "step": 19302
+ },
+ {
+ "epoch": 52.596730245231605,
+ "grad_norm": 5.098369121551514,
+ "learning_rate": 9.644870597891597e-06,
+ "loss": 0.1406,
+ "step": 19303
+ },
+ {
+ "epoch": 52.59945504087194,
+ "grad_norm": 3.8686046600341797,
+ "learning_rate": 9.643988661302893e-06,
+ "loss": 0.2649,
+ "step": 19304
+ },
+ {
+ "epoch": 52.60217983651226,
+ "grad_norm": 4.619300365447998,
+ "learning_rate": 9.643106727486792e-06,
+ "loss": 0.1186,
+ "step": 19305
+ },
+ {
+ "epoch": 52.60490463215259,
+ "grad_norm": 4.731567859649658,
+ "learning_rate": 9.642224796450165e-06,
+ "loss": 0.2956,
+ "step": 19306
+ },
+ {
+ "epoch": 52.607629427792915,
+ "grad_norm": 4.745423316955566,
+ "learning_rate": 9.64134286819988e-06,
+ "loss": 0.1265,
+ "step": 19307
+ },
+ {
+ "epoch": 52.61035422343324,
+ "grad_norm": 4.2086381912231445,
+ "learning_rate": 9.640460942742806e-06,
+ "loss": 0.0755,
+ "step": 19308
+ },
+ {
+ "epoch": 52.61307901907357,
+ "grad_norm": 5.149787425994873,
+ "learning_rate": 9.63957902008581e-06,
+ "loss": 0.1888,
+ "step": 19309
+ },
+ {
+ "epoch": 52.6158038147139,
+ "grad_norm": 3.8726794719696045,
+ "learning_rate": 9.638697100235763e-06,
+ "loss": 0.1378,
+ "step": 19310
+ },
+ {
+ "epoch": 52.618528610354225,
+ "grad_norm": 3.5131676197052,
+ "learning_rate": 9.637815183199527e-06,
+ "loss": 0.0739,
+ "step": 19311
+ },
+ {
+ "epoch": 52.62125340599455,
+ "grad_norm": 4.361724376678467,
+ "learning_rate": 9.636933268983979e-06,
+ "loss": 0.1274,
+ "step": 19312
+ },
+ {
+ "epoch": 52.62397820163488,
+ "grad_norm": 4.908632278442383,
+ "learning_rate": 9.636051357595979e-06,
+ "loss": 0.0928,
+ "step": 19313
+ },
+ {
+ "epoch": 52.6267029972752,
+ "grad_norm": 3.4299521446228027,
+ "learning_rate": 9.635169449042398e-06,
+ "loss": 0.1616,
+ "step": 19314
+ },
+ {
+ "epoch": 52.62942779291553,
+ "grad_norm": 5.611042022705078,
+ "learning_rate": 9.634287543330109e-06,
+ "loss": 0.1075,
+ "step": 19315
+ },
+ {
+ "epoch": 52.63215258855586,
+ "grad_norm": 5.181185722351074,
+ "learning_rate": 9.633405640465977e-06,
+ "loss": 0.1499,
+ "step": 19316
+ },
+ {
+ "epoch": 52.63487738419619,
+ "grad_norm": 3.2112326622009277,
+ "learning_rate": 9.632523740456869e-06,
+ "loss": 0.1762,
+ "step": 19317
+ },
+ {
+ "epoch": 52.63760217983651,
+ "grad_norm": 4.11383581161499,
+ "learning_rate": 9.631641843309656e-06,
+ "loss": 0.082,
+ "step": 19318
+ },
+ {
+ "epoch": 52.64032697547684,
+ "grad_norm": 4.444210529327393,
+ "learning_rate": 9.630759949031203e-06,
+ "loss": 0.1227,
+ "step": 19319
+ },
+ {
+ "epoch": 52.643051771117165,
+ "grad_norm": 3.353123664855957,
+ "learning_rate": 9.629878057628382e-06,
+ "loss": 0.1317,
+ "step": 19320
+ },
+ {
+ "epoch": 52.64577656675749,
+ "grad_norm": 4.4403486251831055,
+ "learning_rate": 9.628996169108056e-06,
+ "loss": 0.1149,
+ "step": 19321
+ },
+ {
+ "epoch": 52.64850136239782,
+ "grad_norm": 2.984766960144043,
+ "learning_rate": 9.628114283477098e-06,
+ "loss": 0.0698,
+ "step": 19322
+ },
+ {
+ "epoch": 52.65122615803815,
+ "grad_norm": 3.924394130706787,
+ "learning_rate": 9.62723240074237e-06,
+ "loss": 0.1254,
+ "step": 19323
+ },
+ {
+ "epoch": 52.653950953678475,
+ "grad_norm": 4.6532087326049805,
+ "learning_rate": 9.62635052091075e-06,
+ "loss": 0.0829,
+ "step": 19324
+ },
+ {
+ "epoch": 52.6566757493188,
+ "grad_norm": 3.568769693374634,
+ "learning_rate": 9.625468643989096e-06,
+ "loss": 0.1329,
+ "step": 19325
+ },
+ {
+ "epoch": 52.65940054495913,
+ "grad_norm": 4.401582717895508,
+ "learning_rate": 9.624586769984282e-06,
+ "loss": 0.1092,
+ "step": 19326
+ },
+ {
+ "epoch": 52.66212534059945,
+ "grad_norm": 4.047064781188965,
+ "learning_rate": 9.623704898903173e-06,
+ "loss": 0.0823,
+ "step": 19327
+ },
+ {
+ "epoch": 52.664850136239785,
+ "grad_norm": 6.713965892791748,
+ "learning_rate": 9.622823030752639e-06,
+ "loss": 0.1693,
+ "step": 19328
+ },
+ {
+ "epoch": 52.66757493188011,
+ "grad_norm": 4.513161659240723,
+ "learning_rate": 9.621941165539546e-06,
+ "loss": 0.1448,
+ "step": 19329
+ },
+ {
+ "epoch": 52.67029972752044,
+ "grad_norm": 4.816930294036865,
+ "learning_rate": 9.621059303270765e-06,
+ "loss": 0.113,
+ "step": 19330
+ },
+ {
+ "epoch": 52.67302452316076,
+ "grad_norm": 4.622618675231934,
+ "learning_rate": 9.620177443953156e-06,
+ "loss": 0.0817,
+ "step": 19331
+ },
+ {
+ "epoch": 52.67574931880109,
+ "grad_norm": 3.708385944366455,
+ "learning_rate": 9.619295587593597e-06,
+ "loss": 0.1095,
+ "step": 19332
+ },
+ {
+ "epoch": 52.678474114441414,
+ "grad_norm": 3.9158594608306885,
+ "learning_rate": 9.61841373419895e-06,
+ "loss": 0.0974,
+ "step": 19333
+ },
+ {
+ "epoch": 52.68119891008175,
+ "grad_norm": 5.615607261657715,
+ "learning_rate": 9.617531883776088e-06,
+ "loss": 0.2291,
+ "step": 19334
+ },
+ {
+ "epoch": 52.68392370572207,
+ "grad_norm": 5.181751251220703,
+ "learning_rate": 9.616650036331874e-06,
+ "loss": 0.2695,
+ "step": 19335
+ },
+ {
+ "epoch": 52.6866485013624,
+ "grad_norm": 4.0438151359558105,
+ "learning_rate": 9.615768191873179e-06,
+ "loss": 0.2152,
+ "step": 19336
+ },
+ {
+ "epoch": 52.689373297002724,
+ "grad_norm": 3.4214389324188232,
+ "learning_rate": 9.614886350406865e-06,
+ "loss": 0.0804,
+ "step": 19337
+ },
+ {
+ "epoch": 52.69209809264305,
+ "grad_norm": 3.4087636470794678,
+ "learning_rate": 9.614004511939807e-06,
+ "loss": 0.0582,
+ "step": 19338
+ },
+ {
+ "epoch": 52.694822888283376,
+ "grad_norm": 4.2999043464660645,
+ "learning_rate": 9.613122676478868e-06,
+ "loss": 0.1115,
+ "step": 19339
+ },
+ {
+ "epoch": 52.69754768392371,
+ "grad_norm": 4.865885257720947,
+ "learning_rate": 9.612240844030917e-06,
+ "loss": 0.135,
+ "step": 19340
+ },
+ {
+ "epoch": 52.700272479564035,
+ "grad_norm": 4.982079982757568,
+ "learning_rate": 9.611359014602823e-06,
+ "loss": 0.1326,
+ "step": 19341
+ },
+ {
+ "epoch": 52.70299727520436,
+ "grad_norm": 4.406929016113281,
+ "learning_rate": 9.610477188201452e-06,
+ "loss": 0.1047,
+ "step": 19342
+ },
+ {
+ "epoch": 52.705722070844686,
+ "grad_norm": 4.624931335449219,
+ "learning_rate": 9.609595364833672e-06,
+ "loss": 0.2232,
+ "step": 19343
+ },
+ {
+ "epoch": 52.70844686648501,
+ "grad_norm": 4.764208793640137,
+ "learning_rate": 9.60871354450635e-06,
+ "loss": 0.0927,
+ "step": 19344
+ },
+ {
+ "epoch": 52.71117166212534,
+ "grad_norm": 4.3923540115356445,
+ "learning_rate": 9.607831727226355e-06,
+ "loss": 0.1221,
+ "step": 19345
+ },
+ {
+ "epoch": 52.71389645776567,
+ "grad_norm": 3.9085776805877686,
+ "learning_rate": 9.606949913000554e-06,
+ "loss": 0.2829,
+ "step": 19346
+ },
+ {
+ "epoch": 52.716621253406,
+ "grad_norm": 4.042550563812256,
+ "learning_rate": 9.606068101835815e-06,
+ "loss": 0.1434,
+ "step": 19347
+ },
+ {
+ "epoch": 52.71934604904632,
+ "grad_norm": 3.807206392288208,
+ "learning_rate": 9.605186293739e-06,
+ "loss": 0.0913,
+ "step": 19348
+ },
+ {
+ "epoch": 52.72207084468665,
+ "grad_norm": 3.671191692352295,
+ "learning_rate": 9.604304488716987e-06,
+ "loss": 0.123,
+ "step": 19349
+ },
+ {
+ "epoch": 52.724795640326974,
+ "grad_norm": 4.420248031616211,
+ "learning_rate": 9.603422686776635e-06,
+ "loss": 0.1785,
+ "step": 19350
+ },
+ {
+ "epoch": 52.7275204359673,
+ "grad_norm": 4.048986434936523,
+ "learning_rate": 9.602540887924819e-06,
+ "loss": 0.1077,
+ "step": 19351
+ },
+ {
+ "epoch": 52.73024523160763,
+ "grad_norm": 3.655841588973999,
+ "learning_rate": 9.601659092168395e-06,
+ "loss": 0.0767,
+ "step": 19352
+ },
+ {
+ "epoch": 52.73297002724796,
+ "grad_norm": 4.169539928436279,
+ "learning_rate": 9.600777299514243e-06,
+ "loss": 0.204,
+ "step": 19353
+ },
+ {
+ "epoch": 52.735694822888284,
+ "grad_norm": 4.01200008392334,
+ "learning_rate": 9.59989550996922e-06,
+ "loss": 0.0708,
+ "step": 19354
+ },
+ {
+ "epoch": 52.73841961852861,
+ "grad_norm": 3.724123001098633,
+ "learning_rate": 9.599013723540204e-06,
+ "loss": 0.0999,
+ "step": 19355
+ },
+ {
+ "epoch": 52.741144414168936,
+ "grad_norm": 4.897405624389648,
+ "learning_rate": 9.598131940234051e-06,
+ "loss": 0.2238,
+ "step": 19356
+ },
+ {
+ "epoch": 52.74386920980926,
+ "grad_norm": 4.107428550720215,
+ "learning_rate": 9.597250160057635e-06,
+ "loss": 0.0983,
+ "step": 19357
+ },
+ {
+ "epoch": 52.746594005449595,
+ "grad_norm": 4.829750061035156,
+ "learning_rate": 9.596368383017822e-06,
+ "loss": 0.0737,
+ "step": 19358
+ },
+ {
+ "epoch": 52.74931880108992,
+ "grad_norm": 4.205144882202148,
+ "learning_rate": 9.595486609121477e-06,
+ "loss": 0.3055,
+ "step": 19359
+ },
+ {
+ "epoch": 52.752043596730246,
+ "grad_norm": 5.4464826583862305,
+ "learning_rate": 9.594604838375473e-06,
+ "loss": 0.1822,
+ "step": 19360
+ },
+ {
+ "epoch": 52.75476839237057,
+ "grad_norm": 3.527435779571533,
+ "learning_rate": 9.593723070786671e-06,
+ "loss": 0.0826,
+ "step": 19361
+ },
+ {
+ "epoch": 52.7574931880109,
+ "grad_norm": 4.032792568206787,
+ "learning_rate": 9.592841306361942e-06,
+ "loss": 0.1613,
+ "step": 19362
+ },
+ {
+ "epoch": 52.76021798365122,
+ "grad_norm": 4.165923118591309,
+ "learning_rate": 9.59195954510815e-06,
+ "loss": 0.1055,
+ "step": 19363
+ },
+ {
+ "epoch": 52.762942779291556,
+ "grad_norm": 5.197146892547607,
+ "learning_rate": 9.591077787032166e-06,
+ "loss": 0.1861,
+ "step": 19364
+ },
+ {
+ "epoch": 52.76566757493188,
+ "grad_norm": 6.287145614624023,
+ "learning_rate": 9.590196032140852e-06,
+ "loss": 0.0796,
+ "step": 19365
+ },
+ {
+ "epoch": 52.76839237057221,
+ "grad_norm": 5.605803966522217,
+ "learning_rate": 9.589314280441077e-06,
+ "loss": 0.1606,
+ "step": 19366
+ },
+ {
+ "epoch": 52.771117166212534,
+ "grad_norm": 3.812502145767212,
+ "learning_rate": 9.588432531939714e-06,
+ "loss": 0.0775,
+ "step": 19367
+ },
+ {
+ "epoch": 52.77384196185286,
+ "grad_norm": 5.06690788269043,
+ "learning_rate": 9.587550786643623e-06,
+ "loss": 0.1423,
+ "step": 19368
+ },
+ {
+ "epoch": 52.776566757493185,
+ "grad_norm": 4.095958709716797,
+ "learning_rate": 9.586669044559674e-06,
+ "loss": 0.212,
+ "step": 19369
+ },
+ {
+ "epoch": 52.77929155313352,
+ "grad_norm": 5.3416666984558105,
+ "learning_rate": 9.585787305694733e-06,
+ "loss": 0.314,
+ "step": 19370
+ },
+ {
+ "epoch": 52.782016348773844,
+ "grad_norm": 4.653022289276123,
+ "learning_rate": 9.584905570055668e-06,
+ "loss": 0.1592,
+ "step": 19371
+ },
+ {
+ "epoch": 52.78474114441417,
+ "grad_norm": 8.40907096862793,
+ "learning_rate": 9.584023837649343e-06,
+ "loss": 0.08,
+ "step": 19372
+ },
+ {
+ "epoch": 52.787465940054496,
+ "grad_norm": 6.979483604431152,
+ "learning_rate": 9.58314210848263e-06,
+ "loss": 0.1268,
+ "step": 19373
+ },
+ {
+ "epoch": 52.79019073569482,
+ "grad_norm": 4.940918922424316,
+ "learning_rate": 9.582260382562389e-06,
+ "loss": 0.0934,
+ "step": 19374
+ },
+ {
+ "epoch": 52.79291553133515,
+ "grad_norm": 4.029472827911377,
+ "learning_rate": 9.581378659895494e-06,
+ "loss": 0.0955,
+ "step": 19375
+ },
+ {
+ "epoch": 52.79564032697548,
+ "grad_norm": 3.5107131004333496,
+ "learning_rate": 9.580496940488806e-06,
+ "loss": 0.1079,
+ "step": 19376
+ },
+ {
+ "epoch": 52.798365122615806,
+ "grad_norm": 7.501389503479004,
+ "learning_rate": 9.579615224349195e-06,
+ "loss": 0.2101,
+ "step": 19377
+ },
+ {
+ "epoch": 52.80108991825613,
+ "grad_norm": 3.9385881423950195,
+ "learning_rate": 9.578733511483527e-06,
+ "loss": 0.0731,
+ "step": 19378
+ },
+ {
+ "epoch": 52.80381471389646,
+ "grad_norm": 4.246493339538574,
+ "learning_rate": 9.577851801898669e-06,
+ "loss": 0.1004,
+ "step": 19379
+ },
+ {
+ "epoch": 52.80653950953678,
+ "grad_norm": 4.60960578918457,
+ "learning_rate": 9.57697009560149e-06,
+ "loss": 0.2342,
+ "step": 19380
+ },
+ {
+ "epoch": 52.80926430517711,
+ "grad_norm": 3.791977643966675,
+ "learning_rate": 9.57608839259885e-06,
+ "loss": 0.2611,
+ "step": 19381
+ },
+ {
+ "epoch": 52.81198910081744,
+ "grad_norm": 4.869720935821533,
+ "learning_rate": 9.575206692897624e-06,
+ "loss": 0.2234,
+ "step": 19382
+ },
+ {
+ "epoch": 52.81471389645777,
+ "grad_norm": 4.54078483581543,
+ "learning_rate": 9.574324996504669e-06,
+ "loss": 0.1507,
+ "step": 19383
+ },
+ {
+ "epoch": 52.817438692098094,
+ "grad_norm": 4.842339038848877,
+ "learning_rate": 9.573443303426861e-06,
+ "loss": 0.1372,
+ "step": 19384
+ },
+ {
+ "epoch": 52.82016348773842,
+ "grad_norm": 5.749547481536865,
+ "learning_rate": 9.572561613671063e-06,
+ "loss": 0.1336,
+ "step": 19385
+ },
+ {
+ "epoch": 52.822888283378745,
+ "grad_norm": 4.521557807922363,
+ "learning_rate": 9.571679927244141e-06,
+ "loss": 0.305,
+ "step": 19386
+ },
+ {
+ "epoch": 52.82561307901907,
+ "grad_norm": 4.607681751251221,
+ "learning_rate": 9.570798244152962e-06,
+ "loss": 0.1954,
+ "step": 19387
+ },
+ {
+ "epoch": 52.828337874659404,
+ "grad_norm": 4.482492446899414,
+ "learning_rate": 9.569916564404392e-06,
+ "loss": 0.0844,
+ "step": 19388
+ },
+ {
+ "epoch": 52.83106267029973,
+ "grad_norm": 3.874396324157715,
+ "learning_rate": 9.5690348880053e-06,
+ "loss": 0.1349,
+ "step": 19389
+ },
+ {
+ "epoch": 52.833787465940055,
+ "grad_norm": 3.666623592376709,
+ "learning_rate": 9.568153214962548e-06,
+ "loss": 0.0805,
+ "step": 19390
+ },
+ {
+ "epoch": 52.83651226158038,
+ "grad_norm": 4.0994553565979,
+ "learning_rate": 9.567271545283008e-06,
+ "loss": 0.1871,
+ "step": 19391
+ },
+ {
+ "epoch": 52.83923705722071,
+ "grad_norm": 3.9918689727783203,
+ "learning_rate": 9.566389878973539e-06,
+ "loss": 0.0865,
+ "step": 19392
+ },
+ {
+ "epoch": 52.84196185286103,
+ "grad_norm": 5.492431640625,
+ "learning_rate": 9.565508216041015e-06,
+ "loss": 0.1218,
+ "step": 19393
+ },
+ {
+ "epoch": 52.844686648501366,
+ "grad_norm": 5.203312397003174,
+ "learning_rate": 9.564626556492297e-06,
+ "loss": 0.0878,
+ "step": 19394
+ },
+ {
+ "epoch": 52.84741144414169,
+ "grad_norm": 3.5612733364105225,
+ "learning_rate": 9.563744900334256e-06,
+ "loss": 0.1608,
+ "step": 19395
+ },
+ {
+ "epoch": 52.85013623978202,
+ "grad_norm": 5.559460163116455,
+ "learning_rate": 9.562863247573753e-06,
+ "loss": 0.0751,
+ "step": 19396
+ },
+ {
+ "epoch": 52.85286103542234,
+ "grad_norm": 3.9738035202026367,
+ "learning_rate": 9.561981598217658e-06,
+ "loss": 0.245,
+ "step": 19397
+ },
+ {
+ "epoch": 52.85558583106267,
+ "grad_norm": 3.7084290981292725,
+ "learning_rate": 9.561099952272835e-06,
+ "loss": 0.0937,
+ "step": 19398
+ },
+ {
+ "epoch": 52.858310626702995,
+ "grad_norm": 5.085404396057129,
+ "learning_rate": 9.560218309746154e-06,
+ "loss": 0.1895,
+ "step": 19399
+ },
+ {
+ "epoch": 52.86103542234333,
+ "grad_norm": 3.99646258354187,
+ "learning_rate": 9.559336670644472e-06,
+ "loss": 0.1783,
+ "step": 19400
+ },
+ {
+ "epoch": 52.86376021798365,
+ "grad_norm": 5.141168117523193,
+ "learning_rate": 9.558455034974667e-06,
+ "loss": 0.118,
+ "step": 19401
+ },
+ {
+ "epoch": 52.86648501362398,
+ "grad_norm": 3.759382486343384,
+ "learning_rate": 9.5575734027436e-06,
+ "loss": 0.1975,
+ "step": 19402
+ },
+ {
+ "epoch": 52.869209809264305,
+ "grad_norm": 4.657748222351074,
+ "learning_rate": 9.556691773958137e-06,
+ "loss": 0.0998,
+ "step": 19403
+ },
+ {
+ "epoch": 52.87193460490463,
+ "grad_norm": 4.618873119354248,
+ "learning_rate": 9.555810148625144e-06,
+ "loss": 0.2024,
+ "step": 19404
+ },
+ {
+ "epoch": 52.87465940054496,
+ "grad_norm": 4.090301513671875,
+ "learning_rate": 9.55492852675149e-06,
+ "loss": 0.1703,
+ "step": 19405
+ },
+ {
+ "epoch": 52.87738419618529,
+ "grad_norm": 5.711353778839111,
+ "learning_rate": 9.554046908344034e-06,
+ "loss": 0.0974,
+ "step": 19406
+ },
+ {
+ "epoch": 52.880108991825615,
+ "grad_norm": 5.343455791473389,
+ "learning_rate": 9.55316529340965e-06,
+ "loss": 0.1682,
+ "step": 19407
+ },
+ {
+ "epoch": 52.88283378746594,
+ "grad_norm": 4.769092082977295,
+ "learning_rate": 9.552283681955196e-06,
+ "loss": 0.1935,
+ "step": 19408
+ },
+ {
+ "epoch": 52.88555858310627,
+ "grad_norm": 3.6172735691070557,
+ "learning_rate": 9.551402073987547e-06,
+ "loss": 0.1412,
+ "step": 19409
+ },
+ {
+ "epoch": 52.88828337874659,
+ "grad_norm": 4.08225154876709,
+ "learning_rate": 9.55052046951356e-06,
+ "loss": 0.1674,
+ "step": 19410
+ },
+ {
+ "epoch": 52.89100817438692,
+ "grad_norm": 6.741689205169678,
+ "learning_rate": 9.549638868540108e-06,
+ "loss": 0.1482,
+ "step": 19411
+ },
+ {
+ "epoch": 52.89373297002725,
+ "grad_norm": 4.846926212310791,
+ "learning_rate": 9.548757271074053e-06,
+ "loss": 0.1357,
+ "step": 19412
+ },
+ {
+ "epoch": 52.89645776566758,
+ "grad_norm": 6.184783458709717,
+ "learning_rate": 9.547875677122262e-06,
+ "loss": 0.1598,
+ "step": 19413
+ },
+ {
+ "epoch": 52.8991825613079,
+ "grad_norm": 5.16526460647583,
+ "learning_rate": 9.5469940866916e-06,
+ "loss": 0.1519,
+ "step": 19414
+ },
+ {
+ "epoch": 52.90190735694823,
+ "grad_norm": 3.609684467315674,
+ "learning_rate": 9.546112499788935e-06,
+ "loss": 0.0773,
+ "step": 19415
+ },
+ {
+ "epoch": 52.904632152588555,
+ "grad_norm": 5.692165851593018,
+ "learning_rate": 9.545230916421129e-06,
+ "loss": 0.1726,
+ "step": 19416
+ },
+ {
+ "epoch": 52.90735694822888,
+ "grad_norm": 4.304907321929932,
+ "learning_rate": 9.544349336595049e-06,
+ "loss": 0.1301,
+ "step": 19417
+ },
+ {
+ "epoch": 52.91008174386921,
+ "grad_norm": 5.129548072814941,
+ "learning_rate": 9.543467760317565e-06,
+ "loss": 0.1788,
+ "step": 19418
+ },
+ {
+ "epoch": 52.91280653950954,
+ "grad_norm": 3.5996346473693848,
+ "learning_rate": 9.542586187595537e-06,
+ "loss": 0.127,
+ "step": 19419
+ },
+ {
+ "epoch": 52.915531335149865,
+ "grad_norm": 5.412356376647949,
+ "learning_rate": 9.541704618435834e-06,
+ "loss": 0.2205,
+ "step": 19420
+ },
+ {
+ "epoch": 52.91825613079019,
+ "grad_norm": 3.9680113792419434,
+ "learning_rate": 9.540823052845323e-06,
+ "loss": 0.1297,
+ "step": 19421
+ },
+ {
+ "epoch": 52.920980926430516,
+ "grad_norm": 3.8879904747009277,
+ "learning_rate": 9.539941490830863e-06,
+ "loss": 0.2313,
+ "step": 19422
+ },
+ {
+ "epoch": 52.92370572207084,
+ "grad_norm": 3.4496006965637207,
+ "learning_rate": 9.539059932399328e-06,
+ "loss": 0.1018,
+ "step": 19423
+ },
+ {
+ "epoch": 52.926430517711175,
+ "grad_norm": 3.728367328643799,
+ "learning_rate": 9.538178377557577e-06,
+ "loss": 0.195,
+ "step": 19424
+ },
+ {
+ "epoch": 52.9291553133515,
+ "grad_norm": 4.723453044891357,
+ "learning_rate": 9.53729682631248e-06,
+ "loss": 0.105,
+ "step": 19425
+ },
+ {
+ "epoch": 52.93188010899183,
+ "grad_norm": 4.525905609130859,
+ "learning_rate": 9.536415278670897e-06,
+ "loss": 0.0872,
+ "step": 19426
+ },
+ {
+ "epoch": 52.93460490463215,
+ "grad_norm": 4.863429546356201,
+ "learning_rate": 9.5355337346397e-06,
+ "loss": 0.2055,
+ "step": 19427
+ },
+ {
+ "epoch": 52.93732970027248,
+ "grad_norm": 4.197471618652344,
+ "learning_rate": 9.53465219422575e-06,
+ "loss": 0.2584,
+ "step": 19428
+ },
+ {
+ "epoch": 52.940054495912804,
+ "grad_norm": 4.145512580871582,
+ "learning_rate": 9.533770657435914e-06,
+ "loss": 0.0946,
+ "step": 19429
+ },
+ {
+ "epoch": 52.94277929155314,
+ "grad_norm": 4.528237342834473,
+ "learning_rate": 9.532889124277057e-06,
+ "loss": 0.2962,
+ "step": 19430
+ },
+ {
+ "epoch": 52.94550408719346,
+ "grad_norm": 4.709898948669434,
+ "learning_rate": 9.532007594756046e-06,
+ "loss": 0.1474,
+ "step": 19431
+ },
+ {
+ "epoch": 52.94822888283379,
+ "grad_norm": 5.081605911254883,
+ "learning_rate": 9.531126068879742e-06,
+ "loss": 0.1412,
+ "step": 19432
+ },
+ {
+ "epoch": 52.950953678474114,
+ "grad_norm": 8.18087387084961,
+ "learning_rate": 9.530244546655016e-06,
+ "loss": 0.2135,
+ "step": 19433
+ },
+ {
+ "epoch": 52.95367847411444,
+ "grad_norm": 3.8935437202453613,
+ "learning_rate": 9.529363028088725e-06,
+ "loss": 0.0655,
+ "step": 19434
+ },
+ {
+ "epoch": 52.956403269754766,
+ "grad_norm": 4.755772113800049,
+ "learning_rate": 9.528481513187744e-06,
+ "loss": 0.127,
+ "step": 19435
+ },
+ {
+ "epoch": 52.95912806539509,
+ "grad_norm": 4.46189546585083,
+ "learning_rate": 9.527600001958933e-06,
+ "loss": 0.1729,
+ "step": 19436
+ },
+ {
+ "epoch": 52.961852861035425,
+ "grad_norm": 8.863527297973633,
+ "learning_rate": 9.526718494409158e-06,
+ "loss": 0.158,
+ "step": 19437
+ },
+ {
+ "epoch": 52.96457765667575,
+ "grad_norm": 3.593932867050171,
+ "learning_rate": 9.525836990545283e-06,
+ "loss": 0.0814,
+ "step": 19438
+ },
+ {
+ "epoch": 52.967302452316076,
+ "grad_norm": 6.234457492828369,
+ "learning_rate": 9.524955490374176e-06,
+ "loss": 0.1996,
+ "step": 19439
+ },
+ {
+ "epoch": 52.9700272479564,
+ "grad_norm": 3.7607927322387695,
+ "learning_rate": 9.5240739939027e-06,
+ "loss": 0.1373,
+ "step": 19440
+ },
+ {
+ "epoch": 52.97275204359673,
+ "grad_norm": 3.821132183074951,
+ "learning_rate": 9.52319250113772e-06,
+ "loss": 0.1124,
+ "step": 19441
+ },
+ {
+ "epoch": 52.97547683923706,
+ "grad_norm": 4.514087200164795,
+ "learning_rate": 9.522311012086103e-06,
+ "loss": 0.121,
+ "step": 19442
+ },
+ {
+ "epoch": 52.97820163487739,
+ "grad_norm": 7.508065700531006,
+ "learning_rate": 9.52142952675471e-06,
+ "loss": 0.1596,
+ "step": 19443
+ },
+ {
+ "epoch": 52.98092643051771,
+ "grad_norm": 4.979015350341797,
+ "learning_rate": 9.52054804515041e-06,
+ "loss": 0.2283,
+ "step": 19444
+ },
+ {
+ "epoch": 52.98365122615804,
+ "grad_norm": 4.485701084136963,
+ "learning_rate": 9.519666567280067e-06,
+ "loss": 0.1493,
+ "step": 19445
+ },
+ {
+ "epoch": 52.986376021798364,
+ "grad_norm": 3.7773795127868652,
+ "learning_rate": 9.518785093150543e-06,
+ "loss": 0.0965,
+ "step": 19446
+ },
+ {
+ "epoch": 52.98910081743869,
+ "grad_norm": 3.1339917182922363,
+ "learning_rate": 9.517903622768707e-06,
+ "loss": 0.1167,
+ "step": 19447
+ },
+ {
+ "epoch": 52.991825613079016,
+ "grad_norm": 4.603447914123535,
+ "learning_rate": 9.51702215614142e-06,
+ "loss": 0.0751,
+ "step": 19448
+ },
+ {
+ "epoch": 52.99455040871935,
+ "grad_norm": 4.457182884216309,
+ "learning_rate": 9.516140693275554e-06,
+ "loss": 0.1444,
+ "step": 19449
+ },
+ {
+ "epoch": 52.997275204359674,
+ "grad_norm": 5.096701145172119,
+ "learning_rate": 9.515259234177964e-06,
+ "loss": 0.1583,
+ "step": 19450
+ },
+ {
+ "epoch": 53.0,
+ "grad_norm": 4.649552345275879,
+ "learning_rate": 9.514377778855521e-06,
+ "loss": 0.2083,
+ "step": 19451
+ },
+ {
+ "epoch": 53.002724795640326,
+ "grad_norm": 4.393429279327393,
+ "learning_rate": 9.513496327315085e-06,
+ "loss": 0.0915,
+ "step": 19452
+ },
+ {
+ "epoch": 53.00544959128065,
+ "grad_norm": 3.946039915084839,
+ "learning_rate": 9.512614879563525e-06,
+ "loss": 0.0755,
+ "step": 19453
+ },
+ {
+ "epoch": 53.00817438692098,
+ "grad_norm": 4.5312113761901855,
+ "learning_rate": 9.511733435607709e-06,
+ "loss": 0.2359,
+ "step": 19454
+ },
+ {
+ "epoch": 53.01089918256131,
+ "grad_norm": 4.726602554321289,
+ "learning_rate": 9.510851995454494e-06,
+ "loss": 0.2065,
+ "step": 19455
+ },
+ {
+ "epoch": 53.013623978201636,
+ "grad_norm": 4.218317985534668,
+ "learning_rate": 9.50997055911075e-06,
+ "loss": 0.0797,
+ "step": 19456
+ },
+ {
+ "epoch": 53.01634877384196,
+ "grad_norm": 4.34600305557251,
+ "learning_rate": 9.509089126583336e-06,
+ "loss": 0.1123,
+ "step": 19457
+ },
+ {
+ "epoch": 53.01907356948229,
+ "grad_norm": 4.702160835266113,
+ "learning_rate": 9.508207697879123e-06,
+ "loss": 0.0871,
+ "step": 19458
+ },
+ {
+ "epoch": 53.02179836512261,
+ "grad_norm": 3.6047987937927246,
+ "learning_rate": 9.507326273004972e-06,
+ "loss": 0.0744,
+ "step": 19459
+ },
+ {
+ "epoch": 53.02452316076294,
+ "grad_norm": 4.602707386016846,
+ "learning_rate": 9.50644485196775e-06,
+ "loss": 0.1927,
+ "step": 19460
+ },
+ {
+ "epoch": 53.02724795640327,
+ "grad_norm": 5.076196670532227,
+ "learning_rate": 9.505563434774317e-06,
+ "loss": 0.1479,
+ "step": 19461
+ },
+ {
+ "epoch": 53.0299727520436,
+ "grad_norm": 8.3142671585083,
+ "learning_rate": 9.504682021431541e-06,
+ "loss": 0.1404,
+ "step": 19462
+ },
+ {
+ "epoch": 53.032697547683924,
+ "grad_norm": 4.3612751960754395,
+ "learning_rate": 9.503800611946285e-06,
+ "loss": 0.0814,
+ "step": 19463
+ },
+ {
+ "epoch": 53.03542234332425,
+ "grad_norm": 3.6033620834350586,
+ "learning_rate": 9.502919206325415e-06,
+ "loss": 0.2357,
+ "step": 19464
+ },
+ {
+ "epoch": 53.038147138964575,
+ "grad_norm": 4.380779266357422,
+ "learning_rate": 9.502037804575793e-06,
+ "loss": 0.1751,
+ "step": 19465
+ },
+ {
+ "epoch": 53.0408719346049,
+ "grad_norm": 4.791330814361572,
+ "learning_rate": 9.501156406704284e-06,
+ "loss": 0.2727,
+ "step": 19466
+ },
+ {
+ "epoch": 53.043596730245234,
+ "grad_norm": 4.086306571960449,
+ "learning_rate": 9.500275012717754e-06,
+ "loss": 0.1402,
+ "step": 19467
+ },
+ {
+ "epoch": 53.04632152588556,
+ "grad_norm": 3.57738995552063,
+ "learning_rate": 9.499393622623064e-06,
+ "loss": 0.2562,
+ "step": 19468
+ },
+ {
+ "epoch": 53.049046321525886,
+ "grad_norm": 4.554544925689697,
+ "learning_rate": 9.49851223642708e-06,
+ "loss": 0.2626,
+ "step": 19469
+ },
+ {
+ "epoch": 53.05177111716621,
+ "grad_norm": 5.000865936279297,
+ "learning_rate": 9.49763085413667e-06,
+ "loss": 0.2058,
+ "step": 19470
+ },
+ {
+ "epoch": 53.05449591280654,
+ "grad_norm": 6.769252300262451,
+ "learning_rate": 9.496749475758692e-06,
+ "loss": 0.1646,
+ "step": 19471
+ },
+ {
+ "epoch": 53.05722070844686,
+ "grad_norm": 4.432536602020264,
+ "learning_rate": 9.495868101300015e-06,
+ "loss": 0.1401,
+ "step": 19472
+ },
+ {
+ "epoch": 53.059945504087196,
+ "grad_norm": 10.35960865020752,
+ "learning_rate": 9.4949867307675e-06,
+ "loss": 0.182,
+ "step": 19473
+ },
+ {
+ "epoch": 53.06267029972752,
+ "grad_norm": 3.592966318130493,
+ "learning_rate": 9.494105364168014e-06,
+ "loss": 0.2652,
+ "step": 19474
+ },
+ {
+ "epoch": 53.06539509536785,
+ "grad_norm": 4.498920440673828,
+ "learning_rate": 9.493224001508416e-06,
+ "loss": 0.1544,
+ "step": 19475
+ },
+ {
+ "epoch": 53.06811989100817,
+ "grad_norm": 4.001643657684326,
+ "learning_rate": 9.492342642795576e-06,
+ "loss": 0.061,
+ "step": 19476
+ },
+ {
+ "epoch": 53.0708446866485,
+ "grad_norm": 4.065978050231934,
+ "learning_rate": 9.491461288036353e-06,
+ "loss": 0.1452,
+ "step": 19477
+ },
+ {
+ "epoch": 53.073569482288825,
+ "grad_norm": 3.848238468170166,
+ "learning_rate": 9.490579937237615e-06,
+ "loss": 0.2558,
+ "step": 19478
+ },
+ {
+ "epoch": 53.07629427792916,
+ "grad_norm": 4.34864616394043,
+ "learning_rate": 9.489698590406223e-06,
+ "loss": 0.2458,
+ "step": 19479
+ },
+ {
+ "epoch": 53.079019073569484,
+ "grad_norm": 3.9366304874420166,
+ "learning_rate": 9.488817247549043e-06,
+ "loss": 0.0556,
+ "step": 19480
+ },
+ {
+ "epoch": 53.08174386920981,
+ "grad_norm": 3.9686615467071533,
+ "learning_rate": 9.487935908672936e-06,
+ "loss": 0.1271,
+ "step": 19481
+ },
+ {
+ "epoch": 53.084468664850135,
+ "grad_norm": 4.87516975402832,
+ "learning_rate": 9.487054573784769e-06,
+ "loss": 0.2584,
+ "step": 19482
+ },
+ {
+ "epoch": 53.08719346049046,
+ "grad_norm": 3.477492332458496,
+ "learning_rate": 9.486173242891404e-06,
+ "loss": 0.128,
+ "step": 19483
+ },
+ {
+ "epoch": 53.08991825613079,
+ "grad_norm": 3.921304225921631,
+ "learning_rate": 9.485291915999706e-06,
+ "loss": 0.0912,
+ "step": 19484
+ },
+ {
+ "epoch": 53.09264305177112,
+ "grad_norm": 4.01481294631958,
+ "learning_rate": 9.484410593116536e-06,
+ "loss": 0.1633,
+ "step": 19485
+ },
+ {
+ "epoch": 53.095367847411445,
+ "grad_norm": 5.032939910888672,
+ "learning_rate": 9.483529274248758e-06,
+ "loss": 0.167,
+ "step": 19486
+ },
+ {
+ "epoch": 53.09809264305177,
+ "grad_norm": 3.700946807861328,
+ "learning_rate": 9.48264795940324e-06,
+ "loss": 0.0914,
+ "step": 19487
+ },
+ {
+ "epoch": 53.1008174386921,
+ "grad_norm": 4.320295810699463,
+ "learning_rate": 9.481766648586844e-06,
+ "loss": 0.2146,
+ "step": 19488
+ },
+ {
+ "epoch": 53.10354223433242,
+ "grad_norm": 4.7659783363342285,
+ "learning_rate": 9.48088534180643e-06,
+ "loss": 0.1247,
+ "step": 19489
+ },
+ {
+ "epoch": 53.10626702997275,
+ "grad_norm": 3.985541343688965,
+ "learning_rate": 9.480004039068868e-06,
+ "loss": 0.1365,
+ "step": 19490
+ },
+ {
+ "epoch": 53.10899182561308,
+ "grad_norm": 3.8085134029388428,
+ "learning_rate": 9.479122740381015e-06,
+ "loss": 0.1226,
+ "step": 19491
+ },
+ {
+ "epoch": 53.11171662125341,
+ "grad_norm": 4.460117816925049,
+ "learning_rate": 9.478241445749739e-06,
+ "loss": 0.11,
+ "step": 19492
+ },
+ {
+ "epoch": 53.11444141689373,
+ "grad_norm": 4.521548748016357,
+ "learning_rate": 9.477360155181902e-06,
+ "loss": 0.2341,
+ "step": 19493
+ },
+ {
+ "epoch": 53.11716621253406,
+ "grad_norm": 4.03731632232666,
+ "learning_rate": 9.476478868684366e-06,
+ "loss": 0.1513,
+ "step": 19494
+ },
+ {
+ "epoch": 53.119891008174385,
+ "grad_norm": 4.526203155517578,
+ "learning_rate": 9.475597586263996e-06,
+ "loss": 0.155,
+ "step": 19495
+ },
+ {
+ "epoch": 53.12261580381471,
+ "grad_norm": 14.319269180297852,
+ "learning_rate": 9.474716307927657e-06,
+ "loss": 0.0924,
+ "step": 19496
+ },
+ {
+ "epoch": 53.12534059945504,
+ "grad_norm": 4.00183629989624,
+ "learning_rate": 9.473835033682209e-06,
+ "loss": 0.1389,
+ "step": 19497
+ },
+ {
+ "epoch": 53.12806539509537,
+ "grad_norm": 3.2636046409606934,
+ "learning_rate": 9.472953763534517e-06,
+ "loss": 0.067,
+ "step": 19498
+ },
+ {
+ "epoch": 53.130790190735695,
+ "grad_norm": 3.163428783416748,
+ "learning_rate": 9.472072497491443e-06,
+ "loss": 0.0709,
+ "step": 19499
+ },
+ {
+ "epoch": 53.13351498637602,
+ "grad_norm": 4.80781364440918,
+ "learning_rate": 9.471191235559853e-06,
+ "loss": 0.1009,
+ "step": 19500
+ },
+ {
+ "epoch": 53.13623978201635,
+ "grad_norm": 5.041027069091797,
+ "learning_rate": 9.470309977746607e-06,
+ "loss": 0.1678,
+ "step": 19501
+ },
+ {
+ "epoch": 53.13896457765667,
+ "grad_norm": 5.947676181793213,
+ "learning_rate": 9.46942872405857e-06,
+ "loss": 0.219,
+ "step": 19502
+ },
+ {
+ "epoch": 53.141689373297005,
+ "grad_norm": 4.79503059387207,
+ "learning_rate": 9.468547474502603e-06,
+ "loss": 0.1351,
+ "step": 19503
+ },
+ {
+ "epoch": 53.14441416893733,
+ "grad_norm": 3.2360799312591553,
+ "learning_rate": 9.467666229085574e-06,
+ "loss": 0.1247,
+ "step": 19504
+ },
+ {
+ "epoch": 53.14713896457766,
+ "grad_norm": 4.616093635559082,
+ "learning_rate": 9.466784987814345e-06,
+ "loss": 0.1742,
+ "step": 19505
+ },
+ {
+ "epoch": 53.14986376021798,
+ "grad_norm": 3.4572880268096924,
+ "learning_rate": 9.465903750695774e-06,
+ "loss": 0.0791,
+ "step": 19506
+ },
+ {
+ "epoch": 53.15258855585831,
+ "grad_norm": 5.055361270904541,
+ "learning_rate": 9.465022517736728e-06,
+ "loss": 0.1116,
+ "step": 19507
+ },
+ {
+ "epoch": 53.155313351498634,
+ "grad_norm": 4.294522762298584,
+ "learning_rate": 9.464141288944072e-06,
+ "loss": 0.1808,
+ "step": 19508
+ },
+ {
+ "epoch": 53.15803814713897,
+ "grad_norm": 3.945244550704956,
+ "learning_rate": 9.463260064324663e-06,
+ "loss": 0.12,
+ "step": 19509
+ },
+ {
+ "epoch": 53.16076294277929,
+ "grad_norm": 5.410464763641357,
+ "learning_rate": 9.46237884388537e-06,
+ "loss": 0.0788,
+ "step": 19510
+ },
+ {
+ "epoch": 53.16348773841962,
+ "grad_norm": 8.153961181640625,
+ "learning_rate": 9.461497627633051e-06,
+ "loss": 0.1865,
+ "step": 19511
+ },
+ {
+ "epoch": 53.166212534059945,
+ "grad_norm": 4.335062026977539,
+ "learning_rate": 9.460616415574575e-06,
+ "loss": 0.2073,
+ "step": 19512
+ },
+ {
+ "epoch": 53.16893732970027,
+ "grad_norm": 4.389134407043457,
+ "learning_rate": 9.459735207716796e-06,
+ "loss": 0.0822,
+ "step": 19513
+ },
+ {
+ "epoch": 53.171662125340596,
+ "grad_norm": 3.9332547187805176,
+ "learning_rate": 9.458854004066586e-06,
+ "loss": 0.0663,
+ "step": 19514
+ },
+ {
+ "epoch": 53.17438692098093,
+ "grad_norm": 4.0098676681518555,
+ "learning_rate": 9.457972804630801e-06,
+ "loss": 0.0951,
+ "step": 19515
+ },
+ {
+ "epoch": 53.177111716621255,
+ "grad_norm": 3.5633816719055176,
+ "learning_rate": 9.457091609416309e-06,
+ "loss": 0.0736,
+ "step": 19516
+ },
+ {
+ "epoch": 53.17983651226158,
+ "grad_norm": 4.113879203796387,
+ "learning_rate": 9.456210418429968e-06,
+ "loss": 0.1804,
+ "step": 19517
+ },
+ {
+ "epoch": 53.182561307901906,
+ "grad_norm": 4.0399861335754395,
+ "learning_rate": 9.455329231678644e-06,
+ "loss": 0.2328,
+ "step": 19518
+ },
+ {
+ "epoch": 53.18528610354223,
+ "grad_norm": 4.422402381896973,
+ "learning_rate": 9.454448049169195e-06,
+ "loss": 0.2042,
+ "step": 19519
+ },
+ {
+ "epoch": 53.18801089918256,
+ "grad_norm": 3.637037754058838,
+ "learning_rate": 9.453566870908488e-06,
+ "loss": 0.2312,
+ "step": 19520
+ },
+ {
+ "epoch": 53.19073569482289,
+ "grad_norm": 5.453971862792969,
+ "learning_rate": 9.452685696903387e-06,
+ "loss": 0.1949,
+ "step": 19521
+ },
+ {
+ "epoch": 53.19346049046322,
+ "grad_norm": 3.9778435230255127,
+ "learning_rate": 9.45180452716075e-06,
+ "loss": 0.1529,
+ "step": 19522
+ },
+ {
+ "epoch": 53.19618528610354,
+ "grad_norm": 6.233001708984375,
+ "learning_rate": 9.450923361687443e-06,
+ "loss": 0.1263,
+ "step": 19523
+ },
+ {
+ "epoch": 53.19891008174387,
+ "grad_norm": 4.244566917419434,
+ "learning_rate": 9.450042200490328e-06,
+ "loss": 0.2222,
+ "step": 19524
+ },
+ {
+ "epoch": 53.201634877384194,
+ "grad_norm": 4.423482894897461,
+ "learning_rate": 9.449161043576266e-06,
+ "loss": 0.2106,
+ "step": 19525
+ },
+ {
+ "epoch": 53.20435967302452,
+ "grad_norm": 4.039098262786865,
+ "learning_rate": 9.44827989095212e-06,
+ "loss": 0.2248,
+ "step": 19526
+ },
+ {
+ "epoch": 53.20708446866485,
+ "grad_norm": 2.4821112155914307,
+ "learning_rate": 9.447398742624754e-06,
+ "loss": 0.0965,
+ "step": 19527
+ },
+ {
+ "epoch": 53.20980926430518,
+ "grad_norm": 3.9655888080596924,
+ "learning_rate": 9.446517598601026e-06,
+ "loss": 0.1632,
+ "step": 19528
+ },
+ {
+ "epoch": 53.212534059945504,
+ "grad_norm": 3.9284117221832275,
+ "learning_rate": 9.445636458887804e-06,
+ "loss": 0.1691,
+ "step": 19529
+ },
+ {
+ "epoch": 53.21525885558583,
+ "grad_norm": 6.506946086883545,
+ "learning_rate": 9.444755323491944e-06,
+ "loss": 0.1877,
+ "step": 19530
+ },
+ {
+ "epoch": 53.217983651226156,
+ "grad_norm": 3.3470606803894043,
+ "learning_rate": 9.443874192420312e-06,
+ "loss": 0.1937,
+ "step": 19531
+ },
+ {
+ "epoch": 53.22070844686648,
+ "grad_norm": 4.093039035797119,
+ "learning_rate": 9.442993065679773e-06,
+ "loss": 0.0557,
+ "step": 19532
+ },
+ {
+ "epoch": 53.223433242506815,
+ "grad_norm": 3.836261034011841,
+ "learning_rate": 9.442111943277183e-06,
+ "loss": 0.1796,
+ "step": 19533
+ },
+ {
+ "epoch": 53.22615803814714,
+ "grad_norm": 4.765162944793701,
+ "learning_rate": 9.44123082521941e-06,
+ "loss": 0.122,
+ "step": 19534
+ },
+ {
+ "epoch": 53.228882833787466,
+ "grad_norm": 4.036040782928467,
+ "learning_rate": 9.440349711513311e-06,
+ "loss": 0.0643,
+ "step": 19535
+ },
+ {
+ "epoch": 53.23160762942779,
+ "grad_norm": 5.566751480102539,
+ "learning_rate": 9.439468602165752e-06,
+ "loss": 0.1608,
+ "step": 19536
+ },
+ {
+ "epoch": 53.23433242506812,
+ "grad_norm": 3.435711622238159,
+ "learning_rate": 9.438587497183592e-06,
+ "loss": 0.1056,
+ "step": 19537
+ },
+ {
+ "epoch": 53.237057220708444,
+ "grad_norm": 4.683530807495117,
+ "learning_rate": 9.437706396573693e-06,
+ "loss": 0.1333,
+ "step": 19538
+ },
+ {
+ "epoch": 53.23978201634878,
+ "grad_norm": 3.80041766166687,
+ "learning_rate": 9.43682530034292e-06,
+ "loss": 0.24,
+ "step": 19539
+ },
+ {
+ "epoch": 53.2425068119891,
+ "grad_norm": 4.056492805480957,
+ "learning_rate": 9.435944208498135e-06,
+ "loss": 0.2451,
+ "step": 19540
+ },
+ {
+ "epoch": 53.24523160762943,
+ "grad_norm": 3.077631711959839,
+ "learning_rate": 9.435063121046198e-06,
+ "loss": 0.1398,
+ "step": 19541
+ },
+ {
+ "epoch": 53.247956403269754,
+ "grad_norm": 5.0171990394592285,
+ "learning_rate": 9.43418203799397e-06,
+ "loss": 0.0593,
+ "step": 19542
+ },
+ {
+ "epoch": 53.25068119891008,
+ "grad_norm": 3.7705698013305664,
+ "learning_rate": 9.433300959348317e-06,
+ "loss": 0.1593,
+ "step": 19543
+ },
+ {
+ "epoch": 53.253405994550405,
+ "grad_norm": 17.04795265197754,
+ "learning_rate": 9.432419885116094e-06,
+ "loss": 0.1384,
+ "step": 19544
+ },
+ {
+ "epoch": 53.25613079019074,
+ "grad_norm": 3.9089910984039307,
+ "learning_rate": 9.43153881530417e-06,
+ "loss": 0.0772,
+ "step": 19545
+ },
+ {
+ "epoch": 53.258855585831064,
+ "grad_norm": 4.638715744018555,
+ "learning_rate": 9.4306577499194e-06,
+ "loss": 0.1451,
+ "step": 19546
+ },
+ {
+ "epoch": 53.26158038147139,
+ "grad_norm": 3.2247910499572754,
+ "learning_rate": 9.429776688968654e-06,
+ "loss": 0.0847,
+ "step": 19547
+ },
+ {
+ "epoch": 53.264305177111716,
+ "grad_norm": 3.8689346313476562,
+ "learning_rate": 9.428895632458785e-06,
+ "loss": 0.171,
+ "step": 19548
+ },
+ {
+ "epoch": 53.26702997275204,
+ "grad_norm": 4.553506851196289,
+ "learning_rate": 9.428014580396659e-06,
+ "loss": 0.1897,
+ "step": 19549
+ },
+ {
+ "epoch": 53.26975476839237,
+ "grad_norm": 4.09987211227417,
+ "learning_rate": 9.427133532789137e-06,
+ "loss": 0.1578,
+ "step": 19550
+ },
+ {
+ "epoch": 53.2724795640327,
+ "grad_norm": 3.6810247898101807,
+ "learning_rate": 9.426252489643082e-06,
+ "loss": 0.1001,
+ "step": 19551
+ },
+ {
+ "epoch": 53.275204359673026,
+ "grad_norm": 4.582121849060059,
+ "learning_rate": 9.425371450965352e-06,
+ "loss": 0.1994,
+ "step": 19552
+ },
+ {
+ "epoch": 53.27792915531335,
+ "grad_norm": 2.8743526935577393,
+ "learning_rate": 9.424490416762811e-06,
+ "loss": 0.0879,
+ "step": 19553
+ },
+ {
+ "epoch": 53.28065395095368,
+ "grad_norm": 4.316268444061279,
+ "learning_rate": 9.423609387042322e-06,
+ "loss": 0.1325,
+ "step": 19554
+ },
+ {
+ "epoch": 53.283378746594,
+ "grad_norm": 5.627859115600586,
+ "learning_rate": 9.42272836181074e-06,
+ "loss": 0.2588,
+ "step": 19555
+ },
+ {
+ "epoch": 53.28610354223433,
+ "grad_norm": 5.127203464508057,
+ "learning_rate": 9.421847341074933e-06,
+ "loss": 0.2171,
+ "step": 19556
+ },
+ {
+ "epoch": 53.28882833787466,
+ "grad_norm": 4.550676345825195,
+ "learning_rate": 9.420966324841762e-06,
+ "loss": 0.1611,
+ "step": 19557
+ },
+ {
+ "epoch": 53.29155313351499,
+ "grad_norm": 3.104943037033081,
+ "learning_rate": 9.420085313118086e-06,
+ "loss": 0.0543,
+ "step": 19558
+ },
+ {
+ "epoch": 53.294277929155314,
+ "grad_norm": 3.6725471019744873,
+ "learning_rate": 9.419204305910769e-06,
+ "loss": 0.2162,
+ "step": 19559
+ },
+ {
+ "epoch": 53.29700272479564,
+ "grad_norm": 3.9303996562957764,
+ "learning_rate": 9.418323303226667e-06,
+ "loss": 0.0666,
+ "step": 19560
+ },
+ {
+ "epoch": 53.299727520435965,
+ "grad_norm": 4.273158550262451,
+ "learning_rate": 9.417442305072647e-06,
+ "loss": 0.0828,
+ "step": 19561
+ },
+ {
+ "epoch": 53.30245231607629,
+ "grad_norm": 4.918844699859619,
+ "learning_rate": 9.416561311455565e-06,
+ "loss": 0.0793,
+ "step": 19562
+ },
+ {
+ "epoch": 53.305177111716624,
+ "grad_norm": 6.09805154800415,
+ "learning_rate": 9.415680322382289e-06,
+ "loss": 0.123,
+ "step": 19563
+ },
+ {
+ "epoch": 53.30790190735695,
+ "grad_norm": 4.17274284362793,
+ "learning_rate": 9.41479933785967e-06,
+ "loss": 0.0983,
+ "step": 19564
+ },
+ {
+ "epoch": 53.310626702997276,
+ "grad_norm": 4.336362838745117,
+ "learning_rate": 9.413918357894579e-06,
+ "loss": 0.0565,
+ "step": 19565
+ },
+ {
+ "epoch": 53.3133514986376,
+ "grad_norm": 5.13599967956543,
+ "learning_rate": 9.41303738249387e-06,
+ "loss": 0.3572,
+ "step": 19566
+ },
+ {
+ "epoch": 53.31607629427793,
+ "grad_norm": 3.890084743499756,
+ "learning_rate": 9.41215641166441e-06,
+ "loss": 0.167,
+ "step": 19567
+ },
+ {
+ "epoch": 53.31880108991825,
+ "grad_norm": 3.838386297225952,
+ "learning_rate": 9.411275445413055e-06,
+ "loss": 0.2074,
+ "step": 19568
+ },
+ {
+ "epoch": 53.321525885558586,
+ "grad_norm": 3.0424602031707764,
+ "learning_rate": 9.41039448374667e-06,
+ "loss": 0.0788,
+ "step": 19569
+ },
+ {
+ "epoch": 53.32425068119891,
+ "grad_norm": 3.4019460678100586,
+ "learning_rate": 9.409513526672111e-06,
+ "loss": 0.0977,
+ "step": 19570
+ },
+ {
+ "epoch": 53.32697547683924,
+ "grad_norm": 4.269498825073242,
+ "learning_rate": 9.408632574196245e-06,
+ "loss": 0.2103,
+ "step": 19571
+ },
+ {
+ "epoch": 53.32970027247956,
+ "grad_norm": 6.106554985046387,
+ "learning_rate": 9.407751626325922e-06,
+ "loss": 0.1869,
+ "step": 19572
+ },
+ {
+ "epoch": 53.33242506811989,
+ "grad_norm": 5.24274206161499,
+ "learning_rate": 9.406870683068017e-06,
+ "loss": 0.1613,
+ "step": 19573
+ },
+ {
+ "epoch": 53.335149863760215,
+ "grad_norm": 3.7461729049682617,
+ "learning_rate": 9.40598974442938e-06,
+ "loss": 0.086,
+ "step": 19574
+ },
+ {
+ "epoch": 53.33787465940055,
+ "grad_norm": 5.346202850341797,
+ "learning_rate": 9.405108810416881e-06,
+ "loss": 0.0685,
+ "step": 19575
+ },
+ {
+ "epoch": 53.34059945504087,
+ "grad_norm": 5.928539276123047,
+ "learning_rate": 9.404227881037372e-06,
+ "loss": 0.1774,
+ "step": 19576
+ },
+ {
+ "epoch": 53.3433242506812,
+ "grad_norm": 4.118345737457275,
+ "learning_rate": 9.40334695629772e-06,
+ "loss": 0.1966,
+ "step": 19577
+ },
+ {
+ "epoch": 53.346049046321525,
+ "grad_norm": 4.071616172790527,
+ "learning_rate": 9.402466036204779e-06,
+ "loss": 0.0869,
+ "step": 19578
+ },
+ {
+ "epoch": 53.34877384196185,
+ "grad_norm": 4.851202011108398,
+ "learning_rate": 9.401585120765416e-06,
+ "loss": 0.0747,
+ "step": 19579
+ },
+ {
+ "epoch": 53.35149863760218,
+ "grad_norm": 5.652044773101807,
+ "learning_rate": 9.400704209986488e-06,
+ "loss": 0.1734,
+ "step": 19580
+ },
+ {
+ "epoch": 53.35422343324251,
+ "grad_norm": 4.022444248199463,
+ "learning_rate": 9.399823303874856e-06,
+ "loss": 0.0729,
+ "step": 19581
+ },
+ {
+ "epoch": 53.356948228882835,
+ "grad_norm": 3.748548746109009,
+ "learning_rate": 9.398942402437382e-06,
+ "loss": 0.212,
+ "step": 19582
+ },
+ {
+ "epoch": 53.35967302452316,
+ "grad_norm": 3.7141458988189697,
+ "learning_rate": 9.398061505680925e-06,
+ "loss": 0.0992,
+ "step": 19583
+ },
+ {
+ "epoch": 53.36239782016349,
+ "grad_norm": 3.743070125579834,
+ "learning_rate": 9.397180613612343e-06,
+ "loss": 0.0816,
+ "step": 19584
+ },
+ {
+ "epoch": 53.36512261580381,
+ "grad_norm": 3.78251314163208,
+ "learning_rate": 9.396299726238501e-06,
+ "loss": 0.0992,
+ "step": 19585
+ },
+ {
+ "epoch": 53.36784741144414,
+ "grad_norm": 3.9803833961486816,
+ "learning_rate": 9.395418843566257e-06,
+ "loss": 0.126,
+ "step": 19586
+ },
+ {
+ "epoch": 53.37057220708447,
+ "grad_norm": 4.991311550140381,
+ "learning_rate": 9.394537965602473e-06,
+ "loss": 0.0616,
+ "step": 19587
+ },
+ {
+ "epoch": 53.3732970027248,
+ "grad_norm": 4.265721321105957,
+ "learning_rate": 9.393657092354005e-06,
+ "loss": 0.1159,
+ "step": 19588
+ },
+ {
+ "epoch": 53.37602179836512,
+ "grad_norm": 4.968245029449463,
+ "learning_rate": 9.392776223827715e-06,
+ "loss": 0.1558,
+ "step": 19589
+ },
+ {
+ "epoch": 53.37874659400545,
+ "grad_norm": 4.296175479888916,
+ "learning_rate": 9.391895360030467e-06,
+ "loss": 0.1086,
+ "step": 19590
+ },
+ {
+ "epoch": 53.381471389645775,
+ "grad_norm": 5.016697883605957,
+ "learning_rate": 9.391014500969118e-06,
+ "loss": 0.136,
+ "step": 19591
+ },
+ {
+ "epoch": 53.3841961852861,
+ "grad_norm": 4.269606113433838,
+ "learning_rate": 9.39013364665053e-06,
+ "loss": 0.2055,
+ "step": 19592
+ },
+ {
+ "epoch": 53.38692098092643,
+ "grad_norm": 5.176723003387451,
+ "learning_rate": 9.389252797081558e-06,
+ "loss": 0.0906,
+ "step": 19593
+ },
+ {
+ "epoch": 53.38964577656676,
+ "grad_norm": 3.5410618782043457,
+ "learning_rate": 9.388371952269068e-06,
+ "loss": 0.1775,
+ "step": 19594
+ },
+ {
+ "epoch": 53.392370572207085,
+ "grad_norm": 11.931692123413086,
+ "learning_rate": 9.387491112219917e-06,
+ "loss": 0.1672,
+ "step": 19595
+ },
+ {
+ "epoch": 53.39509536784741,
+ "grad_norm": 4.841396331787109,
+ "learning_rate": 9.386610276940966e-06,
+ "loss": 0.1384,
+ "step": 19596
+ },
+ {
+ "epoch": 53.39782016348774,
+ "grad_norm": 3.4168834686279297,
+ "learning_rate": 9.385729446439074e-06,
+ "loss": 0.1335,
+ "step": 19597
+ },
+ {
+ "epoch": 53.40054495912806,
+ "grad_norm": 4.518017768859863,
+ "learning_rate": 9.384848620721102e-06,
+ "loss": 0.0872,
+ "step": 19598
+ },
+ {
+ "epoch": 53.403269754768395,
+ "grad_norm": 3.9464101791381836,
+ "learning_rate": 9.38396779979391e-06,
+ "loss": 0.226,
+ "step": 19599
+ },
+ {
+ "epoch": 53.40599455040872,
+ "grad_norm": 3.6357007026672363,
+ "learning_rate": 9.383086983664354e-06,
+ "loss": 0.1953,
+ "step": 19600
+ },
+ {
+ "epoch": 53.40871934604905,
+ "grad_norm": 3.898745059967041,
+ "learning_rate": 9.3822061723393e-06,
+ "loss": 0.1117,
+ "step": 19601
+ },
+ {
+ "epoch": 53.41144414168937,
+ "grad_norm": 5.000555038452148,
+ "learning_rate": 9.381325365825601e-06,
+ "loss": 0.086,
+ "step": 19602
+ },
+ {
+ "epoch": 53.4141689373297,
+ "grad_norm": 4.185770034790039,
+ "learning_rate": 9.380444564130124e-06,
+ "loss": 0.2016,
+ "step": 19603
+ },
+ {
+ "epoch": 53.416893732970024,
+ "grad_norm": 4.505792140960693,
+ "learning_rate": 9.379563767259721e-06,
+ "loss": 0.1441,
+ "step": 19604
+ },
+ {
+ "epoch": 53.41961852861036,
+ "grad_norm": 5.0290632247924805,
+ "learning_rate": 9.378682975221258e-06,
+ "loss": 0.1137,
+ "step": 19605
+ },
+ {
+ "epoch": 53.42234332425068,
+ "grad_norm": 6.182051181793213,
+ "learning_rate": 9.37780218802159e-06,
+ "loss": 0.1923,
+ "step": 19606
+ },
+ {
+ "epoch": 53.42506811989101,
+ "grad_norm": 4.861679553985596,
+ "learning_rate": 9.376921405667576e-06,
+ "loss": 0.1379,
+ "step": 19607
+ },
+ {
+ "epoch": 53.427792915531334,
+ "grad_norm": 9.390670776367188,
+ "learning_rate": 9.376040628166084e-06,
+ "loss": 0.0715,
+ "step": 19608
+ },
+ {
+ "epoch": 53.43051771117166,
+ "grad_norm": 3.188892364501953,
+ "learning_rate": 9.375159855523964e-06,
+ "loss": 0.0807,
+ "step": 19609
+ },
+ {
+ "epoch": 53.433242506811986,
+ "grad_norm": 4.040568828582764,
+ "learning_rate": 9.374279087748082e-06,
+ "loss": 0.1842,
+ "step": 19610
+ },
+ {
+ "epoch": 53.43596730245232,
+ "grad_norm": 4.385910987854004,
+ "learning_rate": 9.37339832484529e-06,
+ "loss": 0.1429,
+ "step": 19611
+ },
+ {
+ "epoch": 53.438692098092645,
+ "grad_norm": 5.230727672576904,
+ "learning_rate": 9.372517566822456e-06,
+ "loss": 0.1741,
+ "step": 19612
+ },
+ {
+ "epoch": 53.44141689373297,
+ "grad_norm": 3.943782091140747,
+ "learning_rate": 9.371636813686433e-06,
+ "loss": 0.1633,
+ "step": 19613
+ },
+ {
+ "epoch": 53.444141689373296,
+ "grad_norm": 4.666703224182129,
+ "learning_rate": 9.370756065444083e-06,
+ "loss": 0.2011,
+ "step": 19614
+ },
+ {
+ "epoch": 53.44686648501362,
+ "grad_norm": 3.6243550777435303,
+ "learning_rate": 9.369875322102262e-06,
+ "loss": 0.1088,
+ "step": 19615
+ },
+ {
+ "epoch": 53.44959128065395,
+ "grad_norm": 5.502617359161377,
+ "learning_rate": 9.368994583667835e-06,
+ "loss": 0.1672,
+ "step": 19616
+ },
+ {
+ "epoch": 53.45231607629428,
+ "grad_norm": 4.114571571350098,
+ "learning_rate": 9.368113850147655e-06,
+ "loss": 0.0948,
+ "step": 19617
+ },
+ {
+ "epoch": 53.45504087193461,
+ "grad_norm": 4.559849262237549,
+ "learning_rate": 9.367233121548585e-06,
+ "loss": 0.1499,
+ "step": 19618
+ },
+ {
+ "epoch": 53.45776566757493,
+ "grad_norm": 5.137974262237549,
+ "learning_rate": 9.366352397877485e-06,
+ "loss": 0.1878,
+ "step": 19619
+ },
+ {
+ "epoch": 53.46049046321526,
+ "grad_norm": 4.2125139236450195,
+ "learning_rate": 9.36547167914121e-06,
+ "loss": 0.168,
+ "step": 19620
+ },
+ {
+ "epoch": 53.463215258855584,
+ "grad_norm": 4.2992377281188965,
+ "learning_rate": 9.364590965346622e-06,
+ "loss": 0.1176,
+ "step": 19621
+ },
+ {
+ "epoch": 53.46594005449591,
+ "grad_norm": 3.483376979827881,
+ "learning_rate": 9.363710256500578e-06,
+ "loss": 0.1051,
+ "step": 19622
+ },
+ {
+ "epoch": 53.46866485013624,
+ "grad_norm": 4.003507137298584,
+ "learning_rate": 9.36282955260994e-06,
+ "loss": 0.0981,
+ "step": 19623
+ },
+ {
+ "epoch": 53.47138964577657,
+ "grad_norm": 7.440272331237793,
+ "learning_rate": 9.361948853681562e-06,
+ "loss": 0.1848,
+ "step": 19624
+ },
+ {
+ "epoch": 53.474114441416894,
+ "grad_norm": 3.835020065307617,
+ "learning_rate": 9.361068159722306e-06,
+ "loss": 0.1417,
+ "step": 19625
+ },
+ {
+ "epoch": 53.47683923705722,
+ "grad_norm": 9.260590553283691,
+ "learning_rate": 9.360187470739033e-06,
+ "loss": 0.0837,
+ "step": 19626
+ },
+ {
+ "epoch": 53.479564032697546,
+ "grad_norm": 3.928607702255249,
+ "learning_rate": 9.359306786738598e-06,
+ "loss": 0.1703,
+ "step": 19627
+ },
+ {
+ "epoch": 53.48228882833787,
+ "grad_norm": 5.6095051765441895,
+ "learning_rate": 9.358426107727862e-06,
+ "loss": 0.153,
+ "step": 19628
+ },
+ {
+ "epoch": 53.485013623978205,
+ "grad_norm": 5.017398357391357,
+ "learning_rate": 9.357545433713683e-06,
+ "loss": 0.1423,
+ "step": 19629
+ },
+ {
+ "epoch": 53.48773841961853,
+ "grad_norm": 3.781545877456665,
+ "learning_rate": 9.35666476470292e-06,
+ "loss": 0.1471,
+ "step": 19630
+ },
+ {
+ "epoch": 53.490463215258856,
+ "grad_norm": 6.276341438293457,
+ "learning_rate": 9.35578410070243e-06,
+ "loss": 0.2157,
+ "step": 19631
+ },
+ {
+ "epoch": 53.49318801089918,
+ "grad_norm": 5.679474830627441,
+ "learning_rate": 9.354903441719073e-06,
+ "loss": 0.2014,
+ "step": 19632
+ },
+ {
+ "epoch": 53.49591280653951,
+ "grad_norm": 4.954401016235352,
+ "learning_rate": 9.354022787759707e-06,
+ "loss": 0.1579,
+ "step": 19633
+ },
+ {
+ "epoch": 53.49863760217983,
+ "grad_norm": 6.598718166351318,
+ "learning_rate": 9.353142138831192e-06,
+ "loss": 0.1546,
+ "step": 19634
+ },
+ {
+ "epoch": 53.50136239782017,
+ "grad_norm": 7.953682899475098,
+ "learning_rate": 9.352261494940382e-06,
+ "loss": 0.0758,
+ "step": 19635
+ },
+ {
+ "epoch": 53.50408719346049,
+ "grad_norm": 4.217384338378906,
+ "learning_rate": 9.351380856094142e-06,
+ "loss": 0.1745,
+ "step": 19636
+ },
+ {
+ "epoch": 53.50681198910082,
+ "grad_norm": 5.816168308258057,
+ "learning_rate": 9.350500222299326e-06,
+ "loss": 0.0973,
+ "step": 19637
+ },
+ {
+ "epoch": 53.509536784741144,
+ "grad_norm": 3.9512689113616943,
+ "learning_rate": 9.349619593562793e-06,
+ "loss": 0.1299,
+ "step": 19638
+ },
+ {
+ "epoch": 53.51226158038147,
+ "grad_norm": 4.017214775085449,
+ "learning_rate": 9.348738969891402e-06,
+ "loss": 0.105,
+ "step": 19639
+ },
+ {
+ "epoch": 53.514986376021795,
+ "grad_norm": 4.038506507873535,
+ "learning_rate": 9.34785835129201e-06,
+ "loss": 0.0985,
+ "step": 19640
+ },
+ {
+ "epoch": 53.51771117166213,
+ "grad_norm": 4.767246723175049,
+ "learning_rate": 9.346977737771471e-06,
+ "loss": 0.1997,
+ "step": 19641
+ },
+ {
+ "epoch": 53.520435967302454,
+ "grad_norm": 4.974850654602051,
+ "learning_rate": 9.346097129336658e-06,
+ "loss": 0.1952,
+ "step": 19642
+ },
+ {
+ "epoch": 53.52316076294278,
+ "grad_norm": 4.244633674621582,
+ "learning_rate": 9.345216525994415e-06,
+ "loss": 0.101,
+ "step": 19643
+ },
+ {
+ "epoch": 53.525885558583106,
+ "grad_norm": 4.580294132232666,
+ "learning_rate": 9.344335927751606e-06,
+ "loss": 0.2573,
+ "step": 19644
+ },
+ {
+ "epoch": 53.52861035422343,
+ "grad_norm": 4.44301176071167,
+ "learning_rate": 9.343455334615085e-06,
+ "loss": 0.2257,
+ "step": 19645
+ },
+ {
+ "epoch": 53.53133514986376,
+ "grad_norm": 4.0705671310424805,
+ "learning_rate": 9.342574746591718e-06,
+ "loss": 0.0916,
+ "step": 19646
+ },
+ {
+ "epoch": 53.53405994550409,
+ "grad_norm": 3.968733310699463,
+ "learning_rate": 9.341694163688352e-06,
+ "loss": 0.1892,
+ "step": 19647
+ },
+ {
+ "epoch": 53.536784741144416,
+ "grad_norm": 3.490436553955078,
+ "learning_rate": 9.340813585911854e-06,
+ "loss": 0.206,
+ "step": 19648
+ },
+ {
+ "epoch": 53.53950953678474,
+ "grad_norm": 4.871994972229004,
+ "learning_rate": 9.339933013269076e-06,
+ "loss": 0.1334,
+ "step": 19649
+ },
+ {
+ "epoch": 53.54223433242507,
+ "grad_norm": 3.9973957538604736,
+ "learning_rate": 9.339052445766883e-06,
+ "loss": 0.1299,
+ "step": 19650
+ },
+ {
+ "epoch": 53.54495912806539,
+ "grad_norm": 5.820115089416504,
+ "learning_rate": 9.338171883412123e-06,
+ "loss": 0.0772,
+ "step": 19651
+ },
+ {
+ "epoch": 53.54768392370572,
+ "grad_norm": 5.841065883636475,
+ "learning_rate": 9.337291326211663e-06,
+ "loss": 0.1235,
+ "step": 19652
+ },
+ {
+ "epoch": 53.55040871934605,
+ "grad_norm": 4.874732494354248,
+ "learning_rate": 9.336410774172356e-06,
+ "loss": 0.094,
+ "step": 19653
+ },
+ {
+ "epoch": 53.55313351498638,
+ "grad_norm": 4.347428321838379,
+ "learning_rate": 9.33553022730106e-06,
+ "loss": 0.0655,
+ "step": 19654
+ },
+ {
+ "epoch": 53.555858310626704,
+ "grad_norm": 3.9326961040496826,
+ "learning_rate": 9.334649685604632e-06,
+ "loss": 0.2916,
+ "step": 19655
+ },
+ {
+ "epoch": 53.55858310626703,
+ "grad_norm": 3.449640989303589,
+ "learning_rate": 9.333769149089934e-06,
+ "loss": 0.0591,
+ "step": 19656
+ },
+ {
+ "epoch": 53.561307901907355,
+ "grad_norm": 8.750727653503418,
+ "learning_rate": 9.332888617763816e-06,
+ "loss": 0.1439,
+ "step": 19657
+ },
+ {
+ "epoch": 53.56403269754768,
+ "grad_norm": 3.458325147628784,
+ "learning_rate": 9.33200809163314e-06,
+ "loss": 0.1673,
+ "step": 19658
+ },
+ {
+ "epoch": 53.566757493188014,
+ "grad_norm": 4.965142250061035,
+ "learning_rate": 9.331127570704765e-06,
+ "loss": 0.121,
+ "step": 19659
+ },
+ {
+ "epoch": 53.56948228882834,
+ "grad_norm": 3.2240495681762695,
+ "learning_rate": 9.330247054985548e-06,
+ "loss": 0.0541,
+ "step": 19660
+ },
+ {
+ "epoch": 53.572207084468666,
+ "grad_norm": 5.976936340332031,
+ "learning_rate": 9.329366544482346e-06,
+ "loss": 0.1824,
+ "step": 19661
+ },
+ {
+ "epoch": 53.57493188010899,
+ "grad_norm": 5.07879114151001,
+ "learning_rate": 9.328486039202015e-06,
+ "loss": 0.1499,
+ "step": 19662
+ },
+ {
+ "epoch": 53.57765667574932,
+ "grad_norm": 4.073906421661377,
+ "learning_rate": 9.327605539151412e-06,
+ "loss": 0.1132,
+ "step": 19663
+ },
+ {
+ "epoch": 53.58038147138964,
+ "grad_norm": 5.997085094451904,
+ "learning_rate": 9.326725044337398e-06,
+ "loss": 0.1735,
+ "step": 19664
+ },
+ {
+ "epoch": 53.583106267029976,
+ "grad_norm": 4.1504011154174805,
+ "learning_rate": 9.325844554766826e-06,
+ "loss": 0.0876,
+ "step": 19665
+ },
+ {
+ "epoch": 53.5858310626703,
+ "grad_norm": 4.301466941833496,
+ "learning_rate": 9.324964070446556e-06,
+ "loss": 0.1104,
+ "step": 19666
+ },
+ {
+ "epoch": 53.58855585831063,
+ "grad_norm": 3.404266595840454,
+ "learning_rate": 9.324083591383441e-06,
+ "loss": 0.1102,
+ "step": 19667
+ },
+ {
+ "epoch": 53.59128065395095,
+ "grad_norm": 4.574977874755859,
+ "learning_rate": 9.323203117584345e-06,
+ "loss": 0.1417,
+ "step": 19668
+ },
+ {
+ "epoch": 53.59400544959128,
+ "grad_norm": 5.017419815063477,
+ "learning_rate": 9.322322649056118e-06,
+ "loss": 0.0789,
+ "step": 19669
+ },
+ {
+ "epoch": 53.596730245231605,
+ "grad_norm": 3.7074153423309326,
+ "learning_rate": 9.321442185805625e-06,
+ "loss": 0.1018,
+ "step": 19670
+ },
+ {
+ "epoch": 53.59945504087194,
+ "grad_norm": 3.648831605911255,
+ "learning_rate": 9.320561727839715e-06,
+ "loss": 0.0912,
+ "step": 19671
+ },
+ {
+ "epoch": 53.60217983651226,
+ "grad_norm": 3.8857266902923584,
+ "learning_rate": 9.31968127516525e-06,
+ "loss": 0.1843,
+ "step": 19672
+ },
+ {
+ "epoch": 53.60490463215259,
+ "grad_norm": 4.4822678565979,
+ "learning_rate": 9.318800827789082e-06,
+ "loss": 0.138,
+ "step": 19673
+ },
+ {
+ "epoch": 53.607629427792915,
+ "grad_norm": 7.120094299316406,
+ "learning_rate": 9.317920385718075e-06,
+ "loss": 0.1012,
+ "step": 19674
+ },
+ {
+ "epoch": 53.61035422343324,
+ "grad_norm": 4.695366859436035,
+ "learning_rate": 9.317039948959077e-06,
+ "loss": 0.2115,
+ "step": 19675
+ },
+ {
+ "epoch": 53.61307901907357,
+ "grad_norm": 5.063755989074707,
+ "learning_rate": 9.316159517518952e-06,
+ "loss": 0.1157,
+ "step": 19676
+ },
+ {
+ "epoch": 53.6158038147139,
+ "grad_norm": 3.6411147117614746,
+ "learning_rate": 9.315279091404558e-06,
+ "loss": 0.118,
+ "step": 19677
+ },
+ {
+ "epoch": 53.618528610354225,
+ "grad_norm": 3.6441879272460938,
+ "learning_rate": 9.314398670622745e-06,
+ "loss": 0.1094,
+ "step": 19678
+ },
+ {
+ "epoch": 53.62125340599455,
+ "grad_norm": 3.994708299636841,
+ "learning_rate": 9.313518255180375e-06,
+ "loss": 0.118,
+ "step": 19679
+ },
+ {
+ "epoch": 53.62397820163488,
+ "grad_norm": 4.216256618499756,
+ "learning_rate": 9.312637845084303e-06,
+ "loss": 0.3642,
+ "step": 19680
+ },
+ {
+ "epoch": 53.6267029972752,
+ "grad_norm": 14.634512901306152,
+ "learning_rate": 9.311757440341384e-06,
+ "loss": 0.0635,
+ "step": 19681
+ },
+ {
+ "epoch": 53.62942779291553,
+ "grad_norm": 5.584765911102295,
+ "learning_rate": 9.310877040958478e-06,
+ "loss": 0.2964,
+ "step": 19682
+ },
+ {
+ "epoch": 53.63215258855586,
+ "grad_norm": 4.533825397491455,
+ "learning_rate": 9.309996646942437e-06,
+ "loss": 0.1632,
+ "step": 19683
+ },
+ {
+ "epoch": 53.63487738419619,
+ "grad_norm": 3.7038753032684326,
+ "learning_rate": 9.309116258300121e-06,
+ "loss": 0.1072,
+ "step": 19684
+ },
+ {
+ "epoch": 53.63760217983651,
+ "grad_norm": 4.378421783447266,
+ "learning_rate": 9.308235875038385e-06,
+ "loss": 0.0795,
+ "step": 19685
+ },
+ {
+ "epoch": 53.64032697547684,
+ "grad_norm": 4.553260326385498,
+ "learning_rate": 9.307355497164086e-06,
+ "loss": 0.1498,
+ "step": 19686
+ },
+ {
+ "epoch": 53.643051771117165,
+ "grad_norm": 4.38962984085083,
+ "learning_rate": 9.30647512468408e-06,
+ "loss": 0.0908,
+ "step": 19687
+ },
+ {
+ "epoch": 53.64577656675749,
+ "grad_norm": 4.790590763092041,
+ "learning_rate": 9.305594757605226e-06,
+ "loss": 0.1962,
+ "step": 19688
+ },
+ {
+ "epoch": 53.64850136239782,
+ "grad_norm": 3.918919801712036,
+ "learning_rate": 9.304714395934373e-06,
+ "loss": 0.1113,
+ "step": 19689
+ },
+ {
+ "epoch": 53.65122615803815,
+ "grad_norm": 4.994433879852295,
+ "learning_rate": 9.303834039678386e-06,
+ "loss": 0.1298,
+ "step": 19690
+ },
+ {
+ "epoch": 53.653950953678475,
+ "grad_norm": 13.808565139770508,
+ "learning_rate": 9.302953688844113e-06,
+ "loss": 0.139,
+ "step": 19691
+ },
+ {
+ "epoch": 53.6566757493188,
+ "grad_norm": 3.9738388061523438,
+ "learning_rate": 9.302073343438414e-06,
+ "loss": 0.0788,
+ "step": 19692
+ },
+ {
+ "epoch": 53.65940054495913,
+ "grad_norm": 3.889005184173584,
+ "learning_rate": 9.301193003468148e-06,
+ "loss": 0.2035,
+ "step": 19693
+ },
+ {
+ "epoch": 53.66212534059945,
+ "grad_norm": 4.200675010681152,
+ "learning_rate": 9.300312668940168e-06,
+ "loss": 0.1692,
+ "step": 19694
+ },
+ {
+ "epoch": 53.664850136239785,
+ "grad_norm": 7.192455768585205,
+ "learning_rate": 9.299432339861332e-06,
+ "loss": 0.0972,
+ "step": 19695
+ },
+ {
+ "epoch": 53.66757493188011,
+ "grad_norm": 3.8765366077423096,
+ "learning_rate": 9.298552016238492e-06,
+ "loss": 0.1349,
+ "step": 19696
+ },
+ {
+ "epoch": 53.67029972752044,
+ "grad_norm": 3.9085135459899902,
+ "learning_rate": 9.297671698078508e-06,
+ "loss": 0.1553,
+ "step": 19697
+ },
+ {
+ "epoch": 53.67302452316076,
+ "grad_norm": 5.163697719573975,
+ "learning_rate": 9.296791385388233e-06,
+ "loss": 0.11,
+ "step": 19698
+ },
+ {
+ "epoch": 53.67574931880109,
+ "grad_norm": 5.267614364624023,
+ "learning_rate": 9.295911078174526e-06,
+ "loss": 0.0688,
+ "step": 19699
+ },
+ {
+ "epoch": 53.678474114441414,
+ "grad_norm": 3.7285704612731934,
+ "learning_rate": 9.295030776444239e-06,
+ "loss": 0.0697,
+ "step": 19700
+ },
+ {
+ "epoch": 53.68119891008175,
+ "grad_norm": 3.6111433506011963,
+ "learning_rate": 9.29415048020423e-06,
+ "loss": 0.0731,
+ "step": 19701
+ },
+ {
+ "epoch": 53.68392370572207,
+ "grad_norm": 4.5582194328308105,
+ "learning_rate": 9.293270189461354e-06,
+ "loss": 0.1186,
+ "step": 19702
+ },
+ {
+ "epoch": 53.6866485013624,
+ "grad_norm": 3.8478405475616455,
+ "learning_rate": 9.292389904222468e-06,
+ "loss": 0.1078,
+ "step": 19703
+ },
+ {
+ "epoch": 53.689373297002724,
+ "grad_norm": 3.536839246749878,
+ "learning_rate": 9.291509624494426e-06,
+ "loss": 0.1933,
+ "step": 19704
+ },
+ {
+ "epoch": 53.69209809264305,
+ "grad_norm": 5.006591796875,
+ "learning_rate": 9.290629350284083e-06,
+ "loss": 0.2957,
+ "step": 19705
+ },
+ {
+ "epoch": 53.694822888283376,
+ "grad_norm": 5.5485358238220215,
+ "learning_rate": 9.289749081598298e-06,
+ "loss": 0.1277,
+ "step": 19706
+ },
+ {
+ "epoch": 53.69754768392371,
+ "grad_norm": 5.355322360992432,
+ "learning_rate": 9.288868818443923e-06,
+ "loss": 0.099,
+ "step": 19707
+ },
+ {
+ "epoch": 53.700272479564035,
+ "grad_norm": 3.967392683029175,
+ "learning_rate": 9.287988560827814e-06,
+ "loss": 0.0798,
+ "step": 19708
+ },
+ {
+ "epoch": 53.70299727520436,
+ "grad_norm": 4.786160469055176,
+ "learning_rate": 9.28710830875683e-06,
+ "loss": 0.0903,
+ "step": 19709
+ },
+ {
+ "epoch": 53.705722070844686,
+ "grad_norm": 4.865747451782227,
+ "learning_rate": 9.286228062237817e-06,
+ "loss": 0.2441,
+ "step": 19710
+ },
+ {
+ "epoch": 53.70844686648501,
+ "grad_norm": 7.860928535461426,
+ "learning_rate": 9.285347821277644e-06,
+ "loss": 0.2467,
+ "step": 19711
+ },
+ {
+ "epoch": 53.71117166212534,
+ "grad_norm": 3.6451687812805176,
+ "learning_rate": 9.284467585883156e-06,
+ "loss": 0.1245,
+ "step": 19712
+ },
+ {
+ "epoch": 53.71389645776567,
+ "grad_norm": 3.020920753479004,
+ "learning_rate": 9.283587356061214e-06,
+ "loss": 0.0737,
+ "step": 19713
+ },
+ {
+ "epoch": 53.716621253406,
+ "grad_norm": 4.057181358337402,
+ "learning_rate": 9.282707131818666e-06,
+ "loss": 0.1006,
+ "step": 19714
+ },
+ {
+ "epoch": 53.71934604904632,
+ "grad_norm": 5.180568218231201,
+ "learning_rate": 9.281826913162377e-06,
+ "loss": 0.11,
+ "step": 19715
+ },
+ {
+ "epoch": 53.72207084468665,
+ "grad_norm": 3.8155879974365234,
+ "learning_rate": 9.280946700099194e-06,
+ "loss": 0.1056,
+ "step": 19716
+ },
+ {
+ "epoch": 53.724795640326974,
+ "grad_norm": 3.676067352294922,
+ "learning_rate": 9.280066492635976e-06,
+ "loss": 0.0866,
+ "step": 19717
+ },
+ {
+ "epoch": 53.7275204359673,
+ "grad_norm": 6.118213653564453,
+ "learning_rate": 9.279186290779576e-06,
+ "loss": 0.095,
+ "step": 19718
+ },
+ {
+ "epoch": 53.73024523160763,
+ "grad_norm": 3.4128832817077637,
+ "learning_rate": 9.278306094536851e-06,
+ "loss": 0.0771,
+ "step": 19719
+ },
+ {
+ "epoch": 53.73297002724796,
+ "grad_norm": 4.553577423095703,
+ "learning_rate": 9.277425903914654e-06,
+ "loss": 0.0841,
+ "step": 19720
+ },
+ {
+ "epoch": 53.735694822888284,
+ "grad_norm": 6.063533782958984,
+ "learning_rate": 9.276545718919842e-06,
+ "loss": 0.1039,
+ "step": 19721
+ },
+ {
+ "epoch": 53.73841961852861,
+ "grad_norm": 4.499881267547607,
+ "learning_rate": 9.275665539559268e-06,
+ "loss": 0.1192,
+ "step": 19722
+ },
+ {
+ "epoch": 53.741144414168936,
+ "grad_norm": 5.290197372436523,
+ "learning_rate": 9.274785365839788e-06,
+ "loss": 0.0744,
+ "step": 19723
+ },
+ {
+ "epoch": 53.74386920980926,
+ "grad_norm": 4.888653755187988,
+ "learning_rate": 9.273905197768254e-06,
+ "loss": 0.165,
+ "step": 19724
+ },
+ {
+ "epoch": 53.746594005449595,
+ "grad_norm": 4.740888595581055,
+ "learning_rate": 9.273025035351526e-06,
+ "loss": 0.1876,
+ "step": 19725
+ },
+ {
+ "epoch": 53.74931880108992,
+ "grad_norm": 4.391806602478027,
+ "learning_rate": 9.272144878596454e-06,
+ "loss": 0.1214,
+ "step": 19726
+ },
+ {
+ "epoch": 53.752043596730246,
+ "grad_norm": 4.5872979164123535,
+ "learning_rate": 9.27126472750989e-06,
+ "loss": 0.1286,
+ "step": 19727
+ },
+ {
+ "epoch": 53.75476839237057,
+ "grad_norm": 4.158890724182129,
+ "learning_rate": 9.270384582098697e-06,
+ "loss": 0.0627,
+ "step": 19728
+ },
+ {
+ "epoch": 53.7574931880109,
+ "grad_norm": 3.866898775100708,
+ "learning_rate": 9.269504442369727e-06,
+ "loss": 0.1161,
+ "step": 19729
+ },
+ {
+ "epoch": 53.76021798365122,
+ "grad_norm": 4.930418491363525,
+ "learning_rate": 9.26862430832983e-06,
+ "loss": 0.1342,
+ "step": 19730
+ },
+ {
+ "epoch": 53.762942779291556,
+ "grad_norm": 8.506067276000977,
+ "learning_rate": 9.267744179985866e-06,
+ "loss": 0.1787,
+ "step": 19731
+ },
+ {
+ "epoch": 53.76566757493188,
+ "grad_norm": 5.147566318511963,
+ "learning_rate": 9.266864057344684e-06,
+ "loss": 0.0604,
+ "step": 19732
+ },
+ {
+ "epoch": 53.76839237057221,
+ "grad_norm": 9.657304763793945,
+ "learning_rate": 9.265983940413145e-06,
+ "loss": 0.1791,
+ "step": 19733
+ },
+ {
+ "epoch": 53.771117166212534,
+ "grad_norm": 4.672646999359131,
+ "learning_rate": 9.265103829198096e-06,
+ "loss": 0.1003,
+ "step": 19734
+ },
+ {
+ "epoch": 53.77384196185286,
+ "grad_norm": 4.547515392303467,
+ "learning_rate": 9.264223723706397e-06,
+ "loss": 0.0902,
+ "step": 19735
+ },
+ {
+ "epoch": 53.776566757493185,
+ "grad_norm": 2.914116382598877,
+ "learning_rate": 9.263343623944899e-06,
+ "loss": 0.0588,
+ "step": 19736
+ },
+ {
+ "epoch": 53.77929155313352,
+ "grad_norm": 4.2892961502075195,
+ "learning_rate": 9.262463529920458e-06,
+ "loss": 0.166,
+ "step": 19737
+ },
+ {
+ "epoch": 53.782016348773844,
+ "grad_norm": 3.9462146759033203,
+ "learning_rate": 9.261583441639926e-06,
+ "loss": 0.1907,
+ "step": 19738
+ },
+ {
+ "epoch": 53.78474114441417,
+ "grad_norm": 4.957346439361572,
+ "learning_rate": 9.26070335911016e-06,
+ "loss": 0.1905,
+ "step": 19739
+ },
+ {
+ "epoch": 53.787465940054496,
+ "grad_norm": 3.814995288848877,
+ "learning_rate": 9.259823282338008e-06,
+ "loss": 0.1315,
+ "step": 19740
+ },
+ {
+ "epoch": 53.79019073569482,
+ "grad_norm": 3.8015565872192383,
+ "learning_rate": 9.258943211330334e-06,
+ "loss": 0.0887,
+ "step": 19741
+ },
+ {
+ "epoch": 53.79291553133515,
+ "grad_norm": 3.8807504177093506,
+ "learning_rate": 9.258063146093984e-06,
+ "loss": 0.2631,
+ "step": 19742
+ },
+ {
+ "epoch": 53.79564032697548,
+ "grad_norm": 5.895612716674805,
+ "learning_rate": 9.257183086635814e-06,
+ "loss": 0.2002,
+ "step": 19743
+ },
+ {
+ "epoch": 53.798365122615806,
+ "grad_norm": 5.0606369972229,
+ "learning_rate": 9.256303032962676e-06,
+ "loss": 0.2234,
+ "step": 19744
+ },
+ {
+ "epoch": 53.80108991825613,
+ "grad_norm": 5.166808128356934,
+ "learning_rate": 9.255422985081426e-06,
+ "loss": 0.138,
+ "step": 19745
+ },
+ {
+ "epoch": 53.80381471389646,
+ "grad_norm": 5.078512191772461,
+ "learning_rate": 9.254542942998921e-06,
+ "loss": 0.1813,
+ "step": 19746
+ },
+ {
+ "epoch": 53.80653950953678,
+ "grad_norm": 4.038086891174316,
+ "learning_rate": 9.253662906722013e-06,
+ "loss": 0.1659,
+ "step": 19747
+ },
+ {
+ "epoch": 53.80926430517711,
+ "grad_norm": 5.574167251586914,
+ "learning_rate": 9.25278287625755e-06,
+ "loss": 0.1189,
+ "step": 19748
+ },
+ {
+ "epoch": 53.81198910081744,
+ "grad_norm": 4.144851207733154,
+ "learning_rate": 9.251902851612394e-06,
+ "loss": 0.1833,
+ "step": 19749
+ },
+ {
+ "epoch": 53.81471389645777,
+ "grad_norm": 5.024191379547119,
+ "learning_rate": 9.251022832793392e-06,
+ "loss": 0.1893,
+ "step": 19750
+ },
+ {
+ "epoch": 53.817438692098094,
+ "grad_norm": 3.9611613750457764,
+ "learning_rate": 9.250142819807402e-06,
+ "loss": 0.1355,
+ "step": 19751
+ },
+ {
+ "epoch": 53.82016348773842,
+ "grad_norm": 3.462373733520508,
+ "learning_rate": 9.249262812661273e-06,
+ "loss": 0.2155,
+ "step": 19752
+ },
+ {
+ "epoch": 53.822888283378745,
+ "grad_norm": 7.335973739624023,
+ "learning_rate": 9.248382811361864e-06,
+ "loss": 0.1384,
+ "step": 19753
+ },
+ {
+ "epoch": 53.82561307901907,
+ "grad_norm": 6.353860855102539,
+ "learning_rate": 9.247502815916023e-06,
+ "loss": 0.1822,
+ "step": 19754
+ },
+ {
+ "epoch": 53.828337874659404,
+ "grad_norm": 8.818236351013184,
+ "learning_rate": 9.246622826330607e-06,
+ "loss": 0.079,
+ "step": 19755
+ },
+ {
+ "epoch": 53.83106267029973,
+ "grad_norm": 4.357721328735352,
+ "learning_rate": 9.245742842612467e-06,
+ "loss": 0.1023,
+ "step": 19756
+ },
+ {
+ "epoch": 53.833787465940055,
+ "grad_norm": 4.350984573364258,
+ "learning_rate": 9.24486286476846e-06,
+ "loss": 0.1995,
+ "step": 19757
+ },
+ {
+ "epoch": 53.83651226158038,
+ "grad_norm": 5.060369968414307,
+ "learning_rate": 9.243982892805434e-06,
+ "loss": 0.197,
+ "step": 19758
+ },
+ {
+ "epoch": 53.83923705722071,
+ "grad_norm": 4.583494186401367,
+ "learning_rate": 9.243102926730247e-06,
+ "loss": 0.0623,
+ "step": 19759
+ },
+ {
+ "epoch": 53.84196185286103,
+ "grad_norm": 5.591639518737793,
+ "learning_rate": 9.242222966549748e-06,
+ "loss": 0.1246,
+ "step": 19760
+ },
+ {
+ "epoch": 53.844686648501366,
+ "grad_norm": 6.224551200866699,
+ "learning_rate": 9.24134301227079e-06,
+ "loss": 0.1306,
+ "step": 19761
+ },
+ {
+ "epoch": 53.84741144414169,
+ "grad_norm": 4.460511207580566,
+ "learning_rate": 9.240463063900233e-06,
+ "loss": 0.1049,
+ "step": 19762
+ },
+ {
+ "epoch": 53.85013623978202,
+ "grad_norm": 4.57638692855835,
+ "learning_rate": 9.239583121444923e-06,
+ "loss": 0.0678,
+ "step": 19763
+ },
+ {
+ "epoch": 53.85286103542234,
+ "grad_norm": 3.6189639568328857,
+ "learning_rate": 9.238703184911717e-06,
+ "loss": 0.1865,
+ "step": 19764
+ },
+ {
+ "epoch": 53.85558583106267,
+ "grad_norm": 5.947134971618652,
+ "learning_rate": 9.237823254307464e-06,
+ "loss": 0.104,
+ "step": 19765
+ },
+ {
+ "epoch": 53.858310626702995,
+ "grad_norm": 23.398439407348633,
+ "learning_rate": 9.236943329639022e-06,
+ "loss": 0.2495,
+ "step": 19766
+ },
+ {
+ "epoch": 53.86103542234333,
+ "grad_norm": 4.084773063659668,
+ "learning_rate": 9.236063410913237e-06,
+ "loss": 0.1149,
+ "step": 19767
+ },
+ {
+ "epoch": 53.86376021798365,
+ "grad_norm": 10.065081596374512,
+ "learning_rate": 9.235183498136965e-06,
+ "loss": 0.134,
+ "step": 19768
+ },
+ {
+ "epoch": 53.86648501362398,
+ "grad_norm": 3.6826155185699463,
+ "learning_rate": 9.234303591317064e-06,
+ "loss": 0.0661,
+ "step": 19769
+ },
+ {
+ "epoch": 53.869209809264305,
+ "grad_norm": 8.887621879577637,
+ "learning_rate": 9.233423690460377e-06,
+ "loss": 0.1275,
+ "step": 19770
+ },
+ {
+ "epoch": 53.87193460490463,
+ "grad_norm": 4.916548252105713,
+ "learning_rate": 9.232543795573766e-06,
+ "loss": 0.0894,
+ "step": 19771
+ },
+ {
+ "epoch": 53.87465940054496,
+ "grad_norm": 4.731387138366699,
+ "learning_rate": 9.231663906664077e-06,
+ "loss": 0.1106,
+ "step": 19772
+ },
+ {
+ "epoch": 53.87738419618529,
+ "grad_norm": 4.941989421844482,
+ "learning_rate": 9.230784023738165e-06,
+ "loss": 0.2027,
+ "step": 19773
+ },
+ {
+ "epoch": 53.880108991825615,
+ "grad_norm": 7.426902770996094,
+ "learning_rate": 9.229904146802882e-06,
+ "loss": 0.1344,
+ "step": 19774
+ },
+ {
+ "epoch": 53.88283378746594,
+ "grad_norm": 4.1482253074646,
+ "learning_rate": 9.229024275865083e-06,
+ "loss": 0.126,
+ "step": 19775
+ },
+ {
+ "epoch": 53.88555858310627,
+ "grad_norm": 6.658325672149658,
+ "learning_rate": 9.228144410931615e-06,
+ "loss": 0.2323,
+ "step": 19776
+ },
+ {
+ "epoch": 53.88828337874659,
+ "grad_norm": 4.1880269050598145,
+ "learning_rate": 9.227264552009336e-06,
+ "loss": 0.2457,
+ "step": 19777
+ },
+ {
+ "epoch": 53.89100817438692,
+ "grad_norm": 4.866042613983154,
+ "learning_rate": 9.226384699105094e-06,
+ "loss": 0.0798,
+ "step": 19778
+ },
+ {
+ "epoch": 53.89373297002725,
+ "grad_norm": 5.16387414932251,
+ "learning_rate": 9.22550485222574e-06,
+ "loss": 0.1007,
+ "step": 19779
+ },
+ {
+ "epoch": 53.89645776566758,
+ "grad_norm": 4.820022106170654,
+ "learning_rate": 9.224625011378134e-06,
+ "loss": 0.1,
+ "step": 19780
+ },
+ {
+ "epoch": 53.8991825613079,
+ "grad_norm": 4.451500415802002,
+ "learning_rate": 9.223745176569121e-06,
+ "loss": 0.0887,
+ "step": 19781
+ },
+ {
+ "epoch": 53.90190735694823,
+ "grad_norm": 5.097253799438477,
+ "learning_rate": 9.222865347805559e-06,
+ "loss": 0.1678,
+ "step": 19782
+ },
+ {
+ "epoch": 53.904632152588555,
+ "grad_norm": 5.498987197875977,
+ "learning_rate": 9.221985525094292e-06,
+ "loss": 0.0875,
+ "step": 19783
+ },
+ {
+ "epoch": 53.90735694822888,
+ "grad_norm": 4.22909688949585,
+ "learning_rate": 9.221105708442181e-06,
+ "loss": 0.1011,
+ "step": 19784
+ },
+ {
+ "epoch": 53.91008174386921,
+ "grad_norm": 3.702805280685425,
+ "learning_rate": 9.220225897856071e-06,
+ "loss": 0.0752,
+ "step": 19785
+ },
+ {
+ "epoch": 53.91280653950954,
+ "grad_norm": 5.755627632141113,
+ "learning_rate": 9.21934609334282e-06,
+ "loss": 0.1776,
+ "step": 19786
+ },
+ {
+ "epoch": 53.915531335149865,
+ "grad_norm": 6.495734214782715,
+ "learning_rate": 9.218466294909271e-06,
+ "loss": 0.1526,
+ "step": 19787
+ },
+ {
+ "epoch": 53.91825613079019,
+ "grad_norm": 4.754812717437744,
+ "learning_rate": 9.217586502562288e-06,
+ "loss": 0.1241,
+ "step": 19788
+ },
+ {
+ "epoch": 53.920980926430516,
+ "grad_norm": 5.09205436706543,
+ "learning_rate": 9.21670671630871e-06,
+ "loss": 0.1111,
+ "step": 19789
+ },
+ {
+ "epoch": 53.92370572207084,
+ "grad_norm": 3.6057493686676025,
+ "learning_rate": 9.215826936155396e-06,
+ "loss": 0.1001,
+ "step": 19790
+ },
+ {
+ "epoch": 53.926430517711175,
+ "grad_norm": 5.297196865081787,
+ "learning_rate": 9.2149471621092e-06,
+ "loss": 0.1512,
+ "step": 19791
+ },
+ {
+ "epoch": 53.9291553133515,
+ "grad_norm": 4.140446662902832,
+ "learning_rate": 9.214067394176967e-06,
+ "loss": 0.234,
+ "step": 19792
+ },
+ {
+ "epoch": 53.93188010899183,
+ "grad_norm": 3.711136817932129,
+ "learning_rate": 9.213187632365555e-06,
+ "loss": 0.1779,
+ "step": 19793
+ },
+ {
+ "epoch": 53.93460490463215,
+ "grad_norm": 3.979206085205078,
+ "learning_rate": 9.212307876681808e-06,
+ "loss": 0.1441,
+ "step": 19794
+ },
+ {
+ "epoch": 53.93732970027248,
+ "grad_norm": 4.640681743621826,
+ "learning_rate": 9.211428127132587e-06,
+ "loss": 0.0766,
+ "step": 19795
+ },
+ {
+ "epoch": 53.940054495912804,
+ "grad_norm": 5.542065620422363,
+ "learning_rate": 9.210548383724732e-06,
+ "loss": 0.0915,
+ "step": 19796
+ },
+ {
+ "epoch": 53.94277929155314,
+ "grad_norm": 3.4548604488372803,
+ "learning_rate": 9.209668646465103e-06,
+ "loss": 0.1297,
+ "step": 19797
+ },
+ {
+ "epoch": 53.94550408719346,
+ "grad_norm": 6.724388599395752,
+ "learning_rate": 9.208788915360552e-06,
+ "loss": 0.1034,
+ "step": 19798
+ },
+ {
+ "epoch": 53.94822888283379,
+ "grad_norm": 4.6330718994140625,
+ "learning_rate": 9.207909190417924e-06,
+ "loss": 0.2641,
+ "step": 19799
+ },
+ {
+ "epoch": 53.950953678474114,
+ "grad_norm": 4.715029716491699,
+ "learning_rate": 9.207029471644077e-06,
+ "loss": 0.298,
+ "step": 19800
+ },
+ {
+ "epoch": 53.95367847411444,
+ "grad_norm": 5.032526016235352,
+ "learning_rate": 9.206149759045859e-06,
+ "loss": 0.0849,
+ "step": 19801
+ },
+ {
+ "epoch": 53.956403269754766,
+ "grad_norm": 5.344160556793213,
+ "learning_rate": 9.20527005263012e-06,
+ "loss": 0.1629,
+ "step": 19802
+ },
+ {
+ "epoch": 53.95912806539509,
+ "grad_norm": 4.603373050689697,
+ "learning_rate": 9.204390352403711e-06,
+ "loss": 0.1553,
+ "step": 19803
+ },
+ {
+ "epoch": 53.961852861035425,
+ "grad_norm": 6.133690357208252,
+ "learning_rate": 9.203510658373487e-06,
+ "loss": 0.1337,
+ "step": 19804
+ },
+ {
+ "epoch": 53.96457765667575,
+ "grad_norm": 5.43211030960083,
+ "learning_rate": 9.202630970546293e-06,
+ "loss": 0.0983,
+ "step": 19805
+ },
+ {
+ "epoch": 53.967302452316076,
+ "grad_norm": 4.266453742980957,
+ "learning_rate": 9.201751288928988e-06,
+ "loss": 0.0805,
+ "step": 19806
+ },
+ {
+ "epoch": 53.9700272479564,
+ "grad_norm": 4.697748184204102,
+ "learning_rate": 9.200871613528414e-06,
+ "loss": 0.166,
+ "step": 19807
+ },
+ {
+ "epoch": 53.97275204359673,
+ "grad_norm": 4.268434047698975,
+ "learning_rate": 9.19999194435143e-06,
+ "loss": 0.0804,
+ "step": 19808
+ },
+ {
+ "epoch": 53.97547683923706,
+ "grad_norm": 3.7529213428497314,
+ "learning_rate": 9.199112281404878e-06,
+ "loss": 0.1446,
+ "step": 19809
+ },
+ {
+ "epoch": 53.97820163487739,
+ "grad_norm": 4.701591968536377,
+ "learning_rate": 9.198232624695618e-06,
+ "loss": 0.1803,
+ "step": 19810
+ },
+ {
+ "epoch": 53.98092643051771,
+ "grad_norm": 5.256634712219238,
+ "learning_rate": 9.197352974230494e-06,
+ "loss": 0.2383,
+ "step": 19811
+ },
+ {
+ "epoch": 53.98365122615804,
+ "grad_norm": 5.565563201904297,
+ "learning_rate": 9.196473330016361e-06,
+ "loss": 0.1864,
+ "step": 19812
+ },
+ {
+ "epoch": 53.986376021798364,
+ "grad_norm": 3.8778679370880127,
+ "learning_rate": 9.195593692060062e-06,
+ "loss": 0.1776,
+ "step": 19813
+ },
+ {
+ "epoch": 53.98910081743869,
+ "grad_norm": 4.592710494995117,
+ "learning_rate": 9.194714060368458e-06,
+ "loss": 0.1211,
+ "step": 19814
+ },
+ {
+ "epoch": 53.991825613079016,
+ "grad_norm": 3.748595714569092,
+ "learning_rate": 9.193834434948396e-06,
+ "loss": 0.1427,
+ "step": 19815
+ },
+ {
+ "epoch": 53.99455040871935,
+ "grad_norm": 5.07763147354126,
+ "learning_rate": 9.192954815806724e-06,
+ "loss": 0.0761,
+ "step": 19816
+ },
+ {
+ "epoch": 53.997275204359674,
+ "grad_norm": 4.350992679595947,
+ "learning_rate": 9.192075202950297e-06,
+ "loss": 0.0734,
+ "step": 19817
+ },
+ {
+ "epoch": 54.0,
+ "grad_norm": 4.1938629150390625,
+ "learning_rate": 9.19119559638596e-06,
+ "loss": 0.1311,
+ "step": 19818
+ },
+ {
+ "epoch": 54.002724795640326,
+ "grad_norm": 4.72659158706665,
+ "learning_rate": 9.190315996120565e-06,
+ "loss": 0.2525,
+ "step": 19819
+ },
+ {
+ "epoch": 54.00544959128065,
+ "grad_norm": 4.600130558013916,
+ "learning_rate": 9.189436402160964e-06,
+ "loss": 0.1599,
+ "step": 19820
+ },
+ {
+ "epoch": 54.00817438692098,
+ "grad_norm": 8.822296142578125,
+ "learning_rate": 9.188556814514004e-06,
+ "loss": 0.0787,
+ "step": 19821
+ },
+ {
+ "epoch": 54.01089918256131,
+ "grad_norm": 4.7953948974609375,
+ "learning_rate": 9.187677233186541e-06,
+ "loss": 0.0769,
+ "step": 19822
+ },
+ {
+ "epoch": 54.013623978201636,
+ "grad_norm": 8.404830932617188,
+ "learning_rate": 9.18679765818542e-06,
+ "loss": 0.1116,
+ "step": 19823
+ },
+ {
+ "epoch": 54.01634877384196,
+ "grad_norm": 4.598225116729736,
+ "learning_rate": 9.185918089517493e-06,
+ "loss": 0.1221,
+ "step": 19824
+ },
+ {
+ "epoch": 54.01907356948229,
+ "grad_norm": 5.0692925453186035,
+ "learning_rate": 9.18503852718961e-06,
+ "loss": 0.0839,
+ "step": 19825
+ },
+ {
+ "epoch": 54.02179836512261,
+ "grad_norm": 3.9961633682250977,
+ "learning_rate": 9.18415897120862e-06,
+ "loss": 0.0659,
+ "step": 19826
+ },
+ {
+ "epoch": 54.02452316076294,
+ "grad_norm": 5.0505523681640625,
+ "learning_rate": 9.183279421581373e-06,
+ "loss": 0.1316,
+ "step": 19827
+ },
+ {
+ "epoch": 54.02724795640327,
+ "grad_norm": 4.773257255554199,
+ "learning_rate": 9.18239987831472e-06,
+ "loss": 0.0747,
+ "step": 19828
+ },
+ {
+ "epoch": 54.0299727520436,
+ "grad_norm": 3.473534107208252,
+ "learning_rate": 9.181520341415511e-06,
+ "loss": 0.1516,
+ "step": 19829
+ },
+ {
+ "epoch": 54.032697547683924,
+ "grad_norm": 4.486723899841309,
+ "learning_rate": 9.180640810890591e-06,
+ "loss": 0.1769,
+ "step": 19830
+ },
+ {
+ "epoch": 54.03542234332425,
+ "grad_norm": 4.74202823638916,
+ "learning_rate": 9.17976128674682e-06,
+ "loss": 0.2705,
+ "step": 19831
+ },
+ {
+ "epoch": 54.038147138964575,
+ "grad_norm": 3.2471649646759033,
+ "learning_rate": 9.178881768991037e-06,
+ "loss": 0.0736,
+ "step": 19832
+ },
+ {
+ "epoch": 54.0408719346049,
+ "grad_norm": 4.45520544052124,
+ "learning_rate": 9.178002257630099e-06,
+ "loss": 0.1435,
+ "step": 19833
+ },
+ {
+ "epoch": 54.043596730245234,
+ "grad_norm": 4.415715217590332,
+ "learning_rate": 9.177122752670854e-06,
+ "loss": 0.0706,
+ "step": 19834
+ },
+ {
+ "epoch": 54.04632152588556,
+ "grad_norm": 2.955765724182129,
+ "learning_rate": 9.176243254120148e-06,
+ "loss": 0.1999,
+ "step": 19835
+ },
+ {
+ "epoch": 54.049046321525886,
+ "grad_norm": 3.835383653640747,
+ "learning_rate": 9.175363761984836e-06,
+ "loss": 0.0649,
+ "step": 19836
+ },
+ {
+ "epoch": 54.05177111716621,
+ "grad_norm": 3.48504638671875,
+ "learning_rate": 9.174484276271762e-06,
+ "loss": 0.0753,
+ "step": 19837
+ },
+ {
+ "epoch": 54.05449591280654,
+ "grad_norm": 3.7399494647979736,
+ "learning_rate": 9.17360479698778e-06,
+ "loss": 0.1064,
+ "step": 19838
+ },
+ {
+ "epoch": 54.05722070844686,
+ "grad_norm": 6.686160564422607,
+ "learning_rate": 9.172725324139735e-06,
+ "loss": 0.2414,
+ "step": 19839
+ },
+ {
+ "epoch": 54.059945504087196,
+ "grad_norm": 3.8733770847320557,
+ "learning_rate": 9.17184585773448e-06,
+ "loss": 0.2015,
+ "step": 19840
+ },
+ {
+ "epoch": 54.06267029972752,
+ "grad_norm": 3.7958931922912598,
+ "learning_rate": 9.170966397778862e-06,
+ "loss": 0.0806,
+ "step": 19841
+ },
+ {
+ "epoch": 54.06539509536785,
+ "grad_norm": 3.566927433013916,
+ "learning_rate": 9.170086944279733e-06,
+ "loss": 0.0867,
+ "step": 19842
+ },
+ {
+ "epoch": 54.06811989100817,
+ "grad_norm": 4.660705089569092,
+ "learning_rate": 9.169207497243939e-06,
+ "loss": 0.1188,
+ "step": 19843
+ },
+ {
+ "epoch": 54.0708446866485,
+ "grad_norm": 4.133790493011475,
+ "learning_rate": 9.16832805667833e-06,
+ "loss": 0.1706,
+ "step": 19844
+ },
+ {
+ "epoch": 54.073569482288825,
+ "grad_norm": 3.4390602111816406,
+ "learning_rate": 9.167448622589754e-06,
+ "loss": 0.0875,
+ "step": 19845
+ },
+ {
+ "epoch": 54.07629427792916,
+ "grad_norm": 5.287810325622559,
+ "learning_rate": 9.166569194985065e-06,
+ "loss": 0.0862,
+ "step": 19846
+ },
+ {
+ "epoch": 54.079019073569484,
+ "grad_norm": 4.312926769256592,
+ "learning_rate": 9.1656897738711e-06,
+ "loss": 0.1721,
+ "step": 19847
+ },
+ {
+ "epoch": 54.08174386920981,
+ "grad_norm": 9.076287269592285,
+ "learning_rate": 9.164810359254721e-06,
+ "loss": 0.1,
+ "step": 19848
+ },
+ {
+ "epoch": 54.084468664850135,
+ "grad_norm": 4.432627201080322,
+ "learning_rate": 9.163930951142777e-06,
+ "loss": 0.0796,
+ "step": 19849
+ },
+ {
+ "epoch": 54.08719346049046,
+ "grad_norm": 4.057800769805908,
+ "learning_rate": 9.163051549542106e-06,
+ "loss": 0.0967,
+ "step": 19850
+ },
+ {
+ "epoch": 54.08991825613079,
+ "grad_norm": 3.83794903755188,
+ "learning_rate": 9.162172154459565e-06,
+ "loss": 0.0676,
+ "step": 19851
+ },
+ {
+ "epoch": 54.09264305177112,
+ "grad_norm": 6.806939125061035,
+ "learning_rate": 9.161292765901998e-06,
+ "loss": 0.1545,
+ "step": 19852
+ },
+ {
+ "epoch": 54.095367847411445,
+ "grad_norm": 4.117062568664551,
+ "learning_rate": 9.16041338387626e-06,
+ "loss": 0.2045,
+ "step": 19853
+ },
+ {
+ "epoch": 54.09809264305177,
+ "grad_norm": 4.125771999359131,
+ "learning_rate": 9.159534008389193e-06,
+ "loss": 0.0902,
+ "step": 19854
+ },
+ {
+ "epoch": 54.1008174386921,
+ "grad_norm": 5.100405216217041,
+ "learning_rate": 9.158654639447647e-06,
+ "loss": 0.0767,
+ "step": 19855
+ },
+ {
+ "epoch": 54.10354223433242,
+ "grad_norm": 7.159243583679199,
+ "learning_rate": 9.157775277058474e-06,
+ "loss": 0.0882,
+ "step": 19856
+ },
+ {
+ "epoch": 54.10626702997275,
+ "grad_norm": 3.345010995864868,
+ "learning_rate": 9.156895921228519e-06,
+ "loss": 0.2141,
+ "step": 19857
+ },
+ {
+ "epoch": 54.10899182561308,
+ "grad_norm": 4.689110279083252,
+ "learning_rate": 9.156016571964633e-06,
+ "loss": 0.0822,
+ "step": 19858
+ },
+ {
+ "epoch": 54.11171662125341,
+ "grad_norm": 6.687030792236328,
+ "learning_rate": 9.155137229273658e-06,
+ "loss": 0.2441,
+ "step": 19859
+ },
+ {
+ "epoch": 54.11444141689373,
+ "grad_norm": 4.554111480712891,
+ "learning_rate": 9.154257893162452e-06,
+ "loss": 0.1471,
+ "step": 19860
+ },
+ {
+ "epoch": 54.11716621253406,
+ "grad_norm": 3.487919330596924,
+ "learning_rate": 9.153378563637855e-06,
+ "loss": 0.0966,
+ "step": 19861
+ },
+ {
+ "epoch": 54.119891008174385,
+ "grad_norm": 4.792840003967285,
+ "learning_rate": 9.152499240706723e-06,
+ "loss": 0.0964,
+ "step": 19862
+ },
+ {
+ "epoch": 54.12261580381471,
+ "grad_norm": 4.359868049621582,
+ "learning_rate": 9.151619924375896e-06,
+ "loss": 0.0888,
+ "step": 19863
+ },
+ {
+ "epoch": 54.12534059945504,
+ "grad_norm": 2.9529571533203125,
+ "learning_rate": 9.150740614652228e-06,
+ "loss": 0.0573,
+ "step": 19864
+ },
+ {
+ "epoch": 54.12806539509537,
+ "grad_norm": 4.3103179931640625,
+ "learning_rate": 9.149861311542559e-06,
+ "loss": 0.1637,
+ "step": 19865
+ },
+ {
+ "epoch": 54.130790190735695,
+ "grad_norm": 4.092645645141602,
+ "learning_rate": 9.148982015053746e-06,
+ "loss": 0.1923,
+ "step": 19866
+ },
+ {
+ "epoch": 54.13351498637602,
+ "grad_norm": 4.39013671875,
+ "learning_rate": 9.148102725192635e-06,
+ "loss": 0.1765,
+ "step": 19867
+ },
+ {
+ "epoch": 54.13623978201635,
+ "grad_norm": 4.031159400939941,
+ "learning_rate": 9.147223441966072e-06,
+ "loss": 0.0968,
+ "step": 19868
+ },
+ {
+ "epoch": 54.13896457765667,
+ "grad_norm": 3.996030569076538,
+ "learning_rate": 9.146344165380907e-06,
+ "loss": 0.0598,
+ "step": 19869
+ },
+ {
+ "epoch": 54.141689373297005,
+ "grad_norm": 5.097391128540039,
+ "learning_rate": 9.145464895443983e-06,
+ "loss": 0.0893,
+ "step": 19870
+ },
+ {
+ "epoch": 54.14441416893733,
+ "grad_norm": 4.223525047302246,
+ "learning_rate": 9.144585632162153e-06,
+ "loss": 0.0692,
+ "step": 19871
+ },
+ {
+ "epoch": 54.14713896457766,
+ "grad_norm": 5.750377655029297,
+ "learning_rate": 9.143706375542262e-06,
+ "loss": 0.2223,
+ "step": 19872
+ },
+ {
+ "epoch": 54.14986376021798,
+ "grad_norm": 5.008936882019043,
+ "learning_rate": 9.14282712559116e-06,
+ "loss": 0.1911,
+ "step": 19873
+ },
+ {
+ "epoch": 54.15258855585831,
+ "grad_norm": 5.459961414337158,
+ "learning_rate": 9.141947882315691e-06,
+ "loss": 0.1305,
+ "step": 19874
+ },
+ {
+ "epoch": 54.155313351498634,
+ "grad_norm": 3.7197933197021484,
+ "learning_rate": 9.141068645722705e-06,
+ "loss": 0.116,
+ "step": 19875
+ },
+ {
+ "epoch": 54.15803814713897,
+ "grad_norm": 4.223834991455078,
+ "learning_rate": 9.140189415819046e-06,
+ "loss": 0.1871,
+ "step": 19876
+ },
+ {
+ "epoch": 54.16076294277929,
+ "grad_norm": 4.812597751617432,
+ "learning_rate": 9.139310192611565e-06,
+ "loss": 0.1956,
+ "step": 19877
+ },
+ {
+ "epoch": 54.16348773841962,
+ "grad_norm": 4.515567302703857,
+ "learning_rate": 9.138430976107112e-06,
+ "loss": 0.0794,
+ "step": 19878
+ },
+ {
+ "epoch": 54.166212534059945,
+ "grad_norm": 5.7182512283325195,
+ "learning_rate": 9.137551766312528e-06,
+ "loss": 0.1091,
+ "step": 19879
+ },
+ {
+ "epoch": 54.16893732970027,
+ "grad_norm": 3.7585790157318115,
+ "learning_rate": 9.136672563234665e-06,
+ "loss": 0.1085,
+ "step": 19880
+ },
+ {
+ "epoch": 54.171662125340596,
+ "grad_norm": 3.8244426250457764,
+ "learning_rate": 9.135793366880365e-06,
+ "loss": 0.244,
+ "step": 19881
+ },
+ {
+ "epoch": 54.17438692098093,
+ "grad_norm": 5.750347137451172,
+ "learning_rate": 9.134914177256477e-06,
+ "loss": 0.0974,
+ "step": 19882
+ },
+ {
+ "epoch": 54.177111716621255,
+ "grad_norm": 4.220276832580566,
+ "learning_rate": 9.134034994369855e-06,
+ "loss": 0.1403,
+ "step": 19883
+ },
+ {
+ "epoch": 54.17983651226158,
+ "grad_norm": 3.6598060131073,
+ "learning_rate": 9.133155818227338e-06,
+ "loss": 0.0719,
+ "step": 19884
+ },
+ {
+ "epoch": 54.182561307901906,
+ "grad_norm": 4.386716365814209,
+ "learning_rate": 9.132276648835777e-06,
+ "loss": 0.1611,
+ "step": 19885
+ },
+ {
+ "epoch": 54.18528610354223,
+ "grad_norm": 3.7580742835998535,
+ "learning_rate": 9.131397486202016e-06,
+ "loss": 0.1606,
+ "step": 19886
+ },
+ {
+ "epoch": 54.18801089918256,
+ "grad_norm": 3.9836504459381104,
+ "learning_rate": 9.130518330332906e-06,
+ "loss": 0.1178,
+ "step": 19887
+ },
+ {
+ "epoch": 54.19073569482289,
+ "grad_norm": 3.4810760021209717,
+ "learning_rate": 9.129639181235287e-06,
+ "loss": 0.1179,
+ "step": 19888
+ },
+ {
+ "epoch": 54.19346049046322,
+ "grad_norm": 4.02688455581665,
+ "learning_rate": 9.128760038916014e-06,
+ "loss": 0.183,
+ "step": 19889
+ },
+ {
+ "epoch": 54.19618528610354,
+ "grad_norm": 5.134456157684326,
+ "learning_rate": 9.127880903381929e-06,
+ "loss": 0.1452,
+ "step": 19890
+ },
+ {
+ "epoch": 54.19891008174387,
+ "grad_norm": 6.035086154937744,
+ "learning_rate": 9.127001774639879e-06,
+ "loss": 0.1872,
+ "step": 19891
+ },
+ {
+ "epoch": 54.201634877384194,
+ "grad_norm": 4.073210716247559,
+ "learning_rate": 9.12612265269671e-06,
+ "loss": 0.121,
+ "step": 19892
+ },
+ {
+ "epoch": 54.20435967302452,
+ "grad_norm": 7.078280448913574,
+ "learning_rate": 9.125243537559271e-06,
+ "loss": 0.0725,
+ "step": 19893
+ },
+ {
+ "epoch": 54.20708446866485,
+ "grad_norm": 4.349194049835205,
+ "learning_rate": 9.124364429234405e-06,
+ "loss": 0.3014,
+ "step": 19894
+ },
+ {
+ "epoch": 54.20980926430518,
+ "grad_norm": 3.871732711791992,
+ "learning_rate": 9.123485327728964e-06,
+ "loss": 0.1668,
+ "step": 19895
+ },
+ {
+ "epoch": 54.212534059945504,
+ "grad_norm": 5.040707111358643,
+ "learning_rate": 9.122606233049788e-06,
+ "loss": 0.0866,
+ "step": 19896
+ },
+ {
+ "epoch": 54.21525885558583,
+ "grad_norm": 4.670590877532959,
+ "learning_rate": 9.12172714520373e-06,
+ "loss": 0.261,
+ "step": 19897
+ },
+ {
+ "epoch": 54.217983651226156,
+ "grad_norm": 3.076552152633667,
+ "learning_rate": 9.120848064197629e-06,
+ "loss": 0.0866,
+ "step": 19898
+ },
+ {
+ "epoch": 54.22070844686648,
+ "grad_norm": 4.455347061157227,
+ "learning_rate": 9.119968990038333e-06,
+ "loss": 0.0904,
+ "step": 19899
+ },
+ {
+ "epoch": 54.223433242506815,
+ "grad_norm": 5.187293529510498,
+ "learning_rate": 9.119089922732692e-06,
+ "loss": 0.0904,
+ "step": 19900
+ },
+ {
+ "epoch": 54.22615803814714,
+ "grad_norm": 4.790494441986084,
+ "learning_rate": 9.118210862287554e-06,
+ "loss": 0.2048,
+ "step": 19901
+ },
+ {
+ "epoch": 54.228882833787466,
+ "grad_norm": 4.984821319580078,
+ "learning_rate": 9.117331808709758e-06,
+ "loss": 0.1956,
+ "step": 19902
+ },
+ {
+ "epoch": 54.23160762942779,
+ "grad_norm": 5.494422912597656,
+ "learning_rate": 9.116452762006156e-06,
+ "loss": 0.196,
+ "step": 19903
+ },
+ {
+ "epoch": 54.23433242506812,
+ "grad_norm": 4.343879699707031,
+ "learning_rate": 9.11557372218359e-06,
+ "loss": 0.1167,
+ "step": 19904
+ },
+ {
+ "epoch": 54.237057220708444,
+ "grad_norm": 5.257289886474609,
+ "learning_rate": 9.114694689248908e-06,
+ "loss": 0.2315,
+ "step": 19905
+ },
+ {
+ "epoch": 54.23978201634878,
+ "grad_norm": 4.560327529907227,
+ "learning_rate": 9.113815663208954e-06,
+ "loss": 0.1373,
+ "step": 19906
+ },
+ {
+ "epoch": 54.2425068119891,
+ "grad_norm": 4.091838836669922,
+ "learning_rate": 9.112936644070577e-06,
+ "loss": 0.2889,
+ "step": 19907
+ },
+ {
+ "epoch": 54.24523160762943,
+ "grad_norm": 5.418046474456787,
+ "learning_rate": 9.11205763184062e-06,
+ "loss": 0.0983,
+ "step": 19908
+ },
+ {
+ "epoch": 54.247956403269754,
+ "grad_norm": 4.3591766357421875,
+ "learning_rate": 9.11117862652593e-06,
+ "loss": 0.0921,
+ "step": 19909
+ },
+ {
+ "epoch": 54.25068119891008,
+ "grad_norm": 3.6707077026367188,
+ "learning_rate": 9.11029962813335e-06,
+ "loss": 0.2086,
+ "step": 19910
+ },
+ {
+ "epoch": 54.253405994550405,
+ "grad_norm": 4.765595436096191,
+ "learning_rate": 9.10942063666973e-06,
+ "loss": 0.1228,
+ "step": 19911
+ },
+ {
+ "epoch": 54.25613079019074,
+ "grad_norm": 4.567806243896484,
+ "learning_rate": 9.108541652141913e-06,
+ "loss": 0.2093,
+ "step": 19912
+ },
+ {
+ "epoch": 54.258855585831064,
+ "grad_norm": 4.311723232269287,
+ "learning_rate": 9.107662674556746e-06,
+ "loss": 0.2204,
+ "step": 19913
+ },
+ {
+ "epoch": 54.26158038147139,
+ "grad_norm": 5.522973537445068,
+ "learning_rate": 9.106783703921073e-06,
+ "loss": 0.0944,
+ "step": 19914
+ },
+ {
+ "epoch": 54.264305177111716,
+ "grad_norm": 4.553855895996094,
+ "learning_rate": 9.10590474024174e-06,
+ "loss": 0.1351,
+ "step": 19915
+ },
+ {
+ "epoch": 54.26702997275204,
+ "grad_norm": 4.051435470581055,
+ "learning_rate": 9.105025783525587e-06,
+ "loss": 0.1354,
+ "step": 19916
+ },
+ {
+ "epoch": 54.26975476839237,
+ "grad_norm": 4.286976337432861,
+ "learning_rate": 9.104146833779467e-06,
+ "loss": 0.141,
+ "step": 19917
+ },
+ {
+ "epoch": 54.2724795640327,
+ "grad_norm": 4.656496524810791,
+ "learning_rate": 9.103267891010226e-06,
+ "loss": 0.116,
+ "step": 19918
+ },
+ {
+ "epoch": 54.275204359673026,
+ "grad_norm": 7.833804607391357,
+ "learning_rate": 9.102388955224703e-06,
+ "loss": 0.1368,
+ "step": 19919
+ },
+ {
+ "epoch": 54.27792915531335,
+ "grad_norm": 7.952826976776123,
+ "learning_rate": 9.101510026429747e-06,
+ "loss": 0.0883,
+ "step": 19920
+ },
+ {
+ "epoch": 54.28065395095368,
+ "grad_norm": 3.5332489013671875,
+ "learning_rate": 9.100631104632203e-06,
+ "loss": 0.1683,
+ "step": 19921
+ },
+ {
+ "epoch": 54.283378746594,
+ "grad_norm": 5.567306041717529,
+ "learning_rate": 9.099752189838912e-06,
+ "loss": 0.2112,
+ "step": 19922
+ },
+ {
+ "epoch": 54.28610354223433,
+ "grad_norm": 11.213207244873047,
+ "learning_rate": 9.098873282056726e-06,
+ "loss": 0.193,
+ "step": 19923
+ },
+ {
+ "epoch": 54.28882833787466,
+ "grad_norm": 3.878872871398926,
+ "learning_rate": 9.097994381292483e-06,
+ "loss": 0.1537,
+ "step": 19924
+ },
+ {
+ "epoch": 54.29155313351499,
+ "grad_norm": 5.20438814163208,
+ "learning_rate": 9.097115487553033e-06,
+ "loss": 0.1325,
+ "step": 19925
+ },
+ {
+ "epoch": 54.294277929155314,
+ "grad_norm": 4.002889156341553,
+ "learning_rate": 9.096236600845214e-06,
+ "loss": 0.0691,
+ "step": 19926
+ },
+ {
+ "epoch": 54.29700272479564,
+ "grad_norm": 5.819010257720947,
+ "learning_rate": 9.095357721175881e-06,
+ "loss": 0.1531,
+ "step": 19927
+ },
+ {
+ "epoch": 54.299727520435965,
+ "grad_norm": 4.930531978607178,
+ "learning_rate": 9.09447884855187e-06,
+ "loss": 0.125,
+ "step": 19928
+ },
+ {
+ "epoch": 54.30245231607629,
+ "grad_norm": 3.960874557495117,
+ "learning_rate": 9.093599982980029e-06,
+ "loss": 0.0625,
+ "step": 19929
+ },
+ {
+ "epoch": 54.305177111716624,
+ "grad_norm": 4.3878326416015625,
+ "learning_rate": 9.092721124467202e-06,
+ "loss": 0.1572,
+ "step": 19930
+ },
+ {
+ "epoch": 54.30790190735695,
+ "grad_norm": 6.021203517913818,
+ "learning_rate": 9.091842273020233e-06,
+ "loss": 0.0835,
+ "step": 19931
+ },
+ {
+ "epoch": 54.310626702997276,
+ "grad_norm": 7.436844825744629,
+ "learning_rate": 9.090963428645968e-06,
+ "loss": 0.2068,
+ "step": 19932
+ },
+ {
+ "epoch": 54.3133514986376,
+ "grad_norm": 3.2498369216918945,
+ "learning_rate": 9.090084591351247e-06,
+ "loss": 0.0638,
+ "step": 19933
+ },
+ {
+ "epoch": 54.31607629427793,
+ "grad_norm": 4.580674648284912,
+ "learning_rate": 9.089205761142923e-06,
+ "loss": 0.1088,
+ "step": 19934
+ },
+ {
+ "epoch": 54.31880108991825,
+ "grad_norm": 4.306822776794434,
+ "learning_rate": 9.088326938027832e-06,
+ "loss": 0.1295,
+ "step": 19935
+ },
+ {
+ "epoch": 54.321525885558586,
+ "grad_norm": 3.0955657958984375,
+ "learning_rate": 9.087448122012824e-06,
+ "loss": 0.3952,
+ "step": 19936
+ },
+ {
+ "epoch": 54.32425068119891,
+ "grad_norm": 3.77670955657959,
+ "learning_rate": 9.086569313104739e-06,
+ "loss": 0.1043,
+ "step": 19937
+ },
+ {
+ "epoch": 54.32697547683924,
+ "grad_norm": 17.023391723632812,
+ "learning_rate": 9.085690511310425e-06,
+ "loss": 0.1318,
+ "step": 19938
+ },
+ {
+ "epoch": 54.32970027247956,
+ "grad_norm": 4.265194416046143,
+ "learning_rate": 9.084811716636721e-06,
+ "loss": 0.0826,
+ "step": 19939
+ },
+ {
+ "epoch": 54.33242506811989,
+ "grad_norm": 3.366642475128174,
+ "learning_rate": 9.083932929090476e-06,
+ "loss": 0.1127,
+ "step": 19940
+ },
+ {
+ "epoch": 54.335149863760215,
+ "grad_norm": 4.4151201248168945,
+ "learning_rate": 9.083054148678531e-06,
+ "loss": 0.1242,
+ "step": 19941
+ },
+ {
+ "epoch": 54.33787465940055,
+ "grad_norm": 4.221611022949219,
+ "learning_rate": 9.082175375407729e-06,
+ "loss": 0.1635,
+ "step": 19942
+ },
+ {
+ "epoch": 54.34059945504087,
+ "grad_norm": 4.439167499542236,
+ "learning_rate": 9.081296609284919e-06,
+ "loss": 0.1386,
+ "step": 19943
+ },
+ {
+ "epoch": 54.3433242506812,
+ "grad_norm": 4.443729400634766,
+ "learning_rate": 9.080417850316938e-06,
+ "loss": 0.1717,
+ "step": 19944
+ },
+ {
+ "epoch": 54.346049046321525,
+ "grad_norm": 4.255154132843018,
+ "learning_rate": 9.079539098510637e-06,
+ "loss": 0.1705,
+ "step": 19945
+ },
+ {
+ "epoch": 54.34877384196185,
+ "grad_norm": 4.578707218170166,
+ "learning_rate": 9.078660353872853e-06,
+ "loss": 0.1526,
+ "step": 19946
+ },
+ {
+ "epoch": 54.35149863760218,
+ "grad_norm": 3.7247154712677,
+ "learning_rate": 9.077781616410436e-06,
+ "loss": 0.0903,
+ "step": 19947
+ },
+ {
+ "epoch": 54.35422343324251,
+ "grad_norm": 3.75530743598938,
+ "learning_rate": 9.076902886130221e-06,
+ "loss": 0.1433,
+ "step": 19948
+ },
+ {
+ "epoch": 54.356948228882835,
+ "grad_norm": 3.572218894958496,
+ "learning_rate": 9.076024163039061e-06,
+ "loss": 0.1547,
+ "step": 19949
+ },
+ {
+ "epoch": 54.35967302452316,
+ "grad_norm": 4.29448938369751,
+ "learning_rate": 9.075145447143792e-06,
+ "loss": 0.1369,
+ "step": 19950
+ },
+ {
+ "epoch": 54.36239782016349,
+ "grad_norm": 4.167031764984131,
+ "learning_rate": 9.074266738451258e-06,
+ "loss": 0.1004,
+ "step": 19951
+ },
+ {
+ "epoch": 54.36512261580381,
+ "grad_norm": 4.512342929840088,
+ "learning_rate": 9.07338803696831e-06,
+ "loss": 0.1222,
+ "step": 19952
+ },
+ {
+ "epoch": 54.36784741144414,
+ "grad_norm": 4.767820835113525,
+ "learning_rate": 9.072509342701785e-06,
+ "loss": 0.0902,
+ "step": 19953
+ },
+ {
+ "epoch": 54.37057220708447,
+ "grad_norm": 3.9609055519104004,
+ "learning_rate": 9.071630655658528e-06,
+ "loss": 0.0945,
+ "step": 19954
+ },
+ {
+ "epoch": 54.3732970027248,
+ "grad_norm": 3.627892255783081,
+ "learning_rate": 9.070751975845378e-06,
+ "loss": 0.0796,
+ "step": 19955
+ },
+ {
+ "epoch": 54.37602179836512,
+ "grad_norm": 3.317429780960083,
+ "learning_rate": 9.069873303269187e-06,
+ "loss": 0.2341,
+ "step": 19956
+ },
+ {
+ "epoch": 54.37874659400545,
+ "grad_norm": 3.9465110301971436,
+ "learning_rate": 9.068994637936789e-06,
+ "loss": 0.1977,
+ "step": 19957
+ },
+ {
+ "epoch": 54.381471389645775,
+ "grad_norm": 3.863725423812866,
+ "learning_rate": 9.068115979855033e-06,
+ "loss": 0.1488,
+ "step": 19958
+ },
+ {
+ "epoch": 54.3841961852861,
+ "grad_norm": 3.8893754482269287,
+ "learning_rate": 9.067237329030758e-06,
+ "loss": 0.1253,
+ "step": 19959
+ },
+ {
+ "epoch": 54.38692098092643,
+ "grad_norm": 3.4500949382781982,
+ "learning_rate": 9.066358685470811e-06,
+ "loss": 0.0806,
+ "step": 19960
+ },
+ {
+ "epoch": 54.38964577656676,
+ "grad_norm": 4.273351669311523,
+ "learning_rate": 9.06548004918203e-06,
+ "loss": 0.1133,
+ "step": 19961
+ },
+ {
+ "epoch": 54.392370572207085,
+ "grad_norm": 4.2101335525512695,
+ "learning_rate": 9.064601420171262e-06,
+ "loss": 0.2484,
+ "step": 19962
+ },
+ {
+ "epoch": 54.39509536784741,
+ "grad_norm": 4.323520660400391,
+ "learning_rate": 9.063722798445346e-06,
+ "loss": 0.0516,
+ "step": 19963
+ },
+ {
+ "epoch": 54.39782016348774,
+ "grad_norm": 4.718120098114014,
+ "learning_rate": 9.062844184011128e-06,
+ "loss": 0.1163,
+ "step": 19964
+ },
+ {
+ "epoch": 54.40054495912806,
+ "grad_norm": 3.932974100112915,
+ "learning_rate": 9.06196557687545e-06,
+ "loss": 0.1011,
+ "step": 19965
+ },
+ {
+ "epoch": 54.403269754768395,
+ "grad_norm": 3.1335978507995605,
+ "learning_rate": 9.061086977045151e-06,
+ "loss": 0.0983,
+ "step": 19966
+ },
+ {
+ "epoch": 54.40599455040872,
+ "grad_norm": 4.015022277832031,
+ "learning_rate": 9.06020838452708e-06,
+ "loss": 0.0814,
+ "step": 19967
+ },
+ {
+ "epoch": 54.40871934604905,
+ "grad_norm": 4.136988162994385,
+ "learning_rate": 9.059329799328071e-06,
+ "loss": 0.1075,
+ "step": 19968
+ },
+ {
+ "epoch": 54.41144414168937,
+ "grad_norm": 3.6818313598632812,
+ "learning_rate": 9.058451221454974e-06,
+ "loss": 0.087,
+ "step": 19969
+ },
+ {
+ "epoch": 54.4141689373297,
+ "grad_norm": 3.534766912460327,
+ "learning_rate": 9.057572650914631e-06,
+ "loss": 0.1218,
+ "step": 19970
+ },
+ {
+ "epoch": 54.416893732970024,
+ "grad_norm": 4.100685119628906,
+ "learning_rate": 9.05669408771388e-06,
+ "loss": 0.0897,
+ "step": 19971
+ },
+ {
+ "epoch": 54.41961852861036,
+ "grad_norm": 3.8797545433044434,
+ "learning_rate": 9.055815531859565e-06,
+ "loss": 0.113,
+ "step": 19972
+ },
+ {
+ "epoch": 54.42234332425068,
+ "grad_norm": 4.971447467803955,
+ "learning_rate": 9.054936983358528e-06,
+ "loss": 0.1782,
+ "step": 19973
+ },
+ {
+ "epoch": 54.42506811989101,
+ "grad_norm": 4.314890384674072,
+ "learning_rate": 9.054058442217613e-06,
+ "loss": 0.0845,
+ "step": 19974
+ },
+ {
+ "epoch": 54.427792915531334,
+ "grad_norm": 4.110722541809082,
+ "learning_rate": 9.053179908443658e-06,
+ "loss": 0.1403,
+ "step": 19975
+ },
+ {
+ "epoch": 54.43051771117166,
+ "grad_norm": 4.262246131896973,
+ "learning_rate": 9.05230138204351e-06,
+ "loss": 0.3095,
+ "step": 19976
+ },
+ {
+ "epoch": 54.433242506811986,
+ "grad_norm": 3.933448076248169,
+ "learning_rate": 9.051422863024006e-06,
+ "loss": 0.0857,
+ "step": 19977
+ },
+ {
+ "epoch": 54.43596730245232,
+ "grad_norm": 4.248157024383545,
+ "learning_rate": 9.050544351391992e-06,
+ "loss": 0.0955,
+ "step": 19978
+ },
+ {
+ "epoch": 54.438692098092645,
+ "grad_norm": 4.22047758102417,
+ "learning_rate": 9.049665847154307e-06,
+ "loss": 0.1916,
+ "step": 19979
+ },
+ {
+ "epoch": 54.44141689373297,
+ "grad_norm": 3.7908871173858643,
+ "learning_rate": 9.048787350317795e-06,
+ "loss": 0.257,
+ "step": 19980
+ },
+ {
+ "epoch": 54.444141689373296,
+ "grad_norm": 4.60216760635376,
+ "learning_rate": 9.047908860889295e-06,
+ "loss": 0.2006,
+ "step": 19981
+ },
+ {
+ "epoch": 54.44686648501362,
+ "grad_norm": 4.825819969177246,
+ "learning_rate": 9.047030378875652e-06,
+ "loss": 0.158,
+ "step": 19982
+ },
+ {
+ "epoch": 54.44959128065395,
+ "grad_norm": 3.4831581115722656,
+ "learning_rate": 9.046151904283703e-06,
+ "loss": 0.0746,
+ "step": 19983
+ },
+ {
+ "epoch": 54.45231607629428,
+ "grad_norm": 3.586744546890259,
+ "learning_rate": 9.045273437120294e-06,
+ "loss": 0.0596,
+ "step": 19984
+ },
+ {
+ "epoch": 54.45504087193461,
+ "grad_norm": 4.446600437164307,
+ "learning_rate": 9.04439497739226e-06,
+ "loss": 0.1326,
+ "step": 19985
+ },
+ {
+ "epoch": 54.45776566757493,
+ "grad_norm": 4.078514099121094,
+ "learning_rate": 9.043516525106452e-06,
+ "loss": 0.1062,
+ "step": 19986
+ },
+ {
+ "epoch": 54.46049046321526,
+ "grad_norm": 4.9097580909729,
+ "learning_rate": 9.042638080269705e-06,
+ "loss": 0.1133,
+ "step": 19987
+ },
+ {
+ "epoch": 54.463215258855584,
+ "grad_norm": 4.0611467361450195,
+ "learning_rate": 9.041759642888866e-06,
+ "loss": 0.0827,
+ "step": 19988
+ },
+ {
+ "epoch": 54.46594005449591,
+ "grad_norm": 4.112037181854248,
+ "learning_rate": 9.040881212970766e-06,
+ "loss": 0.1292,
+ "step": 19989
+ },
+ {
+ "epoch": 54.46866485013624,
+ "grad_norm": 4.098381996154785,
+ "learning_rate": 9.040002790522257e-06,
+ "loss": 0.1187,
+ "step": 19990
+ },
+ {
+ "epoch": 54.47138964577657,
+ "grad_norm": 3.539646863937378,
+ "learning_rate": 9.039124375550172e-06,
+ "loss": 0.1378,
+ "step": 19991
+ },
+ {
+ "epoch": 54.474114441416894,
+ "grad_norm": 4.825586318969727,
+ "learning_rate": 9.038245968061359e-06,
+ "loss": 0.0962,
+ "step": 19992
+ },
+ {
+ "epoch": 54.47683923705722,
+ "grad_norm": 5.104846477508545,
+ "learning_rate": 9.037367568062653e-06,
+ "loss": 0.1234,
+ "step": 19993
+ },
+ {
+ "epoch": 54.479564032697546,
+ "grad_norm": 4.715920925140381,
+ "learning_rate": 9.0364891755609e-06,
+ "loss": 0.1236,
+ "step": 19994
+ },
+ {
+ "epoch": 54.48228882833787,
+ "grad_norm": 7.497341156005859,
+ "learning_rate": 9.035610790562934e-06,
+ "loss": 0.226,
+ "step": 19995
+ },
+ {
+ "epoch": 54.485013623978205,
+ "grad_norm": 4.018693923950195,
+ "learning_rate": 9.034732413075603e-06,
+ "loss": 0.2543,
+ "step": 19996
+ },
+ {
+ "epoch": 54.48773841961853,
+ "grad_norm": 4.353559970855713,
+ "learning_rate": 9.033854043105743e-06,
+ "loss": 0.0858,
+ "step": 19997
+ },
+ {
+ "epoch": 54.490463215258856,
+ "grad_norm": 3.7409958839416504,
+ "learning_rate": 9.032975680660199e-06,
+ "loss": 0.0805,
+ "step": 19998
+ },
+ {
+ "epoch": 54.49318801089918,
+ "grad_norm": 7.8233137130737305,
+ "learning_rate": 9.032097325745808e-06,
+ "loss": 0.0697,
+ "step": 19999
+ },
+ {
+ "epoch": 54.49591280653951,
+ "grad_norm": 4.105851173400879,
+ "learning_rate": 9.031218978369412e-06,
+ "loss": 0.1566,
+ "step": 20000
+ },
+ {
+ "epoch": 54.49863760217983,
+ "grad_norm": 3.414713144302368,
+ "learning_rate": 9.03034063853785e-06,
+ "loss": 0.0754,
+ "step": 20001
+ },
+ {
+ "epoch": 54.50136239782017,
+ "grad_norm": 4.375031471252441,
+ "learning_rate": 9.029462306257964e-06,
+ "loss": 0.1029,
+ "step": 20002
+ },
+ {
+ "epoch": 54.50408719346049,
+ "grad_norm": 4.491516590118408,
+ "learning_rate": 9.028583981536596e-06,
+ "loss": 0.1226,
+ "step": 20003
+ },
+ {
+ "epoch": 54.50681198910082,
+ "grad_norm": 7.4483137130737305,
+ "learning_rate": 9.027705664380584e-06,
+ "loss": 0.1017,
+ "step": 20004
+ },
+ {
+ "epoch": 54.509536784741144,
+ "grad_norm": 4.860036373138428,
+ "learning_rate": 9.02682735479677e-06,
+ "loss": 0.1738,
+ "step": 20005
+ },
+ {
+ "epoch": 54.51226158038147,
+ "grad_norm": 3.863717555999756,
+ "learning_rate": 9.025949052791991e-06,
+ "loss": 0.0832,
+ "step": 20006
+ },
+ {
+ "epoch": 54.514986376021795,
+ "grad_norm": 3.6477813720703125,
+ "learning_rate": 9.02507075837309e-06,
+ "loss": 0.097,
+ "step": 20007
+ },
+ {
+ "epoch": 54.51771117166213,
+ "grad_norm": 3.176609992980957,
+ "learning_rate": 9.024192471546908e-06,
+ "loss": 0.0911,
+ "step": 20008
+ },
+ {
+ "epoch": 54.520435967302454,
+ "grad_norm": 3.793543577194214,
+ "learning_rate": 9.023314192320283e-06,
+ "loss": 0.25,
+ "step": 20009
+ },
+ {
+ "epoch": 54.52316076294278,
+ "grad_norm": 3.5359690189361572,
+ "learning_rate": 9.022435920700056e-06,
+ "loss": 0.0817,
+ "step": 20010
+ },
+ {
+ "epoch": 54.525885558583106,
+ "grad_norm": 3.758002519607544,
+ "learning_rate": 9.021557656693066e-06,
+ "loss": 0.1665,
+ "step": 20011
+ },
+ {
+ "epoch": 54.52861035422343,
+ "grad_norm": 3.602189540863037,
+ "learning_rate": 9.020679400306156e-06,
+ "loss": 0.2699,
+ "step": 20012
+ },
+ {
+ "epoch": 54.53133514986376,
+ "grad_norm": 3.8625736236572266,
+ "learning_rate": 9.019801151546158e-06,
+ "loss": 0.1331,
+ "step": 20013
+ },
+ {
+ "epoch": 54.53405994550409,
+ "grad_norm": 3.1072683334350586,
+ "learning_rate": 9.018922910419922e-06,
+ "loss": 0.0707,
+ "step": 20014
+ },
+ {
+ "epoch": 54.536784741144416,
+ "grad_norm": 4.463259220123291,
+ "learning_rate": 9.01804467693428e-06,
+ "loss": 0.1598,
+ "step": 20015
+ },
+ {
+ "epoch": 54.53950953678474,
+ "grad_norm": 3.9788694381713867,
+ "learning_rate": 9.017166451096077e-06,
+ "loss": 0.0881,
+ "step": 20016
+ },
+ {
+ "epoch": 54.54223433242507,
+ "grad_norm": 14.165175437927246,
+ "learning_rate": 9.016288232912149e-06,
+ "loss": 0.3357,
+ "step": 20017
+ },
+ {
+ "epoch": 54.54495912806539,
+ "grad_norm": 4.943851470947266,
+ "learning_rate": 9.015410022389336e-06,
+ "loss": 0.1081,
+ "step": 20018
+ },
+ {
+ "epoch": 54.54768392370572,
+ "grad_norm": 3.5630993843078613,
+ "learning_rate": 9.014531819534476e-06,
+ "loss": 0.0687,
+ "step": 20019
+ },
+ {
+ "epoch": 54.55040871934605,
+ "grad_norm": 3.5773746967315674,
+ "learning_rate": 9.013653624354412e-06,
+ "loss": 0.0726,
+ "step": 20020
+ },
+ {
+ "epoch": 54.55313351498638,
+ "grad_norm": 4.466707229614258,
+ "learning_rate": 9.012775436855983e-06,
+ "loss": 0.122,
+ "step": 20021
+ },
+ {
+ "epoch": 54.555858310626704,
+ "grad_norm": 5.6644816398620605,
+ "learning_rate": 9.011897257046025e-06,
+ "loss": 0.3513,
+ "step": 20022
+ },
+ {
+ "epoch": 54.55858310626703,
+ "grad_norm": 4.832213401794434,
+ "learning_rate": 9.011019084931383e-06,
+ "loss": 0.1543,
+ "step": 20023
+ },
+ {
+ "epoch": 54.561307901907355,
+ "grad_norm": 3.8002867698669434,
+ "learning_rate": 9.01014092051889e-06,
+ "loss": 0.087,
+ "step": 20024
+ },
+ {
+ "epoch": 54.56403269754768,
+ "grad_norm": 3.9812376499176025,
+ "learning_rate": 9.009262763815389e-06,
+ "loss": 0.1795,
+ "step": 20025
+ },
+ {
+ "epoch": 54.566757493188014,
+ "grad_norm": 6.038990497589111,
+ "learning_rate": 9.008384614827716e-06,
+ "loss": 0.0586,
+ "step": 20026
+ },
+ {
+ "epoch": 54.56948228882834,
+ "grad_norm": 3.3449394702911377,
+ "learning_rate": 9.007506473562713e-06,
+ "loss": 0.0652,
+ "step": 20027
+ },
+ {
+ "epoch": 54.572207084468666,
+ "grad_norm": 4.443698406219482,
+ "learning_rate": 9.006628340027215e-06,
+ "loss": 0.2079,
+ "step": 20028
+ },
+ {
+ "epoch": 54.57493188010899,
+ "grad_norm": 4.384361743927002,
+ "learning_rate": 9.005750214228066e-06,
+ "loss": 0.128,
+ "step": 20029
+ },
+ {
+ "epoch": 54.57765667574932,
+ "grad_norm": 4.37651252746582,
+ "learning_rate": 9.004872096172103e-06,
+ "loss": 0.1511,
+ "step": 20030
+ },
+ {
+ "epoch": 54.58038147138964,
+ "grad_norm": 4.8329267501831055,
+ "learning_rate": 9.003993985866162e-06,
+ "loss": 0.0954,
+ "step": 20031
+ },
+ {
+ "epoch": 54.583106267029976,
+ "grad_norm": 7.993609428405762,
+ "learning_rate": 9.003115883317085e-06,
+ "loss": 0.236,
+ "step": 20032
+ },
+ {
+ "epoch": 54.5858310626703,
+ "grad_norm": 4.4574174880981445,
+ "learning_rate": 9.00223778853171e-06,
+ "loss": 0.144,
+ "step": 20033
+ },
+ {
+ "epoch": 54.58855585831063,
+ "grad_norm": 3.9963061809539795,
+ "learning_rate": 9.001359701516876e-06,
+ "loss": 0.1694,
+ "step": 20034
+ },
+ {
+ "epoch": 54.59128065395095,
+ "grad_norm": 4.554906368255615,
+ "learning_rate": 9.000481622279417e-06,
+ "loss": 0.0969,
+ "step": 20035
+ },
+ {
+ "epoch": 54.59400544959128,
+ "grad_norm": 4.027370929718018,
+ "learning_rate": 8.999603550826179e-06,
+ "loss": 0.1302,
+ "step": 20036
+ },
+ {
+ "epoch": 54.596730245231605,
+ "grad_norm": 4.896831035614014,
+ "learning_rate": 8.998725487163989e-06,
+ "loss": 0.0989,
+ "step": 20037
+ },
+ {
+ "epoch": 54.59945504087194,
+ "grad_norm": 4.44710111618042,
+ "learning_rate": 8.997847431299697e-06,
+ "loss": 0.1535,
+ "step": 20038
+ },
+ {
+ "epoch": 54.60217983651226,
+ "grad_norm": 5.024483680725098,
+ "learning_rate": 8.996969383240139e-06,
+ "loss": 0.2239,
+ "step": 20039
+ },
+ {
+ "epoch": 54.60490463215259,
+ "grad_norm": 2.951127529144287,
+ "learning_rate": 8.996091342992149e-06,
+ "loss": 0.1386,
+ "step": 20040
+ },
+ {
+ "epoch": 54.607629427792915,
+ "grad_norm": 6.057160377502441,
+ "learning_rate": 8.99521331056257e-06,
+ "loss": 0.0736,
+ "step": 20041
+ },
+ {
+ "epoch": 54.61035422343324,
+ "grad_norm": 5.51812219619751,
+ "learning_rate": 8.994335285958235e-06,
+ "loss": 0.1019,
+ "step": 20042
+ },
+ {
+ "epoch": 54.61307901907357,
+ "grad_norm": 4.582193374633789,
+ "learning_rate": 8.993457269185985e-06,
+ "loss": 0.239,
+ "step": 20043
+ },
+ {
+ "epoch": 54.6158038147139,
+ "grad_norm": 4.180214881896973,
+ "learning_rate": 8.992579260252657e-06,
+ "loss": 0.2014,
+ "step": 20044
+ },
+ {
+ "epoch": 54.618528610354225,
+ "grad_norm": 5.111598014831543,
+ "learning_rate": 8.99170125916509e-06,
+ "loss": 0.1955,
+ "step": 20045
+ },
+ {
+ "epoch": 54.62125340599455,
+ "grad_norm": 4.240719318389893,
+ "learning_rate": 8.99082326593012e-06,
+ "loss": 0.1793,
+ "step": 20046
+ },
+ {
+ "epoch": 54.62397820163488,
+ "grad_norm": 3.8516135215759277,
+ "learning_rate": 8.98994528055459e-06,
+ "loss": 0.2461,
+ "step": 20047
+ },
+ {
+ "epoch": 54.6267029972752,
+ "grad_norm": 8.28837776184082,
+ "learning_rate": 8.989067303045329e-06,
+ "loss": 0.2363,
+ "step": 20048
+ },
+ {
+ "epoch": 54.62942779291553,
+ "grad_norm": 6.5025858879089355,
+ "learning_rate": 8.988189333409181e-06,
+ "loss": 0.097,
+ "step": 20049
+ },
+ {
+ "epoch": 54.63215258855586,
+ "grad_norm": 5.841561317443848,
+ "learning_rate": 8.987311371652981e-06,
+ "loss": 0.1508,
+ "step": 20050
+ },
+ {
+ "epoch": 54.63487738419619,
+ "grad_norm": 4.039793491363525,
+ "learning_rate": 8.986433417783568e-06,
+ "loss": 0.1022,
+ "step": 20051
+ },
+ {
+ "epoch": 54.63760217983651,
+ "grad_norm": 4.460607051849365,
+ "learning_rate": 8.98555547180778e-06,
+ "loss": 0.0702,
+ "step": 20052
+ },
+ {
+ "epoch": 54.64032697547684,
+ "grad_norm": 5.703071594238281,
+ "learning_rate": 8.98467753373245e-06,
+ "loss": 0.0853,
+ "step": 20053
+ },
+ {
+ "epoch": 54.643051771117165,
+ "grad_norm": 3.826636552810669,
+ "learning_rate": 8.983799603564419e-06,
+ "loss": 0.0832,
+ "step": 20054
+ },
+ {
+ "epoch": 54.64577656675749,
+ "grad_norm": 4.368951797485352,
+ "learning_rate": 8.982921681310527e-06,
+ "loss": 0.1486,
+ "step": 20055
+ },
+ {
+ "epoch": 54.64850136239782,
+ "grad_norm": 3.9449362754821777,
+ "learning_rate": 8.982043766977606e-06,
+ "loss": 0.2082,
+ "step": 20056
+ },
+ {
+ "epoch": 54.65122615803815,
+ "grad_norm": 4.87952995300293,
+ "learning_rate": 8.981165860572498e-06,
+ "loss": 0.1528,
+ "step": 20057
+ },
+ {
+ "epoch": 54.653950953678475,
+ "grad_norm": 5.293972969055176,
+ "learning_rate": 8.980287962102035e-06,
+ "loss": 0.2195,
+ "step": 20058
+ },
+ {
+ "epoch": 54.6566757493188,
+ "grad_norm": 3.0508005619049072,
+ "learning_rate": 8.979410071573059e-06,
+ "loss": 0.1929,
+ "step": 20059
+ },
+ {
+ "epoch": 54.65940054495913,
+ "grad_norm": 4.53085470199585,
+ "learning_rate": 8.978532188992403e-06,
+ "loss": 0.1281,
+ "step": 20060
+ },
+ {
+ "epoch": 54.66212534059945,
+ "grad_norm": 6.887814998626709,
+ "learning_rate": 8.977654314366906e-06,
+ "loss": 0.0915,
+ "step": 20061
+ },
+ {
+ "epoch": 54.664850136239785,
+ "grad_norm": 4.136505126953125,
+ "learning_rate": 8.976776447703402e-06,
+ "loss": 0.2221,
+ "step": 20062
+ },
+ {
+ "epoch": 54.66757493188011,
+ "grad_norm": 4.612685203552246,
+ "learning_rate": 8.975898589008734e-06,
+ "loss": 0.1751,
+ "step": 20063
+ },
+ {
+ "epoch": 54.67029972752044,
+ "grad_norm": 4.009918212890625,
+ "learning_rate": 8.975020738289732e-06,
+ "loss": 0.1879,
+ "step": 20064
+ },
+ {
+ "epoch": 54.67302452316076,
+ "grad_norm": 5.834253311157227,
+ "learning_rate": 8.974142895553237e-06,
+ "loss": 0.0889,
+ "step": 20065
+ },
+ {
+ "epoch": 54.67574931880109,
+ "grad_norm": 13.993331909179688,
+ "learning_rate": 8.973265060806083e-06,
+ "loss": 0.0889,
+ "step": 20066
+ },
+ {
+ "epoch": 54.678474114441414,
+ "grad_norm": 4.5561323165893555,
+ "learning_rate": 8.972387234055109e-06,
+ "loss": 0.0818,
+ "step": 20067
+ },
+ {
+ "epoch": 54.68119891008175,
+ "grad_norm": 3.4230246543884277,
+ "learning_rate": 8.971509415307147e-06,
+ "loss": 0.1092,
+ "step": 20068
+ },
+ {
+ "epoch": 54.68392370572207,
+ "grad_norm": 4.538247585296631,
+ "learning_rate": 8.970631604569041e-06,
+ "loss": 0.2038,
+ "step": 20069
+ },
+ {
+ "epoch": 54.6866485013624,
+ "grad_norm": 5.932735443115234,
+ "learning_rate": 8.96975380184762e-06,
+ "loss": 0.0815,
+ "step": 20070
+ },
+ {
+ "epoch": 54.689373297002724,
+ "grad_norm": 3.391663074493408,
+ "learning_rate": 8.968876007149721e-06,
+ "loss": 0.2214,
+ "step": 20071
+ },
+ {
+ "epoch": 54.69209809264305,
+ "grad_norm": 4.163836479187012,
+ "learning_rate": 8.967998220482184e-06,
+ "loss": 0.1795,
+ "step": 20072
+ },
+ {
+ "epoch": 54.694822888283376,
+ "grad_norm": 3.9255266189575195,
+ "learning_rate": 8.967120441851846e-06,
+ "loss": 0.1985,
+ "step": 20073
+ },
+ {
+ "epoch": 54.69754768392371,
+ "grad_norm": 6.915604591369629,
+ "learning_rate": 8.966242671265539e-06,
+ "loss": 0.1629,
+ "step": 20074
+ },
+ {
+ "epoch": 54.700272479564035,
+ "grad_norm": 4.429693698883057,
+ "learning_rate": 8.965364908730103e-06,
+ "loss": 0.1756,
+ "step": 20075
+ },
+ {
+ "epoch": 54.70299727520436,
+ "grad_norm": 8.323269844055176,
+ "learning_rate": 8.96448715425237e-06,
+ "loss": 0.1755,
+ "step": 20076
+ },
+ {
+ "epoch": 54.705722070844686,
+ "grad_norm": 3.622795581817627,
+ "learning_rate": 8.96360940783918e-06,
+ "loss": 0.1408,
+ "step": 20077
+ },
+ {
+ "epoch": 54.70844686648501,
+ "grad_norm": 6.326815605163574,
+ "learning_rate": 8.962731669497364e-06,
+ "loss": 0.1186,
+ "step": 20078
+ },
+ {
+ "epoch": 54.71117166212534,
+ "grad_norm": 4.19735860824585,
+ "learning_rate": 8.96185393923376e-06,
+ "loss": 0.065,
+ "step": 20079
+ },
+ {
+ "epoch": 54.71389645776567,
+ "grad_norm": 3.568211793899536,
+ "learning_rate": 8.960976217055205e-06,
+ "loss": 0.1169,
+ "step": 20080
+ },
+ {
+ "epoch": 54.716621253406,
+ "grad_norm": 5.315328598022461,
+ "learning_rate": 8.960098502968535e-06,
+ "loss": 0.1154,
+ "step": 20081
+ },
+ {
+ "epoch": 54.71934604904632,
+ "grad_norm": 4.539693832397461,
+ "learning_rate": 8.959220796980583e-06,
+ "loss": 0.1923,
+ "step": 20082
+ },
+ {
+ "epoch": 54.72207084468665,
+ "grad_norm": 3.790686845779419,
+ "learning_rate": 8.958343099098187e-06,
+ "loss": 0.1331,
+ "step": 20083
+ },
+ {
+ "epoch": 54.724795640326974,
+ "grad_norm": 4.368740558624268,
+ "learning_rate": 8.95746540932818e-06,
+ "loss": 0.0937,
+ "step": 20084
+ },
+ {
+ "epoch": 54.7275204359673,
+ "grad_norm": 5.634218692779541,
+ "learning_rate": 8.956587727677402e-06,
+ "loss": 0.1788,
+ "step": 20085
+ },
+ {
+ "epoch": 54.73024523160763,
+ "grad_norm": 4.544315814971924,
+ "learning_rate": 8.95571005415268e-06,
+ "loss": 0.21,
+ "step": 20086
+ },
+ {
+ "epoch": 54.73297002724796,
+ "grad_norm": 4.4608845710754395,
+ "learning_rate": 8.954832388760859e-06,
+ "loss": 0.1745,
+ "step": 20087
+ },
+ {
+ "epoch": 54.735694822888284,
+ "grad_norm": 4.1434831619262695,
+ "learning_rate": 8.953954731508765e-06,
+ "loss": 0.0603,
+ "step": 20088
+ },
+ {
+ "epoch": 54.73841961852861,
+ "grad_norm": 4.548007488250732,
+ "learning_rate": 8.95307708240324e-06,
+ "loss": 0.1487,
+ "step": 20089
+ },
+ {
+ "epoch": 54.741144414168936,
+ "grad_norm": 3.8979296684265137,
+ "learning_rate": 8.95219944145112e-06,
+ "loss": 0.1216,
+ "step": 20090
+ },
+ {
+ "epoch": 54.74386920980926,
+ "grad_norm": 4.369950771331787,
+ "learning_rate": 8.951321808659232e-06,
+ "loss": 0.2392,
+ "step": 20091
+ },
+ {
+ "epoch": 54.746594005449595,
+ "grad_norm": 3.8677966594696045,
+ "learning_rate": 8.950444184034422e-06,
+ "loss": 0.2513,
+ "step": 20092
+ },
+ {
+ "epoch": 54.74931880108992,
+ "grad_norm": 4.533779621124268,
+ "learning_rate": 8.949566567583514e-06,
+ "loss": 0.1116,
+ "step": 20093
+ },
+ {
+ "epoch": 54.752043596730246,
+ "grad_norm": 4.238668918609619,
+ "learning_rate": 8.948688959313348e-06,
+ "loss": 0.1522,
+ "step": 20094
+ },
+ {
+ "epoch": 54.75476839237057,
+ "grad_norm": 10.364192008972168,
+ "learning_rate": 8.947811359230762e-06,
+ "loss": 0.2108,
+ "step": 20095
+ },
+ {
+ "epoch": 54.7574931880109,
+ "grad_norm": 3.525343656539917,
+ "learning_rate": 8.946933767342584e-06,
+ "loss": 0.0685,
+ "step": 20096
+ },
+ {
+ "epoch": 54.76021798365122,
+ "grad_norm": 3.2858309745788574,
+ "learning_rate": 8.946056183655654e-06,
+ "loss": 0.0597,
+ "step": 20097
+ },
+ {
+ "epoch": 54.762942779291556,
+ "grad_norm": 4.3708977699279785,
+ "learning_rate": 8.945178608176804e-06,
+ "loss": 0.0842,
+ "step": 20098
+ },
+ {
+ "epoch": 54.76566757493188,
+ "grad_norm": 4.582279682159424,
+ "learning_rate": 8.94430104091287e-06,
+ "loss": 0.1406,
+ "step": 20099
+ },
+ {
+ "epoch": 54.76839237057221,
+ "grad_norm": 4.604583740234375,
+ "learning_rate": 8.943423481870684e-06,
+ "loss": 0.1027,
+ "step": 20100
+ },
+ {
+ "epoch": 54.771117166212534,
+ "grad_norm": 3.1620655059814453,
+ "learning_rate": 8.942545931057083e-06,
+ "loss": 0.1076,
+ "step": 20101
+ },
+ {
+ "epoch": 54.77384196185286,
+ "grad_norm": 3.718745470046997,
+ "learning_rate": 8.941668388478898e-06,
+ "loss": 0.1667,
+ "step": 20102
+ },
+ {
+ "epoch": 54.776566757493185,
+ "grad_norm": 3.7406957149505615,
+ "learning_rate": 8.940790854142967e-06,
+ "loss": 0.1095,
+ "step": 20103
+ },
+ {
+ "epoch": 54.77929155313352,
+ "grad_norm": 3.9838240146636963,
+ "learning_rate": 8.939913328056123e-06,
+ "loss": 0.1433,
+ "step": 20104
+ },
+ {
+ "epoch": 54.782016348773844,
+ "grad_norm": 3.6580402851104736,
+ "learning_rate": 8.939035810225196e-06,
+ "loss": 0.0863,
+ "step": 20105
+ },
+ {
+ "epoch": 54.78474114441417,
+ "grad_norm": 3.1197941303253174,
+ "learning_rate": 8.93815830065703e-06,
+ "loss": 0.1193,
+ "step": 20106
+ },
+ {
+ "epoch": 54.787465940054496,
+ "grad_norm": 3.9491944313049316,
+ "learning_rate": 8.937280799358449e-06,
+ "loss": 0.2518,
+ "step": 20107
+ },
+ {
+ "epoch": 54.79019073569482,
+ "grad_norm": 4.503064155578613,
+ "learning_rate": 8.936403306336294e-06,
+ "loss": 0.1006,
+ "step": 20108
+ },
+ {
+ "epoch": 54.79291553133515,
+ "grad_norm": 5.052579879760742,
+ "learning_rate": 8.935525821597393e-06,
+ "loss": 0.2372,
+ "step": 20109
+ },
+ {
+ "epoch": 54.79564032697548,
+ "grad_norm": 5.94606351852417,
+ "learning_rate": 8.934648345148586e-06,
+ "loss": 0.1735,
+ "step": 20110
+ },
+ {
+ "epoch": 54.798365122615806,
+ "grad_norm": 5.028207302093506,
+ "learning_rate": 8.933770876996701e-06,
+ "loss": 0.1473,
+ "step": 20111
+ },
+ {
+ "epoch": 54.80108991825613,
+ "grad_norm": 4.2381591796875,
+ "learning_rate": 8.932893417148574e-06,
+ "loss": 0.1469,
+ "step": 20112
+ },
+ {
+ "epoch": 54.80381471389646,
+ "grad_norm": 5.26708984375,
+ "learning_rate": 8.932015965611039e-06,
+ "loss": 0.1179,
+ "step": 20113
+ },
+ {
+ "epoch": 54.80653950953678,
+ "grad_norm": 3.5204062461853027,
+ "learning_rate": 8.931138522390932e-06,
+ "loss": 0.1249,
+ "step": 20114
+ },
+ {
+ "epoch": 54.80926430517711,
+ "grad_norm": 13.216294288635254,
+ "learning_rate": 8.93026108749508e-06,
+ "loss": 0.0952,
+ "step": 20115
+ },
+ {
+ "epoch": 54.81198910081744,
+ "grad_norm": 4.192880153656006,
+ "learning_rate": 8.92938366093032e-06,
+ "loss": 0.1293,
+ "step": 20116
+ },
+ {
+ "epoch": 54.81471389645777,
+ "grad_norm": 4.845882415771484,
+ "learning_rate": 8.928506242703487e-06,
+ "loss": 0.1374,
+ "step": 20117
+ },
+ {
+ "epoch": 54.817438692098094,
+ "grad_norm": 3.507521629333496,
+ "learning_rate": 8.927628832821414e-06,
+ "loss": 0.1211,
+ "step": 20118
+ },
+ {
+ "epoch": 54.82016348773842,
+ "grad_norm": 3.631596803665161,
+ "learning_rate": 8.926751431290932e-06,
+ "loss": 0.1978,
+ "step": 20119
+ },
+ {
+ "epoch": 54.822888283378745,
+ "grad_norm": 3.468186855316162,
+ "learning_rate": 8.925874038118874e-06,
+ "loss": 0.1683,
+ "step": 20120
+ },
+ {
+ "epoch": 54.82561307901907,
+ "grad_norm": 5.478501319885254,
+ "learning_rate": 8.924996653312078e-06,
+ "loss": 0.1497,
+ "step": 20121
+ },
+ {
+ "epoch": 54.828337874659404,
+ "grad_norm": 4.084097862243652,
+ "learning_rate": 8.92411927687737e-06,
+ "loss": 0.1836,
+ "step": 20122
+ },
+ {
+ "epoch": 54.83106267029973,
+ "grad_norm": 4.4851603507995605,
+ "learning_rate": 8.923241908821585e-06,
+ "loss": 0.097,
+ "step": 20123
+ },
+ {
+ "epoch": 54.833787465940055,
+ "grad_norm": 4.094699859619141,
+ "learning_rate": 8.92236454915156e-06,
+ "loss": 0.187,
+ "step": 20124
+ },
+ {
+ "epoch": 54.83651226158038,
+ "grad_norm": 4.169244289398193,
+ "learning_rate": 8.921487197874125e-06,
+ "loss": 0.1711,
+ "step": 20125
+ },
+ {
+ "epoch": 54.83923705722071,
+ "grad_norm": 4.472836494445801,
+ "learning_rate": 8.920609854996114e-06,
+ "loss": 0.1385,
+ "step": 20126
+ },
+ {
+ "epoch": 54.84196185286103,
+ "grad_norm": 4.887625694274902,
+ "learning_rate": 8.919732520524358e-06,
+ "loss": 0.0653,
+ "step": 20127
+ },
+ {
+ "epoch": 54.844686648501366,
+ "grad_norm": 3.731388568878174,
+ "learning_rate": 8.918855194465692e-06,
+ "loss": 0.1478,
+ "step": 20128
+ },
+ {
+ "epoch": 54.84741144414169,
+ "grad_norm": 3.4862475395202637,
+ "learning_rate": 8.917977876826944e-06,
+ "loss": 0.068,
+ "step": 20129
+ },
+ {
+ "epoch": 54.85013623978202,
+ "grad_norm": 3.36405086517334,
+ "learning_rate": 8.917100567614953e-06,
+ "loss": 0.1545,
+ "step": 20130
+ },
+ {
+ "epoch": 54.85286103542234,
+ "grad_norm": 4.44132661819458,
+ "learning_rate": 8.916223266836545e-06,
+ "loss": 0.0733,
+ "step": 20131
+ },
+ {
+ "epoch": 54.85558583106267,
+ "grad_norm": 3.3464503288269043,
+ "learning_rate": 8.915345974498555e-06,
+ "loss": 0.1082,
+ "step": 20132
+ },
+ {
+ "epoch": 54.858310626702995,
+ "grad_norm": 3.916621208190918,
+ "learning_rate": 8.914468690607817e-06,
+ "loss": 0.1018,
+ "step": 20133
+ },
+ {
+ "epoch": 54.86103542234333,
+ "grad_norm": 3.7433347702026367,
+ "learning_rate": 8.913591415171164e-06,
+ "loss": 0.2159,
+ "step": 20134
+ },
+ {
+ "epoch": 54.86376021798365,
+ "grad_norm": 4.746287822723389,
+ "learning_rate": 8.912714148195421e-06,
+ "loss": 0.0847,
+ "step": 20135
+ },
+ {
+ "epoch": 54.86648501362398,
+ "grad_norm": 3.4867773056030273,
+ "learning_rate": 8.91183688968743e-06,
+ "loss": 0.1162,
+ "step": 20136
+ },
+ {
+ "epoch": 54.869209809264305,
+ "grad_norm": 4.690593719482422,
+ "learning_rate": 8.910959639654016e-06,
+ "loss": 0.1168,
+ "step": 20137
+ },
+ {
+ "epoch": 54.87193460490463,
+ "grad_norm": 5.641656875610352,
+ "learning_rate": 8.910082398102011e-06,
+ "loss": 0.1863,
+ "step": 20138
+ },
+ {
+ "epoch": 54.87465940054496,
+ "grad_norm": 3.7166199684143066,
+ "learning_rate": 8.909205165038254e-06,
+ "loss": 0.0903,
+ "step": 20139
+ },
+ {
+ "epoch": 54.87738419618529,
+ "grad_norm": 3.8179373741149902,
+ "learning_rate": 8.908327940469566e-06,
+ "loss": 0.1289,
+ "step": 20140
+ },
+ {
+ "epoch": 54.880108991825615,
+ "grad_norm": 3.5929508209228516,
+ "learning_rate": 8.907450724402787e-06,
+ "loss": 0.2132,
+ "step": 20141
+ },
+ {
+ "epoch": 54.88283378746594,
+ "grad_norm": 4.170956611633301,
+ "learning_rate": 8.906573516844749e-06,
+ "loss": 0.0654,
+ "step": 20142
+ },
+ {
+ "epoch": 54.88555858310627,
+ "grad_norm": 5.51287841796875,
+ "learning_rate": 8.90569631780228e-06,
+ "loss": 0.3354,
+ "step": 20143
+ },
+ {
+ "epoch": 54.88828337874659,
+ "grad_norm": 4.574120044708252,
+ "learning_rate": 8.904819127282215e-06,
+ "loss": 0.1151,
+ "step": 20144
+ },
+ {
+ "epoch": 54.89100817438692,
+ "grad_norm": 4.020722389221191,
+ "learning_rate": 8.903941945291381e-06,
+ "loss": 0.0802,
+ "step": 20145
+ },
+ {
+ "epoch": 54.89373297002725,
+ "grad_norm": 4.197763442993164,
+ "learning_rate": 8.903064771836614e-06,
+ "loss": 0.0967,
+ "step": 20146
+ },
+ {
+ "epoch": 54.89645776566758,
+ "grad_norm": 4.7374138832092285,
+ "learning_rate": 8.90218760692474e-06,
+ "loss": 0.104,
+ "step": 20147
+ },
+ {
+ "epoch": 54.8991825613079,
+ "grad_norm": 4.119732856750488,
+ "learning_rate": 8.901310450562596e-06,
+ "loss": 0.1324,
+ "step": 20148
+ },
+ {
+ "epoch": 54.90190735694823,
+ "grad_norm": 4.031776428222656,
+ "learning_rate": 8.900433302757011e-06,
+ "loss": 0.1899,
+ "step": 20149
+ },
+ {
+ "epoch": 54.904632152588555,
+ "grad_norm": 3.7676784992218018,
+ "learning_rate": 8.899556163514816e-06,
+ "loss": 0.0882,
+ "step": 20150
+ },
+ {
+ "epoch": 54.90735694822888,
+ "grad_norm": 3.5313427448272705,
+ "learning_rate": 8.898679032842841e-06,
+ "loss": 0.0704,
+ "step": 20151
+ },
+ {
+ "epoch": 54.91008174386921,
+ "grad_norm": 7.0860748291015625,
+ "learning_rate": 8.89780191074792e-06,
+ "loss": 0.3893,
+ "step": 20152
+ },
+ {
+ "epoch": 54.91280653950954,
+ "grad_norm": 4.015528678894043,
+ "learning_rate": 8.89692479723688e-06,
+ "loss": 0.0862,
+ "step": 20153
+ },
+ {
+ "epoch": 54.915531335149865,
+ "grad_norm": 3.9792304039001465,
+ "learning_rate": 8.896047692316556e-06,
+ "loss": 0.0752,
+ "step": 20154
+ },
+ {
+ "epoch": 54.91825613079019,
+ "grad_norm": 4.7039794921875,
+ "learning_rate": 8.895170595993775e-06,
+ "loss": 0.0793,
+ "step": 20155
+ },
+ {
+ "epoch": 54.920980926430516,
+ "grad_norm": 3.5627522468566895,
+ "learning_rate": 8.894293508275372e-06,
+ "loss": 0.0566,
+ "step": 20156
+ },
+ {
+ "epoch": 54.92370572207084,
+ "grad_norm": 3.825472831726074,
+ "learning_rate": 8.89341642916817e-06,
+ "loss": 0.0845,
+ "step": 20157
+ },
+ {
+ "epoch": 54.926430517711175,
+ "grad_norm": 6.54740047454834,
+ "learning_rate": 8.89253935867901e-06,
+ "loss": 0.1128,
+ "step": 20158
+ },
+ {
+ "epoch": 54.9291553133515,
+ "grad_norm": 3.504307985305786,
+ "learning_rate": 8.891662296814718e-06,
+ "loss": 0.0474,
+ "step": 20159
+ },
+ {
+ "epoch": 54.93188010899183,
+ "grad_norm": 3.362431049346924,
+ "learning_rate": 8.890785243582126e-06,
+ "loss": 0.0863,
+ "step": 20160
+ },
+ {
+ "epoch": 54.93460490463215,
+ "grad_norm": 4.529660701751709,
+ "learning_rate": 8.88990819898806e-06,
+ "loss": 0.1229,
+ "step": 20161
+ },
+ {
+ "epoch": 54.93732970027248,
+ "grad_norm": 4.243590354919434,
+ "learning_rate": 8.889031163039354e-06,
+ "loss": 0.1806,
+ "step": 20162
+ },
+ {
+ "epoch": 54.940054495912804,
+ "grad_norm": 4.1471052169799805,
+ "learning_rate": 8.888154135742837e-06,
+ "loss": 0.1809,
+ "step": 20163
+ },
+ {
+ "epoch": 54.94277929155314,
+ "grad_norm": 4.807526111602783,
+ "learning_rate": 8.887277117105342e-06,
+ "loss": 0.1097,
+ "step": 20164
+ },
+ {
+ "epoch": 54.94550408719346,
+ "grad_norm": 4.902317523956299,
+ "learning_rate": 8.886400107133693e-06,
+ "loss": 0.0878,
+ "step": 20165
+ },
+ {
+ "epoch": 54.94822888283379,
+ "grad_norm": 3.7905032634735107,
+ "learning_rate": 8.885523105834728e-06,
+ "loss": 0.0941,
+ "step": 20166
+ },
+ {
+ "epoch": 54.950953678474114,
+ "grad_norm": 3.9634134769439697,
+ "learning_rate": 8.884646113215271e-06,
+ "loss": 0.1036,
+ "step": 20167
+ },
+ {
+ "epoch": 54.95367847411444,
+ "grad_norm": 3.690251588821411,
+ "learning_rate": 8.883769129282157e-06,
+ "loss": 0.1237,
+ "step": 20168
+ },
+ {
+ "epoch": 54.956403269754766,
+ "grad_norm": 3.8657050132751465,
+ "learning_rate": 8.88289215404221e-06,
+ "loss": 0.0878,
+ "step": 20169
+ },
+ {
+ "epoch": 54.95912806539509,
+ "grad_norm": 3.9786417484283447,
+ "learning_rate": 8.882015187502266e-06,
+ "loss": 0.1353,
+ "step": 20170
+ },
+ {
+ "epoch": 54.961852861035425,
+ "grad_norm": 3.9551243782043457,
+ "learning_rate": 8.881138229669148e-06,
+ "loss": 0.0948,
+ "step": 20171
+ },
+ {
+ "epoch": 54.96457765667575,
+ "grad_norm": 3.3971383571624756,
+ "learning_rate": 8.880261280549693e-06,
+ "loss": 0.0944,
+ "step": 20172
+ },
+ {
+ "epoch": 54.967302452316076,
+ "grad_norm": 3.829512119293213,
+ "learning_rate": 8.879384340150723e-06,
+ "loss": 0.0624,
+ "step": 20173
+ },
+ {
+ "epoch": 54.9700272479564,
+ "grad_norm": 3.6681878566741943,
+ "learning_rate": 8.878507408479071e-06,
+ "loss": 0.1425,
+ "step": 20174
+ },
+ {
+ "epoch": 54.97275204359673,
+ "grad_norm": 5.585506439208984,
+ "learning_rate": 8.877630485541572e-06,
+ "loss": 0.1311,
+ "step": 20175
+ },
+ {
+ "epoch": 54.97547683923706,
+ "grad_norm": 3.7614965438842773,
+ "learning_rate": 8.876753571345047e-06,
+ "loss": 0.1328,
+ "step": 20176
+ },
+ {
+ "epoch": 54.97820163487739,
+ "grad_norm": 3.8820040225982666,
+ "learning_rate": 8.875876665896332e-06,
+ "loss": 0.146,
+ "step": 20177
+ },
+ {
+ "epoch": 54.98092643051771,
+ "grad_norm": 4.194509983062744,
+ "learning_rate": 8.874999769202252e-06,
+ "loss": 0.0942,
+ "step": 20178
+ },
+ {
+ "epoch": 54.98365122615804,
+ "grad_norm": 3.0866785049438477,
+ "learning_rate": 8.874122881269638e-06,
+ "loss": 0.0562,
+ "step": 20179
+ },
+ {
+ "epoch": 54.986376021798364,
+ "grad_norm": 4.456143379211426,
+ "learning_rate": 8.873246002105318e-06,
+ "loss": 0.1501,
+ "step": 20180
+ },
+ {
+ "epoch": 54.98910081743869,
+ "grad_norm": 5.2778544425964355,
+ "learning_rate": 8.872369131716122e-06,
+ "loss": 0.1049,
+ "step": 20181
+ },
+ {
+ "epoch": 54.991825613079016,
+ "grad_norm": 4.072261333465576,
+ "learning_rate": 8.87149227010888e-06,
+ "loss": 0.0715,
+ "step": 20182
+ },
+ {
+ "epoch": 54.99455040871935,
+ "grad_norm": 4.435225963592529,
+ "learning_rate": 8.870615417290418e-06,
+ "loss": 0.1282,
+ "step": 20183
+ },
+ {
+ "epoch": 54.997275204359674,
+ "grad_norm": 7.494845390319824,
+ "learning_rate": 8.86973857326757e-06,
+ "loss": 0.3999,
+ "step": 20184
+ },
+ {
+ "epoch": 55.0,
+ "grad_norm": 3.7138309478759766,
+ "learning_rate": 8.868861738047158e-06,
+ "loss": 0.3206,
+ "step": 20185
+ },
+ {
+ "epoch": 55.002724795640326,
+ "grad_norm": 2.3504903316497803,
+ "learning_rate": 8.867984911636018e-06,
+ "loss": 0.042,
+ "step": 20186
+ },
+ {
+ "epoch": 55.00544959128065,
+ "grad_norm": 4.132227420806885,
+ "learning_rate": 8.867108094040971e-06,
+ "loss": 0.1461,
+ "step": 20187
+ },
+ {
+ "epoch": 55.00817438692098,
+ "grad_norm": 5.002457141876221,
+ "learning_rate": 8.866231285268853e-06,
+ "loss": 0.085,
+ "step": 20188
+ },
+ {
+ "epoch": 55.01089918256131,
+ "grad_norm": 3.5996875762939453,
+ "learning_rate": 8.865354485326488e-06,
+ "loss": 0.1164,
+ "step": 20189
+ },
+ {
+ "epoch": 55.013623978201636,
+ "grad_norm": 3.4471304416656494,
+ "learning_rate": 8.864477694220707e-06,
+ "loss": 0.2071,
+ "step": 20190
+ },
+ {
+ "epoch": 55.01634877384196,
+ "grad_norm": 3.784421920776367,
+ "learning_rate": 8.863600911958332e-06,
+ "loss": 0.1949,
+ "step": 20191
+ },
+ {
+ "epoch": 55.01907356948229,
+ "grad_norm": 3.1663200855255127,
+ "learning_rate": 8.862724138546199e-06,
+ "loss": 0.2372,
+ "step": 20192
+ },
+ {
+ "epoch": 55.02179836512261,
+ "grad_norm": 7.027255058288574,
+ "learning_rate": 8.861847373991137e-06,
+ "loss": 0.1854,
+ "step": 20193
+ },
+ {
+ "epoch": 55.02452316076294,
+ "grad_norm": 4.086968898773193,
+ "learning_rate": 8.860970618299969e-06,
+ "loss": 0.0725,
+ "step": 20194
+ },
+ {
+ "epoch": 55.02724795640327,
+ "grad_norm": 3.4274401664733887,
+ "learning_rate": 8.860093871479527e-06,
+ "loss": 0.1138,
+ "step": 20195
+ },
+ {
+ "epoch": 55.0299727520436,
+ "grad_norm": 4.892838954925537,
+ "learning_rate": 8.859217133536634e-06,
+ "loss": 0.086,
+ "step": 20196
+ },
+ {
+ "epoch": 55.032697547683924,
+ "grad_norm": 3.099942207336426,
+ "learning_rate": 8.858340404478125e-06,
+ "loss": 0.1526,
+ "step": 20197
+ },
+ {
+ "epoch": 55.03542234332425,
+ "grad_norm": 3.834798574447632,
+ "learning_rate": 8.857463684310822e-06,
+ "loss": 0.1158,
+ "step": 20198
+ },
+ {
+ "epoch": 55.038147138964575,
+ "grad_norm": 3.4103872776031494,
+ "learning_rate": 8.856586973041554e-06,
+ "loss": 0.1156,
+ "step": 20199
+ },
+ {
+ "epoch": 55.0408719346049,
+ "grad_norm": 3.874640703201294,
+ "learning_rate": 8.855710270677152e-06,
+ "loss": 0.0671,
+ "step": 20200
+ },
+ {
+ "epoch": 55.043596730245234,
+ "grad_norm": 3.6838603019714355,
+ "learning_rate": 8.854833577224441e-06,
+ "loss": 0.0981,
+ "step": 20201
+ },
+ {
+ "epoch": 55.04632152588556,
+ "grad_norm": 3.1662166118621826,
+ "learning_rate": 8.853956892690247e-06,
+ "loss": 0.0902,
+ "step": 20202
+ },
+ {
+ "epoch": 55.049046321525886,
+ "grad_norm": 4.34156608581543,
+ "learning_rate": 8.8530802170814e-06,
+ "loss": 0.0939,
+ "step": 20203
+ },
+ {
+ "epoch": 55.05177111716621,
+ "grad_norm": 3.8500425815582275,
+ "learning_rate": 8.852203550404733e-06,
+ "loss": 0.0719,
+ "step": 20204
+ },
+ {
+ "epoch": 55.05449591280654,
+ "grad_norm": 3.3220314979553223,
+ "learning_rate": 8.851326892667061e-06,
+ "loss": 0.1083,
+ "step": 20205
+ },
+ {
+ "epoch": 55.05722070844686,
+ "grad_norm": 4.671602725982666,
+ "learning_rate": 8.850450243875223e-06,
+ "loss": 0.186,
+ "step": 20206
+ },
+ {
+ "epoch": 55.059945504087196,
+ "grad_norm": 4.377599716186523,
+ "learning_rate": 8.849573604036037e-06,
+ "loss": 0.1742,
+ "step": 20207
+ },
+ {
+ "epoch": 55.06267029972752,
+ "grad_norm": 3.458615779876709,
+ "learning_rate": 8.84869697315634e-06,
+ "loss": 0.0964,
+ "step": 20208
+ },
+ {
+ "epoch": 55.06539509536785,
+ "grad_norm": 3.8470566272735596,
+ "learning_rate": 8.847820351242949e-06,
+ "loss": 0.0632,
+ "step": 20209
+ },
+ {
+ "epoch": 55.06811989100817,
+ "grad_norm": 4.82185173034668,
+ "learning_rate": 8.846943738302697e-06,
+ "loss": 0.0863,
+ "step": 20210
+ },
+ {
+ "epoch": 55.0708446866485,
+ "grad_norm": 3.5537400245666504,
+ "learning_rate": 8.846067134342412e-06,
+ "loss": 0.0965,
+ "step": 20211
+ },
+ {
+ "epoch": 55.073569482288825,
+ "grad_norm": 7.0138726234436035,
+ "learning_rate": 8.845190539368918e-06,
+ "loss": 0.1019,
+ "step": 20212
+ },
+ {
+ "epoch": 55.07629427792916,
+ "grad_norm": 3.815699338912964,
+ "learning_rate": 8.844313953389043e-06,
+ "loss": 0.0778,
+ "step": 20213
+ },
+ {
+ "epoch": 55.079019073569484,
+ "grad_norm": 4.912858963012695,
+ "learning_rate": 8.843437376409614e-06,
+ "loss": 0.1153,
+ "step": 20214
+ },
+ {
+ "epoch": 55.08174386920981,
+ "grad_norm": 3.5321946144104004,
+ "learning_rate": 8.842560808437459e-06,
+ "loss": 0.0825,
+ "step": 20215
+ },
+ {
+ "epoch": 55.084468664850135,
+ "grad_norm": 4.460391044616699,
+ "learning_rate": 8.841684249479399e-06,
+ "loss": 0.1036,
+ "step": 20216
+ },
+ {
+ "epoch": 55.08719346049046,
+ "grad_norm": 3.628164529800415,
+ "learning_rate": 8.840807699542269e-06,
+ "loss": 0.0758,
+ "step": 20217
+ },
+ {
+ "epoch": 55.08991825613079,
+ "grad_norm": 4.200746536254883,
+ "learning_rate": 8.839931158632889e-06,
+ "loss": 0.1253,
+ "step": 20218
+ },
+ {
+ "epoch": 55.09264305177112,
+ "grad_norm": 4.804069995880127,
+ "learning_rate": 8.83905462675809e-06,
+ "loss": 0.3142,
+ "step": 20219
+ },
+ {
+ "epoch": 55.095367847411445,
+ "grad_norm": 2.774752616882324,
+ "learning_rate": 8.838178103924694e-06,
+ "loss": 0.0545,
+ "step": 20220
+ },
+ {
+ "epoch": 55.09809264305177,
+ "grad_norm": 4.986216068267822,
+ "learning_rate": 8.83730159013953e-06,
+ "loss": 0.2886,
+ "step": 20221
+ },
+ {
+ "epoch": 55.1008174386921,
+ "grad_norm": 3.9713242053985596,
+ "learning_rate": 8.836425085409424e-06,
+ "loss": 0.0606,
+ "step": 20222
+ },
+ {
+ "epoch": 55.10354223433242,
+ "grad_norm": 3.014117479324341,
+ "learning_rate": 8.835548589741204e-06,
+ "loss": 0.0635,
+ "step": 20223
+ },
+ {
+ "epoch": 55.10626702997275,
+ "grad_norm": 3.384340763092041,
+ "learning_rate": 8.834672103141691e-06,
+ "loss": 0.2183,
+ "step": 20224
+ },
+ {
+ "epoch": 55.10899182561308,
+ "grad_norm": 4.542238235473633,
+ "learning_rate": 8.833795625617715e-06,
+ "loss": 0.1492,
+ "step": 20225
+ },
+ {
+ "epoch": 55.11171662125341,
+ "grad_norm": 5.573112487792969,
+ "learning_rate": 8.832919157176098e-06,
+ "loss": 0.2511,
+ "step": 20226
+ },
+ {
+ "epoch": 55.11444141689373,
+ "grad_norm": 4.03924560546875,
+ "learning_rate": 8.832042697823673e-06,
+ "loss": 0.1052,
+ "step": 20227
+ },
+ {
+ "epoch": 55.11716621253406,
+ "grad_norm": 3.9031364917755127,
+ "learning_rate": 8.83116624756726e-06,
+ "loss": 0.092,
+ "step": 20228
+ },
+ {
+ "epoch": 55.119891008174385,
+ "grad_norm": 4.472345352172852,
+ "learning_rate": 8.83028980641369e-06,
+ "loss": 0.1997,
+ "step": 20229
+ },
+ {
+ "epoch": 55.12261580381471,
+ "grad_norm": 3.6592280864715576,
+ "learning_rate": 8.829413374369782e-06,
+ "loss": 0.0813,
+ "step": 20230
+ },
+ {
+ "epoch": 55.12534059945504,
+ "grad_norm": 3.745520830154419,
+ "learning_rate": 8.828536951442367e-06,
+ "loss": 0.0754,
+ "step": 20231
+ },
+ {
+ "epoch": 55.12806539509537,
+ "grad_norm": 3.5315065383911133,
+ "learning_rate": 8.827660537638267e-06,
+ "loss": 0.1161,
+ "step": 20232
+ },
+ {
+ "epoch": 55.130790190735695,
+ "grad_norm": 4.480501174926758,
+ "learning_rate": 8.826784132964313e-06,
+ "loss": 0.0642,
+ "step": 20233
+ },
+ {
+ "epoch": 55.13351498637602,
+ "grad_norm": 4.230098724365234,
+ "learning_rate": 8.825907737427321e-06,
+ "loss": 0.1604,
+ "step": 20234
+ },
+ {
+ "epoch": 55.13623978201635,
+ "grad_norm": 5.051258087158203,
+ "learning_rate": 8.825031351034125e-06,
+ "loss": 0.1923,
+ "step": 20235
+ },
+ {
+ "epoch": 55.13896457765667,
+ "grad_norm": 4.391542911529541,
+ "learning_rate": 8.824154973791545e-06,
+ "loss": 0.0783,
+ "step": 20236
+ },
+ {
+ "epoch": 55.141689373297005,
+ "grad_norm": 4.71673583984375,
+ "learning_rate": 8.823278605706412e-06,
+ "loss": 0.1286,
+ "step": 20237
+ },
+ {
+ "epoch": 55.14441416893733,
+ "grad_norm": 5.092132091522217,
+ "learning_rate": 8.822402246785542e-06,
+ "loss": 0.1752,
+ "step": 20238
+ },
+ {
+ "epoch": 55.14713896457766,
+ "grad_norm": 3.5076375007629395,
+ "learning_rate": 8.82152589703577e-06,
+ "loss": 0.0689,
+ "step": 20239
+ },
+ {
+ "epoch": 55.14986376021798,
+ "grad_norm": 5.270573616027832,
+ "learning_rate": 8.820649556463913e-06,
+ "loss": 0.0711,
+ "step": 20240
+ },
+ {
+ "epoch": 55.15258855585831,
+ "grad_norm": 4.217471599578857,
+ "learning_rate": 8.819773225076803e-06,
+ "loss": 0.0764,
+ "step": 20241
+ },
+ {
+ "epoch": 55.155313351498634,
+ "grad_norm": 2.447371244430542,
+ "learning_rate": 8.818896902881257e-06,
+ "loss": 0.0484,
+ "step": 20242
+ },
+ {
+ "epoch": 55.15803814713897,
+ "grad_norm": 4.374931335449219,
+ "learning_rate": 8.818020589884103e-06,
+ "loss": 0.2461,
+ "step": 20243
+ },
+ {
+ "epoch": 55.16076294277929,
+ "grad_norm": 2.9120328426361084,
+ "learning_rate": 8.817144286092167e-06,
+ "loss": 0.1152,
+ "step": 20244
+ },
+ {
+ "epoch": 55.16348773841962,
+ "grad_norm": 4.129950046539307,
+ "learning_rate": 8.816267991512277e-06,
+ "loss": 0.1396,
+ "step": 20245
+ },
+ {
+ "epoch": 55.166212534059945,
+ "grad_norm": 27.105342864990234,
+ "learning_rate": 8.815391706151252e-06,
+ "loss": 0.1394,
+ "step": 20246
+ },
+ {
+ "epoch": 55.16893732970027,
+ "grad_norm": 8.449474334716797,
+ "learning_rate": 8.81451543001592e-06,
+ "loss": 0.1023,
+ "step": 20247
+ },
+ {
+ "epoch": 55.171662125340596,
+ "grad_norm": 3.819932222366333,
+ "learning_rate": 8.8136391631131e-06,
+ "loss": 0.1099,
+ "step": 20248
+ },
+ {
+ "epoch": 55.17438692098093,
+ "grad_norm": 3.9747045040130615,
+ "learning_rate": 8.812762905449624e-06,
+ "loss": 0.1669,
+ "step": 20249
+ },
+ {
+ "epoch": 55.177111716621255,
+ "grad_norm": 3.383382797241211,
+ "learning_rate": 8.81188665703231e-06,
+ "loss": 0.1389,
+ "step": 20250
+ },
+ {
+ "epoch": 55.17983651226158,
+ "grad_norm": 4.292916774749756,
+ "learning_rate": 8.811010417867987e-06,
+ "loss": 0.0666,
+ "step": 20251
+ },
+ {
+ "epoch": 55.182561307901906,
+ "grad_norm": 4.522629737854004,
+ "learning_rate": 8.810134187963472e-06,
+ "loss": 0.1429,
+ "step": 20252
+ },
+ {
+ "epoch": 55.18528610354223,
+ "grad_norm": 5.1233015060424805,
+ "learning_rate": 8.809257967325598e-06,
+ "loss": 0.1429,
+ "step": 20253
+ },
+ {
+ "epoch": 55.18801089918256,
+ "grad_norm": 7.660608291625977,
+ "learning_rate": 8.808381755961183e-06,
+ "loss": 0.107,
+ "step": 20254
+ },
+ {
+ "epoch": 55.19073569482289,
+ "grad_norm": 5.419578552246094,
+ "learning_rate": 8.807505553877054e-06,
+ "loss": 0.2346,
+ "step": 20255
+ },
+ {
+ "epoch": 55.19346049046322,
+ "grad_norm": 4.0470757484436035,
+ "learning_rate": 8.80662936108003e-06,
+ "loss": 0.1617,
+ "step": 20256
+ },
+ {
+ "epoch": 55.19618528610354,
+ "grad_norm": 4.291471481323242,
+ "learning_rate": 8.805753177576942e-06,
+ "loss": 0.055,
+ "step": 20257
+ },
+ {
+ "epoch": 55.19891008174387,
+ "grad_norm": 3.448298454284668,
+ "learning_rate": 8.804877003374606e-06,
+ "loss": 0.0694,
+ "step": 20258
+ },
+ {
+ "epoch": 55.201634877384194,
+ "grad_norm": 3.65120005607605,
+ "learning_rate": 8.804000838479853e-06,
+ "loss": 0.1836,
+ "step": 20259
+ },
+ {
+ "epoch": 55.20435967302452,
+ "grad_norm": 3.6651101112365723,
+ "learning_rate": 8.803124682899498e-06,
+ "loss": 0.1116,
+ "step": 20260
+ },
+ {
+ "epoch": 55.20708446866485,
+ "grad_norm": 4.730973243713379,
+ "learning_rate": 8.802248536640371e-06,
+ "loss": 0.154,
+ "step": 20261
+ },
+ {
+ "epoch": 55.20980926430518,
+ "grad_norm": 3.9444150924682617,
+ "learning_rate": 8.801372399709297e-06,
+ "loss": 0.205,
+ "step": 20262
+ },
+ {
+ "epoch": 55.212534059945504,
+ "grad_norm": 4.400238037109375,
+ "learning_rate": 8.800496272113094e-06,
+ "loss": 0.1721,
+ "step": 20263
+ },
+ {
+ "epoch": 55.21525885558583,
+ "grad_norm": 4.010095596313477,
+ "learning_rate": 8.79962015385859e-06,
+ "loss": 0.1627,
+ "step": 20264
+ },
+ {
+ "epoch": 55.217983651226156,
+ "grad_norm": 5.48933219909668,
+ "learning_rate": 8.798744044952602e-06,
+ "loss": 0.1086,
+ "step": 20265
+ },
+ {
+ "epoch": 55.22070844686648,
+ "grad_norm": 5.2862548828125,
+ "learning_rate": 8.797867945401957e-06,
+ "loss": 0.1496,
+ "step": 20266
+ },
+ {
+ "epoch": 55.223433242506815,
+ "grad_norm": 4.545261383056641,
+ "learning_rate": 8.79699185521348e-06,
+ "loss": 0.084,
+ "step": 20267
+ },
+ {
+ "epoch": 55.22615803814714,
+ "grad_norm": 6.042707443237305,
+ "learning_rate": 8.79611577439399e-06,
+ "loss": 0.1042,
+ "step": 20268
+ },
+ {
+ "epoch": 55.228882833787466,
+ "grad_norm": 7.061752796173096,
+ "learning_rate": 8.795239702950314e-06,
+ "loss": 0.1304,
+ "step": 20269
+ },
+ {
+ "epoch": 55.23160762942779,
+ "grad_norm": 3.2901804447174072,
+ "learning_rate": 8.794363640889269e-06,
+ "loss": 0.2088,
+ "step": 20270
+ },
+ {
+ "epoch": 55.23433242506812,
+ "grad_norm": 8.586701393127441,
+ "learning_rate": 8.793487588217686e-06,
+ "loss": 0.127,
+ "step": 20271
+ },
+ {
+ "epoch": 55.237057220708444,
+ "grad_norm": 3.2752881050109863,
+ "learning_rate": 8.792611544942378e-06,
+ "loss": 0.2658,
+ "step": 20272
+ },
+ {
+ "epoch": 55.23978201634878,
+ "grad_norm": 3.862663984298706,
+ "learning_rate": 8.791735511070175e-06,
+ "loss": 0.0598,
+ "step": 20273
+ },
+ {
+ "epoch": 55.2425068119891,
+ "grad_norm": 4.582693576812744,
+ "learning_rate": 8.790859486607896e-06,
+ "loss": 0.1095,
+ "step": 20274
+ },
+ {
+ "epoch": 55.24523160762943,
+ "grad_norm": 4.33612060546875,
+ "learning_rate": 8.789983471562365e-06,
+ "loss": 0.1885,
+ "step": 20275
+ },
+ {
+ "epoch": 55.247956403269754,
+ "grad_norm": 4.18079137802124,
+ "learning_rate": 8.789107465940403e-06,
+ "loss": 0.0801,
+ "step": 20276
+ },
+ {
+ "epoch": 55.25068119891008,
+ "grad_norm": 3.529261589050293,
+ "learning_rate": 8.788231469748831e-06,
+ "loss": 0.3526,
+ "step": 20277
+ },
+ {
+ "epoch": 55.253405994550405,
+ "grad_norm": 4.6453657150268555,
+ "learning_rate": 8.787355482994477e-06,
+ "loss": 0.0942,
+ "step": 20278
+ },
+ {
+ "epoch": 55.25613079019074,
+ "grad_norm": 4.475424289703369,
+ "learning_rate": 8.786479505684157e-06,
+ "loss": 0.1576,
+ "step": 20279
+ },
+ {
+ "epoch": 55.258855585831064,
+ "grad_norm": 5.170428276062012,
+ "learning_rate": 8.785603537824699e-06,
+ "loss": 0.1326,
+ "step": 20280
+ },
+ {
+ "epoch": 55.26158038147139,
+ "grad_norm": 5.155692100524902,
+ "learning_rate": 8.784727579422918e-06,
+ "loss": 0.0831,
+ "step": 20281
+ },
+ {
+ "epoch": 55.264305177111716,
+ "grad_norm": 4.734813213348389,
+ "learning_rate": 8.783851630485642e-06,
+ "loss": 0.0534,
+ "step": 20282
+ },
+ {
+ "epoch": 55.26702997275204,
+ "grad_norm": 3.995192289352417,
+ "learning_rate": 8.782975691019689e-06,
+ "loss": 0.1358,
+ "step": 20283
+ },
+ {
+ "epoch": 55.26975476839237,
+ "grad_norm": 6.3889288902282715,
+ "learning_rate": 8.782099761031882e-06,
+ "loss": 0.1075,
+ "step": 20284
+ },
+ {
+ "epoch": 55.2724795640327,
+ "grad_norm": 4.618751525878906,
+ "learning_rate": 8.781223840529043e-06,
+ "loss": 0.2006,
+ "step": 20285
+ },
+ {
+ "epoch": 55.275204359673026,
+ "grad_norm": 4.445119380950928,
+ "learning_rate": 8.780347929517995e-06,
+ "loss": 0.132,
+ "step": 20286
+ },
+ {
+ "epoch": 55.27792915531335,
+ "grad_norm": 4.009746551513672,
+ "learning_rate": 8.779472028005555e-06,
+ "loss": 0.0733,
+ "step": 20287
+ },
+ {
+ "epoch": 55.28065395095368,
+ "grad_norm": 5.356363296508789,
+ "learning_rate": 8.778596135998551e-06,
+ "loss": 0.084,
+ "step": 20288
+ },
+ {
+ "epoch": 55.283378746594,
+ "grad_norm": 3.0403525829315186,
+ "learning_rate": 8.777720253503799e-06,
+ "loss": 0.1113,
+ "step": 20289
+ },
+ {
+ "epoch": 55.28610354223433,
+ "grad_norm": 4.624750137329102,
+ "learning_rate": 8.776844380528123e-06,
+ "loss": 0.157,
+ "step": 20290
+ },
+ {
+ "epoch": 55.28882833787466,
+ "grad_norm": 4.86638879776001,
+ "learning_rate": 8.775968517078343e-06,
+ "loss": 0.3833,
+ "step": 20291
+ },
+ {
+ "epoch": 55.29155313351499,
+ "grad_norm": 3.088222026824951,
+ "learning_rate": 8.77509266316128e-06,
+ "loss": 0.0966,
+ "step": 20292
+ },
+ {
+ "epoch": 55.294277929155314,
+ "grad_norm": 4.835270404815674,
+ "learning_rate": 8.774216818783758e-06,
+ "loss": 0.113,
+ "step": 20293
+ },
+ {
+ "epoch": 55.29700272479564,
+ "grad_norm": 6.672879695892334,
+ "learning_rate": 8.773340983952595e-06,
+ "loss": 0.0722,
+ "step": 20294
+ },
+ {
+ "epoch": 55.299727520435965,
+ "grad_norm": 7.032373428344727,
+ "learning_rate": 8.77246515867461e-06,
+ "loss": 0.1777,
+ "step": 20295
+ },
+ {
+ "epoch": 55.30245231607629,
+ "grad_norm": 5.144742965698242,
+ "learning_rate": 8.77158934295663e-06,
+ "loss": 0.1588,
+ "step": 20296
+ },
+ {
+ "epoch": 55.305177111716624,
+ "grad_norm": 5.2068915367126465,
+ "learning_rate": 8.770713536805471e-06,
+ "loss": 0.1146,
+ "step": 20297
+ },
+ {
+ "epoch": 55.30790190735695,
+ "grad_norm": 2.8044724464416504,
+ "learning_rate": 8.769837740227959e-06,
+ "loss": 0.0561,
+ "step": 20298
+ },
+ {
+ "epoch": 55.310626702997276,
+ "grad_norm": 5.347578525543213,
+ "learning_rate": 8.768961953230908e-06,
+ "loss": 0.0992,
+ "step": 20299
+ },
+ {
+ "epoch": 55.3133514986376,
+ "grad_norm": 4.6252970695495605,
+ "learning_rate": 8.768086175821145e-06,
+ "loss": 0.0579,
+ "step": 20300
+ },
+ {
+ "epoch": 55.31607629427793,
+ "grad_norm": 3.5642454624176025,
+ "learning_rate": 8.767210408005483e-06,
+ "loss": 0.1003,
+ "step": 20301
+ },
+ {
+ "epoch": 55.31880108991825,
+ "grad_norm": 3.8838951587677,
+ "learning_rate": 8.76633464979075e-06,
+ "loss": 0.1208,
+ "step": 20302
+ },
+ {
+ "epoch": 55.321525885558586,
+ "grad_norm": 6.521909713745117,
+ "learning_rate": 8.76545890118376e-06,
+ "loss": 0.1335,
+ "step": 20303
+ },
+ {
+ "epoch": 55.32425068119891,
+ "grad_norm": 3.353015899658203,
+ "learning_rate": 8.764583162191338e-06,
+ "loss": 0.1621,
+ "step": 20304
+ },
+ {
+ "epoch": 55.32697547683924,
+ "grad_norm": 3.9906301498413086,
+ "learning_rate": 8.763707432820303e-06,
+ "loss": 0.0857,
+ "step": 20305
+ },
+ {
+ "epoch": 55.32970027247956,
+ "grad_norm": 4.320180892944336,
+ "learning_rate": 8.762831713077475e-06,
+ "loss": 0.1162,
+ "step": 20306
+ },
+ {
+ "epoch": 55.33242506811989,
+ "grad_norm": 4.274276256561279,
+ "learning_rate": 8.761956002969672e-06,
+ "loss": 0.0848,
+ "step": 20307
+ },
+ {
+ "epoch": 55.335149863760215,
+ "grad_norm": 3.954271078109741,
+ "learning_rate": 8.761080302503718e-06,
+ "loss": 0.1116,
+ "step": 20308
+ },
+ {
+ "epoch": 55.33787465940055,
+ "grad_norm": 8.057647705078125,
+ "learning_rate": 8.760204611686429e-06,
+ "loss": 0.1377,
+ "step": 20309
+ },
+ {
+ "epoch": 55.34059945504087,
+ "grad_norm": 3.788517475128174,
+ "learning_rate": 8.759328930524628e-06,
+ "loss": 0.0685,
+ "step": 20310
+ },
+ {
+ "epoch": 55.3433242506812,
+ "grad_norm": 4.2331438064575195,
+ "learning_rate": 8.75845325902513e-06,
+ "loss": 0.0902,
+ "step": 20311
+ },
+ {
+ "epoch": 55.346049046321525,
+ "grad_norm": 5.339404582977295,
+ "learning_rate": 8.757577597194758e-06,
+ "loss": 0.1751,
+ "step": 20312
+ },
+ {
+ "epoch": 55.34877384196185,
+ "grad_norm": 5.503269672393799,
+ "learning_rate": 8.756701945040334e-06,
+ "loss": 0.1377,
+ "step": 20313
+ },
+ {
+ "epoch": 55.35149863760218,
+ "grad_norm": 4.48171329498291,
+ "learning_rate": 8.755826302568676e-06,
+ "loss": 0.1856,
+ "step": 20314
+ },
+ {
+ "epoch": 55.35422343324251,
+ "grad_norm": 3.3599138259887695,
+ "learning_rate": 8.754950669786602e-06,
+ "loss": 0.0976,
+ "step": 20315
+ },
+ {
+ "epoch": 55.356948228882835,
+ "grad_norm": 4.272397041320801,
+ "learning_rate": 8.754075046700934e-06,
+ "loss": 0.0889,
+ "step": 20316
+ },
+ {
+ "epoch": 55.35967302452316,
+ "grad_norm": 3.6690478324890137,
+ "learning_rate": 8.753199433318486e-06,
+ "loss": 0.0819,
+ "step": 20317
+ },
+ {
+ "epoch": 55.36239782016349,
+ "grad_norm": 5.556273460388184,
+ "learning_rate": 8.752323829646084e-06,
+ "loss": 0.1198,
+ "step": 20318
+ },
+ {
+ "epoch": 55.36512261580381,
+ "grad_norm": 6.00161075592041,
+ "learning_rate": 8.751448235690541e-06,
+ "loss": 0.2671,
+ "step": 20319
+ },
+ {
+ "epoch": 55.36784741144414,
+ "grad_norm": 4.806107044219971,
+ "learning_rate": 8.750572651458682e-06,
+ "loss": 0.1753,
+ "step": 20320
+ },
+ {
+ "epoch": 55.37057220708447,
+ "grad_norm": 4.758706569671631,
+ "learning_rate": 8.74969707695732e-06,
+ "loss": 0.0665,
+ "step": 20321
+ },
+ {
+ "epoch": 55.3732970027248,
+ "grad_norm": 4.076588153839111,
+ "learning_rate": 8.74882151219328e-06,
+ "loss": 0.0696,
+ "step": 20322
+ },
+ {
+ "epoch": 55.37602179836512,
+ "grad_norm": 4.132752418518066,
+ "learning_rate": 8.747945957173374e-06,
+ "loss": 0.1716,
+ "step": 20323
+ },
+ {
+ "epoch": 55.37874659400545,
+ "grad_norm": 4.330327987670898,
+ "learning_rate": 8.747070411904429e-06,
+ "loss": 0.088,
+ "step": 20324
+ },
+ {
+ "epoch": 55.381471389645775,
+ "grad_norm": 7.776508808135986,
+ "learning_rate": 8.746194876393255e-06,
+ "loss": 0.091,
+ "step": 20325
+ },
+ {
+ "epoch": 55.3841961852861,
+ "grad_norm": 3.777819871902466,
+ "learning_rate": 8.745319350646678e-06,
+ "loss": 0.1072,
+ "step": 20326
+ },
+ {
+ "epoch": 55.38692098092643,
+ "grad_norm": 4.417204856872559,
+ "learning_rate": 8.744443834671509e-06,
+ "loss": 0.1621,
+ "step": 20327
+ },
+ {
+ "epoch": 55.38964577656676,
+ "grad_norm": 4.460134983062744,
+ "learning_rate": 8.743568328474577e-06,
+ "loss": 0.0995,
+ "step": 20328
+ },
+ {
+ "epoch": 55.392370572207085,
+ "grad_norm": 2.475911855697632,
+ "learning_rate": 8.742692832062688e-06,
+ "loss": 0.0443,
+ "step": 20329
+ },
+ {
+ "epoch": 55.39509536784741,
+ "grad_norm": 4.059835433959961,
+ "learning_rate": 8.74181734544267e-06,
+ "loss": 0.0958,
+ "step": 20330
+ },
+ {
+ "epoch": 55.39782016348774,
+ "grad_norm": 6.29917049407959,
+ "learning_rate": 8.740941868621337e-06,
+ "loss": 0.1114,
+ "step": 20331
+ },
+ {
+ "epoch": 55.40054495912806,
+ "grad_norm": 4.21348237991333,
+ "learning_rate": 8.740066401605512e-06,
+ "loss": 0.1171,
+ "step": 20332
+ },
+ {
+ "epoch": 55.403269754768395,
+ "grad_norm": 4.922358512878418,
+ "learning_rate": 8.739190944402006e-06,
+ "loss": 0.2403,
+ "step": 20333
+ },
+ {
+ "epoch": 55.40599455040872,
+ "grad_norm": 4.729889869689941,
+ "learning_rate": 8.738315497017642e-06,
+ "loss": 0.128,
+ "step": 20334
+ },
+ {
+ "epoch": 55.40871934604905,
+ "grad_norm": 4.229569435119629,
+ "learning_rate": 8.737440059459234e-06,
+ "loss": 0.115,
+ "step": 20335
+ },
+ {
+ "epoch": 55.41144414168937,
+ "grad_norm": 4.083345890045166,
+ "learning_rate": 8.736564631733606e-06,
+ "loss": 0.1628,
+ "step": 20336
+ },
+ {
+ "epoch": 55.4141689373297,
+ "grad_norm": 4.032779216766357,
+ "learning_rate": 8.735689213847569e-06,
+ "loss": 0.1891,
+ "step": 20337
+ },
+ {
+ "epoch": 55.416893732970024,
+ "grad_norm": 3.4884467124938965,
+ "learning_rate": 8.734813805807944e-06,
+ "loss": 0.2137,
+ "step": 20338
+ },
+ {
+ "epoch": 55.41961852861036,
+ "grad_norm": 3.715762138366699,
+ "learning_rate": 8.73393840762155e-06,
+ "loss": 0.1797,
+ "step": 20339
+ },
+ {
+ "epoch": 55.42234332425068,
+ "grad_norm": 4.092436790466309,
+ "learning_rate": 8.733063019295202e-06,
+ "loss": 0.1081,
+ "step": 20340
+ },
+ {
+ "epoch": 55.42506811989101,
+ "grad_norm": 4.212950229644775,
+ "learning_rate": 8.732187640835718e-06,
+ "loss": 0.0681,
+ "step": 20341
+ },
+ {
+ "epoch": 55.427792915531334,
+ "grad_norm": 3.463665723800659,
+ "learning_rate": 8.731312272249916e-06,
+ "loss": 0.0773,
+ "step": 20342
+ },
+ {
+ "epoch": 55.43051771117166,
+ "grad_norm": 3.5409793853759766,
+ "learning_rate": 8.730436913544612e-06,
+ "loss": 0.1978,
+ "step": 20343
+ },
+ {
+ "epoch": 55.433242506811986,
+ "grad_norm": 4.001033782958984,
+ "learning_rate": 8.729561564726627e-06,
+ "loss": 0.1921,
+ "step": 20344
+ },
+ {
+ "epoch": 55.43596730245232,
+ "grad_norm": 4.495682239532471,
+ "learning_rate": 8.728686225802773e-06,
+ "loss": 0.1104,
+ "step": 20345
+ },
+ {
+ "epoch": 55.438692098092645,
+ "grad_norm": 5.5811967849731445,
+ "learning_rate": 8.727810896779869e-06,
+ "loss": 0.0699,
+ "step": 20346
+ },
+ {
+ "epoch": 55.44141689373297,
+ "grad_norm": 4.244899749755859,
+ "learning_rate": 8.726935577664737e-06,
+ "loss": 0.1407,
+ "step": 20347
+ },
+ {
+ "epoch": 55.444141689373296,
+ "grad_norm": 6.328291893005371,
+ "learning_rate": 8.726060268464186e-06,
+ "loss": 0.1195,
+ "step": 20348
+ },
+ {
+ "epoch": 55.44686648501362,
+ "grad_norm": 3.9155054092407227,
+ "learning_rate": 8.72518496918504e-06,
+ "loss": 0.1208,
+ "step": 20349
+ },
+ {
+ "epoch": 55.44959128065395,
+ "grad_norm": 4.084961414337158,
+ "learning_rate": 8.724309679834109e-06,
+ "loss": 0.0744,
+ "step": 20350
+ },
+ {
+ "epoch": 55.45231607629428,
+ "grad_norm": 6.089450836181641,
+ "learning_rate": 8.723434400418215e-06,
+ "loss": 0.1051,
+ "step": 20351
+ },
+ {
+ "epoch": 55.45504087193461,
+ "grad_norm": 3.64111328125,
+ "learning_rate": 8.722559130944173e-06,
+ "loss": 0.1728,
+ "step": 20352
+ },
+ {
+ "epoch": 55.45776566757493,
+ "grad_norm": 4.314663410186768,
+ "learning_rate": 8.721683871418797e-06,
+ "loss": 0.1598,
+ "step": 20353
+ },
+ {
+ "epoch": 55.46049046321526,
+ "grad_norm": 2.8920440673828125,
+ "learning_rate": 8.720808621848911e-06,
+ "loss": 0.1399,
+ "step": 20354
+ },
+ {
+ "epoch": 55.463215258855584,
+ "grad_norm": 4.880285739898682,
+ "learning_rate": 8.719933382241322e-06,
+ "loss": 0.094,
+ "step": 20355
+ },
+ {
+ "epoch": 55.46594005449591,
+ "grad_norm": 3.634341239929199,
+ "learning_rate": 8.719058152602853e-06,
+ "loss": 0.1027,
+ "step": 20356
+ },
+ {
+ "epoch": 55.46866485013624,
+ "grad_norm": 4.2444024085998535,
+ "learning_rate": 8.718182932940316e-06,
+ "loss": 0.1918,
+ "step": 20357
+ },
+ {
+ "epoch": 55.47138964577657,
+ "grad_norm": 6.068127155303955,
+ "learning_rate": 8.71730772326053e-06,
+ "loss": 0.2071,
+ "step": 20358
+ },
+ {
+ "epoch": 55.474114441416894,
+ "grad_norm": 2.986868143081665,
+ "learning_rate": 8.71643252357031e-06,
+ "loss": 0.2392,
+ "step": 20359
+ },
+ {
+ "epoch": 55.47683923705722,
+ "grad_norm": 4.797121524810791,
+ "learning_rate": 8.715557333876472e-06,
+ "loss": 0.135,
+ "step": 20360
+ },
+ {
+ "epoch": 55.479564032697546,
+ "grad_norm": 4.307587623596191,
+ "learning_rate": 8.714682154185831e-06,
+ "loss": 0.0817,
+ "step": 20361
+ },
+ {
+ "epoch": 55.48228882833787,
+ "grad_norm": 3.9596898555755615,
+ "learning_rate": 8.713806984505208e-06,
+ "loss": 0.1155,
+ "step": 20362
+ },
+ {
+ "epoch": 55.485013623978205,
+ "grad_norm": 4.114192008972168,
+ "learning_rate": 8.712931824841411e-06,
+ "loss": 0.0847,
+ "step": 20363
+ },
+ {
+ "epoch": 55.48773841961853,
+ "grad_norm": 3.0506885051727295,
+ "learning_rate": 8.712056675201257e-06,
+ "loss": 0.1047,
+ "step": 20364
+ },
+ {
+ "epoch": 55.490463215258856,
+ "grad_norm": 3.6099131107330322,
+ "learning_rate": 8.711181535591569e-06,
+ "loss": 0.0744,
+ "step": 20365
+ },
+ {
+ "epoch": 55.49318801089918,
+ "grad_norm": 4.8901591300964355,
+ "learning_rate": 8.710306406019155e-06,
+ "loss": 0.1609,
+ "step": 20366
+ },
+ {
+ "epoch": 55.49591280653951,
+ "grad_norm": 6.4215874671936035,
+ "learning_rate": 8.709431286490837e-06,
+ "loss": 0.1302,
+ "step": 20367
+ },
+ {
+ "epoch": 55.49863760217983,
+ "grad_norm": 4.286976337432861,
+ "learning_rate": 8.708556177013423e-06,
+ "loss": 0.1142,
+ "step": 20368
+ },
+ {
+ "epoch": 55.50136239782017,
+ "grad_norm": 4.187290191650391,
+ "learning_rate": 8.707681077593735e-06,
+ "loss": 0.3471,
+ "step": 20369
+ },
+ {
+ "epoch": 55.50408719346049,
+ "grad_norm": 4.669692516326904,
+ "learning_rate": 8.70680598823858e-06,
+ "loss": 0.1053,
+ "step": 20370
+ },
+ {
+ "epoch": 55.50681198910082,
+ "grad_norm": 5.98300838470459,
+ "learning_rate": 8.705930908954786e-06,
+ "loss": 0.2092,
+ "step": 20371
+ },
+ {
+ "epoch": 55.509536784741144,
+ "grad_norm": 5.066943168640137,
+ "learning_rate": 8.705055839749154e-06,
+ "loss": 0.0883,
+ "step": 20372
+ },
+ {
+ "epoch": 55.51226158038147,
+ "grad_norm": 4.160504341125488,
+ "learning_rate": 8.704180780628508e-06,
+ "loss": 0.1035,
+ "step": 20373
+ },
+ {
+ "epoch": 55.514986376021795,
+ "grad_norm": 4.330354690551758,
+ "learning_rate": 8.70330573159966e-06,
+ "loss": 0.107,
+ "step": 20374
+ },
+ {
+ "epoch": 55.51771117166213,
+ "grad_norm": 3.0367326736450195,
+ "learning_rate": 8.702430692669426e-06,
+ "loss": 0.0578,
+ "step": 20375
+ },
+ {
+ "epoch": 55.520435967302454,
+ "grad_norm": 4.381452560424805,
+ "learning_rate": 8.701555663844619e-06,
+ "loss": 0.3114,
+ "step": 20376
+ },
+ {
+ "epoch": 55.52316076294278,
+ "grad_norm": 5.92275857925415,
+ "learning_rate": 8.700680645132053e-06,
+ "loss": 0.3236,
+ "step": 20377
+ },
+ {
+ "epoch": 55.525885558583106,
+ "grad_norm": 3.6232314109802246,
+ "learning_rate": 8.699805636538548e-06,
+ "loss": 0.0894,
+ "step": 20378
+ },
+ {
+ "epoch": 55.52861035422343,
+ "grad_norm": 4.690647602081299,
+ "learning_rate": 8.698930638070913e-06,
+ "loss": 0.0753,
+ "step": 20379
+ },
+ {
+ "epoch": 55.53133514986376,
+ "grad_norm": 4.333375453948975,
+ "learning_rate": 8.698055649735964e-06,
+ "loss": 0.138,
+ "step": 20380
+ },
+ {
+ "epoch": 55.53405994550409,
+ "grad_norm": 4.587692737579346,
+ "learning_rate": 8.697180671540513e-06,
+ "loss": 0.0817,
+ "step": 20381
+ },
+ {
+ "epoch": 55.536784741144416,
+ "grad_norm": 4.031619071960449,
+ "learning_rate": 8.69630570349138e-06,
+ "loss": 0.1549,
+ "step": 20382
+ },
+ {
+ "epoch": 55.53950953678474,
+ "grad_norm": 4.475871562957764,
+ "learning_rate": 8.695430745595377e-06,
+ "loss": 0.2075,
+ "step": 20383
+ },
+ {
+ "epoch": 55.54223433242507,
+ "grad_norm": 3.520782470703125,
+ "learning_rate": 8.694555797859317e-06,
+ "loss": 0.0868,
+ "step": 20384
+ },
+ {
+ "epoch": 55.54495912806539,
+ "grad_norm": 5.136046409606934,
+ "learning_rate": 8.693680860290016e-06,
+ "loss": 0.1181,
+ "step": 20385
+ },
+ {
+ "epoch": 55.54768392370572,
+ "grad_norm": 4.102364540100098,
+ "learning_rate": 8.692805932894281e-06,
+ "loss": 0.2792,
+ "step": 20386
+ },
+ {
+ "epoch": 55.55040871934605,
+ "grad_norm": 4.081116199493408,
+ "learning_rate": 8.691931015678938e-06,
+ "loss": 0.132,
+ "step": 20387
+ },
+ {
+ "epoch": 55.55313351498638,
+ "grad_norm": 4.678136825561523,
+ "learning_rate": 8.69105610865079e-06,
+ "loss": 0.1073,
+ "step": 20388
+ },
+ {
+ "epoch": 55.555858310626704,
+ "grad_norm": 3.575960874557495,
+ "learning_rate": 8.690181211816657e-06,
+ "loss": 0.0895,
+ "step": 20389
+ },
+ {
+ "epoch": 55.55858310626703,
+ "grad_norm": 3.154576063156128,
+ "learning_rate": 8.689306325183348e-06,
+ "loss": 0.113,
+ "step": 20390
+ },
+ {
+ "epoch": 55.561307901907355,
+ "grad_norm": 3.1575584411621094,
+ "learning_rate": 8.688431448757682e-06,
+ "loss": 0.314,
+ "step": 20391
+ },
+ {
+ "epoch": 55.56403269754768,
+ "grad_norm": 3.662139892578125,
+ "learning_rate": 8.687556582546467e-06,
+ "loss": 0.1995,
+ "step": 20392
+ },
+ {
+ "epoch": 55.566757493188014,
+ "grad_norm": 4.017824172973633,
+ "learning_rate": 8.686681726556521e-06,
+ "loss": 0.2252,
+ "step": 20393
+ },
+ {
+ "epoch": 55.56948228882834,
+ "grad_norm": 5.218798637390137,
+ "learning_rate": 8.685806880794654e-06,
+ "loss": 0.1921,
+ "step": 20394
+ },
+ {
+ "epoch": 55.572207084468666,
+ "grad_norm": 4.111189365386963,
+ "learning_rate": 8.684932045267683e-06,
+ "loss": 0.1295,
+ "step": 20395
+ },
+ {
+ "epoch": 55.57493188010899,
+ "grad_norm": 3.641528367996216,
+ "learning_rate": 8.684057219982416e-06,
+ "loss": 0.0877,
+ "step": 20396
+ },
+ {
+ "epoch": 55.57765667574932,
+ "grad_norm": 5.454028129577637,
+ "learning_rate": 8.683182404945672e-06,
+ "loss": 0.1628,
+ "step": 20397
+ },
+ {
+ "epoch": 55.58038147138964,
+ "grad_norm": 3.9976165294647217,
+ "learning_rate": 8.682307600164255e-06,
+ "loss": 0.0892,
+ "step": 20398
+ },
+ {
+ "epoch": 55.583106267029976,
+ "grad_norm": 4.10651969909668,
+ "learning_rate": 8.68143280564499e-06,
+ "loss": 0.1394,
+ "step": 20399
+ },
+ {
+ "epoch": 55.5858310626703,
+ "grad_norm": 4.620141983032227,
+ "learning_rate": 8.68055802139468e-06,
+ "loss": 0.0581,
+ "step": 20400
+ },
+ {
+ "epoch": 55.58855585831063,
+ "grad_norm": 3.702589750289917,
+ "learning_rate": 8.679683247420146e-06,
+ "loss": 0.0711,
+ "step": 20401
+ },
+ {
+ "epoch": 55.59128065395095,
+ "grad_norm": 3.2625372409820557,
+ "learning_rate": 8.678808483728194e-06,
+ "loss": 0.0644,
+ "step": 20402
+ },
+ {
+ "epoch": 55.59400544959128,
+ "grad_norm": 4.552007675170898,
+ "learning_rate": 8.67793373032564e-06,
+ "loss": 0.2491,
+ "step": 20403
+ },
+ {
+ "epoch": 55.596730245231605,
+ "grad_norm": 3.1166679859161377,
+ "learning_rate": 8.677058987219294e-06,
+ "loss": 0.0956,
+ "step": 20404
+ },
+ {
+ "epoch": 55.59945504087194,
+ "grad_norm": 3.954953193664551,
+ "learning_rate": 8.676184254415973e-06,
+ "loss": 0.067,
+ "step": 20405
+ },
+ {
+ "epoch": 55.60217983651226,
+ "grad_norm": 3.1082582473754883,
+ "learning_rate": 8.675309531922484e-06,
+ "loss": 0.1931,
+ "step": 20406
+ },
+ {
+ "epoch": 55.60490463215259,
+ "grad_norm": 4.5571513175964355,
+ "learning_rate": 8.674434819745643e-06,
+ "loss": 0.1322,
+ "step": 20407
+ },
+ {
+ "epoch": 55.607629427792915,
+ "grad_norm": 5.0540571212768555,
+ "learning_rate": 8.67356011789226e-06,
+ "loss": 0.2517,
+ "step": 20408
+ },
+ {
+ "epoch": 55.61035422343324,
+ "grad_norm": 6.6033782958984375,
+ "learning_rate": 8.672685426369148e-06,
+ "loss": 0.0835,
+ "step": 20409
+ },
+ {
+ "epoch": 55.61307901907357,
+ "grad_norm": 3.401458501815796,
+ "learning_rate": 8.671810745183118e-06,
+ "loss": 0.0837,
+ "step": 20410
+ },
+ {
+ "epoch": 55.6158038147139,
+ "grad_norm": 4.99204158782959,
+ "learning_rate": 8.670936074340987e-06,
+ "loss": 0.1478,
+ "step": 20411
+ },
+ {
+ "epoch": 55.618528610354225,
+ "grad_norm": 6.409547328948975,
+ "learning_rate": 8.67006141384956e-06,
+ "loss": 0.179,
+ "step": 20412
+ },
+ {
+ "epoch": 55.62125340599455,
+ "grad_norm": 9.704611778259277,
+ "learning_rate": 8.669186763715654e-06,
+ "loss": 0.1256,
+ "step": 20413
+ },
+ {
+ "epoch": 55.62397820163488,
+ "grad_norm": 4.166541576385498,
+ "learning_rate": 8.668312123946076e-06,
+ "loss": 0.1664,
+ "step": 20414
+ },
+ {
+ "epoch": 55.6267029972752,
+ "grad_norm": 4.253971576690674,
+ "learning_rate": 8.667437494547637e-06,
+ "loss": 0.0987,
+ "step": 20415
+ },
+ {
+ "epoch": 55.62942779291553,
+ "grad_norm": 3.637429714202881,
+ "learning_rate": 8.666562875527158e-06,
+ "loss": 0.1224,
+ "step": 20416
+ },
+ {
+ "epoch": 55.63215258855586,
+ "grad_norm": 3.9984216690063477,
+ "learning_rate": 8.665688266891442e-06,
+ "loss": 0.1385,
+ "step": 20417
+ },
+ {
+ "epoch": 55.63487738419619,
+ "grad_norm": 7.363391876220703,
+ "learning_rate": 8.664813668647303e-06,
+ "loss": 0.089,
+ "step": 20418
+ },
+ {
+ "epoch": 55.63760217983651,
+ "grad_norm": 3.269890785217285,
+ "learning_rate": 8.663939080801555e-06,
+ "loss": 0.0553,
+ "step": 20419
+ },
+ {
+ "epoch": 55.64032697547684,
+ "grad_norm": 3.394165515899658,
+ "learning_rate": 8.663064503361003e-06,
+ "loss": 0.143,
+ "step": 20420
+ },
+ {
+ "epoch": 55.643051771117165,
+ "grad_norm": 4.915383338928223,
+ "learning_rate": 8.662189936332463e-06,
+ "loss": 0.1576,
+ "step": 20421
+ },
+ {
+ "epoch": 55.64577656675749,
+ "grad_norm": 4.551702499389648,
+ "learning_rate": 8.661315379722745e-06,
+ "loss": 0.1276,
+ "step": 20422
+ },
+ {
+ "epoch": 55.64850136239782,
+ "grad_norm": 6.632296085357666,
+ "learning_rate": 8.66044083353866e-06,
+ "loss": 0.1448,
+ "step": 20423
+ },
+ {
+ "epoch": 55.65122615803815,
+ "grad_norm": 3.6714444160461426,
+ "learning_rate": 8.659566297787016e-06,
+ "loss": 0.0493,
+ "step": 20424
+ },
+ {
+ "epoch": 55.653950953678475,
+ "grad_norm": 4.507234573364258,
+ "learning_rate": 8.658691772474632e-06,
+ "loss": 0.1582,
+ "step": 20425
+ },
+ {
+ "epoch": 55.6566757493188,
+ "grad_norm": 6.121192932128906,
+ "learning_rate": 8.657817257608308e-06,
+ "loss": 0.1015,
+ "step": 20426
+ },
+ {
+ "epoch": 55.65940054495913,
+ "grad_norm": 5.42222785949707,
+ "learning_rate": 8.656942753194863e-06,
+ "loss": 0.1766,
+ "step": 20427
+ },
+ {
+ "epoch": 55.66212534059945,
+ "grad_norm": 3.701658010482788,
+ "learning_rate": 8.656068259241102e-06,
+ "loss": 0.0617,
+ "step": 20428
+ },
+ {
+ "epoch": 55.664850136239785,
+ "grad_norm": 3.8383970260620117,
+ "learning_rate": 8.655193775753841e-06,
+ "loss": 0.1377,
+ "step": 20429
+ },
+ {
+ "epoch": 55.66757493188011,
+ "grad_norm": 4.109371662139893,
+ "learning_rate": 8.654319302739887e-06,
+ "loss": 0.1278,
+ "step": 20430
+ },
+ {
+ "epoch": 55.67029972752044,
+ "grad_norm": 3.5328078269958496,
+ "learning_rate": 8.65344484020605e-06,
+ "loss": 0.0901,
+ "step": 20431
+ },
+ {
+ "epoch": 55.67302452316076,
+ "grad_norm": 4.257531642913818,
+ "learning_rate": 8.652570388159139e-06,
+ "loss": 0.1675,
+ "step": 20432
+ },
+ {
+ "epoch": 55.67574931880109,
+ "grad_norm": 3.289428472518921,
+ "learning_rate": 8.651695946605967e-06,
+ "loss": 0.1157,
+ "step": 20433
+ },
+ {
+ "epoch": 55.678474114441414,
+ "grad_norm": 4.315040111541748,
+ "learning_rate": 8.650821515553347e-06,
+ "loss": 0.1814,
+ "step": 20434
+ },
+ {
+ "epoch": 55.68119891008175,
+ "grad_norm": 5.300807476043701,
+ "learning_rate": 8.649947095008083e-06,
+ "loss": 0.1745,
+ "step": 20435
+ },
+ {
+ "epoch": 55.68392370572207,
+ "grad_norm": 3.0710952281951904,
+ "learning_rate": 8.64907268497699e-06,
+ "loss": 0.1117,
+ "step": 20436
+ },
+ {
+ "epoch": 55.6866485013624,
+ "grad_norm": 3.7290239334106445,
+ "learning_rate": 8.648198285466874e-06,
+ "loss": 0.076,
+ "step": 20437
+ },
+ {
+ "epoch": 55.689373297002724,
+ "grad_norm": 4.601301193237305,
+ "learning_rate": 8.647323896484547e-06,
+ "loss": 0.2185,
+ "step": 20438
+ },
+ {
+ "epoch": 55.69209809264305,
+ "grad_norm": 4.6118550300598145,
+ "learning_rate": 8.646449518036817e-06,
+ "loss": 0.067,
+ "step": 20439
+ },
+ {
+ "epoch": 55.694822888283376,
+ "grad_norm": 4.642988204956055,
+ "learning_rate": 8.645575150130494e-06,
+ "loss": 0.1258,
+ "step": 20440
+ },
+ {
+ "epoch": 55.69754768392371,
+ "grad_norm": 4.468482494354248,
+ "learning_rate": 8.64470079277239e-06,
+ "loss": 0.2527,
+ "step": 20441
+ },
+ {
+ "epoch": 55.700272479564035,
+ "grad_norm": 4.860848903656006,
+ "learning_rate": 8.64382644596931e-06,
+ "loss": 0.0957,
+ "step": 20442
+ },
+ {
+ "epoch": 55.70299727520436,
+ "grad_norm": 4.185880184173584,
+ "learning_rate": 8.642952109728069e-06,
+ "loss": 0.0742,
+ "step": 20443
+ },
+ {
+ "epoch": 55.705722070844686,
+ "grad_norm": 4.801362037658691,
+ "learning_rate": 8.642077784055472e-06,
+ "loss": 0.1382,
+ "step": 20444
+ },
+ {
+ "epoch": 55.70844686648501,
+ "grad_norm": 4.546573162078857,
+ "learning_rate": 8.64120346895833e-06,
+ "loss": 0.2831,
+ "step": 20445
+ },
+ {
+ "epoch": 55.71117166212534,
+ "grad_norm": 4.603366851806641,
+ "learning_rate": 8.64032916444345e-06,
+ "loss": 0.1412,
+ "step": 20446
+ },
+ {
+ "epoch": 55.71389645776567,
+ "grad_norm": 4.130717754364014,
+ "learning_rate": 8.639454870517646e-06,
+ "loss": 0.1299,
+ "step": 20447
+ },
+ {
+ "epoch": 55.716621253406,
+ "grad_norm": 4.901968479156494,
+ "learning_rate": 8.63858058718772e-06,
+ "loss": 0.1439,
+ "step": 20448
+ },
+ {
+ "epoch": 55.71934604904632,
+ "grad_norm": 3.360917806625366,
+ "learning_rate": 8.637706314460487e-06,
+ "loss": 0.163,
+ "step": 20449
+ },
+ {
+ "epoch": 55.72207084468665,
+ "grad_norm": 4.054257392883301,
+ "learning_rate": 8.63683205234275e-06,
+ "loss": 0.1393,
+ "step": 20450
+ },
+ {
+ "epoch": 55.724795640326974,
+ "grad_norm": 3.5764174461364746,
+ "learning_rate": 8.63595780084132e-06,
+ "loss": 0.318,
+ "step": 20451
+ },
+ {
+ "epoch": 55.7275204359673,
+ "grad_norm": 3.5609607696533203,
+ "learning_rate": 8.635083559963014e-06,
+ "loss": 0.0677,
+ "step": 20452
+ },
+ {
+ "epoch": 55.73024523160763,
+ "grad_norm": 3.7269129753112793,
+ "learning_rate": 8.634209329714628e-06,
+ "loss": 0.0785,
+ "step": 20453
+ },
+ {
+ "epoch": 55.73297002724796,
+ "grad_norm": 4.766541004180908,
+ "learning_rate": 8.633335110102979e-06,
+ "loss": 0.1893,
+ "step": 20454
+ },
+ {
+ "epoch": 55.735694822888284,
+ "grad_norm": 4.41552209854126,
+ "learning_rate": 8.632460901134869e-06,
+ "loss": 0.1576,
+ "step": 20455
+ },
+ {
+ "epoch": 55.73841961852861,
+ "grad_norm": 5.0423479080200195,
+ "learning_rate": 8.631586702817111e-06,
+ "loss": 0.0763,
+ "step": 20456
+ },
+ {
+ "epoch": 55.741144414168936,
+ "grad_norm": 4.5149736404418945,
+ "learning_rate": 8.630712515156512e-06,
+ "loss": 0.1774,
+ "step": 20457
+ },
+ {
+ "epoch": 55.74386920980926,
+ "grad_norm": 3.756617784500122,
+ "learning_rate": 8.62983833815988e-06,
+ "loss": 0.2158,
+ "step": 20458
+ },
+ {
+ "epoch": 55.746594005449595,
+ "grad_norm": 3.6888821125030518,
+ "learning_rate": 8.628964171834023e-06,
+ "loss": 0.1418,
+ "step": 20459
+ },
+ {
+ "epoch": 55.74931880108992,
+ "grad_norm": 5.236166000366211,
+ "learning_rate": 8.628090016185748e-06,
+ "loss": 0.1648,
+ "step": 20460
+ },
+ {
+ "epoch": 55.752043596730246,
+ "grad_norm": 3.830169439315796,
+ "learning_rate": 8.627215871221864e-06,
+ "loss": 0.1081,
+ "step": 20461
+ },
+ {
+ "epoch": 55.75476839237057,
+ "grad_norm": 4.974534034729004,
+ "learning_rate": 8.62634173694918e-06,
+ "loss": 0.1028,
+ "step": 20462
+ },
+ {
+ "epoch": 55.7574931880109,
+ "grad_norm": 7.999661922454834,
+ "learning_rate": 8.625467613374501e-06,
+ "loss": 0.1679,
+ "step": 20463
+ },
+ {
+ "epoch": 55.76021798365122,
+ "grad_norm": 3.9220337867736816,
+ "learning_rate": 8.624593500504634e-06,
+ "loss": 0.1749,
+ "step": 20464
+ },
+ {
+ "epoch": 55.762942779291556,
+ "grad_norm": 4.370566368103027,
+ "learning_rate": 8.623719398346394e-06,
+ "loss": 0.2471,
+ "step": 20465
+ },
+ {
+ "epoch": 55.76566757493188,
+ "grad_norm": 4.0340728759765625,
+ "learning_rate": 8.622845306906577e-06,
+ "loss": 0.0947,
+ "step": 20466
+ },
+ {
+ "epoch": 55.76839237057221,
+ "grad_norm": 3.9111313819885254,
+ "learning_rate": 8.621971226191995e-06,
+ "loss": 0.167,
+ "step": 20467
+ },
+ {
+ "epoch": 55.771117166212534,
+ "grad_norm": 2.8047828674316406,
+ "learning_rate": 8.621097156209463e-06,
+ "loss": 0.0542,
+ "step": 20468
+ },
+ {
+ "epoch": 55.77384196185286,
+ "grad_norm": 3.8338875770568848,
+ "learning_rate": 8.62022309696578e-06,
+ "loss": 0.1348,
+ "step": 20469
+ },
+ {
+ "epoch": 55.776566757493185,
+ "grad_norm": 3.6789472103118896,
+ "learning_rate": 8.619349048467755e-06,
+ "loss": 0.1679,
+ "step": 20470
+ },
+ {
+ "epoch": 55.77929155313352,
+ "grad_norm": 3.9221291542053223,
+ "learning_rate": 8.618475010722194e-06,
+ "loss": 0.09,
+ "step": 20471
+ },
+ {
+ "epoch": 55.782016348773844,
+ "grad_norm": 4.1862592697143555,
+ "learning_rate": 8.617600983735908e-06,
+ "loss": 0.0659,
+ "step": 20472
+ },
+ {
+ "epoch": 55.78474114441417,
+ "grad_norm": 4.799045085906982,
+ "learning_rate": 8.6167269675157e-06,
+ "loss": 0.068,
+ "step": 20473
+ },
+ {
+ "epoch": 55.787465940054496,
+ "grad_norm": 3.4132657051086426,
+ "learning_rate": 8.615852962068377e-06,
+ "loss": 0.0683,
+ "step": 20474
+ },
+ {
+ "epoch": 55.79019073569482,
+ "grad_norm": 3.262223482131958,
+ "learning_rate": 8.614978967400747e-06,
+ "loss": 0.1489,
+ "step": 20475
+ },
+ {
+ "epoch": 55.79291553133515,
+ "grad_norm": 3.795609712600708,
+ "learning_rate": 8.614104983519617e-06,
+ "loss": 0.227,
+ "step": 20476
+ },
+ {
+ "epoch": 55.79564032697548,
+ "grad_norm": 3.7105584144592285,
+ "learning_rate": 8.61323101043179e-06,
+ "loss": 0.0702,
+ "step": 20477
+ },
+ {
+ "epoch": 55.798365122615806,
+ "grad_norm": 3.7257235050201416,
+ "learning_rate": 8.612357048144079e-06,
+ "loss": 0.1147,
+ "step": 20478
+ },
+ {
+ "epoch": 55.80108991825613,
+ "grad_norm": 3.381202220916748,
+ "learning_rate": 8.611483096663284e-06,
+ "loss": 0.1281,
+ "step": 20479
+ },
+ {
+ "epoch": 55.80381471389646,
+ "grad_norm": 3.040492534637451,
+ "learning_rate": 8.610609155996216e-06,
+ "loss": 0.0807,
+ "step": 20480
+ },
+ {
+ "epoch": 55.80653950953678,
+ "grad_norm": 4.473389148712158,
+ "learning_rate": 8.609735226149676e-06,
+ "loss": 0.1294,
+ "step": 20481
+ },
+ {
+ "epoch": 55.80926430517711,
+ "grad_norm": 5.4073896408081055,
+ "learning_rate": 8.608861307130477e-06,
+ "loss": 0.1582,
+ "step": 20482
+ },
+ {
+ "epoch": 55.81198910081744,
+ "grad_norm": 3.274014949798584,
+ "learning_rate": 8.607987398945419e-06,
+ "loss": 0.1768,
+ "step": 20483
+ },
+ {
+ "epoch": 55.81471389645777,
+ "grad_norm": 2.8430848121643066,
+ "learning_rate": 8.607113501601307e-06,
+ "loss": 0.1409,
+ "step": 20484
+ },
+ {
+ "epoch": 55.817438692098094,
+ "grad_norm": 4.293489456176758,
+ "learning_rate": 8.606239615104953e-06,
+ "loss": 0.0842,
+ "step": 20485
+ },
+ {
+ "epoch": 55.82016348773842,
+ "grad_norm": 4.750711917877197,
+ "learning_rate": 8.605365739463163e-06,
+ "loss": 0.1093,
+ "step": 20486
+ },
+ {
+ "epoch": 55.822888283378745,
+ "grad_norm": 4.375786304473877,
+ "learning_rate": 8.604491874682736e-06,
+ "loss": 0.1656,
+ "step": 20487
+ },
+ {
+ "epoch": 55.82561307901907,
+ "grad_norm": 4.1107611656188965,
+ "learning_rate": 8.603618020770486e-06,
+ "loss": 0.2394,
+ "step": 20488
+ },
+ {
+ "epoch": 55.828337874659404,
+ "grad_norm": 3.8165786266326904,
+ "learning_rate": 8.602744177733208e-06,
+ "loss": 0.0979,
+ "step": 20489
+ },
+ {
+ "epoch": 55.83106267029973,
+ "grad_norm": 5.442535400390625,
+ "learning_rate": 8.601870345577719e-06,
+ "loss": 0.0686,
+ "step": 20490
+ },
+ {
+ "epoch": 55.833787465940055,
+ "grad_norm": 3.9983370304107666,
+ "learning_rate": 8.600996524310814e-06,
+ "loss": 0.1364,
+ "step": 20491
+ },
+ {
+ "epoch": 55.83651226158038,
+ "grad_norm": 5.155202865600586,
+ "learning_rate": 8.600122713939307e-06,
+ "loss": 0.0956,
+ "step": 20492
+ },
+ {
+ "epoch": 55.83923705722071,
+ "grad_norm": 5.143024444580078,
+ "learning_rate": 8.599248914469997e-06,
+ "loss": 0.0867,
+ "step": 20493
+ },
+ {
+ "epoch": 55.84196185286103,
+ "grad_norm": 5.1866559982299805,
+ "learning_rate": 8.598375125909693e-06,
+ "loss": 0.1143,
+ "step": 20494
+ },
+ {
+ "epoch": 55.844686648501366,
+ "grad_norm": 3.8809587955474854,
+ "learning_rate": 8.597501348265197e-06,
+ "loss": 0.1009,
+ "step": 20495
+ },
+ {
+ "epoch": 55.84741144414169,
+ "grad_norm": 4.155538082122803,
+ "learning_rate": 8.596627581543317e-06,
+ "loss": 0.1741,
+ "step": 20496
+ },
+ {
+ "epoch": 55.85013623978202,
+ "grad_norm": 3.671724796295166,
+ "learning_rate": 8.595753825750853e-06,
+ "loss": 0.1216,
+ "step": 20497
+ },
+ {
+ "epoch": 55.85286103542234,
+ "grad_norm": 4.219904899597168,
+ "learning_rate": 8.594880080894616e-06,
+ "loss": 0.1168,
+ "step": 20498
+ },
+ {
+ "epoch": 55.85558583106267,
+ "grad_norm": 5.11779260635376,
+ "learning_rate": 8.594006346981406e-06,
+ "loss": 0.1481,
+ "step": 20499
+ },
+ {
+ "epoch": 55.858310626702995,
+ "grad_norm": 4.027957439422607,
+ "learning_rate": 8.59313262401803e-06,
+ "loss": 0.1699,
+ "step": 20500
+ },
+ {
+ "epoch": 55.86103542234333,
+ "grad_norm": 3.728930950164795,
+ "learning_rate": 8.59225891201129e-06,
+ "loss": 0.0855,
+ "step": 20501
+ },
+ {
+ "epoch": 55.86376021798365,
+ "grad_norm": 4.834834098815918,
+ "learning_rate": 8.591385210967993e-06,
+ "loss": 0.2245,
+ "step": 20502
+ },
+ {
+ "epoch": 55.86648501362398,
+ "grad_norm": 4.288930416107178,
+ "learning_rate": 8.590511520894946e-06,
+ "loss": 0.1592,
+ "step": 20503
+ },
+ {
+ "epoch": 55.869209809264305,
+ "grad_norm": 4.237362861633301,
+ "learning_rate": 8.589637841798945e-06,
+ "loss": 0.1316,
+ "step": 20504
+ },
+ {
+ "epoch": 55.87193460490463,
+ "grad_norm": 3.412639617919922,
+ "learning_rate": 8.5887641736868e-06,
+ "loss": 0.0765,
+ "step": 20505
+ },
+ {
+ "epoch": 55.87465940054496,
+ "grad_norm": 5.373528480529785,
+ "learning_rate": 8.587890516565319e-06,
+ "loss": 0.1209,
+ "step": 20506
+ },
+ {
+ "epoch": 55.87738419618529,
+ "grad_norm": 4.227440357208252,
+ "learning_rate": 8.587016870441297e-06,
+ "loss": 0.0988,
+ "step": 20507
+ },
+ {
+ "epoch": 55.880108991825615,
+ "grad_norm": 4.1393280029296875,
+ "learning_rate": 8.586143235321545e-06,
+ "loss": 0.0866,
+ "step": 20508
+ },
+ {
+ "epoch": 55.88283378746594,
+ "grad_norm": 3.8176050186157227,
+ "learning_rate": 8.585269611212862e-06,
+ "loss": 0.11,
+ "step": 20509
+ },
+ {
+ "epoch": 55.88555858310627,
+ "grad_norm": 4.862467288970947,
+ "learning_rate": 8.584395998122054e-06,
+ "loss": 0.1565,
+ "step": 20510
+ },
+ {
+ "epoch": 55.88828337874659,
+ "grad_norm": 3.5602667331695557,
+ "learning_rate": 8.583522396055923e-06,
+ "loss": 0.146,
+ "step": 20511
+ },
+ {
+ "epoch": 55.89100817438692,
+ "grad_norm": 4.005143165588379,
+ "learning_rate": 8.582648805021276e-06,
+ "loss": 0.1389,
+ "step": 20512
+ },
+ {
+ "epoch": 55.89373297002725,
+ "grad_norm": 3.108684778213501,
+ "learning_rate": 8.581775225024914e-06,
+ "loss": 0.1552,
+ "step": 20513
+ },
+ {
+ "epoch": 55.89645776566758,
+ "grad_norm": 3.6260788440704346,
+ "learning_rate": 8.58090165607364e-06,
+ "loss": 0.0751,
+ "step": 20514
+ },
+ {
+ "epoch": 55.8991825613079,
+ "grad_norm": 4.506085395812988,
+ "learning_rate": 8.58002809817426e-06,
+ "loss": 0.188,
+ "step": 20515
+ },
+ {
+ "epoch": 55.90190735694823,
+ "grad_norm": 3.595628499984741,
+ "learning_rate": 8.579154551333574e-06,
+ "loss": 0.1135,
+ "step": 20516
+ },
+ {
+ "epoch": 55.904632152588555,
+ "grad_norm": 4.162252426147461,
+ "learning_rate": 8.578281015558388e-06,
+ "loss": 0.1032,
+ "step": 20517
+ },
+ {
+ "epoch": 55.90735694822888,
+ "grad_norm": 3.3928403854370117,
+ "learning_rate": 8.577407490855499e-06,
+ "loss": 0.1577,
+ "step": 20518
+ },
+ {
+ "epoch": 55.91008174386921,
+ "grad_norm": 4.454849720001221,
+ "learning_rate": 8.57653397723172e-06,
+ "loss": 0.1331,
+ "step": 20519
+ },
+ {
+ "epoch": 55.91280653950954,
+ "grad_norm": 3.7224721908569336,
+ "learning_rate": 8.575660474693846e-06,
+ "loss": 0.0846,
+ "step": 20520
+ },
+ {
+ "epoch": 55.915531335149865,
+ "grad_norm": 3.00057315826416,
+ "learning_rate": 8.574786983248684e-06,
+ "loss": 0.1174,
+ "step": 20521
+ },
+ {
+ "epoch": 55.91825613079019,
+ "grad_norm": 3.5504508018493652,
+ "learning_rate": 8.573913502903034e-06,
+ "loss": 0.202,
+ "step": 20522
+ },
+ {
+ "epoch": 55.920980926430516,
+ "grad_norm": 4.388420104980469,
+ "learning_rate": 8.573040033663702e-06,
+ "loss": 0.0857,
+ "step": 20523
+ },
+ {
+ "epoch": 55.92370572207084,
+ "grad_norm": 3.6599771976470947,
+ "learning_rate": 8.572166575537484e-06,
+ "loss": 0.0688,
+ "step": 20524
+ },
+ {
+ "epoch": 55.926430517711175,
+ "grad_norm": 5.742560386657715,
+ "learning_rate": 8.571293128531191e-06,
+ "loss": 0.1443,
+ "step": 20525
+ },
+ {
+ "epoch": 55.9291553133515,
+ "grad_norm": 5.439338684082031,
+ "learning_rate": 8.57041969265162e-06,
+ "loss": 0.1298,
+ "step": 20526
+ },
+ {
+ "epoch": 55.93188010899183,
+ "grad_norm": 4.148625373840332,
+ "learning_rate": 8.569546267905571e-06,
+ "loss": 0.1327,
+ "step": 20527
+ },
+ {
+ "epoch": 55.93460490463215,
+ "grad_norm": 4.74026346206665,
+ "learning_rate": 8.568672854299856e-06,
+ "loss": 0.2154,
+ "step": 20528
+ },
+ {
+ "epoch": 55.93732970027248,
+ "grad_norm": 3.3893229961395264,
+ "learning_rate": 8.567799451841266e-06,
+ "loss": 0.0736,
+ "step": 20529
+ },
+ {
+ "epoch": 55.940054495912804,
+ "grad_norm": 2.7869043350219727,
+ "learning_rate": 8.566926060536608e-06,
+ "loss": 0.0547,
+ "step": 20530
+ },
+ {
+ "epoch": 55.94277929155314,
+ "grad_norm": 4.547995567321777,
+ "learning_rate": 8.566052680392684e-06,
+ "loss": 0.2509,
+ "step": 20531
+ },
+ {
+ "epoch": 55.94550408719346,
+ "grad_norm": 3.5843234062194824,
+ "learning_rate": 8.565179311416298e-06,
+ "loss": 0.1101,
+ "step": 20532
+ },
+ {
+ "epoch": 55.94822888283379,
+ "grad_norm": 4.6569414138793945,
+ "learning_rate": 8.564305953614246e-06,
+ "loss": 0.0799,
+ "step": 20533
+ },
+ {
+ "epoch": 55.950953678474114,
+ "grad_norm": 4.099673271179199,
+ "learning_rate": 8.563432606993337e-06,
+ "loss": 0.2314,
+ "step": 20534
+ },
+ {
+ "epoch": 55.95367847411444,
+ "grad_norm": 3.8664135932922363,
+ "learning_rate": 8.562559271560365e-06,
+ "loss": 0.1103,
+ "step": 20535
+ },
+ {
+ "epoch": 55.956403269754766,
+ "grad_norm": 4.16465425491333,
+ "learning_rate": 8.561685947322133e-06,
+ "loss": 0.1514,
+ "step": 20536
+ },
+ {
+ "epoch": 55.95912806539509,
+ "grad_norm": 5.871386528015137,
+ "learning_rate": 8.560812634285451e-06,
+ "loss": 0.0679,
+ "step": 20537
+ },
+ {
+ "epoch": 55.961852861035425,
+ "grad_norm": 3.923872470855713,
+ "learning_rate": 8.559939332457109e-06,
+ "loss": 0.0887,
+ "step": 20538
+ },
+ {
+ "epoch": 55.96457765667575,
+ "grad_norm": 4.287431240081787,
+ "learning_rate": 8.559066041843917e-06,
+ "loss": 0.1737,
+ "step": 20539
+ },
+ {
+ "epoch": 55.967302452316076,
+ "grad_norm": 3.428402900695801,
+ "learning_rate": 8.558192762452669e-06,
+ "loss": 0.0724,
+ "step": 20540
+ },
+ {
+ "epoch": 55.9700272479564,
+ "grad_norm": 4.2366533279418945,
+ "learning_rate": 8.557319494290171e-06,
+ "loss": 0.1356,
+ "step": 20541
+ },
+ {
+ "epoch": 55.97275204359673,
+ "grad_norm": 3.562201738357544,
+ "learning_rate": 8.55644623736322e-06,
+ "loss": 0.1089,
+ "step": 20542
+ },
+ {
+ "epoch": 55.97547683923706,
+ "grad_norm": 4.23938512802124,
+ "learning_rate": 8.555572991678624e-06,
+ "loss": 0.1206,
+ "step": 20543
+ },
+ {
+ "epoch": 55.97820163487739,
+ "grad_norm": 5.907759666442871,
+ "learning_rate": 8.554699757243174e-06,
+ "loss": 0.1504,
+ "step": 20544
+ },
+ {
+ "epoch": 55.98092643051771,
+ "grad_norm": 4.7009148597717285,
+ "learning_rate": 8.553826534063681e-06,
+ "loss": 0.147,
+ "step": 20545
+ },
+ {
+ "epoch": 55.98365122615804,
+ "grad_norm": 4.274569511413574,
+ "learning_rate": 8.552953322146936e-06,
+ "loss": 0.1461,
+ "step": 20546
+ },
+ {
+ "epoch": 55.986376021798364,
+ "grad_norm": 3.7574856281280518,
+ "learning_rate": 8.552080121499747e-06,
+ "loss": 0.0946,
+ "step": 20547
+ },
+ {
+ "epoch": 55.98910081743869,
+ "grad_norm": 3.955724000930786,
+ "learning_rate": 8.551206932128908e-06,
+ "loss": 0.1318,
+ "step": 20548
+ },
+ {
+ "epoch": 55.991825613079016,
+ "grad_norm": 3.2213187217712402,
+ "learning_rate": 8.550333754041227e-06,
+ "loss": 0.1254,
+ "step": 20549
+ },
+ {
+ "epoch": 55.99455040871935,
+ "grad_norm": 3.9226980209350586,
+ "learning_rate": 8.549460587243496e-06,
+ "loss": 0.0988,
+ "step": 20550
+ },
+ {
+ "epoch": 55.997275204359674,
+ "grad_norm": 4.1123576164245605,
+ "learning_rate": 8.54858743174252e-06,
+ "loss": 0.1186,
+ "step": 20551
+ },
+ {
+ "epoch": 56.0,
+ "grad_norm": 3.55380916595459,
+ "learning_rate": 8.5477142875451e-06,
+ "loss": 0.0511,
+ "step": 20552
+ },
+ {
+ "epoch": 56.002724795640326,
+ "grad_norm": 4.605118751525879,
+ "learning_rate": 8.546841154658031e-06,
+ "loss": 0.1745,
+ "step": 20553
+ },
+ {
+ "epoch": 56.00544959128065,
+ "grad_norm": 2.965914249420166,
+ "learning_rate": 8.545968033088117e-06,
+ "loss": 0.0537,
+ "step": 20554
+ },
+ {
+ "epoch": 56.00817438692098,
+ "grad_norm": 4.400588035583496,
+ "learning_rate": 8.545094922842161e-06,
+ "loss": 0.1819,
+ "step": 20555
+ },
+ {
+ "epoch": 56.01089918256131,
+ "grad_norm": 4.025671482086182,
+ "learning_rate": 8.544221823926957e-06,
+ "loss": 0.0813,
+ "step": 20556
+ },
+ {
+ "epoch": 56.013623978201636,
+ "grad_norm": 6.826101779937744,
+ "learning_rate": 8.543348736349307e-06,
+ "loss": 0.0879,
+ "step": 20557
+ },
+ {
+ "epoch": 56.01634877384196,
+ "grad_norm": 4.12449836730957,
+ "learning_rate": 8.54247566011601e-06,
+ "loss": 0.1038,
+ "step": 20558
+ },
+ {
+ "epoch": 56.01907356948229,
+ "grad_norm": 3.6200411319732666,
+ "learning_rate": 8.541602595233866e-06,
+ "loss": 0.0882,
+ "step": 20559
+ },
+ {
+ "epoch": 56.02179836512261,
+ "grad_norm": 3.680046319961548,
+ "learning_rate": 8.540729541709673e-06,
+ "loss": 0.0771,
+ "step": 20560
+ },
+ {
+ "epoch": 56.02452316076294,
+ "grad_norm": 5.322786808013916,
+ "learning_rate": 8.539856499550233e-06,
+ "loss": 0.088,
+ "step": 20561
+ },
+ {
+ "epoch": 56.02724795640327,
+ "grad_norm": 3.4235246181488037,
+ "learning_rate": 8.53898346876234e-06,
+ "loss": 0.1759,
+ "step": 20562
+ },
+ {
+ "epoch": 56.0299727520436,
+ "grad_norm": 3.9941909313201904,
+ "learning_rate": 8.5381104493528e-06,
+ "loss": 0.182,
+ "step": 20563
+ },
+ {
+ "epoch": 56.032697547683924,
+ "grad_norm": 3.8364150524139404,
+ "learning_rate": 8.537237441328409e-06,
+ "loss": 0.0684,
+ "step": 20564
+ },
+ {
+ "epoch": 56.03542234332425,
+ "grad_norm": 3.503875255584717,
+ "learning_rate": 8.536364444695967e-06,
+ "loss": 0.099,
+ "step": 20565
+ },
+ {
+ "epoch": 56.038147138964575,
+ "grad_norm": 9.737573623657227,
+ "learning_rate": 8.535491459462267e-06,
+ "loss": 0.1859,
+ "step": 20566
+ },
+ {
+ "epoch": 56.0408719346049,
+ "grad_norm": 3.5125746726989746,
+ "learning_rate": 8.534618485634115e-06,
+ "loss": 0.1195,
+ "step": 20567
+ },
+ {
+ "epoch": 56.043596730245234,
+ "grad_norm": 3.228148937225342,
+ "learning_rate": 8.533745523218307e-06,
+ "loss": 0.0768,
+ "step": 20568
+ },
+ {
+ "epoch": 56.04632152588556,
+ "grad_norm": 4.585299015045166,
+ "learning_rate": 8.532872572221642e-06,
+ "loss": 0.1622,
+ "step": 20569
+ },
+ {
+ "epoch": 56.049046321525886,
+ "grad_norm": 3.633225202560425,
+ "learning_rate": 8.531999632650912e-06,
+ "loss": 0.3036,
+ "step": 20570
+ },
+ {
+ "epoch": 56.05177111716621,
+ "grad_norm": 3.193605899810791,
+ "learning_rate": 8.531126704512928e-06,
+ "loss": 0.1625,
+ "step": 20571
+ },
+ {
+ "epoch": 56.05449591280654,
+ "grad_norm": 4.373520851135254,
+ "learning_rate": 8.53025378781448e-06,
+ "loss": 0.2033,
+ "step": 20572
+ },
+ {
+ "epoch": 56.05722070844686,
+ "grad_norm": 3.933464765548706,
+ "learning_rate": 8.529380882562371e-06,
+ "loss": 0.1679,
+ "step": 20573
+ },
+ {
+ "epoch": 56.059945504087196,
+ "grad_norm": 3.5256805419921875,
+ "learning_rate": 8.528507988763393e-06,
+ "loss": 0.0786,
+ "step": 20574
+ },
+ {
+ "epoch": 56.06267029972752,
+ "grad_norm": 4.1520891189575195,
+ "learning_rate": 8.527635106424352e-06,
+ "loss": 0.1364,
+ "step": 20575
+ },
+ {
+ "epoch": 56.06539509536785,
+ "grad_norm": 4.632296562194824,
+ "learning_rate": 8.526762235552038e-06,
+ "loss": 0.1718,
+ "step": 20576
+ },
+ {
+ "epoch": 56.06811989100817,
+ "grad_norm": 4.335762977600098,
+ "learning_rate": 8.525889376153253e-06,
+ "loss": 0.1075,
+ "step": 20577
+ },
+ {
+ "epoch": 56.0708446866485,
+ "grad_norm": 3.0486397743225098,
+ "learning_rate": 8.525016528234794e-06,
+ "loss": 0.078,
+ "step": 20578
+ },
+ {
+ "epoch": 56.073569482288825,
+ "grad_norm": 4.040469646453857,
+ "learning_rate": 8.52414369180346e-06,
+ "loss": 0.0702,
+ "step": 20579
+ },
+ {
+ "epoch": 56.07629427792916,
+ "grad_norm": 3.926084041595459,
+ "learning_rate": 8.523270866866044e-06,
+ "loss": 0.0851,
+ "step": 20580
+ },
+ {
+ "epoch": 56.079019073569484,
+ "grad_norm": 4.060538291931152,
+ "learning_rate": 8.52239805342935e-06,
+ "loss": 0.2353,
+ "step": 20581
+ },
+ {
+ "epoch": 56.08174386920981,
+ "grad_norm": 5.469473361968994,
+ "learning_rate": 8.521525251500172e-06,
+ "loss": 0.0915,
+ "step": 20582
+ },
+ {
+ "epoch": 56.084468664850135,
+ "grad_norm": 3.8926613330841064,
+ "learning_rate": 8.520652461085309e-06,
+ "loss": 0.1103,
+ "step": 20583
+ },
+ {
+ "epoch": 56.08719346049046,
+ "grad_norm": 3.446298360824585,
+ "learning_rate": 8.519779682191554e-06,
+ "loss": 0.0861,
+ "step": 20584
+ },
+ {
+ "epoch": 56.08991825613079,
+ "grad_norm": 3.4064533710479736,
+ "learning_rate": 8.518906914825709e-06,
+ "loss": 0.0959,
+ "step": 20585
+ },
+ {
+ "epoch": 56.09264305177112,
+ "grad_norm": 3.9588980674743652,
+ "learning_rate": 8.518034158994567e-06,
+ "loss": 0.0604,
+ "step": 20586
+ },
+ {
+ "epoch": 56.095367847411445,
+ "grad_norm": 3.596825122833252,
+ "learning_rate": 8.517161414704926e-06,
+ "loss": 0.0688,
+ "step": 20587
+ },
+ {
+ "epoch": 56.09809264305177,
+ "grad_norm": 3.5281028747558594,
+ "learning_rate": 8.516288681963589e-06,
+ "loss": 0.2004,
+ "step": 20588
+ },
+ {
+ "epoch": 56.1008174386921,
+ "grad_norm": 4.134294509887695,
+ "learning_rate": 8.515415960777345e-06,
+ "loss": 0.0913,
+ "step": 20589
+ },
+ {
+ "epoch": 56.10354223433242,
+ "grad_norm": 4.095026969909668,
+ "learning_rate": 8.514543251152996e-06,
+ "loss": 0.253,
+ "step": 20590
+ },
+ {
+ "epoch": 56.10626702997275,
+ "grad_norm": 3.5762150287628174,
+ "learning_rate": 8.513670553097335e-06,
+ "loss": 0.1701,
+ "step": 20591
+ },
+ {
+ "epoch": 56.10899182561308,
+ "grad_norm": 3.8802061080932617,
+ "learning_rate": 8.512797866617158e-06,
+ "loss": 0.1399,
+ "step": 20592
+ },
+ {
+ "epoch": 56.11171662125341,
+ "grad_norm": 4.417481899261475,
+ "learning_rate": 8.511925191719268e-06,
+ "loss": 0.187,
+ "step": 20593
+ },
+ {
+ "epoch": 56.11444141689373,
+ "grad_norm": 4.006098747253418,
+ "learning_rate": 8.511052528410453e-06,
+ "loss": 0.1473,
+ "step": 20594
+ },
+ {
+ "epoch": 56.11716621253406,
+ "grad_norm": 4.55978536605835,
+ "learning_rate": 8.510179876697514e-06,
+ "loss": 0.2118,
+ "step": 20595
+ },
+ {
+ "epoch": 56.119891008174385,
+ "grad_norm": 3.7112536430358887,
+ "learning_rate": 8.509307236587247e-06,
+ "loss": 0.1585,
+ "step": 20596
+ },
+ {
+ "epoch": 56.12261580381471,
+ "grad_norm": 2.8644304275512695,
+ "learning_rate": 8.508434608086448e-06,
+ "loss": 0.1177,
+ "step": 20597
+ },
+ {
+ "epoch": 56.12534059945504,
+ "grad_norm": 4.249670028686523,
+ "learning_rate": 8.507561991201908e-06,
+ "loss": 0.0741,
+ "step": 20598
+ },
+ {
+ "epoch": 56.12806539509537,
+ "grad_norm": 3.9912595748901367,
+ "learning_rate": 8.506689385940433e-06,
+ "loss": 0.0659,
+ "step": 20599
+ },
+ {
+ "epoch": 56.130790190735695,
+ "grad_norm": 3.794909954071045,
+ "learning_rate": 8.50581679230881e-06,
+ "loss": 0.0722,
+ "step": 20600
+ },
+ {
+ "epoch": 56.13351498637602,
+ "grad_norm": 3.5600454807281494,
+ "learning_rate": 8.504944210313838e-06,
+ "loss": 0.1109,
+ "step": 20601
+ },
+ {
+ "epoch": 56.13623978201635,
+ "grad_norm": 5.2991414070129395,
+ "learning_rate": 8.50407163996231e-06,
+ "loss": 0.0802,
+ "step": 20602
+ },
+ {
+ "epoch": 56.13896457765667,
+ "grad_norm": 7.255417346954346,
+ "learning_rate": 8.503199081261028e-06,
+ "loss": 0.1211,
+ "step": 20603
+ },
+ {
+ "epoch": 56.141689373297005,
+ "grad_norm": 3.479802370071411,
+ "learning_rate": 8.50232653421678e-06,
+ "loss": 0.0732,
+ "step": 20604
+ },
+ {
+ "epoch": 56.14441416893733,
+ "grad_norm": 3.8354055881500244,
+ "learning_rate": 8.501453998836364e-06,
+ "loss": 0.0726,
+ "step": 20605
+ },
+ {
+ "epoch": 56.14713896457766,
+ "grad_norm": 3.690303087234497,
+ "learning_rate": 8.50058147512658e-06,
+ "loss": 0.1032,
+ "step": 20606
+ },
+ {
+ "epoch": 56.14986376021798,
+ "grad_norm": 4.3305182456970215,
+ "learning_rate": 8.499708963094216e-06,
+ "loss": 0.3212,
+ "step": 20607
+ },
+ {
+ "epoch": 56.15258855585831,
+ "grad_norm": 4.2532196044921875,
+ "learning_rate": 8.498836462746074e-06,
+ "loss": 0.073,
+ "step": 20608
+ },
+ {
+ "epoch": 56.155313351498634,
+ "grad_norm": 4.8961873054504395,
+ "learning_rate": 8.497963974088942e-06,
+ "loss": 0.2046,
+ "step": 20609
+ },
+ {
+ "epoch": 56.15803814713897,
+ "grad_norm": 3.996030330657959,
+ "learning_rate": 8.497091497129621e-06,
+ "loss": 0.1031,
+ "step": 20610
+ },
+ {
+ "epoch": 56.16076294277929,
+ "grad_norm": 3.6293375492095947,
+ "learning_rate": 8.496219031874899e-06,
+ "loss": 0.1507,
+ "step": 20611
+ },
+ {
+ "epoch": 56.16348773841962,
+ "grad_norm": 4.9578633308410645,
+ "learning_rate": 8.49534657833158e-06,
+ "loss": 0.1609,
+ "step": 20612
+ },
+ {
+ "epoch": 56.166212534059945,
+ "grad_norm": 4.215757369995117,
+ "learning_rate": 8.49447413650645e-06,
+ "loss": 0.1286,
+ "step": 20613
+ },
+ {
+ "epoch": 56.16893732970027,
+ "grad_norm": 4.967205047607422,
+ "learning_rate": 8.493601706406305e-06,
+ "loss": 0.2106,
+ "step": 20614
+ },
+ {
+ "epoch": 56.171662125340596,
+ "grad_norm": 3.4942333698272705,
+ "learning_rate": 8.492729288037945e-06,
+ "loss": 0.0626,
+ "step": 20615
+ },
+ {
+ "epoch": 56.17438692098093,
+ "grad_norm": 3.1676595211029053,
+ "learning_rate": 8.491856881408159e-06,
+ "loss": 0.0788,
+ "step": 20616
+ },
+ {
+ "epoch": 56.177111716621255,
+ "grad_norm": 4.532700061798096,
+ "learning_rate": 8.490984486523746e-06,
+ "loss": 0.101,
+ "step": 20617
+ },
+ {
+ "epoch": 56.17983651226158,
+ "grad_norm": 3.0709919929504395,
+ "learning_rate": 8.490112103391494e-06,
+ "loss": 0.0716,
+ "step": 20618
+ },
+ {
+ "epoch": 56.182561307901906,
+ "grad_norm": 4.7369384765625,
+ "learning_rate": 8.489239732018202e-06,
+ "loss": 0.1132,
+ "step": 20619
+ },
+ {
+ "epoch": 56.18528610354223,
+ "grad_norm": 4.261050224304199,
+ "learning_rate": 8.48836737241066e-06,
+ "loss": 0.1538,
+ "step": 20620
+ },
+ {
+ "epoch": 56.18801089918256,
+ "grad_norm": 8.628913879394531,
+ "learning_rate": 8.487495024575668e-06,
+ "loss": 0.077,
+ "step": 20621
+ },
+ {
+ "epoch": 56.19073569482289,
+ "grad_norm": 3.7310938835144043,
+ "learning_rate": 8.48662268852001e-06,
+ "loss": 0.1542,
+ "step": 20622
+ },
+ {
+ "epoch": 56.19346049046322,
+ "grad_norm": 4.899902820587158,
+ "learning_rate": 8.48575036425049e-06,
+ "loss": 0.209,
+ "step": 20623
+ },
+ {
+ "epoch": 56.19618528610354,
+ "grad_norm": 3.526634693145752,
+ "learning_rate": 8.4848780517739e-06,
+ "loss": 0.098,
+ "step": 20624
+ },
+ {
+ "epoch": 56.19891008174387,
+ "grad_norm": 4.161648750305176,
+ "learning_rate": 8.484005751097026e-06,
+ "loss": 0.1522,
+ "step": 20625
+ },
+ {
+ "epoch": 56.201634877384194,
+ "grad_norm": 3.330474853515625,
+ "learning_rate": 8.483133462226671e-06,
+ "loss": 0.1376,
+ "step": 20626
+ },
+ {
+ "epoch": 56.20435967302452,
+ "grad_norm": 4.167783260345459,
+ "learning_rate": 8.48226118516962e-06,
+ "loss": 0.1346,
+ "step": 20627
+ },
+ {
+ "epoch": 56.20708446866485,
+ "grad_norm": 4.754262924194336,
+ "learning_rate": 8.481388919932672e-06,
+ "loss": 0.0906,
+ "step": 20628
+ },
+ {
+ "epoch": 56.20980926430518,
+ "grad_norm": 3.272594928741455,
+ "learning_rate": 8.480516666522616e-06,
+ "loss": 0.1415,
+ "step": 20629
+ },
+ {
+ "epoch": 56.212534059945504,
+ "grad_norm": 3.318922758102417,
+ "learning_rate": 8.479644424946251e-06,
+ "loss": 0.0499,
+ "step": 20630
+ },
+ {
+ "epoch": 56.21525885558583,
+ "grad_norm": 4.075006484985352,
+ "learning_rate": 8.478772195210365e-06,
+ "loss": 0.1142,
+ "step": 20631
+ },
+ {
+ "epoch": 56.217983651226156,
+ "grad_norm": 4.122602462768555,
+ "learning_rate": 8.477899977321752e-06,
+ "loss": 0.1281,
+ "step": 20632
+ },
+ {
+ "epoch": 56.22070844686648,
+ "grad_norm": 3.0714304447174072,
+ "learning_rate": 8.477027771287203e-06,
+ "loss": 0.1627,
+ "step": 20633
+ },
+ {
+ "epoch": 56.223433242506815,
+ "grad_norm": 5.425609588623047,
+ "learning_rate": 8.476155577113515e-06,
+ "loss": 0.1478,
+ "step": 20634
+ },
+ {
+ "epoch": 56.22615803814714,
+ "grad_norm": 4.0460920333862305,
+ "learning_rate": 8.475283394807478e-06,
+ "loss": 0.1296,
+ "step": 20635
+ },
+ {
+ "epoch": 56.228882833787466,
+ "grad_norm": 3.1727192401885986,
+ "learning_rate": 8.474411224375885e-06,
+ "loss": 0.206,
+ "step": 20636
+ },
+ {
+ "epoch": 56.23160762942779,
+ "grad_norm": 3.6730051040649414,
+ "learning_rate": 8.473539065825527e-06,
+ "loss": 0.1467,
+ "step": 20637
+ },
+ {
+ "epoch": 56.23433242506812,
+ "grad_norm": 3.1039352416992188,
+ "learning_rate": 8.472666919163198e-06,
+ "loss": 0.0871,
+ "step": 20638
+ },
+ {
+ "epoch": 56.237057220708444,
+ "grad_norm": 2.95245099067688,
+ "learning_rate": 8.471794784395687e-06,
+ "loss": 0.0625,
+ "step": 20639
+ },
+ {
+ "epoch": 56.23978201634878,
+ "grad_norm": 5.449034690856934,
+ "learning_rate": 8.470922661529792e-06,
+ "loss": 0.0532,
+ "step": 20640
+ },
+ {
+ "epoch": 56.2425068119891,
+ "grad_norm": 4.009894371032715,
+ "learning_rate": 8.470050550572302e-06,
+ "loss": 0.1112,
+ "step": 20641
+ },
+ {
+ "epoch": 56.24523160762943,
+ "grad_norm": 3.69368052482605,
+ "learning_rate": 8.46917845153001e-06,
+ "loss": 0.1003,
+ "step": 20642
+ },
+ {
+ "epoch": 56.247956403269754,
+ "grad_norm": 4.515437126159668,
+ "learning_rate": 8.468306364409704e-06,
+ "loss": 0.0798,
+ "step": 20643
+ },
+ {
+ "epoch": 56.25068119891008,
+ "grad_norm": 4.0363450050354,
+ "learning_rate": 8.467434289218184e-06,
+ "loss": 0.075,
+ "step": 20644
+ },
+ {
+ "epoch": 56.253405994550405,
+ "grad_norm": 4.053673267364502,
+ "learning_rate": 8.466562225962233e-06,
+ "loss": 0.1453,
+ "step": 20645
+ },
+ {
+ "epoch": 56.25613079019074,
+ "grad_norm": 3.6368520259857178,
+ "learning_rate": 8.465690174648648e-06,
+ "loss": 0.1522,
+ "step": 20646
+ },
+ {
+ "epoch": 56.258855585831064,
+ "grad_norm": 4.203634738922119,
+ "learning_rate": 8.464818135284214e-06,
+ "loss": 0.1559,
+ "step": 20647
+ },
+ {
+ "epoch": 56.26158038147139,
+ "grad_norm": 3.756179094314575,
+ "learning_rate": 8.463946107875732e-06,
+ "loss": 0.2895,
+ "step": 20648
+ },
+ {
+ "epoch": 56.264305177111716,
+ "grad_norm": 3.291050910949707,
+ "learning_rate": 8.463074092429986e-06,
+ "loss": 0.0635,
+ "step": 20649
+ },
+ {
+ "epoch": 56.26702997275204,
+ "grad_norm": 3.4768476486206055,
+ "learning_rate": 8.462202088953771e-06,
+ "loss": 0.091,
+ "step": 20650
+ },
+ {
+ "epoch": 56.26975476839237,
+ "grad_norm": 4.023835182189941,
+ "learning_rate": 8.461330097453875e-06,
+ "loss": 0.1656,
+ "step": 20651
+ },
+ {
+ "epoch": 56.2724795640327,
+ "grad_norm": 3.9702351093292236,
+ "learning_rate": 8.460458117937091e-06,
+ "loss": 0.1035,
+ "step": 20652
+ },
+ {
+ "epoch": 56.275204359673026,
+ "grad_norm": 3.135334014892578,
+ "learning_rate": 8.45958615041021e-06,
+ "loss": 0.0998,
+ "step": 20653
+ },
+ {
+ "epoch": 56.27792915531335,
+ "grad_norm": 4.371511459350586,
+ "learning_rate": 8.458714194880022e-06,
+ "loss": 0.0726,
+ "step": 20654
+ },
+ {
+ "epoch": 56.28065395095368,
+ "grad_norm": 3.310818910598755,
+ "learning_rate": 8.45784225135332e-06,
+ "loss": 0.0718,
+ "step": 20655
+ },
+ {
+ "epoch": 56.283378746594,
+ "grad_norm": 3.2568392753601074,
+ "learning_rate": 8.456970319836886e-06,
+ "loss": 0.0666,
+ "step": 20656
+ },
+ {
+ "epoch": 56.28610354223433,
+ "grad_norm": 4.366418361663818,
+ "learning_rate": 8.456098400337522e-06,
+ "loss": 0.2138,
+ "step": 20657
+ },
+ {
+ "epoch": 56.28882833787466,
+ "grad_norm": 4.223952770233154,
+ "learning_rate": 8.455226492862017e-06,
+ "loss": 0.0636,
+ "step": 20658
+ },
+ {
+ "epoch": 56.29155313351499,
+ "grad_norm": 3.9034769535064697,
+ "learning_rate": 8.454354597417155e-06,
+ "loss": 0.1913,
+ "step": 20659
+ },
+ {
+ "epoch": 56.294277929155314,
+ "grad_norm": 7.27374267578125,
+ "learning_rate": 8.453482714009732e-06,
+ "loss": 0.1548,
+ "step": 20660
+ },
+ {
+ "epoch": 56.29700272479564,
+ "grad_norm": 4.076107025146484,
+ "learning_rate": 8.452610842646533e-06,
+ "loss": 0.1189,
+ "step": 20661
+ },
+ {
+ "epoch": 56.299727520435965,
+ "grad_norm": 3.573756694793701,
+ "learning_rate": 8.451738983334355e-06,
+ "loss": 0.064,
+ "step": 20662
+ },
+ {
+ "epoch": 56.30245231607629,
+ "grad_norm": 3.9268429279327393,
+ "learning_rate": 8.45086713607998e-06,
+ "loss": 0.1564,
+ "step": 20663
+ },
+ {
+ "epoch": 56.305177111716624,
+ "grad_norm": 4.568852424621582,
+ "learning_rate": 8.449995300890204e-06,
+ "loss": 0.0923,
+ "step": 20664
+ },
+ {
+ "epoch": 56.30790190735695,
+ "grad_norm": 4.122679710388184,
+ "learning_rate": 8.449123477771815e-06,
+ "loss": 0.1715,
+ "step": 20665
+ },
+ {
+ "epoch": 56.310626702997276,
+ "grad_norm": 3.1892356872558594,
+ "learning_rate": 8.448251666731601e-06,
+ "loss": 0.0709,
+ "step": 20666
+ },
+ {
+ "epoch": 56.3133514986376,
+ "grad_norm": 3.214322328567505,
+ "learning_rate": 8.447379867776353e-06,
+ "loss": 0.0796,
+ "step": 20667
+ },
+ {
+ "epoch": 56.31607629427793,
+ "grad_norm": 4.30591344833374,
+ "learning_rate": 8.446508080912863e-06,
+ "loss": 0.1585,
+ "step": 20668
+ },
+ {
+ "epoch": 56.31880108991825,
+ "grad_norm": 3.253145217895508,
+ "learning_rate": 8.445636306147915e-06,
+ "loss": 0.0599,
+ "step": 20669
+ },
+ {
+ "epoch": 56.321525885558586,
+ "grad_norm": 3.429258108139038,
+ "learning_rate": 8.444764543488303e-06,
+ "loss": 0.0623,
+ "step": 20670
+ },
+ {
+ "epoch": 56.32425068119891,
+ "grad_norm": 3.463414192199707,
+ "learning_rate": 8.443892792940815e-06,
+ "loss": 0.0788,
+ "step": 20671
+ },
+ {
+ "epoch": 56.32697547683924,
+ "grad_norm": 4.158020496368408,
+ "learning_rate": 8.44302105451224e-06,
+ "loss": 0.1442,
+ "step": 20672
+ },
+ {
+ "epoch": 56.32970027247956,
+ "grad_norm": 4.838292598724365,
+ "learning_rate": 8.442149328209364e-06,
+ "loss": 0.1763,
+ "step": 20673
+ },
+ {
+ "epoch": 56.33242506811989,
+ "grad_norm": 3.9878294467926025,
+ "learning_rate": 8.44127761403898e-06,
+ "loss": 0.078,
+ "step": 20674
+ },
+ {
+ "epoch": 56.335149863760215,
+ "grad_norm": 2.6165270805358887,
+ "learning_rate": 8.440405912007879e-06,
+ "loss": 0.0497,
+ "step": 20675
+ },
+ {
+ "epoch": 56.33787465940055,
+ "grad_norm": 4.76611852645874,
+ "learning_rate": 8.439534222122843e-06,
+ "loss": 0.3121,
+ "step": 20676
+ },
+ {
+ "epoch": 56.34059945504087,
+ "grad_norm": 3.606412172317505,
+ "learning_rate": 8.438662544390666e-06,
+ "loss": 0.0633,
+ "step": 20677
+ },
+ {
+ "epoch": 56.3433242506812,
+ "grad_norm": 4.322358131408691,
+ "learning_rate": 8.437790878818135e-06,
+ "loss": 0.1374,
+ "step": 20678
+ },
+ {
+ "epoch": 56.346049046321525,
+ "grad_norm": 3.323930263519287,
+ "learning_rate": 8.436919225412038e-06,
+ "loss": 0.1242,
+ "step": 20679
+ },
+ {
+ "epoch": 56.34877384196185,
+ "grad_norm": 4.404124736785889,
+ "learning_rate": 8.436047584179163e-06,
+ "loss": 0.099,
+ "step": 20680
+ },
+ {
+ "epoch": 56.35149863760218,
+ "grad_norm": 5.267062664031982,
+ "learning_rate": 8.4351759551263e-06,
+ "loss": 0.1487,
+ "step": 20681
+ },
+ {
+ "epoch": 56.35422343324251,
+ "grad_norm": 3.791018486022949,
+ "learning_rate": 8.434304338260237e-06,
+ "loss": 0.1992,
+ "step": 20682
+ },
+ {
+ "epoch": 56.356948228882835,
+ "grad_norm": 3.1285722255706787,
+ "learning_rate": 8.433432733587758e-06,
+ "loss": 0.0647,
+ "step": 20683
+ },
+ {
+ "epoch": 56.35967302452316,
+ "grad_norm": 4.164439678192139,
+ "learning_rate": 8.43256114111566e-06,
+ "loss": 0.1759,
+ "step": 20684
+ },
+ {
+ "epoch": 56.36239782016349,
+ "grad_norm": 6.165648937225342,
+ "learning_rate": 8.43168956085072e-06,
+ "loss": 0.1041,
+ "step": 20685
+ },
+ {
+ "epoch": 56.36512261580381,
+ "grad_norm": 3.150517225265503,
+ "learning_rate": 8.430817992799735e-06,
+ "loss": 0.0934,
+ "step": 20686
+ },
+ {
+ "epoch": 56.36784741144414,
+ "grad_norm": 3.8604135513305664,
+ "learning_rate": 8.429946436969488e-06,
+ "loss": 0.1202,
+ "step": 20687
+ },
+ {
+ "epoch": 56.37057220708447,
+ "grad_norm": 2.8514785766601562,
+ "learning_rate": 8.429074893366768e-06,
+ "loss": 0.0547,
+ "step": 20688
+ },
+ {
+ "epoch": 56.3732970027248,
+ "grad_norm": 3.9102790355682373,
+ "learning_rate": 8.42820336199836e-06,
+ "loss": 0.0665,
+ "step": 20689
+ },
+ {
+ "epoch": 56.37602179836512,
+ "grad_norm": 3.69484281539917,
+ "learning_rate": 8.427331842871052e-06,
+ "loss": 0.0907,
+ "step": 20690
+ },
+ {
+ "epoch": 56.37874659400545,
+ "grad_norm": 6.28098201751709,
+ "learning_rate": 8.426460335991638e-06,
+ "loss": 0.0531,
+ "step": 20691
+ },
+ {
+ "epoch": 56.381471389645775,
+ "grad_norm": 3.8371851444244385,
+ "learning_rate": 8.425588841366896e-06,
+ "loss": 0.0674,
+ "step": 20692
+ },
+ {
+ "epoch": 56.3841961852861,
+ "grad_norm": 5.768299102783203,
+ "learning_rate": 8.424717359003621e-06,
+ "loss": 0.1763,
+ "step": 20693
+ },
+ {
+ "epoch": 56.38692098092643,
+ "grad_norm": 3.979182004928589,
+ "learning_rate": 8.423845888908595e-06,
+ "loss": 0.1097,
+ "step": 20694
+ },
+ {
+ "epoch": 56.38964577656676,
+ "grad_norm": 6.081275463104248,
+ "learning_rate": 8.422974431088607e-06,
+ "loss": 0.2229,
+ "step": 20695
+ },
+ {
+ "epoch": 56.392370572207085,
+ "grad_norm": 2.5754799842834473,
+ "learning_rate": 8.422102985550441e-06,
+ "loss": 0.1401,
+ "step": 20696
+ },
+ {
+ "epoch": 56.39509536784741,
+ "grad_norm": 3.954085350036621,
+ "learning_rate": 8.42123155230089e-06,
+ "loss": 0.0638,
+ "step": 20697
+ },
+ {
+ "epoch": 56.39782016348774,
+ "grad_norm": 6.7409563064575195,
+ "learning_rate": 8.420360131346735e-06,
+ "loss": 0.2512,
+ "step": 20698
+ },
+ {
+ "epoch": 56.40054495912806,
+ "grad_norm": 5.291450023651123,
+ "learning_rate": 8.419488722694765e-06,
+ "loss": 0.0859,
+ "step": 20699
+ },
+ {
+ "epoch": 56.403269754768395,
+ "grad_norm": 3.6343750953674316,
+ "learning_rate": 8.418617326351765e-06,
+ "loss": 0.1427,
+ "step": 20700
+ },
+ {
+ "epoch": 56.40599455040872,
+ "grad_norm": 4.284163951873779,
+ "learning_rate": 8.417745942324522e-06,
+ "loss": 0.1995,
+ "step": 20701
+ },
+ {
+ "epoch": 56.40871934604905,
+ "grad_norm": 4.142784595489502,
+ "learning_rate": 8.416874570619825e-06,
+ "loss": 0.1035,
+ "step": 20702
+ },
+ {
+ "epoch": 56.41144414168937,
+ "grad_norm": 3.6764538288116455,
+ "learning_rate": 8.416003211244454e-06,
+ "loss": 0.0861,
+ "step": 20703
+ },
+ {
+ "epoch": 56.4141689373297,
+ "grad_norm": 5.162350177764893,
+ "learning_rate": 8.415131864205204e-06,
+ "loss": 0.0556,
+ "step": 20704
+ },
+ {
+ "epoch": 56.416893732970024,
+ "grad_norm": 3.668029546737671,
+ "learning_rate": 8.414260529508851e-06,
+ "loss": 0.2694,
+ "step": 20705
+ },
+ {
+ "epoch": 56.41961852861036,
+ "grad_norm": 3.40997576713562,
+ "learning_rate": 8.41338920716219e-06,
+ "loss": 0.1552,
+ "step": 20706
+ },
+ {
+ "epoch": 56.42234332425068,
+ "grad_norm": 3.400639057159424,
+ "learning_rate": 8.412517897172001e-06,
+ "loss": 0.0723,
+ "step": 20707
+ },
+ {
+ "epoch": 56.42506811989101,
+ "grad_norm": 2.9111382961273193,
+ "learning_rate": 8.411646599545068e-06,
+ "loss": 0.0683,
+ "step": 20708
+ },
+ {
+ "epoch": 56.427792915531334,
+ "grad_norm": 3.2668423652648926,
+ "learning_rate": 8.410775314288186e-06,
+ "loss": 0.1265,
+ "step": 20709
+ },
+ {
+ "epoch": 56.43051771117166,
+ "grad_norm": 3.4724650382995605,
+ "learning_rate": 8.40990404140813e-06,
+ "loss": 0.1359,
+ "step": 20710
+ },
+ {
+ "epoch": 56.433242506811986,
+ "grad_norm": 3.0020253658294678,
+ "learning_rate": 8.409032780911695e-06,
+ "loss": 0.0692,
+ "step": 20711
+ },
+ {
+ "epoch": 56.43596730245232,
+ "grad_norm": 3.6473333835601807,
+ "learning_rate": 8.408161532805659e-06,
+ "loss": 0.0758,
+ "step": 20712
+ },
+ {
+ "epoch": 56.438692098092645,
+ "grad_norm": 2.9921231269836426,
+ "learning_rate": 8.40729029709681e-06,
+ "loss": 0.0782,
+ "step": 20713
+ },
+ {
+ "epoch": 56.44141689373297,
+ "grad_norm": 3.7293179035186768,
+ "learning_rate": 8.406419073791933e-06,
+ "loss": 0.094,
+ "step": 20714
+ },
+ {
+ "epoch": 56.444141689373296,
+ "grad_norm": 4.795324802398682,
+ "learning_rate": 8.405547862897813e-06,
+ "loss": 0.0817,
+ "step": 20715
+ },
+ {
+ "epoch": 56.44686648501362,
+ "grad_norm": 3.7878880500793457,
+ "learning_rate": 8.404676664421235e-06,
+ "loss": 0.0871,
+ "step": 20716
+ },
+ {
+ "epoch": 56.44959128065395,
+ "grad_norm": 4.343838691711426,
+ "learning_rate": 8.403805478368983e-06,
+ "loss": 0.2216,
+ "step": 20717
+ },
+ {
+ "epoch": 56.45231607629428,
+ "grad_norm": 3.9245493412017822,
+ "learning_rate": 8.402934304747843e-06,
+ "loss": 0.0767,
+ "step": 20718
+ },
+ {
+ "epoch": 56.45504087193461,
+ "grad_norm": 3.8246958255767822,
+ "learning_rate": 8.402063143564601e-06,
+ "loss": 0.1074,
+ "step": 20719
+ },
+ {
+ "epoch": 56.45776566757493,
+ "grad_norm": 3.887381076812744,
+ "learning_rate": 8.401191994826036e-06,
+ "loss": 0.1733,
+ "step": 20720
+ },
+ {
+ "epoch": 56.46049046321526,
+ "grad_norm": 4.081824779510498,
+ "learning_rate": 8.40032085853894e-06,
+ "loss": 0.1419,
+ "step": 20721
+ },
+ {
+ "epoch": 56.463215258855584,
+ "grad_norm": 3.5036237239837646,
+ "learning_rate": 8.399449734710092e-06,
+ "loss": 0.0743,
+ "step": 20722
+ },
+ {
+ "epoch": 56.46594005449591,
+ "grad_norm": 5.252984046936035,
+ "learning_rate": 8.398578623346277e-06,
+ "loss": 0.1331,
+ "step": 20723
+ },
+ {
+ "epoch": 56.46866485013624,
+ "grad_norm": 4.580055236816406,
+ "learning_rate": 8.397707524454283e-06,
+ "loss": 0.2314,
+ "step": 20724
+ },
+ {
+ "epoch": 56.47138964577657,
+ "grad_norm": 3.5325496196746826,
+ "learning_rate": 8.396836438040885e-06,
+ "loss": 0.0936,
+ "step": 20725
+ },
+ {
+ "epoch": 56.474114441416894,
+ "grad_norm": 3.3489267826080322,
+ "learning_rate": 8.395965364112877e-06,
+ "loss": 0.2236,
+ "step": 20726
+ },
+ {
+ "epoch": 56.47683923705722,
+ "grad_norm": 4.340264797210693,
+ "learning_rate": 8.395094302677041e-06,
+ "loss": 0.0966,
+ "step": 20727
+ },
+ {
+ "epoch": 56.479564032697546,
+ "grad_norm": 2.4337453842163086,
+ "learning_rate": 8.394223253740157e-06,
+ "loss": 0.0514,
+ "step": 20728
+ },
+ {
+ "epoch": 56.48228882833787,
+ "grad_norm": 4.0651679039001465,
+ "learning_rate": 8.393352217309012e-06,
+ "loss": 0.2055,
+ "step": 20729
+ },
+ {
+ "epoch": 56.485013623978205,
+ "grad_norm": 4.50044584274292,
+ "learning_rate": 8.392481193390388e-06,
+ "loss": 0.2629,
+ "step": 20730
+ },
+ {
+ "epoch": 56.48773841961853,
+ "grad_norm": 5.812916278839111,
+ "learning_rate": 8.391610181991068e-06,
+ "loss": 0.1296,
+ "step": 20731
+ },
+ {
+ "epoch": 56.490463215258856,
+ "grad_norm": 3.895035743713379,
+ "learning_rate": 8.390739183117836e-06,
+ "loss": 0.0793,
+ "step": 20732
+ },
+ {
+ "epoch": 56.49318801089918,
+ "grad_norm": 3.867765426635742,
+ "learning_rate": 8.389868196777478e-06,
+ "loss": 0.1574,
+ "step": 20733
+ },
+ {
+ "epoch": 56.49591280653951,
+ "grad_norm": 3.1692419052124023,
+ "learning_rate": 8.388997222976772e-06,
+ "loss": 0.0734,
+ "step": 20734
+ },
+ {
+ "epoch": 56.49863760217983,
+ "grad_norm": 4.660286903381348,
+ "learning_rate": 8.388126261722504e-06,
+ "loss": 0.2578,
+ "step": 20735
+ },
+ {
+ "epoch": 56.50136239782017,
+ "grad_norm": 3.813767910003662,
+ "learning_rate": 8.387255313021456e-06,
+ "loss": 0.0827,
+ "step": 20736
+ },
+ {
+ "epoch": 56.50408719346049,
+ "grad_norm": 3.25433087348938,
+ "learning_rate": 8.386384376880414e-06,
+ "loss": 0.1,
+ "step": 20737
+ },
+ {
+ "epoch": 56.50681198910082,
+ "grad_norm": 3.4825737476348877,
+ "learning_rate": 8.385513453306157e-06,
+ "loss": 0.0449,
+ "step": 20738
+ },
+ {
+ "epoch": 56.509536784741144,
+ "grad_norm": 4.238973617553711,
+ "learning_rate": 8.38464254230547e-06,
+ "loss": 0.1629,
+ "step": 20739
+ },
+ {
+ "epoch": 56.51226158038147,
+ "grad_norm": 3.243096113204956,
+ "learning_rate": 8.383771643885134e-06,
+ "loss": 0.0877,
+ "step": 20740
+ },
+ {
+ "epoch": 56.514986376021795,
+ "grad_norm": 3.553771495819092,
+ "learning_rate": 8.382900758051934e-06,
+ "loss": 0.2725,
+ "step": 20741
+ },
+ {
+ "epoch": 56.51771117166213,
+ "grad_norm": 5.023160457611084,
+ "learning_rate": 8.382029884812644e-06,
+ "loss": 0.2727,
+ "step": 20742
+ },
+ {
+ "epoch": 56.520435967302454,
+ "grad_norm": 4.514641284942627,
+ "learning_rate": 8.381159024174061e-06,
+ "loss": 0.1745,
+ "step": 20743
+ },
+ {
+ "epoch": 56.52316076294278,
+ "grad_norm": 3.5146920680999756,
+ "learning_rate": 8.380288176142957e-06,
+ "loss": 0.0662,
+ "step": 20744
+ },
+ {
+ "epoch": 56.525885558583106,
+ "grad_norm": 3.1947133541107178,
+ "learning_rate": 8.379417340726118e-06,
+ "loss": 0.1594,
+ "step": 20745
+ },
+ {
+ "epoch": 56.52861035422343,
+ "grad_norm": 4.743031024932861,
+ "learning_rate": 8.378546517930322e-06,
+ "loss": 0.1361,
+ "step": 20746
+ },
+ {
+ "epoch": 56.53133514986376,
+ "grad_norm": 5.257390975952148,
+ "learning_rate": 8.377675707762356e-06,
+ "loss": 0.1024,
+ "step": 20747
+ },
+ {
+ "epoch": 56.53405994550409,
+ "grad_norm": 4.6400604248046875,
+ "learning_rate": 8.376804910228996e-06,
+ "loss": 0.1175,
+ "step": 20748
+ },
+ {
+ "epoch": 56.536784741144416,
+ "grad_norm": 10.755497932434082,
+ "learning_rate": 8.375934125337032e-06,
+ "loss": 0.0668,
+ "step": 20749
+ },
+ {
+ "epoch": 56.53950953678474,
+ "grad_norm": 5.789342403411865,
+ "learning_rate": 8.375063353093237e-06,
+ "loss": 0.1429,
+ "step": 20750
+ },
+ {
+ "epoch": 56.54223433242507,
+ "grad_norm": 5.7196760177612305,
+ "learning_rate": 8.3741925935044e-06,
+ "loss": 0.1703,
+ "step": 20751
+ },
+ {
+ "epoch": 56.54495912806539,
+ "grad_norm": 5.382983684539795,
+ "learning_rate": 8.373321846577295e-06,
+ "loss": 0.1995,
+ "step": 20752
+ },
+ {
+ "epoch": 56.54768392370572,
+ "grad_norm": 3.461686134338379,
+ "learning_rate": 8.37245111231871e-06,
+ "loss": 0.0761,
+ "step": 20753
+ },
+ {
+ "epoch": 56.55040871934605,
+ "grad_norm": 4.363855838775635,
+ "learning_rate": 8.371580390735421e-06,
+ "loss": 0.13,
+ "step": 20754
+ },
+ {
+ "epoch": 56.55313351498638,
+ "grad_norm": 3.5286946296691895,
+ "learning_rate": 8.370709681834213e-06,
+ "loss": 0.0899,
+ "step": 20755
+ },
+ {
+ "epoch": 56.555858310626704,
+ "grad_norm": 4.524600505828857,
+ "learning_rate": 8.369838985621864e-06,
+ "loss": 0.0949,
+ "step": 20756
+ },
+ {
+ "epoch": 56.55858310626703,
+ "grad_norm": 6.84073543548584,
+ "learning_rate": 8.368968302105158e-06,
+ "loss": 0.0614,
+ "step": 20757
+ },
+ {
+ "epoch": 56.561307901907355,
+ "grad_norm": 3.4950039386749268,
+ "learning_rate": 8.368097631290873e-06,
+ "loss": 0.1144,
+ "step": 20758
+ },
+ {
+ "epoch": 56.56403269754768,
+ "grad_norm": 4.201791286468506,
+ "learning_rate": 8.367226973185789e-06,
+ "loss": 0.0992,
+ "step": 20759
+ },
+ {
+ "epoch": 56.566757493188014,
+ "grad_norm": 4.8018798828125,
+ "learning_rate": 8.366356327796693e-06,
+ "loss": 0.2256,
+ "step": 20760
+ },
+ {
+ "epoch": 56.56948228882834,
+ "grad_norm": 3.444166898727417,
+ "learning_rate": 8.36548569513036e-06,
+ "loss": 0.0888,
+ "step": 20761
+ },
+ {
+ "epoch": 56.572207084468666,
+ "grad_norm": 3.421161651611328,
+ "learning_rate": 8.364615075193572e-06,
+ "loss": 0.0611,
+ "step": 20762
+ },
+ {
+ "epoch": 56.57493188010899,
+ "grad_norm": 3.7761220932006836,
+ "learning_rate": 8.363744467993108e-06,
+ "loss": 0.1276,
+ "step": 20763
+ },
+ {
+ "epoch": 56.57765667574932,
+ "grad_norm": 6.344570159912109,
+ "learning_rate": 8.362873873535751e-06,
+ "loss": 0.1218,
+ "step": 20764
+ },
+ {
+ "epoch": 56.58038147138964,
+ "grad_norm": 4.360270977020264,
+ "learning_rate": 8.362003291828279e-06,
+ "loss": 0.141,
+ "step": 20765
+ },
+ {
+ "epoch": 56.583106267029976,
+ "grad_norm": 6.195434093475342,
+ "learning_rate": 8.361132722877471e-06,
+ "loss": 0.2367,
+ "step": 20766
+ },
+ {
+ "epoch": 56.5858310626703,
+ "grad_norm": 4.121311664581299,
+ "learning_rate": 8.360262166690112e-06,
+ "loss": 0.123,
+ "step": 20767
+ },
+ {
+ "epoch": 56.58855585831063,
+ "grad_norm": 4.218409538269043,
+ "learning_rate": 8.359391623272976e-06,
+ "loss": 0.0734,
+ "step": 20768
+ },
+ {
+ "epoch": 56.59128065395095,
+ "grad_norm": 4.011482238769531,
+ "learning_rate": 8.358521092632848e-06,
+ "loss": 0.1374,
+ "step": 20769
+ },
+ {
+ "epoch": 56.59400544959128,
+ "grad_norm": 7.294281005859375,
+ "learning_rate": 8.357650574776501e-06,
+ "loss": 0.1011,
+ "step": 20770
+ },
+ {
+ "epoch": 56.596730245231605,
+ "grad_norm": 3.218067169189453,
+ "learning_rate": 8.356780069710721e-06,
+ "loss": 0.1312,
+ "step": 20771
+ },
+ {
+ "epoch": 56.59945504087194,
+ "grad_norm": 6.19024658203125,
+ "learning_rate": 8.355909577442284e-06,
+ "loss": 0.2366,
+ "step": 20772
+ },
+ {
+ "epoch": 56.60217983651226,
+ "grad_norm": 4.183459281921387,
+ "learning_rate": 8.355039097977972e-06,
+ "loss": 0.2199,
+ "step": 20773
+ },
+ {
+ "epoch": 56.60490463215259,
+ "grad_norm": 5.475216388702393,
+ "learning_rate": 8.35416863132456e-06,
+ "loss": 0.2377,
+ "step": 20774
+ },
+ {
+ "epoch": 56.607629427792915,
+ "grad_norm": 3.531409978866577,
+ "learning_rate": 8.353298177488832e-06,
+ "loss": 0.0806,
+ "step": 20775
+ },
+ {
+ "epoch": 56.61035422343324,
+ "grad_norm": 5.869809627532959,
+ "learning_rate": 8.35242773647756e-06,
+ "loss": 0.0627,
+ "step": 20776
+ },
+ {
+ "epoch": 56.61307901907357,
+ "grad_norm": 6.493967056274414,
+ "learning_rate": 8.35155730829753e-06,
+ "loss": 0.1159,
+ "step": 20777
+ },
+ {
+ "epoch": 56.6158038147139,
+ "grad_norm": 2.9832074642181396,
+ "learning_rate": 8.350686892955522e-06,
+ "loss": 0.1214,
+ "step": 20778
+ },
+ {
+ "epoch": 56.618528610354225,
+ "grad_norm": 3.689751386642456,
+ "learning_rate": 8.349816490458307e-06,
+ "loss": 0.2088,
+ "step": 20779
+ },
+ {
+ "epoch": 56.62125340599455,
+ "grad_norm": 5.616393089294434,
+ "learning_rate": 8.348946100812672e-06,
+ "loss": 0.1126,
+ "step": 20780
+ },
+ {
+ "epoch": 56.62397820163488,
+ "grad_norm": 6.355755805969238,
+ "learning_rate": 8.34807572402539e-06,
+ "loss": 0.1506,
+ "step": 20781
+ },
+ {
+ "epoch": 56.6267029972752,
+ "grad_norm": 4.0162672996521,
+ "learning_rate": 8.347205360103243e-06,
+ "loss": 0.0995,
+ "step": 20782
+ },
+ {
+ "epoch": 56.62942779291553,
+ "grad_norm": 4.354006767272949,
+ "learning_rate": 8.346335009053004e-06,
+ "loss": 0.1814,
+ "step": 20783
+ },
+ {
+ "epoch": 56.63215258855586,
+ "grad_norm": 4.109909534454346,
+ "learning_rate": 8.345464670881458e-06,
+ "loss": 0.1874,
+ "step": 20784
+ },
+ {
+ "epoch": 56.63487738419619,
+ "grad_norm": 3.7556591033935547,
+ "learning_rate": 8.344594345595377e-06,
+ "loss": 0.2412,
+ "step": 20785
+ },
+ {
+ "epoch": 56.63760217983651,
+ "grad_norm": 7.884458065032959,
+ "learning_rate": 8.343724033201544e-06,
+ "loss": 0.1487,
+ "step": 20786
+ },
+ {
+ "epoch": 56.64032697547684,
+ "grad_norm": 3.905724287033081,
+ "learning_rate": 8.342853733706733e-06,
+ "loss": 0.1255,
+ "step": 20787
+ },
+ {
+ "epoch": 56.643051771117165,
+ "grad_norm": 4.148049831390381,
+ "learning_rate": 8.341983447117725e-06,
+ "loss": 0.108,
+ "step": 20788
+ },
+ {
+ "epoch": 56.64577656675749,
+ "grad_norm": 4.072840690612793,
+ "learning_rate": 8.341113173441298e-06,
+ "loss": 0.096,
+ "step": 20789
+ },
+ {
+ "epoch": 56.64850136239782,
+ "grad_norm": 3.712479829788208,
+ "learning_rate": 8.340242912684225e-06,
+ "loss": 0.0745,
+ "step": 20790
+ },
+ {
+ "epoch": 56.65122615803815,
+ "grad_norm": 4.330201625823975,
+ "learning_rate": 8.33937266485329e-06,
+ "loss": 0.1308,
+ "step": 20791
+ },
+ {
+ "epoch": 56.653950953678475,
+ "grad_norm": 4.016898155212402,
+ "learning_rate": 8.338502429955264e-06,
+ "loss": 0.0759,
+ "step": 20792
+ },
+ {
+ "epoch": 56.6566757493188,
+ "grad_norm": 3.2190215587615967,
+ "learning_rate": 8.337632207996932e-06,
+ "loss": 0.1056,
+ "step": 20793
+ },
+ {
+ "epoch": 56.65940054495913,
+ "grad_norm": 4.42525053024292,
+ "learning_rate": 8.336761998985059e-06,
+ "loss": 0.0807,
+ "step": 20794
+ },
+ {
+ "epoch": 56.66212534059945,
+ "grad_norm": 3.3427927494049072,
+ "learning_rate": 8.335891802926435e-06,
+ "loss": 0.0768,
+ "step": 20795
+ },
+ {
+ "epoch": 56.664850136239785,
+ "grad_norm": 2.8755178451538086,
+ "learning_rate": 8.335021619827833e-06,
+ "loss": 0.1892,
+ "step": 20796
+ },
+ {
+ "epoch": 56.66757493188011,
+ "grad_norm": 4.551873683929443,
+ "learning_rate": 8.334151449696027e-06,
+ "loss": 0.1809,
+ "step": 20797
+ },
+ {
+ "epoch": 56.67029972752044,
+ "grad_norm": 3.6021249294281006,
+ "learning_rate": 8.333281292537799e-06,
+ "loss": 0.1102,
+ "step": 20798
+ },
+ {
+ "epoch": 56.67302452316076,
+ "grad_norm": 3.869985342025757,
+ "learning_rate": 8.33241114835992e-06,
+ "loss": 0.155,
+ "step": 20799
+ },
+ {
+ "epoch": 56.67574931880109,
+ "grad_norm": 4.747959613800049,
+ "learning_rate": 8.331541017169172e-06,
+ "loss": 0.0875,
+ "step": 20800
+ },
+ {
+ "epoch": 56.678474114441414,
+ "grad_norm": 3.290243148803711,
+ "learning_rate": 8.330670898972326e-06,
+ "loss": 0.0621,
+ "step": 20801
+ },
+ {
+ "epoch": 56.68119891008175,
+ "grad_norm": 4.514286041259766,
+ "learning_rate": 8.329800793776163e-06,
+ "loss": 0.0868,
+ "step": 20802
+ },
+ {
+ "epoch": 56.68392370572207,
+ "grad_norm": 3.982741117477417,
+ "learning_rate": 8.328930701587456e-06,
+ "loss": 0.0877,
+ "step": 20803
+ },
+ {
+ "epoch": 56.6866485013624,
+ "grad_norm": 5.891603946685791,
+ "learning_rate": 8.328060622412986e-06,
+ "loss": 0.0628,
+ "step": 20804
+ },
+ {
+ "epoch": 56.689373297002724,
+ "grad_norm": 4.320755481719971,
+ "learning_rate": 8.327190556259523e-06,
+ "loss": 0.0843,
+ "step": 20805
+ },
+ {
+ "epoch": 56.69209809264305,
+ "grad_norm": 3.407414674758911,
+ "learning_rate": 8.326320503133847e-06,
+ "loss": 0.0976,
+ "step": 20806
+ },
+ {
+ "epoch": 56.694822888283376,
+ "grad_norm": 3.5583882331848145,
+ "learning_rate": 8.325450463042733e-06,
+ "loss": 0.1037,
+ "step": 20807
+ },
+ {
+ "epoch": 56.69754768392371,
+ "grad_norm": 4.379970073699951,
+ "learning_rate": 8.324580435992959e-06,
+ "loss": 0.0786,
+ "step": 20808
+ },
+ {
+ "epoch": 56.700272479564035,
+ "grad_norm": 5.11167049407959,
+ "learning_rate": 8.323710421991295e-06,
+ "loss": 0.4112,
+ "step": 20809
+ },
+ {
+ "epoch": 56.70299727520436,
+ "grad_norm": 4.02913236618042,
+ "learning_rate": 8.32284042104452e-06,
+ "loss": 0.2831,
+ "step": 20810
+ },
+ {
+ "epoch": 56.705722070844686,
+ "grad_norm": 4.0310845375061035,
+ "learning_rate": 8.321970433159409e-06,
+ "loss": 0.0971,
+ "step": 20811
+ },
+ {
+ "epoch": 56.70844686648501,
+ "grad_norm": 3.525644063949585,
+ "learning_rate": 8.321100458342742e-06,
+ "loss": 0.0836,
+ "step": 20812
+ },
+ {
+ "epoch": 56.71117166212534,
+ "grad_norm": 4.3504958152771,
+ "learning_rate": 8.32023049660129e-06,
+ "loss": 0.1602,
+ "step": 20813
+ },
+ {
+ "epoch": 56.71389645776567,
+ "grad_norm": 3.7884342670440674,
+ "learning_rate": 8.319360547941828e-06,
+ "loss": 0.071,
+ "step": 20814
+ },
+ {
+ "epoch": 56.716621253406,
+ "grad_norm": 14.091556549072266,
+ "learning_rate": 8.318490612371132e-06,
+ "loss": 0.0971,
+ "step": 20815
+ },
+ {
+ "epoch": 56.71934604904632,
+ "grad_norm": 2.9496817588806152,
+ "learning_rate": 8.317620689895979e-06,
+ "loss": 0.0968,
+ "step": 20816
+ },
+ {
+ "epoch": 56.72207084468665,
+ "grad_norm": 3.5632452964782715,
+ "learning_rate": 8.316750780523139e-06,
+ "loss": 0.0613,
+ "step": 20817
+ },
+ {
+ "epoch": 56.724795640326974,
+ "grad_norm": 3.4774179458618164,
+ "learning_rate": 8.315880884259393e-06,
+ "loss": 0.1866,
+ "step": 20818
+ },
+ {
+ "epoch": 56.7275204359673,
+ "grad_norm": 6.17877197265625,
+ "learning_rate": 8.31501100111151e-06,
+ "loss": 0.1622,
+ "step": 20819
+ },
+ {
+ "epoch": 56.73024523160763,
+ "grad_norm": 4.434709548950195,
+ "learning_rate": 8.314141131086268e-06,
+ "loss": 0.2256,
+ "step": 20820
+ },
+ {
+ "epoch": 56.73297002724796,
+ "grad_norm": 5.374114036560059,
+ "learning_rate": 8.31327127419044e-06,
+ "loss": 0.2084,
+ "step": 20821
+ },
+ {
+ "epoch": 56.735694822888284,
+ "grad_norm": 4.9178595542907715,
+ "learning_rate": 8.312401430430802e-06,
+ "loss": 0.2069,
+ "step": 20822
+ },
+ {
+ "epoch": 56.73841961852861,
+ "grad_norm": 3.505828380584717,
+ "learning_rate": 8.311531599814125e-06,
+ "loss": 0.0871,
+ "step": 20823
+ },
+ {
+ "epoch": 56.741144414168936,
+ "grad_norm": 4.222629547119141,
+ "learning_rate": 8.310661782347189e-06,
+ "loss": 0.1207,
+ "step": 20824
+ },
+ {
+ "epoch": 56.74386920980926,
+ "grad_norm": 3.801757574081421,
+ "learning_rate": 8.309791978036762e-06,
+ "loss": 0.067,
+ "step": 20825
+ },
+ {
+ "epoch": 56.746594005449595,
+ "grad_norm": 3.894122838973999,
+ "learning_rate": 8.308922186889623e-06,
+ "loss": 0.2891,
+ "step": 20826
+ },
+ {
+ "epoch": 56.74931880108992,
+ "grad_norm": 3.1469714641571045,
+ "learning_rate": 8.308052408912541e-06,
+ "loss": 0.0763,
+ "step": 20827
+ },
+ {
+ "epoch": 56.752043596730246,
+ "grad_norm": 5.020132541656494,
+ "learning_rate": 8.307182644112291e-06,
+ "loss": 0.0999,
+ "step": 20828
+ },
+ {
+ "epoch": 56.75476839237057,
+ "grad_norm": 3.6829075813293457,
+ "learning_rate": 8.306312892495648e-06,
+ "loss": 0.0729,
+ "step": 20829
+ },
+ {
+ "epoch": 56.7574931880109,
+ "grad_norm": 5.328718185424805,
+ "learning_rate": 8.30544315406939e-06,
+ "loss": 0.0652,
+ "step": 20830
+ },
+ {
+ "epoch": 56.76021798365122,
+ "grad_norm": 3.8909647464752197,
+ "learning_rate": 8.304573428840284e-06,
+ "loss": 0.0955,
+ "step": 20831
+ },
+ {
+ "epoch": 56.762942779291556,
+ "grad_norm": 4.502145290374756,
+ "learning_rate": 8.303703716815108e-06,
+ "loss": 0.096,
+ "step": 20832
+ },
+ {
+ "epoch": 56.76566757493188,
+ "grad_norm": 5.859290599822998,
+ "learning_rate": 8.302834018000628e-06,
+ "loss": 0.2217,
+ "step": 20833
+ },
+ {
+ "epoch": 56.76839237057221,
+ "grad_norm": 7.264393329620361,
+ "learning_rate": 8.301964332403627e-06,
+ "loss": 0.2151,
+ "step": 20834
+ },
+ {
+ "epoch": 56.771117166212534,
+ "grad_norm": 3.542628288269043,
+ "learning_rate": 8.301094660030869e-06,
+ "loss": 0.0687,
+ "step": 20835
+ },
+ {
+ "epoch": 56.77384196185286,
+ "grad_norm": 3.1421024799346924,
+ "learning_rate": 8.300225000889135e-06,
+ "loss": 0.0777,
+ "step": 20836
+ },
+ {
+ "epoch": 56.776566757493185,
+ "grad_norm": 4.3368377685546875,
+ "learning_rate": 8.299355354985192e-06,
+ "loss": 0.0837,
+ "step": 20837
+ },
+ {
+ "epoch": 56.77929155313352,
+ "grad_norm": 4.881613731384277,
+ "learning_rate": 8.298485722325815e-06,
+ "loss": 0.1662,
+ "step": 20838
+ },
+ {
+ "epoch": 56.782016348773844,
+ "grad_norm": 7.901316165924072,
+ "learning_rate": 8.297616102917776e-06,
+ "loss": 0.1904,
+ "step": 20839
+ },
+ {
+ "epoch": 56.78474114441417,
+ "grad_norm": 4.116857528686523,
+ "learning_rate": 8.29674649676785e-06,
+ "loss": 0.1002,
+ "step": 20840
+ },
+ {
+ "epoch": 56.787465940054496,
+ "grad_norm": 3.000873327255249,
+ "learning_rate": 8.295876903882804e-06,
+ "loss": 0.0516,
+ "step": 20841
+ },
+ {
+ "epoch": 56.79019073569482,
+ "grad_norm": 3.8488805294036865,
+ "learning_rate": 8.295007324269417e-06,
+ "loss": 0.0744,
+ "step": 20842
+ },
+ {
+ "epoch": 56.79291553133515,
+ "grad_norm": 4.251661777496338,
+ "learning_rate": 8.294137757934456e-06,
+ "loss": 0.1279,
+ "step": 20843
+ },
+ {
+ "epoch": 56.79564032697548,
+ "grad_norm": 3.890658378601074,
+ "learning_rate": 8.293268204884696e-06,
+ "loss": 0.0802,
+ "step": 20844
+ },
+ {
+ "epoch": 56.798365122615806,
+ "grad_norm": 4.6637163162231445,
+ "learning_rate": 8.292398665126906e-06,
+ "loss": 0.1038,
+ "step": 20845
+ },
+ {
+ "epoch": 56.80108991825613,
+ "grad_norm": 4.350137233734131,
+ "learning_rate": 8.291529138667862e-06,
+ "loss": 0.1758,
+ "step": 20846
+ },
+ {
+ "epoch": 56.80381471389646,
+ "grad_norm": 3.3026187419891357,
+ "learning_rate": 8.290659625514336e-06,
+ "loss": 0.1161,
+ "step": 20847
+ },
+ {
+ "epoch": 56.80653950953678,
+ "grad_norm": 3.4914233684539795,
+ "learning_rate": 8.289790125673095e-06,
+ "loss": 0.1193,
+ "step": 20848
+ },
+ {
+ "epoch": 56.80926430517711,
+ "grad_norm": 4.479560375213623,
+ "learning_rate": 8.288920639150915e-06,
+ "loss": 0.0678,
+ "step": 20849
+ },
+ {
+ "epoch": 56.81198910081744,
+ "grad_norm": 3.654784679412842,
+ "learning_rate": 8.288051165954566e-06,
+ "loss": 0.1295,
+ "step": 20850
+ },
+ {
+ "epoch": 56.81471389645777,
+ "grad_norm": 3.607421875,
+ "learning_rate": 8.28718170609082e-06,
+ "loss": 0.1604,
+ "step": 20851
+ },
+ {
+ "epoch": 56.817438692098094,
+ "grad_norm": 4.677554130554199,
+ "learning_rate": 8.286312259566445e-06,
+ "loss": 0.0532,
+ "step": 20852
+ },
+ {
+ "epoch": 56.82016348773842,
+ "grad_norm": 4.797582149505615,
+ "learning_rate": 8.285442826388217e-06,
+ "loss": 0.1041,
+ "step": 20853
+ },
+ {
+ "epoch": 56.822888283378745,
+ "grad_norm": 4.3747663497924805,
+ "learning_rate": 8.284573406562906e-06,
+ "loss": 0.2096,
+ "step": 20854
+ },
+ {
+ "epoch": 56.82561307901907,
+ "grad_norm": 5.039104461669922,
+ "learning_rate": 8.283704000097281e-06,
+ "loss": 0.0731,
+ "step": 20855
+ },
+ {
+ "epoch": 56.828337874659404,
+ "grad_norm": 6.823355674743652,
+ "learning_rate": 8.282834606998114e-06,
+ "loss": 0.1905,
+ "step": 20856
+ },
+ {
+ "epoch": 56.83106267029973,
+ "grad_norm": 3.110656261444092,
+ "learning_rate": 8.281965227272176e-06,
+ "loss": 0.0642,
+ "step": 20857
+ },
+ {
+ "epoch": 56.833787465940055,
+ "grad_norm": 5.17993688583374,
+ "learning_rate": 8.281095860926238e-06,
+ "loss": 0.1422,
+ "step": 20858
+ },
+ {
+ "epoch": 56.83651226158038,
+ "grad_norm": 3.290844678878784,
+ "learning_rate": 8.280226507967068e-06,
+ "loss": 0.0627,
+ "step": 20859
+ },
+ {
+ "epoch": 56.83923705722071,
+ "grad_norm": 4.022027492523193,
+ "learning_rate": 8.279357168401442e-06,
+ "loss": 0.0629,
+ "step": 20860
+ },
+ {
+ "epoch": 56.84196185286103,
+ "grad_norm": 3.564958095550537,
+ "learning_rate": 8.278487842236125e-06,
+ "loss": 0.1541,
+ "step": 20861
+ },
+ {
+ "epoch": 56.844686648501366,
+ "grad_norm": 5.737844944000244,
+ "learning_rate": 8.277618529477886e-06,
+ "loss": 0.1378,
+ "step": 20862
+ },
+ {
+ "epoch": 56.84741144414169,
+ "grad_norm": 3.8045578002929688,
+ "learning_rate": 8.276749230133503e-06,
+ "loss": 0.0741,
+ "step": 20863
+ },
+ {
+ "epoch": 56.85013623978202,
+ "grad_norm": 3.8062503337860107,
+ "learning_rate": 8.27587994420974e-06,
+ "loss": 0.2534,
+ "step": 20864
+ },
+ {
+ "epoch": 56.85286103542234,
+ "grad_norm": 4.266364574432373,
+ "learning_rate": 8.27501067171337e-06,
+ "loss": 0.0873,
+ "step": 20865
+ },
+ {
+ "epoch": 56.85558583106267,
+ "grad_norm": 3.5831804275512695,
+ "learning_rate": 8.27414141265116e-06,
+ "loss": 0.1219,
+ "step": 20866
+ },
+ {
+ "epoch": 56.858310626702995,
+ "grad_norm": 4.1305131912231445,
+ "learning_rate": 8.273272167029882e-06,
+ "loss": 0.1514,
+ "step": 20867
+ },
+ {
+ "epoch": 56.86103542234333,
+ "grad_norm": 4.11383581161499,
+ "learning_rate": 8.272402934856302e-06,
+ "loss": 0.1572,
+ "step": 20868
+ },
+ {
+ "epoch": 56.86376021798365,
+ "grad_norm": 6.590770721435547,
+ "learning_rate": 8.271533716137196e-06,
+ "loss": 0.1691,
+ "step": 20869
+ },
+ {
+ "epoch": 56.86648501362398,
+ "grad_norm": 3.7014214992523193,
+ "learning_rate": 8.270664510879328e-06,
+ "loss": 0.0933,
+ "step": 20870
+ },
+ {
+ "epoch": 56.869209809264305,
+ "grad_norm": 5.859397888183594,
+ "learning_rate": 8.269795319089471e-06,
+ "loss": 0.0823,
+ "step": 20871
+ },
+ {
+ "epoch": 56.87193460490463,
+ "grad_norm": 5.130993366241455,
+ "learning_rate": 8.26892614077439e-06,
+ "loss": 0.2859,
+ "step": 20872
+ },
+ {
+ "epoch": 56.87465940054496,
+ "grad_norm": 3.934887170791626,
+ "learning_rate": 8.26805697594086e-06,
+ "loss": 0.0851,
+ "step": 20873
+ },
+ {
+ "epoch": 56.87738419618529,
+ "grad_norm": 4.152246475219727,
+ "learning_rate": 8.267187824595641e-06,
+ "loss": 0.1747,
+ "step": 20874
+ },
+ {
+ "epoch": 56.880108991825615,
+ "grad_norm": 3.5175857543945312,
+ "learning_rate": 8.26631868674551e-06,
+ "loss": 0.0463,
+ "step": 20875
+ },
+ {
+ "epoch": 56.88283378746594,
+ "grad_norm": 3.765432357788086,
+ "learning_rate": 8.265449562397235e-06,
+ "loss": 0.0878,
+ "step": 20876
+ },
+ {
+ "epoch": 56.88555858310627,
+ "grad_norm": 4.602232933044434,
+ "learning_rate": 8.26458045155758e-06,
+ "loss": 0.0716,
+ "step": 20877
+ },
+ {
+ "epoch": 56.88828337874659,
+ "grad_norm": 4.033105373382568,
+ "learning_rate": 8.26371135423332e-06,
+ "loss": 0.1735,
+ "step": 20878
+ },
+ {
+ "epoch": 56.89100817438692,
+ "grad_norm": 3.979550838470459,
+ "learning_rate": 8.262842270431218e-06,
+ "loss": 0.0935,
+ "step": 20879
+ },
+ {
+ "epoch": 56.89373297002725,
+ "grad_norm": 4.2078938484191895,
+ "learning_rate": 8.26197320015804e-06,
+ "loss": 0.0885,
+ "step": 20880
+ },
+ {
+ "epoch": 56.89645776566758,
+ "grad_norm": 4.143012046813965,
+ "learning_rate": 8.261104143420566e-06,
+ "loss": 0.1719,
+ "step": 20881
+ },
+ {
+ "epoch": 56.8991825613079,
+ "grad_norm": 3.549680471420288,
+ "learning_rate": 8.260235100225553e-06,
+ "loss": 0.1014,
+ "step": 20882
+ },
+ {
+ "epoch": 56.90190735694823,
+ "grad_norm": 4.424400806427002,
+ "learning_rate": 8.259366070579775e-06,
+ "loss": 0.2626,
+ "step": 20883
+ },
+ {
+ "epoch": 56.904632152588555,
+ "grad_norm": 3.190826892852783,
+ "learning_rate": 8.258497054489998e-06,
+ "loss": 0.0614,
+ "step": 20884
+ },
+ {
+ "epoch": 56.90735694822888,
+ "grad_norm": 4.439691066741943,
+ "learning_rate": 8.25762805196299e-06,
+ "loss": 0.0798,
+ "step": 20885
+ },
+ {
+ "epoch": 56.91008174386921,
+ "grad_norm": 4.760251522064209,
+ "learning_rate": 8.256759063005517e-06,
+ "loss": 0.1198,
+ "step": 20886
+ },
+ {
+ "epoch": 56.91280653950954,
+ "grad_norm": 3.8580844402313232,
+ "learning_rate": 8.255890087624352e-06,
+ "loss": 0.0949,
+ "step": 20887
+ },
+ {
+ "epoch": 56.915531335149865,
+ "grad_norm": 3.825615882873535,
+ "learning_rate": 8.255021125826255e-06,
+ "loss": 0.0951,
+ "step": 20888
+ },
+ {
+ "epoch": 56.91825613079019,
+ "grad_norm": 4.554897308349609,
+ "learning_rate": 8.254152177618e-06,
+ "loss": 0.0915,
+ "step": 20889
+ },
+ {
+ "epoch": 56.920980926430516,
+ "grad_norm": 3.0845141410827637,
+ "learning_rate": 8.253283243006349e-06,
+ "loss": 0.1355,
+ "step": 20890
+ },
+ {
+ "epoch": 56.92370572207084,
+ "grad_norm": 4.7472662925720215,
+ "learning_rate": 8.252414321998075e-06,
+ "loss": 0.0902,
+ "step": 20891
+ },
+ {
+ "epoch": 56.926430517711175,
+ "grad_norm": 3.4225594997406006,
+ "learning_rate": 8.25154541459994e-06,
+ "loss": 0.0618,
+ "step": 20892
+ },
+ {
+ "epoch": 56.9291553133515,
+ "grad_norm": 4.021973609924316,
+ "learning_rate": 8.250676520818712e-06,
+ "loss": 0.1459,
+ "step": 20893
+ },
+ {
+ "epoch": 56.93188010899183,
+ "grad_norm": 4.833191394805908,
+ "learning_rate": 8.24980764066116e-06,
+ "loss": 0.2345,
+ "step": 20894
+ },
+ {
+ "epoch": 56.93460490463215,
+ "grad_norm": 4.990149974822998,
+ "learning_rate": 8.248938774134052e-06,
+ "loss": 0.123,
+ "step": 20895
+ },
+ {
+ "epoch": 56.93732970027248,
+ "grad_norm": 4.602786540985107,
+ "learning_rate": 8.248069921244148e-06,
+ "loss": 0.136,
+ "step": 20896
+ },
+ {
+ "epoch": 56.940054495912804,
+ "grad_norm": 3.887037515640259,
+ "learning_rate": 8.247201081998218e-06,
+ "loss": 0.1327,
+ "step": 20897
+ },
+ {
+ "epoch": 56.94277929155314,
+ "grad_norm": 3.8991174697875977,
+ "learning_rate": 8.246332256403033e-06,
+ "loss": 0.148,
+ "step": 20898
+ },
+ {
+ "epoch": 56.94550408719346,
+ "grad_norm": 5.6237993240356445,
+ "learning_rate": 8.245463444465357e-06,
+ "loss": 0.176,
+ "step": 20899
+ },
+ {
+ "epoch": 56.94822888283379,
+ "grad_norm": 3.590494394302368,
+ "learning_rate": 8.244594646191953e-06,
+ "loss": 0.1345,
+ "step": 20900
+ },
+ {
+ "epoch": 56.950953678474114,
+ "grad_norm": 3.9823145866394043,
+ "learning_rate": 8.243725861589592e-06,
+ "loss": 0.1468,
+ "step": 20901
+ },
+ {
+ "epoch": 56.95367847411444,
+ "grad_norm": 4.785423755645752,
+ "learning_rate": 8.242857090665036e-06,
+ "loss": 0.0687,
+ "step": 20902
+ },
+ {
+ "epoch": 56.956403269754766,
+ "grad_norm": 4.729231834411621,
+ "learning_rate": 8.241988333425052e-06,
+ "loss": 0.1528,
+ "step": 20903
+ },
+ {
+ "epoch": 56.95912806539509,
+ "grad_norm": 3.7704522609710693,
+ "learning_rate": 8.241119589876406e-06,
+ "loss": 0.1939,
+ "step": 20904
+ },
+ {
+ "epoch": 56.961852861035425,
+ "grad_norm": 4.724066734313965,
+ "learning_rate": 8.240250860025866e-06,
+ "loss": 0.0784,
+ "step": 20905
+ },
+ {
+ "epoch": 56.96457765667575,
+ "grad_norm": 3.4864683151245117,
+ "learning_rate": 8.239382143880195e-06,
+ "loss": 0.0798,
+ "step": 20906
+ },
+ {
+ "epoch": 56.967302452316076,
+ "grad_norm": 4.217945575714111,
+ "learning_rate": 8.238513441446158e-06,
+ "loss": 0.2088,
+ "step": 20907
+ },
+ {
+ "epoch": 56.9700272479564,
+ "grad_norm": 3.3189778327941895,
+ "learning_rate": 8.237644752730522e-06,
+ "loss": 0.0701,
+ "step": 20908
+ },
+ {
+ "epoch": 56.97275204359673,
+ "grad_norm": 3.262610912322998,
+ "learning_rate": 8.236776077740054e-06,
+ "loss": 0.0706,
+ "step": 20909
+ },
+ {
+ "epoch": 56.97547683923706,
+ "grad_norm": 5.687419414520264,
+ "learning_rate": 8.235907416481514e-06,
+ "loss": 0.1054,
+ "step": 20910
+ },
+ {
+ "epoch": 56.97820163487739,
+ "grad_norm": 3.3241074085235596,
+ "learning_rate": 8.235038768961672e-06,
+ "loss": 0.2147,
+ "step": 20911
+ },
+ {
+ "epoch": 56.98092643051771,
+ "grad_norm": 4.45330810546875,
+ "learning_rate": 8.23417013518729e-06,
+ "loss": 0.0628,
+ "step": 20912
+ },
+ {
+ "epoch": 56.98365122615804,
+ "grad_norm": 4.936892509460449,
+ "learning_rate": 8.233301515165138e-06,
+ "loss": 0.1097,
+ "step": 20913
+ },
+ {
+ "epoch": 56.986376021798364,
+ "grad_norm": 3.4377126693725586,
+ "learning_rate": 8.23243290890197e-06,
+ "loss": 0.0554,
+ "step": 20914
+ },
+ {
+ "epoch": 56.98910081743869,
+ "grad_norm": 4.021442413330078,
+ "learning_rate": 8.23156431640456e-06,
+ "loss": 0.1718,
+ "step": 20915
+ },
+ {
+ "epoch": 56.991825613079016,
+ "grad_norm": 5.111627101898193,
+ "learning_rate": 8.230695737679671e-06,
+ "loss": 0.0534,
+ "step": 20916
+ },
+ {
+ "epoch": 56.99455040871935,
+ "grad_norm": 4.411771297454834,
+ "learning_rate": 8.229827172734068e-06,
+ "loss": 0.303,
+ "step": 20917
+ },
+ {
+ "epoch": 56.997275204359674,
+ "grad_norm": 4.301294803619385,
+ "learning_rate": 8.228958621574514e-06,
+ "loss": 0.2108,
+ "step": 20918
+ },
+ {
+ "epoch": 57.0,
+ "grad_norm": 3.4039785861968994,
+ "learning_rate": 8.228090084207773e-06,
+ "loss": 0.0957,
+ "step": 20919
+ },
+ {
+ "epoch": 57.002724795640326,
+ "grad_norm": 4.393790245056152,
+ "learning_rate": 8.227221560640609e-06,
+ "loss": 0.1562,
+ "step": 20920
+ },
+ {
+ "epoch": 57.00544959128065,
+ "grad_norm": 3.451871395111084,
+ "learning_rate": 8.226353050879788e-06,
+ "loss": 0.0594,
+ "step": 20921
+ },
+ {
+ "epoch": 57.00817438692098,
+ "grad_norm": 3.661106586456299,
+ "learning_rate": 8.225484554932069e-06,
+ "loss": 0.0763,
+ "step": 20922
+ },
+ {
+ "epoch": 57.01089918256131,
+ "grad_norm": 5.8789167404174805,
+ "learning_rate": 8.224616072804223e-06,
+ "loss": 0.1362,
+ "step": 20923
+ },
+ {
+ "epoch": 57.013623978201636,
+ "grad_norm": 3.4945576190948486,
+ "learning_rate": 8.223747604503005e-06,
+ "loss": 0.0889,
+ "step": 20924
+ },
+ {
+ "epoch": 57.01634877384196,
+ "grad_norm": 4.172882080078125,
+ "learning_rate": 8.22287915003519e-06,
+ "loss": 0.1805,
+ "step": 20925
+ },
+ {
+ "epoch": 57.01907356948229,
+ "grad_norm": 3.1446330547332764,
+ "learning_rate": 8.22201070940753e-06,
+ "loss": 0.194,
+ "step": 20926
+ },
+ {
+ "epoch": 57.02179836512261,
+ "grad_norm": 4.150295257568359,
+ "learning_rate": 8.221142282626795e-06,
+ "loss": 0.1064,
+ "step": 20927
+ },
+ {
+ "epoch": 57.02452316076294,
+ "grad_norm": 5.671179294586182,
+ "learning_rate": 8.220273869699746e-06,
+ "loss": 0.0806,
+ "step": 20928
+ },
+ {
+ "epoch": 57.02724795640327,
+ "grad_norm": 4.209830284118652,
+ "learning_rate": 8.219405470633149e-06,
+ "loss": 0.1902,
+ "step": 20929
+ },
+ {
+ "epoch": 57.0299727520436,
+ "grad_norm": 5.202353477478027,
+ "learning_rate": 8.218537085433761e-06,
+ "loss": 0.1203,
+ "step": 20930
+ },
+ {
+ "epoch": 57.032697547683924,
+ "grad_norm": 2.7137610912323,
+ "learning_rate": 8.217668714108348e-06,
+ "loss": 0.0501,
+ "step": 20931
+ },
+ {
+ "epoch": 57.03542234332425,
+ "grad_norm": 3.73943829536438,
+ "learning_rate": 8.216800356663679e-06,
+ "loss": 0.1214,
+ "step": 20932
+ },
+ {
+ "epoch": 57.038147138964575,
+ "grad_norm": 4.07224702835083,
+ "learning_rate": 8.215932013106508e-06,
+ "loss": 0.1636,
+ "step": 20933
+ },
+ {
+ "epoch": 57.0408719346049,
+ "grad_norm": 3.760071277618408,
+ "learning_rate": 8.215063683443603e-06,
+ "loss": 0.1316,
+ "step": 20934
+ },
+ {
+ "epoch": 57.043596730245234,
+ "grad_norm": 3.020530939102173,
+ "learning_rate": 8.214195367681723e-06,
+ "loss": 0.0668,
+ "step": 20935
+ },
+ {
+ "epoch": 57.04632152588556,
+ "grad_norm": 6.602606773376465,
+ "learning_rate": 8.213327065827635e-06,
+ "loss": 0.092,
+ "step": 20936
+ },
+ {
+ "epoch": 57.049046321525886,
+ "grad_norm": 3.1322200298309326,
+ "learning_rate": 8.212458777888094e-06,
+ "loss": 0.0659,
+ "step": 20937
+ },
+ {
+ "epoch": 57.05177111716621,
+ "grad_norm": 3.437601327896118,
+ "learning_rate": 8.21159050386987e-06,
+ "loss": 0.0693,
+ "step": 20938
+ },
+ {
+ "epoch": 57.05449591280654,
+ "grad_norm": 3.798060178756714,
+ "learning_rate": 8.210722243779719e-06,
+ "loss": 0.1284,
+ "step": 20939
+ },
+ {
+ "epoch": 57.05722070844686,
+ "grad_norm": 4.102583885192871,
+ "learning_rate": 8.209853997624406e-06,
+ "loss": 0.0916,
+ "step": 20940
+ },
+ {
+ "epoch": 57.059945504087196,
+ "grad_norm": 5.362946510314941,
+ "learning_rate": 8.208985765410694e-06,
+ "loss": 0.1258,
+ "step": 20941
+ },
+ {
+ "epoch": 57.06267029972752,
+ "grad_norm": 3.262148380279541,
+ "learning_rate": 8.20811754714534e-06,
+ "loss": 0.067,
+ "step": 20942
+ },
+ {
+ "epoch": 57.06539509536785,
+ "grad_norm": 4.280355930328369,
+ "learning_rate": 8.207249342835114e-06,
+ "loss": 0.0927,
+ "step": 20943
+ },
+ {
+ "epoch": 57.06811989100817,
+ "grad_norm": 4.460330963134766,
+ "learning_rate": 8.206381152486769e-06,
+ "loss": 0.0997,
+ "step": 20944
+ },
+ {
+ "epoch": 57.0708446866485,
+ "grad_norm": 3.6226274967193604,
+ "learning_rate": 8.205512976107071e-06,
+ "loss": 0.0791,
+ "step": 20945
+ },
+ {
+ "epoch": 57.073569482288825,
+ "grad_norm": 2.9987363815307617,
+ "learning_rate": 8.204644813702778e-06,
+ "loss": 0.062,
+ "step": 20946
+ },
+ {
+ "epoch": 57.07629427792916,
+ "grad_norm": 3.7295479774475098,
+ "learning_rate": 8.203776665280656e-06,
+ "loss": 0.1054,
+ "step": 20947
+ },
+ {
+ "epoch": 57.079019073569484,
+ "grad_norm": 4.244683265686035,
+ "learning_rate": 8.202908530847463e-06,
+ "loss": 0.115,
+ "step": 20948
+ },
+ {
+ "epoch": 57.08174386920981,
+ "grad_norm": 4.423742771148682,
+ "learning_rate": 8.202040410409957e-06,
+ "loss": 0.244,
+ "step": 20949
+ },
+ {
+ "epoch": 57.084468664850135,
+ "grad_norm": 4.738261699676514,
+ "learning_rate": 8.201172303974907e-06,
+ "loss": 0.1805,
+ "step": 20950
+ },
+ {
+ "epoch": 57.08719346049046,
+ "grad_norm": 4.013214588165283,
+ "learning_rate": 8.200304211549066e-06,
+ "loss": 0.1277,
+ "step": 20951
+ },
+ {
+ "epoch": 57.08991825613079,
+ "grad_norm": 4.8289899826049805,
+ "learning_rate": 8.199436133139202e-06,
+ "loss": 0.1858,
+ "step": 20952
+ },
+ {
+ "epoch": 57.09264305177112,
+ "grad_norm": 3.8840034008026123,
+ "learning_rate": 8.198568068752069e-06,
+ "loss": 0.2074,
+ "step": 20953
+ },
+ {
+ "epoch": 57.095367847411445,
+ "grad_norm": 3.429579257965088,
+ "learning_rate": 8.19770001839443e-06,
+ "loss": 0.1578,
+ "step": 20954
+ },
+ {
+ "epoch": 57.09809264305177,
+ "grad_norm": 5.330948829650879,
+ "learning_rate": 8.196831982073044e-06,
+ "loss": 0.1479,
+ "step": 20955
+ },
+ {
+ "epoch": 57.1008174386921,
+ "grad_norm": 3.138073444366455,
+ "learning_rate": 8.195963959794675e-06,
+ "loss": 0.0659,
+ "step": 20956
+ },
+ {
+ "epoch": 57.10354223433242,
+ "grad_norm": 4.590211868286133,
+ "learning_rate": 8.19509595156608e-06,
+ "loss": 0.0611,
+ "step": 20957
+ },
+ {
+ "epoch": 57.10626702997275,
+ "grad_norm": 4.668395519256592,
+ "learning_rate": 8.19422795739402e-06,
+ "loss": 0.1441,
+ "step": 20958
+ },
+ {
+ "epoch": 57.10899182561308,
+ "grad_norm": 3.013331890106201,
+ "learning_rate": 8.193359977285252e-06,
+ "loss": 0.0626,
+ "step": 20959
+ },
+ {
+ "epoch": 57.11171662125341,
+ "grad_norm": 3.3874785900115967,
+ "learning_rate": 8.19249201124654e-06,
+ "loss": 0.1339,
+ "step": 20960
+ },
+ {
+ "epoch": 57.11444141689373,
+ "grad_norm": 4.477400779724121,
+ "learning_rate": 8.191624059284643e-06,
+ "loss": 0.2508,
+ "step": 20961
+ },
+ {
+ "epoch": 57.11716621253406,
+ "grad_norm": 3.449695348739624,
+ "learning_rate": 8.190756121406317e-06,
+ "loss": 0.0629,
+ "step": 20962
+ },
+ {
+ "epoch": 57.119891008174385,
+ "grad_norm": 3.6937551498413086,
+ "learning_rate": 8.189888197618326e-06,
+ "loss": 0.1012,
+ "step": 20963
+ },
+ {
+ "epoch": 57.12261580381471,
+ "grad_norm": 4.387967586517334,
+ "learning_rate": 8.189020287927428e-06,
+ "loss": 0.0852,
+ "step": 20964
+ },
+ {
+ "epoch": 57.12534059945504,
+ "grad_norm": 3.6131112575531006,
+ "learning_rate": 8.18815239234038e-06,
+ "loss": 0.0723,
+ "step": 20965
+ },
+ {
+ "epoch": 57.12806539509537,
+ "grad_norm": 3.1580309867858887,
+ "learning_rate": 8.187284510863943e-06,
+ "loss": 0.132,
+ "step": 20966
+ },
+ {
+ "epoch": 57.130790190735695,
+ "grad_norm": 3.4441542625427246,
+ "learning_rate": 8.186416643504874e-06,
+ "loss": 0.1683,
+ "step": 20967
+ },
+ {
+ "epoch": 57.13351498637602,
+ "grad_norm": 3.049184799194336,
+ "learning_rate": 8.185548790269937e-06,
+ "loss": 0.0765,
+ "step": 20968
+ },
+ {
+ "epoch": 57.13623978201635,
+ "grad_norm": 3.3789780139923096,
+ "learning_rate": 8.184680951165887e-06,
+ "loss": 0.0705,
+ "step": 20969
+ },
+ {
+ "epoch": 57.13896457765667,
+ "grad_norm": 3.8413381576538086,
+ "learning_rate": 8.183813126199485e-06,
+ "loss": 0.0927,
+ "step": 20970
+ },
+ {
+ "epoch": 57.141689373297005,
+ "grad_norm": 3.9096827507019043,
+ "learning_rate": 8.182945315377484e-06,
+ "loss": 0.1362,
+ "step": 20971
+ },
+ {
+ "epoch": 57.14441416893733,
+ "grad_norm": 4.063755989074707,
+ "learning_rate": 8.18207751870665e-06,
+ "loss": 0.1608,
+ "step": 20972
+ },
+ {
+ "epoch": 57.14713896457766,
+ "grad_norm": 3.655320405960083,
+ "learning_rate": 8.181209736193736e-06,
+ "loss": 0.0954,
+ "step": 20973
+ },
+ {
+ "epoch": 57.14986376021798,
+ "grad_norm": 3.309751272201538,
+ "learning_rate": 8.180341967845505e-06,
+ "loss": 0.1083,
+ "step": 20974
+ },
+ {
+ "epoch": 57.15258855585831,
+ "grad_norm": 5.1634979248046875,
+ "learning_rate": 8.179474213668709e-06,
+ "loss": 0.1171,
+ "step": 20975
+ },
+ {
+ "epoch": 57.155313351498634,
+ "grad_norm": 3.713399887084961,
+ "learning_rate": 8.17860647367011e-06,
+ "loss": 0.1329,
+ "step": 20976
+ },
+ {
+ "epoch": 57.15803814713897,
+ "grad_norm": 3.0816543102264404,
+ "learning_rate": 8.177738747856464e-06,
+ "loss": 0.069,
+ "step": 20977
+ },
+ {
+ "epoch": 57.16076294277929,
+ "grad_norm": 3.5811123847961426,
+ "learning_rate": 8.176871036234533e-06,
+ "loss": 0.0922,
+ "step": 20978
+ },
+ {
+ "epoch": 57.16348773841962,
+ "grad_norm": 3.7834033966064453,
+ "learning_rate": 8.176003338811069e-06,
+ "loss": 0.1462,
+ "step": 20979
+ },
+ {
+ "epoch": 57.166212534059945,
+ "grad_norm": 3.9214141368865967,
+ "learning_rate": 8.175135655592833e-06,
+ "loss": 0.1544,
+ "step": 20980
+ },
+ {
+ "epoch": 57.16893732970027,
+ "grad_norm": 3.1623823642730713,
+ "learning_rate": 8.17426798658658e-06,
+ "loss": 0.0527,
+ "step": 20981
+ },
+ {
+ "epoch": 57.171662125340596,
+ "grad_norm": 14.0775146484375,
+ "learning_rate": 8.173400331799072e-06,
+ "loss": 0.1046,
+ "step": 20982
+ },
+ {
+ "epoch": 57.17438692098093,
+ "grad_norm": 4.159304618835449,
+ "learning_rate": 8.172532691237058e-06,
+ "loss": 0.1219,
+ "step": 20983
+ },
+ {
+ "epoch": 57.177111716621255,
+ "grad_norm": 4.568202018737793,
+ "learning_rate": 8.171665064907306e-06,
+ "loss": 0.1168,
+ "step": 20984
+ },
+ {
+ "epoch": 57.17983651226158,
+ "grad_norm": 2.868018865585327,
+ "learning_rate": 8.170797452816566e-06,
+ "loss": 0.0655,
+ "step": 20985
+ },
+ {
+ "epoch": 57.182561307901906,
+ "grad_norm": 3.5403952598571777,
+ "learning_rate": 8.169929854971598e-06,
+ "loss": 0.1954,
+ "step": 20986
+ },
+ {
+ "epoch": 57.18528610354223,
+ "grad_norm": 7.548911094665527,
+ "learning_rate": 8.169062271379155e-06,
+ "loss": 0.201,
+ "step": 20987
+ },
+ {
+ "epoch": 57.18801089918256,
+ "grad_norm": 3.3708622455596924,
+ "learning_rate": 8.168194702046e-06,
+ "loss": 0.0669,
+ "step": 20988
+ },
+ {
+ "epoch": 57.19073569482289,
+ "grad_norm": 3.5939998626708984,
+ "learning_rate": 8.167327146978883e-06,
+ "loss": 0.0934,
+ "step": 20989
+ },
+ {
+ "epoch": 57.19346049046322,
+ "grad_norm": 3.2615737915039062,
+ "learning_rate": 8.166459606184565e-06,
+ "loss": 0.0636,
+ "step": 20990
+ },
+ {
+ "epoch": 57.19618528610354,
+ "grad_norm": 4.119452476501465,
+ "learning_rate": 8.165592079669798e-06,
+ "loss": 0.1014,
+ "step": 20991
+ },
+ {
+ "epoch": 57.19891008174387,
+ "grad_norm": 2.944352388381958,
+ "learning_rate": 8.164724567441343e-06,
+ "loss": 0.1998,
+ "step": 20992
+ },
+ {
+ "epoch": 57.201634877384194,
+ "grad_norm": 3.481367826461792,
+ "learning_rate": 8.163857069505952e-06,
+ "loss": 0.1698,
+ "step": 20993
+ },
+ {
+ "epoch": 57.20435967302452,
+ "grad_norm": 3.1614503860473633,
+ "learning_rate": 8.162989585870385e-06,
+ "loss": 0.1418,
+ "step": 20994
+ },
+ {
+ "epoch": 57.20708446866485,
+ "grad_norm": 4.005900859832764,
+ "learning_rate": 8.162122116541394e-06,
+ "loss": 0.1592,
+ "step": 20995
+ },
+ {
+ "epoch": 57.20980926430518,
+ "grad_norm": 3.480644702911377,
+ "learning_rate": 8.161254661525739e-06,
+ "loss": 0.095,
+ "step": 20996
+ },
+ {
+ "epoch": 57.212534059945504,
+ "grad_norm": 3.2617340087890625,
+ "learning_rate": 8.160387220830172e-06,
+ "loss": 0.1094,
+ "step": 20997
+ },
+ {
+ "epoch": 57.21525885558583,
+ "grad_norm": 4.810868740081787,
+ "learning_rate": 8.159519794461452e-06,
+ "loss": 0.109,
+ "step": 20998
+ },
+ {
+ "epoch": 57.217983651226156,
+ "grad_norm": 2.804990291595459,
+ "learning_rate": 8.158652382426328e-06,
+ "loss": 0.1342,
+ "step": 20999
+ },
+ {
+ "epoch": 57.22070844686648,
+ "grad_norm": 17.00299644470215,
+ "learning_rate": 8.157784984731561e-06,
+ "loss": 0.1707,
+ "step": 21000
+ },
+ {
+ "epoch": 57.223433242506815,
+ "grad_norm": 4.369019031524658,
+ "learning_rate": 8.156917601383909e-06,
+ "loss": 0.1973,
+ "step": 21001
+ },
+ {
+ "epoch": 57.22615803814714,
+ "grad_norm": 3.4167332649230957,
+ "learning_rate": 8.156050232390121e-06,
+ "loss": 0.1066,
+ "step": 21002
+ },
+ {
+ "epoch": 57.228882833787466,
+ "grad_norm": 6.498249053955078,
+ "learning_rate": 8.155182877756953e-06,
+ "loss": 0.2003,
+ "step": 21003
+ },
+ {
+ "epoch": 57.23160762942779,
+ "grad_norm": 25.307979583740234,
+ "learning_rate": 8.154315537491166e-06,
+ "loss": 0.136,
+ "step": 21004
+ },
+ {
+ "epoch": 57.23433242506812,
+ "grad_norm": 3.269639492034912,
+ "learning_rate": 8.153448211599506e-06,
+ "loss": 0.1138,
+ "step": 21005
+ },
+ {
+ "epoch": 57.237057220708444,
+ "grad_norm": 3.17785906791687,
+ "learning_rate": 8.152580900088735e-06,
+ "loss": 0.0825,
+ "step": 21006
+ },
+ {
+ "epoch": 57.23978201634878,
+ "grad_norm": 3.8047120571136475,
+ "learning_rate": 8.151713602965602e-06,
+ "loss": 0.1321,
+ "step": 21007
+ },
+ {
+ "epoch": 57.2425068119891,
+ "grad_norm": 2.9458749294281006,
+ "learning_rate": 8.150846320236866e-06,
+ "loss": 0.1597,
+ "step": 21008
+ },
+ {
+ "epoch": 57.24523160762943,
+ "grad_norm": 4.262577533721924,
+ "learning_rate": 8.149979051909278e-06,
+ "loss": 0.0785,
+ "step": 21009
+ },
+ {
+ "epoch": 57.247956403269754,
+ "grad_norm": 4.848487854003906,
+ "learning_rate": 8.149111797989595e-06,
+ "loss": 0.1172,
+ "step": 21010
+ },
+ {
+ "epoch": 57.25068119891008,
+ "grad_norm": 6.822971820831299,
+ "learning_rate": 8.148244558484568e-06,
+ "loss": 0.1364,
+ "step": 21011
+ },
+ {
+ "epoch": 57.253405994550405,
+ "grad_norm": 4.221641540527344,
+ "learning_rate": 8.147377333400955e-06,
+ "loss": 0.0943,
+ "step": 21012
+ },
+ {
+ "epoch": 57.25613079019074,
+ "grad_norm": 3.7261950969696045,
+ "learning_rate": 8.146510122745504e-06,
+ "loss": 0.1605,
+ "step": 21013
+ },
+ {
+ "epoch": 57.258855585831064,
+ "grad_norm": 4.5704345703125,
+ "learning_rate": 8.145642926524977e-06,
+ "loss": 0.0632,
+ "step": 21014
+ },
+ {
+ "epoch": 57.26158038147139,
+ "grad_norm": 4.229184150695801,
+ "learning_rate": 8.14477574474612e-06,
+ "loss": 0.0648,
+ "step": 21015
+ },
+ {
+ "epoch": 57.264305177111716,
+ "grad_norm": 3.4966213703155518,
+ "learning_rate": 8.143908577415691e-06,
+ "loss": 0.0934,
+ "step": 21016
+ },
+ {
+ "epoch": 57.26702997275204,
+ "grad_norm": 4.787452220916748,
+ "learning_rate": 8.14304142454044e-06,
+ "loss": 0.1329,
+ "step": 21017
+ },
+ {
+ "epoch": 57.26975476839237,
+ "grad_norm": 5.035547733306885,
+ "learning_rate": 8.142174286127123e-06,
+ "loss": 0.0921,
+ "step": 21018
+ },
+ {
+ "epoch": 57.2724795640327,
+ "grad_norm": 3.683725118637085,
+ "learning_rate": 8.141307162182496e-06,
+ "loss": 0.0705,
+ "step": 21019
+ },
+ {
+ "epoch": 57.275204359673026,
+ "grad_norm": 4.442389488220215,
+ "learning_rate": 8.140440052713307e-06,
+ "loss": 0.241,
+ "step": 21020
+ },
+ {
+ "epoch": 57.27792915531335,
+ "grad_norm": 3.7261180877685547,
+ "learning_rate": 8.139572957726312e-06,
+ "loss": 0.0714,
+ "step": 21021
+ },
+ {
+ "epoch": 57.28065395095368,
+ "grad_norm": 3.876488447189331,
+ "learning_rate": 8.138705877228262e-06,
+ "loss": 0.2101,
+ "step": 21022
+ },
+ {
+ "epoch": 57.283378746594,
+ "grad_norm": 5.133909702301025,
+ "learning_rate": 8.137838811225913e-06,
+ "loss": 0.116,
+ "step": 21023
+ },
+ {
+ "epoch": 57.28610354223433,
+ "grad_norm": 4.60747766494751,
+ "learning_rate": 8.136971759726011e-06,
+ "loss": 0.1487,
+ "step": 21024
+ },
+ {
+ "epoch": 57.28882833787466,
+ "grad_norm": 4.002742767333984,
+ "learning_rate": 8.136104722735317e-06,
+ "loss": 0.0709,
+ "step": 21025
+ },
+ {
+ "epoch": 57.29155313351499,
+ "grad_norm": 3.7660610675811768,
+ "learning_rate": 8.135237700260578e-06,
+ "loss": 0.0797,
+ "step": 21026
+ },
+ {
+ "epoch": 57.294277929155314,
+ "grad_norm": 4.8447465896606445,
+ "learning_rate": 8.134370692308547e-06,
+ "loss": 0.1175,
+ "step": 21027
+ },
+ {
+ "epoch": 57.29700272479564,
+ "grad_norm": 4.493288993835449,
+ "learning_rate": 8.133503698885978e-06,
+ "loss": 0.2296,
+ "step": 21028
+ },
+ {
+ "epoch": 57.299727520435965,
+ "grad_norm": 30.658430099487305,
+ "learning_rate": 8.132636719999622e-06,
+ "loss": 0.0807,
+ "step": 21029
+ },
+ {
+ "epoch": 57.30245231607629,
+ "grad_norm": 3.621741771697998,
+ "learning_rate": 8.131769755656231e-06,
+ "loss": 0.0795,
+ "step": 21030
+ },
+ {
+ "epoch": 57.305177111716624,
+ "grad_norm": 3.7663137912750244,
+ "learning_rate": 8.130902805862556e-06,
+ "loss": 0.1682,
+ "step": 21031
+ },
+ {
+ "epoch": 57.30790190735695,
+ "grad_norm": 6.516160488128662,
+ "learning_rate": 8.130035870625352e-06,
+ "loss": 0.0639,
+ "step": 21032
+ },
+ {
+ "epoch": 57.310626702997276,
+ "grad_norm": 3.108703136444092,
+ "learning_rate": 8.129168949951368e-06,
+ "loss": 0.1736,
+ "step": 21033
+ },
+ {
+ "epoch": 57.3133514986376,
+ "grad_norm": 2.8198657035827637,
+ "learning_rate": 8.128302043847355e-06,
+ "loss": 0.0448,
+ "step": 21034
+ },
+ {
+ "epoch": 57.31607629427793,
+ "grad_norm": 2.566166639328003,
+ "learning_rate": 8.127435152320061e-06,
+ "loss": 0.0431,
+ "step": 21035
+ },
+ {
+ "epoch": 57.31880108991825,
+ "grad_norm": 6.921756267547607,
+ "learning_rate": 8.126568275376247e-06,
+ "loss": 0.1104,
+ "step": 21036
+ },
+ {
+ "epoch": 57.321525885558586,
+ "grad_norm": 4.090224266052246,
+ "learning_rate": 8.125701413022659e-06,
+ "loss": 0.2506,
+ "step": 21037
+ },
+ {
+ "epoch": 57.32425068119891,
+ "grad_norm": 3.300335645675659,
+ "learning_rate": 8.124834565266048e-06,
+ "loss": 0.0638,
+ "step": 21038
+ },
+ {
+ "epoch": 57.32697547683924,
+ "grad_norm": 4.812459945678711,
+ "learning_rate": 8.123967732113165e-06,
+ "loss": 0.1904,
+ "step": 21039
+ },
+ {
+ "epoch": 57.32970027247956,
+ "grad_norm": 3.0873422622680664,
+ "learning_rate": 8.12310091357076e-06,
+ "loss": 0.0469,
+ "step": 21040
+ },
+ {
+ "epoch": 57.33242506811989,
+ "grad_norm": 3.7849323749542236,
+ "learning_rate": 8.122234109645586e-06,
+ "loss": 0.1019,
+ "step": 21041
+ },
+ {
+ "epoch": 57.335149863760215,
+ "grad_norm": 3.6425018310546875,
+ "learning_rate": 8.12136732034439e-06,
+ "loss": 0.1474,
+ "step": 21042
+ },
+ {
+ "epoch": 57.33787465940055,
+ "grad_norm": 4.636575698852539,
+ "learning_rate": 8.120500545673928e-06,
+ "loss": 0.0658,
+ "step": 21043
+ },
+ {
+ "epoch": 57.34059945504087,
+ "grad_norm": 3.2334156036376953,
+ "learning_rate": 8.119633785640944e-06,
+ "loss": 0.1799,
+ "step": 21044
+ },
+ {
+ "epoch": 57.3433242506812,
+ "grad_norm": 4.16218376159668,
+ "learning_rate": 8.118767040252196e-06,
+ "loss": 0.0955,
+ "step": 21045
+ },
+ {
+ "epoch": 57.346049046321525,
+ "grad_norm": 3.0309019088745117,
+ "learning_rate": 8.117900309514425e-06,
+ "loss": 0.0419,
+ "step": 21046
+ },
+ {
+ "epoch": 57.34877384196185,
+ "grad_norm": 3.9720096588134766,
+ "learning_rate": 8.117033593434389e-06,
+ "loss": 0.1225,
+ "step": 21047
+ },
+ {
+ "epoch": 57.35149863760218,
+ "grad_norm": 3.7392325401306152,
+ "learning_rate": 8.116166892018834e-06,
+ "loss": 0.0861,
+ "step": 21048
+ },
+ {
+ "epoch": 57.35422343324251,
+ "grad_norm": 4.26577615737915,
+ "learning_rate": 8.115300205274508e-06,
+ "loss": 0.1512,
+ "step": 21049
+ },
+ {
+ "epoch": 57.356948228882835,
+ "grad_norm": 3.7570958137512207,
+ "learning_rate": 8.114433533208165e-06,
+ "loss": 0.13,
+ "step": 21050
+ },
+ {
+ "epoch": 57.35967302452316,
+ "grad_norm": 4.121349811553955,
+ "learning_rate": 8.113566875826553e-06,
+ "loss": 0.2045,
+ "step": 21051
+ },
+ {
+ "epoch": 57.36239782016349,
+ "grad_norm": 5.072442531585693,
+ "learning_rate": 8.11270023313642e-06,
+ "loss": 0.0885,
+ "step": 21052
+ },
+ {
+ "epoch": 57.36512261580381,
+ "grad_norm": 3.1366050243377686,
+ "learning_rate": 8.11183360514452e-06,
+ "loss": 0.0985,
+ "step": 21053
+ },
+ {
+ "epoch": 57.36784741144414,
+ "grad_norm": 4.402289390563965,
+ "learning_rate": 8.110966991857596e-06,
+ "loss": 0.1637,
+ "step": 21054
+ },
+ {
+ "epoch": 57.37057220708447,
+ "grad_norm": 3.750377893447876,
+ "learning_rate": 8.110100393282402e-06,
+ "loss": 0.0972,
+ "step": 21055
+ },
+ {
+ "epoch": 57.3732970027248,
+ "grad_norm": 6.2638773918151855,
+ "learning_rate": 8.109233809425686e-06,
+ "loss": 0.127,
+ "step": 21056
+ },
+ {
+ "epoch": 57.37602179836512,
+ "grad_norm": 4.752940654754639,
+ "learning_rate": 8.108367240294197e-06,
+ "loss": 0.2132,
+ "step": 21057
+ },
+ {
+ "epoch": 57.37874659400545,
+ "grad_norm": 3.561741590499878,
+ "learning_rate": 8.10750068589468e-06,
+ "loss": 0.0837,
+ "step": 21058
+ },
+ {
+ "epoch": 57.381471389645775,
+ "grad_norm": 5.152788162231445,
+ "learning_rate": 8.10663414623389e-06,
+ "loss": 0.1005,
+ "step": 21059
+ },
+ {
+ "epoch": 57.3841961852861,
+ "grad_norm": 4.3131489753723145,
+ "learning_rate": 8.10576762131857e-06,
+ "loss": 0.2148,
+ "step": 21060
+ },
+ {
+ "epoch": 57.38692098092643,
+ "grad_norm": 3.1346771717071533,
+ "learning_rate": 8.104901111155472e-06,
+ "loss": 0.081,
+ "step": 21061
+ },
+ {
+ "epoch": 57.38964577656676,
+ "grad_norm": 3.919673442840576,
+ "learning_rate": 8.104034615751343e-06,
+ "loss": 0.1024,
+ "step": 21062
+ },
+ {
+ "epoch": 57.392370572207085,
+ "grad_norm": 3.703479051589966,
+ "learning_rate": 8.103168135112932e-06,
+ "loss": 0.1538,
+ "step": 21063
+ },
+ {
+ "epoch": 57.39509536784741,
+ "grad_norm": 4.304934024810791,
+ "learning_rate": 8.102301669246984e-06,
+ "loss": 0.2611,
+ "step": 21064
+ },
+ {
+ "epoch": 57.39782016348774,
+ "grad_norm": 5.615895748138428,
+ "learning_rate": 8.101435218160253e-06,
+ "loss": 0.0922,
+ "step": 21065
+ },
+ {
+ "epoch": 57.40054495912806,
+ "grad_norm": 5.641123294830322,
+ "learning_rate": 8.10056878185948e-06,
+ "loss": 0.1476,
+ "step": 21066
+ },
+ {
+ "epoch": 57.403269754768395,
+ "grad_norm": 4.991501808166504,
+ "learning_rate": 8.09970236035142e-06,
+ "loss": 0.0636,
+ "step": 21067
+ },
+ {
+ "epoch": 57.40599455040872,
+ "grad_norm": 7.819751262664795,
+ "learning_rate": 8.098835953642813e-06,
+ "loss": 0.18,
+ "step": 21068
+ },
+ {
+ "epoch": 57.40871934604905,
+ "grad_norm": 3.9003374576568604,
+ "learning_rate": 8.097969561740409e-06,
+ "loss": 0.0832,
+ "step": 21069
+ },
+ {
+ "epoch": 57.41144414168937,
+ "grad_norm": 3.9136853218078613,
+ "learning_rate": 8.097103184650959e-06,
+ "loss": 0.0986,
+ "step": 21070
+ },
+ {
+ "epoch": 57.4141689373297,
+ "grad_norm": 4.419578552246094,
+ "learning_rate": 8.09623682238121e-06,
+ "loss": 0.0991,
+ "step": 21071
+ },
+ {
+ "epoch": 57.416893732970024,
+ "grad_norm": 4.347434997558594,
+ "learning_rate": 8.095370474937904e-06,
+ "loss": 0.0892,
+ "step": 21072
+ },
+ {
+ "epoch": 57.41961852861036,
+ "grad_norm": 7.327247619628906,
+ "learning_rate": 8.094504142327796e-06,
+ "loss": 0.1526,
+ "step": 21073
+ },
+ {
+ "epoch": 57.42234332425068,
+ "grad_norm": 4.945771217346191,
+ "learning_rate": 8.093637824557625e-06,
+ "loss": 0.1173,
+ "step": 21074
+ },
+ {
+ "epoch": 57.42506811989101,
+ "grad_norm": 4.112789154052734,
+ "learning_rate": 8.092771521634143e-06,
+ "loss": 0.093,
+ "step": 21075
+ },
+ {
+ "epoch": 57.427792915531334,
+ "grad_norm": 2.9911928176879883,
+ "learning_rate": 8.091905233564095e-06,
+ "loss": 0.0547,
+ "step": 21076
+ },
+ {
+ "epoch": 57.43051771117166,
+ "grad_norm": 11.361251831054688,
+ "learning_rate": 8.091038960354227e-06,
+ "loss": 0.0711,
+ "step": 21077
+ },
+ {
+ "epoch": 57.433242506811986,
+ "grad_norm": 2.9650349617004395,
+ "learning_rate": 8.090172702011287e-06,
+ "loss": 0.1761,
+ "step": 21078
+ },
+ {
+ "epoch": 57.43596730245232,
+ "grad_norm": 5.548549175262451,
+ "learning_rate": 8.08930645854202e-06,
+ "loss": 0.1474,
+ "step": 21079
+ },
+ {
+ "epoch": 57.438692098092645,
+ "grad_norm": 6.829399585723877,
+ "learning_rate": 8.088440229953172e-06,
+ "loss": 0.1011,
+ "step": 21080
+ },
+ {
+ "epoch": 57.44141689373297,
+ "grad_norm": 3.559237480163574,
+ "learning_rate": 8.087574016251492e-06,
+ "loss": 0.0824,
+ "step": 21081
+ },
+ {
+ "epoch": 57.444141689373296,
+ "grad_norm": 5.038529872894287,
+ "learning_rate": 8.086707817443722e-06,
+ "loss": 0.0856,
+ "step": 21082
+ },
+ {
+ "epoch": 57.44686648501362,
+ "grad_norm": 6.732036113739014,
+ "learning_rate": 8.085841633536611e-06,
+ "loss": 0.0751,
+ "step": 21083
+ },
+ {
+ "epoch": 57.44959128065395,
+ "grad_norm": 4.63095760345459,
+ "learning_rate": 8.084975464536902e-06,
+ "loss": 0.1056,
+ "step": 21084
+ },
+ {
+ "epoch": 57.45231607629428,
+ "grad_norm": 3.8541738986968994,
+ "learning_rate": 8.084109310451345e-06,
+ "loss": 0.1154,
+ "step": 21085
+ },
+ {
+ "epoch": 57.45504087193461,
+ "grad_norm": 4.783348560333252,
+ "learning_rate": 8.083243171286679e-06,
+ "loss": 0.387,
+ "step": 21086
+ },
+ {
+ "epoch": 57.45776566757493,
+ "grad_norm": 4.016456127166748,
+ "learning_rate": 8.082377047049654e-06,
+ "loss": 0.1227,
+ "step": 21087
+ },
+ {
+ "epoch": 57.46049046321526,
+ "grad_norm": 3.026258707046509,
+ "learning_rate": 8.08151093774702e-06,
+ "loss": 0.0905,
+ "step": 21088
+ },
+ {
+ "epoch": 57.463215258855584,
+ "grad_norm": 4.230606555938721,
+ "learning_rate": 8.080644843385512e-06,
+ "loss": 0.1961,
+ "step": 21089
+ },
+ {
+ "epoch": 57.46594005449591,
+ "grad_norm": 3.694626569747925,
+ "learning_rate": 8.079778763971882e-06,
+ "loss": 0.1383,
+ "step": 21090
+ },
+ {
+ "epoch": 57.46866485013624,
+ "grad_norm": 3.6818764209747314,
+ "learning_rate": 8.078912699512874e-06,
+ "loss": 0.1239,
+ "step": 21091
+ },
+ {
+ "epoch": 57.47138964577657,
+ "grad_norm": 3.8059468269348145,
+ "learning_rate": 8.07804665001523e-06,
+ "loss": 0.1128,
+ "step": 21092
+ },
+ {
+ "epoch": 57.474114441416894,
+ "grad_norm": 4.613978385925293,
+ "learning_rate": 8.0771806154857e-06,
+ "loss": 0.2063,
+ "step": 21093
+ },
+ {
+ "epoch": 57.47683923705722,
+ "grad_norm": 2.964661121368408,
+ "learning_rate": 8.076314595931024e-06,
+ "loss": 0.0482,
+ "step": 21094
+ },
+ {
+ "epoch": 57.479564032697546,
+ "grad_norm": 4.8119049072265625,
+ "learning_rate": 8.075448591357948e-06,
+ "loss": 0.0736,
+ "step": 21095
+ },
+ {
+ "epoch": 57.48228882833787,
+ "grad_norm": 4.246369361877441,
+ "learning_rate": 8.074582601773215e-06,
+ "loss": 0.0999,
+ "step": 21096
+ },
+ {
+ "epoch": 57.485013623978205,
+ "grad_norm": 3.5195250511169434,
+ "learning_rate": 8.073716627183575e-06,
+ "loss": 0.0621,
+ "step": 21097
+ },
+ {
+ "epoch": 57.48773841961853,
+ "grad_norm": 5.680939674377441,
+ "learning_rate": 8.072850667595763e-06,
+ "loss": 0.095,
+ "step": 21098
+ },
+ {
+ "epoch": 57.490463215258856,
+ "grad_norm": 3.6644961833953857,
+ "learning_rate": 8.071984723016532e-06,
+ "loss": 0.063,
+ "step": 21099
+ },
+ {
+ "epoch": 57.49318801089918,
+ "grad_norm": 3.7200732231140137,
+ "learning_rate": 8.071118793452618e-06,
+ "loss": 0.1048,
+ "step": 21100
+ },
+ {
+ "epoch": 57.49591280653951,
+ "grad_norm": 3.758270025253296,
+ "learning_rate": 8.070252878910771e-06,
+ "loss": 0.0762,
+ "step": 21101
+ },
+ {
+ "epoch": 57.49863760217983,
+ "grad_norm": 2.9253904819488525,
+ "learning_rate": 8.069386979397732e-06,
+ "loss": 0.1048,
+ "step": 21102
+ },
+ {
+ "epoch": 57.50136239782017,
+ "grad_norm": 4.1088714599609375,
+ "learning_rate": 8.068521094920242e-06,
+ "loss": 0.0957,
+ "step": 21103
+ },
+ {
+ "epoch": 57.50408719346049,
+ "grad_norm": 5.188478469848633,
+ "learning_rate": 8.067655225485052e-06,
+ "loss": 0.1402,
+ "step": 21104
+ },
+ {
+ "epoch": 57.50681198910082,
+ "grad_norm": 8.501290321350098,
+ "learning_rate": 8.066789371098899e-06,
+ "loss": 0.1355,
+ "step": 21105
+ },
+ {
+ "epoch": 57.509536784741144,
+ "grad_norm": 3.4538586139678955,
+ "learning_rate": 8.065923531768529e-06,
+ "loss": 0.0738,
+ "step": 21106
+ },
+ {
+ "epoch": 57.51226158038147,
+ "grad_norm": 3.281200647354126,
+ "learning_rate": 8.065057707500684e-06,
+ "loss": 0.1021,
+ "step": 21107
+ },
+ {
+ "epoch": 57.514986376021795,
+ "grad_norm": 4.295124530792236,
+ "learning_rate": 8.064191898302109e-06,
+ "loss": 0.2357,
+ "step": 21108
+ },
+ {
+ "epoch": 57.51771117166213,
+ "grad_norm": 4.262333869934082,
+ "learning_rate": 8.063326104179542e-06,
+ "loss": 0.0805,
+ "step": 21109
+ },
+ {
+ "epoch": 57.520435967302454,
+ "grad_norm": 4.151923179626465,
+ "learning_rate": 8.062460325139731e-06,
+ "loss": 0.0682,
+ "step": 21110
+ },
+ {
+ "epoch": 57.52316076294278,
+ "grad_norm": 3.6162490844726562,
+ "learning_rate": 8.061594561189417e-06,
+ "loss": 0.118,
+ "step": 21111
+ },
+ {
+ "epoch": 57.525885558583106,
+ "grad_norm": 4.753512859344482,
+ "learning_rate": 8.06072881233534e-06,
+ "loss": 0.1768,
+ "step": 21112
+ },
+ {
+ "epoch": 57.52861035422343,
+ "grad_norm": 7.29217529296875,
+ "learning_rate": 8.059863078584245e-06,
+ "loss": 0.1235,
+ "step": 21113
+ },
+ {
+ "epoch": 57.53133514986376,
+ "grad_norm": 3.687530040740967,
+ "learning_rate": 8.058997359942875e-06,
+ "loss": 0.1103,
+ "step": 21114
+ },
+ {
+ "epoch": 57.53405994550409,
+ "grad_norm": 3.6048548221588135,
+ "learning_rate": 8.058131656417972e-06,
+ "loss": 0.0726,
+ "step": 21115
+ },
+ {
+ "epoch": 57.536784741144416,
+ "grad_norm": 3.727325916290283,
+ "learning_rate": 8.057265968016275e-06,
+ "loss": 0.0839,
+ "step": 21116
+ },
+ {
+ "epoch": 57.53950953678474,
+ "grad_norm": 4.673880100250244,
+ "learning_rate": 8.056400294744531e-06,
+ "loss": 0.0867,
+ "step": 21117
+ },
+ {
+ "epoch": 57.54223433242507,
+ "grad_norm": 2.8797502517700195,
+ "learning_rate": 8.055534636609476e-06,
+ "loss": 0.0489,
+ "step": 21118
+ },
+ {
+ "epoch": 57.54495912806539,
+ "grad_norm": 4.70318603515625,
+ "learning_rate": 8.054668993617857e-06,
+ "loss": 0.1014,
+ "step": 21119
+ },
+ {
+ "epoch": 57.54768392370572,
+ "grad_norm": 4.084402084350586,
+ "learning_rate": 8.053803365776412e-06,
+ "loss": 0.1301,
+ "step": 21120
+ },
+ {
+ "epoch": 57.55040871934605,
+ "grad_norm": 3.4945762157440186,
+ "learning_rate": 8.052937753091879e-06,
+ "loss": 0.2309,
+ "step": 21121
+ },
+ {
+ "epoch": 57.55313351498638,
+ "grad_norm": 3.5946857929229736,
+ "learning_rate": 8.05207215557101e-06,
+ "loss": 0.1019,
+ "step": 21122
+ },
+ {
+ "epoch": 57.555858310626704,
+ "grad_norm": 4.264369010925293,
+ "learning_rate": 8.05120657322054e-06,
+ "loss": 0.2453,
+ "step": 21123
+ },
+ {
+ "epoch": 57.55858310626703,
+ "grad_norm": 5.001492500305176,
+ "learning_rate": 8.050341006047209e-06,
+ "loss": 0.2087,
+ "step": 21124
+ },
+ {
+ "epoch": 57.561307901907355,
+ "grad_norm": 4.087818622589111,
+ "learning_rate": 8.04947545405776e-06,
+ "loss": 0.097,
+ "step": 21125
+ },
+ {
+ "epoch": 57.56403269754768,
+ "grad_norm": 6.340839385986328,
+ "learning_rate": 8.048609917258935e-06,
+ "loss": 0.1306,
+ "step": 21126
+ },
+ {
+ "epoch": 57.566757493188014,
+ "grad_norm": 4.888052463531494,
+ "learning_rate": 8.047744395657471e-06,
+ "loss": 0.0972,
+ "step": 21127
+ },
+ {
+ "epoch": 57.56948228882834,
+ "grad_norm": 3.893559217453003,
+ "learning_rate": 8.046878889260112e-06,
+ "loss": 0.0995,
+ "step": 21128
+ },
+ {
+ "epoch": 57.572207084468666,
+ "grad_norm": 4.35330867767334,
+ "learning_rate": 8.046013398073597e-06,
+ "loss": 0.2851,
+ "step": 21129
+ },
+ {
+ "epoch": 57.57493188010899,
+ "grad_norm": 3.9809250831604004,
+ "learning_rate": 8.045147922104668e-06,
+ "loss": 0.0911,
+ "step": 21130
+ },
+ {
+ "epoch": 57.57765667574932,
+ "grad_norm": 3.5093841552734375,
+ "learning_rate": 8.044282461360062e-06,
+ "loss": 0.5028,
+ "step": 21131
+ },
+ {
+ "epoch": 57.58038147138964,
+ "grad_norm": 5.057225704193115,
+ "learning_rate": 8.043417015846523e-06,
+ "loss": 0.1298,
+ "step": 21132
+ },
+ {
+ "epoch": 57.583106267029976,
+ "grad_norm": 3.862987995147705,
+ "learning_rate": 8.042551585570787e-06,
+ "loss": 0.0906,
+ "step": 21133
+ },
+ {
+ "epoch": 57.5858310626703,
+ "grad_norm": 7.200356960296631,
+ "learning_rate": 8.041686170539599e-06,
+ "loss": 0.0996,
+ "step": 21134
+ },
+ {
+ "epoch": 57.58855585831063,
+ "grad_norm": 6.5382890701293945,
+ "learning_rate": 8.040820770759694e-06,
+ "loss": 0.1129,
+ "step": 21135
+ },
+ {
+ "epoch": 57.59128065395095,
+ "grad_norm": 6.598848342895508,
+ "learning_rate": 8.039955386237813e-06,
+ "loss": 0.0697,
+ "step": 21136
+ },
+ {
+ "epoch": 57.59400544959128,
+ "grad_norm": 5.061677932739258,
+ "learning_rate": 8.0390900169807e-06,
+ "loss": 0.1203,
+ "step": 21137
+ },
+ {
+ "epoch": 57.596730245231605,
+ "grad_norm": 6.442782878875732,
+ "learning_rate": 8.038224662995084e-06,
+ "loss": 0.1633,
+ "step": 21138
+ },
+ {
+ "epoch": 57.59945504087194,
+ "grad_norm": 5.684314250946045,
+ "learning_rate": 8.037359324287716e-06,
+ "loss": 0.1409,
+ "step": 21139
+ },
+ {
+ "epoch": 57.60217983651226,
+ "grad_norm": 4.345500946044922,
+ "learning_rate": 8.036494000865331e-06,
+ "loss": 0.1985,
+ "step": 21140
+ },
+ {
+ "epoch": 57.60490463215259,
+ "grad_norm": 3.5980756282806396,
+ "learning_rate": 8.035628692734666e-06,
+ "loss": 0.0802,
+ "step": 21141
+ },
+ {
+ "epoch": 57.607629427792915,
+ "grad_norm": 3.9551618099212646,
+ "learning_rate": 8.034763399902462e-06,
+ "loss": 0.2361,
+ "step": 21142
+ },
+ {
+ "epoch": 57.61035422343324,
+ "grad_norm": 4.956972122192383,
+ "learning_rate": 8.033898122375458e-06,
+ "loss": 0.0805,
+ "step": 21143
+ },
+ {
+ "epoch": 57.61307901907357,
+ "grad_norm": 2.717604160308838,
+ "learning_rate": 8.033032860160394e-06,
+ "loss": 0.0599,
+ "step": 21144
+ },
+ {
+ "epoch": 57.6158038147139,
+ "grad_norm": 3.742825984954834,
+ "learning_rate": 8.032167613264002e-06,
+ "loss": 0.0542,
+ "step": 21145
+ },
+ {
+ "epoch": 57.618528610354225,
+ "grad_norm": 5.366011142730713,
+ "learning_rate": 8.03130238169303e-06,
+ "loss": 0.1661,
+ "step": 21146
+ },
+ {
+ "epoch": 57.62125340599455,
+ "grad_norm": 4.602841854095459,
+ "learning_rate": 8.030437165454208e-06,
+ "loss": 0.1687,
+ "step": 21147
+ },
+ {
+ "epoch": 57.62397820163488,
+ "grad_norm": 4.1078362464904785,
+ "learning_rate": 8.029571964554282e-06,
+ "loss": 0.1252,
+ "step": 21148
+ },
+ {
+ "epoch": 57.6267029972752,
+ "grad_norm": 3.8847732543945312,
+ "learning_rate": 8.028706778999982e-06,
+ "loss": 0.0739,
+ "step": 21149
+ },
+ {
+ "epoch": 57.62942779291553,
+ "grad_norm": 4.712838649749756,
+ "learning_rate": 8.027841608798053e-06,
+ "loss": 0.1337,
+ "step": 21150
+ },
+ {
+ "epoch": 57.63215258855586,
+ "grad_norm": 4.490561008453369,
+ "learning_rate": 8.026976453955228e-06,
+ "loss": 0.07,
+ "step": 21151
+ },
+ {
+ "epoch": 57.63487738419619,
+ "grad_norm": 3.750500440597534,
+ "learning_rate": 8.026111314478249e-06,
+ "loss": 0.0686,
+ "step": 21152
+ },
+ {
+ "epoch": 57.63760217983651,
+ "grad_norm": 3.8146345615386963,
+ "learning_rate": 8.02524619037385e-06,
+ "loss": 0.0689,
+ "step": 21153
+ },
+ {
+ "epoch": 57.64032697547684,
+ "grad_norm": 6.2692718505859375,
+ "learning_rate": 8.02438108164877e-06,
+ "loss": 0.0755,
+ "step": 21154
+ },
+ {
+ "epoch": 57.643051771117165,
+ "grad_norm": 3.5104455947875977,
+ "learning_rate": 8.023515988309742e-06,
+ "loss": 0.0951,
+ "step": 21155
+ },
+ {
+ "epoch": 57.64577656675749,
+ "grad_norm": 5.580707550048828,
+ "learning_rate": 8.022650910363516e-06,
+ "loss": 0.1287,
+ "step": 21156
+ },
+ {
+ "epoch": 57.64850136239782,
+ "grad_norm": 3.445660352706909,
+ "learning_rate": 8.021785847816816e-06,
+ "loss": 0.1773,
+ "step": 21157
+ },
+ {
+ "epoch": 57.65122615803815,
+ "grad_norm": 4.380588054656982,
+ "learning_rate": 8.020920800676387e-06,
+ "loss": 0.1294,
+ "step": 21158
+ },
+ {
+ "epoch": 57.653950953678475,
+ "grad_norm": 7.622682094573975,
+ "learning_rate": 8.020055768948963e-06,
+ "loss": 0.257,
+ "step": 21159
+ },
+ {
+ "epoch": 57.6566757493188,
+ "grad_norm": 4.133795261383057,
+ "learning_rate": 8.01919075264128e-06,
+ "loss": 0.1186,
+ "step": 21160
+ },
+ {
+ "epoch": 57.65940054495913,
+ "grad_norm": 10.034468650817871,
+ "learning_rate": 8.018325751760075e-06,
+ "loss": 0.2248,
+ "step": 21161
+ },
+ {
+ "epoch": 57.66212534059945,
+ "grad_norm": 4.84804630279541,
+ "learning_rate": 8.017460766312088e-06,
+ "loss": 0.2466,
+ "step": 21162
+ },
+ {
+ "epoch": 57.664850136239785,
+ "grad_norm": 3.387465000152588,
+ "learning_rate": 8.01659579630405e-06,
+ "loss": 0.0704,
+ "step": 21163
+ },
+ {
+ "epoch": 57.66757493188011,
+ "grad_norm": 4.253676891326904,
+ "learning_rate": 8.015730841742702e-06,
+ "loss": 0.1156,
+ "step": 21164
+ },
+ {
+ "epoch": 57.67029972752044,
+ "grad_norm": 5.0305657386779785,
+ "learning_rate": 8.014865902634774e-06,
+ "loss": 0.1137,
+ "step": 21165
+ },
+ {
+ "epoch": 57.67302452316076,
+ "grad_norm": 3.5951809883117676,
+ "learning_rate": 8.014000978987013e-06,
+ "loss": 0.2383,
+ "step": 21166
+ },
+ {
+ "epoch": 57.67574931880109,
+ "grad_norm": 4.939373016357422,
+ "learning_rate": 8.013136070806143e-06,
+ "loss": 0.1463,
+ "step": 21167
+ },
+ {
+ "epoch": 57.678474114441414,
+ "grad_norm": 3.7658889293670654,
+ "learning_rate": 8.01227117809891e-06,
+ "loss": 0.0886,
+ "step": 21168
+ },
+ {
+ "epoch": 57.68119891008175,
+ "grad_norm": 6.335522174835205,
+ "learning_rate": 8.011406300872041e-06,
+ "loss": 0.2037,
+ "step": 21169
+ },
+ {
+ "epoch": 57.68392370572207,
+ "grad_norm": 4.378781318664551,
+ "learning_rate": 8.01054143913228e-06,
+ "loss": 0.1036,
+ "step": 21170
+ },
+ {
+ "epoch": 57.6866485013624,
+ "grad_norm": 3.1508800983428955,
+ "learning_rate": 8.009676592886353e-06,
+ "loss": 0.133,
+ "step": 21171
+ },
+ {
+ "epoch": 57.689373297002724,
+ "grad_norm": 3.9530043601989746,
+ "learning_rate": 8.008811762141e-06,
+ "loss": 0.0892,
+ "step": 21172
+ },
+ {
+ "epoch": 57.69209809264305,
+ "grad_norm": 5.408289432525635,
+ "learning_rate": 8.00794694690296e-06,
+ "loss": 0.1036,
+ "step": 21173
+ },
+ {
+ "epoch": 57.694822888283376,
+ "grad_norm": 4.0240278244018555,
+ "learning_rate": 8.007082147178967e-06,
+ "loss": 0.0761,
+ "step": 21174
+ },
+ {
+ "epoch": 57.69754768392371,
+ "grad_norm": 4.17277717590332,
+ "learning_rate": 8.006217362975752e-06,
+ "loss": 0.0883,
+ "step": 21175
+ },
+ {
+ "epoch": 57.700272479564035,
+ "grad_norm": 3.8516342639923096,
+ "learning_rate": 8.005352594300052e-06,
+ "loss": 0.1287,
+ "step": 21176
+ },
+ {
+ "epoch": 57.70299727520436,
+ "grad_norm": 3.2691752910614014,
+ "learning_rate": 8.004487841158601e-06,
+ "loss": 0.279,
+ "step": 21177
+ },
+ {
+ "epoch": 57.705722070844686,
+ "grad_norm": 4.902161121368408,
+ "learning_rate": 8.003623103558137e-06,
+ "loss": 0.1033,
+ "step": 21178
+ },
+ {
+ "epoch": 57.70844686648501,
+ "grad_norm": 4.927868843078613,
+ "learning_rate": 8.002758381505389e-06,
+ "loss": 0.1865,
+ "step": 21179
+ },
+ {
+ "epoch": 57.71117166212534,
+ "grad_norm": 3.784280300140381,
+ "learning_rate": 8.001893675007098e-06,
+ "loss": 0.0666,
+ "step": 21180
+ },
+ {
+ "epoch": 57.71389645776567,
+ "grad_norm": 5.653964996337891,
+ "learning_rate": 8.001028984069991e-06,
+ "loss": 0.0703,
+ "step": 21181
+ },
+ {
+ "epoch": 57.716621253406,
+ "grad_norm": 3.5887389183044434,
+ "learning_rate": 8.00016430870081e-06,
+ "loss": 0.0579,
+ "step": 21182
+ },
+ {
+ "epoch": 57.71934604904632,
+ "grad_norm": 3.9548680782318115,
+ "learning_rate": 7.999299648906281e-06,
+ "loss": 0.1167,
+ "step": 21183
+ },
+ {
+ "epoch": 57.72207084468665,
+ "grad_norm": 5.61143684387207,
+ "learning_rate": 7.998435004693144e-06,
+ "loss": 0.0734,
+ "step": 21184
+ },
+ {
+ "epoch": 57.724795640326974,
+ "grad_norm": 7.683944225311279,
+ "learning_rate": 7.99757037606813e-06,
+ "loss": 0.2285,
+ "step": 21185
+ },
+ {
+ "epoch": 57.7275204359673,
+ "grad_norm": 3.710585355758667,
+ "learning_rate": 7.996705763037975e-06,
+ "loss": 0.0516,
+ "step": 21186
+ },
+ {
+ "epoch": 57.73024523160763,
+ "grad_norm": 3.7653274536132812,
+ "learning_rate": 7.99584116560941e-06,
+ "loss": 0.0953,
+ "step": 21187
+ },
+ {
+ "epoch": 57.73297002724796,
+ "grad_norm": 3.338184118270874,
+ "learning_rate": 7.99497658378917e-06,
+ "loss": 0.1255,
+ "step": 21188
+ },
+ {
+ "epoch": 57.735694822888284,
+ "grad_norm": 3.2238829135894775,
+ "learning_rate": 7.994112017583984e-06,
+ "loss": 0.057,
+ "step": 21189
+ },
+ {
+ "epoch": 57.73841961852861,
+ "grad_norm": 3.815045118331909,
+ "learning_rate": 7.99324746700059e-06,
+ "loss": 0.216,
+ "step": 21190
+ },
+ {
+ "epoch": 57.741144414168936,
+ "grad_norm": 5.742342472076416,
+ "learning_rate": 7.992382932045726e-06,
+ "loss": 0.1826,
+ "step": 21191
+ },
+ {
+ "epoch": 57.74386920980926,
+ "grad_norm": 3.9520397186279297,
+ "learning_rate": 7.991518412726113e-06,
+ "loss": 0.0978,
+ "step": 21192
+ },
+ {
+ "epoch": 57.746594005449595,
+ "grad_norm": 3.801438808441162,
+ "learning_rate": 7.990653909048494e-06,
+ "loss": 0.0702,
+ "step": 21193
+ },
+ {
+ "epoch": 57.74931880108992,
+ "grad_norm": 5.18593168258667,
+ "learning_rate": 7.989789421019596e-06,
+ "loss": 0.1799,
+ "step": 21194
+ },
+ {
+ "epoch": 57.752043596730246,
+ "grad_norm": 13.383259773254395,
+ "learning_rate": 7.988924948646153e-06,
+ "loss": 0.1071,
+ "step": 21195
+ },
+ {
+ "epoch": 57.75476839237057,
+ "grad_norm": 3.170557737350464,
+ "learning_rate": 7.988060491934899e-06,
+ "loss": 0.1505,
+ "step": 21196
+ },
+ {
+ "epoch": 57.7574931880109,
+ "grad_norm": 4.092858791351318,
+ "learning_rate": 7.987196050892565e-06,
+ "loss": 0.0949,
+ "step": 21197
+ },
+ {
+ "epoch": 57.76021798365122,
+ "grad_norm": 3.719846487045288,
+ "learning_rate": 7.986331625525883e-06,
+ "loss": 0.0713,
+ "step": 21198
+ },
+ {
+ "epoch": 57.762942779291556,
+ "grad_norm": 3.993051528930664,
+ "learning_rate": 7.985467215841584e-06,
+ "loss": 0.1295,
+ "step": 21199
+ },
+ {
+ "epoch": 57.76566757493188,
+ "grad_norm": 3.3964996337890625,
+ "learning_rate": 7.984602821846404e-06,
+ "loss": 0.1053,
+ "step": 21200
+ },
+ {
+ "epoch": 57.76839237057221,
+ "grad_norm": 3.152707576751709,
+ "learning_rate": 7.983738443547068e-06,
+ "loss": 0.0612,
+ "step": 21201
+ },
+ {
+ "epoch": 57.771117166212534,
+ "grad_norm": 4.443272590637207,
+ "learning_rate": 7.982874080950319e-06,
+ "loss": 0.0838,
+ "step": 21202
+ },
+ {
+ "epoch": 57.77384196185286,
+ "grad_norm": 4.386751174926758,
+ "learning_rate": 7.982009734062876e-06,
+ "loss": 0.2328,
+ "step": 21203
+ },
+ {
+ "epoch": 57.776566757493185,
+ "grad_norm": 3.799968719482422,
+ "learning_rate": 7.98114540289148e-06,
+ "loss": 0.0868,
+ "step": 21204
+ },
+ {
+ "epoch": 57.77929155313352,
+ "grad_norm": 3.518902540206909,
+ "learning_rate": 7.980281087442855e-06,
+ "loss": 0.1107,
+ "step": 21205
+ },
+ {
+ "epoch": 57.782016348773844,
+ "grad_norm": 3.5291759967803955,
+ "learning_rate": 7.97941678772374e-06,
+ "loss": 0.0716,
+ "step": 21206
+ },
+ {
+ "epoch": 57.78474114441417,
+ "grad_norm": 3.9906630516052246,
+ "learning_rate": 7.978552503740855e-06,
+ "loss": 0.168,
+ "step": 21207
+ },
+ {
+ "epoch": 57.787465940054496,
+ "grad_norm": 3.3229517936706543,
+ "learning_rate": 7.977688235500942e-06,
+ "loss": 0.1101,
+ "step": 21208
+ },
+ {
+ "epoch": 57.79019073569482,
+ "grad_norm": 4.04408597946167,
+ "learning_rate": 7.97682398301073e-06,
+ "loss": 0.1445,
+ "step": 21209
+ },
+ {
+ "epoch": 57.79291553133515,
+ "grad_norm": 4.9350690841674805,
+ "learning_rate": 7.975959746276946e-06,
+ "loss": 0.2702,
+ "step": 21210
+ },
+ {
+ "epoch": 57.79564032697548,
+ "grad_norm": 4.619058609008789,
+ "learning_rate": 7.975095525306324e-06,
+ "loss": 0.0929,
+ "step": 21211
+ },
+ {
+ "epoch": 57.798365122615806,
+ "grad_norm": 4.2038679122924805,
+ "learning_rate": 7.97423132010559e-06,
+ "loss": 0.0711,
+ "step": 21212
+ },
+ {
+ "epoch": 57.80108991825613,
+ "grad_norm": 3.2375524044036865,
+ "learning_rate": 7.97336713068148e-06,
+ "loss": 0.0973,
+ "step": 21213
+ },
+ {
+ "epoch": 57.80381471389646,
+ "grad_norm": 3.6754302978515625,
+ "learning_rate": 7.97250295704072e-06,
+ "loss": 0.3182,
+ "step": 21214
+ },
+ {
+ "epoch": 57.80653950953678,
+ "grad_norm": 3.4124221801757812,
+ "learning_rate": 7.971638799190044e-06,
+ "loss": 0.1551,
+ "step": 21215
+ },
+ {
+ "epoch": 57.80926430517711,
+ "grad_norm": 3.6353249549865723,
+ "learning_rate": 7.970774657136177e-06,
+ "loss": 0.203,
+ "step": 21216
+ },
+ {
+ "epoch": 57.81198910081744,
+ "grad_norm": 5.511824607849121,
+ "learning_rate": 7.969910530885854e-06,
+ "loss": 0.1322,
+ "step": 21217
+ },
+ {
+ "epoch": 57.81471389645777,
+ "grad_norm": 6.8044633865356445,
+ "learning_rate": 7.9690464204458e-06,
+ "loss": 0.1543,
+ "step": 21218
+ },
+ {
+ "epoch": 57.817438692098094,
+ "grad_norm": 4.027974605560303,
+ "learning_rate": 7.968182325822748e-06,
+ "loss": 0.1423,
+ "step": 21219
+ },
+ {
+ "epoch": 57.82016348773842,
+ "grad_norm": 3.3240561485290527,
+ "learning_rate": 7.967318247023427e-06,
+ "loss": 0.0687,
+ "step": 21220
+ },
+ {
+ "epoch": 57.822888283378745,
+ "grad_norm": 3.256725311279297,
+ "learning_rate": 7.966454184054566e-06,
+ "loss": 0.049,
+ "step": 21221
+ },
+ {
+ "epoch": 57.82561307901907,
+ "grad_norm": 6.475952625274658,
+ "learning_rate": 7.965590136922894e-06,
+ "loss": 0.0575,
+ "step": 21222
+ },
+ {
+ "epoch": 57.828337874659404,
+ "grad_norm": 6.960272312164307,
+ "learning_rate": 7.96472610563514e-06,
+ "loss": 0.0667,
+ "step": 21223
+ },
+ {
+ "epoch": 57.83106267029973,
+ "grad_norm": 4.397171974182129,
+ "learning_rate": 7.96386209019803e-06,
+ "loss": 0.1421,
+ "step": 21224
+ },
+ {
+ "epoch": 57.833787465940055,
+ "grad_norm": 4.35145378112793,
+ "learning_rate": 7.962998090618303e-06,
+ "loss": 0.1062,
+ "step": 21225
+ },
+ {
+ "epoch": 57.83651226158038,
+ "grad_norm": 6.342430114746094,
+ "learning_rate": 7.962134106902679e-06,
+ "loss": 0.1545,
+ "step": 21226
+ },
+ {
+ "epoch": 57.83923705722071,
+ "grad_norm": 4.252971172332764,
+ "learning_rate": 7.961270139057891e-06,
+ "loss": 0.0715,
+ "step": 21227
+ },
+ {
+ "epoch": 57.84196185286103,
+ "grad_norm": 3.5006935596466064,
+ "learning_rate": 7.960406187090661e-06,
+ "loss": 0.1496,
+ "step": 21228
+ },
+ {
+ "epoch": 57.844686648501366,
+ "grad_norm": 3.8766372203826904,
+ "learning_rate": 7.959542251007726e-06,
+ "loss": 0.0847,
+ "step": 21229
+ },
+ {
+ "epoch": 57.84741144414169,
+ "grad_norm": 5.189877986907959,
+ "learning_rate": 7.95867833081581e-06,
+ "loss": 0.156,
+ "step": 21230
+ },
+ {
+ "epoch": 57.85013623978202,
+ "grad_norm": 4.126110076904297,
+ "learning_rate": 7.95781442652164e-06,
+ "loss": 0.0603,
+ "step": 21231
+ },
+ {
+ "epoch": 57.85286103542234,
+ "grad_norm": 2.957515001296997,
+ "learning_rate": 7.956950538131946e-06,
+ "loss": 0.0549,
+ "step": 21232
+ },
+ {
+ "epoch": 57.85558583106267,
+ "grad_norm": 5.171656608581543,
+ "learning_rate": 7.956086665653456e-06,
+ "loss": 0.1057,
+ "step": 21233
+ },
+ {
+ "epoch": 57.858310626702995,
+ "grad_norm": 5.595894813537598,
+ "learning_rate": 7.955222809092895e-06,
+ "loss": 0.1428,
+ "step": 21234
+ },
+ {
+ "epoch": 57.86103542234333,
+ "grad_norm": 5.651068210601807,
+ "learning_rate": 7.954358968456997e-06,
+ "loss": 0.1894,
+ "step": 21235
+ },
+ {
+ "epoch": 57.86376021798365,
+ "grad_norm": 5.017315864562988,
+ "learning_rate": 7.953495143752481e-06,
+ "loss": 0.1441,
+ "step": 21236
+ },
+ {
+ "epoch": 57.86648501362398,
+ "grad_norm": 3.8824210166931152,
+ "learning_rate": 7.952631334986083e-06,
+ "loss": 0.0687,
+ "step": 21237
+ },
+ {
+ "epoch": 57.869209809264305,
+ "grad_norm": 4.548652648925781,
+ "learning_rate": 7.951767542164524e-06,
+ "loss": 0.1594,
+ "step": 21238
+ },
+ {
+ "epoch": 57.87193460490463,
+ "grad_norm": 3.957911491394043,
+ "learning_rate": 7.950903765294534e-06,
+ "loss": 0.1356,
+ "step": 21239
+ },
+ {
+ "epoch": 57.87465940054496,
+ "grad_norm": 4.3087263107299805,
+ "learning_rate": 7.950040004382838e-06,
+ "loss": 0.0463,
+ "step": 21240
+ },
+ {
+ "epoch": 57.87738419618529,
+ "grad_norm": 3.348483085632324,
+ "learning_rate": 7.949176259436164e-06,
+ "loss": 0.1183,
+ "step": 21241
+ },
+ {
+ "epoch": 57.880108991825615,
+ "grad_norm": 3.969270706176758,
+ "learning_rate": 7.94831253046124e-06,
+ "loss": 0.1048,
+ "step": 21242
+ },
+ {
+ "epoch": 57.88283378746594,
+ "grad_norm": 4.792532444000244,
+ "learning_rate": 7.947448817464793e-06,
+ "loss": 0.2866,
+ "step": 21243
+ },
+ {
+ "epoch": 57.88555858310627,
+ "grad_norm": 3.986077070236206,
+ "learning_rate": 7.946585120453549e-06,
+ "loss": 0.0796,
+ "step": 21244
+ },
+ {
+ "epoch": 57.88828337874659,
+ "grad_norm": 10.107830047607422,
+ "learning_rate": 7.945721439434234e-06,
+ "loss": 0.0846,
+ "step": 21245
+ },
+ {
+ "epoch": 57.89100817438692,
+ "grad_norm": 4.53139591217041,
+ "learning_rate": 7.944857774413573e-06,
+ "loss": 0.1073,
+ "step": 21246
+ },
+ {
+ "epoch": 57.89373297002725,
+ "grad_norm": 4.03631067276001,
+ "learning_rate": 7.943994125398295e-06,
+ "loss": 0.0719,
+ "step": 21247
+ },
+ {
+ "epoch": 57.89645776566758,
+ "grad_norm": 3.6810109615325928,
+ "learning_rate": 7.943130492395123e-06,
+ "loss": 0.1046,
+ "step": 21248
+ },
+ {
+ "epoch": 57.8991825613079,
+ "grad_norm": 5.402345180511475,
+ "learning_rate": 7.942266875410788e-06,
+ "loss": 0.1807,
+ "step": 21249
+ },
+ {
+ "epoch": 57.90190735694823,
+ "grad_norm": 5.32850456237793,
+ "learning_rate": 7.941403274452009e-06,
+ "loss": 0.0887,
+ "step": 21250
+ },
+ {
+ "epoch": 57.904632152588555,
+ "grad_norm": 5.606999397277832,
+ "learning_rate": 7.940539689525517e-06,
+ "loss": 0.0795,
+ "step": 21251
+ },
+ {
+ "epoch": 57.90735694822888,
+ "grad_norm": 3.406586170196533,
+ "learning_rate": 7.939676120638033e-06,
+ "loss": 0.0599,
+ "step": 21252
+ },
+ {
+ "epoch": 57.91008174386921,
+ "grad_norm": 3.391803741455078,
+ "learning_rate": 7.938812567796289e-06,
+ "loss": 0.17,
+ "step": 21253
+ },
+ {
+ "epoch": 57.91280653950954,
+ "grad_norm": 4.0680928230285645,
+ "learning_rate": 7.937949031007001e-06,
+ "loss": 0.1939,
+ "step": 21254
+ },
+ {
+ "epoch": 57.915531335149865,
+ "grad_norm": 3.9837732315063477,
+ "learning_rate": 7.937085510276904e-06,
+ "loss": 0.132,
+ "step": 21255
+ },
+ {
+ "epoch": 57.91825613079019,
+ "grad_norm": 3.055096387863159,
+ "learning_rate": 7.936222005612717e-06,
+ "loss": 0.0558,
+ "step": 21256
+ },
+ {
+ "epoch": 57.920980926430516,
+ "grad_norm": 4.074774265289307,
+ "learning_rate": 7.935358517021168e-06,
+ "loss": 0.1265,
+ "step": 21257
+ },
+ {
+ "epoch": 57.92370572207084,
+ "grad_norm": 3.5439140796661377,
+ "learning_rate": 7.934495044508976e-06,
+ "loss": 0.1168,
+ "step": 21258
+ },
+ {
+ "epoch": 57.926430517711175,
+ "grad_norm": 4.016378879547119,
+ "learning_rate": 7.933631588082872e-06,
+ "loss": 0.115,
+ "step": 21259
+ },
+ {
+ "epoch": 57.9291553133515,
+ "grad_norm": 3.780677318572998,
+ "learning_rate": 7.932768147749582e-06,
+ "loss": 0.0652,
+ "step": 21260
+ },
+ {
+ "epoch": 57.93188010899183,
+ "grad_norm": 4.864652156829834,
+ "learning_rate": 7.931904723515825e-06,
+ "loss": 0.2459,
+ "step": 21261
+ },
+ {
+ "epoch": 57.93460490463215,
+ "grad_norm": 6.173576831817627,
+ "learning_rate": 7.931041315388328e-06,
+ "loss": 0.1484,
+ "step": 21262
+ },
+ {
+ "epoch": 57.93732970027248,
+ "grad_norm": 3.8185551166534424,
+ "learning_rate": 7.930177923373814e-06,
+ "loss": 0.0882,
+ "step": 21263
+ },
+ {
+ "epoch": 57.940054495912804,
+ "grad_norm": 4.387790203094482,
+ "learning_rate": 7.929314547479007e-06,
+ "loss": 0.1572,
+ "step": 21264
+ },
+ {
+ "epoch": 57.94277929155314,
+ "grad_norm": 3.009045124053955,
+ "learning_rate": 7.928451187710632e-06,
+ "loss": 0.0655,
+ "step": 21265
+ },
+ {
+ "epoch": 57.94550408719346,
+ "grad_norm": 3.612657070159912,
+ "learning_rate": 7.927587844075413e-06,
+ "loss": 0.1895,
+ "step": 21266
+ },
+ {
+ "epoch": 57.94822888283379,
+ "grad_norm": 4.834962844848633,
+ "learning_rate": 7.926724516580076e-06,
+ "loss": 0.1516,
+ "step": 21267
+ },
+ {
+ "epoch": 57.950953678474114,
+ "grad_norm": 4.229416847229004,
+ "learning_rate": 7.925861205231336e-06,
+ "loss": 0.124,
+ "step": 21268
+ },
+ {
+ "epoch": 57.95367847411444,
+ "grad_norm": 4.106301307678223,
+ "learning_rate": 7.924997910035928e-06,
+ "loss": 0.0933,
+ "step": 21269
+ },
+ {
+ "epoch": 57.956403269754766,
+ "grad_norm": 4.202123165130615,
+ "learning_rate": 7.924134631000566e-06,
+ "loss": 0.1113,
+ "step": 21270
+ },
+ {
+ "epoch": 57.95912806539509,
+ "grad_norm": 4.454462051391602,
+ "learning_rate": 7.923271368131977e-06,
+ "loss": 0.1347,
+ "step": 21271
+ },
+ {
+ "epoch": 57.961852861035425,
+ "grad_norm": 4.040456295013428,
+ "learning_rate": 7.922408121436883e-06,
+ "loss": 0.0798,
+ "step": 21272
+ },
+ {
+ "epoch": 57.96457765667575,
+ "grad_norm": 3.8941664695739746,
+ "learning_rate": 7.921544890922011e-06,
+ "loss": 0.0735,
+ "step": 21273
+ },
+ {
+ "epoch": 57.967302452316076,
+ "grad_norm": 4.834648609161377,
+ "learning_rate": 7.920681676594077e-06,
+ "loss": 0.1558,
+ "step": 21274
+ },
+ {
+ "epoch": 57.9700272479564,
+ "grad_norm": 4.663985252380371,
+ "learning_rate": 7.919818478459805e-06,
+ "loss": 0.216,
+ "step": 21275
+ },
+ {
+ "epoch": 57.97275204359673,
+ "grad_norm": 5.6572465896606445,
+ "learning_rate": 7.918955296525925e-06,
+ "loss": 0.072,
+ "step": 21276
+ },
+ {
+ "epoch": 57.97547683923706,
+ "grad_norm": 2.902808427810669,
+ "learning_rate": 7.91809213079915e-06,
+ "loss": 0.0762,
+ "step": 21277
+ },
+ {
+ "epoch": 57.97820163487739,
+ "grad_norm": 3.3866100311279297,
+ "learning_rate": 7.917228981286212e-06,
+ "loss": 0.0842,
+ "step": 21278
+ },
+ {
+ "epoch": 57.98092643051771,
+ "grad_norm": 4.018303871154785,
+ "learning_rate": 7.916365847993823e-06,
+ "loss": 0.1088,
+ "step": 21279
+ },
+ {
+ "epoch": 57.98365122615804,
+ "grad_norm": 4.212928295135498,
+ "learning_rate": 7.915502730928713e-06,
+ "loss": 0.1219,
+ "step": 21280
+ },
+ {
+ "epoch": 57.986376021798364,
+ "grad_norm": 3.5765438079833984,
+ "learning_rate": 7.914639630097598e-06,
+ "loss": 0.0922,
+ "step": 21281
+ },
+ {
+ "epoch": 57.98910081743869,
+ "grad_norm": 5.174197196960449,
+ "learning_rate": 7.913776545507204e-06,
+ "loss": 0.2322,
+ "step": 21282
+ },
+ {
+ "epoch": 57.991825613079016,
+ "grad_norm": 12.848947525024414,
+ "learning_rate": 7.91291347716425e-06,
+ "loss": 0.1827,
+ "step": 21283
+ },
+ {
+ "epoch": 57.99455040871935,
+ "grad_norm": 3.7650251388549805,
+ "learning_rate": 7.91205042507546e-06,
+ "loss": 0.0621,
+ "step": 21284
+ },
+ {
+ "epoch": 57.997275204359674,
+ "grad_norm": 3.8231921195983887,
+ "learning_rate": 7.911187389247553e-06,
+ "loss": 0.0696,
+ "step": 21285
+ },
+ {
+ "epoch": 58.0,
+ "grad_norm": 3.755431652069092,
+ "learning_rate": 7.91032436968725e-06,
+ "loss": 0.167,
+ "step": 21286
+ },
+ {
+ "epoch": 58.002724795640326,
+ "grad_norm": 4.290729999542236,
+ "learning_rate": 7.909461366401277e-06,
+ "loss": 0.0838,
+ "step": 21287
+ },
+ {
+ "epoch": 58.00544959128065,
+ "grad_norm": 3.493969202041626,
+ "learning_rate": 7.908598379396349e-06,
+ "loss": 0.0639,
+ "step": 21288
+ },
+ {
+ "epoch": 58.00817438692098,
+ "grad_norm": 4.644974231719971,
+ "learning_rate": 7.90773540867919e-06,
+ "loss": 0.0932,
+ "step": 21289
+ },
+ {
+ "epoch": 58.01089918256131,
+ "grad_norm": 3.7207095623016357,
+ "learning_rate": 7.90687245425652e-06,
+ "loss": 0.0752,
+ "step": 21290
+ },
+ {
+ "epoch": 58.013623978201636,
+ "grad_norm": 5.176153659820557,
+ "learning_rate": 7.90600951613506e-06,
+ "loss": 0.1327,
+ "step": 21291
+ },
+ {
+ "epoch": 58.01634877384196,
+ "grad_norm": 4.342294216156006,
+ "learning_rate": 7.905146594321532e-06,
+ "loss": 0.0694,
+ "step": 21292
+ },
+ {
+ "epoch": 58.01907356948229,
+ "grad_norm": 7.584478855133057,
+ "learning_rate": 7.904283688822651e-06,
+ "loss": 0.0665,
+ "step": 21293
+ },
+ {
+ "epoch": 58.02179836512261,
+ "grad_norm": 4.0451459884643555,
+ "learning_rate": 7.903420799645145e-06,
+ "loss": 0.0988,
+ "step": 21294
+ },
+ {
+ "epoch": 58.02452316076294,
+ "grad_norm": 4.211483955383301,
+ "learning_rate": 7.90255792679573e-06,
+ "loss": 0.1224,
+ "step": 21295
+ },
+ {
+ "epoch": 58.02724795640327,
+ "grad_norm": 5.9595947265625,
+ "learning_rate": 7.901695070281126e-06,
+ "loss": 0.1019,
+ "step": 21296
+ },
+ {
+ "epoch": 58.0299727520436,
+ "grad_norm": 5.6954569816589355,
+ "learning_rate": 7.90083223010805e-06,
+ "loss": 0.0998,
+ "step": 21297
+ },
+ {
+ "epoch": 58.032697547683924,
+ "grad_norm": 3.059959888458252,
+ "learning_rate": 7.899969406283232e-06,
+ "loss": 0.2582,
+ "step": 21298
+ },
+ {
+ "epoch": 58.03542234332425,
+ "grad_norm": 3.3717527389526367,
+ "learning_rate": 7.89910659881338e-06,
+ "loss": 0.197,
+ "step": 21299
+ },
+ {
+ "epoch": 58.038147138964575,
+ "grad_norm": 5.451910495758057,
+ "learning_rate": 7.898243807705219e-06,
+ "loss": 0.1239,
+ "step": 21300
+ },
+ {
+ "epoch": 58.0408719346049,
+ "grad_norm": 3.5340797901153564,
+ "learning_rate": 7.897381032965467e-06,
+ "loss": 0.0729,
+ "step": 21301
+ },
+ {
+ "epoch": 58.043596730245234,
+ "grad_norm": 4.630802631378174,
+ "learning_rate": 7.896518274600845e-06,
+ "loss": 0.1574,
+ "step": 21302
+ },
+ {
+ "epoch": 58.04632152588556,
+ "grad_norm": 4.857437610626221,
+ "learning_rate": 7.89565553261807e-06,
+ "loss": 0.1973,
+ "step": 21303
+ },
+ {
+ "epoch": 58.049046321525886,
+ "grad_norm": 4.43881893157959,
+ "learning_rate": 7.894792807023864e-06,
+ "loss": 0.0897,
+ "step": 21304
+ },
+ {
+ "epoch": 58.05177111716621,
+ "grad_norm": 3.798677682876587,
+ "learning_rate": 7.89393009782494e-06,
+ "loss": 0.0626,
+ "step": 21305
+ },
+ {
+ "epoch": 58.05449591280654,
+ "grad_norm": 3.7635207176208496,
+ "learning_rate": 7.893067405028025e-06,
+ "loss": 0.1203,
+ "step": 21306
+ },
+ {
+ "epoch": 58.05722070844686,
+ "grad_norm": 3.1937971115112305,
+ "learning_rate": 7.89220472863983e-06,
+ "loss": 0.0529,
+ "step": 21307
+ },
+ {
+ "epoch": 58.059945504087196,
+ "grad_norm": 3.741414785385132,
+ "learning_rate": 7.891342068667079e-06,
+ "loss": 0.083,
+ "step": 21308
+ },
+ {
+ "epoch": 58.06267029972752,
+ "grad_norm": 3.0845866203308105,
+ "learning_rate": 7.890479425116484e-06,
+ "loss": 0.1788,
+ "step": 21309
+ },
+ {
+ "epoch": 58.06539509536785,
+ "grad_norm": 3.9257125854492188,
+ "learning_rate": 7.889616797994768e-06,
+ "loss": 0.0752,
+ "step": 21310
+ },
+ {
+ "epoch": 58.06811989100817,
+ "grad_norm": 5.93182373046875,
+ "learning_rate": 7.88875418730865e-06,
+ "loss": 0.2888,
+ "step": 21311
+ },
+ {
+ "epoch": 58.0708446866485,
+ "grad_norm": 2.8869850635528564,
+ "learning_rate": 7.887891593064848e-06,
+ "loss": 0.0445,
+ "step": 21312
+ },
+ {
+ "epoch": 58.073569482288825,
+ "grad_norm": 3.5473380088806152,
+ "learning_rate": 7.887029015270076e-06,
+ "loss": 0.0753,
+ "step": 21313
+ },
+ {
+ "epoch": 58.07629427792916,
+ "grad_norm": 5.232302665710449,
+ "learning_rate": 7.886166453931056e-06,
+ "loss": 0.1679,
+ "step": 21314
+ },
+ {
+ "epoch": 58.079019073569484,
+ "grad_norm": 3.481288433074951,
+ "learning_rate": 7.885303909054504e-06,
+ "loss": 0.0694,
+ "step": 21315
+ },
+ {
+ "epoch": 58.08174386920981,
+ "grad_norm": 4.258885860443115,
+ "learning_rate": 7.884441380647136e-06,
+ "loss": 0.0734,
+ "step": 21316
+ },
+ {
+ "epoch": 58.084468664850135,
+ "grad_norm": 3.5817365646362305,
+ "learning_rate": 7.88357886871567e-06,
+ "loss": 0.158,
+ "step": 21317
+ },
+ {
+ "epoch": 58.08719346049046,
+ "grad_norm": 4.158348560333252,
+ "learning_rate": 7.882716373266825e-06,
+ "loss": 0.1088,
+ "step": 21318
+ },
+ {
+ "epoch": 58.08991825613079,
+ "grad_norm": 4.0440802574157715,
+ "learning_rate": 7.881853894307316e-06,
+ "loss": 0.2369,
+ "step": 21319
+ },
+ {
+ "epoch": 58.09264305177112,
+ "grad_norm": 4.712680339813232,
+ "learning_rate": 7.880991431843861e-06,
+ "loss": 0.0653,
+ "step": 21320
+ },
+ {
+ "epoch": 58.095367847411445,
+ "grad_norm": 3.7499608993530273,
+ "learning_rate": 7.880128985883175e-06,
+ "loss": 0.0768,
+ "step": 21321
+ },
+ {
+ "epoch": 58.09809264305177,
+ "grad_norm": 4.3392157554626465,
+ "learning_rate": 7.879266556431979e-06,
+ "loss": 0.0587,
+ "step": 21322
+ },
+ {
+ "epoch": 58.1008174386921,
+ "grad_norm": 5.922008514404297,
+ "learning_rate": 7.878404143496985e-06,
+ "loss": 0.1057,
+ "step": 21323
+ },
+ {
+ "epoch": 58.10354223433242,
+ "grad_norm": 3.9000155925750732,
+ "learning_rate": 7.877541747084912e-06,
+ "loss": 0.0811,
+ "step": 21324
+ },
+ {
+ "epoch": 58.10626702997275,
+ "grad_norm": 3.4240224361419678,
+ "learning_rate": 7.876679367202474e-06,
+ "loss": 0.1955,
+ "step": 21325
+ },
+ {
+ "epoch": 58.10899182561308,
+ "grad_norm": 3.6861934661865234,
+ "learning_rate": 7.875817003856392e-06,
+ "loss": 0.0501,
+ "step": 21326
+ },
+ {
+ "epoch": 58.11171662125341,
+ "grad_norm": 4.137561798095703,
+ "learning_rate": 7.874954657053373e-06,
+ "loss": 0.2101,
+ "step": 21327
+ },
+ {
+ "epoch": 58.11444141689373,
+ "grad_norm": 3.0040736198425293,
+ "learning_rate": 7.874092326800142e-06,
+ "loss": 0.1097,
+ "step": 21328
+ },
+ {
+ "epoch": 58.11716621253406,
+ "grad_norm": 4.561694622039795,
+ "learning_rate": 7.87323001310341e-06,
+ "loss": 0.2594,
+ "step": 21329
+ },
+ {
+ "epoch": 58.119891008174385,
+ "grad_norm": 3.0798263549804688,
+ "learning_rate": 7.872367715969897e-06,
+ "loss": 0.0712,
+ "step": 21330
+ },
+ {
+ "epoch": 58.12261580381471,
+ "grad_norm": 3.4744293689727783,
+ "learning_rate": 7.871505435406315e-06,
+ "loss": 0.1981,
+ "step": 21331
+ },
+ {
+ "epoch": 58.12534059945504,
+ "grad_norm": 3.486356735229492,
+ "learning_rate": 7.870643171419382e-06,
+ "loss": 0.054,
+ "step": 21332
+ },
+ {
+ "epoch": 58.12806539509537,
+ "grad_norm": 3.9207701683044434,
+ "learning_rate": 7.869780924015807e-06,
+ "loss": 0.0655,
+ "step": 21333
+ },
+ {
+ "epoch": 58.130790190735695,
+ "grad_norm": 3.4613382816314697,
+ "learning_rate": 7.868918693202314e-06,
+ "loss": 0.1243,
+ "step": 21334
+ },
+ {
+ "epoch": 58.13351498637602,
+ "grad_norm": 3.66589617729187,
+ "learning_rate": 7.86805647898561e-06,
+ "loss": 0.1703,
+ "step": 21335
+ },
+ {
+ "epoch": 58.13623978201635,
+ "grad_norm": 3.6065454483032227,
+ "learning_rate": 7.867194281372417e-06,
+ "loss": 0.1415,
+ "step": 21336
+ },
+ {
+ "epoch": 58.13896457765667,
+ "grad_norm": 4.07046365737915,
+ "learning_rate": 7.866332100369444e-06,
+ "loss": 0.1409,
+ "step": 21337
+ },
+ {
+ "epoch": 58.141689373297005,
+ "grad_norm": 3.97886061668396,
+ "learning_rate": 7.865469935983409e-06,
+ "loss": 0.1356,
+ "step": 21338
+ },
+ {
+ "epoch": 58.14441416893733,
+ "grad_norm": 4.356708526611328,
+ "learning_rate": 7.864607788221024e-06,
+ "loss": 0.1442,
+ "step": 21339
+ },
+ {
+ "epoch": 58.14713896457766,
+ "grad_norm": 4.287309646606445,
+ "learning_rate": 7.863745657089008e-06,
+ "loss": 0.1436,
+ "step": 21340
+ },
+ {
+ "epoch": 58.14986376021798,
+ "grad_norm": 2.969545364379883,
+ "learning_rate": 7.862883542594067e-06,
+ "loss": 0.0489,
+ "step": 21341
+ },
+ {
+ "epoch": 58.15258855585831,
+ "grad_norm": 3.9011642932891846,
+ "learning_rate": 7.862021444742924e-06,
+ "loss": 0.103,
+ "step": 21342
+ },
+ {
+ "epoch": 58.155313351498634,
+ "grad_norm": 3.09757924079895,
+ "learning_rate": 7.861159363542289e-06,
+ "loss": 0.1337,
+ "step": 21343
+ },
+ {
+ "epoch": 58.15803814713897,
+ "grad_norm": 3.0279064178466797,
+ "learning_rate": 7.860297298998871e-06,
+ "loss": 0.0505,
+ "step": 21344
+ },
+ {
+ "epoch": 58.16076294277929,
+ "grad_norm": 3.4479753971099854,
+ "learning_rate": 7.859435251119394e-06,
+ "loss": 0.154,
+ "step": 21345
+ },
+ {
+ "epoch": 58.16348773841962,
+ "grad_norm": 3.727128744125366,
+ "learning_rate": 7.858573219910565e-06,
+ "loss": 0.1915,
+ "step": 21346
+ },
+ {
+ "epoch": 58.166212534059945,
+ "grad_norm": 5.588064670562744,
+ "learning_rate": 7.857711205379099e-06,
+ "loss": 0.1808,
+ "step": 21347
+ },
+ {
+ "epoch": 58.16893732970027,
+ "grad_norm": 5.7774128913879395,
+ "learning_rate": 7.85684920753171e-06,
+ "loss": 0.1534,
+ "step": 21348
+ },
+ {
+ "epoch": 58.171662125340596,
+ "grad_norm": 3.6232221126556396,
+ "learning_rate": 7.85598722637511e-06,
+ "loss": 0.1654,
+ "step": 21349
+ },
+ {
+ "epoch": 58.17438692098093,
+ "grad_norm": 4.164429187774658,
+ "learning_rate": 7.855125261916012e-06,
+ "loss": 0.098,
+ "step": 21350
+ },
+ {
+ "epoch": 58.177111716621255,
+ "grad_norm": 3.551900625228882,
+ "learning_rate": 7.854263314161128e-06,
+ "loss": 0.0566,
+ "step": 21351
+ },
+ {
+ "epoch": 58.17983651226158,
+ "grad_norm": 4.061517238616943,
+ "learning_rate": 7.853401383117176e-06,
+ "loss": 0.1674,
+ "step": 21352
+ },
+ {
+ "epoch": 58.182561307901906,
+ "grad_norm": 4.399727821350098,
+ "learning_rate": 7.85253946879086e-06,
+ "loss": 0.1202,
+ "step": 21353
+ },
+ {
+ "epoch": 58.18528610354223,
+ "grad_norm": 3.430011749267578,
+ "learning_rate": 7.851677571188903e-06,
+ "loss": 0.2057,
+ "step": 21354
+ },
+ {
+ "epoch": 58.18801089918256,
+ "grad_norm": 3.1353375911712646,
+ "learning_rate": 7.850815690318007e-06,
+ "loss": 0.0631,
+ "step": 21355
+ },
+ {
+ "epoch": 58.19073569482289,
+ "grad_norm": 4.898374080657959,
+ "learning_rate": 7.849953826184892e-06,
+ "loss": 0.2719,
+ "step": 21356
+ },
+ {
+ "epoch": 58.19346049046322,
+ "grad_norm": 4.685498237609863,
+ "learning_rate": 7.849091978796267e-06,
+ "loss": 0.0952,
+ "step": 21357
+ },
+ {
+ "epoch": 58.19618528610354,
+ "grad_norm": 6.148848056793213,
+ "learning_rate": 7.848230148158847e-06,
+ "loss": 0.1801,
+ "step": 21358
+ },
+ {
+ "epoch": 58.19891008174387,
+ "grad_norm": 4.193655967712402,
+ "learning_rate": 7.847368334279336e-06,
+ "loss": 0.1095,
+ "step": 21359
+ },
+ {
+ "epoch": 58.201634877384194,
+ "grad_norm": 3.1795859336853027,
+ "learning_rate": 7.846506537164456e-06,
+ "loss": 0.0984,
+ "step": 21360
+ },
+ {
+ "epoch": 58.20435967302452,
+ "grad_norm": 4.306779861450195,
+ "learning_rate": 7.845644756820908e-06,
+ "loss": 0.1707,
+ "step": 21361
+ },
+ {
+ "epoch": 58.20708446866485,
+ "grad_norm": 3.9911789894104004,
+ "learning_rate": 7.844782993255412e-06,
+ "loss": 0.0743,
+ "step": 21362
+ },
+ {
+ "epoch": 58.20980926430518,
+ "grad_norm": 4.329372406005859,
+ "learning_rate": 7.843921246474679e-06,
+ "loss": 0.1007,
+ "step": 21363
+ },
+ {
+ "epoch": 58.212534059945504,
+ "grad_norm": 2.8500869274139404,
+ "learning_rate": 7.843059516485415e-06,
+ "loss": 0.0463,
+ "step": 21364
+ },
+ {
+ "epoch": 58.21525885558583,
+ "grad_norm": 4.476006984710693,
+ "learning_rate": 7.842197803294337e-06,
+ "loss": 0.1228,
+ "step": 21365
+ },
+ {
+ "epoch": 58.217983651226156,
+ "grad_norm": 3.1800928115844727,
+ "learning_rate": 7.84133610690815e-06,
+ "loss": 0.0705,
+ "step": 21366
+ },
+ {
+ "epoch": 58.22070844686648,
+ "grad_norm": 3.367802619934082,
+ "learning_rate": 7.840474427333573e-06,
+ "loss": 0.0722,
+ "step": 21367
+ },
+ {
+ "epoch": 58.223433242506815,
+ "grad_norm": 3.4590463638305664,
+ "learning_rate": 7.839612764577305e-06,
+ "loss": 0.0742,
+ "step": 21368
+ },
+ {
+ "epoch": 58.22615803814714,
+ "grad_norm": 3.1542577743530273,
+ "learning_rate": 7.838751118646068e-06,
+ "loss": 0.0678,
+ "step": 21369
+ },
+ {
+ "epoch": 58.228882833787466,
+ "grad_norm": 3.5310192108154297,
+ "learning_rate": 7.837889489546566e-06,
+ "loss": 0.0516,
+ "step": 21370
+ },
+ {
+ "epoch": 58.23160762942779,
+ "grad_norm": 3.7076683044433594,
+ "learning_rate": 7.837027877285512e-06,
+ "loss": 0.1798,
+ "step": 21371
+ },
+ {
+ "epoch": 58.23433242506812,
+ "grad_norm": 3.785773992538452,
+ "learning_rate": 7.836166281869614e-06,
+ "loss": 0.1145,
+ "step": 21372
+ },
+ {
+ "epoch": 58.237057220708444,
+ "grad_norm": 3.829242706298828,
+ "learning_rate": 7.835304703305583e-06,
+ "loss": 0.2267,
+ "step": 21373
+ },
+ {
+ "epoch": 58.23978201634878,
+ "grad_norm": 3.6718368530273438,
+ "learning_rate": 7.834443141600131e-06,
+ "loss": 0.0481,
+ "step": 21374
+ },
+ {
+ "epoch": 58.2425068119891,
+ "grad_norm": 3.986198902130127,
+ "learning_rate": 7.833581596759965e-06,
+ "loss": 0.1318,
+ "step": 21375
+ },
+ {
+ "epoch": 58.24523160762943,
+ "grad_norm": 5.590548992156982,
+ "learning_rate": 7.832720068791798e-06,
+ "loss": 0.073,
+ "step": 21376
+ },
+ {
+ "epoch": 58.247956403269754,
+ "grad_norm": 4.912227630615234,
+ "learning_rate": 7.831858557702332e-06,
+ "loss": 0.0819,
+ "step": 21377
+ },
+ {
+ "epoch": 58.25068119891008,
+ "grad_norm": 4.700142860412598,
+ "learning_rate": 7.830997063498288e-06,
+ "loss": 0.0877,
+ "step": 21378
+ },
+ {
+ "epoch": 58.253405994550405,
+ "grad_norm": 3.449402093887329,
+ "learning_rate": 7.830135586186363e-06,
+ "loss": 0.0639,
+ "step": 21379
+ },
+ {
+ "epoch": 58.25613079019074,
+ "grad_norm": 4.228108882904053,
+ "learning_rate": 7.829274125773275e-06,
+ "loss": 0.1262,
+ "step": 21380
+ },
+ {
+ "epoch": 58.258855585831064,
+ "grad_norm": 3.4274513721466064,
+ "learning_rate": 7.82841268226573e-06,
+ "loss": 0.1647,
+ "step": 21381
+ },
+ {
+ "epoch": 58.26158038147139,
+ "grad_norm": 4.357746601104736,
+ "learning_rate": 7.827551255670438e-06,
+ "loss": 0.1457,
+ "step": 21382
+ },
+ {
+ "epoch": 58.264305177111716,
+ "grad_norm": 5.125286102294922,
+ "learning_rate": 7.82668984599411e-06,
+ "loss": 0.1067,
+ "step": 21383
+ },
+ {
+ "epoch": 58.26702997275204,
+ "grad_norm": 3.2794137001037598,
+ "learning_rate": 7.825828453243446e-06,
+ "loss": 0.0759,
+ "step": 21384
+ },
+ {
+ "epoch": 58.26975476839237,
+ "grad_norm": 6.392207145690918,
+ "learning_rate": 7.824967077425163e-06,
+ "loss": 0.074,
+ "step": 21385
+ },
+ {
+ "epoch": 58.2724795640327,
+ "grad_norm": 3.7522635459899902,
+ "learning_rate": 7.824105718545964e-06,
+ "loss": 0.0575,
+ "step": 21386
+ },
+ {
+ "epoch": 58.275204359673026,
+ "grad_norm": 3.603132486343384,
+ "learning_rate": 7.823244376612565e-06,
+ "loss": 0.0482,
+ "step": 21387
+ },
+ {
+ "epoch": 58.27792915531335,
+ "grad_norm": 4.035679340362549,
+ "learning_rate": 7.822383051631664e-06,
+ "loss": 0.058,
+ "step": 21388
+ },
+ {
+ "epoch": 58.28065395095368,
+ "grad_norm": 4.110881805419922,
+ "learning_rate": 7.821521743609974e-06,
+ "loss": 0.1739,
+ "step": 21389
+ },
+ {
+ "epoch": 58.283378746594,
+ "grad_norm": 4.31303596496582,
+ "learning_rate": 7.820660452554203e-06,
+ "loss": 0.1267,
+ "step": 21390
+ },
+ {
+ "epoch": 58.28610354223433,
+ "grad_norm": 4.4154534339904785,
+ "learning_rate": 7.81979917847106e-06,
+ "loss": 0.1102,
+ "step": 21391
+ },
+ {
+ "epoch": 58.28882833787466,
+ "grad_norm": 3.369174003601074,
+ "learning_rate": 7.81893792136725e-06,
+ "loss": 0.1161,
+ "step": 21392
+ },
+ {
+ "epoch": 58.29155313351499,
+ "grad_norm": 3.901320695877075,
+ "learning_rate": 7.81807668124948e-06,
+ "loss": 0.0618,
+ "step": 21393
+ },
+ {
+ "epoch": 58.294277929155314,
+ "grad_norm": 5.338075160980225,
+ "learning_rate": 7.817215458124459e-06,
+ "loss": 0.0779,
+ "step": 21394
+ },
+ {
+ "epoch": 58.29700272479564,
+ "grad_norm": 3.79465913772583,
+ "learning_rate": 7.816354251998896e-06,
+ "loss": 0.1361,
+ "step": 21395
+ },
+ {
+ "epoch": 58.299727520435965,
+ "grad_norm": 4.482502460479736,
+ "learning_rate": 7.815493062879488e-06,
+ "loss": 0.1486,
+ "step": 21396
+ },
+ {
+ "epoch": 58.30245231607629,
+ "grad_norm": 3.5135910511016846,
+ "learning_rate": 7.814631890772957e-06,
+ "loss": 0.1713,
+ "step": 21397
+ },
+ {
+ "epoch": 58.305177111716624,
+ "grad_norm": 4.737347602844238,
+ "learning_rate": 7.813770735686e-06,
+ "loss": 0.2697,
+ "step": 21398
+ },
+ {
+ "epoch": 58.30790190735695,
+ "grad_norm": 3.4451520442962646,
+ "learning_rate": 7.812909597625328e-06,
+ "loss": 0.1412,
+ "step": 21399
+ },
+ {
+ "epoch": 58.310626702997276,
+ "grad_norm": 4.710101127624512,
+ "learning_rate": 7.812048476597645e-06,
+ "loss": 0.0543,
+ "step": 21400
+ },
+ {
+ "epoch": 58.3133514986376,
+ "grad_norm": 4.055838108062744,
+ "learning_rate": 7.811187372609658e-06,
+ "loss": 0.0741,
+ "step": 21401
+ },
+ {
+ "epoch": 58.31607629427793,
+ "grad_norm": 4.483063220977783,
+ "learning_rate": 7.810326285668073e-06,
+ "loss": 0.1152,
+ "step": 21402
+ },
+ {
+ "epoch": 58.31880108991825,
+ "grad_norm": 3.3968918323516846,
+ "learning_rate": 7.809465215779596e-06,
+ "loss": 0.0614,
+ "step": 21403
+ },
+ {
+ "epoch": 58.321525885558586,
+ "grad_norm": 3.713894844055176,
+ "learning_rate": 7.808604162950934e-06,
+ "loss": 0.0972,
+ "step": 21404
+ },
+ {
+ "epoch": 58.32425068119891,
+ "grad_norm": 3.5638866424560547,
+ "learning_rate": 7.807743127188794e-06,
+ "loss": 0.0657,
+ "step": 21405
+ },
+ {
+ "epoch": 58.32697547683924,
+ "grad_norm": 4.74470329284668,
+ "learning_rate": 7.806882108499878e-06,
+ "loss": 0.1854,
+ "step": 21406
+ },
+ {
+ "epoch": 58.32970027247956,
+ "grad_norm": 4.56574010848999,
+ "learning_rate": 7.806021106890894e-06,
+ "loss": 0.0825,
+ "step": 21407
+ },
+ {
+ "epoch": 58.33242506811989,
+ "grad_norm": 3.5397439002990723,
+ "learning_rate": 7.805160122368548e-06,
+ "loss": 0.1053,
+ "step": 21408
+ },
+ {
+ "epoch": 58.335149863760215,
+ "grad_norm": 3.121457815170288,
+ "learning_rate": 7.804299154939543e-06,
+ "loss": 0.1497,
+ "step": 21409
+ },
+ {
+ "epoch": 58.33787465940055,
+ "grad_norm": 3.075286626815796,
+ "learning_rate": 7.803438204610584e-06,
+ "loss": 0.0687,
+ "step": 21410
+ },
+ {
+ "epoch": 58.34059945504087,
+ "grad_norm": 3.287900686264038,
+ "learning_rate": 7.802577271388381e-06,
+ "loss": 0.1355,
+ "step": 21411
+ },
+ {
+ "epoch": 58.3433242506812,
+ "grad_norm": 4.360344409942627,
+ "learning_rate": 7.801716355279632e-06,
+ "loss": 0.1377,
+ "step": 21412
+ },
+ {
+ "epoch": 58.346049046321525,
+ "grad_norm": 4.808806896209717,
+ "learning_rate": 7.800855456291045e-06,
+ "loss": 0.2072,
+ "step": 21413
+ },
+ {
+ "epoch": 58.34877384196185,
+ "grad_norm": 4.6278300285339355,
+ "learning_rate": 7.799994574429329e-06,
+ "loss": 0.1165,
+ "step": 21414
+ },
+ {
+ "epoch": 58.35149863760218,
+ "grad_norm": 2.3931100368499756,
+ "learning_rate": 7.79913370970118e-06,
+ "loss": 0.0474,
+ "step": 21415
+ },
+ {
+ "epoch": 58.35422343324251,
+ "grad_norm": 4.6696295738220215,
+ "learning_rate": 7.798272862113308e-06,
+ "loss": 0.0821,
+ "step": 21416
+ },
+ {
+ "epoch": 58.356948228882835,
+ "grad_norm": 3.7376925945281982,
+ "learning_rate": 7.797412031672419e-06,
+ "loss": 0.057,
+ "step": 21417
+ },
+ {
+ "epoch": 58.35967302452316,
+ "grad_norm": 3.901583671569824,
+ "learning_rate": 7.796551218385211e-06,
+ "loss": 0.073,
+ "step": 21418
+ },
+ {
+ "epoch": 58.36239782016349,
+ "grad_norm": 4.015518665313721,
+ "learning_rate": 7.795690422258394e-06,
+ "loss": 0.0653,
+ "step": 21419
+ },
+ {
+ "epoch": 58.36512261580381,
+ "grad_norm": 3.206453800201416,
+ "learning_rate": 7.794829643298667e-06,
+ "loss": 0.0632,
+ "step": 21420
+ },
+ {
+ "epoch": 58.36784741144414,
+ "grad_norm": 7.467257976531982,
+ "learning_rate": 7.793968881512737e-06,
+ "loss": 0.1243,
+ "step": 21421
+ },
+ {
+ "epoch": 58.37057220708447,
+ "grad_norm": 4.359302043914795,
+ "learning_rate": 7.793108136907306e-06,
+ "loss": 0.0704,
+ "step": 21422
+ },
+ {
+ "epoch": 58.3732970027248,
+ "grad_norm": 4.667004108428955,
+ "learning_rate": 7.79224740948908e-06,
+ "loss": 0.0965,
+ "step": 21423
+ },
+ {
+ "epoch": 58.37602179836512,
+ "grad_norm": 3.114868402481079,
+ "learning_rate": 7.791386699264756e-06,
+ "loss": 0.1781,
+ "step": 21424
+ },
+ {
+ "epoch": 58.37874659400545,
+ "grad_norm": 5.092816352844238,
+ "learning_rate": 7.790526006241044e-06,
+ "loss": 0.1404,
+ "step": 21425
+ },
+ {
+ "epoch": 58.381471389645775,
+ "grad_norm": 2.988006353378296,
+ "learning_rate": 7.789665330424643e-06,
+ "loss": 0.1273,
+ "step": 21426
+ },
+ {
+ "epoch": 58.3841961852861,
+ "grad_norm": 3.5393736362457275,
+ "learning_rate": 7.78880467182226e-06,
+ "loss": 0.0856,
+ "step": 21427
+ },
+ {
+ "epoch": 58.38692098092643,
+ "grad_norm": 3.369912624359131,
+ "learning_rate": 7.78794403044059e-06,
+ "loss": 0.2267,
+ "step": 21428
+ },
+ {
+ "epoch": 58.38964577656676,
+ "grad_norm": 4.061559200286865,
+ "learning_rate": 7.787083406286345e-06,
+ "loss": 0.1604,
+ "step": 21429
+ },
+ {
+ "epoch": 58.392370572207085,
+ "grad_norm": 3.5608556270599365,
+ "learning_rate": 7.78622279936622e-06,
+ "loss": 0.2598,
+ "step": 21430
+ },
+ {
+ "epoch": 58.39509536784741,
+ "grad_norm": 5.442565441131592,
+ "learning_rate": 7.78536220968692e-06,
+ "loss": 0.1797,
+ "step": 21431
+ },
+ {
+ "epoch": 58.39782016348774,
+ "grad_norm": 3.6805570125579834,
+ "learning_rate": 7.78450163725515e-06,
+ "loss": 0.0749,
+ "step": 21432
+ },
+ {
+ "epoch": 58.40054495912806,
+ "grad_norm": 3.387275218963623,
+ "learning_rate": 7.78364108207761e-06,
+ "loss": 0.0808,
+ "step": 21433
+ },
+ {
+ "epoch": 58.403269754768395,
+ "grad_norm": 4.009548664093018,
+ "learning_rate": 7.782780544161002e-06,
+ "loss": 0.1643,
+ "step": 21434
+ },
+ {
+ "epoch": 58.40599455040872,
+ "grad_norm": 6.480135917663574,
+ "learning_rate": 7.781920023512027e-06,
+ "loss": 0.2497,
+ "step": 21435
+ },
+ {
+ "epoch": 58.40871934604905,
+ "grad_norm": 4.250776290893555,
+ "learning_rate": 7.78105952013739e-06,
+ "loss": 0.1018,
+ "step": 21436
+ },
+ {
+ "epoch": 58.41144414168937,
+ "grad_norm": 3.59672212600708,
+ "learning_rate": 7.780199034043787e-06,
+ "loss": 0.1838,
+ "step": 21437
+ },
+ {
+ "epoch": 58.4141689373297,
+ "grad_norm": 4.79533576965332,
+ "learning_rate": 7.779338565237922e-06,
+ "loss": 0.251,
+ "step": 21438
+ },
+ {
+ "epoch": 58.416893732970024,
+ "grad_norm": 3.9480504989624023,
+ "learning_rate": 7.778478113726501e-06,
+ "loss": 0.1554,
+ "step": 21439
+ },
+ {
+ "epoch": 58.41961852861036,
+ "grad_norm": 4.790663719177246,
+ "learning_rate": 7.777617679516217e-06,
+ "loss": 0.2321,
+ "step": 21440
+ },
+ {
+ "epoch": 58.42234332425068,
+ "grad_norm": 4.551621437072754,
+ "learning_rate": 7.776757262613777e-06,
+ "loss": 0.0843,
+ "step": 21441
+ },
+ {
+ "epoch": 58.42506811989101,
+ "grad_norm": 4.327082633972168,
+ "learning_rate": 7.77589686302588e-06,
+ "loss": 0.0786,
+ "step": 21442
+ },
+ {
+ "epoch": 58.427792915531334,
+ "grad_norm": 3.325671434402466,
+ "learning_rate": 7.775036480759226e-06,
+ "loss": 0.0904,
+ "step": 21443
+ },
+ {
+ "epoch": 58.43051771117166,
+ "grad_norm": 4.046737194061279,
+ "learning_rate": 7.774176115820516e-06,
+ "loss": 0.0647,
+ "step": 21444
+ },
+ {
+ "epoch": 58.433242506811986,
+ "grad_norm": 2.9866275787353516,
+ "learning_rate": 7.773315768216452e-06,
+ "loss": 0.05,
+ "step": 21445
+ },
+ {
+ "epoch": 58.43596730245232,
+ "grad_norm": 4.174355506896973,
+ "learning_rate": 7.772455437953731e-06,
+ "loss": 0.0584,
+ "step": 21446
+ },
+ {
+ "epoch": 58.438692098092645,
+ "grad_norm": 3.5630075931549072,
+ "learning_rate": 7.771595125039053e-06,
+ "loss": 0.3054,
+ "step": 21447
+ },
+ {
+ "epoch": 58.44141689373297,
+ "grad_norm": 3.7853434085845947,
+ "learning_rate": 7.770734829479126e-06,
+ "loss": 0.0693,
+ "step": 21448
+ },
+ {
+ "epoch": 58.444141689373296,
+ "grad_norm": 4.610340118408203,
+ "learning_rate": 7.76987455128064e-06,
+ "loss": 0.2594,
+ "step": 21449
+ },
+ {
+ "epoch": 58.44686648501362,
+ "grad_norm": 4.337750434875488,
+ "learning_rate": 7.769014290450303e-06,
+ "loss": 0.1092,
+ "step": 21450
+ },
+ {
+ "epoch": 58.44959128065395,
+ "grad_norm": 4.147157192230225,
+ "learning_rate": 7.76815404699481e-06,
+ "loss": 0.1268,
+ "step": 21451
+ },
+ {
+ "epoch": 58.45231607629428,
+ "grad_norm": 4.715500354766846,
+ "learning_rate": 7.76729382092086e-06,
+ "loss": 0.0855,
+ "step": 21452
+ },
+ {
+ "epoch": 58.45504087193461,
+ "grad_norm": 5.13818359375,
+ "learning_rate": 7.766433612235154e-06,
+ "loss": 0.09,
+ "step": 21453
+ },
+ {
+ "epoch": 58.45776566757493,
+ "grad_norm": 3.5562307834625244,
+ "learning_rate": 7.765573420944394e-06,
+ "loss": 0.0597,
+ "step": 21454
+ },
+ {
+ "epoch": 58.46049046321526,
+ "grad_norm": 8.059571266174316,
+ "learning_rate": 7.764713247055273e-06,
+ "loss": 0.1189,
+ "step": 21455
+ },
+ {
+ "epoch": 58.463215258855584,
+ "grad_norm": 4.303390979766846,
+ "learning_rate": 7.763853090574495e-06,
+ "loss": 0.0741,
+ "step": 21456
+ },
+ {
+ "epoch": 58.46594005449591,
+ "grad_norm": 3.4709019660949707,
+ "learning_rate": 7.762992951508757e-06,
+ "loss": 0.0471,
+ "step": 21457
+ },
+ {
+ "epoch": 58.46866485013624,
+ "grad_norm": 4.330159664154053,
+ "learning_rate": 7.762132829864757e-06,
+ "loss": 0.0934,
+ "step": 21458
+ },
+ {
+ "epoch": 58.47138964577657,
+ "grad_norm": 5.4488911628723145,
+ "learning_rate": 7.761272725649195e-06,
+ "loss": 0.0801,
+ "step": 21459
+ },
+ {
+ "epoch": 58.474114441416894,
+ "grad_norm": 4.719922065734863,
+ "learning_rate": 7.760412638868768e-06,
+ "loss": 0.0891,
+ "step": 21460
+ },
+ {
+ "epoch": 58.47683923705722,
+ "grad_norm": 4.579160690307617,
+ "learning_rate": 7.759552569530178e-06,
+ "loss": 0.0819,
+ "step": 21461
+ },
+ {
+ "epoch": 58.479564032697546,
+ "grad_norm": 3.2546329498291016,
+ "learning_rate": 7.758692517640117e-06,
+ "loss": 0.1069,
+ "step": 21462
+ },
+ {
+ "epoch": 58.48228882833787,
+ "grad_norm": 2.822486162185669,
+ "learning_rate": 7.75783248320529e-06,
+ "loss": 0.0632,
+ "step": 21463
+ },
+ {
+ "epoch": 58.485013623978205,
+ "grad_norm": 4.434988498687744,
+ "learning_rate": 7.756972466232388e-06,
+ "loss": 0.0693,
+ "step": 21464
+ },
+ {
+ "epoch": 58.48773841961853,
+ "grad_norm": 3.8925631046295166,
+ "learning_rate": 7.756112466728111e-06,
+ "loss": 0.1362,
+ "step": 21465
+ },
+ {
+ "epoch": 58.490463215258856,
+ "grad_norm": 3.5528383255004883,
+ "learning_rate": 7.755252484699163e-06,
+ "loss": 0.1053,
+ "step": 21466
+ },
+ {
+ "epoch": 58.49318801089918,
+ "grad_norm": 3.9033761024475098,
+ "learning_rate": 7.754392520152233e-06,
+ "loss": 0.1055,
+ "step": 21467
+ },
+ {
+ "epoch": 58.49591280653951,
+ "grad_norm": 3.428138017654419,
+ "learning_rate": 7.753532573094024e-06,
+ "loss": 0.0671,
+ "step": 21468
+ },
+ {
+ "epoch": 58.49863760217983,
+ "grad_norm": 5.6496262550354,
+ "learning_rate": 7.75267264353123e-06,
+ "loss": 0.1115,
+ "step": 21469
+ },
+ {
+ "epoch": 58.50136239782017,
+ "grad_norm": 4.147008419036865,
+ "learning_rate": 7.751812731470549e-06,
+ "loss": 0.1251,
+ "step": 21470
+ },
+ {
+ "epoch": 58.50408719346049,
+ "grad_norm": 3.3708302974700928,
+ "learning_rate": 7.750952836918679e-06,
+ "loss": 0.0984,
+ "step": 21471
+ },
+ {
+ "epoch": 58.50681198910082,
+ "grad_norm": 4.073522567749023,
+ "learning_rate": 7.750092959882315e-06,
+ "loss": 0.1517,
+ "step": 21472
+ },
+ {
+ "epoch": 58.509536784741144,
+ "grad_norm": 13.929010391235352,
+ "learning_rate": 7.749233100368155e-06,
+ "loss": 0.0846,
+ "step": 21473
+ },
+ {
+ "epoch": 58.51226158038147,
+ "grad_norm": 3.3463056087493896,
+ "learning_rate": 7.748373258382896e-06,
+ "loss": 0.2056,
+ "step": 21474
+ },
+ {
+ "epoch": 58.514986376021795,
+ "grad_norm": 3.756589889526367,
+ "learning_rate": 7.747513433933231e-06,
+ "loss": 0.1352,
+ "step": 21475
+ },
+ {
+ "epoch": 58.51771117166213,
+ "grad_norm": 3.955935001373291,
+ "learning_rate": 7.746653627025861e-06,
+ "loss": 0.1816,
+ "step": 21476
+ },
+ {
+ "epoch": 58.520435967302454,
+ "grad_norm": 3.919924259185791,
+ "learning_rate": 7.745793837667479e-06,
+ "loss": 0.0746,
+ "step": 21477
+ },
+ {
+ "epoch": 58.52316076294278,
+ "grad_norm": 5.583837032318115,
+ "learning_rate": 7.744934065864785e-06,
+ "loss": 0.1019,
+ "step": 21478
+ },
+ {
+ "epoch": 58.525885558583106,
+ "grad_norm": 4.4430155754089355,
+ "learning_rate": 7.744074311624468e-06,
+ "loss": 0.0647,
+ "step": 21479
+ },
+ {
+ "epoch": 58.52861035422343,
+ "grad_norm": 3.9184672832489014,
+ "learning_rate": 7.743214574953231e-06,
+ "loss": 0.0539,
+ "step": 21480
+ },
+ {
+ "epoch": 58.53133514986376,
+ "grad_norm": 3.769113063812256,
+ "learning_rate": 7.742354855857761e-06,
+ "loss": 0.0516,
+ "step": 21481
+ },
+ {
+ "epoch": 58.53405994550409,
+ "grad_norm": 4.248811721801758,
+ "learning_rate": 7.74149515434476e-06,
+ "loss": 0.1288,
+ "step": 21482
+ },
+ {
+ "epoch": 58.536784741144416,
+ "grad_norm": 3.2389869689941406,
+ "learning_rate": 7.740635470420922e-06,
+ "loss": 0.1682,
+ "step": 21483
+ },
+ {
+ "epoch": 58.53950953678474,
+ "grad_norm": 3.2946629524230957,
+ "learning_rate": 7.739775804092947e-06,
+ "loss": 0.0769,
+ "step": 21484
+ },
+ {
+ "epoch": 58.54223433242507,
+ "grad_norm": 4.172604560852051,
+ "learning_rate": 7.738916155367522e-06,
+ "loss": 0.103,
+ "step": 21485
+ },
+ {
+ "epoch": 58.54495912806539,
+ "grad_norm": 3.7815375328063965,
+ "learning_rate": 7.738056524251347e-06,
+ "loss": 0.2709,
+ "step": 21486
+ },
+ {
+ "epoch": 58.54768392370572,
+ "grad_norm": 3.3296620845794678,
+ "learning_rate": 7.737196910751113e-06,
+ "loss": 0.0737,
+ "step": 21487
+ },
+ {
+ "epoch": 58.55040871934605,
+ "grad_norm": 3.880136489868164,
+ "learning_rate": 7.73633731487352e-06,
+ "loss": 0.1735,
+ "step": 21488
+ },
+ {
+ "epoch": 58.55313351498638,
+ "grad_norm": 3.3581833839416504,
+ "learning_rate": 7.735477736625255e-06,
+ "loss": 0.1288,
+ "step": 21489
+ },
+ {
+ "epoch": 58.555858310626704,
+ "grad_norm": 7.105356216430664,
+ "learning_rate": 7.73461817601302e-06,
+ "loss": 0.1674,
+ "step": 21490
+ },
+ {
+ "epoch": 58.55858310626703,
+ "grad_norm": 5.7333083152771,
+ "learning_rate": 7.733758633043502e-06,
+ "loss": 0.1656,
+ "step": 21491
+ },
+ {
+ "epoch": 58.561307901907355,
+ "grad_norm": 4.50360631942749,
+ "learning_rate": 7.732899107723401e-06,
+ "loss": 0.1094,
+ "step": 21492
+ },
+ {
+ "epoch": 58.56403269754768,
+ "grad_norm": 3.3514621257781982,
+ "learning_rate": 7.732039600059407e-06,
+ "loss": 0.1267,
+ "step": 21493
+ },
+ {
+ "epoch": 58.566757493188014,
+ "grad_norm": 5.052760601043701,
+ "learning_rate": 7.73118011005822e-06,
+ "loss": 0.049,
+ "step": 21494
+ },
+ {
+ "epoch": 58.56948228882834,
+ "grad_norm": 5.315223217010498,
+ "learning_rate": 7.730320637726524e-06,
+ "loss": 0.1214,
+ "step": 21495
+ },
+ {
+ "epoch": 58.572207084468666,
+ "grad_norm": 3.963050603866577,
+ "learning_rate": 7.729461183071023e-06,
+ "loss": 0.1245,
+ "step": 21496
+ },
+ {
+ "epoch": 58.57493188010899,
+ "grad_norm": 6.392207622528076,
+ "learning_rate": 7.728601746098401e-06,
+ "loss": 0.1709,
+ "step": 21497
+ },
+ {
+ "epoch": 58.57765667574932,
+ "grad_norm": 3.605137586593628,
+ "learning_rate": 7.727742326815357e-06,
+ "loss": 0.0681,
+ "step": 21498
+ },
+ {
+ "epoch": 58.58038147138964,
+ "grad_norm": 3.6206047534942627,
+ "learning_rate": 7.72688292522858e-06,
+ "loss": 0.073,
+ "step": 21499
+ },
+ {
+ "epoch": 58.583106267029976,
+ "grad_norm": 5.480008602142334,
+ "learning_rate": 7.726023541344767e-06,
+ "loss": 0.1793,
+ "step": 21500
+ },
+ {
+ "epoch": 58.5858310626703,
+ "grad_norm": 4.394006252288818,
+ "learning_rate": 7.725164175170611e-06,
+ "loss": 0.2018,
+ "step": 21501
+ },
+ {
+ "epoch": 58.58855585831063,
+ "grad_norm": 5.898493766784668,
+ "learning_rate": 7.724304826712802e-06,
+ "loss": 0.1331,
+ "step": 21502
+ },
+ {
+ "epoch": 58.59128065395095,
+ "grad_norm": 3.7584009170532227,
+ "learning_rate": 7.723445495978034e-06,
+ "loss": 0.0893,
+ "step": 21503
+ },
+ {
+ "epoch": 58.59400544959128,
+ "grad_norm": 3.396317481994629,
+ "learning_rate": 7.722586182973002e-06,
+ "loss": 0.0871,
+ "step": 21504
+ },
+ {
+ "epoch": 58.596730245231605,
+ "grad_norm": 4.105969429016113,
+ "learning_rate": 7.721726887704392e-06,
+ "loss": 0.0996,
+ "step": 21505
+ },
+ {
+ "epoch": 58.59945504087194,
+ "grad_norm": 3.7845029830932617,
+ "learning_rate": 7.720867610178902e-06,
+ "loss": 0.1126,
+ "step": 21506
+ },
+ {
+ "epoch": 58.60217983651226,
+ "grad_norm": 6.148295879364014,
+ "learning_rate": 7.72000835040322e-06,
+ "loss": 0.2394,
+ "step": 21507
+ },
+ {
+ "epoch": 58.60490463215259,
+ "grad_norm": 4.514403820037842,
+ "learning_rate": 7.719149108384042e-06,
+ "loss": 0.1659,
+ "step": 21508
+ },
+ {
+ "epoch": 58.607629427792915,
+ "grad_norm": 3.663196086883545,
+ "learning_rate": 7.718289884128054e-06,
+ "loss": 0.0688,
+ "step": 21509
+ },
+ {
+ "epoch": 58.61035422343324,
+ "grad_norm": 3.3898158073425293,
+ "learning_rate": 7.717430677641954e-06,
+ "loss": 0.0567,
+ "step": 21510
+ },
+ {
+ "epoch": 58.61307901907357,
+ "grad_norm": 4.63852596282959,
+ "learning_rate": 7.716571488932427e-06,
+ "loss": 0.0974,
+ "step": 21511
+ },
+ {
+ "epoch": 58.6158038147139,
+ "grad_norm": 3.5420165061950684,
+ "learning_rate": 7.715712318006173e-06,
+ "loss": 0.1034,
+ "step": 21512
+ },
+ {
+ "epoch": 58.618528610354225,
+ "grad_norm": 3.5376248359680176,
+ "learning_rate": 7.714853164869872e-06,
+ "loss": 0.0632,
+ "step": 21513
+ },
+ {
+ "epoch": 58.62125340599455,
+ "grad_norm": 3.5798234939575195,
+ "learning_rate": 7.713994029530224e-06,
+ "loss": 0.1411,
+ "step": 21514
+ },
+ {
+ "epoch": 58.62397820163488,
+ "grad_norm": 3.4283549785614014,
+ "learning_rate": 7.713134911993917e-06,
+ "loss": 0.1473,
+ "step": 21515
+ },
+ {
+ "epoch": 58.6267029972752,
+ "grad_norm": 4.478358268737793,
+ "learning_rate": 7.712275812267638e-06,
+ "loss": 0.1915,
+ "step": 21516
+ },
+ {
+ "epoch": 58.62942779291553,
+ "grad_norm": 4.1488237380981445,
+ "learning_rate": 7.711416730358085e-06,
+ "loss": 0.0788,
+ "step": 21517
+ },
+ {
+ "epoch": 58.63215258855586,
+ "grad_norm": 4.851395130157471,
+ "learning_rate": 7.710557666271943e-06,
+ "loss": 0.1862,
+ "step": 21518
+ },
+ {
+ "epoch": 58.63487738419619,
+ "grad_norm": 4.15927791595459,
+ "learning_rate": 7.709698620015908e-06,
+ "loss": 0.1268,
+ "step": 21519
+ },
+ {
+ "epoch": 58.63760217983651,
+ "grad_norm": 3.2418174743652344,
+ "learning_rate": 7.708839591596663e-06,
+ "loss": 0.121,
+ "step": 21520
+ },
+ {
+ "epoch": 58.64032697547684,
+ "grad_norm": 4.322272300720215,
+ "learning_rate": 7.707980581020903e-06,
+ "loss": 0.1349,
+ "step": 21521
+ },
+ {
+ "epoch": 58.643051771117165,
+ "grad_norm": 4.424936771392822,
+ "learning_rate": 7.707121588295316e-06,
+ "loss": 0.06,
+ "step": 21522
+ },
+ {
+ "epoch": 58.64577656675749,
+ "grad_norm": 4.182270050048828,
+ "learning_rate": 7.706262613426594e-06,
+ "loss": 0.0556,
+ "step": 21523
+ },
+ {
+ "epoch": 58.64850136239782,
+ "grad_norm": 3.3170406818389893,
+ "learning_rate": 7.705403656421422e-06,
+ "loss": 0.1684,
+ "step": 21524
+ },
+ {
+ "epoch": 58.65122615803815,
+ "grad_norm": 4.232260704040527,
+ "learning_rate": 7.704544717286493e-06,
+ "loss": 0.0699,
+ "step": 21525
+ },
+ {
+ "epoch": 58.653950953678475,
+ "grad_norm": 4.209249019622803,
+ "learning_rate": 7.703685796028499e-06,
+ "loss": 0.0765,
+ "step": 21526
+ },
+ {
+ "epoch": 58.6566757493188,
+ "grad_norm": 3.5731842517852783,
+ "learning_rate": 7.702826892654121e-06,
+ "loss": 0.0448,
+ "step": 21527
+ },
+ {
+ "epoch": 58.65940054495913,
+ "grad_norm": 3.5391786098480225,
+ "learning_rate": 7.701968007170057e-06,
+ "loss": 0.0694,
+ "step": 21528
+ },
+ {
+ "epoch": 58.66212534059945,
+ "grad_norm": 3.4241995811462402,
+ "learning_rate": 7.701109139582993e-06,
+ "loss": 0.2635,
+ "step": 21529
+ },
+ {
+ "epoch": 58.664850136239785,
+ "grad_norm": 6.018126964569092,
+ "learning_rate": 7.700250289899614e-06,
+ "loss": 0.1424,
+ "step": 21530
+ },
+ {
+ "epoch": 58.66757493188011,
+ "grad_norm": 3.708371162414551,
+ "learning_rate": 7.699391458126612e-06,
+ "loss": 0.1822,
+ "step": 21531
+ },
+ {
+ "epoch": 58.67029972752044,
+ "grad_norm": 4.279620170593262,
+ "learning_rate": 7.698532644270678e-06,
+ "loss": 0.265,
+ "step": 21532
+ },
+ {
+ "epoch": 58.67302452316076,
+ "grad_norm": 5.6820969581604,
+ "learning_rate": 7.697673848338495e-06,
+ "loss": 0.0961,
+ "step": 21533
+ },
+ {
+ "epoch": 58.67574931880109,
+ "grad_norm": 3.770305871963501,
+ "learning_rate": 7.696815070336752e-06,
+ "loss": 0.0676,
+ "step": 21534
+ },
+ {
+ "epoch": 58.678474114441414,
+ "grad_norm": 4.238286018371582,
+ "learning_rate": 7.695956310272143e-06,
+ "loss": 0.1453,
+ "step": 21535
+ },
+ {
+ "epoch": 58.68119891008175,
+ "grad_norm": 3.1553149223327637,
+ "learning_rate": 7.695097568151351e-06,
+ "loss": 0.1258,
+ "step": 21536
+ },
+ {
+ "epoch": 58.68392370572207,
+ "grad_norm": 3.0492682456970215,
+ "learning_rate": 7.694238843981066e-06,
+ "loss": 0.0873,
+ "step": 21537
+ },
+ {
+ "epoch": 58.6866485013624,
+ "grad_norm": 3.081958055496216,
+ "learning_rate": 7.693380137767971e-06,
+ "loss": 0.0869,
+ "step": 21538
+ },
+ {
+ "epoch": 58.689373297002724,
+ "grad_norm": 3.7943410873413086,
+ "learning_rate": 7.692521449518763e-06,
+ "loss": 0.0703,
+ "step": 21539
+ },
+ {
+ "epoch": 58.69209809264305,
+ "grad_norm": 4.566564083099365,
+ "learning_rate": 7.691662779240119e-06,
+ "loss": 0.1587,
+ "step": 21540
+ },
+ {
+ "epoch": 58.694822888283376,
+ "grad_norm": 4.0657572746276855,
+ "learning_rate": 7.690804126938733e-06,
+ "loss": 0.0757,
+ "step": 21541
+ },
+ {
+ "epoch": 58.69754768392371,
+ "grad_norm": 3.274008274078369,
+ "learning_rate": 7.68994549262129e-06,
+ "loss": 0.0666,
+ "step": 21542
+ },
+ {
+ "epoch": 58.700272479564035,
+ "grad_norm": 3.5570719242095947,
+ "learning_rate": 7.689086876294479e-06,
+ "loss": 0.3087,
+ "step": 21543
+ },
+ {
+ "epoch": 58.70299727520436,
+ "grad_norm": 2.881232500076294,
+ "learning_rate": 7.68822827796498e-06,
+ "loss": 0.0512,
+ "step": 21544
+ },
+ {
+ "epoch": 58.705722070844686,
+ "grad_norm": 3.1296496391296387,
+ "learning_rate": 7.68736969763949e-06,
+ "loss": 0.0736,
+ "step": 21545
+ },
+ {
+ "epoch": 58.70844686648501,
+ "grad_norm": 3.461085557937622,
+ "learning_rate": 7.686511135324687e-06,
+ "loss": 0.0604,
+ "step": 21546
+ },
+ {
+ "epoch": 58.71117166212534,
+ "grad_norm": 3.1067328453063965,
+ "learning_rate": 7.685652591027261e-06,
+ "loss": 0.1282,
+ "step": 21547
+ },
+ {
+ "epoch": 58.71389645776567,
+ "grad_norm": 2.9073550701141357,
+ "learning_rate": 7.6847940647539e-06,
+ "loss": 0.1454,
+ "step": 21548
+ },
+ {
+ "epoch": 58.716621253406,
+ "grad_norm": 3.7609846591949463,
+ "learning_rate": 7.683935556511287e-06,
+ "loss": 0.1043,
+ "step": 21549
+ },
+ {
+ "epoch": 58.71934604904632,
+ "grad_norm": 4.674740791320801,
+ "learning_rate": 7.68307706630611e-06,
+ "loss": 0.2425,
+ "step": 21550
+ },
+ {
+ "epoch": 58.72207084468665,
+ "grad_norm": 4.871628761291504,
+ "learning_rate": 7.682218594145052e-06,
+ "loss": 0.2236,
+ "step": 21551
+ },
+ {
+ "epoch": 58.724795640326974,
+ "grad_norm": 4.0654191970825195,
+ "learning_rate": 7.681360140034802e-06,
+ "loss": 0.1669,
+ "step": 21552
+ },
+ {
+ "epoch": 58.7275204359673,
+ "grad_norm": 3.182121992111206,
+ "learning_rate": 7.680501703982047e-06,
+ "loss": 0.1692,
+ "step": 21553
+ },
+ {
+ "epoch": 58.73024523160763,
+ "grad_norm": 4.811152458190918,
+ "learning_rate": 7.679643285993466e-06,
+ "loss": 0.1249,
+ "step": 21554
+ },
+ {
+ "epoch": 58.73297002724796,
+ "grad_norm": 3.7067596912384033,
+ "learning_rate": 7.678784886075753e-06,
+ "loss": 0.1163,
+ "step": 21555
+ },
+ {
+ "epoch": 58.735694822888284,
+ "grad_norm": 3.1542389392852783,
+ "learning_rate": 7.677926504235585e-06,
+ "loss": 0.0612,
+ "step": 21556
+ },
+ {
+ "epoch": 58.73841961852861,
+ "grad_norm": 3.0129261016845703,
+ "learning_rate": 7.677068140479654e-06,
+ "loss": 0.2432,
+ "step": 21557
+ },
+ {
+ "epoch": 58.741144414168936,
+ "grad_norm": 2.8790557384490967,
+ "learning_rate": 7.676209794814639e-06,
+ "loss": 0.0482,
+ "step": 21558
+ },
+ {
+ "epoch": 58.74386920980926,
+ "grad_norm": 3.94728946685791,
+ "learning_rate": 7.67535146724723e-06,
+ "loss": 0.0951,
+ "step": 21559
+ },
+ {
+ "epoch": 58.746594005449595,
+ "grad_norm": 3.058041572570801,
+ "learning_rate": 7.674493157784106e-06,
+ "loss": 0.1165,
+ "step": 21560
+ },
+ {
+ "epoch": 58.74931880108992,
+ "grad_norm": 3.3404855728149414,
+ "learning_rate": 7.673634866431955e-06,
+ "loss": 0.0721,
+ "step": 21561
+ },
+ {
+ "epoch": 58.752043596730246,
+ "grad_norm": 5.324344635009766,
+ "learning_rate": 7.672776593197463e-06,
+ "loss": 0.1768,
+ "step": 21562
+ },
+ {
+ "epoch": 58.75476839237057,
+ "grad_norm": 3.7187886238098145,
+ "learning_rate": 7.67191833808731e-06,
+ "loss": 0.0909,
+ "step": 21563
+ },
+ {
+ "epoch": 58.7574931880109,
+ "grad_norm": 5.002996444702148,
+ "learning_rate": 7.671060101108182e-06,
+ "loss": 0.0889,
+ "step": 21564
+ },
+ {
+ "epoch": 58.76021798365122,
+ "grad_norm": 3.5215115547180176,
+ "learning_rate": 7.670201882266764e-06,
+ "loss": 0.0895,
+ "step": 21565
+ },
+ {
+ "epoch": 58.762942779291556,
+ "grad_norm": 4.215787887573242,
+ "learning_rate": 7.669343681569737e-06,
+ "loss": 0.1413,
+ "step": 21566
+ },
+ {
+ "epoch": 58.76566757493188,
+ "grad_norm": 3.1859095096588135,
+ "learning_rate": 7.66848549902379e-06,
+ "loss": 0.1498,
+ "step": 21567
+ },
+ {
+ "epoch": 58.76839237057221,
+ "grad_norm": 3.565659284591675,
+ "learning_rate": 7.667627334635595e-06,
+ "loss": 0.0579,
+ "step": 21568
+ },
+ {
+ "epoch": 58.771117166212534,
+ "grad_norm": 3.4855968952178955,
+ "learning_rate": 7.666769188411848e-06,
+ "loss": 0.0735,
+ "step": 21569
+ },
+ {
+ "epoch": 58.77384196185286,
+ "grad_norm": 4.283398628234863,
+ "learning_rate": 7.665911060359228e-06,
+ "loss": 0.2532,
+ "step": 21570
+ },
+ {
+ "epoch": 58.776566757493185,
+ "grad_norm": 3.126268148422241,
+ "learning_rate": 7.66505295048442e-06,
+ "loss": 0.1428,
+ "step": 21571
+ },
+ {
+ "epoch": 58.77929155313352,
+ "grad_norm": 4.907703399658203,
+ "learning_rate": 7.6641948587941e-06,
+ "loss": 0.1766,
+ "step": 21572
+ },
+ {
+ "epoch": 58.782016348773844,
+ "grad_norm": 4.114948749542236,
+ "learning_rate": 7.663336785294959e-06,
+ "loss": 0.1095,
+ "step": 21573
+ },
+ {
+ "epoch": 58.78474114441417,
+ "grad_norm": 3.390493154525757,
+ "learning_rate": 7.662478729993673e-06,
+ "loss": 0.1895,
+ "step": 21574
+ },
+ {
+ "epoch": 58.787465940054496,
+ "grad_norm": 3.6392195224761963,
+ "learning_rate": 7.661620692896931e-06,
+ "loss": 0.114,
+ "step": 21575
+ },
+ {
+ "epoch": 58.79019073569482,
+ "grad_norm": 4.038777828216553,
+ "learning_rate": 7.660762674011408e-06,
+ "loss": 0.1706,
+ "step": 21576
+ },
+ {
+ "epoch": 58.79291553133515,
+ "grad_norm": 3.585653066635132,
+ "learning_rate": 7.659904673343793e-06,
+ "loss": 0.0877,
+ "step": 21577
+ },
+ {
+ "epoch": 58.79564032697548,
+ "grad_norm": 5.2134575843811035,
+ "learning_rate": 7.659046690900762e-06,
+ "loss": 0.1707,
+ "step": 21578
+ },
+ {
+ "epoch": 58.798365122615806,
+ "grad_norm": 3.6076905727386475,
+ "learning_rate": 7.658188726689003e-06,
+ "loss": 0.1078,
+ "step": 21579
+ },
+ {
+ "epoch": 58.80108991825613,
+ "grad_norm": 4.470366477966309,
+ "learning_rate": 7.657330780715193e-06,
+ "loss": 0.181,
+ "step": 21580
+ },
+ {
+ "epoch": 58.80381471389646,
+ "grad_norm": 3.638078451156616,
+ "learning_rate": 7.656472852986017e-06,
+ "loss": 0.1224,
+ "step": 21581
+ },
+ {
+ "epoch": 58.80653950953678,
+ "grad_norm": 3.5840208530426025,
+ "learning_rate": 7.655614943508153e-06,
+ "loss": 0.108,
+ "step": 21582
+ },
+ {
+ "epoch": 58.80926430517711,
+ "grad_norm": 6.398871421813965,
+ "learning_rate": 7.654757052288286e-06,
+ "loss": 0.0816,
+ "step": 21583
+ },
+ {
+ "epoch": 58.81198910081744,
+ "grad_norm": 3.523592472076416,
+ "learning_rate": 7.653899179333094e-06,
+ "loss": 0.1269,
+ "step": 21584
+ },
+ {
+ "epoch": 58.81471389645777,
+ "grad_norm": 4.927404403686523,
+ "learning_rate": 7.653041324649258e-06,
+ "loss": 0.066,
+ "step": 21585
+ },
+ {
+ "epoch": 58.817438692098094,
+ "grad_norm": 3.422100067138672,
+ "learning_rate": 7.652183488243465e-06,
+ "loss": 0.0608,
+ "step": 21586
+ },
+ {
+ "epoch": 58.82016348773842,
+ "grad_norm": 3.7407214641571045,
+ "learning_rate": 7.651325670122389e-06,
+ "loss": 0.0925,
+ "step": 21587
+ },
+ {
+ "epoch": 58.822888283378745,
+ "grad_norm": 3.263108968734741,
+ "learning_rate": 7.650467870292711e-06,
+ "loss": 0.0745,
+ "step": 21588
+ },
+ {
+ "epoch": 58.82561307901907,
+ "grad_norm": 4.6756815910339355,
+ "learning_rate": 7.649610088761117e-06,
+ "loss": 0.3144,
+ "step": 21589
+ },
+ {
+ "epoch": 58.828337874659404,
+ "grad_norm": 5.076279640197754,
+ "learning_rate": 7.648752325534283e-06,
+ "loss": 0.0882,
+ "step": 21590
+ },
+ {
+ "epoch": 58.83106267029973,
+ "grad_norm": 3.9108126163482666,
+ "learning_rate": 7.647894580618892e-06,
+ "loss": 0.0979,
+ "step": 21591
+ },
+ {
+ "epoch": 58.833787465940055,
+ "grad_norm": 3.7094666957855225,
+ "learning_rate": 7.64703685402162e-06,
+ "loss": 0.1617,
+ "step": 21592
+ },
+ {
+ "epoch": 58.83651226158038,
+ "grad_norm": 3.3642637729644775,
+ "learning_rate": 7.646179145749151e-06,
+ "loss": 0.0763,
+ "step": 21593
+ },
+ {
+ "epoch": 58.83923705722071,
+ "grad_norm": 4.531522750854492,
+ "learning_rate": 7.645321455808162e-06,
+ "loss": 0.1066,
+ "step": 21594
+ },
+ {
+ "epoch": 58.84196185286103,
+ "grad_norm": 3.2476766109466553,
+ "learning_rate": 7.644463784205335e-06,
+ "loss": 0.0698,
+ "step": 21595
+ },
+ {
+ "epoch": 58.844686648501366,
+ "grad_norm": 3.3269529342651367,
+ "learning_rate": 7.643606130947345e-06,
+ "loss": 0.0512,
+ "step": 21596
+ },
+ {
+ "epoch": 58.84741144414169,
+ "grad_norm": 3.5970005989074707,
+ "learning_rate": 7.64274849604088e-06,
+ "loss": 0.2536,
+ "step": 21597
+ },
+ {
+ "epoch": 58.85013623978202,
+ "grad_norm": 3.4453017711639404,
+ "learning_rate": 7.641890879492608e-06,
+ "loss": 0.0743,
+ "step": 21598
+ },
+ {
+ "epoch": 58.85286103542234,
+ "grad_norm": 4.354587554931641,
+ "learning_rate": 7.641033281309219e-06,
+ "loss": 0.1206,
+ "step": 21599
+ },
+ {
+ "epoch": 58.85558583106267,
+ "grad_norm": 3.3186676502227783,
+ "learning_rate": 7.640175701497383e-06,
+ "loss": 0.065,
+ "step": 21600
+ },
+ {
+ "epoch": 58.858310626702995,
+ "grad_norm": 4.4106950759887695,
+ "learning_rate": 7.639318140063785e-06,
+ "loss": 0.0593,
+ "step": 21601
+ },
+ {
+ "epoch": 58.86103542234333,
+ "grad_norm": 3.0654456615448,
+ "learning_rate": 7.638460597015097e-06,
+ "loss": 0.0836,
+ "step": 21602
+ },
+ {
+ "epoch": 58.86376021798365,
+ "grad_norm": 3.552016258239746,
+ "learning_rate": 7.637603072358004e-06,
+ "loss": 0.122,
+ "step": 21603
+ },
+ {
+ "epoch": 58.86648501362398,
+ "grad_norm": 6.45775032043457,
+ "learning_rate": 7.636745566099185e-06,
+ "loss": 0.1001,
+ "step": 21604
+ },
+ {
+ "epoch": 58.869209809264305,
+ "grad_norm": 3.066519260406494,
+ "learning_rate": 7.635888078245312e-06,
+ "loss": 0.1041,
+ "step": 21605
+ },
+ {
+ "epoch": 58.87193460490463,
+ "grad_norm": 3.6877498626708984,
+ "learning_rate": 7.635030608803072e-06,
+ "loss": 0.0741,
+ "step": 21606
+ },
+ {
+ "epoch": 58.87465940054496,
+ "grad_norm": 4.111044883728027,
+ "learning_rate": 7.634173157779133e-06,
+ "loss": 0.3042,
+ "step": 21607
+ },
+ {
+ "epoch": 58.87738419618529,
+ "grad_norm": 3.6182291507720947,
+ "learning_rate": 7.633315725180178e-06,
+ "loss": 0.0835,
+ "step": 21608
+ },
+ {
+ "epoch": 58.880108991825615,
+ "grad_norm": 2.8847904205322266,
+ "learning_rate": 7.632458311012884e-06,
+ "loss": 0.1888,
+ "step": 21609
+ },
+ {
+ "epoch": 58.88283378746594,
+ "grad_norm": 3.524197816848755,
+ "learning_rate": 7.63160091528393e-06,
+ "loss": 0.091,
+ "step": 21610
+ },
+ {
+ "epoch": 58.88555858310627,
+ "grad_norm": 3.9682729244232178,
+ "learning_rate": 7.630743537999989e-06,
+ "loss": 0.0787,
+ "step": 21611
+ },
+ {
+ "epoch": 58.88828337874659,
+ "grad_norm": 3.8259661197662354,
+ "learning_rate": 7.629886179167743e-06,
+ "loss": 0.1559,
+ "step": 21612
+ },
+ {
+ "epoch": 58.89100817438692,
+ "grad_norm": 3.9684224128723145,
+ "learning_rate": 7.629028838793867e-06,
+ "loss": 0.1177,
+ "step": 21613
+ },
+ {
+ "epoch": 58.89373297002725,
+ "grad_norm": 4.789135456085205,
+ "learning_rate": 7.6281715168850364e-06,
+ "loss": 0.0941,
+ "step": 21614
+ },
+ {
+ "epoch": 58.89645776566758,
+ "grad_norm": 6.84328556060791,
+ "learning_rate": 7.6273142134479335e-06,
+ "loss": 0.1571,
+ "step": 21615
+ },
+ {
+ "epoch": 58.8991825613079,
+ "grad_norm": 3.524958848953247,
+ "learning_rate": 7.626456928489228e-06,
+ "loss": 0.0701,
+ "step": 21616
+ },
+ {
+ "epoch": 58.90190735694823,
+ "grad_norm": 3.621579885482788,
+ "learning_rate": 7.625599662015602e-06,
+ "loss": 0.1075,
+ "step": 21617
+ },
+ {
+ "epoch": 58.904632152588555,
+ "grad_norm": 3.4036946296691895,
+ "learning_rate": 7.624742414033725e-06,
+ "loss": 0.1193,
+ "step": 21618
+ },
+ {
+ "epoch": 58.90735694822888,
+ "grad_norm": 5.28678560256958,
+ "learning_rate": 7.623885184550283e-06,
+ "loss": 0.1419,
+ "step": 21619
+ },
+ {
+ "epoch": 58.91008174386921,
+ "grad_norm": 4.394040107727051,
+ "learning_rate": 7.6230279735719415e-06,
+ "loss": 0.1415,
+ "step": 21620
+ },
+ {
+ "epoch": 58.91280653950954,
+ "grad_norm": 4.134680271148682,
+ "learning_rate": 7.622170781105382e-06,
+ "loss": 0.1504,
+ "step": 21621
+ },
+ {
+ "epoch": 58.915531335149865,
+ "grad_norm": 3.1160125732421875,
+ "learning_rate": 7.621313607157285e-06,
+ "loss": 0.1596,
+ "step": 21622
+ },
+ {
+ "epoch": 58.91825613079019,
+ "grad_norm": 3.513460636138916,
+ "learning_rate": 7.620456451734317e-06,
+ "loss": 0.1005,
+ "step": 21623
+ },
+ {
+ "epoch": 58.920980926430516,
+ "grad_norm": 3.427602767944336,
+ "learning_rate": 7.61959931484316e-06,
+ "loss": 0.0597,
+ "step": 21624
+ },
+ {
+ "epoch": 58.92370572207084,
+ "grad_norm": 4.323990345001221,
+ "learning_rate": 7.618742196490485e-06,
+ "loss": 0.1795,
+ "step": 21625
+ },
+ {
+ "epoch": 58.926430517711175,
+ "grad_norm": 2.7273409366607666,
+ "learning_rate": 7.617885096682971e-06,
+ "loss": 0.2101,
+ "step": 21626
+ },
+ {
+ "epoch": 58.9291553133515,
+ "grad_norm": 4.046576499938965,
+ "learning_rate": 7.617028015427289e-06,
+ "loss": 0.0985,
+ "step": 21627
+ },
+ {
+ "epoch": 58.93188010899183,
+ "grad_norm": 3.4946789741516113,
+ "learning_rate": 7.616170952730118e-06,
+ "loss": 0.1829,
+ "step": 21628
+ },
+ {
+ "epoch": 58.93460490463215,
+ "grad_norm": 5.407798767089844,
+ "learning_rate": 7.6153139085981296e-06,
+ "loss": 0.2557,
+ "step": 21629
+ },
+ {
+ "epoch": 58.93732970027248,
+ "grad_norm": 3.398526430130005,
+ "learning_rate": 7.614456883038001e-06,
+ "loss": 0.0642,
+ "step": 21630
+ },
+ {
+ "epoch": 58.940054495912804,
+ "grad_norm": 3.662095069885254,
+ "learning_rate": 7.613599876056404e-06,
+ "loss": 0.1326,
+ "step": 21631
+ },
+ {
+ "epoch": 58.94277929155314,
+ "grad_norm": 3.950141191482544,
+ "learning_rate": 7.612742887660016e-06,
+ "loss": 0.1051,
+ "step": 21632
+ },
+ {
+ "epoch": 58.94550408719346,
+ "grad_norm": 2.7301089763641357,
+ "learning_rate": 7.611885917855508e-06,
+ "loss": 0.0519,
+ "step": 21633
+ },
+ {
+ "epoch": 58.94822888283379,
+ "grad_norm": 3.6168124675750732,
+ "learning_rate": 7.611028966649555e-06,
+ "loss": 0.096,
+ "step": 21634
+ },
+ {
+ "epoch": 58.950953678474114,
+ "grad_norm": 5.342549800872803,
+ "learning_rate": 7.610172034048835e-06,
+ "loss": 0.136,
+ "step": 21635
+ },
+ {
+ "epoch": 58.95367847411444,
+ "grad_norm": 2.9107892513275146,
+ "learning_rate": 7.609315120060015e-06,
+ "loss": 0.0935,
+ "step": 21636
+ },
+ {
+ "epoch": 58.956403269754766,
+ "grad_norm": 3.528442859649658,
+ "learning_rate": 7.60845822468977e-06,
+ "loss": 0.0686,
+ "step": 21637
+ },
+ {
+ "epoch": 58.95912806539509,
+ "grad_norm": 4.349478721618652,
+ "learning_rate": 7.6076013479447786e-06,
+ "loss": 0.1161,
+ "step": 21638
+ },
+ {
+ "epoch": 58.961852861035425,
+ "grad_norm": 3.902848958969116,
+ "learning_rate": 7.60674448983171e-06,
+ "loss": 0.1102,
+ "step": 21639
+ },
+ {
+ "epoch": 58.96457765667575,
+ "grad_norm": 2.843625545501709,
+ "learning_rate": 7.60588765035724e-06,
+ "loss": 0.0689,
+ "step": 21640
+ },
+ {
+ "epoch": 58.967302452316076,
+ "grad_norm": 3.7142114639282227,
+ "learning_rate": 7.605030829528037e-06,
+ "loss": 0.1922,
+ "step": 21641
+ },
+ {
+ "epoch": 58.9700272479564,
+ "grad_norm": 2.9767210483551025,
+ "learning_rate": 7.60417402735078e-06,
+ "loss": 0.0972,
+ "step": 21642
+ },
+ {
+ "epoch": 58.97275204359673,
+ "grad_norm": 3.785778284072876,
+ "learning_rate": 7.603317243832137e-06,
+ "loss": 0.1285,
+ "step": 21643
+ },
+ {
+ "epoch": 58.97547683923706,
+ "grad_norm": 4.361304759979248,
+ "learning_rate": 7.6024604789787835e-06,
+ "loss": 0.0826,
+ "step": 21644
+ },
+ {
+ "epoch": 58.97820163487739,
+ "grad_norm": 3.8239848613739014,
+ "learning_rate": 7.601603732797389e-06,
+ "loss": 0.1777,
+ "step": 21645
+ },
+ {
+ "epoch": 58.98092643051771,
+ "grad_norm": 4.224652290344238,
+ "learning_rate": 7.600747005294629e-06,
+ "loss": 0.0697,
+ "step": 21646
+ },
+ {
+ "epoch": 58.98365122615804,
+ "grad_norm": 4.886425971984863,
+ "learning_rate": 7.599890296477171e-06,
+ "loss": 0.1468,
+ "step": 21647
+ },
+ {
+ "epoch": 58.986376021798364,
+ "grad_norm": 4.023881435394287,
+ "learning_rate": 7.599033606351694e-06,
+ "loss": 0.0609,
+ "step": 21648
+ },
+ {
+ "epoch": 58.98910081743869,
+ "grad_norm": 2.9752514362335205,
+ "learning_rate": 7.598176934924863e-06,
+ "loss": 0.1779,
+ "step": 21649
+ },
+ {
+ "epoch": 58.991825613079016,
+ "grad_norm": 5.338901042938232,
+ "learning_rate": 7.5973202822033554e-06,
+ "loss": 0.1998,
+ "step": 21650
+ },
+ {
+ "epoch": 58.99455040871935,
+ "grad_norm": 3.1338915824890137,
+ "learning_rate": 7.596463648193837e-06,
+ "loss": 0.1939,
+ "step": 21651
+ },
+ {
+ "epoch": 58.997275204359674,
+ "grad_norm": 4.405067443847656,
+ "learning_rate": 7.595607032902985e-06,
+ "loss": 0.1446,
+ "step": 21652
+ },
+ {
+ "epoch": 59.0,
+ "grad_norm": 2.0436484813690186,
+ "learning_rate": 7.594750436337467e-06,
+ "loss": 0.0406,
+ "step": 21653
+ },
+ {
+ "epoch": 59.002724795640326,
+ "grad_norm": 3.777146577835083,
+ "learning_rate": 7.593893858503951e-06,
+ "loss": 0.0633,
+ "step": 21654
+ },
+ {
+ "epoch": 59.00544959128065,
+ "grad_norm": 4.3965325355529785,
+ "learning_rate": 7.593037299409116e-06,
+ "loss": 0.0934,
+ "step": 21655
+ },
+ {
+ "epoch": 59.00817438692098,
+ "grad_norm": 4.872261047363281,
+ "learning_rate": 7.592180759059631e-06,
+ "loss": 0.0787,
+ "step": 21656
+ },
+ {
+ "epoch": 59.01089918256131,
+ "grad_norm": 2.4931423664093018,
+ "learning_rate": 7.591324237462162e-06,
+ "loss": 0.0901,
+ "step": 21657
+ },
+ {
+ "epoch": 59.013623978201636,
+ "grad_norm": 3.5393104553222656,
+ "learning_rate": 7.5904677346233845e-06,
+ "loss": 0.1323,
+ "step": 21658
+ },
+ {
+ "epoch": 59.01634877384196,
+ "grad_norm": 2.8393118381500244,
+ "learning_rate": 7.589611250549965e-06,
+ "loss": 0.0628,
+ "step": 21659
+ },
+ {
+ "epoch": 59.01907356948229,
+ "grad_norm": 3.608720541000366,
+ "learning_rate": 7.588754785248578e-06,
+ "loss": 0.1887,
+ "step": 21660
+ },
+ {
+ "epoch": 59.02179836512261,
+ "grad_norm": 2.7257919311523438,
+ "learning_rate": 7.587898338725887e-06,
+ "loss": 0.052,
+ "step": 21661
+ },
+ {
+ "epoch": 59.02452316076294,
+ "grad_norm": 5.552196979522705,
+ "learning_rate": 7.587041910988571e-06,
+ "loss": 0.0633,
+ "step": 21662
+ },
+ {
+ "epoch": 59.02724795640327,
+ "grad_norm": 3.2473134994506836,
+ "learning_rate": 7.586185502043291e-06,
+ "loss": 0.0936,
+ "step": 21663
+ },
+ {
+ "epoch": 59.0299727520436,
+ "grad_norm": 3.7006382942199707,
+ "learning_rate": 7.5853291118967236e-06,
+ "loss": 0.061,
+ "step": 21664
+ },
+ {
+ "epoch": 59.032697547683924,
+ "grad_norm": 3.480757474899292,
+ "learning_rate": 7.584472740555533e-06,
+ "loss": 0.0865,
+ "step": 21665
+ },
+ {
+ "epoch": 59.03542234332425,
+ "grad_norm": 4.306460857391357,
+ "learning_rate": 7.583616388026392e-06,
+ "loss": 0.0588,
+ "step": 21666
+ },
+ {
+ "epoch": 59.038147138964575,
+ "grad_norm": 3.5792856216430664,
+ "learning_rate": 7.582760054315968e-06,
+ "loss": 0.1445,
+ "step": 21667
+ },
+ {
+ "epoch": 59.0408719346049,
+ "grad_norm": 3.097454786300659,
+ "learning_rate": 7.5819037394309326e-06,
+ "loss": 0.121,
+ "step": 21668
+ },
+ {
+ "epoch": 59.043596730245234,
+ "grad_norm": 3.4855430126190186,
+ "learning_rate": 7.581047443377951e-06,
+ "loss": 0.0504,
+ "step": 21669
+ },
+ {
+ "epoch": 59.04632152588556,
+ "grad_norm": 3.136826753616333,
+ "learning_rate": 7.580191166163696e-06,
+ "loss": 0.1283,
+ "step": 21670
+ },
+ {
+ "epoch": 59.049046321525886,
+ "grad_norm": 3.7873098850250244,
+ "learning_rate": 7.5793349077948296e-06,
+ "loss": 0.0774,
+ "step": 21671
+ },
+ {
+ "epoch": 59.05177111716621,
+ "grad_norm": 2.9616713523864746,
+ "learning_rate": 7.578478668278029e-06,
+ "loss": 0.0621,
+ "step": 21672
+ },
+ {
+ "epoch": 59.05449591280654,
+ "grad_norm": 3.8275697231292725,
+ "learning_rate": 7.5776224476199585e-06,
+ "loss": 0.1353,
+ "step": 21673
+ },
+ {
+ "epoch": 59.05722070844686,
+ "grad_norm": 3.3241209983825684,
+ "learning_rate": 7.576766245827285e-06,
+ "loss": 0.059,
+ "step": 21674
+ },
+ {
+ "epoch": 59.059945504087196,
+ "grad_norm": 2.50747013092041,
+ "learning_rate": 7.5759100629066785e-06,
+ "loss": 0.1116,
+ "step": 21675
+ },
+ {
+ "epoch": 59.06267029972752,
+ "grad_norm": 3.2242865562438965,
+ "learning_rate": 7.575053898864808e-06,
+ "loss": 0.0873,
+ "step": 21676
+ },
+ {
+ "epoch": 59.06539509536785,
+ "grad_norm": 3.4980032444000244,
+ "learning_rate": 7.574197753708339e-06,
+ "loss": 0.1898,
+ "step": 21677
+ },
+ {
+ "epoch": 59.06811989100817,
+ "grad_norm": 4.965635776519775,
+ "learning_rate": 7.57334162744394e-06,
+ "loss": 0.1019,
+ "step": 21678
+ },
+ {
+ "epoch": 59.0708446866485,
+ "grad_norm": 3.2334609031677246,
+ "learning_rate": 7.572485520078277e-06,
+ "loss": 0.0603,
+ "step": 21679
+ },
+ {
+ "epoch": 59.073569482288825,
+ "grad_norm": 3.3962340354919434,
+ "learning_rate": 7.571629431618021e-06,
+ "loss": 0.2385,
+ "step": 21680
+ },
+ {
+ "epoch": 59.07629427792916,
+ "grad_norm": 2.7325992584228516,
+ "learning_rate": 7.570773362069835e-06,
+ "loss": 0.0608,
+ "step": 21681
+ },
+ {
+ "epoch": 59.079019073569484,
+ "grad_norm": 3.219993829727173,
+ "learning_rate": 7.569917311440389e-06,
+ "loss": 0.0719,
+ "step": 21682
+ },
+ {
+ "epoch": 59.08174386920981,
+ "grad_norm": 2.691089630126953,
+ "learning_rate": 7.569061279736347e-06,
+ "loss": 0.0976,
+ "step": 21683
+ },
+ {
+ "epoch": 59.084468664850135,
+ "grad_norm": 4.899687767028809,
+ "learning_rate": 7.568205266964379e-06,
+ "loss": 0.1574,
+ "step": 21684
+ },
+ {
+ "epoch": 59.08719346049046,
+ "grad_norm": 4.418859958648682,
+ "learning_rate": 7.567349273131149e-06,
+ "loss": 0.2519,
+ "step": 21685
+ },
+ {
+ "epoch": 59.08991825613079,
+ "grad_norm": 3.6111385822296143,
+ "learning_rate": 7.566493298243327e-06,
+ "loss": 0.0763,
+ "step": 21686
+ },
+ {
+ "epoch": 59.09264305177112,
+ "grad_norm": 2.2135980129241943,
+ "learning_rate": 7.565637342307574e-06,
+ "loss": 0.0471,
+ "step": 21687
+ },
+ {
+ "epoch": 59.095367847411445,
+ "grad_norm": 3.797297716140747,
+ "learning_rate": 7.5647814053305565e-06,
+ "loss": 0.0653,
+ "step": 21688
+ },
+ {
+ "epoch": 59.09809264305177,
+ "grad_norm": 3.493048667907715,
+ "learning_rate": 7.563925487318948e-06,
+ "loss": 0.058,
+ "step": 21689
+ },
+ {
+ "epoch": 59.1008174386921,
+ "grad_norm": 3.347757339477539,
+ "learning_rate": 7.563069588279407e-06,
+ "loss": 0.0806,
+ "step": 21690
+ },
+ {
+ "epoch": 59.10354223433242,
+ "grad_norm": 3.1683833599090576,
+ "learning_rate": 7.562213708218604e-06,
+ "loss": 0.0761,
+ "step": 21691
+ },
+ {
+ "epoch": 59.10626702997275,
+ "grad_norm": 3.5190916061401367,
+ "learning_rate": 7.5613578471432e-06,
+ "loss": 0.0521,
+ "step": 21692
+ },
+ {
+ "epoch": 59.10899182561308,
+ "grad_norm": 4.314681529998779,
+ "learning_rate": 7.560502005059864e-06,
+ "loss": 0.0595,
+ "step": 21693
+ },
+ {
+ "epoch": 59.11171662125341,
+ "grad_norm": 5.3859758377075195,
+ "learning_rate": 7.559646181975259e-06,
+ "loss": 0.2263,
+ "step": 21694
+ },
+ {
+ "epoch": 59.11444141689373,
+ "grad_norm": 3.3791892528533936,
+ "learning_rate": 7.558790377896052e-06,
+ "loss": 0.1202,
+ "step": 21695
+ },
+ {
+ "epoch": 59.11716621253406,
+ "grad_norm": 3.9917123317718506,
+ "learning_rate": 7.557934592828906e-06,
+ "loss": 0.0982,
+ "step": 21696
+ },
+ {
+ "epoch": 59.119891008174385,
+ "grad_norm": 3.4781248569488525,
+ "learning_rate": 7.557078826780488e-06,
+ "loss": 0.1791,
+ "step": 21697
+ },
+ {
+ "epoch": 59.12261580381471,
+ "grad_norm": 3.8536505699157715,
+ "learning_rate": 7.5562230797574585e-06,
+ "loss": 0.096,
+ "step": 21698
+ },
+ {
+ "epoch": 59.12534059945504,
+ "grad_norm": 4.126902103424072,
+ "learning_rate": 7.555367351766487e-06,
+ "loss": 0.0674,
+ "step": 21699
+ },
+ {
+ "epoch": 59.12806539509537,
+ "grad_norm": 4.913824558258057,
+ "learning_rate": 7.5545116428142375e-06,
+ "loss": 0.0651,
+ "step": 21700
+ },
+ {
+ "epoch": 59.130790190735695,
+ "grad_norm": 3.8185019493103027,
+ "learning_rate": 7.553655952907369e-06,
+ "loss": 0.0649,
+ "step": 21701
+ },
+ {
+ "epoch": 59.13351498637602,
+ "grad_norm": 3.033230781555176,
+ "learning_rate": 7.552800282052552e-06,
+ "loss": 0.0725,
+ "step": 21702
+ },
+ {
+ "epoch": 59.13623978201635,
+ "grad_norm": 3.427907943725586,
+ "learning_rate": 7.551944630256447e-06,
+ "loss": 0.1338,
+ "step": 21703
+ },
+ {
+ "epoch": 59.13896457765667,
+ "grad_norm": 3.5687830448150635,
+ "learning_rate": 7.55108899752572e-06,
+ "loss": 0.243,
+ "step": 21704
+ },
+ {
+ "epoch": 59.141689373297005,
+ "grad_norm": 4.709448337554932,
+ "learning_rate": 7.5502333838670295e-06,
+ "loss": 0.3231,
+ "step": 21705
+ },
+ {
+ "epoch": 59.14441416893733,
+ "grad_norm": 2.8295841217041016,
+ "learning_rate": 7.5493777892870416e-06,
+ "loss": 0.1049,
+ "step": 21706
+ },
+ {
+ "epoch": 59.14713896457766,
+ "grad_norm": 5.204916954040527,
+ "learning_rate": 7.548522213792424e-06,
+ "loss": 0.0607,
+ "step": 21707
+ },
+ {
+ "epoch": 59.14986376021798,
+ "grad_norm": 3.4823975563049316,
+ "learning_rate": 7.547666657389836e-06,
+ "loss": 0.1337,
+ "step": 21708
+ },
+ {
+ "epoch": 59.15258855585831,
+ "grad_norm": 3.985304117202759,
+ "learning_rate": 7.546811120085942e-06,
+ "loss": 0.0356,
+ "step": 21709
+ },
+ {
+ "epoch": 59.155313351498634,
+ "grad_norm": 3.720289945602417,
+ "learning_rate": 7.545955601887402e-06,
+ "loss": 0.066,
+ "step": 21710
+ },
+ {
+ "epoch": 59.15803814713897,
+ "grad_norm": 3.5102925300598145,
+ "learning_rate": 7.545100102800883e-06,
+ "loss": 0.1042,
+ "step": 21711
+ },
+ {
+ "epoch": 59.16076294277929,
+ "grad_norm": 2.699995279312134,
+ "learning_rate": 7.544244622833043e-06,
+ "loss": 0.0558,
+ "step": 21712
+ },
+ {
+ "epoch": 59.16348773841962,
+ "grad_norm": 5.10889196395874,
+ "learning_rate": 7.5433891619905496e-06,
+ "loss": 0.1035,
+ "step": 21713
+ },
+ {
+ "epoch": 59.166212534059945,
+ "grad_norm": 3.469667673110962,
+ "learning_rate": 7.542533720280061e-06,
+ "loss": 0.0737,
+ "step": 21714
+ },
+ {
+ "epoch": 59.16893732970027,
+ "grad_norm": 3.9109909534454346,
+ "learning_rate": 7.541678297708241e-06,
+ "loss": 0.1187,
+ "step": 21715
+ },
+ {
+ "epoch": 59.171662125340596,
+ "grad_norm": 6.658548355102539,
+ "learning_rate": 7.5408228942817495e-06,
+ "loss": 0.0556,
+ "step": 21716
+ },
+ {
+ "epoch": 59.17438692098093,
+ "grad_norm": 3.173408031463623,
+ "learning_rate": 7.539967510007253e-06,
+ "loss": 0.0692,
+ "step": 21717
+ },
+ {
+ "epoch": 59.177111716621255,
+ "grad_norm": 4.470581531524658,
+ "learning_rate": 7.5391121448914085e-06,
+ "loss": 0.2408,
+ "step": 21718
+ },
+ {
+ "epoch": 59.17983651226158,
+ "grad_norm": 3.0410196781158447,
+ "learning_rate": 7.5382567989408805e-06,
+ "loss": 0.1242,
+ "step": 21719
+ },
+ {
+ "epoch": 59.182561307901906,
+ "grad_norm": 3.175139904022217,
+ "learning_rate": 7.537401472162328e-06,
+ "loss": 0.0443,
+ "step": 21720
+ },
+ {
+ "epoch": 59.18528610354223,
+ "grad_norm": 4.160188674926758,
+ "learning_rate": 7.536546164562413e-06,
+ "loss": 0.0828,
+ "step": 21721
+ },
+ {
+ "epoch": 59.18801089918256,
+ "grad_norm": 3.967879056930542,
+ "learning_rate": 7.5356908761478e-06,
+ "loss": 0.147,
+ "step": 21722
+ },
+ {
+ "epoch": 59.19073569482289,
+ "grad_norm": 3.446207284927368,
+ "learning_rate": 7.534835606925141e-06,
+ "loss": 0.1565,
+ "step": 21723
+ },
+ {
+ "epoch": 59.19346049046322,
+ "grad_norm": 4.34999418258667,
+ "learning_rate": 7.533980356901107e-06,
+ "loss": 0.0983,
+ "step": 21724
+ },
+ {
+ "epoch": 59.19618528610354,
+ "grad_norm": 3.562150716781616,
+ "learning_rate": 7.533125126082357e-06,
+ "loss": 0.1047,
+ "step": 21725
+ },
+ {
+ "epoch": 59.19891008174387,
+ "grad_norm": 3.700178384780884,
+ "learning_rate": 7.532269914475546e-06,
+ "loss": 0.2572,
+ "step": 21726
+ },
+ {
+ "epoch": 59.201634877384194,
+ "grad_norm": 8.654916763305664,
+ "learning_rate": 7.53141472208734e-06,
+ "loss": 0.1077,
+ "step": 21727
+ },
+ {
+ "epoch": 59.20435967302452,
+ "grad_norm": 4.667231559753418,
+ "learning_rate": 7.530559548924395e-06,
+ "loss": 0.0829,
+ "step": 21728
+ },
+ {
+ "epoch": 59.20708446866485,
+ "grad_norm": 3.4512836933135986,
+ "learning_rate": 7.529704394993374e-06,
+ "loss": 0.0853,
+ "step": 21729
+ },
+ {
+ "epoch": 59.20980926430518,
+ "grad_norm": 3.270360231399536,
+ "learning_rate": 7.528849260300933e-06,
+ "loss": 0.057,
+ "step": 21730
+ },
+ {
+ "epoch": 59.212534059945504,
+ "grad_norm": 3.6670432090759277,
+ "learning_rate": 7.527994144853738e-06,
+ "loss": 0.2495,
+ "step": 21731
+ },
+ {
+ "epoch": 59.21525885558583,
+ "grad_norm": 3.787236213684082,
+ "learning_rate": 7.5271390486584416e-06,
+ "loss": 0.0844,
+ "step": 21732
+ },
+ {
+ "epoch": 59.217983651226156,
+ "grad_norm": 4.844411849975586,
+ "learning_rate": 7.526283971721711e-06,
+ "loss": 0.2772,
+ "step": 21733
+ },
+ {
+ "epoch": 59.22070844686648,
+ "grad_norm": 5.151246070861816,
+ "learning_rate": 7.5254289140501965e-06,
+ "loss": 0.2213,
+ "step": 21734
+ },
+ {
+ "epoch": 59.223433242506815,
+ "grad_norm": 3.862370491027832,
+ "learning_rate": 7.524573875650565e-06,
+ "loss": 0.0471,
+ "step": 21735
+ },
+ {
+ "epoch": 59.22615803814714,
+ "grad_norm": 3.706761360168457,
+ "learning_rate": 7.523718856529471e-06,
+ "loss": 0.0729,
+ "step": 21736
+ },
+ {
+ "epoch": 59.228882833787466,
+ "grad_norm": 3.490652561187744,
+ "learning_rate": 7.522863856693577e-06,
+ "loss": 0.2747,
+ "step": 21737
+ },
+ {
+ "epoch": 59.23160762942779,
+ "grad_norm": 4.000617980957031,
+ "learning_rate": 7.522008876149537e-06,
+ "loss": 0.0969,
+ "step": 21738
+ },
+ {
+ "epoch": 59.23433242506812,
+ "grad_norm": 4.829466819763184,
+ "learning_rate": 7.521153914904013e-06,
+ "loss": 0.1152,
+ "step": 21739
+ },
+ {
+ "epoch": 59.237057220708444,
+ "grad_norm": 3.3655080795288086,
+ "learning_rate": 7.520298972963657e-06,
+ "loss": 0.1643,
+ "step": 21740
+ },
+ {
+ "epoch": 59.23978201634878,
+ "grad_norm": 3.153468132019043,
+ "learning_rate": 7.51944405033514e-06,
+ "loss": 0.0683,
+ "step": 21741
+ },
+ {
+ "epoch": 59.2425068119891,
+ "grad_norm": 5.982385635375977,
+ "learning_rate": 7.51858914702511e-06,
+ "loss": 0.1112,
+ "step": 21742
+ },
+ {
+ "epoch": 59.24523160762943,
+ "grad_norm": 3.087956666946411,
+ "learning_rate": 7.517734263040232e-06,
+ "loss": 0.0805,
+ "step": 21743
+ },
+ {
+ "epoch": 59.247956403269754,
+ "grad_norm": 5.980727195739746,
+ "learning_rate": 7.516879398387156e-06,
+ "loss": 0.1112,
+ "step": 21744
+ },
+ {
+ "epoch": 59.25068119891008,
+ "grad_norm": 4.207536697387695,
+ "learning_rate": 7.516024553072545e-06,
+ "loss": 0.0576,
+ "step": 21745
+ },
+ {
+ "epoch": 59.253405994550405,
+ "grad_norm": 3.840688943862915,
+ "learning_rate": 7.515169727103052e-06,
+ "loss": 0.1398,
+ "step": 21746
+ },
+ {
+ "epoch": 59.25613079019074,
+ "grad_norm": 2.959146738052368,
+ "learning_rate": 7.514314920485341e-06,
+ "loss": 0.1536,
+ "step": 21747
+ },
+ {
+ "epoch": 59.258855585831064,
+ "grad_norm": 4.634994029998779,
+ "learning_rate": 7.513460133226062e-06,
+ "loss": 0.0914,
+ "step": 21748
+ },
+ {
+ "epoch": 59.26158038147139,
+ "grad_norm": 2.8339734077453613,
+ "learning_rate": 7.512605365331878e-06,
+ "loss": 0.1018,
+ "step": 21749
+ },
+ {
+ "epoch": 59.264305177111716,
+ "grad_norm": 2.8966667652130127,
+ "learning_rate": 7.511750616809443e-06,
+ "loss": 0.0798,
+ "step": 21750
+ },
+ {
+ "epoch": 59.26702997275204,
+ "grad_norm": 4.672469615936279,
+ "learning_rate": 7.510895887665413e-06,
+ "loss": 0.1637,
+ "step": 21751
+ },
+ {
+ "epoch": 59.26975476839237,
+ "grad_norm": 2.795789957046509,
+ "learning_rate": 7.510041177906446e-06,
+ "loss": 0.0714,
+ "step": 21752
+ },
+ {
+ "epoch": 59.2724795640327,
+ "grad_norm": 4.427687644958496,
+ "learning_rate": 7.5091864875392e-06,
+ "loss": 0.1869,
+ "step": 21753
+ },
+ {
+ "epoch": 59.275204359673026,
+ "grad_norm": 3.7736551761627197,
+ "learning_rate": 7.508331816570327e-06,
+ "loss": 0.0782,
+ "step": 21754
+ },
+ {
+ "epoch": 59.27792915531335,
+ "grad_norm": 5.1422224044799805,
+ "learning_rate": 7.507477165006487e-06,
+ "loss": 0.0795,
+ "step": 21755
+ },
+ {
+ "epoch": 59.28065395095368,
+ "grad_norm": 4.449389934539795,
+ "learning_rate": 7.506622532854333e-06,
+ "loss": 0.219,
+ "step": 21756
+ },
+ {
+ "epoch": 59.283378746594,
+ "grad_norm": 3.5036587715148926,
+ "learning_rate": 7.50576792012052e-06,
+ "loss": 0.0755,
+ "step": 21757
+ },
+ {
+ "epoch": 59.28610354223433,
+ "grad_norm": 3.461836576461792,
+ "learning_rate": 7.504913326811711e-06,
+ "loss": 0.1001,
+ "step": 21758
+ },
+ {
+ "epoch": 59.28882833787466,
+ "grad_norm": 3.3612518310546875,
+ "learning_rate": 7.504058752934555e-06,
+ "loss": 0.0488,
+ "step": 21759
+ },
+ {
+ "epoch": 59.29155313351499,
+ "grad_norm": 3.089484214782715,
+ "learning_rate": 7.5032041984957106e-06,
+ "loss": 0.0509,
+ "step": 21760
+ },
+ {
+ "epoch": 59.294277929155314,
+ "grad_norm": 3.250932455062866,
+ "learning_rate": 7.502349663501829e-06,
+ "loss": 0.0917,
+ "step": 21761
+ },
+ {
+ "epoch": 59.29700272479564,
+ "grad_norm": 3.6009373664855957,
+ "learning_rate": 7.5014951479595684e-06,
+ "loss": 0.0587,
+ "step": 21762
+ },
+ {
+ "epoch": 59.299727520435965,
+ "grad_norm": 4.550698280334473,
+ "learning_rate": 7.5006406518755856e-06,
+ "loss": 0.0628,
+ "step": 21763
+ },
+ {
+ "epoch": 59.30245231607629,
+ "grad_norm": 9.64401912689209,
+ "learning_rate": 7.499786175256531e-06,
+ "loss": 0.1326,
+ "step": 21764
+ },
+ {
+ "epoch": 59.305177111716624,
+ "grad_norm": 2.655383586883545,
+ "learning_rate": 7.498931718109063e-06,
+ "loss": 0.0938,
+ "step": 21765
+ },
+ {
+ "epoch": 59.30790190735695,
+ "grad_norm": 4.906900882720947,
+ "learning_rate": 7.49807728043983e-06,
+ "loss": 0.0627,
+ "step": 21766
+ },
+ {
+ "epoch": 59.310626702997276,
+ "grad_norm": 3.091667413711548,
+ "learning_rate": 7.497222862255496e-06,
+ "loss": 0.0704,
+ "step": 21767
+ },
+ {
+ "epoch": 59.3133514986376,
+ "grad_norm": 5.284510612487793,
+ "learning_rate": 7.496368463562706e-06,
+ "loss": 0.1104,
+ "step": 21768
+ },
+ {
+ "epoch": 59.31607629427793,
+ "grad_norm": 2.9647274017333984,
+ "learning_rate": 7.495514084368121e-06,
+ "loss": 0.0474,
+ "step": 21769
+ },
+ {
+ "epoch": 59.31880108991825,
+ "grad_norm": 3.8396527767181396,
+ "learning_rate": 7.494659724678388e-06,
+ "loss": 0.0631,
+ "step": 21770
+ },
+ {
+ "epoch": 59.321525885558586,
+ "grad_norm": 3.168015956878662,
+ "learning_rate": 7.493805384500168e-06,
+ "loss": 0.1236,
+ "step": 21771
+ },
+ {
+ "epoch": 59.32425068119891,
+ "grad_norm": 9.776162147521973,
+ "learning_rate": 7.492951063840109e-06,
+ "loss": 0.119,
+ "step": 21772
+ },
+ {
+ "epoch": 59.32697547683924,
+ "grad_norm": 5.564446449279785,
+ "learning_rate": 7.492096762704868e-06,
+ "loss": 0.2097,
+ "step": 21773
+ },
+ {
+ "epoch": 59.32970027247956,
+ "grad_norm": 3.545588254928589,
+ "learning_rate": 7.491242481101091e-06,
+ "loss": 0.0916,
+ "step": 21774
+ },
+ {
+ "epoch": 59.33242506811989,
+ "grad_norm": 3.705561876296997,
+ "learning_rate": 7.490388219035441e-06,
+ "loss": 0.1592,
+ "step": 21775
+ },
+ {
+ "epoch": 59.335149863760215,
+ "grad_norm": 4.552818298339844,
+ "learning_rate": 7.489533976514568e-06,
+ "loss": 0.0495,
+ "step": 21776
+ },
+ {
+ "epoch": 59.33787465940055,
+ "grad_norm": 4.008409023284912,
+ "learning_rate": 7.488679753545121e-06,
+ "loss": 0.0848,
+ "step": 21777
+ },
+ {
+ "epoch": 59.34059945504087,
+ "grad_norm": 4.364948749542236,
+ "learning_rate": 7.487825550133759e-06,
+ "loss": 0.0598,
+ "step": 21778
+ },
+ {
+ "epoch": 59.3433242506812,
+ "grad_norm": 3.707984209060669,
+ "learning_rate": 7.486971366287128e-06,
+ "loss": 0.1673,
+ "step": 21779
+ },
+ {
+ "epoch": 59.346049046321525,
+ "grad_norm": 3.483253002166748,
+ "learning_rate": 7.4861172020118844e-06,
+ "loss": 0.0927,
+ "step": 21780
+ },
+ {
+ "epoch": 59.34877384196185,
+ "grad_norm": 3.4793434143066406,
+ "learning_rate": 7.485263057314678e-06,
+ "loss": 0.0881,
+ "step": 21781
+ },
+ {
+ "epoch": 59.35149863760218,
+ "grad_norm": 3.1901800632476807,
+ "learning_rate": 7.484408932202163e-06,
+ "loss": 0.1949,
+ "step": 21782
+ },
+ {
+ "epoch": 59.35422343324251,
+ "grad_norm": 3.7107465267181396,
+ "learning_rate": 7.483554826680989e-06,
+ "loss": 0.1693,
+ "step": 21783
+ },
+ {
+ "epoch": 59.356948228882835,
+ "grad_norm": 4.341519355773926,
+ "learning_rate": 7.482700740757811e-06,
+ "loss": 0.1126,
+ "step": 21784
+ },
+ {
+ "epoch": 59.35967302452316,
+ "grad_norm": 3.539825201034546,
+ "learning_rate": 7.481846674439276e-06,
+ "loss": 0.0811,
+ "step": 21785
+ },
+ {
+ "epoch": 59.36239782016349,
+ "grad_norm": 2.9512150287628174,
+ "learning_rate": 7.480992627732038e-06,
+ "loss": 0.1052,
+ "step": 21786
+ },
+ {
+ "epoch": 59.36512261580381,
+ "grad_norm": 4.722318172454834,
+ "learning_rate": 7.4801386006427515e-06,
+ "loss": 0.0778,
+ "step": 21787
+ },
+ {
+ "epoch": 59.36784741144414,
+ "grad_norm": 3.9388997554779053,
+ "learning_rate": 7.479284593178061e-06,
+ "loss": 0.119,
+ "step": 21788
+ },
+ {
+ "epoch": 59.37057220708447,
+ "grad_norm": 5.726805686950684,
+ "learning_rate": 7.478430605344624e-06,
+ "loss": 0.1978,
+ "step": 21789
+ },
+ {
+ "epoch": 59.3732970027248,
+ "grad_norm": 4.962177276611328,
+ "learning_rate": 7.477576637149086e-06,
+ "loss": 0.1384,
+ "step": 21790
+ },
+ {
+ "epoch": 59.37602179836512,
+ "grad_norm": 2.873889446258545,
+ "learning_rate": 7.476722688598102e-06,
+ "loss": 0.0598,
+ "step": 21791
+ },
+ {
+ "epoch": 59.37874659400545,
+ "grad_norm": 3.9591760635375977,
+ "learning_rate": 7.475868759698317e-06,
+ "loss": 0.2101,
+ "step": 21792
+ },
+ {
+ "epoch": 59.381471389645775,
+ "grad_norm": 3.4086108207702637,
+ "learning_rate": 7.4750148504563855e-06,
+ "loss": 0.1091,
+ "step": 21793
+ },
+ {
+ "epoch": 59.3841961852861,
+ "grad_norm": 4.699950695037842,
+ "learning_rate": 7.47416096087896e-06,
+ "loss": 0.206,
+ "step": 21794
+ },
+ {
+ "epoch": 59.38692098092643,
+ "grad_norm": 2.7233259677886963,
+ "learning_rate": 7.473307090972685e-06,
+ "loss": 0.0496,
+ "step": 21795
+ },
+ {
+ "epoch": 59.38964577656676,
+ "grad_norm": 4.428097724914551,
+ "learning_rate": 7.4724532407442165e-06,
+ "loss": 0.1381,
+ "step": 21796
+ },
+ {
+ "epoch": 59.392370572207085,
+ "grad_norm": 4.300647258758545,
+ "learning_rate": 7.471599410200198e-06,
+ "loss": 0.2477,
+ "step": 21797
+ },
+ {
+ "epoch": 59.39509536784741,
+ "grad_norm": 3.2388229370117188,
+ "learning_rate": 7.470745599347285e-06,
+ "loss": 0.0697,
+ "step": 21798
+ },
+ {
+ "epoch": 59.39782016348774,
+ "grad_norm": 3.206294059753418,
+ "learning_rate": 7.46989180819212e-06,
+ "loss": 0.0859,
+ "step": 21799
+ },
+ {
+ "epoch": 59.40054495912806,
+ "grad_norm": 3.8222544193267822,
+ "learning_rate": 7.469038036741358e-06,
+ "loss": 0.1102,
+ "step": 21800
+ },
+ {
+ "epoch": 59.403269754768395,
+ "grad_norm": 3.2217648029327393,
+ "learning_rate": 7.468184285001645e-06,
+ "loss": 0.2023,
+ "step": 21801
+ },
+ {
+ "epoch": 59.40599455040872,
+ "grad_norm": 4.229472637176514,
+ "learning_rate": 7.467330552979635e-06,
+ "loss": 0.0896,
+ "step": 21802
+ },
+ {
+ "epoch": 59.40871934604905,
+ "grad_norm": 4.491195201873779,
+ "learning_rate": 7.4664768406819685e-06,
+ "loss": 0.1437,
+ "step": 21803
+ },
+ {
+ "epoch": 59.41144414168937,
+ "grad_norm": 3.7320375442504883,
+ "learning_rate": 7.465623148115302e-06,
+ "loss": 0.0935,
+ "step": 21804
+ },
+ {
+ "epoch": 59.4141689373297,
+ "grad_norm": 4.812129974365234,
+ "learning_rate": 7.46476947528628e-06,
+ "loss": 0.1163,
+ "step": 21805
+ },
+ {
+ "epoch": 59.416893732970024,
+ "grad_norm": 5.116265773773193,
+ "learning_rate": 7.463915822201552e-06,
+ "loss": 0.0648,
+ "step": 21806
+ },
+ {
+ "epoch": 59.41961852861036,
+ "grad_norm": 4.548985481262207,
+ "learning_rate": 7.463062188867764e-06,
+ "loss": 0.0927,
+ "step": 21807
+ },
+ {
+ "epoch": 59.42234332425068,
+ "grad_norm": 5.495615005493164,
+ "learning_rate": 7.462208575291567e-06,
+ "loss": 0.0849,
+ "step": 21808
+ },
+ {
+ "epoch": 59.42506811989101,
+ "grad_norm": 3.476064443588257,
+ "learning_rate": 7.461354981479605e-06,
+ "loss": 0.1317,
+ "step": 21809
+ },
+ {
+ "epoch": 59.427792915531334,
+ "grad_norm": 4.945058822631836,
+ "learning_rate": 7.460501407438533e-06,
+ "loss": 0.093,
+ "step": 21810
+ },
+ {
+ "epoch": 59.43051771117166,
+ "grad_norm": 4.617724418640137,
+ "learning_rate": 7.459647853174993e-06,
+ "loss": 0.0963,
+ "step": 21811
+ },
+ {
+ "epoch": 59.433242506811986,
+ "grad_norm": 3.9213743209838867,
+ "learning_rate": 7.458794318695635e-06,
+ "loss": 0.0577,
+ "step": 21812
+ },
+ {
+ "epoch": 59.43596730245232,
+ "grad_norm": 3.279602289199829,
+ "learning_rate": 7.457940804007104e-06,
+ "loss": 0.1098,
+ "step": 21813
+ },
+ {
+ "epoch": 59.438692098092645,
+ "grad_norm": 4.74573278427124,
+ "learning_rate": 7.457087309116049e-06,
+ "loss": 0.082,
+ "step": 21814
+ },
+ {
+ "epoch": 59.44141689373297,
+ "grad_norm": 7.025487422943115,
+ "learning_rate": 7.456233834029114e-06,
+ "loss": 0.0725,
+ "step": 21815
+ },
+ {
+ "epoch": 59.444141689373296,
+ "grad_norm": 4.187443256378174,
+ "learning_rate": 7.455380378752951e-06,
+ "loss": 0.067,
+ "step": 21816
+ },
+ {
+ "epoch": 59.44686648501362,
+ "grad_norm": 3.6091067790985107,
+ "learning_rate": 7.454526943294201e-06,
+ "loss": 0.0634,
+ "step": 21817
+ },
+ {
+ "epoch": 59.44959128065395,
+ "grad_norm": 4.672299385070801,
+ "learning_rate": 7.4536735276595165e-06,
+ "loss": 0.0685,
+ "step": 21818
+ },
+ {
+ "epoch": 59.45231607629428,
+ "grad_norm": 4.091929912567139,
+ "learning_rate": 7.452820131855538e-06,
+ "loss": 0.1621,
+ "step": 21819
+ },
+ {
+ "epoch": 59.45504087193461,
+ "grad_norm": 3.060480833053589,
+ "learning_rate": 7.451966755888915e-06,
+ "loss": 0.0589,
+ "step": 21820
+ },
+ {
+ "epoch": 59.45776566757493,
+ "grad_norm": 3.5286495685577393,
+ "learning_rate": 7.451113399766292e-06,
+ "loss": 0.1765,
+ "step": 21821
+ },
+ {
+ "epoch": 59.46049046321526,
+ "grad_norm": 4.204300403594971,
+ "learning_rate": 7.450260063494319e-06,
+ "loss": 0.0821,
+ "step": 21822
+ },
+ {
+ "epoch": 59.463215258855584,
+ "grad_norm": 3.3798656463623047,
+ "learning_rate": 7.449406747079635e-06,
+ "loss": 0.1145,
+ "step": 21823
+ },
+ {
+ "epoch": 59.46594005449591,
+ "grad_norm": 3.8153555393218994,
+ "learning_rate": 7.448553450528891e-06,
+ "loss": 0.0652,
+ "step": 21824
+ },
+ {
+ "epoch": 59.46866485013624,
+ "grad_norm": 3.8584842681884766,
+ "learning_rate": 7.447700173848729e-06,
+ "loss": 0.0803,
+ "step": 21825
+ },
+ {
+ "epoch": 59.47138964577657,
+ "grad_norm": 4.309252738952637,
+ "learning_rate": 7.446846917045793e-06,
+ "loss": 0.193,
+ "step": 21826
+ },
+ {
+ "epoch": 59.474114441416894,
+ "grad_norm": 4.435990333557129,
+ "learning_rate": 7.445993680126735e-06,
+ "loss": 0.0748,
+ "step": 21827
+ },
+ {
+ "epoch": 59.47683923705722,
+ "grad_norm": 4.829715728759766,
+ "learning_rate": 7.445140463098197e-06,
+ "loss": 0.1138,
+ "step": 21828
+ },
+ {
+ "epoch": 59.479564032697546,
+ "grad_norm": 3.765371561050415,
+ "learning_rate": 7.444287265966821e-06,
+ "loss": 0.0964,
+ "step": 21829
+ },
+ {
+ "epoch": 59.48228882833787,
+ "grad_norm": 3.971548557281494,
+ "learning_rate": 7.443434088739256e-06,
+ "loss": 0.1511,
+ "step": 21830
+ },
+ {
+ "epoch": 59.485013623978205,
+ "grad_norm": 4.259155750274658,
+ "learning_rate": 7.442580931422141e-06,
+ "loss": 0.1125,
+ "step": 21831
+ },
+ {
+ "epoch": 59.48773841961853,
+ "grad_norm": 3.840143918991089,
+ "learning_rate": 7.441727794022126e-06,
+ "loss": 0.0983,
+ "step": 21832
+ },
+ {
+ "epoch": 59.490463215258856,
+ "grad_norm": 4.222861289978027,
+ "learning_rate": 7.44087467654585e-06,
+ "loss": 0.0993,
+ "step": 21833
+ },
+ {
+ "epoch": 59.49318801089918,
+ "grad_norm": 2.950629711151123,
+ "learning_rate": 7.440021578999963e-06,
+ "loss": 0.1224,
+ "step": 21834
+ },
+ {
+ "epoch": 59.49591280653951,
+ "grad_norm": 3.4389383792877197,
+ "learning_rate": 7.439168501391103e-06,
+ "loss": 0.1837,
+ "step": 21835
+ },
+ {
+ "epoch": 59.49863760217983,
+ "grad_norm": 4.719254493713379,
+ "learning_rate": 7.438315443725919e-06,
+ "loss": 0.0572,
+ "step": 21836
+ },
+ {
+ "epoch": 59.50136239782017,
+ "grad_norm": 3.35953950881958,
+ "learning_rate": 7.437462406011048e-06,
+ "loss": 0.074,
+ "step": 21837
+ },
+ {
+ "epoch": 59.50408719346049,
+ "grad_norm": 4.480406761169434,
+ "learning_rate": 7.43660938825314e-06,
+ "loss": 0.0826,
+ "step": 21838
+ },
+ {
+ "epoch": 59.50681198910082,
+ "grad_norm": 4.066308498382568,
+ "learning_rate": 7.435756390458834e-06,
+ "loss": 0.089,
+ "step": 21839
+ },
+ {
+ "epoch": 59.509536784741144,
+ "grad_norm": 4.58651065826416,
+ "learning_rate": 7.4349034126347765e-06,
+ "loss": 0.1235,
+ "step": 21840
+ },
+ {
+ "epoch": 59.51226158038147,
+ "grad_norm": 3.3988780975341797,
+ "learning_rate": 7.4340504547876066e-06,
+ "loss": 0.196,
+ "step": 21841
+ },
+ {
+ "epoch": 59.514986376021795,
+ "grad_norm": 3.3992702960968018,
+ "learning_rate": 7.433197516923971e-06,
+ "loss": 0.1059,
+ "step": 21842
+ },
+ {
+ "epoch": 59.51771117166213,
+ "grad_norm": 3.836113929748535,
+ "learning_rate": 7.432344599050507e-06,
+ "loss": 0.0917,
+ "step": 21843
+ },
+ {
+ "epoch": 59.520435967302454,
+ "grad_norm": 3.456178665161133,
+ "learning_rate": 7.431491701173862e-06,
+ "loss": 0.1329,
+ "step": 21844
+ },
+ {
+ "epoch": 59.52316076294278,
+ "grad_norm": 3.428816318511963,
+ "learning_rate": 7.43063882330068e-06,
+ "loss": 0.1099,
+ "step": 21845
+ },
+ {
+ "epoch": 59.525885558583106,
+ "grad_norm": 3.238723039627075,
+ "learning_rate": 7.429785965437597e-06,
+ "loss": 0.13,
+ "step": 21846
+ },
+ {
+ "epoch": 59.52861035422343,
+ "grad_norm": 4.485742092132568,
+ "learning_rate": 7.42893312759126e-06,
+ "loss": 0.1619,
+ "step": 21847
+ },
+ {
+ "epoch": 59.53133514986376,
+ "grad_norm": 3.8060503005981445,
+ "learning_rate": 7.4280803097683086e-06,
+ "loss": 0.0648,
+ "step": 21848
+ },
+ {
+ "epoch": 59.53405994550409,
+ "grad_norm": 3.3967173099517822,
+ "learning_rate": 7.427227511975383e-06,
+ "loss": 0.0954,
+ "step": 21849
+ },
+ {
+ "epoch": 59.536784741144416,
+ "grad_norm": 3.5591654777526855,
+ "learning_rate": 7.426374734219131e-06,
+ "loss": 0.076,
+ "step": 21850
+ },
+ {
+ "epoch": 59.53950953678474,
+ "grad_norm": 6.30497407913208,
+ "learning_rate": 7.425521976506186e-06,
+ "loss": 0.1958,
+ "step": 21851
+ },
+ {
+ "epoch": 59.54223433242507,
+ "grad_norm": 3.986257553100586,
+ "learning_rate": 7.424669238843195e-06,
+ "loss": 0.1863,
+ "step": 21852
+ },
+ {
+ "epoch": 59.54495912806539,
+ "grad_norm": 3.7997138500213623,
+ "learning_rate": 7.423816521236795e-06,
+ "loss": 0.1201,
+ "step": 21853
+ },
+ {
+ "epoch": 59.54768392370572,
+ "grad_norm": 4.160584449768066,
+ "learning_rate": 7.4229638236936315e-06,
+ "loss": 0.1436,
+ "step": 21854
+ },
+ {
+ "epoch": 59.55040871934605,
+ "grad_norm": 4.1414618492126465,
+ "learning_rate": 7.422111146220342e-06,
+ "loss": 0.0686,
+ "step": 21855
+ },
+ {
+ "epoch": 59.55313351498638,
+ "grad_norm": 3.886396884918213,
+ "learning_rate": 7.421258488823568e-06,
+ "loss": 0.0863,
+ "step": 21856
+ },
+ {
+ "epoch": 59.555858310626704,
+ "grad_norm": 4.574501037597656,
+ "learning_rate": 7.42040585150995e-06,
+ "loss": 0.0976,
+ "step": 21857
+ },
+ {
+ "epoch": 59.55858310626703,
+ "grad_norm": 3.625762701034546,
+ "learning_rate": 7.419553234286129e-06,
+ "loss": 0.0833,
+ "step": 21858
+ },
+ {
+ "epoch": 59.561307901907355,
+ "grad_norm": 3.206472158432007,
+ "learning_rate": 7.418700637158742e-06,
+ "loss": 0.1783,
+ "step": 21859
+ },
+ {
+ "epoch": 59.56403269754768,
+ "grad_norm": 3.9687817096710205,
+ "learning_rate": 7.417848060134429e-06,
+ "loss": 0.2486,
+ "step": 21860
+ },
+ {
+ "epoch": 59.566757493188014,
+ "grad_norm": 3.5982322692871094,
+ "learning_rate": 7.416995503219837e-06,
+ "loss": 0.0667,
+ "step": 21861
+ },
+ {
+ "epoch": 59.56948228882834,
+ "grad_norm": 3.204102039337158,
+ "learning_rate": 7.416142966421599e-06,
+ "loss": 0.0469,
+ "step": 21862
+ },
+ {
+ "epoch": 59.572207084468666,
+ "grad_norm": 3.5523905754089355,
+ "learning_rate": 7.4152904497463575e-06,
+ "loss": 0.2118,
+ "step": 21863
+ },
+ {
+ "epoch": 59.57493188010899,
+ "grad_norm": 3.9007256031036377,
+ "learning_rate": 7.414437953200751e-06,
+ "loss": 0.0643,
+ "step": 21864
+ },
+ {
+ "epoch": 59.57765667574932,
+ "grad_norm": 5.8959736824035645,
+ "learning_rate": 7.413585476791418e-06,
+ "loss": 0.1617,
+ "step": 21865
+ },
+ {
+ "epoch": 59.58038147138964,
+ "grad_norm": 4.635599613189697,
+ "learning_rate": 7.412733020524997e-06,
+ "loss": 0.0736,
+ "step": 21866
+ },
+ {
+ "epoch": 59.583106267029976,
+ "grad_norm": 3.5214428901672363,
+ "learning_rate": 7.411880584408131e-06,
+ "loss": 0.2338,
+ "step": 21867
+ },
+ {
+ "epoch": 59.5858310626703,
+ "grad_norm": 4.32875394821167,
+ "learning_rate": 7.4110281684474515e-06,
+ "loss": 0.1346,
+ "step": 21868
+ },
+ {
+ "epoch": 59.58855585831063,
+ "grad_norm": 3.2541072368621826,
+ "learning_rate": 7.410175772649605e-06,
+ "loss": 0.1198,
+ "step": 21869
+ },
+ {
+ "epoch": 59.59128065395095,
+ "grad_norm": 5.001347064971924,
+ "learning_rate": 7.4093233970212245e-06,
+ "loss": 0.0656,
+ "step": 21870
+ },
+ {
+ "epoch": 59.59400544959128,
+ "grad_norm": 4.108007431030273,
+ "learning_rate": 7.40847104156895e-06,
+ "loss": 0.061,
+ "step": 21871
+ },
+ {
+ "epoch": 59.596730245231605,
+ "grad_norm": 3.7400007247924805,
+ "learning_rate": 7.40761870629942e-06,
+ "loss": 0.0729,
+ "step": 21872
+ },
+ {
+ "epoch": 59.59945504087194,
+ "grad_norm": 3.1615638732910156,
+ "learning_rate": 7.40676639121927e-06,
+ "loss": 0.1703,
+ "step": 21873
+ },
+ {
+ "epoch": 59.60217983651226,
+ "grad_norm": 4.166745185852051,
+ "learning_rate": 7.405914096335143e-06,
+ "loss": 0.131,
+ "step": 21874
+ },
+ {
+ "epoch": 59.60490463215259,
+ "grad_norm": 3.6109678745269775,
+ "learning_rate": 7.405061821653672e-06,
+ "loss": 0.1533,
+ "step": 21875
+ },
+ {
+ "epoch": 59.607629427792915,
+ "grad_norm": 4.113295078277588,
+ "learning_rate": 7.404209567181497e-06,
+ "loss": 0.159,
+ "step": 21876
+ },
+ {
+ "epoch": 59.61035422343324,
+ "grad_norm": 2.682974338531494,
+ "learning_rate": 7.403357332925251e-06,
+ "loss": 0.0432,
+ "step": 21877
+ },
+ {
+ "epoch": 59.61307901907357,
+ "grad_norm": 4.304617404937744,
+ "learning_rate": 7.402505118891575e-06,
+ "loss": 0.1348,
+ "step": 21878
+ },
+ {
+ "epoch": 59.6158038147139,
+ "grad_norm": 4.079246520996094,
+ "learning_rate": 7.40165292508711e-06,
+ "loss": 0.0517,
+ "step": 21879
+ },
+ {
+ "epoch": 59.618528610354225,
+ "grad_norm": 4.5099568367004395,
+ "learning_rate": 7.400800751518484e-06,
+ "loss": 0.0699,
+ "step": 21880
+ },
+ {
+ "epoch": 59.62125340599455,
+ "grad_norm": 4.95874547958374,
+ "learning_rate": 7.399948598192341e-06,
+ "loss": 0.0891,
+ "step": 21881
+ },
+ {
+ "epoch": 59.62397820163488,
+ "grad_norm": 3.754046678543091,
+ "learning_rate": 7.3990964651153144e-06,
+ "loss": 0.1493,
+ "step": 21882
+ },
+ {
+ "epoch": 59.6267029972752,
+ "grad_norm": 4.105714797973633,
+ "learning_rate": 7.39824435229404e-06,
+ "loss": 0.224,
+ "step": 21883
+ },
+ {
+ "epoch": 59.62942779291553,
+ "grad_norm": 3.4785470962524414,
+ "learning_rate": 7.397392259735155e-06,
+ "loss": 0.1122,
+ "step": 21884
+ },
+ {
+ "epoch": 59.63215258855586,
+ "grad_norm": 4.887084484100342,
+ "learning_rate": 7.396540187445296e-06,
+ "loss": 0.2015,
+ "step": 21885
+ },
+ {
+ "epoch": 59.63487738419619,
+ "grad_norm": 3.4088008403778076,
+ "learning_rate": 7.395688135431096e-06,
+ "loss": 0.1561,
+ "step": 21886
+ },
+ {
+ "epoch": 59.63760217983651,
+ "grad_norm": 6.81312894821167,
+ "learning_rate": 7.394836103699197e-06,
+ "loss": 0.1588,
+ "step": 21887
+ },
+ {
+ "epoch": 59.64032697547684,
+ "grad_norm": 4.069431781768799,
+ "learning_rate": 7.393984092256227e-06,
+ "loss": 0.1011,
+ "step": 21888
+ },
+ {
+ "epoch": 59.643051771117165,
+ "grad_norm": 6.171210289001465,
+ "learning_rate": 7.393132101108827e-06,
+ "loss": 0.1744,
+ "step": 21889
+ },
+ {
+ "epoch": 59.64577656675749,
+ "grad_norm": 3.589771032333374,
+ "learning_rate": 7.392280130263628e-06,
+ "loss": 0.0546,
+ "step": 21890
+ },
+ {
+ "epoch": 59.64850136239782,
+ "grad_norm": 3.006995677947998,
+ "learning_rate": 7.39142817972727e-06,
+ "loss": 0.0706,
+ "step": 21891
+ },
+ {
+ "epoch": 59.65122615803815,
+ "grad_norm": 2.884824752807617,
+ "learning_rate": 7.390576249506384e-06,
+ "loss": 0.05,
+ "step": 21892
+ },
+ {
+ "epoch": 59.653950953678475,
+ "grad_norm": 4.403576850891113,
+ "learning_rate": 7.389724339607606e-06,
+ "loss": 0.2201,
+ "step": 21893
+ },
+ {
+ "epoch": 59.6566757493188,
+ "grad_norm": 4.115321636199951,
+ "learning_rate": 7.388872450037572e-06,
+ "loss": 0.1991,
+ "step": 21894
+ },
+ {
+ "epoch": 59.65940054495913,
+ "grad_norm": 5.070188522338867,
+ "learning_rate": 7.38802058080291e-06,
+ "loss": 0.1135,
+ "step": 21895
+ },
+ {
+ "epoch": 59.66212534059945,
+ "grad_norm": 3.9264934062957764,
+ "learning_rate": 7.387168731910264e-06,
+ "loss": 0.2953,
+ "step": 21896
+ },
+ {
+ "epoch": 59.664850136239785,
+ "grad_norm": 23.98346710205078,
+ "learning_rate": 7.386316903366266e-06,
+ "loss": 0.0699,
+ "step": 21897
+ },
+ {
+ "epoch": 59.66757493188011,
+ "grad_norm": 4.844391345977783,
+ "learning_rate": 7.385465095177544e-06,
+ "loss": 0.1196,
+ "step": 21898
+ },
+ {
+ "epoch": 59.67029972752044,
+ "grad_norm": 3.194143533706665,
+ "learning_rate": 7.384613307350739e-06,
+ "loss": 0.0528,
+ "step": 21899
+ },
+ {
+ "epoch": 59.67302452316076,
+ "grad_norm": 4.888129234313965,
+ "learning_rate": 7.38376153989248e-06,
+ "loss": 0.1125,
+ "step": 21900
+ },
+ {
+ "epoch": 59.67574931880109,
+ "grad_norm": 4.619625568389893,
+ "learning_rate": 7.382909792809403e-06,
+ "loss": 0.1219,
+ "step": 21901
+ },
+ {
+ "epoch": 59.678474114441414,
+ "grad_norm": 3.538721799850464,
+ "learning_rate": 7.3820580661081375e-06,
+ "loss": 0.0601,
+ "step": 21902
+ },
+ {
+ "epoch": 59.68119891008175,
+ "grad_norm": 3.7365593910217285,
+ "learning_rate": 7.381206359795323e-06,
+ "loss": 0.0731,
+ "step": 21903
+ },
+ {
+ "epoch": 59.68392370572207,
+ "grad_norm": 3.50585675239563,
+ "learning_rate": 7.380354673877585e-06,
+ "loss": 0.1768,
+ "step": 21904
+ },
+ {
+ "epoch": 59.6866485013624,
+ "grad_norm": 4.8301239013671875,
+ "learning_rate": 7.379503008361565e-06,
+ "loss": 0.1422,
+ "step": 21905
+ },
+ {
+ "epoch": 59.689373297002724,
+ "grad_norm": 2.799285650253296,
+ "learning_rate": 7.378651363253888e-06,
+ "loss": 0.0722,
+ "step": 21906
+ },
+ {
+ "epoch": 59.69209809264305,
+ "grad_norm": 3.759619951248169,
+ "learning_rate": 7.377799738561192e-06,
+ "loss": 0.0821,
+ "step": 21907
+ },
+ {
+ "epoch": 59.694822888283376,
+ "grad_norm": 3.615964412689209,
+ "learning_rate": 7.376948134290105e-06,
+ "loss": 0.1244,
+ "step": 21908
+ },
+ {
+ "epoch": 59.69754768392371,
+ "grad_norm": 3.153252601623535,
+ "learning_rate": 7.376096550447265e-06,
+ "loss": 0.0886,
+ "step": 21909
+ },
+ {
+ "epoch": 59.700272479564035,
+ "grad_norm": 2.7910876274108887,
+ "learning_rate": 7.375244987039296e-06,
+ "loss": 0.0422,
+ "step": 21910
+ },
+ {
+ "epoch": 59.70299727520436,
+ "grad_norm": 4.728867530822754,
+ "learning_rate": 7.3743934440728385e-06,
+ "loss": 0.2137,
+ "step": 21911
+ },
+ {
+ "epoch": 59.705722070844686,
+ "grad_norm": 2.8954384326934814,
+ "learning_rate": 7.373541921554515e-06,
+ "loss": 0.0603,
+ "step": 21912
+ },
+ {
+ "epoch": 59.70844686648501,
+ "grad_norm": 3.641709566116333,
+ "learning_rate": 7.3726904194909655e-06,
+ "loss": 0.1728,
+ "step": 21913
+ },
+ {
+ "epoch": 59.71117166212534,
+ "grad_norm": 3.848088026046753,
+ "learning_rate": 7.3718389378888175e-06,
+ "loss": 0.1199,
+ "step": 21914
+ },
+ {
+ "epoch": 59.71389645776567,
+ "grad_norm": 3.926086187362671,
+ "learning_rate": 7.370987476754707e-06,
+ "loss": 0.0781,
+ "step": 21915
+ },
+ {
+ "epoch": 59.716621253406,
+ "grad_norm": 3.1481707096099854,
+ "learning_rate": 7.370136036095258e-06,
+ "loss": 0.1687,
+ "step": 21916
+ },
+ {
+ "epoch": 59.71934604904632,
+ "grad_norm": 3.281507968902588,
+ "learning_rate": 7.369284615917107e-06,
+ "loss": 0.3074,
+ "step": 21917
+ },
+ {
+ "epoch": 59.72207084468665,
+ "grad_norm": 3.6226589679718018,
+ "learning_rate": 7.368433216226881e-06,
+ "loss": 0.1139,
+ "step": 21918
+ },
+ {
+ "epoch": 59.724795640326974,
+ "grad_norm": 3.5362019538879395,
+ "learning_rate": 7.3675818370312145e-06,
+ "loss": 0.1129,
+ "step": 21919
+ },
+ {
+ "epoch": 59.7275204359673,
+ "grad_norm": 5.129333019256592,
+ "learning_rate": 7.3667304783367345e-06,
+ "loss": 0.2957,
+ "step": 21920
+ },
+ {
+ "epoch": 59.73024523160763,
+ "grad_norm": 3.0170693397521973,
+ "learning_rate": 7.365879140150074e-06,
+ "loss": 0.0705,
+ "step": 21921
+ },
+ {
+ "epoch": 59.73297002724796,
+ "grad_norm": 4.153504371643066,
+ "learning_rate": 7.36502782247786e-06,
+ "loss": 0.1186,
+ "step": 21922
+ },
+ {
+ "epoch": 59.735694822888284,
+ "grad_norm": 3.5138421058654785,
+ "learning_rate": 7.364176525326726e-06,
+ "loss": 0.1865,
+ "step": 21923
+ },
+ {
+ "epoch": 59.73841961852861,
+ "grad_norm": 3.734121561050415,
+ "learning_rate": 7.3633252487032995e-06,
+ "loss": 0.151,
+ "step": 21924
+ },
+ {
+ "epoch": 59.741144414168936,
+ "grad_norm": 4.205217361450195,
+ "learning_rate": 7.362473992614212e-06,
+ "loss": 0.1132,
+ "step": 21925
+ },
+ {
+ "epoch": 59.74386920980926,
+ "grad_norm": 3.6806509494781494,
+ "learning_rate": 7.361622757066092e-06,
+ "loss": 0.0675,
+ "step": 21926
+ },
+ {
+ "epoch": 59.746594005449595,
+ "grad_norm": 3.2617616653442383,
+ "learning_rate": 7.360771542065569e-06,
+ "loss": 0.0991,
+ "step": 21927
+ },
+ {
+ "epoch": 59.74931880108992,
+ "grad_norm": 5.201332092285156,
+ "learning_rate": 7.3599203476192716e-06,
+ "loss": 0.1436,
+ "step": 21928
+ },
+ {
+ "epoch": 59.752043596730246,
+ "grad_norm": 3.168055534362793,
+ "learning_rate": 7.3590691737338264e-06,
+ "loss": 0.1375,
+ "step": 21929
+ },
+ {
+ "epoch": 59.75476839237057,
+ "grad_norm": 3.6250600814819336,
+ "learning_rate": 7.35821802041587e-06,
+ "loss": 0.0624,
+ "step": 21930
+ },
+ {
+ "epoch": 59.7574931880109,
+ "grad_norm": 4.313841342926025,
+ "learning_rate": 7.357366887672025e-06,
+ "loss": 0.1178,
+ "step": 21931
+ },
+ {
+ "epoch": 59.76021798365122,
+ "grad_norm": 4.536067008972168,
+ "learning_rate": 7.356515775508924e-06,
+ "loss": 0.2123,
+ "step": 21932
+ },
+ {
+ "epoch": 59.762942779291556,
+ "grad_norm": 3.065178394317627,
+ "learning_rate": 7.35566468393319e-06,
+ "loss": 0.0482,
+ "step": 21933
+ },
+ {
+ "epoch": 59.76566757493188,
+ "grad_norm": 4.149610996246338,
+ "learning_rate": 7.354813612951457e-06,
+ "loss": 0.1382,
+ "step": 21934
+ },
+ {
+ "epoch": 59.76839237057221,
+ "grad_norm": 3.3267109394073486,
+ "learning_rate": 7.353962562570347e-06,
+ "loss": 0.0592,
+ "step": 21935
+ },
+ {
+ "epoch": 59.771117166212534,
+ "grad_norm": 3.2652664184570312,
+ "learning_rate": 7.353111532796493e-06,
+ "loss": 0.1259,
+ "step": 21936
+ },
+ {
+ "epoch": 59.77384196185286,
+ "grad_norm": 3.761549949645996,
+ "learning_rate": 7.352260523636523e-06,
+ "loss": 0.1538,
+ "step": 21937
+ },
+ {
+ "epoch": 59.776566757493185,
+ "grad_norm": 3.6344947814941406,
+ "learning_rate": 7.351409535097061e-06,
+ "loss": 0.0993,
+ "step": 21938
+ },
+ {
+ "epoch": 59.77929155313352,
+ "grad_norm": 5.851442337036133,
+ "learning_rate": 7.350558567184738e-06,
+ "loss": 0.1137,
+ "step": 21939
+ },
+ {
+ "epoch": 59.782016348773844,
+ "grad_norm": 3.915271282196045,
+ "learning_rate": 7.349707619906177e-06,
+ "loss": 0.0746,
+ "step": 21940
+ },
+ {
+ "epoch": 59.78474114441417,
+ "grad_norm": 4.664577484130859,
+ "learning_rate": 7.348856693268011e-06,
+ "loss": 0.0618,
+ "step": 21941
+ },
+ {
+ "epoch": 59.787465940054496,
+ "grad_norm": 3.6140897274017334,
+ "learning_rate": 7.348005787276861e-06,
+ "loss": 0.0537,
+ "step": 21942
+ },
+ {
+ "epoch": 59.79019073569482,
+ "grad_norm": 2.723332643508911,
+ "learning_rate": 7.347154901939358e-06,
+ "loss": 0.0602,
+ "step": 21943
+ },
+ {
+ "epoch": 59.79291553133515,
+ "grad_norm": 3.181187152862549,
+ "learning_rate": 7.346304037262127e-06,
+ "loss": 0.0488,
+ "step": 21944
+ },
+ {
+ "epoch": 59.79564032697548,
+ "grad_norm": 5.005062580108643,
+ "learning_rate": 7.345453193251795e-06,
+ "loss": 0.0624,
+ "step": 21945
+ },
+ {
+ "epoch": 59.798365122615806,
+ "grad_norm": 4.6376423835754395,
+ "learning_rate": 7.344602369914984e-06,
+ "loss": 0.1224,
+ "step": 21946
+ },
+ {
+ "epoch": 59.80108991825613,
+ "grad_norm": 5.750683784484863,
+ "learning_rate": 7.343751567258328e-06,
+ "loss": 0.1832,
+ "step": 21947
+ },
+ {
+ "epoch": 59.80381471389646,
+ "grad_norm": 3.7080774307250977,
+ "learning_rate": 7.34290078528845e-06,
+ "loss": 0.1166,
+ "step": 21948
+ },
+ {
+ "epoch": 59.80653950953678,
+ "grad_norm": 4.58156681060791,
+ "learning_rate": 7.342050024011973e-06,
+ "loss": 0.144,
+ "step": 21949
+ },
+ {
+ "epoch": 59.80926430517711,
+ "grad_norm": 2.935380458831787,
+ "learning_rate": 7.3411992834355276e-06,
+ "loss": 0.053,
+ "step": 21950
+ },
+ {
+ "epoch": 59.81198910081744,
+ "grad_norm": 5.052936553955078,
+ "learning_rate": 7.340348563565735e-06,
+ "loss": 0.1395,
+ "step": 21951
+ },
+ {
+ "epoch": 59.81471389645777,
+ "grad_norm": 4.201597213745117,
+ "learning_rate": 7.339497864409223e-06,
+ "loss": 0.0573,
+ "step": 21952
+ },
+ {
+ "epoch": 59.817438692098094,
+ "grad_norm": 3.823265790939331,
+ "learning_rate": 7.338647185972614e-06,
+ "loss": 0.0551,
+ "step": 21953
+ },
+ {
+ "epoch": 59.82016348773842,
+ "grad_norm": 4.828398704528809,
+ "learning_rate": 7.337796528262537e-06,
+ "loss": 0.1576,
+ "step": 21954
+ },
+ {
+ "epoch": 59.822888283378745,
+ "grad_norm": 3.4092397689819336,
+ "learning_rate": 7.336945891285614e-06,
+ "loss": 0.05,
+ "step": 21955
+ },
+ {
+ "epoch": 59.82561307901907,
+ "grad_norm": 5.1029863357543945,
+ "learning_rate": 7.336095275048474e-06,
+ "loss": 0.1454,
+ "step": 21956
+ },
+ {
+ "epoch": 59.828337874659404,
+ "grad_norm": 3.9042434692382812,
+ "learning_rate": 7.3352446795577336e-06,
+ "loss": 0.1659,
+ "step": 21957
+ },
+ {
+ "epoch": 59.83106267029973,
+ "grad_norm": 3.6238622665405273,
+ "learning_rate": 7.334394104820024e-06,
+ "loss": 0.0742,
+ "step": 21958
+ },
+ {
+ "epoch": 59.833787465940055,
+ "grad_norm": 12.98780345916748,
+ "learning_rate": 7.333543550841966e-06,
+ "loss": 0.1047,
+ "step": 21959
+ },
+ {
+ "epoch": 59.83651226158038,
+ "grad_norm": 6.426098823547363,
+ "learning_rate": 7.332693017630185e-06,
+ "loss": 0.1479,
+ "step": 21960
+ },
+ {
+ "epoch": 59.83923705722071,
+ "grad_norm": 3.744154214859009,
+ "learning_rate": 7.331842505191308e-06,
+ "loss": 0.0855,
+ "step": 21961
+ },
+ {
+ "epoch": 59.84196185286103,
+ "grad_norm": 8.704964637756348,
+ "learning_rate": 7.330992013531952e-06,
+ "loss": 0.1569,
+ "step": 21962
+ },
+ {
+ "epoch": 59.844686648501366,
+ "grad_norm": 5.0485944747924805,
+ "learning_rate": 7.330141542658747e-06,
+ "loss": 0.1304,
+ "step": 21963
+ },
+ {
+ "epoch": 59.84741144414169,
+ "grad_norm": 4.686516761779785,
+ "learning_rate": 7.32929109257831e-06,
+ "loss": 0.0861,
+ "step": 21964
+ },
+ {
+ "epoch": 59.85013623978202,
+ "grad_norm": 4.361832618713379,
+ "learning_rate": 7.328440663297269e-06,
+ "loss": 0.2178,
+ "step": 21965
+ },
+ {
+ "epoch": 59.85286103542234,
+ "grad_norm": 4.1770501136779785,
+ "learning_rate": 7.32759025482225e-06,
+ "loss": 0.098,
+ "step": 21966
+ },
+ {
+ "epoch": 59.85558583106267,
+ "grad_norm": 2.7962067127227783,
+ "learning_rate": 7.3267398671598685e-06,
+ "loss": 0.0984,
+ "step": 21967
+ },
+ {
+ "epoch": 59.858310626702995,
+ "grad_norm": 3.77594256401062,
+ "learning_rate": 7.325889500316754e-06,
+ "loss": 0.169,
+ "step": 21968
+ },
+ {
+ "epoch": 59.86103542234333,
+ "grad_norm": 5.534327507019043,
+ "learning_rate": 7.325039154299522e-06,
+ "loss": 0.2511,
+ "step": 21969
+ },
+ {
+ "epoch": 59.86376021798365,
+ "grad_norm": 3.6949567794799805,
+ "learning_rate": 7.324188829114804e-06,
+ "loss": 0.2434,
+ "step": 21970
+ },
+ {
+ "epoch": 59.86648501362398,
+ "grad_norm": 6.855175018310547,
+ "learning_rate": 7.323338524769212e-06,
+ "loss": 0.0748,
+ "step": 21971
+ },
+ {
+ "epoch": 59.869209809264305,
+ "grad_norm": 3.2030975818634033,
+ "learning_rate": 7.322488241269379e-06,
+ "loss": 0.0537,
+ "step": 21972
+ },
+ {
+ "epoch": 59.87193460490463,
+ "grad_norm": 5.0401387214660645,
+ "learning_rate": 7.321637978621916e-06,
+ "loss": 0.1184,
+ "step": 21973
+ },
+ {
+ "epoch": 59.87465940054496,
+ "grad_norm": 4.25337553024292,
+ "learning_rate": 7.320787736833455e-06,
+ "loss": 0.1038,
+ "step": 21974
+ },
+ {
+ "epoch": 59.87738419618529,
+ "grad_norm": 4.143477439880371,
+ "learning_rate": 7.319937515910609e-06,
+ "loss": 0.1226,
+ "step": 21975
+ },
+ {
+ "epoch": 59.880108991825615,
+ "grad_norm": 4.022922515869141,
+ "learning_rate": 7.319087315860005e-06,
+ "loss": 0.0766,
+ "step": 21976
+ },
+ {
+ "epoch": 59.88283378746594,
+ "grad_norm": 3.7847626209259033,
+ "learning_rate": 7.318237136688262e-06,
+ "loss": 0.0651,
+ "step": 21977
+ },
+ {
+ "epoch": 59.88555858310627,
+ "grad_norm": 3.106093645095825,
+ "learning_rate": 7.317386978402003e-06,
+ "loss": 0.0693,
+ "step": 21978
+ },
+ {
+ "epoch": 59.88828337874659,
+ "grad_norm": 4.657619953155518,
+ "learning_rate": 7.316536841007847e-06,
+ "loss": 0.1568,
+ "step": 21979
+ },
+ {
+ "epoch": 59.89100817438692,
+ "grad_norm": 4.844773292541504,
+ "learning_rate": 7.3156867245124175e-06,
+ "loss": 0.1726,
+ "step": 21980
+ },
+ {
+ "epoch": 59.89373297002725,
+ "grad_norm": 2.992464303970337,
+ "learning_rate": 7.314836628922326e-06,
+ "loss": 0.1088,
+ "step": 21981
+ },
+ {
+ "epoch": 59.89645776566758,
+ "grad_norm": 4.16619348526001,
+ "learning_rate": 7.313986554244208e-06,
+ "loss": 0.1272,
+ "step": 21982
+ },
+ {
+ "epoch": 59.8991825613079,
+ "grad_norm": 3.4509432315826416,
+ "learning_rate": 7.313136500484673e-06,
+ "loss": 0.0958,
+ "step": 21983
+ },
+ {
+ "epoch": 59.90190735694823,
+ "grad_norm": 3.953277111053467,
+ "learning_rate": 7.312286467650347e-06,
+ "loss": 0.0955,
+ "step": 21984
+ },
+ {
+ "epoch": 59.904632152588555,
+ "grad_norm": 3.0407843589782715,
+ "learning_rate": 7.311436455747847e-06,
+ "loss": 0.0777,
+ "step": 21985
+ },
+ {
+ "epoch": 59.90735694822888,
+ "grad_norm": 3.9172523021698,
+ "learning_rate": 7.3105864647837934e-06,
+ "loss": 0.0896,
+ "step": 21986
+ },
+ {
+ "epoch": 59.91008174386921,
+ "grad_norm": 5.004632472991943,
+ "learning_rate": 7.309736494764804e-06,
+ "loss": 0.1148,
+ "step": 21987
+ },
+ {
+ "epoch": 59.91280653950954,
+ "grad_norm": 3.2358882427215576,
+ "learning_rate": 7.308886545697502e-06,
+ "loss": 0.2064,
+ "step": 21988
+ },
+ {
+ "epoch": 59.915531335149865,
+ "grad_norm": 4.379899501800537,
+ "learning_rate": 7.308036617588504e-06,
+ "loss": 0.0795,
+ "step": 21989
+ },
+ {
+ "epoch": 59.91825613079019,
+ "grad_norm": 3.341609477996826,
+ "learning_rate": 7.307186710444432e-06,
+ "loss": 0.1664,
+ "step": 21990
+ },
+ {
+ "epoch": 59.920980926430516,
+ "grad_norm": 3.8921256065368652,
+ "learning_rate": 7.3063368242719005e-06,
+ "loss": 0.1101,
+ "step": 21991
+ },
+ {
+ "epoch": 59.92370572207084,
+ "grad_norm": 3.9960689544677734,
+ "learning_rate": 7.3054869590775344e-06,
+ "loss": 0.0649,
+ "step": 21992
+ },
+ {
+ "epoch": 59.926430517711175,
+ "grad_norm": 3.2175517082214355,
+ "learning_rate": 7.304637114867946e-06,
+ "loss": 0.1003,
+ "step": 21993
+ },
+ {
+ "epoch": 59.9291553133515,
+ "grad_norm": 3.395170211791992,
+ "learning_rate": 7.30378729164976e-06,
+ "loss": 0.0413,
+ "step": 21994
+ },
+ {
+ "epoch": 59.93188010899183,
+ "grad_norm": 4.161465167999268,
+ "learning_rate": 7.302937489429589e-06,
+ "loss": 0.0669,
+ "step": 21995
+ },
+ {
+ "epoch": 59.93460490463215,
+ "grad_norm": 3.115039587020874,
+ "learning_rate": 7.302087708214056e-06,
+ "loss": 0.1485,
+ "step": 21996
+ },
+ {
+ "epoch": 59.93732970027248,
+ "grad_norm": 3.1612086296081543,
+ "learning_rate": 7.301237948009775e-06,
+ "loss": 0.0508,
+ "step": 21997
+ },
+ {
+ "epoch": 59.940054495912804,
+ "grad_norm": 6.413022518157959,
+ "learning_rate": 7.3003882088233635e-06,
+ "loss": 0.2392,
+ "step": 21998
+ },
+ {
+ "epoch": 59.94277929155314,
+ "grad_norm": 4.683806419372559,
+ "learning_rate": 7.299538490661446e-06,
+ "loss": 0.1101,
+ "step": 21999
+ },
+ {
+ "epoch": 59.94550408719346,
+ "grad_norm": 4.365520000457764,
+ "learning_rate": 7.298688793530635e-06,
+ "loss": 0.1686,
+ "step": 22000
+ },
+ {
+ "epoch": 59.94822888283379,
+ "grad_norm": 3.62276554107666,
+ "learning_rate": 7.297839117437549e-06,
+ "loss": 0.1164,
+ "step": 22001
+ },
+ {
+ "epoch": 59.950953678474114,
+ "grad_norm": 4.794510364532471,
+ "learning_rate": 7.296989462388806e-06,
+ "loss": 0.2839,
+ "step": 22002
+ },
+ {
+ "epoch": 59.95367847411444,
+ "grad_norm": 3.246356964111328,
+ "learning_rate": 7.2961398283910204e-06,
+ "loss": 0.1993,
+ "step": 22003
+ },
+ {
+ "epoch": 59.956403269754766,
+ "grad_norm": 4.223857879638672,
+ "learning_rate": 7.295290215450812e-06,
+ "loss": 0.0891,
+ "step": 22004
+ },
+ {
+ "epoch": 59.95912806539509,
+ "grad_norm": 5.262650966644287,
+ "learning_rate": 7.2944406235747945e-06,
+ "loss": 0.1266,
+ "step": 22005
+ },
+ {
+ "epoch": 59.961852861035425,
+ "grad_norm": 3.6192314624786377,
+ "learning_rate": 7.293591052769589e-06,
+ "loss": 0.1053,
+ "step": 22006
+ },
+ {
+ "epoch": 59.96457765667575,
+ "grad_norm": 3.421889543533325,
+ "learning_rate": 7.292741503041807e-06,
+ "loss": 0.0818,
+ "step": 22007
+ },
+ {
+ "epoch": 59.967302452316076,
+ "grad_norm": 3.889723777770996,
+ "learning_rate": 7.2918919743980685e-06,
+ "loss": 0.1904,
+ "step": 22008
+ },
+ {
+ "epoch": 59.9700272479564,
+ "grad_norm": 7.882750511169434,
+ "learning_rate": 7.291042466844986e-06,
+ "loss": 0.0924,
+ "step": 22009
+ },
+ {
+ "epoch": 59.97275204359673,
+ "grad_norm": 4.6614670753479,
+ "learning_rate": 7.290192980389182e-06,
+ "loss": 0.1675,
+ "step": 22010
+ },
+ {
+ "epoch": 59.97547683923706,
+ "grad_norm": 4.777350902557373,
+ "learning_rate": 7.289343515037263e-06,
+ "loss": 0.1633,
+ "step": 22011
+ },
+ {
+ "epoch": 59.97820163487739,
+ "grad_norm": 3.8556883335113525,
+ "learning_rate": 7.288494070795853e-06,
+ "loss": 0.0764,
+ "step": 22012
+ },
+ {
+ "epoch": 59.98092643051771,
+ "grad_norm": 2.663574695587158,
+ "learning_rate": 7.287644647671561e-06,
+ "loss": 0.1514,
+ "step": 22013
+ },
+ {
+ "epoch": 59.98365122615804,
+ "grad_norm": 3.57833194732666,
+ "learning_rate": 7.2867952456710075e-06,
+ "loss": 0.1716,
+ "step": 22014
+ },
+ {
+ "epoch": 59.986376021798364,
+ "grad_norm": 4.133760929107666,
+ "learning_rate": 7.2859458648008005e-06,
+ "loss": 0.1235,
+ "step": 22015
+ },
+ {
+ "epoch": 59.98910081743869,
+ "grad_norm": 3.7926201820373535,
+ "learning_rate": 7.285096505067564e-06,
+ "loss": 0.2471,
+ "step": 22016
+ },
+ {
+ "epoch": 59.991825613079016,
+ "grad_norm": 5.786928176879883,
+ "learning_rate": 7.284247166477909e-06,
+ "loss": 0.1275,
+ "step": 22017
+ },
+ {
+ "epoch": 59.99455040871935,
+ "grad_norm": 4.353601932525635,
+ "learning_rate": 7.283397849038447e-06,
+ "loss": 0.232,
+ "step": 22018
+ },
+ {
+ "epoch": 59.997275204359674,
+ "grad_norm": 3.548330307006836,
+ "learning_rate": 7.282548552755799e-06,
+ "loss": 0.0597,
+ "step": 22019
+ },
+ {
+ "epoch": 60.0,
+ "grad_norm": 4.561960697174072,
+ "learning_rate": 7.2816992776365714e-06,
+ "loss": 0.064,
+ "step": 22020
+ },
+ {
+ "epoch": 60.002724795640326,
+ "grad_norm": 9.981670379638672,
+ "learning_rate": 7.280850023687387e-06,
+ "loss": 0.1695,
+ "step": 22021
+ },
+ {
+ "epoch": 60.00544959128065,
+ "grad_norm": 5.571465492248535,
+ "learning_rate": 7.280000790914851e-06,
+ "loss": 0.1023,
+ "step": 22022
+ },
+ {
+ "epoch": 60.00817438692098,
+ "grad_norm": 2.7264788150787354,
+ "learning_rate": 7.27915157932558e-06,
+ "loss": 0.2045,
+ "step": 22023
+ },
+ {
+ "epoch": 60.01089918256131,
+ "grad_norm": 3.745054244995117,
+ "learning_rate": 7.278302388926194e-06,
+ "loss": 0.068,
+ "step": 22024
+ },
+ {
+ "epoch": 60.013623978201636,
+ "grad_norm": 4.376850605010986,
+ "learning_rate": 7.277453219723298e-06,
+ "loss": 0.1635,
+ "step": 22025
+ },
+ {
+ "epoch": 60.01634877384196,
+ "grad_norm": 12.780744552612305,
+ "learning_rate": 7.276604071723511e-06,
+ "loss": 0.1066,
+ "step": 22026
+ },
+ {
+ "epoch": 60.01907356948229,
+ "grad_norm": 3.120161771774292,
+ "learning_rate": 7.275754944933442e-06,
+ "loss": 0.0925,
+ "step": 22027
+ },
+ {
+ "epoch": 60.02179836512261,
+ "grad_norm": 4.451543807983398,
+ "learning_rate": 7.274905839359707e-06,
+ "loss": 0.0965,
+ "step": 22028
+ },
+ {
+ "epoch": 60.02452316076294,
+ "grad_norm": 3.282378911972046,
+ "learning_rate": 7.274056755008916e-06,
+ "loss": 0.3144,
+ "step": 22029
+ },
+ {
+ "epoch": 60.02724795640327,
+ "grad_norm": 4.26405143737793,
+ "learning_rate": 7.273207691887685e-06,
+ "loss": 0.106,
+ "step": 22030
+ },
+ {
+ "epoch": 60.0299727520436,
+ "grad_norm": 4.883692741394043,
+ "learning_rate": 7.272358650002623e-06,
+ "loss": 0.1461,
+ "step": 22031
+ },
+ {
+ "epoch": 60.032697547683924,
+ "grad_norm": 2.7487285137176514,
+ "learning_rate": 7.271509629360343e-06,
+ "loss": 0.0393,
+ "step": 22032
+ },
+ {
+ "epoch": 60.03542234332425,
+ "grad_norm": 2.9640891551971436,
+ "learning_rate": 7.270660629967461e-06,
+ "loss": 0.0767,
+ "step": 22033
+ },
+ {
+ "epoch": 60.038147138964575,
+ "grad_norm": 3.9891130924224854,
+ "learning_rate": 7.269811651830584e-06,
+ "loss": 0.0686,
+ "step": 22034
+ },
+ {
+ "epoch": 60.0408719346049,
+ "grad_norm": 6.4960103034973145,
+ "learning_rate": 7.268962694956329e-06,
+ "loss": 0.221,
+ "step": 22035
+ },
+ {
+ "epoch": 60.043596730245234,
+ "grad_norm": 2.927238941192627,
+ "learning_rate": 7.2681137593513005e-06,
+ "loss": 0.1274,
+ "step": 22036
+ },
+ {
+ "epoch": 60.04632152588556,
+ "grad_norm": 2.9344594478607178,
+ "learning_rate": 7.2672648450221195e-06,
+ "loss": 0.0531,
+ "step": 22037
+ },
+ {
+ "epoch": 60.049046321525886,
+ "grad_norm": 6.458965301513672,
+ "learning_rate": 7.266415951975388e-06,
+ "loss": 0.1501,
+ "step": 22038
+ },
+ {
+ "epoch": 60.05177111716621,
+ "grad_norm": 2.0938048362731934,
+ "learning_rate": 7.265567080217723e-06,
+ "loss": 0.0368,
+ "step": 22039
+ },
+ {
+ "epoch": 60.05449591280654,
+ "grad_norm": 6.481177806854248,
+ "learning_rate": 7.264718229755731e-06,
+ "loss": 0.0939,
+ "step": 22040
+ },
+ {
+ "epoch": 60.05722070844686,
+ "grad_norm": 3.4094817638397217,
+ "learning_rate": 7.263869400596028e-06,
+ "loss": 0.1864,
+ "step": 22041
+ },
+ {
+ "epoch": 60.059945504087196,
+ "grad_norm": 3.0574076175689697,
+ "learning_rate": 7.26302059274522e-06,
+ "loss": 0.0507,
+ "step": 22042
+ },
+ {
+ "epoch": 60.06267029972752,
+ "grad_norm": 3.760446310043335,
+ "learning_rate": 7.262171806209924e-06,
+ "loss": 0.0899,
+ "step": 22043
+ },
+ {
+ "epoch": 60.06539509536785,
+ "grad_norm": 4.761295318603516,
+ "learning_rate": 7.261323040996739e-06,
+ "loss": 0.1372,
+ "step": 22044
+ },
+ {
+ "epoch": 60.06811989100817,
+ "grad_norm": 4.419173717498779,
+ "learning_rate": 7.260474297112286e-06,
+ "loss": 0.1579,
+ "step": 22045
+ },
+ {
+ "epoch": 60.0708446866485,
+ "grad_norm": 3.5458569526672363,
+ "learning_rate": 7.259625574563172e-06,
+ "loss": 0.055,
+ "step": 22046
+ },
+ {
+ "epoch": 60.073569482288825,
+ "grad_norm": 5.580803394317627,
+ "learning_rate": 7.258776873356003e-06,
+ "loss": 0.054,
+ "step": 22047
+ },
+ {
+ "epoch": 60.07629427792916,
+ "grad_norm": 4.740196228027344,
+ "learning_rate": 7.257928193497394e-06,
+ "loss": 0.1395,
+ "step": 22048
+ },
+ {
+ "epoch": 60.079019073569484,
+ "grad_norm": 3.0760657787323,
+ "learning_rate": 7.257079534993949e-06,
+ "loss": 0.1613,
+ "step": 22049
+ },
+ {
+ "epoch": 60.08174386920981,
+ "grad_norm": 5.045286178588867,
+ "learning_rate": 7.2562308978522784e-06,
+ "loss": 0.1632,
+ "step": 22050
+ },
+ {
+ "epoch": 60.084468664850135,
+ "grad_norm": 3.709996461868286,
+ "learning_rate": 7.255382282079e-06,
+ "loss": 0.0966,
+ "step": 22051
+ },
+ {
+ "epoch": 60.08719346049046,
+ "grad_norm": 2.9020793437957764,
+ "learning_rate": 7.254533687680712e-06,
+ "loss": 0.0437,
+ "step": 22052
+ },
+ {
+ "epoch": 60.08991825613079,
+ "grad_norm": 6.386335849761963,
+ "learning_rate": 7.253685114664029e-06,
+ "loss": 0.1422,
+ "step": 22053
+ },
+ {
+ "epoch": 60.09264305177112,
+ "grad_norm": 5.222840309143066,
+ "learning_rate": 7.252836563035557e-06,
+ "loss": 0.1472,
+ "step": 22054
+ },
+ {
+ "epoch": 60.095367847411445,
+ "grad_norm": 8.410630226135254,
+ "learning_rate": 7.251988032801906e-06,
+ "loss": 0.1042,
+ "step": 22055
+ },
+ {
+ "epoch": 60.09809264305177,
+ "grad_norm": 4.177931308746338,
+ "learning_rate": 7.251139523969683e-06,
+ "loss": 0.0703,
+ "step": 22056
+ },
+ {
+ "epoch": 60.1008174386921,
+ "grad_norm": 5.191798210144043,
+ "learning_rate": 7.2502910365454985e-06,
+ "loss": 0.2655,
+ "step": 22057
+ },
+ {
+ "epoch": 60.10354223433242,
+ "grad_norm": 3.9571166038513184,
+ "learning_rate": 7.249442570535956e-06,
+ "loss": 0.31,
+ "step": 22058
+ },
+ {
+ "epoch": 60.10626702997275,
+ "grad_norm": 3.569178342819214,
+ "learning_rate": 7.24859412594767e-06,
+ "loss": 0.1664,
+ "step": 22059
+ },
+ {
+ "epoch": 60.10899182561308,
+ "grad_norm": 2.9958372116088867,
+ "learning_rate": 7.247745702787241e-06,
+ "loss": 0.0885,
+ "step": 22060
+ },
+ {
+ "epoch": 60.11171662125341,
+ "grad_norm": 3.663642168045044,
+ "learning_rate": 7.246897301061282e-06,
+ "loss": 0.2168,
+ "step": 22061
+ },
+ {
+ "epoch": 60.11444141689373,
+ "grad_norm": 3.5634939670562744,
+ "learning_rate": 7.2460489207763965e-06,
+ "loss": 0.117,
+ "step": 22062
+ },
+ {
+ "epoch": 60.11716621253406,
+ "grad_norm": 4.0436482429504395,
+ "learning_rate": 7.245200561939196e-06,
+ "loss": 0.0934,
+ "step": 22063
+ },
+ {
+ "epoch": 60.119891008174385,
+ "grad_norm": 3.052210807800293,
+ "learning_rate": 7.244352224556281e-06,
+ "loss": 0.1476,
+ "step": 22064
+ },
+ {
+ "epoch": 60.12261580381471,
+ "grad_norm": 3.5404224395751953,
+ "learning_rate": 7.243503908634266e-06,
+ "loss": 0.0699,
+ "step": 22065
+ },
+ {
+ "epoch": 60.12534059945504,
+ "grad_norm": 2.996366500854492,
+ "learning_rate": 7.2426556141797525e-06,
+ "loss": 0.1023,
+ "step": 22066
+ },
+ {
+ "epoch": 60.12806539509537,
+ "grad_norm": 4.221047401428223,
+ "learning_rate": 7.241807341199345e-06,
+ "loss": 0.2897,
+ "step": 22067
+ },
+ {
+ "epoch": 60.130790190735695,
+ "grad_norm": 4.326673984527588,
+ "learning_rate": 7.240959089699655e-06,
+ "loss": 0.1031,
+ "step": 22068
+ },
+ {
+ "epoch": 60.13351498637602,
+ "grad_norm": 3.4288883209228516,
+ "learning_rate": 7.2401108596872885e-06,
+ "loss": 0.0897,
+ "step": 22069
+ },
+ {
+ "epoch": 60.13623978201635,
+ "grad_norm": 2.740156650543213,
+ "learning_rate": 7.239262651168848e-06,
+ "loss": 0.0967,
+ "step": 22070
+ },
+ {
+ "epoch": 60.13896457765667,
+ "grad_norm": 3.2299089431762695,
+ "learning_rate": 7.238414464150945e-06,
+ "loss": 0.0601,
+ "step": 22071
+ },
+ {
+ "epoch": 60.141689373297005,
+ "grad_norm": 3.3907079696655273,
+ "learning_rate": 7.237566298640178e-06,
+ "loss": 0.1046,
+ "step": 22072
+ },
+ {
+ "epoch": 60.14441416893733,
+ "grad_norm": 6.267420768737793,
+ "learning_rate": 7.2367181546431565e-06,
+ "loss": 0.0843,
+ "step": 22073
+ },
+ {
+ "epoch": 60.14713896457766,
+ "grad_norm": 3.6383748054504395,
+ "learning_rate": 7.2358700321664845e-06,
+ "loss": 0.0925,
+ "step": 22074
+ },
+ {
+ "epoch": 60.14986376021798,
+ "grad_norm": 4.796145439147949,
+ "learning_rate": 7.2350219312167695e-06,
+ "loss": 0.0666,
+ "step": 22075
+ },
+ {
+ "epoch": 60.15258855585831,
+ "grad_norm": 3.1013946533203125,
+ "learning_rate": 7.234173851800612e-06,
+ "loss": 0.1023,
+ "step": 22076
+ },
+ {
+ "epoch": 60.155313351498634,
+ "grad_norm": 3.4992892742156982,
+ "learning_rate": 7.2333257939246226e-06,
+ "loss": 0.0661,
+ "step": 22077
+ },
+ {
+ "epoch": 60.15803814713897,
+ "grad_norm": 3.698241949081421,
+ "learning_rate": 7.2324777575954e-06,
+ "loss": 0.0531,
+ "step": 22078
+ },
+ {
+ "epoch": 60.16076294277929,
+ "grad_norm": 4.444230079650879,
+ "learning_rate": 7.231629742819554e-06,
+ "loss": 0.143,
+ "step": 22079
+ },
+ {
+ "epoch": 60.16348773841962,
+ "grad_norm": 4.365219593048096,
+ "learning_rate": 7.230781749603685e-06,
+ "loss": 0.0715,
+ "step": 22080
+ },
+ {
+ "epoch": 60.166212534059945,
+ "grad_norm": 3.577834129333496,
+ "learning_rate": 7.2299337779543995e-06,
+ "loss": 0.2797,
+ "step": 22081
+ },
+ {
+ "epoch": 60.16893732970027,
+ "grad_norm": 4.878407001495361,
+ "learning_rate": 7.2290858278783e-06,
+ "loss": 0.1666,
+ "step": 22082
+ },
+ {
+ "epoch": 60.171662125340596,
+ "grad_norm": 4.7122802734375,
+ "learning_rate": 7.2282378993819916e-06,
+ "loss": 0.0753,
+ "step": 22083
+ },
+ {
+ "epoch": 60.17438692098093,
+ "grad_norm": 3.255444288253784,
+ "learning_rate": 7.227389992472073e-06,
+ "loss": 0.1144,
+ "step": 22084
+ },
+ {
+ "epoch": 60.177111716621255,
+ "grad_norm": 4.510351181030273,
+ "learning_rate": 7.226542107155154e-06,
+ "loss": 0.1177,
+ "step": 22085
+ },
+ {
+ "epoch": 60.17983651226158,
+ "grad_norm": 6.7560601234436035,
+ "learning_rate": 7.2256942434378395e-06,
+ "loss": 0.089,
+ "step": 22086
+ },
+ {
+ "epoch": 60.182561307901906,
+ "grad_norm": 2.752912998199463,
+ "learning_rate": 7.224846401326725e-06,
+ "loss": 0.0446,
+ "step": 22087
+ },
+ {
+ "epoch": 60.18528610354223,
+ "grad_norm": 3.046994924545288,
+ "learning_rate": 7.223998580828418e-06,
+ "loss": 0.1037,
+ "step": 22088
+ },
+ {
+ "epoch": 60.18801089918256,
+ "grad_norm": 3.984055757522583,
+ "learning_rate": 7.223150781949524e-06,
+ "loss": 0.1455,
+ "step": 22089
+ },
+ {
+ "epoch": 60.19073569482289,
+ "grad_norm": 3.351414918899536,
+ "learning_rate": 7.222303004696638e-06,
+ "loss": 0.0956,
+ "step": 22090
+ },
+ {
+ "epoch": 60.19346049046322,
+ "grad_norm": 3.3346078395843506,
+ "learning_rate": 7.22145524907637e-06,
+ "loss": 0.0917,
+ "step": 22091
+ },
+ {
+ "epoch": 60.19618528610354,
+ "grad_norm": 2.8271543979644775,
+ "learning_rate": 7.220607515095317e-06,
+ "loss": 0.1488,
+ "step": 22092
+ },
+ {
+ "epoch": 60.19891008174387,
+ "grad_norm": 2.8824541568756104,
+ "learning_rate": 7.219759802760085e-06,
+ "loss": 0.0432,
+ "step": 22093
+ },
+ {
+ "epoch": 60.201634877384194,
+ "grad_norm": 3.8971989154815674,
+ "learning_rate": 7.2189121120772735e-06,
+ "loss": 0.0515,
+ "step": 22094
+ },
+ {
+ "epoch": 60.20435967302452,
+ "grad_norm": 5.140842437744141,
+ "learning_rate": 7.218064443053485e-06,
+ "loss": 0.0583,
+ "step": 22095
+ },
+ {
+ "epoch": 60.20708446866485,
+ "grad_norm": 5.072154521942139,
+ "learning_rate": 7.217216795695321e-06,
+ "loss": 0.0774,
+ "step": 22096
+ },
+ {
+ "epoch": 60.20980926430518,
+ "grad_norm": 2.937187910079956,
+ "learning_rate": 7.216369170009384e-06,
+ "loss": 0.0567,
+ "step": 22097
+ },
+ {
+ "epoch": 60.212534059945504,
+ "grad_norm": 6.213933944702148,
+ "learning_rate": 7.215521566002273e-06,
+ "loss": 0.119,
+ "step": 22098
+ },
+ {
+ "epoch": 60.21525885558583,
+ "grad_norm": 3.187241554260254,
+ "learning_rate": 7.214673983680591e-06,
+ "loss": 0.0503,
+ "step": 22099
+ },
+ {
+ "epoch": 60.217983651226156,
+ "grad_norm": 3.052718162536621,
+ "learning_rate": 7.213826423050937e-06,
+ "loss": 0.1028,
+ "step": 22100
+ },
+ {
+ "epoch": 60.22070844686648,
+ "grad_norm": 3.518193006515503,
+ "learning_rate": 7.212978884119911e-06,
+ "loss": 0.1897,
+ "step": 22101
+ },
+ {
+ "epoch": 60.223433242506815,
+ "grad_norm": 2.903453826904297,
+ "learning_rate": 7.212131366894121e-06,
+ "loss": 0.0758,
+ "step": 22102
+ },
+ {
+ "epoch": 60.22615803814714,
+ "grad_norm": 4.256850242614746,
+ "learning_rate": 7.211283871380159e-06,
+ "loss": 0.2743,
+ "step": 22103
+ },
+ {
+ "epoch": 60.228882833787466,
+ "grad_norm": 3.5818071365356445,
+ "learning_rate": 7.21043639758463e-06,
+ "loss": 0.0663,
+ "step": 22104
+ },
+ {
+ "epoch": 60.23160762942779,
+ "grad_norm": 5.526252746582031,
+ "learning_rate": 7.2095889455141325e-06,
+ "loss": 0.1409,
+ "step": 22105
+ },
+ {
+ "epoch": 60.23433242506812,
+ "grad_norm": 4.099296569824219,
+ "learning_rate": 7.208741515175266e-06,
+ "loss": 0.118,
+ "step": 22106
+ },
+ {
+ "epoch": 60.237057220708444,
+ "grad_norm": 3.241194725036621,
+ "learning_rate": 7.207894106574631e-06,
+ "loss": 0.0593,
+ "step": 22107
+ },
+ {
+ "epoch": 60.23978201634878,
+ "grad_norm": 3.287278413772583,
+ "learning_rate": 7.207046719718827e-06,
+ "loss": 0.1654,
+ "step": 22108
+ },
+ {
+ "epoch": 60.2425068119891,
+ "grad_norm": 3.462165117263794,
+ "learning_rate": 7.206199354614453e-06,
+ "loss": 0.0911,
+ "step": 22109
+ },
+ {
+ "epoch": 60.24523160762943,
+ "grad_norm": 6.26113224029541,
+ "learning_rate": 7.205352011268107e-06,
+ "loss": 0.0879,
+ "step": 22110
+ },
+ {
+ "epoch": 60.247956403269754,
+ "grad_norm": 2.651669502258301,
+ "learning_rate": 7.204504689686392e-06,
+ "loss": 0.0418,
+ "step": 22111
+ },
+ {
+ "epoch": 60.25068119891008,
+ "grad_norm": 5.0154805183410645,
+ "learning_rate": 7.203657389875902e-06,
+ "loss": 0.0581,
+ "step": 22112
+ },
+ {
+ "epoch": 60.253405994550405,
+ "grad_norm": 4.798368453979492,
+ "learning_rate": 7.2028101118432414e-06,
+ "loss": 0.0945,
+ "step": 22113
+ },
+ {
+ "epoch": 60.25613079019074,
+ "grad_norm": 3.665332794189453,
+ "learning_rate": 7.201962855595004e-06,
+ "loss": 0.0734,
+ "step": 22114
+ },
+ {
+ "epoch": 60.258855585831064,
+ "grad_norm": 2.9860355854034424,
+ "learning_rate": 7.2011156211377904e-06,
+ "loss": 0.0616,
+ "step": 22115
+ },
+ {
+ "epoch": 60.26158038147139,
+ "grad_norm": 3.9235002994537354,
+ "learning_rate": 7.200268408478197e-06,
+ "loss": 0.0806,
+ "step": 22116
+ },
+ {
+ "epoch": 60.264305177111716,
+ "grad_norm": 5.279658317565918,
+ "learning_rate": 7.199421217622825e-06,
+ "loss": 0.0655,
+ "step": 22117
+ },
+ {
+ "epoch": 60.26702997275204,
+ "grad_norm": 3.8670432567596436,
+ "learning_rate": 7.198574048578268e-06,
+ "loss": 0.0725,
+ "step": 22118
+ },
+ {
+ "epoch": 60.26975476839237,
+ "grad_norm": 3.356159210205078,
+ "learning_rate": 7.1977269013511254e-06,
+ "loss": 0.2106,
+ "step": 22119
+ },
+ {
+ "epoch": 60.2724795640327,
+ "grad_norm": 3.390110731124878,
+ "learning_rate": 7.196879775947998e-06,
+ "loss": 0.1548,
+ "step": 22120
+ },
+ {
+ "epoch": 60.275204359673026,
+ "grad_norm": 5.2056074142456055,
+ "learning_rate": 7.196032672375479e-06,
+ "loss": 0.1162,
+ "step": 22121
+ },
+ {
+ "epoch": 60.27792915531335,
+ "grad_norm": 5.498204708099365,
+ "learning_rate": 7.19518559064017e-06,
+ "loss": 0.1115,
+ "step": 22122
+ },
+ {
+ "epoch": 60.28065395095368,
+ "grad_norm": 3.208754062652588,
+ "learning_rate": 7.194338530748663e-06,
+ "loss": 0.0471,
+ "step": 22123
+ },
+ {
+ "epoch": 60.283378746594,
+ "grad_norm": 3.2935304641723633,
+ "learning_rate": 7.1934914927075595e-06,
+ "loss": 0.0933,
+ "step": 22124
+ },
+ {
+ "epoch": 60.28610354223433,
+ "grad_norm": 2.8551547527313232,
+ "learning_rate": 7.1926444765234515e-06,
+ "loss": 0.0838,
+ "step": 22125
+ },
+ {
+ "epoch": 60.28882833787466,
+ "grad_norm": 3.8854739665985107,
+ "learning_rate": 7.19179748220294e-06,
+ "loss": 0.13,
+ "step": 22126
+ },
+ {
+ "epoch": 60.29155313351499,
+ "grad_norm": 3.63547945022583,
+ "learning_rate": 7.190950509752617e-06,
+ "loss": 0.2624,
+ "step": 22127
+ },
+ {
+ "epoch": 60.294277929155314,
+ "grad_norm": 3.5233612060546875,
+ "learning_rate": 7.190103559179085e-06,
+ "loss": 0.1408,
+ "step": 22128
+ },
+ {
+ "epoch": 60.29700272479564,
+ "grad_norm": 4.2197675704956055,
+ "learning_rate": 7.1892566304889315e-06,
+ "loss": 0.1865,
+ "step": 22129
+ },
+ {
+ "epoch": 60.299727520435965,
+ "grad_norm": 2.6265814304351807,
+ "learning_rate": 7.188409723688759e-06,
+ "loss": 0.0843,
+ "step": 22130
+ },
+ {
+ "epoch": 60.30245231607629,
+ "grad_norm": 3.485671043395996,
+ "learning_rate": 7.18756283878516e-06,
+ "loss": 0.0534,
+ "step": 22131
+ },
+ {
+ "epoch": 60.305177111716624,
+ "grad_norm": 3.559150218963623,
+ "learning_rate": 7.186715975784731e-06,
+ "loss": 0.1518,
+ "step": 22132
+ },
+ {
+ "epoch": 60.30790190735695,
+ "grad_norm": 3.630086660385132,
+ "learning_rate": 7.18586913469407e-06,
+ "loss": 0.0574,
+ "step": 22133
+ },
+ {
+ "epoch": 60.310626702997276,
+ "grad_norm": 4.573139667510986,
+ "learning_rate": 7.185022315519768e-06,
+ "loss": 0.1498,
+ "step": 22134
+ },
+ {
+ "epoch": 60.3133514986376,
+ "grad_norm": 3.360421895980835,
+ "learning_rate": 7.1841755182684215e-06,
+ "loss": 0.0763,
+ "step": 22135
+ },
+ {
+ "epoch": 60.31607629427793,
+ "grad_norm": 5.917803764343262,
+ "learning_rate": 7.183328742946623e-06,
+ "loss": 0.1306,
+ "step": 22136
+ },
+ {
+ "epoch": 60.31880108991825,
+ "grad_norm": 3.198390007019043,
+ "learning_rate": 7.182481989560971e-06,
+ "loss": 0.0556,
+ "step": 22137
+ },
+ {
+ "epoch": 60.321525885558586,
+ "grad_norm": 4.424189567565918,
+ "learning_rate": 7.18163525811806e-06,
+ "loss": 0.1054,
+ "step": 22138
+ },
+ {
+ "epoch": 60.32425068119891,
+ "grad_norm": 3.526097059249878,
+ "learning_rate": 7.180788548624482e-06,
+ "loss": 0.1707,
+ "step": 22139
+ },
+ {
+ "epoch": 60.32697547683924,
+ "grad_norm": 4.693763732910156,
+ "learning_rate": 7.179941861086834e-06,
+ "loss": 0.1795,
+ "step": 22140
+ },
+ {
+ "epoch": 60.32970027247956,
+ "grad_norm": 4.731674671173096,
+ "learning_rate": 7.179095195511707e-06,
+ "loss": 0.1277,
+ "step": 22141
+ },
+ {
+ "epoch": 60.33242506811989,
+ "grad_norm": 4.0111165046691895,
+ "learning_rate": 7.178248551905696e-06,
+ "loss": 0.09,
+ "step": 22142
+ },
+ {
+ "epoch": 60.335149863760215,
+ "grad_norm": 4.440929889678955,
+ "learning_rate": 7.177401930275394e-06,
+ "loss": 0.058,
+ "step": 22143
+ },
+ {
+ "epoch": 60.33787465940055,
+ "grad_norm": 3.536142349243164,
+ "learning_rate": 7.176555330627395e-06,
+ "loss": 0.117,
+ "step": 22144
+ },
+ {
+ "epoch": 60.34059945504087,
+ "grad_norm": 3.8005049228668213,
+ "learning_rate": 7.175708752968291e-06,
+ "loss": 0.2346,
+ "step": 22145
+ },
+ {
+ "epoch": 60.3433242506812,
+ "grad_norm": 4.1204657554626465,
+ "learning_rate": 7.174862197304679e-06,
+ "loss": 0.1546,
+ "step": 22146
+ },
+ {
+ "epoch": 60.346049046321525,
+ "grad_norm": 3.4227209091186523,
+ "learning_rate": 7.174015663643147e-06,
+ "loss": 0.0885,
+ "step": 22147
+ },
+ {
+ "epoch": 60.34877384196185,
+ "grad_norm": 3.576946496963501,
+ "learning_rate": 7.173169151990291e-06,
+ "loss": 0.0629,
+ "step": 22148
+ },
+ {
+ "epoch": 60.35149863760218,
+ "grad_norm": 4.644906520843506,
+ "learning_rate": 7.172322662352702e-06,
+ "loss": 0.0993,
+ "step": 22149
+ },
+ {
+ "epoch": 60.35422343324251,
+ "grad_norm": 5.073850631713867,
+ "learning_rate": 7.171476194736975e-06,
+ "loss": 0.1712,
+ "step": 22150
+ },
+ {
+ "epoch": 60.356948228882835,
+ "grad_norm": 2.734004259109497,
+ "learning_rate": 7.170629749149698e-06,
+ "loss": 0.0679,
+ "step": 22151
+ },
+ {
+ "epoch": 60.35967302452316,
+ "grad_norm": 3.039759635925293,
+ "learning_rate": 7.169783325597468e-06,
+ "loss": 0.0629,
+ "step": 22152
+ },
+ {
+ "epoch": 60.36239782016349,
+ "grad_norm": 6.838952541351318,
+ "learning_rate": 7.168936924086866e-06,
+ "loss": 0.1168,
+ "step": 22153
+ },
+ {
+ "epoch": 60.36512261580381,
+ "grad_norm": 3.255216121673584,
+ "learning_rate": 7.168090544624501e-06,
+ "loss": 0.1238,
+ "step": 22154
+ },
+ {
+ "epoch": 60.36784741144414,
+ "grad_norm": 2.8387744426727295,
+ "learning_rate": 7.167244187216953e-06,
+ "loss": 0.1882,
+ "step": 22155
+ },
+ {
+ "epoch": 60.37057220708447,
+ "grad_norm": 3.734137535095215,
+ "learning_rate": 7.166397851870816e-06,
+ "loss": 0.1078,
+ "step": 22156
+ },
+ {
+ "epoch": 60.3732970027248,
+ "grad_norm": 3.122952461242676,
+ "learning_rate": 7.165551538592682e-06,
+ "loss": 0.146,
+ "step": 22157
+ },
+ {
+ "epoch": 60.37602179836512,
+ "grad_norm": 4.570494651794434,
+ "learning_rate": 7.164705247389143e-06,
+ "loss": 0.1751,
+ "step": 22158
+ },
+ {
+ "epoch": 60.37874659400545,
+ "grad_norm": 3.697592258453369,
+ "learning_rate": 7.163858978266786e-06,
+ "loss": 0.0641,
+ "step": 22159
+ },
+ {
+ "epoch": 60.381471389645775,
+ "grad_norm": 4.88624382019043,
+ "learning_rate": 7.163012731232206e-06,
+ "loss": 0.0748,
+ "step": 22160
+ },
+ {
+ "epoch": 60.3841961852861,
+ "grad_norm": 4.610586643218994,
+ "learning_rate": 7.162166506291988e-06,
+ "loss": 0.1797,
+ "step": 22161
+ },
+ {
+ "epoch": 60.38692098092643,
+ "grad_norm": 3.272887706756592,
+ "learning_rate": 7.16132030345273e-06,
+ "loss": 0.1669,
+ "step": 22162
+ },
+ {
+ "epoch": 60.38964577656676,
+ "grad_norm": 3.7306933403015137,
+ "learning_rate": 7.160474122721015e-06,
+ "loss": 0.2393,
+ "step": 22163
+ },
+ {
+ "epoch": 60.392370572207085,
+ "grad_norm": 2.8864564895629883,
+ "learning_rate": 7.159627964103439e-06,
+ "loss": 0.0601,
+ "step": 22164
+ },
+ {
+ "epoch": 60.39509536784741,
+ "grad_norm": 4.231517791748047,
+ "learning_rate": 7.158781827606587e-06,
+ "loss": 0.1163,
+ "step": 22165
+ },
+ {
+ "epoch": 60.39782016348774,
+ "grad_norm": 3.783748149871826,
+ "learning_rate": 7.157935713237052e-06,
+ "loss": 0.1739,
+ "step": 22166
+ },
+ {
+ "epoch": 60.40054495912806,
+ "grad_norm": 3.2768189907073975,
+ "learning_rate": 7.15708962100142e-06,
+ "loss": 0.0844,
+ "step": 22167
+ },
+ {
+ "epoch": 60.403269754768395,
+ "grad_norm": 4.838784694671631,
+ "learning_rate": 7.156243550906285e-06,
+ "loss": 0.1401,
+ "step": 22168
+ },
+ {
+ "epoch": 60.40599455040872,
+ "grad_norm": 3.03964900970459,
+ "learning_rate": 7.155397502958231e-06,
+ "loss": 0.0579,
+ "step": 22169
+ },
+ {
+ "epoch": 60.40871934604905,
+ "grad_norm": 2.7429299354553223,
+ "learning_rate": 7.154551477163848e-06,
+ "loss": 0.0578,
+ "step": 22170
+ },
+ {
+ "epoch": 60.41144414168937,
+ "grad_norm": 5.089840412139893,
+ "learning_rate": 7.153705473529731e-06,
+ "loss": 0.1068,
+ "step": 22171
+ },
+ {
+ "epoch": 60.4141689373297,
+ "grad_norm": 3.6841890811920166,
+ "learning_rate": 7.152859492062462e-06,
+ "loss": 0.0485,
+ "step": 22172
+ },
+ {
+ "epoch": 60.416893732970024,
+ "grad_norm": 3.1107046604156494,
+ "learning_rate": 7.152013532768633e-06,
+ "loss": 0.1558,
+ "step": 22173
+ },
+ {
+ "epoch": 60.41961852861036,
+ "grad_norm": 2.3434879779815674,
+ "learning_rate": 7.15116759565483e-06,
+ "loss": 0.0388,
+ "step": 22174
+ },
+ {
+ "epoch": 60.42234332425068,
+ "grad_norm": 4.760533332824707,
+ "learning_rate": 7.150321680727641e-06,
+ "loss": 0.152,
+ "step": 22175
+ },
+ {
+ "epoch": 60.42506811989101,
+ "grad_norm": 6.486580848693848,
+ "learning_rate": 7.149475787993658e-06,
+ "loss": 0.1653,
+ "step": 22176
+ },
+ {
+ "epoch": 60.427792915531334,
+ "grad_norm": 3.468561887741089,
+ "learning_rate": 7.148629917459464e-06,
+ "loss": 0.1182,
+ "step": 22177
+ },
+ {
+ "epoch": 60.43051771117166,
+ "grad_norm": 4.1860480308532715,
+ "learning_rate": 7.147784069131649e-06,
+ "loss": 0.2068,
+ "step": 22178
+ },
+ {
+ "epoch": 60.433242506811986,
+ "grad_norm": 8.364831924438477,
+ "learning_rate": 7.146938243016799e-06,
+ "loss": 0.1613,
+ "step": 22179
+ },
+ {
+ "epoch": 60.43596730245232,
+ "grad_norm": 3.9601993560791016,
+ "learning_rate": 7.146092439121504e-06,
+ "loss": 0.0836,
+ "step": 22180
+ },
+ {
+ "epoch": 60.438692098092645,
+ "grad_norm": 3.8030402660369873,
+ "learning_rate": 7.145246657452347e-06,
+ "loss": 0.0639,
+ "step": 22181
+ },
+ {
+ "epoch": 60.44141689373297,
+ "grad_norm": 3.136075258255005,
+ "learning_rate": 7.144400898015919e-06,
+ "loss": 0.0527,
+ "step": 22182
+ },
+ {
+ "epoch": 60.444141689373296,
+ "grad_norm": 3.5900537967681885,
+ "learning_rate": 7.1435551608188035e-06,
+ "loss": 0.1179,
+ "step": 22183
+ },
+ {
+ "epoch": 60.44686648501362,
+ "grad_norm": 3.3428232669830322,
+ "learning_rate": 7.14270944586759e-06,
+ "loss": 0.1567,
+ "step": 22184
+ },
+ {
+ "epoch": 60.44959128065395,
+ "grad_norm": 3.301100492477417,
+ "learning_rate": 7.141863753168861e-06,
+ "loss": 0.1342,
+ "step": 22185
+ },
+ {
+ "epoch": 60.45231607629428,
+ "grad_norm": 2.8534092903137207,
+ "learning_rate": 7.141018082729208e-06,
+ "loss": 0.0732,
+ "step": 22186
+ },
+ {
+ "epoch": 60.45504087193461,
+ "grad_norm": 2.955643892288208,
+ "learning_rate": 7.14017243455521e-06,
+ "loss": 0.0669,
+ "step": 22187
+ },
+ {
+ "epoch": 60.45776566757493,
+ "grad_norm": 3.058328628540039,
+ "learning_rate": 7.13932680865346e-06,
+ "loss": 0.0651,
+ "step": 22188
+ },
+ {
+ "epoch": 60.46049046321526,
+ "grad_norm": 3.639937162399292,
+ "learning_rate": 7.1384812050305404e-06,
+ "loss": 0.1457,
+ "step": 22189
+ },
+ {
+ "epoch": 60.463215258855584,
+ "grad_norm": 3.513044595718384,
+ "learning_rate": 7.137635623693036e-06,
+ "loss": 0.1729,
+ "step": 22190
+ },
+ {
+ "epoch": 60.46594005449591,
+ "grad_norm": 5.378262042999268,
+ "learning_rate": 7.136790064647536e-06,
+ "loss": 0.1175,
+ "step": 22191
+ },
+ {
+ "epoch": 60.46866485013624,
+ "grad_norm": 3.233370304107666,
+ "learning_rate": 7.1359445279006205e-06,
+ "loss": 0.0607,
+ "step": 22192
+ },
+ {
+ "epoch": 60.47138964577657,
+ "grad_norm": 4.573462963104248,
+ "learning_rate": 7.135099013458879e-06,
+ "loss": 0.1568,
+ "step": 22193
+ },
+ {
+ "epoch": 60.474114441416894,
+ "grad_norm": 6.657225131988525,
+ "learning_rate": 7.134253521328891e-06,
+ "loss": 0.109,
+ "step": 22194
+ },
+ {
+ "epoch": 60.47683923705722,
+ "grad_norm": 4.017292022705078,
+ "learning_rate": 7.133408051517247e-06,
+ "loss": 0.0874,
+ "step": 22195
+ },
+ {
+ "epoch": 60.479564032697546,
+ "grad_norm": 4.407981872558594,
+ "learning_rate": 7.1325626040305275e-06,
+ "loss": 0.1247,
+ "step": 22196
+ },
+ {
+ "epoch": 60.48228882833787,
+ "grad_norm": 2.8455512523651123,
+ "learning_rate": 7.131717178875317e-06,
+ "loss": 0.056,
+ "step": 22197
+ },
+ {
+ "epoch": 60.485013623978205,
+ "grad_norm": 4.186744689941406,
+ "learning_rate": 7.130871776058204e-06,
+ "loss": 0.0763,
+ "step": 22198
+ },
+ {
+ "epoch": 60.48773841961853,
+ "grad_norm": 3.396908760070801,
+ "learning_rate": 7.130026395585766e-06,
+ "loss": 0.0671,
+ "step": 22199
+ },
+ {
+ "epoch": 60.490463215258856,
+ "grad_norm": 3.2078208923339844,
+ "learning_rate": 7.129181037464593e-06,
+ "loss": 0.0563,
+ "step": 22200
+ },
+ {
+ "epoch": 60.49318801089918,
+ "grad_norm": 3.7207226753234863,
+ "learning_rate": 7.1283357017012635e-06,
+ "loss": 0.1127,
+ "step": 22201
+ },
+ {
+ "epoch": 60.49591280653951,
+ "grad_norm": 3.3196473121643066,
+ "learning_rate": 7.127490388302365e-06,
+ "loss": 0.1172,
+ "step": 22202
+ },
+ {
+ "epoch": 60.49863760217983,
+ "grad_norm": 3.7749881744384766,
+ "learning_rate": 7.126645097274477e-06,
+ "loss": 0.0881,
+ "step": 22203
+ },
+ {
+ "epoch": 60.50136239782017,
+ "grad_norm": 5.279852390289307,
+ "learning_rate": 7.125799828624187e-06,
+ "loss": 0.0739,
+ "step": 22204
+ },
+ {
+ "epoch": 60.50408719346049,
+ "grad_norm": 3.02209210395813,
+ "learning_rate": 7.12495458235807e-06,
+ "loss": 0.1081,
+ "step": 22205
+ },
+ {
+ "epoch": 60.50681198910082,
+ "grad_norm": 2.5446105003356934,
+ "learning_rate": 7.1241093584827185e-06,
+ "loss": 0.0489,
+ "step": 22206
+ },
+ {
+ "epoch": 60.509536784741144,
+ "grad_norm": 6.3202056884765625,
+ "learning_rate": 7.12326415700471e-06,
+ "loss": 0.0687,
+ "step": 22207
+ },
+ {
+ "epoch": 60.51226158038147,
+ "grad_norm": 4.158862113952637,
+ "learning_rate": 7.122418977930628e-06,
+ "loss": 0.1117,
+ "step": 22208
+ },
+ {
+ "epoch": 60.514986376021795,
+ "grad_norm": 3.6309733390808105,
+ "learning_rate": 7.121573821267055e-06,
+ "loss": 0.1504,
+ "step": 22209
+ },
+ {
+ "epoch": 60.51771117166213,
+ "grad_norm": 8.954504013061523,
+ "learning_rate": 7.120728687020571e-06,
+ "loss": 0.1151,
+ "step": 22210
+ },
+ {
+ "epoch": 60.520435967302454,
+ "grad_norm": 2.6598422527313232,
+ "learning_rate": 7.1198835751977615e-06,
+ "loss": 0.1323,
+ "step": 22211
+ },
+ {
+ "epoch": 60.52316076294278,
+ "grad_norm": 3.196981906890869,
+ "learning_rate": 7.119038485805203e-06,
+ "loss": 0.1082,
+ "step": 22212
+ },
+ {
+ "epoch": 60.525885558583106,
+ "grad_norm": 4.38768196105957,
+ "learning_rate": 7.118193418849483e-06,
+ "loss": 0.0946,
+ "step": 22213
+ },
+ {
+ "epoch": 60.52861035422343,
+ "grad_norm": 3.1019296646118164,
+ "learning_rate": 7.1173483743371775e-06,
+ "loss": 0.0557,
+ "step": 22214
+ },
+ {
+ "epoch": 60.53133514986376,
+ "grad_norm": 3.9349355697631836,
+ "learning_rate": 7.116503352274873e-06,
+ "loss": 0.0742,
+ "step": 22215
+ },
+ {
+ "epoch": 60.53405994550409,
+ "grad_norm": 3.114135503768921,
+ "learning_rate": 7.115658352669143e-06,
+ "loss": 0.0707,
+ "step": 22216
+ },
+ {
+ "epoch": 60.536784741144416,
+ "grad_norm": 2.8861827850341797,
+ "learning_rate": 7.114813375526577e-06,
+ "loss": 0.0675,
+ "step": 22217
+ },
+ {
+ "epoch": 60.53950953678474,
+ "grad_norm": 3.6690704822540283,
+ "learning_rate": 7.113968420853749e-06,
+ "loss": 0.07,
+ "step": 22218
+ },
+ {
+ "epoch": 60.54223433242507,
+ "grad_norm": 3.5133728981018066,
+ "learning_rate": 7.113123488657243e-06,
+ "loss": 0.216,
+ "step": 22219
+ },
+ {
+ "epoch": 60.54495912806539,
+ "grad_norm": 3.4835526943206787,
+ "learning_rate": 7.11227857894364e-06,
+ "loss": 0.0794,
+ "step": 22220
+ },
+ {
+ "epoch": 60.54768392370572,
+ "grad_norm": 3.0973880290985107,
+ "learning_rate": 7.111433691719516e-06,
+ "loss": 0.0509,
+ "step": 22221
+ },
+ {
+ "epoch": 60.55040871934605,
+ "grad_norm": 3.050398826599121,
+ "learning_rate": 7.110588826991451e-06,
+ "loss": 0.0558,
+ "step": 22222
+ },
+ {
+ "epoch": 60.55313351498638,
+ "grad_norm": 3.540860414505005,
+ "learning_rate": 7.109743984766032e-06,
+ "loss": 0.134,
+ "step": 22223
+ },
+ {
+ "epoch": 60.555858310626704,
+ "grad_norm": 3.0423455238342285,
+ "learning_rate": 7.108899165049832e-06,
+ "loss": 0.1101,
+ "step": 22224
+ },
+ {
+ "epoch": 60.55858310626703,
+ "grad_norm": 2.595421314239502,
+ "learning_rate": 7.108054367849434e-06,
+ "loss": 0.1572,
+ "step": 22225
+ },
+ {
+ "epoch": 60.561307901907355,
+ "grad_norm": 3.4921460151672363,
+ "learning_rate": 7.107209593171414e-06,
+ "loss": 0.0852,
+ "step": 22226
+ },
+ {
+ "epoch": 60.56403269754768,
+ "grad_norm": 2.6923108100891113,
+ "learning_rate": 7.106364841022353e-06,
+ "loss": 0.1585,
+ "step": 22227
+ },
+ {
+ "epoch": 60.566757493188014,
+ "grad_norm": 3.6124486923217773,
+ "learning_rate": 7.105520111408828e-06,
+ "loss": 0.0763,
+ "step": 22228
+ },
+ {
+ "epoch": 60.56948228882834,
+ "grad_norm": 3.460284471511841,
+ "learning_rate": 7.104675404337422e-06,
+ "loss": 0.0548,
+ "step": 22229
+ },
+ {
+ "epoch": 60.572207084468666,
+ "grad_norm": 3.73207950592041,
+ "learning_rate": 7.103830719814708e-06,
+ "loss": 0.1149,
+ "step": 22230
+ },
+ {
+ "epoch": 60.57493188010899,
+ "grad_norm": 3.1647777557373047,
+ "learning_rate": 7.102986057847269e-06,
+ "loss": 0.0626,
+ "step": 22231
+ },
+ {
+ "epoch": 60.57765667574932,
+ "grad_norm": 3.840442419052124,
+ "learning_rate": 7.102141418441681e-06,
+ "loss": 0.1868,
+ "step": 22232
+ },
+ {
+ "epoch": 60.58038147138964,
+ "grad_norm": 2.726717710494995,
+ "learning_rate": 7.101296801604525e-06,
+ "loss": 0.1371,
+ "step": 22233
+ },
+ {
+ "epoch": 60.583106267029976,
+ "grad_norm": 4.018718242645264,
+ "learning_rate": 7.100452207342372e-06,
+ "loss": 0.0779,
+ "step": 22234
+ },
+ {
+ "epoch": 60.5858310626703,
+ "grad_norm": 3.435814619064331,
+ "learning_rate": 7.099607635661806e-06,
+ "loss": 0.0674,
+ "step": 22235
+ },
+ {
+ "epoch": 60.58855585831063,
+ "grad_norm": 5.884005546569824,
+ "learning_rate": 7.0987630865694e-06,
+ "loss": 0.1441,
+ "step": 22236
+ },
+ {
+ "epoch": 60.59128065395095,
+ "grad_norm": 4.433471202850342,
+ "learning_rate": 7.097918560071737e-06,
+ "loss": 0.1748,
+ "step": 22237
+ },
+ {
+ "epoch": 60.59400544959128,
+ "grad_norm": 1.9378094673156738,
+ "learning_rate": 7.0970740561753884e-06,
+ "loss": 0.1367,
+ "step": 22238
+ },
+ {
+ "epoch": 60.596730245231605,
+ "grad_norm": 2.8464200496673584,
+ "learning_rate": 7.0962295748869314e-06,
+ "loss": 0.2006,
+ "step": 22239
+ },
+ {
+ "epoch": 60.59945504087194,
+ "grad_norm": 3.6421751976013184,
+ "learning_rate": 7.095385116212947e-06,
+ "loss": 0.1616,
+ "step": 22240
+ },
+ {
+ "epoch": 60.60217983651226,
+ "grad_norm": 4.609543800354004,
+ "learning_rate": 7.094540680160013e-06,
+ "loss": 0.1867,
+ "step": 22241
+ },
+ {
+ "epoch": 60.60490463215259,
+ "grad_norm": 4.839238166809082,
+ "learning_rate": 7.0936962667347e-06,
+ "loss": 0.0766,
+ "step": 22242
+ },
+ {
+ "epoch": 60.607629427792915,
+ "grad_norm": 4.464300155639648,
+ "learning_rate": 7.092851875943587e-06,
+ "loss": 0.1777,
+ "step": 22243
+ },
+ {
+ "epoch": 60.61035422343324,
+ "grad_norm": 4.258381366729736,
+ "learning_rate": 7.09200750779325e-06,
+ "loss": 0.0482,
+ "step": 22244
+ },
+ {
+ "epoch": 60.61307901907357,
+ "grad_norm": 3.4603633880615234,
+ "learning_rate": 7.091163162290266e-06,
+ "loss": 0.0709,
+ "step": 22245
+ },
+ {
+ "epoch": 60.6158038147139,
+ "grad_norm": 2.9299049377441406,
+ "learning_rate": 7.090318839441209e-06,
+ "loss": 0.117,
+ "step": 22246
+ },
+ {
+ "epoch": 60.618528610354225,
+ "grad_norm": 3.896228790283203,
+ "learning_rate": 7.089474539252656e-06,
+ "loss": 0.1283,
+ "step": 22247
+ },
+ {
+ "epoch": 60.62125340599455,
+ "grad_norm": 3.1333820819854736,
+ "learning_rate": 7.088630261731181e-06,
+ "loss": 0.1385,
+ "step": 22248
+ },
+ {
+ "epoch": 60.62397820163488,
+ "grad_norm": 3.3098950386047363,
+ "learning_rate": 7.087786006883362e-06,
+ "loss": 0.1398,
+ "step": 22249
+ },
+ {
+ "epoch": 60.6267029972752,
+ "grad_norm": 3.3676881790161133,
+ "learning_rate": 7.086941774715767e-06,
+ "loss": 0.097,
+ "step": 22250
+ },
+ {
+ "epoch": 60.62942779291553,
+ "grad_norm": 3.3836073875427246,
+ "learning_rate": 7.08609756523498e-06,
+ "loss": 0.0805,
+ "step": 22251
+ },
+ {
+ "epoch": 60.63215258855586,
+ "grad_norm": 4.441920280456543,
+ "learning_rate": 7.0852533784475695e-06,
+ "loss": 0.1654,
+ "step": 22252
+ },
+ {
+ "epoch": 60.63487738419619,
+ "grad_norm": 3.9132440090179443,
+ "learning_rate": 7.084409214360113e-06,
+ "loss": 0.0749,
+ "step": 22253
+ },
+ {
+ "epoch": 60.63760217983651,
+ "grad_norm": 3.0047171115875244,
+ "learning_rate": 7.083565072979182e-06,
+ "loss": 0.0818,
+ "step": 22254
+ },
+ {
+ "epoch": 60.64032697547684,
+ "grad_norm": 3.052492141723633,
+ "learning_rate": 7.082720954311354e-06,
+ "loss": 0.0597,
+ "step": 22255
+ },
+ {
+ "epoch": 60.643051771117165,
+ "grad_norm": 3.1172616481781006,
+ "learning_rate": 7.081876858363197e-06,
+ "loss": 0.0921,
+ "step": 22256
+ },
+ {
+ "epoch": 60.64577656675749,
+ "grad_norm": 2.963144302368164,
+ "learning_rate": 7.081032785141292e-06,
+ "loss": 0.2355,
+ "step": 22257
+ },
+ {
+ "epoch": 60.64850136239782,
+ "grad_norm": 3.6875598430633545,
+ "learning_rate": 7.0801887346522116e-06,
+ "loss": 0.0915,
+ "step": 22258
+ },
+ {
+ "epoch": 60.65122615803815,
+ "grad_norm": 2.982158899307251,
+ "learning_rate": 7.079344706902525e-06,
+ "loss": 0.0556,
+ "step": 22259
+ },
+ {
+ "epoch": 60.653950953678475,
+ "grad_norm": 3.083127021789551,
+ "learning_rate": 7.0785007018988095e-06,
+ "loss": 0.0559,
+ "step": 22260
+ },
+ {
+ "epoch": 60.6566757493188,
+ "grad_norm": 2.750852346420288,
+ "learning_rate": 7.077656719647636e-06,
+ "loss": 0.1345,
+ "step": 22261
+ },
+ {
+ "epoch": 60.65940054495913,
+ "grad_norm": 3.7517549991607666,
+ "learning_rate": 7.076812760155576e-06,
+ "loss": 0.0534,
+ "step": 22262
+ },
+ {
+ "epoch": 60.66212534059945,
+ "grad_norm": 4.5389556884765625,
+ "learning_rate": 7.075968823429207e-06,
+ "loss": 0.1213,
+ "step": 22263
+ },
+ {
+ "epoch": 60.664850136239785,
+ "grad_norm": 3.5940957069396973,
+ "learning_rate": 7.075124909475097e-06,
+ "loss": 0.049,
+ "step": 22264
+ },
+ {
+ "epoch": 60.66757493188011,
+ "grad_norm": 2.6097493171691895,
+ "learning_rate": 7.074281018299822e-06,
+ "loss": 0.092,
+ "step": 22265
+ },
+ {
+ "epoch": 60.67029972752044,
+ "grad_norm": 4.9819655418396,
+ "learning_rate": 7.07343714990995e-06,
+ "loss": 0.0739,
+ "step": 22266
+ },
+ {
+ "epoch": 60.67302452316076,
+ "grad_norm": 3.7648372650146484,
+ "learning_rate": 7.072593304312057e-06,
+ "loss": 0.0592,
+ "step": 22267
+ },
+ {
+ "epoch": 60.67574931880109,
+ "grad_norm": 2.8173046112060547,
+ "learning_rate": 7.071749481512712e-06,
+ "loss": 0.083,
+ "step": 22268
+ },
+ {
+ "epoch": 60.678474114441414,
+ "grad_norm": 4.30924129486084,
+ "learning_rate": 7.070905681518489e-06,
+ "loss": 0.2088,
+ "step": 22269
+ },
+ {
+ "epoch": 60.68119891008175,
+ "grad_norm": 3.3528645038604736,
+ "learning_rate": 7.070061904335956e-06,
+ "loss": 0.0917,
+ "step": 22270
+ },
+ {
+ "epoch": 60.68392370572207,
+ "grad_norm": 3.794343948364258,
+ "learning_rate": 7.0692181499716905e-06,
+ "loss": 0.0905,
+ "step": 22271
+ },
+ {
+ "epoch": 60.6866485013624,
+ "grad_norm": 3.7777822017669678,
+ "learning_rate": 7.0683744184322554e-06,
+ "loss": 0.0592,
+ "step": 22272
+ },
+ {
+ "epoch": 60.689373297002724,
+ "grad_norm": 3.484302043914795,
+ "learning_rate": 7.067530709724226e-06,
+ "loss": 0.2144,
+ "step": 22273
+ },
+ {
+ "epoch": 60.69209809264305,
+ "grad_norm": 3.621645927429199,
+ "learning_rate": 7.066687023854175e-06,
+ "loss": 0.0953,
+ "step": 22274
+ },
+ {
+ "epoch": 60.694822888283376,
+ "grad_norm": 4.2324018478393555,
+ "learning_rate": 7.06584336082867e-06,
+ "loss": 0.0622,
+ "step": 22275
+ },
+ {
+ "epoch": 60.69754768392371,
+ "grad_norm": 3.1080031394958496,
+ "learning_rate": 7.0649997206542855e-06,
+ "loss": 0.083,
+ "step": 22276
+ },
+ {
+ "epoch": 60.700272479564035,
+ "grad_norm": 17.693635940551758,
+ "learning_rate": 7.064156103337585e-06,
+ "loss": 0.1117,
+ "step": 22277
+ },
+ {
+ "epoch": 60.70299727520436,
+ "grad_norm": 3.959184169769287,
+ "learning_rate": 7.063312508885145e-06,
+ "loss": 0.1859,
+ "step": 22278
+ },
+ {
+ "epoch": 60.705722070844686,
+ "grad_norm": 3.653937339782715,
+ "learning_rate": 7.06246893730353e-06,
+ "loss": 0.1018,
+ "step": 22279
+ },
+ {
+ "epoch": 60.70844686648501,
+ "grad_norm": 4.431345462799072,
+ "learning_rate": 7.061625388599316e-06,
+ "loss": 0.134,
+ "step": 22280
+ },
+ {
+ "epoch": 60.71117166212534,
+ "grad_norm": 2.741877317428589,
+ "learning_rate": 7.060781862779067e-06,
+ "loss": 0.0766,
+ "step": 22281
+ },
+ {
+ "epoch": 60.71389645776567,
+ "grad_norm": 3.2073557376861572,
+ "learning_rate": 7.0599383598493545e-06,
+ "loss": 0.0572,
+ "step": 22282
+ },
+ {
+ "epoch": 60.716621253406,
+ "grad_norm": 4.956356048583984,
+ "learning_rate": 7.059094879816746e-06,
+ "loss": 0.1087,
+ "step": 22283
+ },
+ {
+ "epoch": 60.71934604904632,
+ "grad_norm": 3.5810546875,
+ "learning_rate": 7.058251422687812e-06,
+ "loss": 0.1391,
+ "step": 22284
+ },
+ {
+ "epoch": 60.72207084468665,
+ "grad_norm": 2.8752553462982178,
+ "learning_rate": 7.057407988469123e-06,
+ "loss": 0.1421,
+ "step": 22285
+ },
+ {
+ "epoch": 60.724795640326974,
+ "grad_norm": 4.71677303314209,
+ "learning_rate": 7.056564577167244e-06,
+ "loss": 0.1228,
+ "step": 22286
+ },
+ {
+ "epoch": 60.7275204359673,
+ "grad_norm": 3.7873075008392334,
+ "learning_rate": 7.055721188788749e-06,
+ "loss": 0.0911,
+ "step": 22287
+ },
+ {
+ "epoch": 60.73024523160763,
+ "grad_norm": 4.778517723083496,
+ "learning_rate": 7.054877823340199e-06,
+ "loss": 0.2246,
+ "step": 22288
+ },
+ {
+ "epoch": 60.73297002724796,
+ "grad_norm": 5.951353549957275,
+ "learning_rate": 7.054034480828167e-06,
+ "loss": 0.12,
+ "step": 22289
+ },
+ {
+ "epoch": 60.735694822888284,
+ "grad_norm": 4.711767196655273,
+ "learning_rate": 7.0531911612592184e-06,
+ "loss": 0.1744,
+ "step": 22290
+ },
+ {
+ "epoch": 60.73841961852861,
+ "grad_norm": 3.759284496307373,
+ "learning_rate": 7.052347864639921e-06,
+ "loss": 0.0527,
+ "step": 22291
+ },
+ {
+ "epoch": 60.741144414168936,
+ "grad_norm": 4.224436283111572,
+ "learning_rate": 7.051504590976847e-06,
+ "loss": 0.0721,
+ "step": 22292
+ },
+ {
+ "epoch": 60.74386920980926,
+ "grad_norm": 3.3867928981781006,
+ "learning_rate": 7.050661340276558e-06,
+ "loss": 0.0701,
+ "step": 22293
+ },
+ {
+ "epoch": 60.746594005449595,
+ "grad_norm": 3.020172119140625,
+ "learning_rate": 7.049818112545626e-06,
+ "loss": 0.0398,
+ "step": 22294
+ },
+ {
+ "epoch": 60.74931880108992,
+ "grad_norm": 4.343257427215576,
+ "learning_rate": 7.048974907790613e-06,
+ "loss": 0.1534,
+ "step": 22295
+ },
+ {
+ "epoch": 60.752043596730246,
+ "grad_norm": 2.9345269203186035,
+ "learning_rate": 7.0481317260180905e-06,
+ "loss": 0.0415,
+ "step": 22296
+ },
+ {
+ "epoch": 60.75476839237057,
+ "grad_norm": 3.8636176586151123,
+ "learning_rate": 7.047288567234621e-06,
+ "loss": 0.1054,
+ "step": 22297
+ },
+ {
+ "epoch": 60.7574931880109,
+ "grad_norm": 4.413434028625488,
+ "learning_rate": 7.046445431446775e-06,
+ "loss": 0.0801,
+ "step": 22298
+ },
+ {
+ "epoch": 60.76021798365122,
+ "grad_norm": 10.045730590820312,
+ "learning_rate": 7.045602318661117e-06,
+ "loss": 0.1175,
+ "step": 22299
+ },
+ {
+ "epoch": 60.762942779291556,
+ "grad_norm": 4.641239643096924,
+ "learning_rate": 7.044759228884212e-06,
+ "loss": 0.1289,
+ "step": 22300
+ },
+ {
+ "epoch": 60.76566757493188,
+ "grad_norm": 3.2659778594970703,
+ "learning_rate": 7.043916162122628e-06,
+ "loss": 0.0746,
+ "step": 22301
+ },
+ {
+ "epoch": 60.76839237057221,
+ "grad_norm": 3.401627540588379,
+ "learning_rate": 7.0430731183829305e-06,
+ "loss": 0.1623,
+ "step": 22302
+ },
+ {
+ "epoch": 60.771117166212534,
+ "grad_norm": 4.0639190673828125,
+ "learning_rate": 7.042230097671681e-06,
+ "loss": 0.1029,
+ "step": 22303
+ },
+ {
+ "epoch": 60.77384196185286,
+ "grad_norm": 4.258162498474121,
+ "learning_rate": 7.0413870999954525e-06,
+ "loss": 0.0601,
+ "step": 22304
+ },
+ {
+ "epoch": 60.776566757493185,
+ "grad_norm": 3.7025859355926514,
+ "learning_rate": 7.040544125360802e-06,
+ "loss": 0.0993,
+ "step": 22305
+ },
+ {
+ "epoch": 60.77929155313352,
+ "grad_norm": 2.8596882820129395,
+ "learning_rate": 7.0397011737743e-06,
+ "loss": 0.0642,
+ "step": 22306
+ },
+ {
+ "epoch": 60.782016348773844,
+ "grad_norm": 4.452273845672607,
+ "learning_rate": 7.038858245242513e-06,
+ "loss": 0.1547,
+ "step": 22307
+ },
+ {
+ "epoch": 60.78474114441417,
+ "grad_norm": 4.354523658752441,
+ "learning_rate": 7.038015339771996e-06,
+ "loss": 0.1604,
+ "step": 22308
+ },
+ {
+ "epoch": 60.787465940054496,
+ "grad_norm": 3.5376999378204346,
+ "learning_rate": 7.037172457369324e-06,
+ "loss": 0.06,
+ "step": 22309
+ },
+ {
+ "epoch": 60.79019073569482,
+ "grad_norm": 3.7299249172210693,
+ "learning_rate": 7.036329598041058e-06,
+ "loss": 0.0904,
+ "step": 22310
+ },
+ {
+ "epoch": 60.79291553133515,
+ "grad_norm": 4.104896545410156,
+ "learning_rate": 7.035486761793762e-06,
+ "loss": 0.1193,
+ "step": 22311
+ },
+ {
+ "epoch": 60.79564032697548,
+ "grad_norm": 4.079039096832275,
+ "learning_rate": 7.034643948634e-06,
+ "loss": 0.0749,
+ "step": 22312
+ },
+ {
+ "epoch": 60.798365122615806,
+ "grad_norm": 3.414623975753784,
+ "learning_rate": 7.033801158568334e-06,
+ "loss": 0.0761,
+ "step": 22313
+ },
+ {
+ "epoch": 60.80108991825613,
+ "grad_norm": 2.737549066543579,
+ "learning_rate": 7.03295839160333e-06,
+ "loss": 0.1327,
+ "step": 22314
+ },
+ {
+ "epoch": 60.80381471389646,
+ "grad_norm": 3.315855026245117,
+ "learning_rate": 7.03211564774555e-06,
+ "loss": 0.1702,
+ "step": 22315
+ },
+ {
+ "epoch": 60.80653950953678,
+ "grad_norm": 3.430767059326172,
+ "learning_rate": 7.03127292700156e-06,
+ "loss": 0.1141,
+ "step": 22316
+ },
+ {
+ "epoch": 60.80926430517711,
+ "grad_norm": 3.510793924331665,
+ "learning_rate": 7.030430229377918e-06,
+ "loss": 0.0642,
+ "step": 22317
+ },
+ {
+ "epoch": 60.81198910081744,
+ "grad_norm": 3.1327335834503174,
+ "learning_rate": 7.029587554881192e-06,
+ "loss": 0.0691,
+ "step": 22318
+ },
+ {
+ "epoch": 60.81471389645777,
+ "grad_norm": 2.9371345043182373,
+ "learning_rate": 7.028744903517941e-06,
+ "loss": 0.118,
+ "step": 22319
+ },
+ {
+ "epoch": 60.817438692098094,
+ "grad_norm": 4.144138813018799,
+ "learning_rate": 7.027902275294731e-06,
+ "loss": 0.1529,
+ "step": 22320
+ },
+ {
+ "epoch": 60.82016348773842,
+ "grad_norm": 3.3764593601226807,
+ "learning_rate": 7.027059670218119e-06,
+ "loss": 0.185,
+ "step": 22321
+ },
+ {
+ "epoch": 60.822888283378745,
+ "grad_norm": 3.683173894882202,
+ "learning_rate": 7.026217088294674e-06,
+ "loss": 0.0987,
+ "step": 22322
+ },
+ {
+ "epoch": 60.82561307901907,
+ "grad_norm": 3.99582576751709,
+ "learning_rate": 7.025374529530952e-06,
+ "loss": 0.1898,
+ "step": 22323
+ },
+ {
+ "epoch": 60.828337874659404,
+ "grad_norm": 4.927083969116211,
+ "learning_rate": 7.024531993933521e-06,
+ "loss": 0.1131,
+ "step": 22324
+ },
+ {
+ "epoch": 60.83106267029973,
+ "grad_norm": 6.777295112609863,
+ "learning_rate": 7.023689481508931e-06,
+ "loss": 0.1139,
+ "step": 22325
+ },
+ {
+ "epoch": 60.833787465940055,
+ "grad_norm": 4.779987812042236,
+ "learning_rate": 7.0228469922637586e-06,
+ "loss": 0.0963,
+ "step": 22326
+ },
+ {
+ "epoch": 60.83651226158038,
+ "grad_norm": 3.708977460861206,
+ "learning_rate": 7.0220045262045555e-06,
+ "loss": 0.0673,
+ "step": 22327
+ },
+ {
+ "epoch": 60.83923705722071,
+ "grad_norm": 4.627310752868652,
+ "learning_rate": 7.021162083337888e-06,
+ "loss": 0.255,
+ "step": 22328
+ },
+ {
+ "epoch": 60.84196185286103,
+ "grad_norm": 3.8745877742767334,
+ "learning_rate": 7.020319663670312e-06,
+ "loss": 0.1111,
+ "step": 22329
+ },
+ {
+ "epoch": 60.844686648501366,
+ "grad_norm": 4.898205757141113,
+ "learning_rate": 7.019477267208392e-06,
+ "loss": 0.1139,
+ "step": 22330
+ },
+ {
+ "epoch": 60.84741144414169,
+ "grad_norm": 4.8633952140808105,
+ "learning_rate": 7.018634893958686e-06,
+ "loss": 0.254,
+ "step": 22331
+ },
+ {
+ "epoch": 60.85013623978202,
+ "grad_norm": 3.453780174255371,
+ "learning_rate": 7.0177925439277574e-06,
+ "loss": 0.0698,
+ "step": 22332
+ },
+ {
+ "epoch": 60.85286103542234,
+ "grad_norm": 3.9543163776397705,
+ "learning_rate": 7.016950217122162e-06,
+ "loss": 0.1174,
+ "step": 22333
+ },
+ {
+ "epoch": 60.85558583106267,
+ "grad_norm": 4.60977029800415,
+ "learning_rate": 7.016107913548465e-06,
+ "loss": 0.1254,
+ "step": 22334
+ },
+ {
+ "epoch": 60.858310626702995,
+ "grad_norm": 4.855064868927002,
+ "learning_rate": 7.01526563321322e-06,
+ "loss": 0.1817,
+ "step": 22335
+ },
+ {
+ "epoch": 60.86103542234333,
+ "grad_norm": 3.0899245738983154,
+ "learning_rate": 7.014423376122993e-06,
+ "loss": 0.1541,
+ "step": 22336
+ },
+ {
+ "epoch": 60.86376021798365,
+ "grad_norm": 5.996626377105713,
+ "learning_rate": 7.0135811422843384e-06,
+ "loss": 0.065,
+ "step": 22337
+ },
+ {
+ "epoch": 60.86648501362398,
+ "grad_norm": 4.739663600921631,
+ "learning_rate": 7.0127389317038205e-06,
+ "loss": 0.1193,
+ "step": 22338
+ },
+ {
+ "epoch": 60.869209809264305,
+ "grad_norm": 3.998300552368164,
+ "learning_rate": 7.011896744387993e-06,
+ "loss": 0.1159,
+ "step": 22339
+ },
+ {
+ "epoch": 60.87193460490463,
+ "grad_norm": 3.2619245052337646,
+ "learning_rate": 7.011054580343421e-06,
+ "loss": 0.0794,
+ "step": 22340
+ },
+ {
+ "epoch": 60.87465940054496,
+ "grad_norm": 3.9167654514312744,
+ "learning_rate": 7.010212439576656e-06,
+ "loss": 0.0969,
+ "step": 22341
+ },
+ {
+ "epoch": 60.87738419618529,
+ "grad_norm": 3.9060447216033936,
+ "learning_rate": 7.009370322094258e-06,
+ "loss": 0.0973,
+ "step": 22342
+ },
+ {
+ "epoch": 60.880108991825615,
+ "grad_norm": 3.3744008541107178,
+ "learning_rate": 7.008528227902793e-06,
+ "loss": 0.1455,
+ "step": 22343
+ },
+ {
+ "epoch": 60.88283378746594,
+ "grad_norm": 3.30375075340271,
+ "learning_rate": 7.00768615700881e-06,
+ "loss": 0.0569,
+ "step": 22344
+ },
+ {
+ "epoch": 60.88555858310627,
+ "grad_norm": 2.545348644256592,
+ "learning_rate": 7.006844109418876e-06,
+ "loss": 0.0956,
+ "step": 22345
+ },
+ {
+ "epoch": 60.88828337874659,
+ "grad_norm": 5.121275901794434,
+ "learning_rate": 7.0060020851395395e-06,
+ "loss": 0.2386,
+ "step": 22346
+ },
+ {
+ "epoch": 60.89100817438692,
+ "grad_norm": 3.8333396911621094,
+ "learning_rate": 7.005160084177365e-06,
+ "loss": 0.1525,
+ "step": 22347
+ },
+ {
+ "epoch": 60.89373297002725,
+ "grad_norm": 5.419399261474609,
+ "learning_rate": 7.0043181065389055e-06,
+ "loss": 0.1043,
+ "step": 22348
+ },
+ {
+ "epoch": 60.89645776566758,
+ "grad_norm": 3.4094061851501465,
+ "learning_rate": 7.003476152230719e-06,
+ "loss": 0.327,
+ "step": 22349
+ },
+ {
+ "epoch": 60.8991825613079,
+ "grad_norm": 3.9822192192077637,
+ "learning_rate": 7.0026342212593674e-06,
+ "loss": 0.0889,
+ "step": 22350
+ },
+ {
+ "epoch": 60.90190735694823,
+ "grad_norm": 3.1728477478027344,
+ "learning_rate": 7.001792313631401e-06,
+ "loss": 0.0861,
+ "step": 22351
+ },
+ {
+ "epoch": 60.904632152588555,
+ "grad_norm": 3.60927414894104,
+ "learning_rate": 7.000950429353382e-06,
+ "loss": 0.0656,
+ "step": 22352
+ },
+ {
+ "epoch": 60.90735694822888,
+ "grad_norm": 3.099705696105957,
+ "learning_rate": 7.000108568431863e-06,
+ "loss": 0.0534,
+ "step": 22353
+ },
+ {
+ "epoch": 60.91008174386921,
+ "grad_norm": 5.447761058807373,
+ "learning_rate": 6.999266730873403e-06,
+ "loss": 0.0543,
+ "step": 22354
+ },
+ {
+ "epoch": 60.91280653950954,
+ "grad_norm": 3.7554986476898193,
+ "learning_rate": 6.998424916684557e-06,
+ "loss": 0.1462,
+ "step": 22355
+ },
+ {
+ "epoch": 60.915531335149865,
+ "grad_norm": 2.8073854446411133,
+ "learning_rate": 6.997583125871881e-06,
+ "loss": 0.057,
+ "step": 22356
+ },
+ {
+ "epoch": 60.91825613079019,
+ "grad_norm": 3.9090890884399414,
+ "learning_rate": 6.996741358441928e-06,
+ "loss": 0.0587,
+ "step": 22357
+ },
+ {
+ "epoch": 60.920980926430516,
+ "grad_norm": 5.497412204742432,
+ "learning_rate": 6.995899614401261e-06,
+ "loss": 0.1058,
+ "step": 22358
+ },
+ {
+ "epoch": 60.92370572207084,
+ "grad_norm": 5.184669017791748,
+ "learning_rate": 6.9950578937564265e-06,
+ "loss": 0.1425,
+ "step": 22359
+ },
+ {
+ "epoch": 60.926430517711175,
+ "grad_norm": 4.452134132385254,
+ "learning_rate": 6.994216196513985e-06,
+ "loss": 0.1044,
+ "step": 22360
+ },
+ {
+ "epoch": 60.9291553133515,
+ "grad_norm": 3.787231206893921,
+ "learning_rate": 6.9933745226804965e-06,
+ "loss": 0.1101,
+ "step": 22361
+ },
+ {
+ "epoch": 60.93188010899183,
+ "grad_norm": 5.098844051361084,
+ "learning_rate": 6.992532872262505e-06,
+ "loss": 0.1892,
+ "step": 22362
+ },
+ {
+ "epoch": 60.93460490463215,
+ "grad_norm": 2.834341287612915,
+ "learning_rate": 6.991691245266574e-06,
+ "loss": 0.0508,
+ "step": 22363
+ },
+ {
+ "epoch": 60.93732970027248,
+ "grad_norm": 3.818565607070923,
+ "learning_rate": 6.990849641699254e-06,
+ "loss": 0.071,
+ "step": 22364
+ },
+ {
+ "epoch": 60.940054495912804,
+ "grad_norm": 3.319694757461548,
+ "learning_rate": 6.9900080615671e-06,
+ "loss": 0.1031,
+ "step": 22365
+ },
+ {
+ "epoch": 60.94277929155314,
+ "grad_norm": 4.184003829956055,
+ "learning_rate": 6.989166504876665e-06,
+ "loss": 0.1331,
+ "step": 22366
+ },
+ {
+ "epoch": 60.94550408719346,
+ "grad_norm": 3.072000741958618,
+ "learning_rate": 6.988324971634506e-06,
+ "loss": 0.0658,
+ "step": 22367
+ },
+ {
+ "epoch": 60.94822888283379,
+ "grad_norm": 5.3535943031311035,
+ "learning_rate": 6.987483461847174e-06,
+ "loss": 0.1483,
+ "step": 22368
+ },
+ {
+ "epoch": 60.950953678474114,
+ "grad_norm": 3.907127618789673,
+ "learning_rate": 6.9866419755212264e-06,
+ "loss": 0.0844,
+ "step": 22369
+ },
+ {
+ "epoch": 60.95367847411444,
+ "grad_norm": 4.069503307342529,
+ "learning_rate": 6.98580051266321e-06,
+ "loss": 0.108,
+ "step": 22370
+ },
+ {
+ "epoch": 60.956403269754766,
+ "grad_norm": 4.840079307556152,
+ "learning_rate": 6.9849590732796845e-06,
+ "loss": 0.0725,
+ "step": 22371
+ },
+ {
+ "epoch": 60.95912806539509,
+ "grad_norm": 4.470433712005615,
+ "learning_rate": 6.9841176573772005e-06,
+ "loss": 0.2054,
+ "step": 22372
+ },
+ {
+ "epoch": 60.961852861035425,
+ "grad_norm": 3.4157469272613525,
+ "learning_rate": 6.983276264962311e-06,
+ "loss": 0.1004,
+ "step": 22373
+ },
+ {
+ "epoch": 60.96457765667575,
+ "grad_norm": 3.0583250522613525,
+ "learning_rate": 6.98243489604157e-06,
+ "loss": 0.0575,
+ "step": 22374
+ },
+ {
+ "epoch": 60.967302452316076,
+ "grad_norm": 4.783733367919922,
+ "learning_rate": 6.981593550621528e-06,
+ "loss": 0.1084,
+ "step": 22375
+ },
+ {
+ "epoch": 60.9700272479564,
+ "grad_norm": 4.70540714263916,
+ "learning_rate": 6.980752228708738e-06,
+ "loss": 0.0414,
+ "step": 22376
+ },
+ {
+ "epoch": 60.97275204359673,
+ "grad_norm": 5.025938034057617,
+ "learning_rate": 6.97991093030975e-06,
+ "loss": 0.0565,
+ "step": 22377
+ },
+ {
+ "epoch": 60.97547683923706,
+ "grad_norm": 3.380636692047119,
+ "learning_rate": 6.979069655431121e-06,
+ "loss": 0.0724,
+ "step": 22378
+ },
+ {
+ "epoch": 60.97820163487739,
+ "grad_norm": 2.896272897720337,
+ "learning_rate": 6.978228404079401e-06,
+ "loss": 0.0569,
+ "step": 22379
+ },
+ {
+ "epoch": 60.98092643051771,
+ "grad_norm": 5.541884422302246,
+ "learning_rate": 6.97738717626114e-06,
+ "loss": 0.0641,
+ "step": 22380
+ },
+ {
+ "epoch": 60.98365122615804,
+ "grad_norm": 3.4038572311401367,
+ "learning_rate": 6.976545971982892e-06,
+ "loss": 0.1173,
+ "step": 22381
+ },
+ {
+ "epoch": 60.986376021798364,
+ "grad_norm": 4.201849460601807,
+ "learning_rate": 6.975704791251205e-06,
+ "loss": 0.0852,
+ "step": 22382
+ },
+ {
+ "epoch": 60.98910081743869,
+ "grad_norm": 3.5013699531555176,
+ "learning_rate": 6.974863634072633e-06,
+ "loss": 0.1106,
+ "step": 22383
+ },
+ {
+ "epoch": 60.991825613079016,
+ "grad_norm": 2.2500011920928955,
+ "learning_rate": 6.974022500453723e-06,
+ "loss": 0.0475,
+ "step": 22384
+ },
+ {
+ "epoch": 60.99455040871935,
+ "grad_norm": 5.096434593200684,
+ "learning_rate": 6.973181390401031e-06,
+ "loss": 0.087,
+ "step": 22385
+ },
+ {
+ "epoch": 60.997275204359674,
+ "grad_norm": 3.684089422225952,
+ "learning_rate": 6.972340303921105e-06,
+ "loss": 0.1392,
+ "step": 22386
+ },
+ {
+ "epoch": 61.0,
+ "grad_norm": 3.029940128326416,
+ "learning_rate": 6.971499241020495e-06,
+ "loss": 0.0491,
+ "step": 22387
+ },
+ {
+ "epoch": 61.002724795640326,
+ "grad_norm": 3.285654306411743,
+ "learning_rate": 6.97065820170575e-06,
+ "loss": 0.046,
+ "step": 22388
+ },
+ {
+ "epoch": 61.00544959128065,
+ "grad_norm": 4.274191856384277,
+ "learning_rate": 6.969817185983423e-06,
+ "loss": 0.1853,
+ "step": 22389
+ },
+ {
+ "epoch": 61.00817438692098,
+ "grad_norm": 3.9813826084136963,
+ "learning_rate": 6.968976193860061e-06,
+ "loss": 0.0845,
+ "step": 22390
+ },
+ {
+ "epoch": 61.01089918256131,
+ "grad_norm": 3.7100205421447754,
+ "learning_rate": 6.968135225342216e-06,
+ "loss": 0.0688,
+ "step": 22391
+ },
+ {
+ "epoch": 61.013623978201636,
+ "grad_norm": 2.5532753467559814,
+ "learning_rate": 6.967294280436435e-06,
+ "loss": 0.0678,
+ "step": 22392
+ },
+ {
+ "epoch": 61.01634877384196,
+ "grad_norm": 13.749371528625488,
+ "learning_rate": 6.9664533591492676e-06,
+ "loss": 0.1025,
+ "step": 22393
+ },
+ {
+ "epoch": 61.01907356948229,
+ "grad_norm": 5.873416900634766,
+ "learning_rate": 6.965612461487263e-06,
+ "loss": 0.1202,
+ "step": 22394
+ },
+ {
+ "epoch": 61.02179836512261,
+ "grad_norm": 3.4473066329956055,
+ "learning_rate": 6.9647715874569744e-06,
+ "loss": 0.0517,
+ "step": 22395
+ },
+ {
+ "epoch": 61.02452316076294,
+ "grad_norm": 3.542557716369629,
+ "learning_rate": 6.963930737064946e-06,
+ "loss": 0.1713,
+ "step": 22396
+ },
+ {
+ "epoch": 61.02724795640327,
+ "grad_norm": 3.8530821800231934,
+ "learning_rate": 6.9630899103177275e-06,
+ "loss": 0.0548,
+ "step": 22397
+ },
+ {
+ "epoch": 61.0299727520436,
+ "grad_norm": 3.076282501220703,
+ "learning_rate": 6.962249107221865e-06,
+ "loss": 0.0881,
+ "step": 22398
+ },
+ {
+ "epoch": 61.032697547683924,
+ "grad_norm": 3.455415964126587,
+ "learning_rate": 6.961408327783911e-06,
+ "loss": 0.1036,
+ "step": 22399
+ },
+ {
+ "epoch": 61.03542234332425,
+ "grad_norm": 3.222121477127075,
+ "learning_rate": 6.9605675720104105e-06,
+ "loss": 0.1229,
+ "step": 22400
+ },
+ {
+ "epoch": 61.038147138964575,
+ "grad_norm": 4.793354511260986,
+ "learning_rate": 6.959726839907914e-06,
+ "loss": 0.1207,
+ "step": 22401
+ },
+ {
+ "epoch": 61.0408719346049,
+ "grad_norm": 4.104300498962402,
+ "learning_rate": 6.958886131482964e-06,
+ "loss": 0.0864,
+ "step": 22402
+ },
+ {
+ "epoch": 61.043596730245234,
+ "grad_norm": 3.9924874305725098,
+ "learning_rate": 6.958045446742112e-06,
+ "loss": 0.0618,
+ "step": 22403
+ },
+ {
+ "epoch": 61.04632152588556,
+ "grad_norm": 2.7155587673187256,
+ "learning_rate": 6.957204785691905e-06,
+ "loss": 0.0994,
+ "step": 22404
+ },
+ {
+ "epoch": 61.049046321525886,
+ "grad_norm": 3.9910666942596436,
+ "learning_rate": 6.956364148338888e-06,
+ "loss": 0.0863,
+ "step": 22405
+ },
+ {
+ "epoch": 61.05177111716621,
+ "grad_norm": 3.0680413246154785,
+ "learning_rate": 6.955523534689609e-06,
+ "loss": 0.0805,
+ "step": 22406
+ },
+ {
+ "epoch": 61.05449591280654,
+ "grad_norm": 4.468904495239258,
+ "learning_rate": 6.954682944750616e-06,
+ "loss": 0.0771,
+ "step": 22407
+ },
+ {
+ "epoch": 61.05722070844686,
+ "grad_norm": 2.7519149780273438,
+ "learning_rate": 6.9538423785284524e-06,
+ "loss": 0.1257,
+ "step": 22408
+ },
+ {
+ "epoch": 61.059945504087196,
+ "grad_norm": 4.085991382598877,
+ "learning_rate": 6.953001836029668e-06,
+ "loss": 0.1341,
+ "step": 22409
+ },
+ {
+ "epoch": 61.06267029972752,
+ "grad_norm": 3.700883626937866,
+ "learning_rate": 6.952161317260806e-06,
+ "loss": 0.1026,
+ "step": 22410
+ },
+ {
+ "epoch": 61.06539509536785,
+ "grad_norm": 2.7471423149108887,
+ "learning_rate": 6.951320822228411e-06,
+ "loss": 0.0779,
+ "step": 22411
+ },
+ {
+ "epoch": 61.06811989100817,
+ "grad_norm": 3.2887837886810303,
+ "learning_rate": 6.9504803509390324e-06,
+ "loss": 0.0651,
+ "step": 22412
+ },
+ {
+ "epoch": 61.0708446866485,
+ "grad_norm": 4.459373950958252,
+ "learning_rate": 6.949639903399219e-06,
+ "loss": 0.0993,
+ "step": 22413
+ },
+ {
+ "epoch": 61.073569482288825,
+ "grad_norm": 3.905278205871582,
+ "learning_rate": 6.948799479615508e-06,
+ "loss": 0.183,
+ "step": 22414
+ },
+ {
+ "epoch": 61.07629427792916,
+ "grad_norm": 4.412621974945068,
+ "learning_rate": 6.947959079594451e-06,
+ "loss": 0.0534,
+ "step": 22415
+ },
+ {
+ "epoch": 61.079019073569484,
+ "grad_norm": 3.1119372844696045,
+ "learning_rate": 6.947118703342588e-06,
+ "loss": 0.0983,
+ "step": 22416
+ },
+ {
+ "epoch": 61.08174386920981,
+ "grad_norm": 3.1814849376678467,
+ "learning_rate": 6.9462783508664685e-06,
+ "loss": 0.0478,
+ "step": 22417
+ },
+ {
+ "epoch": 61.084468664850135,
+ "grad_norm": 3.6415998935699463,
+ "learning_rate": 6.9454380221726335e-06,
+ "loss": 0.2283,
+ "step": 22418
+ },
+ {
+ "epoch": 61.08719346049046,
+ "grad_norm": 3.1991705894470215,
+ "learning_rate": 6.9445977172676315e-06,
+ "loss": 0.1656,
+ "step": 22419
+ },
+ {
+ "epoch": 61.08991825613079,
+ "grad_norm": 3.5609500408172607,
+ "learning_rate": 6.943757436158001e-06,
+ "loss": 0.2535,
+ "step": 22420
+ },
+ {
+ "epoch": 61.09264305177112,
+ "grad_norm": 3.4742014408111572,
+ "learning_rate": 6.94291717885029e-06,
+ "loss": 0.0565,
+ "step": 22421
+ },
+ {
+ "epoch": 61.095367847411445,
+ "grad_norm": 5.54591703414917,
+ "learning_rate": 6.9420769453510415e-06,
+ "loss": 0.0777,
+ "step": 22422
+ },
+ {
+ "epoch": 61.09809264305177,
+ "grad_norm": 3.9256865978240967,
+ "learning_rate": 6.941236735666801e-06,
+ "loss": 0.1117,
+ "step": 22423
+ },
+ {
+ "epoch": 61.1008174386921,
+ "grad_norm": 4.0424017906188965,
+ "learning_rate": 6.9403965498041084e-06,
+ "loss": 0.1486,
+ "step": 22424
+ },
+ {
+ "epoch": 61.10354223433242,
+ "grad_norm": 3.375750780105591,
+ "learning_rate": 6.939556387769511e-06,
+ "loss": 0.3533,
+ "step": 22425
+ },
+ {
+ "epoch": 61.10626702997275,
+ "grad_norm": 3.0661110877990723,
+ "learning_rate": 6.9387162495695485e-06,
+ "loss": 0.2026,
+ "step": 22426
+ },
+ {
+ "epoch": 61.10899182561308,
+ "grad_norm": 3.263305902481079,
+ "learning_rate": 6.937876135210766e-06,
+ "loss": 0.1391,
+ "step": 22427
+ },
+ {
+ "epoch": 61.11171662125341,
+ "grad_norm": 6.555750370025635,
+ "learning_rate": 6.937036044699701e-06,
+ "loss": 0.085,
+ "step": 22428
+ },
+ {
+ "epoch": 61.11444141689373,
+ "grad_norm": 2.908816337585449,
+ "learning_rate": 6.936195978042904e-06,
+ "loss": 0.157,
+ "step": 22429
+ },
+ {
+ "epoch": 61.11716621253406,
+ "grad_norm": 3.787827253341675,
+ "learning_rate": 6.9353559352469165e-06,
+ "loss": 0.1936,
+ "step": 22430
+ },
+ {
+ "epoch": 61.119891008174385,
+ "grad_norm": 3.831509590148926,
+ "learning_rate": 6.934515916318276e-06,
+ "loss": 0.0693,
+ "step": 22431
+ },
+ {
+ "epoch": 61.12261580381471,
+ "grad_norm": 5.685774326324463,
+ "learning_rate": 6.9336759212635285e-06,
+ "loss": 0.0648,
+ "step": 22432
+ },
+ {
+ "epoch": 61.12534059945504,
+ "grad_norm": 3.847019672393799,
+ "learning_rate": 6.932835950089211e-06,
+ "loss": 0.126,
+ "step": 22433
+ },
+ {
+ "epoch": 61.12806539509537,
+ "grad_norm": 2.8347580432891846,
+ "learning_rate": 6.93199600280187e-06,
+ "loss": 0.0598,
+ "step": 22434
+ },
+ {
+ "epoch": 61.130790190735695,
+ "grad_norm": 2.3914573192596436,
+ "learning_rate": 6.931156079408048e-06,
+ "loss": 0.0418,
+ "step": 22435
+ },
+ {
+ "epoch": 61.13351498637602,
+ "grad_norm": 3.817255973815918,
+ "learning_rate": 6.930316179914281e-06,
+ "loss": 0.1644,
+ "step": 22436
+ },
+ {
+ "epoch": 61.13623978201635,
+ "grad_norm": 3.574416160583496,
+ "learning_rate": 6.9294763043271156e-06,
+ "loss": 0.1007,
+ "step": 22437
+ },
+ {
+ "epoch": 61.13896457765667,
+ "grad_norm": 3.91249942779541,
+ "learning_rate": 6.928636452653086e-06,
+ "loss": 0.1997,
+ "step": 22438
+ },
+ {
+ "epoch": 61.141689373297005,
+ "grad_norm": 4.053663730621338,
+ "learning_rate": 6.9277966248987405e-06,
+ "loss": 0.1863,
+ "step": 22439
+ },
+ {
+ "epoch": 61.14441416893733,
+ "grad_norm": 3.43363881111145,
+ "learning_rate": 6.926956821070614e-06,
+ "loss": 0.1179,
+ "step": 22440
+ },
+ {
+ "epoch": 61.14713896457766,
+ "grad_norm": 3.894035816192627,
+ "learning_rate": 6.92611704117525e-06,
+ "loss": 0.0746,
+ "step": 22441
+ },
+ {
+ "epoch": 61.14986376021798,
+ "grad_norm": 3.0605595111846924,
+ "learning_rate": 6.925277285219185e-06,
+ "loss": 0.0626,
+ "step": 22442
+ },
+ {
+ "epoch": 61.15258855585831,
+ "grad_norm": 4.345304012298584,
+ "learning_rate": 6.924437553208965e-06,
+ "loss": 0.1464,
+ "step": 22443
+ },
+ {
+ "epoch": 61.155313351498634,
+ "grad_norm": 4.668532848358154,
+ "learning_rate": 6.923597845151124e-06,
+ "loss": 0.1101,
+ "step": 22444
+ },
+ {
+ "epoch": 61.15803814713897,
+ "grad_norm": 3.243645429611206,
+ "learning_rate": 6.922758161052201e-06,
+ "loss": 0.0891,
+ "step": 22445
+ },
+ {
+ "epoch": 61.16076294277929,
+ "grad_norm": 4.130244731903076,
+ "learning_rate": 6.921918500918743e-06,
+ "loss": 0.1457,
+ "step": 22446
+ },
+ {
+ "epoch": 61.16348773841962,
+ "grad_norm": 4.43756628036499,
+ "learning_rate": 6.921078864757282e-06,
+ "loss": 0.1449,
+ "step": 22447
+ },
+ {
+ "epoch": 61.166212534059945,
+ "grad_norm": 3.9297196865081787,
+ "learning_rate": 6.920239252574364e-06,
+ "loss": 0.0579,
+ "step": 22448
+ },
+ {
+ "epoch": 61.16893732970027,
+ "grad_norm": 4.997093200683594,
+ "learning_rate": 6.9193996643765195e-06,
+ "loss": 0.1195,
+ "step": 22449
+ },
+ {
+ "epoch": 61.171662125340596,
+ "grad_norm": 3.6902146339416504,
+ "learning_rate": 6.918560100170293e-06,
+ "loss": 0.11,
+ "step": 22450
+ },
+ {
+ "epoch": 61.17438692098093,
+ "grad_norm": 2.218496322631836,
+ "learning_rate": 6.91772055996222e-06,
+ "loss": 0.0283,
+ "step": 22451
+ },
+ {
+ "epoch": 61.177111716621255,
+ "grad_norm": 4.0584211349487305,
+ "learning_rate": 6.916881043758843e-06,
+ "loss": 0.1857,
+ "step": 22452
+ },
+ {
+ "epoch": 61.17983651226158,
+ "grad_norm": 5.4693193435668945,
+ "learning_rate": 6.916041551566695e-06,
+ "loss": 0.0712,
+ "step": 22453
+ },
+ {
+ "epoch": 61.182561307901906,
+ "grad_norm": 2.8290891647338867,
+ "learning_rate": 6.915202083392316e-06,
+ "loss": 0.0834,
+ "step": 22454
+ },
+ {
+ "epoch": 61.18528610354223,
+ "grad_norm": 4.029819488525391,
+ "learning_rate": 6.9143626392422446e-06,
+ "loss": 0.1181,
+ "step": 22455
+ },
+ {
+ "epoch": 61.18801089918256,
+ "grad_norm": 2.920246124267578,
+ "learning_rate": 6.9135232191230176e-06,
+ "loss": 0.0597,
+ "step": 22456
+ },
+ {
+ "epoch": 61.19073569482289,
+ "grad_norm": 3.2647705078125,
+ "learning_rate": 6.912683823041171e-06,
+ "loss": 0.1243,
+ "step": 22457
+ },
+ {
+ "epoch": 61.19346049046322,
+ "grad_norm": 4.116549968719482,
+ "learning_rate": 6.911844451003244e-06,
+ "loss": 0.1568,
+ "step": 22458
+ },
+ {
+ "epoch": 61.19618528610354,
+ "grad_norm": 3.7574572563171387,
+ "learning_rate": 6.911005103015775e-06,
+ "loss": 0.2098,
+ "step": 22459
+ },
+ {
+ "epoch": 61.19891008174387,
+ "grad_norm": 3.683820962905884,
+ "learning_rate": 6.910165779085296e-06,
+ "loss": 0.1229,
+ "step": 22460
+ },
+ {
+ "epoch": 61.201634877384194,
+ "grad_norm": 4.492462158203125,
+ "learning_rate": 6.90932647921835e-06,
+ "loss": 0.1008,
+ "step": 22461
+ },
+ {
+ "epoch": 61.20435967302452,
+ "grad_norm": 3.6631996631622314,
+ "learning_rate": 6.908487203421465e-06,
+ "loss": 0.0954,
+ "step": 22462
+ },
+ {
+ "epoch": 61.20708446866485,
+ "grad_norm": 2.686357021331787,
+ "learning_rate": 6.907647951701183e-06,
+ "loss": 0.0509,
+ "step": 22463
+ },
+ {
+ "epoch": 61.20980926430518,
+ "grad_norm": 3.2772693634033203,
+ "learning_rate": 6.906808724064043e-06,
+ "loss": 0.054,
+ "step": 22464
+ },
+ {
+ "epoch": 61.212534059945504,
+ "grad_norm": 3.1622159481048584,
+ "learning_rate": 6.905969520516573e-06,
+ "loss": 0.0817,
+ "step": 22465
+ },
+ {
+ "epoch": 61.21525885558583,
+ "grad_norm": 3.74229097366333,
+ "learning_rate": 6.905130341065317e-06,
+ "loss": 0.0751,
+ "step": 22466
+ },
+ {
+ "epoch": 61.217983651226156,
+ "grad_norm": 3.26526141166687,
+ "learning_rate": 6.904291185716802e-06,
+ "loss": 0.0645,
+ "step": 22467
+ },
+ {
+ "epoch": 61.22070844686648,
+ "grad_norm": 3.589921236038208,
+ "learning_rate": 6.903452054477573e-06,
+ "loss": 0.0629,
+ "step": 22468
+ },
+ {
+ "epoch": 61.223433242506815,
+ "grad_norm": 5.118885040283203,
+ "learning_rate": 6.902612947354155e-06,
+ "loss": 0.1421,
+ "step": 22469
+ },
+ {
+ "epoch": 61.22615803814714,
+ "grad_norm": 3.6298789978027344,
+ "learning_rate": 6.9017738643530905e-06,
+ "loss": 0.0704,
+ "step": 22470
+ },
+ {
+ "epoch": 61.228882833787466,
+ "grad_norm": 3.2231998443603516,
+ "learning_rate": 6.90093480548091e-06,
+ "loss": 0.0662,
+ "step": 22471
+ },
+ {
+ "epoch": 61.23160762942779,
+ "grad_norm": 2.864978313446045,
+ "learning_rate": 6.9000957707441505e-06,
+ "loss": 0.1268,
+ "step": 22472
+ },
+ {
+ "epoch": 61.23433242506812,
+ "grad_norm": 3.8802876472473145,
+ "learning_rate": 6.899256760149345e-06,
+ "loss": 0.0984,
+ "step": 22473
+ },
+ {
+ "epoch": 61.237057220708444,
+ "grad_norm": 2.5116190910339355,
+ "learning_rate": 6.898417773703028e-06,
+ "loss": 0.0491,
+ "step": 22474
+ },
+ {
+ "epoch": 61.23978201634878,
+ "grad_norm": 3.569486141204834,
+ "learning_rate": 6.897578811411732e-06,
+ "loss": 0.0665,
+ "step": 22475
+ },
+ {
+ "epoch": 61.2425068119891,
+ "grad_norm": 3.417987823486328,
+ "learning_rate": 6.896739873281995e-06,
+ "loss": 0.1306,
+ "step": 22476
+ },
+ {
+ "epoch": 61.24523160762943,
+ "grad_norm": 3.795724868774414,
+ "learning_rate": 6.8959009593203454e-06,
+ "loss": 0.2253,
+ "step": 22477
+ },
+ {
+ "epoch": 61.247956403269754,
+ "grad_norm": 4.208312511444092,
+ "learning_rate": 6.895062069533322e-06,
+ "loss": 0.1128,
+ "step": 22478
+ },
+ {
+ "epoch": 61.25068119891008,
+ "grad_norm": 4.227952480316162,
+ "learning_rate": 6.894223203927452e-06,
+ "loss": 0.1524,
+ "step": 22479
+ },
+ {
+ "epoch": 61.253405994550405,
+ "grad_norm": 5.267580509185791,
+ "learning_rate": 6.8933843625092715e-06,
+ "loss": 0.0809,
+ "step": 22480
+ },
+ {
+ "epoch": 61.25613079019074,
+ "grad_norm": 3.6058425903320312,
+ "learning_rate": 6.892545545285314e-06,
+ "loss": 0.0906,
+ "step": 22481
+ },
+ {
+ "epoch": 61.258855585831064,
+ "grad_norm": 7.454145431518555,
+ "learning_rate": 6.891706752262115e-06,
+ "loss": 0.1498,
+ "step": 22482
+ },
+ {
+ "epoch": 61.26158038147139,
+ "grad_norm": 3.4177675247192383,
+ "learning_rate": 6.890867983446201e-06,
+ "loss": 0.0654,
+ "step": 22483
+ },
+ {
+ "epoch": 61.264305177111716,
+ "grad_norm": 2.882645606994629,
+ "learning_rate": 6.8900292388441095e-06,
+ "loss": 0.0957,
+ "step": 22484
+ },
+ {
+ "epoch": 61.26702997275204,
+ "grad_norm": 3.294074773788452,
+ "learning_rate": 6.889190518462368e-06,
+ "loss": 0.0733,
+ "step": 22485
+ },
+ {
+ "epoch": 61.26975476839237,
+ "grad_norm": 3.619446039199829,
+ "learning_rate": 6.888351822307513e-06,
+ "loss": 0.0694,
+ "step": 22486
+ },
+ {
+ "epoch": 61.2724795640327,
+ "grad_norm": 3.25736141204834,
+ "learning_rate": 6.887513150386072e-06,
+ "loss": 0.0637,
+ "step": 22487
+ },
+ {
+ "epoch": 61.275204359673026,
+ "grad_norm": 4.02907657623291,
+ "learning_rate": 6.886674502704579e-06,
+ "loss": 0.1833,
+ "step": 22488
+ },
+ {
+ "epoch": 61.27792915531335,
+ "grad_norm": 3.1237282752990723,
+ "learning_rate": 6.885835879269564e-06,
+ "loss": 0.0694,
+ "step": 22489
+ },
+ {
+ "epoch": 61.28065395095368,
+ "grad_norm": 8.443364143371582,
+ "learning_rate": 6.88499728008756e-06,
+ "loss": 0.1257,
+ "step": 22490
+ },
+ {
+ "epoch": 61.283378746594,
+ "grad_norm": 4.005463600158691,
+ "learning_rate": 6.884158705165096e-06,
+ "loss": 0.0746,
+ "step": 22491
+ },
+ {
+ "epoch": 61.28610354223433,
+ "grad_norm": 3.8555893898010254,
+ "learning_rate": 6.883320154508705e-06,
+ "loss": 0.0707,
+ "step": 22492
+ },
+ {
+ "epoch": 61.28882833787466,
+ "grad_norm": 2.8718743324279785,
+ "learning_rate": 6.882481628124915e-06,
+ "loss": 0.0623,
+ "step": 22493
+ },
+ {
+ "epoch": 61.29155313351499,
+ "grad_norm": 3.9258992671966553,
+ "learning_rate": 6.881643126020259e-06,
+ "loss": 0.1837,
+ "step": 22494
+ },
+ {
+ "epoch": 61.294277929155314,
+ "grad_norm": 7.436041355133057,
+ "learning_rate": 6.8808046482012645e-06,
+ "loss": 0.0849,
+ "step": 22495
+ },
+ {
+ "epoch": 61.29700272479564,
+ "grad_norm": 3.05180287361145,
+ "learning_rate": 6.8799661946744646e-06,
+ "loss": 0.106,
+ "step": 22496
+ },
+ {
+ "epoch": 61.299727520435965,
+ "grad_norm": 3.570476531982422,
+ "learning_rate": 6.879127765446383e-06,
+ "loss": 0.2072,
+ "step": 22497
+ },
+ {
+ "epoch": 61.30245231607629,
+ "grad_norm": 2.7125468254089355,
+ "learning_rate": 6.878289360523556e-06,
+ "loss": 0.0435,
+ "step": 22498
+ },
+ {
+ "epoch": 61.305177111716624,
+ "grad_norm": 6.026636600494385,
+ "learning_rate": 6.877450979912512e-06,
+ "loss": 0.0725,
+ "step": 22499
+ },
+ {
+ "epoch": 61.30790190735695,
+ "grad_norm": 3.470548391342163,
+ "learning_rate": 6.876612623619782e-06,
+ "loss": 0.059,
+ "step": 22500
+ },
+ {
+ "epoch": 61.310626702997276,
+ "grad_norm": 3.3297195434570312,
+ "learning_rate": 6.875774291651889e-06,
+ "loss": 0.1602,
+ "step": 22501
+ },
+ {
+ "epoch": 61.3133514986376,
+ "grad_norm": 2.9722609519958496,
+ "learning_rate": 6.874935984015367e-06,
+ "loss": 0.098,
+ "step": 22502
+ },
+ {
+ "epoch": 61.31607629427793,
+ "grad_norm": 4.761186122894287,
+ "learning_rate": 6.874097700716742e-06,
+ "loss": 0.1268,
+ "step": 22503
+ },
+ {
+ "epoch": 61.31880108991825,
+ "grad_norm": 3.75443434715271,
+ "learning_rate": 6.873259441762545e-06,
+ "loss": 0.0661,
+ "step": 22504
+ },
+ {
+ "epoch": 61.321525885558586,
+ "grad_norm": 3.4605464935302734,
+ "learning_rate": 6.872421207159301e-06,
+ "loss": 0.0559,
+ "step": 22505
+ },
+ {
+ "epoch": 61.32425068119891,
+ "grad_norm": 2.499070644378662,
+ "learning_rate": 6.871582996913542e-06,
+ "loss": 0.0584,
+ "step": 22506
+ },
+ {
+ "epoch": 61.32697547683924,
+ "grad_norm": 4.2966437339782715,
+ "learning_rate": 6.870744811031791e-06,
+ "loss": 0.0485,
+ "step": 22507
+ },
+ {
+ "epoch": 61.32970027247956,
+ "grad_norm": 8.06656551361084,
+ "learning_rate": 6.869906649520581e-06,
+ "loss": 0.1118,
+ "step": 22508
+ },
+ {
+ "epoch": 61.33242506811989,
+ "grad_norm": 3.6609208583831787,
+ "learning_rate": 6.869068512386436e-06,
+ "loss": 0.0799,
+ "step": 22509
+ },
+ {
+ "epoch": 61.335149863760215,
+ "grad_norm": 2.774722099304199,
+ "learning_rate": 6.868230399635887e-06,
+ "loss": 0.1738,
+ "step": 22510
+ },
+ {
+ "epoch": 61.33787465940055,
+ "grad_norm": 3.4997575283050537,
+ "learning_rate": 6.867392311275456e-06,
+ "loss": 0.1908,
+ "step": 22511
+ },
+ {
+ "epoch": 61.34059945504087,
+ "grad_norm": 2.995242118835449,
+ "learning_rate": 6.866554247311676e-06,
+ "loss": 0.1446,
+ "step": 22512
+ },
+ {
+ "epoch": 61.3433242506812,
+ "grad_norm": 2.2353782653808594,
+ "learning_rate": 6.865716207751068e-06,
+ "loss": 0.0471,
+ "step": 22513
+ },
+ {
+ "epoch": 61.346049046321525,
+ "grad_norm": 4.911764144897461,
+ "learning_rate": 6.864878192600158e-06,
+ "loss": 0.1985,
+ "step": 22514
+ },
+ {
+ "epoch": 61.34877384196185,
+ "grad_norm": 4.077296733856201,
+ "learning_rate": 6.864040201865481e-06,
+ "loss": 0.0599,
+ "step": 22515
+ },
+ {
+ "epoch": 61.35149863760218,
+ "grad_norm": 5.075759410858154,
+ "learning_rate": 6.863202235553557e-06,
+ "loss": 0.0898,
+ "step": 22516
+ },
+ {
+ "epoch": 61.35422343324251,
+ "grad_norm": 3.448331594467163,
+ "learning_rate": 6.862364293670913e-06,
+ "loss": 0.0492,
+ "step": 22517
+ },
+ {
+ "epoch": 61.356948228882835,
+ "grad_norm": 2.8780722618103027,
+ "learning_rate": 6.8615263762240735e-06,
+ "loss": 0.124,
+ "step": 22518
+ },
+ {
+ "epoch": 61.35967302452316,
+ "grad_norm": 3.84973406791687,
+ "learning_rate": 6.860688483219569e-06,
+ "loss": 0.1241,
+ "step": 22519
+ },
+ {
+ "epoch": 61.36239782016349,
+ "grad_norm": 3.990999698638916,
+ "learning_rate": 6.859850614663916e-06,
+ "loss": 0.1081,
+ "step": 22520
+ },
+ {
+ "epoch": 61.36512261580381,
+ "grad_norm": 3.954577922821045,
+ "learning_rate": 6.859012770563649e-06,
+ "loss": 0.0656,
+ "step": 22521
+ },
+ {
+ "epoch": 61.36784741144414,
+ "grad_norm": 4.023142337799072,
+ "learning_rate": 6.858174950925289e-06,
+ "loss": 0.0796,
+ "step": 22522
+ },
+ {
+ "epoch": 61.37057220708447,
+ "grad_norm": 3.638831853866577,
+ "learning_rate": 6.857337155755362e-06,
+ "loss": 0.0473,
+ "step": 22523
+ },
+ {
+ "epoch": 61.3732970027248,
+ "grad_norm": 3.5866053104400635,
+ "learning_rate": 6.856499385060392e-06,
+ "loss": 0.1376,
+ "step": 22524
+ },
+ {
+ "epoch": 61.37602179836512,
+ "grad_norm": 3.0281224250793457,
+ "learning_rate": 6.855661638846902e-06,
+ "loss": 0.0581,
+ "step": 22525
+ },
+ {
+ "epoch": 61.37874659400545,
+ "grad_norm": 3.867025375366211,
+ "learning_rate": 6.854823917121421e-06,
+ "loss": 0.0782,
+ "step": 22526
+ },
+ {
+ "epoch": 61.381471389645775,
+ "grad_norm": 4.331473350524902,
+ "learning_rate": 6.853986219890467e-06,
+ "loss": 0.0702,
+ "step": 22527
+ },
+ {
+ "epoch": 61.3841961852861,
+ "grad_norm": 3.835432291030884,
+ "learning_rate": 6.853148547160568e-06,
+ "loss": 0.0706,
+ "step": 22528
+ },
+ {
+ "epoch": 61.38692098092643,
+ "grad_norm": 5.395134449005127,
+ "learning_rate": 6.852310898938248e-06,
+ "loss": 0.1446,
+ "step": 22529
+ },
+ {
+ "epoch": 61.38964577656676,
+ "grad_norm": 3.941890239715576,
+ "learning_rate": 6.85147327523003e-06,
+ "loss": 0.1196,
+ "step": 22530
+ },
+ {
+ "epoch": 61.392370572207085,
+ "grad_norm": 3.325962781906128,
+ "learning_rate": 6.850635676042432e-06,
+ "loss": 0.0991,
+ "step": 22531
+ },
+ {
+ "epoch": 61.39509536784741,
+ "grad_norm": 4.40023946762085,
+ "learning_rate": 6.849798101381984e-06,
+ "loss": 0.0587,
+ "step": 22532
+ },
+ {
+ "epoch": 61.39782016348774,
+ "grad_norm": 3.027614116668701,
+ "learning_rate": 6.848960551255208e-06,
+ "loss": 0.049,
+ "step": 22533
+ },
+ {
+ "epoch": 61.40054495912806,
+ "grad_norm": 5.605319499969482,
+ "learning_rate": 6.848123025668626e-06,
+ "loss": 0.2438,
+ "step": 22534
+ },
+ {
+ "epoch": 61.403269754768395,
+ "grad_norm": 5.745209217071533,
+ "learning_rate": 6.847285524628762e-06,
+ "loss": 0.0956,
+ "step": 22535
+ },
+ {
+ "epoch": 61.40599455040872,
+ "grad_norm": 3.1595828533172607,
+ "learning_rate": 6.846448048142134e-06,
+ "loss": 0.0941,
+ "step": 22536
+ },
+ {
+ "epoch": 61.40871934604905,
+ "grad_norm": 2.9316658973693848,
+ "learning_rate": 6.84561059621527e-06,
+ "loss": 0.1674,
+ "step": 22537
+ },
+ {
+ "epoch": 61.41144414168937,
+ "grad_norm": 5.271034240722656,
+ "learning_rate": 6.844773168854686e-06,
+ "loss": 0.1526,
+ "step": 22538
+ },
+ {
+ "epoch": 61.4141689373297,
+ "grad_norm": 3.7947235107421875,
+ "learning_rate": 6.843935766066911e-06,
+ "loss": 0.0582,
+ "step": 22539
+ },
+ {
+ "epoch": 61.416893732970024,
+ "grad_norm": 3.0826029777526855,
+ "learning_rate": 6.8430983878584585e-06,
+ "loss": 0.0697,
+ "step": 22540
+ },
+ {
+ "epoch": 61.41961852861036,
+ "grad_norm": 3.8238813877105713,
+ "learning_rate": 6.842261034235858e-06,
+ "loss": 0.1339,
+ "step": 22541
+ },
+ {
+ "epoch": 61.42234332425068,
+ "grad_norm": 4.125527381896973,
+ "learning_rate": 6.841423705205623e-06,
+ "loss": 0.1194,
+ "step": 22542
+ },
+ {
+ "epoch": 61.42506811989101,
+ "grad_norm": 4.080195426940918,
+ "learning_rate": 6.840586400774282e-06,
+ "loss": 0.1927,
+ "step": 22543
+ },
+ {
+ "epoch": 61.427792915531334,
+ "grad_norm": 4.2366228103637695,
+ "learning_rate": 6.839749120948349e-06,
+ "loss": 0.1214,
+ "step": 22544
+ },
+ {
+ "epoch": 61.43051771117166,
+ "grad_norm": 3.4900057315826416,
+ "learning_rate": 6.8389118657343505e-06,
+ "loss": 0.0864,
+ "step": 22545
+ },
+ {
+ "epoch": 61.433242506811986,
+ "grad_norm": 3.958977460861206,
+ "learning_rate": 6.838074635138805e-06,
+ "loss": 0.0958,
+ "step": 22546
+ },
+ {
+ "epoch": 61.43596730245232,
+ "grad_norm": 6.551956653594971,
+ "learning_rate": 6.8372374291682306e-06,
+ "loss": 0.2499,
+ "step": 22547
+ },
+ {
+ "epoch": 61.438692098092645,
+ "grad_norm": 4.2710371017456055,
+ "learning_rate": 6.836400247829151e-06,
+ "loss": 0.0968,
+ "step": 22548
+ },
+ {
+ "epoch": 61.44141689373297,
+ "grad_norm": 2.7208895683288574,
+ "learning_rate": 6.835563091128081e-06,
+ "loss": 0.1067,
+ "step": 22549
+ },
+ {
+ "epoch": 61.444141689373296,
+ "grad_norm": 4.0786285400390625,
+ "learning_rate": 6.834725959071546e-06,
+ "loss": 0.1261,
+ "step": 22550
+ },
+ {
+ "epoch": 61.44686648501362,
+ "grad_norm": 4.6377105712890625,
+ "learning_rate": 6.833888851666064e-06,
+ "loss": 0.0836,
+ "step": 22551
+ },
+ {
+ "epoch": 61.44959128065395,
+ "grad_norm": 3.952730894088745,
+ "learning_rate": 6.8330517689181534e-06,
+ "loss": 0.1789,
+ "step": 22552
+ },
+ {
+ "epoch": 61.45231607629428,
+ "grad_norm": 7.379684925079346,
+ "learning_rate": 6.832214710834335e-06,
+ "loss": 0.1058,
+ "step": 22553
+ },
+ {
+ "epoch": 61.45504087193461,
+ "grad_norm": 4.6327223777771,
+ "learning_rate": 6.831377677421125e-06,
+ "loss": 0.131,
+ "step": 22554
+ },
+ {
+ "epoch": 61.45776566757493,
+ "grad_norm": 2.3379297256469727,
+ "learning_rate": 6.830540668685045e-06,
+ "loss": 0.0889,
+ "step": 22555
+ },
+ {
+ "epoch": 61.46049046321526,
+ "grad_norm": 2.2440812587738037,
+ "learning_rate": 6.82970368463261e-06,
+ "loss": 0.1082,
+ "step": 22556
+ },
+ {
+ "epoch": 61.463215258855584,
+ "grad_norm": 4.8782877922058105,
+ "learning_rate": 6.8288667252703435e-06,
+ "loss": 0.0587,
+ "step": 22557
+ },
+ {
+ "epoch": 61.46594005449591,
+ "grad_norm": 3.6590161323547363,
+ "learning_rate": 6.828029790604757e-06,
+ "loss": 0.2096,
+ "step": 22558
+ },
+ {
+ "epoch": 61.46866485013624,
+ "grad_norm": 3.6848299503326416,
+ "learning_rate": 6.827192880642377e-06,
+ "loss": 0.0511,
+ "step": 22559
+ },
+ {
+ "epoch": 61.47138964577657,
+ "grad_norm": 5.054895877838135,
+ "learning_rate": 6.826355995389714e-06,
+ "loss": 0.1669,
+ "step": 22560
+ },
+ {
+ "epoch": 61.474114441416894,
+ "grad_norm": 3.6900060176849365,
+ "learning_rate": 6.82551913485329e-06,
+ "loss": 0.1283,
+ "step": 22561
+ },
+ {
+ "epoch": 61.47683923705722,
+ "grad_norm": 3.7525711059570312,
+ "learning_rate": 6.824682299039619e-06,
+ "loss": 0.0659,
+ "step": 22562
+ },
+ {
+ "epoch": 61.479564032697546,
+ "grad_norm": 4.069061756134033,
+ "learning_rate": 6.823845487955222e-06,
+ "loss": 0.1744,
+ "step": 22563
+ },
+ {
+ "epoch": 61.48228882833787,
+ "grad_norm": 4.4344096183776855,
+ "learning_rate": 6.823008701606612e-06,
+ "loss": 0.1213,
+ "step": 22564
+ },
+ {
+ "epoch": 61.485013623978205,
+ "grad_norm": 3.128112316131592,
+ "learning_rate": 6.822171940000311e-06,
+ "loss": 0.0555,
+ "step": 22565
+ },
+ {
+ "epoch": 61.48773841961853,
+ "grad_norm": 5.1781110763549805,
+ "learning_rate": 6.821335203142825e-06,
+ "loss": 0.0946,
+ "step": 22566
+ },
+ {
+ "epoch": 61.490463215258856,
+ "grad_norm": 3.098604917526245,
+ "learning_rate": 6.820498491040684e-06,
+ "loss": 0.1108,
+ "step": 22567
+ },
+ {
+ "epoch": 61.49318801089918,
+ "grad_norm": 5.4357075691223145,
+ "learning_rate": 6.819661803700397e-06,
+ "loss": 0.0706,
+ "step": 22568
+ },
+ {
+ "epoch": 61.49591280653951,
+ "grad_norm": 4.7054266929626465,
+ "learning_rate": 6.818825141128484e-06,
+ "loss": 0.0891,
+ "step": 22569
+ },
+ {
+ "epoch": 61.49863760217983,
+ "grad_norm": 5.830087184906006,
+ "learning_rate": 6.817988503331456e-06,
+ "loss": 0.303,
+ "step": 22570
+ },
+ {
+ "epoch": 61.50136239782017,
+ "grad_norm": 4.259527206420898,
+ "learning_rate": 6.817151890315834e-06,
+ "loss": 0.2109,
+ "step": 22571
+ },
+ {
+ "epoch": 61.50408719346049,
+ "grad_norm": 3.3473060131073,
+ "learning_rate": 6.816315302088128e-06,
+ "loss": 0.0757,
+ "step": 22572
+ },
+ {
+ "epoch": 61.50681198910082,
+ "grad_norm": 6.24845552444458,
+ "learning_rate": 6.815478738654857e-06,
+ "loss": 0.1215,
+ "step": 22573
+ },
+ {
+ "epoch": 61.509536784741144,
+ "grad_norm": 5.4939351081848145,
+ "learning_rate": 6.814642200022534e-06,
+ "loss": 0.1916,
+ "step": 22574
+ },
+ {
+ "epoch": 61.51226158038147,
+ "grad_norm": 3.96571946144104,
+ "learning_rate": 6.813805686197677e-06,
+ "loss": 0.1267,
+ "step": 22575
+ },
+ {
+ "epoch": 61.514986376021795,
+ "grad_norm": 3.6861422061920166,
+ "learning_rate": 6.812969197186796e-06,
+ "loss": 0.0727,
+ "step": 22576
+ },
+ {
+ "epoch": 61.51771117166213,
+ "grad_norm": 3.844547986984253,
+ "learning_rate": 6.8121327329964116e-06,
+ "loss": 0.1031,
+ "step": 22577
+ },
+ {
+ "epoch": 61.520435967302454,
+ "grad_norm": 3.123567581176758,
+ "learning_rate": 6.811296293633032e-06,
+ "loss": 0.1303,
+ "step": 22578
+ },
+ {
+ "epoch": 61.52316076294278,
+ "grad_norm": 2.9488346576690674,
+ "learning_rate": 6.810459879103177e-06,
+ "loss": 0.0529,
+ "step": 22579
+ },
+ {
+ "epoch": 61.525885558583106,
+ "grad_norm": 3.1225693225860596,
+ "learning_rate": 6.8096234894133554e-06,
+ "loss": 0.0552,
+ "step": 22580
+ },
+ {
+ "epoch": 61.52861035422343,
+ "grad_norm": 7.820192337036133,
+ "learning_rate": 6.808787124570086e-06,
+ "loss": 0.1403,
+ "step": 22581
+ },
+ {
+ "epoch": 61.53133514986376,
+ "grad_norm": 3.2657599449157715,
+ "learning_rate": 6.8079507845798754e-06,
+ "loss": 0.1341,
+ "step": 22582
+ },
+ {
+ "epoch": 61.53405994550409,
+ "grad_norm": 8.19572639465332,
+ "learning_rate": 6.807114469449242e-06,
+ "loss": 0.1402,
+ "step": 22583
+ },
+ {
+ "epoch": 61.536784741144416,
+ "grad_norm": 5.6479291915893555,
+ "learning_rate": 6.806278179184701e-06,
+ "loss": 0.0685,
+ "step": 22584
+ },
+ {
+ "epoch": 61.53950953678474,
+ "grad_norm": 6.213305473327637,
+ "learning_rate": 6.805441913792761e-06,
+ "loss": 0.0791,
+ "step": 22585
+ },
+ {
+ "epoch": 61.54223433242507,
+ "grad_norm": 3.350292444229126,
+ "learning_rate": 6.804605673279937e-06,
+ "loss": 0.1291,
+ "step": 22586
+ },
+ {
+ "epoch": 61.54495912806539,
+ "grad_norm": 3.873460054397583,
+ "learning_rate": 6.803769457652743e-06,
+ "loss": 0.0658,
+ "step": 22587
+ },
+ {
+ "epoch": 61.54768392370572,
+ "grad_norm": 3.1772074699401855,
+ "learning_rate": 6.802933266917687e-06,
+ "loss": 0.1259,
+ "step": 22588
+ },
+ {
+ "epoch": 61.55040871934605,
+ "grad_norm": 4.587749004364014,
+ "learning_rate": 6.802097101081286e-06,
+ "loss": 0.1125,
+ "step": 22589
+ },
+ {
+ "epoch": 61.55313351498638,
+ "grad_norm": 4.840493202209473,
+ "learning_rate": 6.801260960150049e-06,
+ "loss": 0.0879,
+ "step": 22590
+ },
+ {
+ "epoch": 61.555858310626704,
+ "grad_norm": 3.0096285343170166,
+ "learning_rate": 6.80042484413049e-06,
+ "loss": 0.119,
+ "step": 22591
+ },
+ {
+ "epoch": 61.55858310626703,
+ "grad_norm": 3.6800713539123535,
+ "learning_rate": 6.799588753029116e-06,
+ "loss": 0.0525,
+ "step": 22592
+ },
+ {
+ "epoch": 61.561307901907355,
+ "grad_norm": 4.493557453155518,
+ "learning_rate": 6.798752686852445e-06,
+ "loss": 0.1426,
+ "step": 22593
+ },
+ {
+ "epoch": 61.56403269754768,
+ "grad_norm": 3.826521158218384,
+ "learning_rate": 6.797916645606984e-06,
+ "loss": 0.1073,
+ "step": 22594
+ },
+ {
+ "epoch": 61.566757493188014,
+ "grad_norm": 4.606961250305176,
+ "learning_rate": 6.797080629299246e-06,
+ "loss": 0.0999,
+ "step": 22595
+ },
+ {
+ "epoch": 61.56948228882834,
+ "grad_norm": 3.625265598297119,
+ "learning_rate": 6.796244637935738e-06,
+ "loss": 0.1786,
+ "step": 22596
+ },
+ {
+ "epoch": 61.572207084468666,
+ "grad_norm": 3.434013605117798,
+ "learning_rate": 6.7954086715229785e-06,
+ "loss": 0.1318,
+ "step": 22597
+ },
+ {
+ "epoch": 61.57493188010899,
+ "grad_norm": 4.323663234710693,
+ "learning_rate": 6.794572730067468e-06,
+ "loss": 0.0674,
+ "step": 22598
+ },
+ {
+ "epoch": 61.57765667574932,
+ "grad_norm": 4.009775638580322,
+ "learning_rate": 6.793736813575726e-06,
+ "loss": 0.1404,
+ "step": 22599
+ },
+ {
+ "epoch": 61.58038147138964,
+ "grad_norm": 3.958038568496704,
+ "learning_rate": 6.792900922054253e-06,
+ "loss": 0.0547,
+ "step": 22600
+ },
+ {
+ "epoch": 61.583106267029976,
+ "grad_norm": 5.43556022644043,
+ "learning_rate": 6.792065055509567e-06,
+ "loss": 0.104,
+ "step": 22601
+ },
+ {
+ "epoch": 61.5858310626703,
+ "grad_norm": 3.598926067352295,
+ "learning_rate": 6.791229213948178e-06,
+ "loss": 0.0685,
+ "step": 22602
+ },
+ {
+ "epoch": 61.58855585831063,
+ "grad_norm": 3.2011067867279053,
+ "learning_rate": 6.79039339737659e-06,
+ "loss": 0.066,
+ "step": 22603
+ },
+ {
+ "epoch": 61.59128065395095,
+ "grad_norm": 4.33527135848999,
+ "learning_rate": 6.7895576058013165e-06,
+ "loss": 0.1314,
+ "step": 22604
+ },
+ {
+ "epoch": 61.59400544959128,
+ "grad_norm": 4.108130931854248,
+ "learning_rate": 6.788721839228863e-06,
+ "loss": 0.0926,
+ "step": 22605
+ },
+ {
+ "epoch": 61.596730245231605,
+ "grad_norm": 3.942216157913208,
+ "learning_rate": 6.787886097665744e-06,
+ "loss": 0.0581,
+ "step": 22606
+ },
+ {
+ "epoch": 61.59945504087194,
+ "grad_norm": 4.376565933227539,
+ "learning_rate": 6.787050381118461e-06,
+ "loss": 0.0901,
+ "step": 22607
+ },
+ {
+ "epoch": 61.60217983651226,
+ "grad_norm": 9.13692569732666,
+ "learning_rate": 6.786214689593527e-06,
+ "loss": 0.1621,
+ "step": 22608
+ },
+ {
+ "epoch": 61.60490463215259,
+ "grad_norm": 3.2546372413635254,
+ "learning_rate": 6.785379023097451e-06,
+ "loss": 0.1854,
+ "step": 22609
+ },
+ {
+ "epoch": 61.607629427792915,
+ "grad_norm": 3.8960635662078857,
+ "learning_rate": 6.784543381636738e-06,
+ "loss": 0.072,
+ "step": 22610
+ },
+ {
+ "epoch": 61.61035422343324,
+ "grad_norm": 3.6300668716430664,
+ "learning_rate": 6.783707765217899e-06,
+ "loss": 0.0814,
+ "step": 22611
+ },
+ {
+ "epoch": 61.61307901907357,
+ "grad_norm": 4.188830852508545,
+ "learning_rate": 6.782872173847439e-06,
+ "loss": 0.1216,
+ "step": 22612
+ },
+ {
+ "epoch": 61.6158038147139,
+ "grad_norm": 4.343804359436035,
+ "learning_rate": 6.78203660753187e-06,
+ "loss": 0.0654,
+ "step": 22613
+ },
+ {
+ "epoch": 61.618528610354225,
+ "grad_norm": 4.386777877807617,
+ "learning_rate": 6.781201066277693e-06,
+ "loss": 0.1287,
+ "step": 22614
+ },
+ {
+ "epoch": 61.62125340599455,
+ "grad_norm": 3.194927215576172,
+ "learning_rate": 6.780365550091421e-06,
+ "loss": 0.1733,
+ "step": 22615
+ },
+ {
+ "epoch": 61.62397820163488,
+ "grad_norm": 2.8710696697235107,
+ "learning_rate": 6.779530058979555e-06,
+ "loss": 0.0936,
+ "step": 22616
+ },
+ {
+ "epoch": 61.6267029972752,
+ "grad_norm": 4.807511806488037,
+ "learning_rate": 6.778694592948605e-06,
+ "loss": 0.0514,
+ "step": 22617
+ },
+ {
+ "epoch": 61.62942779291553,
+ "grad_norm": 3.2285690307617188,
+ "learning_rate": 6.777859152005082e-06,
+ "loss": 0.1046,
+ "step": 22618
+ },
+ {
+ "epoch": 61.63215258855586,
+ "grad_norm": 6.532040119171143,
+ "learning_rate": 6.777023736155486e-06,
+ "loss": 0.1783,
+ "step": 22619
+ },
+ {
+ "epoch": 61.63487738419619,
+ "grad_norm": 3.0889177322387695,
+ "learning_rate": 6.776188345406327e-06,
+ "loss": 0.0656,
+ "step": 22620
+ },
+ {
+ "epoch": 61.63760217983651,
+ "grad_norm": 4.285674095153809,
+ "learning_rate": 6.775352979764107e-06,
+ "loss": 0.0695,
+ "step": 22621
+ },
+ {
+ "epoch": 61.64032697547684,
+ "grad_norm": 5.0756001472473145,
+ "learning_rate": 6.7745176392353365e-06,
+ "loss": 0.0649,
+ "step": 22622
+ },
+ {
+ "epoch": 61.643051771117165,
+ "grad_norm": 4.603452682495117,
+ "learning_rate": 6.773682323826517e-06,
+ "loss": 0.1991,
+ "step": 22623
+ },
+ {
+ "epoch": 61.64577656675749,
+ "grad_norm": 3.4590930938720703,
+ "learning_rate": 6.772847033544157e-06,
+ "loss": 0.0685,
+ "step": 22624
+ },
+ {
+ "epoch": 61.64850136239782,
+ "grad_norm": 3.503081798553467,
+ "learning_rate": 6.77201176839476e-06,
+ "loss": 0.107,
+ "step": 22625
+ },
+ {
+ "epoch": 61.65122615803815,
+ "grad_norm": 2.494121551513672,
+ "learning_rate": 6.771176528384833e-06,
+ "loss": 0.0417,
+ "step": 22626
+ },
+ {
+ "epoch": 61.653950953678475,
+ "grad_norm": 5.950601100921631,
+ "learning_rate": 6.770341313520877e-06,
+ "loss": 0.1306,
+ "step": 22627
+ },
+ {
+ "epoch": 61.6566757493188,
+ "grad_norm": 2.828500270843506,
+ "learning_rate": 6.7695061238094e-06,
+ "loss": 0.0437,
+ "step": 22628
+ },
+ {
+ "epoch": 61.65940054495913,
+ "grad_norm": 2.743598461151123,
+ "learning_rate": 6.7686709592569046e-06,
+ "loss": 0.0455,
+ "step": 22629
+ },
+ {
+ "epoch": 61.66212534059945,
+ "grad_norm": 2.979541301727295,
+ "learning_rate": 6.767835819869897e-06,
+ "loss": 0.0521,
+ "step": 22630
+ },
+ {
+ "epoch": 61.664850136239785,
+ "grad_norm": 3.4339613914489746,
+ "learning_rate": 6.767000705654878e-06,
+ "loss": 0.2072,
+ "step": 22631
+ },
+ {
+ "epoch": 61.66757493188011,
+ "grad_norm": 4.0011162757873535,
+ "learning_rate": 6.766165616618354e-06,
+ "loss": 0.1283,
+ "step": 22632
+ },
+ {
+ "epoch": 61.67029972752044,
+ "grad_norm": 3.5324370861053467,
+ "learning_rate": 6.76533055276683e-06,
+ "loss": 0.1995,
+ "step": 22633
+ },
+ {
+ "epoch": 61.67302452316076,
+ "grad_norm": 2.553166627883911,
+ "learning_rate": 6.764495514106806e-06,
+ "loss": 0.0326,
+ "step": 22634
+ },
+ {
+ "epoch": 61.67574931880109,
+ "grad_norm": 4.523924350738525,
+ "learning_rate": 6.763660500644783e-06,
+ "loss": 0.0511,
+ "step": 22635
+ },
+ {
+ "epoch": 61.678474114441414,
+ "grad_norm": 4.016600608825684,
+ "learning_rate": 6.762825512387273e-06,
+ "loss": 0.1556,
+ "step": 22636
+ },
+ {
+ "epoch": 61.68119891008175,
+ "grad_norm": 5.064176082611084,
+ "learning_rate": 6.761990549340771e-06,
+ "loss": 0.1284,
+ "step": 22637
+ },
+ {
+ "epoch": 61.68392370572207,
+ "grad_norm": 2.2795469760894775,
+ "learning_rate": 6.761155611511786e-06,
+ "loss": 0.0496,
+ "step": 22638
+ },
+ {
+ "epoch": 61.6866485013624,
+ "grad_norm": 3.7937819957733154,
+ "learning_rate": 6.760320698906815e-06,
+ "loss": 0.1301,
+ "step": 22639
+ },
+ {
+ "epoch": 61.689373297002724,
+ "grad_norm": 4.277508735656738,
+ "learning_rate": 6.7594858115323625e-06,
+ "loss": 0.0692,
+ "step": 22640
+ },
+ {
+ "epoch": 61.69209809264305,
+ "grad_norm": 2.199242353439331,
+ "learning_rate": 6.758650949394929e-06,
+ "loss": 0.0883,
+ "step": 22641
+ },
+ {
+ "epoch": 61.694822888283376,
+ "grad_norm": 4.541222095489502,
+ "learning_rate": 6.757816112501019e-06,
+ "loss": 0.2393,
+ "step": 22642
+ },
+ {
+ "epoch": 61.69754768392371,
+ "grad_norm": 3.7574493885040283,
+ "learning_rate": 6.756981300857131e-06,
+ "loss": 0.0803,
+ "step": 22643
+ },
+ {
+ "epoch": 61.700272479564035,
+ "grad_norm": 3.8200643062591553,
+ "learning_rate": 6.75614651446977e-06,
+ "loss": 0.1866,
+ "step": 22644
+ },
+ {
+ "epoch": 61.70299727520436,
+ "grad_norm": 3.394278049468994,
+ "learning_rate": 6.7553117533454345e-06,
+ "loss": 0.0454,
+ "step": 22645
+ },
+ {
+ "epoch": 61.705722070844686,
+ "grad_norm": 3.9583377838134766,
+ "learning_rate": 6.754477017490628e-06,
+ "loss": 0.1482,
+ "step": 22646
+ },
+ {
+ "epoch": 61.70844686648501,
+ "grad_norm": 3.4778318405151367,
+ "learning_rate": 6.753642306911849e-06,
+ "loss": 0.0746,
+ "step": 22647
+ },
+ {
+ "epoch": 61.71117166212534,
+ "grad_norm": 5.393945693969727,
+ "learning_rate": 6.7528076216156e-06,
+ "loss": 0.0903,
+ "step": 22648
+ },
+ {
+ "epoch": 61.71389645776567,
+ "grad_norm": 3.733022689819336,
+ "learning_rate": 6.751972961608379e-06,
+ "loss": 0.0537,
+ "step": 22649
+ },
+ {
+ "epoch": 61.716621253406,
+ "grad_norm": 4.430414199829102,
+ "learning_rate": 6.75113832689669e-06,
+ "loss": 0.2244,
+ "step": 22650
+ },
+ {
+ "epoch": 61.71934604904632,
+ "grad_norm": 3.1594595909118652,
+ "learning_rate": 6.75030371748703e-06,
+ "loss": 0.1262,
+ "step": 22651
+ },
+ {
+ "epoch": 61.72207084468665,
+ "grad_norm": 4.033882141113281,
+ "learning_rate": 6.7494691333858964e-06,
+ "loss": 0.0899,
+ "step": 22652
+ },
+ {
+ "epoch": 61.724795640326974,
+ "grad_norm": 3.0013859272003174,
+ "learning_rate": 6.748634574599795e-06,
+ "loss": 0.0946,
+ "step": 22653
+ },
+ {
+ "epoch": 61.7275204359673,
+ "grad_norm": 3.480828285217285,
+ "learning_rate": 6.747800041135226e-06,
+ "loss": 0.0471,
+ "step": 22654
+ },
+ {
+ "epoch": 61.73024523160763,
+ "grad_norm": 6.171280860900879,
+ "learning_rate": 6.746965532998684e-06,
+ "loss": 0.0784,
+ "step": 22655
+ },
+ {
+ "epoch": 61.73297002724796,
+ "grad_norm": 3.1149210929870605,
+ "learning_rate": 6.7461310501966695e-06,
+ "loss": 0.0691,
+ "step": 22656
+ },
+ {
+ "epoch": 61.735694822888284,
+ "grad_norm": 5.454401969909668,
+ "learning_rate": 6.745296592735682e-06,
+ "loss": 0.2389,
+ "step": 22657
+ },
+ {
+ "epoch": 61.73841961852861,
+ "grad_norm": 4.131072521209717,
+ "learning_rate": 6.744462160622221e-06,
+ "loss": 0.1386,
+ "step": 22658
+ },
+ {
+ "epoch": 61.741144414168936,
+ "grad_norm": 3.9972660541534424,
+ "learning_rate": 6.7436277538627804e-06,
+ "loss": 0.1325,
+ "step": 22659
+ },
+ {
+ "epoch": 61.74386920980926,
+ "grad_norm": 3.5973973274230957,
+ "learning_rate": 6.742793372463865e-06,
+ "loss": 0.0751,
+ "step": 22660
+ },
+ {
+ "epoch": 61.746594005449595,
+ "grad_norm": 2.9896881580352783,
+ "learning_rate": 6.741959016431969e-06,
+ "loss": 0.0532,
+ "step": 22661
+ },
+ {
+ "epoch": 61.74931880108992,
+ "grad_norm": 9.038811683654785,
+ "learning_rate": 6.741124685773592e-06,
+ "loss": 0.1706,
+ "step": 22662
+ },
+ {
+ "epoch": 61.752043596730246,
+ "grad_norm": 4.241949081420898,
+ "learning_rate": 6.7402903804952304e-06,
+ "loss": 0.158,
+ "step": 22663
+ },
+ {
+ "epoch": 61.75476839237057,
+ "grad_norm": 2.5723586082458496,
+ "learning_rate": 6.739456100603383e-06,
+ "loss": 0.0453,
+ "step": 22664
+ },
+ {
+ "epoch": 61.7574931880109,
+ "grad_norm": 2.763686180114746,
+ "learning_rate": 6.738621846104546e-06,
+ "loss": 0.0517,
+ "step": 22665
+ },
+ {
+ "epoch": 61.76021798365122,
+ "grad_norm": 2.9788365364074707,
+ "learning_rate": 6.737787617005218e-06,
+ "loss": 0.0671,
+ "step": 22666
+ },
+ {
+ "epoch": 61.762942779291556,
+ "grad_norm": 4.045244216918945,
+ "learning_rate": 6.736953413311893e-06,
+ "loss": 0.2312,
+ "step": 22667
+ },
+ {
+ "epoch": 61.76566757493188,
+ "grad_norm": 3.8430511951446533,
+ "learning_rate": 6.736119235031074e-06,
+ "loss": 0.0478,
+ "step": 22668
+ },
+ {
+ "epoch": 61.76839237057221,
+ "grad_norm": 3.877647638320923,
+ "learning_rate": 6.735285082169246e-06,
+ "loss": 0.0659,
+ "step": 22669
+ },
+ {
+ "epoch": 61.771117166212534,
+ "grad_norm": 3.7261879444122314,
+ "learning_rate": 6.734450954732916e-06,
+ "loss": 0.1214,
+ "step": 22670
+ },
+ {
+ "epoch": 61.77384196185286,
+ "grad_norm": 3.3089585304260254,
+ "learning_rate": 6.7336168527285796e-06,
+ "loss": 0.117,
+ "step": 22671
+ },
+ {
+ "epoch": 61.776566757493185,
+ "grad_norm": 5.874284744262695,
+ "learning_rate": 6.732782776162727e-06,
+ "loss": 0.1129,
+ "step": 22672
+ },
+ {
+ "epoch": 61.77929155313352,
+ "grad_norm": 3.244377613067627,
+ "learning_rate": 6.731948725041858e-06,
+ "loss": 0.0564,
+ "step": 22673
+ },
+ {
+ "epoch": 61.782016348773844,
+ "grad_norm": 3.3005571365356445,
+ "learning_rate": 6.73111469937247e-06,
+ "loss": 0.0891,
+ "step": 22674
+ },
+ {
+ "epoch": 61.78474114441417,
+ "grad_norm": 4.592073917388916,
+ "learning_rate": 6.730280699161052e-06,
+ "loss": 0.0561,
+ "step": 22675
+ },
+ {
+ "epoch": 61.787465940054496,
+ "grad_norm": 3.6790101528167725,
+ "learning_rate": 6.729446724414103e-06,
+ "loss": 0.057,
+ "step": 22676
+ },
+ {
+ "epoch": 61.79019073569482,
+ "grad_norm": 4.135296821594238,
+ "learning_rate": 6.7286127751381194e-06,
+ "loss": 0.1755,
+ "step": 22677
+ },
+ {
+ "epoch": 61.79291553133515,
+ "grad_norm": 4.67214298248291,
+ "learning_rate": 6.727778851339592e-06,
+ "loss": 0.0864,
+ "step": 22678
+ },
+ {
+ "epoch": 61.79564032697548,
+ "grad_norm": 3.8387014865875244,
+ "learning_rate": 6.726944953025019e-06,
+ "loss": 0.1451,
+ "step": 22679
+ },
+ {
+ "epoch": 61.798365122615806,
+ "grad_norm": 3.663045883178711,
+ "learning_rate": 6.7261110802008944e-06,
+ "loss": 0.0599,
+ "step": 22680
+ },
+ {
+ "epoch": 61.80108991825613,
+ "grad_norm": 3.5640475749969482,
+ "learning_rate": 6.72527723287371e-06,
+ "loss": 0.1829,
+ "step": 22681
+ },
+ {
+ "epoch": 61.80381471389646,
+ "grad_norm": 6.209664821624756,
+ "learning_rate": 6.724443411049961e-06,
+ "loss": 0.2145,
+ "step": 22682
+ },
+ {
+ "epoch": 61.80653950953678,
+ "grad_norm": 4.0792717933654785,
+ "learning_rate": 6.723609614736142e-06,
+ "loss": 0.0376,
+ "step": 22683
+ },
+ {
+ "epoch": 61.80926430517711,
+ "grad_norm": 3.1523070335388184,
+ "learning_rate": 6.722775843938745e-06,
+ "loss": 0.0529,
+ "step": 22684
+ },
+ {
+ "epoch": 61.81198910081744,
+ "grad_norm": 4.342679500579834,
+ "learning_rate": 6.721942098664264e-06,
+ "loss": 0.1316,
+ "step": 22685
+ },
+ {
+ "epoch": 61.81471389645777,
+ "grad_norm": 4.211147308349609,
+ "learning_rate": 6.72110837891919e-06,
+ "loss": 0.0855,
+ "step": 22686
+ },
+ {
+ "epoch": 61.817438692098094,
+ "grad_norm": 5.1515631675720215,
+ "learning_rate": 6.720274684710023e-06,
+ "loss": 0.1734,
+ "step": 22687
+ },
+ {
+ "epoch": 61.82016348773842,
+ "grad_norm": 2.444735050201416,
+ "learning_rate": 6.719441016043249e-06,
+ "loss": 0.1014,
+ "step": 22688
+ },
+ {
+ "epoch": 61.822888283378745,
+ "grad_norm": 3.6656153202056885,
+ "learning_rate": 6.718607372925365e-06,
+ "loss": 0.2574,
+ "step": 22689
+ },
+ {
+ "epoch": 61.82561307901907,
+ "grad_norm": 4.523416996002197,
+ "learning_rate": 6.717773755362857e-06,
+ "loss": 0.1183,
+ "step": 22690
+ },
+ {
+ "epoch": 61.828337874659404,
+ "grad_norm": 3.1440584659576416,
+ "learning_rate": 6.716940163362227e-06,
+ "loss": 0.0417,
+ "step": 22691
+ },
+ {
+ "epoch": 61.83106267029973,
+ "grad_norm": 4.38675594329834,
+ "learning_rate": 6.716106596929956e-06,
+ "loss": 0.0693,
+ "step": 22692
+ },
+ {
+ "epoch": 61.833787465940055,
+ "grad_norm": 4.36245584487915,
+ "learning_rate": 6.715273056072545e-06,
+ "loss": 0.0868,
+ "step": 22693
+ },
+ {
+ "epoch": 61.83651226158038,
+ "grad_norm": 3.322178602218628,
+ "learning_rate": 6.71443954079648e-06,
+ "loss": 0.0582,
+ "step": 22694
+ },
+ {
+ "epoch": 61.83923705722071,
+ "grad_norm": 3.655691385269165,
+ "learning_rate": 6.713606051108252e-06,
+ "loss": 0.2231,
+ "step": 22695
+ },
+ {
+ "epoch": 61.84196185286103,
+ "grad_norm": 3.9152729511260986,
+ "learning_rate": 6.712772587014359e-06,
+ "loss": 0.1323,
+ "step": 22696
+ },
+ {
+ "epoch": 61.844686648501366,
+ "grad_norm": 3.867809534072876,
+ "learning_rate": 6.711939148521284e-06,
+ "loss": 0.1256,
+ "step": 22697
+ },
+ {
+ "epoch": 61.84741144414169,
+ "grad_norm": 3.225816249847412,
+ "learning_rate": 6.711105735635524e-06,
+ "loss": 0.1185,
+ "step": 22698
+ },
+ {
+ "epoch": 61.85013623978202,
+ "grad_norm": 3.8987462520599365,
+ "learning_rate": 6.710272348363563e-06,
+ "loss": 0.12,
+ "step": 22699
+ },
+ {
+ "epoch": 61.85286103542234,
+ "grad_norm": 3.257603645324707,
+ "learning_rate": 6.709438986711898e-06,
+ "loss": 0.0507,
+ "step": 22700
+ },
+ {
+ "epoch": 61.85558583106267,
+ "grad_norm": 3.559697151184082,
+ "learning_rate": 6.708605650687014e-06,
+ "loss": 0.0934,
+ "step": 22701
+ },
+ {
+ "epoch": 61.858310626702995,
+ "grad_norm": 2.652071952819824,
+ "learning_rate": 6.707772340295404e-06,
+ "loss": 0.0525,
+ "step": 22702
+ },
+ {
+ "epoch": 61.86103542234333,
+ "grad_norm": 4.298716068267822,
+ "learning_rate": 6.706939055543558e-06,
+ "loss": 0.1298,
+ "step": 22703
+ },
+ {
+ "epoch": 61.86376021798365,
+ "grad_norm": 6.449079513549805,
+ "learning_rate": 6.70610579643796e-06,
+ "loss": 0.0603,
+ "step": 22704
+ },
+ {
+ "epoch": 61.86648501362398,
+ "grad_norm": 3.8100218772888184,
+ "learning_rate": 6.70527256298511e-06,
+ "loss": 0.1174,
+ "step": 22705
+ },
+ {
+ "epoch": 61.869209809264305,
+ "grad_norm": 5.430166244506836,
+ "learning_rate": 6.704439355191487e-06,
+ "loss": 0.1655,
+ "step": 22706
+ },
+ {
+ "epoch": 61.87193460490463,
+ "grad_norm": 4.131312847137451,
+ "learning_rate": 6.703606173063588e-06,
+ "loss": 0.1358,
+ "step": 22707
+ },
+ {
+ "epoch": 61.87465940054496,
+ "grad_norm": 5.626758098602295,
+ "learning_rate": 6.702773016607895e-06,
+ "loss": 0.0786,
+ "step": 22708
+ },
+ {
+ "epoch": 61.87738419618529,
+ "grad_norm": 3.967013359069824,
+ "learning_rate": 6.701939885830904e-06,
+ "loss": 0.1383,
+ "step": 22709
+ },
+ {
+ "epoch": 61.880108991825615,
+ "grad_norm": 3.8643786907196045,
+ "learning_rate": 6.701106780739095e-06,
+ "loss": 0.0678,
+ "step": 22710
+ },
+ {
+ "epoch": 61.88283378746594,
+ "grad_norm": 4.2384843826293945,
+ "learning_rate": 6.700273701338962e-06,
+ "loss": 0.0711,
+ "step": 22711
+ },
+ {
+ "epoch": 61.88555858310627,
+ "grad_norm": 4.261518478393555,
+ "learning_rate": 6.69944064763699e-06,
+ "loss": 0.0486,
+ "step": 22712
+ },
+ {
+ "epoch": 61.88828337874659,
+ "grad_norm": 3.5158252716064453,
+ "learning_rate": 6.69860761963967e-06,
+ "loss": 0.134,
+ "step": 22713
+ },
+ {
+ "epoch": 61.89100817438692,
+ "grad_norm": 3.4491991996765137,
+ "learning_rate": 6.697774617353485e-06,
+ "loss": 0.0877,
+ "step": 22714
+ },
+ {
+ "epoch": 61.89373297002725,
+ "grad_norm": 2.8204474449157715,
+ "learning_rate": 6.6969416407849264e-06,
+ "loss": 0.1753,
+ "step": 22715
+ },
+ {
+ "epoch": 61.89645776566758,
+ "grad_norm": 6.21249532699585,
+ "learning_rate": 6.696108689940479e-06,
+ "loss": 0.0854,
+ "step": 22716
+ },
+ {
+ "epoch": 61.8991825613079,
+ "grad_norm": 4.418528079986572,
+ "learning_rate": 6.695275764826633e-06,
+ "loss": 0.0992,
+ "step": 22717
+ },
+ {
+ "epoch": 61.90190735694823,
+ "grad_norm": 3.096376895904541,
+ "learning_rate": 6.694442865449871e-06,
+ "loss": 0.1378,
+ "step": 22718
+ },
+ {
+ "epoch": 61.904632152588555,
+ "grad_norm": 4.136012077331543,
+ "learning_rate": 6.6936099918166805e-06,
+ "loss": 0.2316,
+ "step": 22719
+ },
+ {
+ "epoch": 61.90735694822888,
+ "grad_norm": 3.673497438430786,
+ "learning_rate": 6.692777143933552e-06,
+ "loss": 0.053,
+ "step": 22720
+ },
+ {
+ "epoch": 61.91008174386921,
+ "grad_norm": 3.3672080039978027,
+ "learning_rate": 6.6919443218069645e-06,
+ "loss": 0.102,
+ "step": 22721
+ },
+ {
+ "epoch": 61.91280653950954,
+ "grad_norm": 2.9719884395599365,
+ "learning_rate": 6.69111152544341e-06,
+ "loss": 0.1133,
+ "step": 22722
+ },
+ {
+ "epoch": 61.915531335149865,
+ "grad_norm": 3.9197938442230225,
+ "learning_rate": 6.690278754849374e-06,
+ "loss": 0.0572,
+ "step": 22723
+ },
+ {
+ "epoch": 61.91825613079019,
+ "grad_norm": 3.8324594497680664,
+ "learning_rate": 6.68944601003134e-06,
+ "loss": 0.1418,
+ "step": 22724
+ },
+ {
+ "epoch": 61.920980926430516,
+ "grad_norm": 2.728116989135742,
+ "learning_rate": 6.688613290995794e-06,
+ "loss": 0.0543,
+ "step": 22725
+ },
+ {
+ "epoch": 61.92370572207084,
+ "grad_norm": 3.0618062019348145,
+ "learning_rate": 6.6877805977492205e-06,
+ "loss": 0.0735,
+ "step": 22726
+ },
+ {
+ "epoch": 61.926430517711175,
+ "grad_norm": 4.998763561248779,
+ "learning_rate": 6.686947930298107e-06,
+ "loss": 0.0668,
+ "step": 22727
+ },
+ {
+ "epoch": 61.9291553133515,
+ "grad_norm": 4.105166435241699,
+ "learning_rate": 6.686115288648933e-06,
+ "loss": 0.0877,
+ "step": 22728
+ },
+ {
+ "epoch": 61.93188010899183,
+ "grad_norm": 4.189581394195557,
+ "learning_rate": 6.68528267280819e-06,
+ "loss": 0.089,
+ "step": 22729
+ },
+ {
+ "epoch": 61.93460490463215,
+ "grad_norm": 4.31670618057251,
+ "learning_rate": 6.684450082782357e-06,
+ "loss": 0.1864,
+ "step": 22730
+ },
+ {
+ "epoch": 61.93732970027248,
+ "grad_norm": 3.497159957885742,
+ "learning_rate": 6.6836175185779205e-06,
+ "loss": 0.138,
+ "step": 22731
+ },
+ {
+ "epoch": 61.940054495912804,
+ "grad_norm": 3.2771823406219482,
+ "learning_rate": 6.682784980201363e-06,
+ "loss": 0.0448,
+ "step": 22732
+ },
+ {
+ "epoch": 61.94277929155314,
+ "grad_norm": 4.763228893280029,
+ "learning_rate": 6.681952467659172e-06,
+ "loss": 0.142,
+ "step": 22733
+ },
+ {
+ "epoch": 61.94550408719346,
+ "grad_norm": 13.746893882751465,
+ "learning_rate": 6.681119980957825e-06,
+ "loss": 0.1821,
+ "step": 22734
+ },
+ {
+ "epoch": 61.94822888283379,
+ "grad_norm": 3.962510824203491,
+ "learning_rate": 6.680287520103812e-06,
+ "loss": 0.0684,
+ "step": 22735
+ },
+ {
+ "epoch": 61.950953678474114,
+ "grad_norm": 2.830461263656616,
+ "learning_rate": 6.67945508510361e-06,
+ "loss": 0.0412,
+ "step": 22736
+ },
+ {
+ "epoch": 61.95367847411444,
+ "grad_norm": 3.46307635307312,
+ "learning_rate": 6.678622675963708e-06,
+ "loss": 0.0438,
+ "step": 22737
+ },
+ {
+ "epoch": 61.956403269754766,
+ "grad_norm": 3.4912824630737305,
+ "learning_rate": 6.677790292690578e-06,
+ "loss": 0.1202,
+ "step": 22738
+ },
+ {
+ "epoch": 61.95912806539509,
+ "grad_norm": 3.3099188804626465,
+ "learning_rate": 6.676957935290718e-06,
+ "loss": 0.0973,
+ "step": 22739
+ },
+ {
+ "epoch": 61.961852861035425,
+ "grad_norm": 5.242749214172363,
+ "learning_rate": 6.676125603770599e-06,
+ "loss": 0.1739,
+ "step": 22740
+ },
+ {
+ "epoch": 61.96457765667575,
+ "grad_norm": 3.9065499305725098,
+ "learning_rate": 6.675293298136709e-06,
+ "loss": 0.0613,
+ "step": 22741
+ },
+ {
+ "epoch": 61.967302452316076,
+ "grad_norm": 3.916933298110962,
+ "learning_rate": 6.674461018395527e-06,
+ "loss": 0.0955,
+ "step": 22742
+ },
+ {
+ "epoch": 61.9700272479564,
+ "grad_norm": 4.395709037780762,
+ "learning_rate": 6.6736287645535365e-06,
+ "loss": 0.1493,
+ "step": 22743
+ },
+ {
+ "epoch": 61.97275204359673,
+ "grad_norm": 4.850771427154541,
+ "learning_rate": 6.672796536617218e-06,
+ "loss": 0.1787,
+ "step": 22744
+ },
+ {
+ "epoch": 61.97547683923706,
+ "grad_norm": 4.9623613357543945,
+ "learning_rate": 6.671964334593053e-06,
+ "loss": 0.0814,
+ "step": 22745
+ },
+ {
+ "epoch": 61.97820163487739,
+ "grad_norm": 3.231295585632324,
+ "learning_rate": 6.671132158487521e-06,
+ "loss": 0.0752,
+ "step": 22746
+ },
+ {
+ "epoch": 61.98092643051771,
+ "grad_norm": 3.3611910343170166,
+ "learning_rate": 6.6703000083071065e-06,
+ "loss": 0.0971,
+ "step": 22747
+ },
+ {
+ "epoch": 61.98365122615804,
+ "grad_norm": 3.1871542930603027,
+ "learning_rate": 6.669467884058287e-06,
+ "loss": 0.1521,
+ "step": 22748
+ },
+ {
+ "epoch": 61.986376021798364,
+ "grad_norm": 3.035025119781494,
+ "learning_rate": 6.668635785747547e-06,
+ "loss": 0.0436,
+ "step": 22749
+ },
+ {
+ "epoch": 61.98910081743869,
+ "grad_norm": 3.5299737453460693,
+ "learning_rate": 6.667803713381362e-06,
+ "loss": 0.1288,
+ "step": 22750
+ },
+ {
+ "epoch": 61.991825613079016,
+ "grad_norm": 4.229928970336914,
+ "learning_rate": 6.666971666966216e-06,
+ "loss": 0.0722,
+ "step": 22751
+ },
+ {
+ "epoch": 61.99455040871935,
+ "grad_norm": 4.067253112792969,
+ "learning_rate": 6.6661396465085845e-06,
+ "loss": 0.087,
+ "step": 22752
+ },
+ {
+ "epoch": 61.997275204359674,
+ "grad_norm": 4.779962062835693,
+ "learning_rate": 6.665307652014954e-06,
+ "loss": 0.1442,
+ "step": 22753
+ },
+ {
+ "epoch": 62.0,
+ "grad_norm": 3.2834765911102295,
+ "learning_rate": 6.664475683491797e-06,
+ "loss": 0.0675,
+ "step": 22754
+ },
+ {
+ "epoch": 62.002724795640326,
+ "grad_norm": 4.060825347900391,
+ "learning_rate": 6.663643740945594e-06,
+ "loss": 0.0841,
+ "step": 22755
+ },
+ {
+ "epoch": 62.00544959128065,
+ "grad_norm": 2.8694839477539062,
+ "learning_rate": 6.66281182438283e-06,
+ "loss": 0.1142,
+ "step": 22756
+ },
+ {
+ "epoch": 62.00817438692098,
+ "grad_norm": 3.719338893890381,
+ "learning_rate": 6.6619799338099785e-06,
+ "loss": 0.1246,
+ "step": 22757
+ },
+ {
+ "epoch": 62.01089918256131,
+ "grad_norm": 2.9884769916534424,
+ "learning_rate": 6.661148069233522e-06,
+ "loss": 0.0321,
+ "step": 22758
+ },
+ {
+ "epoch": 62.013623978201636,
+ "grad_norm": 3.96706485748291,
+ "learning_rate": 6.660316230659935e-06,
+ "loss": 0.1392,
+ "step": 22759
+ },
+ {
+ "epoch": 62.01634877384196,
+ "grad_norm": 3.522141695022583,
+ "learning_rate": 6.6594844180956965e-06,
+ "loss": 0.0771,
+ "step": 22760
+ },
+ {
+ "epoch": 62.01907356948229,
+ "grad_norm": 3.5420284271240234,
+ "learning_rate": 6.658652631547288e-06,
+ "loss": 0.1777,
+ "step": 22761
+ },
+ {
+ "epoch": 62.02179836512261,
+ "grad_norm": 9.910497665405273,
+ "learning_rate": 6.657820871021185e-06,
+ "loss": 0.1206,
+ "step": 22762
+ },
+ {
+ "epoch": 62.02452316076294,
+ "grad_norm": 5.194899559020996,
+ "learning_rate": 6.656989136523866e-06,
+ "loss": 0.1064,
+ "step": 22763
+ },
+ {
+ "epoch": 62.02724795640327,
+ "grad_norm": 3.178278923034668,
+ "learning_rate": 6.656157428061807e-06,
+ "loss": 0.1294,
+ "step": 22764
+ },
+ {
+ "epoch": 62.0299727520436,
+ "grad_norm": 4.71618127822876,
+ "learning_rate": 6.655325745641488e-06,
+ "loss": 0.1202,
+ "step": 22765
+ },
+ {
+ "epoch": 62.032697547683924,
+ "grad_norm": 6.225197792053223,
+ "learning_rate": 6.654494089269381e-06,
+ "loss": 0.2833,
+ "step": 22766
+ },
+ {
+ "epoch": 62.03542234332425,
+ "grad_norm": 3.802011489868164,
+ "learning_rate": 6.6536624589519705e-06,
+ "loss": 0.0608,
+ "step": 22767
+ },
+ {
+ "epoch": 62.038147138964575,
+ "grad_norm": 3.725999116897583,
+ "learning_rate": 6.652830854695726e-06,
+ "loss": 0.0752,
+ "step": 22768
+ },
+ {
+ "epoch": 62.0408719346049,
+ "grad_norm": 3.6398305892944336,
+ "learning_rate": 6.651999276507129e-06,
+ "loss": 0.4103,
+ "step": 22769
+ },
+ {
+ "epoch": 62.043596730245234,
+ "grad_norm": 3.8327982425689697,
+ "learning_rate": 6.651167724392653e-06,
+ "loss": 0.15,
+ "step": 22770
+ },
+ {
+ "epoch": 62.04632152588556,
+ "grad_norm": 3.733111619949341,
+ "learning_rate": 6.650336198358776e-06,
+ "loss": 0.1134,
+ "step": 22771
+ },
+ {
+ "epoch": 62.049046321525886,
+ "grad_norm": 5.347125053405762,
+ "learning_rate": 6.649504698411968e-06,
+ "loss": 0.0584,
+ "step": 22772
+ },
+ {
+ "epoch": 62.05177111716621,
+ "grad_norm": 3.4746041297912598,
+ "learning_rate": 6.648673224558713e-06,
+ "loss": 0.117,
+ "step": 22773
+ },
+ {
+ "epoch": 62.05449591280654,
+ "grad_norm": 3.1897616386413574,
+ "learning_rate": 6.647841776805485e-06,
+ "loss": 0.1207,
+ "step": 22774
+ },
+ {
+ "epoch": 62.05722070844686,
+ "grad_norm": 4.475643157958984,
+ "learning_rate": 6.647010355158754e-06,
+ "loss": 0.1592,
+ "step": 22775
+ },
+ {
+ "epoch": 62.059945504087196,
+ "grad_norm": 3.1270174980163574,
+ "learning_rate": 6.646178959625002e-06,
+ "loss": 0.1147,
+ "step": 22776
+ },
+ {
+ "epoch": 62.06267029972752,
+ "grad_norm": 2.9499459266662598,
+ "learning_rate": 6.6453475902106975e-06,
+ "loss": 0.1028,
+ "step": 22777
+ },
+ {
+ "epoch": 62.06539509536785,
+ "grad_norm": 3.9508938789367676,
+ "learning_rate": 6.644516246922321e-06,
+ "loss": 0.0623,
+ "step": 22778
+ },
+ {
+ "epoch": 62.06811989100817,
+ "grad_norm": 3.2466988563537598,
+ "learning_rate": 6.643684929766341e-06,
+ "loss": 0.0425,
+ "step": 22779
+ },
+ {
+ "epoch": 62.0708446866485,
+ "grad_norm": 2.71771240234375,
+ "learning_rate": 6.642853638749236e-06,
+ "loss": 0.0589,
+ "step": 22780
+ },
+ {
+ "epoch": 62.073569482288825,
+ "grad_norm": 3.7683777809143066,
+ "learning_rate": 6.642022373877479e-06,
+ "loss": 0.0885,
+ "step": 22781
+ },
+ {
+ "epoch": 62.07629427792916,
+ "grad_norm": 4.404494762420654,
+ "learning_rate": 6.641191135157542e-06,
+ "loss": 0.1542,
+ "step": 22782
+ },
+ {
+ "epoch": 62.079019073569484,
+ "grad_norm": 4.745907306671143,
+ "learning_rate": 6.640359922595902e-06,
+ "loss": 0.1162,
+ "step": 22783
+ },
+ {
+ "epoch": 62.08174386920981,
+ "grad_norm": 3.791114568710327,
+ "learning_rate": 6.6395287361990305e-06,
+ "loss": 0.0473,
+ "step": 22784
+ },
+ {
+ "epoch": 62.084468664850135,
+ "grad_norm": 4.590917587280273,
+ "learning_rate": 6.638697575973402e-06,
+ "loss": 0.1544,
+ "step": 22785
+ },
+ {
+ "epoch": 62.08719346049046,
+ "grad_norm": 3.7019877433776855,
+ "learning_rate": 6.637866441925487e-06,
+ "loss": 0.0684,
+ "step": 22786
+ },
+ {
+ "epoch": 62.08991825613079,
+ "grad_norm": 3.172245740890503,
+ "learning_rate": 6.637035334061761e-06,
+ "loss": 0.0663,
+ "step": 22787
+ },
+ {
+ "epoch": 62.09264305177112,
+ "grad_norm": 3.8884174823760986,
+ "learning_rate": 6.636204252388694e-06,
+ "loss": 0.0614,
+ "step": 22788
+ },
+ {
+ "epoch": 62.095367847411445,
+ "grad_norm": 3.3587937355041504,
+ "learning_rate": 6.6353731969127625e-06,
+ "loss": 0.0681,
+ "step": 22789
+ },
+ {
+ "epoch": 62.09809264305177,
+ "grad_norm": 3.02647066116333,
+ "learning_rate": 6.634542167640432e-06,
+ "loss": 0.0498,
+ "step": 22790
+ },
+ {
+ "epoch": 62.1008174386921,
+ "grad_norm": 3.483935594558716,
+ "learning_rate": 6.63371116457818e-06,
+ "loss": 0.1736,
+ "step": 22791
+ },
+ {
+ "epoch": 62.10354223433242,
+ "grad_norm": 3.6119918823242188,
+ "learning_rate": 6.63288018773248e-06,
+ "loss": 0.074,
+ "step": 22792
+ },
+ {
+ "epoch": 62.10626702997275,
+ "grad_norm": 4.372816562652588,
+ "learning_rate": 6.632049237109799e-06,
+ "loss": 0.0492,
+ "step": 22793
+ },
+ {
+ "epoch": 62.10899182561308,
+ "grad_norm": 3.2949540615081787,
+ "learning_rate": 6.6312183127166115e-06,
+ "loss": 0.2069,
+ "step": 22794
+ },
+ {
+ "epoch": 62.11171662125341,
+ "grad_norm": 5.566655158996582,
+ "learning_rate": 6.630387414559386e-06,
+ "loss": 0.0888,
+ "step": 22795
+ },
+ {
+ "epoch": 62.11444141689373,
+ "grad_norm": 3.3440206050872803,
+ "learning_rate": 6.629556542644597e-06,
+ "loss": 0.1294,
+ "step": 22796
+ },
+ {
+ "epoch": 62.11716621253406,
+ "grad_norm": 3.6065633296966553,
+ "learning_rate": 6.628725696978711e-06,
+ "loss": 0.0712,
+ "step": 22797
+ },
+ {
+ "epoch": 62.119891008174385,
+ "grad_norm": 3.9488348960876465,
+ "learning_rate": 6.627894877568202e-06,
+ "loss": 0.1127,
+ "step": 22798
+ },
+ {
+ "epoch": 62.12261580381471,
+ "grad_norm": 4.37799072265625,
+ "learning_rate": 6.6270640844195365e-06,
+ "loss": 0.1417,
+ "step": 22799
+ },
+ {
+ "epoch": 62.12534059945504,
+ "grad_norm": 4.148244857788086,
+ "learning_rate": 6.626233317539191e-06,
+ "loss": 0.162,
+ "step": 22800
+ },
+ {
+ "epoch": 62.12806539509537,
+ "grad_norm": 3.745007276535034,
+ "learning_rate": 6.6254025769336295e-06,
+ "loss": 0.0533,
+ "step": 22801
+ },
+ {
+ "epoch": 62.130790190735695,
+ "grad_norm": 5.023813724517822,
+ "learning_rate": 6.624571862609326e-06,
+ "loss": 0.181,
+ "step": 22802
+ },
+ {
+ "epoch": 62.13351498637602,
+ "grad_norm": 3.1756930351257324,
+ "learning_rate": 6.623741174572746e-06,
+ "loss": 0.0804,
+ "step": 22803
+ },
+ {
+ "epoch": 62.13623978201635,
+ "grad_norm": 3.4608798027038574,
+ "learning_rate": 6.622910512830363e-06,
+ "loss": 0.0426,
+ "step": 22804
+ },
+ {
+ "epoch": 62.13896457765667,
+ "grad_norm": 3.84564208984375,
+ "learning_rate": 6.622079877388643e-06,
+ "loss": 0.0689,
+ "step": 22805
+ },
+ {
+ "epoch": 62.141689373297005,
+ "grad_norm": 3.2299728393554688,
+ "learning_rate": 6.6212492682540555e-06,
+ "loss": 0.1371,
+ "step": 22806
+ },
+ {
+ "epoch": 62.14441416893733,
+ "grad_norm": 3.502675771713257,
+ "learning_rate": 6.620418685433068e-06,
+ "loss": 0.2039,
+ "step": 22807
+ },
+ {
+ "epoch": 62.14713896457766,
+ "grad_norm": 2.6872618198394775,
+ "learning_rate": 6.619588128932155e-06,
+ "loss": 0.2084,
+ "step": 22808
+ },
+ {
+ "epoch": 62.14986376021798,
+ "grad_norm": 3.869669198989868,
+ "learning_rate": 6.618757598757779e-06,
+ "loss": 0.078,
+ "step": 22809
+ },
+ {
+ "epoch": 62.15258855585831,
+ "grad_norm": 4.502622604370117,
+ "learning_rate": 6.617927094916412e-06,
+ "loss": 0.1044,
+ "step": 22810
+ },
+ {
+ "epoch": 62.155313351498634,
+ "grad_norm": 2.8535523414611816,
+ "learning_rate": 6.617096617414518e-06,
+ "loss": 0.0967,
+ "step": 22811
+ },
+ {
+ "epoch": 62.15803814713897,
+ "grad_norm": 3.1820380687713623,
+ "learning_rate": 6.616266166258568e-06,
+ "loss": 0.2063,
+ "step": 22812
+ },
+ {
+ "epoch": 62.16076294277929,
+ "grad_norm": 3.9617884159088135,
+ "learning_rate": 6.615435741455026e-06,
+ "loss": 0.0825,
+ "step": 22813
+ },
+ {
+ "epoch": 62.16348773841962,
+ "grad_norm": 4.588679790496826,
+ "learning_rate": 6.614605343010365e-06,
+ "loss": 0.1096,
+ "step": 22814
+ },
+ {
+ "epoch": 62.166212534059945,
+ "grad_norm": 4.685179233551025,
+ "learning_rate": 6.6137749709310465e-06,
+ "loss": 0.1026,
+ "step": 22815
+ },
+ {
+ "epoch": 62.16893732970027,
+ "grad_norm": 3.87353777885437,
+ "learning_rate": 6.612944625223541e-06,
+ "loss": 0.1091,
+ "step": 22816
+ },
+ {
+ "epoch": 62.171662125340596,
+ "grad_norm": 4.411993980407715,
+ "learning_rate": 6.61211430589431e-06,
+ "loss": 0.0944,
+ "step": 22817
+ },
+ {
+ "epoch": 62.17438692098093,
+ "grad_norm": 3.567234992980957,
+ "learning_rate": 6.611284012949828e-06,
+ "loss": 0.1051,
+ "step": 22818
+ },
+ {
+ "epoch": 62.177111716621255,
+ "grad_norm": 3.051919460296631,
+ "learning_rate": 6.610453746396555e-06,
+ "loss": 0.1047,
+ "step": 22819
+ },
+ {
+ "epoch": 62.17983651226158,
+ "grad_norm": 2.727727174758911,
+ "learning_rate": 6.609623506240961e-06,
+ "loss": 0.1108,
+ "step": 22820
+ },
+ {
+ "epoch": 62.182561307901906,
+ "grad_norm": 4.26987886428833,
+ "learning_rate": 6.608793292489506e-06,
+ "loss": 0.121,
+ "step": 22821
+ },
+ {
+ "epoch": 62.18528610354223,
+ "grad_norm": 3.376009702682495,
+ "learning_rate": 6.607963105148664e-06,
+ "loss": 0.0849,
+ "step": 22822
+ },
+ {
+ "epoch": 62.18801089918256,
+ "grad_norm": 3.40041446685791,
+ "learning_rate": 6.607132944224893e-06,
+ "loss": 0.1266,
+ "step": 22823
+ },
+ {
+ "epoch": 62.19073569482289,
+ "grad_norm": 3.012694835662842,
+ "learning_rate": 6.6063028097246605e-06,
+ "loss": 0.0609,
+ "step": 22824
+ },
+ {
+ "epoch": 62.19346049046322,
+ "grad_norm": 2.8245034217834473,
+ "learning_rate": 6.605472701654434e-06,
+ "loss": 0.0454,
+ "step": 22825
+ },
+ {
+ "epoch": 62.19618528610354,
+ "grad_norm": 3.4797093868255615,
+ "learning_rate": 6.604642620020678e-06,
+ "loss": 0.0927,
+ "step": 22826
+ },
+ {
+ "epoch": 62.19891008174387,
+ "grad_norm": 6.359492778778076,
+ "learning_rate": 6.603812564829855e-06,
+ "loss": 0.0571,
+ "step": 22827
+ },
+ {
+ "epoch": 62.201634877384194,
+ "grad_norm": 3.569110870361328,
+ "learning_rate": 6.602982536088431e-06,
+ "loss": 0.1096,
+ "step": 22828
+ },
+ {
+ "epoch": 62.20435967302452,
+ "grad_norm": 5.001374244689941,
+ "learning_rate": 6.60215253380287e-06,
+ "loss": 0.1512,
+ "step": 22829
+ },
+ {
+ "epoch": 62.20708446866485,
+ "grad_norm": 2.981616973876953,
+ "learning_rate": 6.601322557979636e-06,
+ "loss": 0.1859,
+ "step": 22830
+ },
+ {
+ "epoch": 62.20980926430518,
+ "grad_norm": 3.294882297515869,
+ "learning_rate": 6.600492608625191e-06,
+ "loss": 0.0759,
+ "step": 22831
+ },
+ {
+ "epoch": 62.212534059945504,
+ "grad_norm": 4.741713523864746,
+ "learning_rate": 6.599662685746002e-06,
+ "loss": 0.0959,
+ "step": 22832
+ },
+ {
+ "epoch": 62.21525885558583,
+ "grad_norm": 4.462095260620117,
+ "learning_rate": 6.598832789348529e-06,
+ "loss": 0.1026,
+ "step": 22833
+ },
+ {
+ "epoch": 62.217983651226156,
+ "grad_norm": 4.4329962730407715,
+ "learning_rate": 6.598002919439239e-06,
+ "loss": 0.1621,
+ "step": 22834
+ },
+ {
+ "epoch": 62.22070844686648,
+ "grad_norm": 3.6745359897613525,
+ "learning_rate": 6.59717307602459e-06,
+ "loss": 0.1032,
+ "step": 22835
+ },
+ {
+ "epoch": 62.223433242506815,
+ "grad_norm": 4.1733784675598145,
+ "learning_rate": 6.59634325911105e-06,
+ "loss": 0.1479,
+ "step": 22836
+ },
+ {
+ "epoch": 62.22615803814714,
+ "grad_norm": 2.0391476154327393,
+ "learning_rate": 6.595513468705077e-06,
+ "loss": 0.0373,
+ "step": 22837
+ },
+ {
+ "epoch": 62.228882833787466,
+ "grad_norm": 14.953900337219238,
+ "learning_rate": 6.594683704813137e-06,
+ "loss": 0.2215,
+ "step": 22838
+ },
+ {
+ "epoch": 62.23160762942779,
+ "grad_norm": 3.2969255447387695,
+ "learning_rate": 6.5938539674416905e-06,
+ "loss": 0.1065,
+ "step": 22839
+ },
+ {
+ "epoch": 62.23433242506812,
+ "grad_norm": 3.650846242904663,
+ "learning_rate": 6.5930242565972e-06,
+ "loss": 0.0568,
+ "step": 22840
+ },
+ {
+ "epoch": 62.237057220708444,
+ "grad_norm": 3.5891788005828857,
+ "learning_rate": 6.592194572286124e-06,
+ "loss": 0.0856,
+ "step": 22841
+ },
+ {
+ "epoch": 62.23978201634878,
+ "grad_norm": 3.088629961013794,
+ "learning_rate": 6.591364914514927e-06,
+ "loss": 0.0868,
+ "step": 22842
+ },
+ {
+ "epoch": 62.2425068119891,
+ "grad_norm": 3.256484031677246,
+ "learning_rate": 6.590535283290074e-06,
+ "loss": 0.1134,
+ "step": 22843
+ },
+ {
+ "epoch": 62.24523160762943,
+ "grad_norm": 3.364840030670166,
+ "learning_rate": 6.58970567861802e-06,
+ "loss": 0.0648,
+ "step": 22844
+ },
+ {
+ "epoch": 62.247956403269754,
+ "grad_norm": 3.455981731414795,
+ "learning_rate": 6.5888761005052304e-06,
+ "loss": 0.1585,
+ "step": 22845
+ },
+ {
+ "epoch": 62.25068119891008,
+ "grad_norm": 3.8239667415618896,
+ "learning_rate": 6.588046548958162e-06,
+ "loss": 0.1382,
+ "step": 22846
+ },
+ {
+ "epoch": 62.253405994550405,
+ "grad_norm": 4.428664207458496,
+ "learning_rate": 6.587217023983278e-06,
+ "loss": 0.1051,
+ "step": 22847
+ },
+ {
+ "epoch": 62.25613079019074,
+ "grad_norm": 3.8833417892456055,
+ "learning_rate": 6.586387525587039e-06,
+ "loss": 0.0665,
+ "step": 22848
+ },
+ {
+ "epoch": 62.258855585831064,
+ "grad_norm": 4.516501426696777,
+ "learning_rate": 6.585558053775902e-06,
+ "loss": 0.1367,
+ "step": 22849
+ },
+ {
+ "epoch": 62.26158038147139,
+ "grad_norm": 3.3930704593658447,
+ "learning_rate": 6.584728608556332e-06,
+ "loss": 0.3072,
+ "step": 22850
+ },
+ {
+ "epoch": 62.264305177111716,
+ "grad_norm": 3.414585828781128,
+ "learning_rate": 6.583899189934784e-06,
+ "loss": 0.1806,
+ "step": 22851
+ },
+ {
+ "epoch": 62.26702997275204,
+ "grad_norm": 3.077812433242798,
+ "learning_rate": 6.58306979791772e-06,
+ "loss": 0.1024,
+ "step": 22852
+ },
+ {
+ "epoch": 62.26975476839237,
+ "grad_norm": 3.2056987285614014,
+ "learning_rate": 6.5822404325115964e-06,
+ "loss": 0.1084,
+ "step": 22853
+ },
+ {
+ "epoch": 62.2724795640327,
+ "grad_norm": 3.5665276050567627,
+ "learning_rate": 6.581411093722876e-06,
+ "loss": 0.106,
+ "step": 22854
+ },
+ {
+ "epoch": 62.275204359673026,
+ "grad_norm": 4.732414245605469,
+ "learning_rate": 6.580581781558015e-06,
+ "loss": 0.0642,
+ "step": 22855
+ },
+ {
+ "epoch": 62.27792915531335,
+ "grad_norm": 2.251091957092285,
+ "learning_rate": 6.579752496023475e-06,
+ "loss": 0.0789,
+ "step": 22856
+ },
+ {
+ "epoch": 62.28065395095368,
+ "grad_norm": 3.588737964630127,
+ "learning_rate": 6.578923237125709e-06,
+ "loss": 0.0486,
+ "step": 22857
+ },
+ {
+ "epoch": 62.283378746594,
+ "grad_norm": 3.733673334121704,
+ "learning_rate": 6.578094004871178e-06,
+ "loss": 0.0958,
+ "step": 22858
+ },
+ {
+ "epoch": 62.28610354223433,
+ "grad_norm": 3.861920118331909,
+ "learning_rate": 6.577264799266345e-06,
+ "loss": 0.0709,
+ "step": 22859
+ },
+ {
+ "epoch": 62.28882833787466,
+ "grad_norm": 3.939540386199951,
+ "learning_rate": 6.5764356203176605e-06,
+ "loss": 0.1253,
+ "step": 22860
+ },
+ {
+ "epoch": 62.29155313351499,
+ "grad_norm": 8.028321266174316,
+ "learning_rate": 6.575606468031589e-06,
+ "loss": 0.0796,
+ "step": 22861
+ },
+ {
+ "epoch": 62.294277929155314,
+ "grad_norm": 2.7306878566741943,
+ "learning_rate": 6.57477734241458e-06,
+ "loss": 0.0484,
+ "step": 22862
+ },
+ {
+ "epoch": 62.29700272479564,
+ "grad_norm": 3.1638236045837402,
+ "learning_rate": 6.573948243473098e-06,
+ "loss": 0.0798,
+ "step": 22863
+ },
+ {
+ "epoch": 62.299727520435965,
+ "grad_norm": 2.6454055309295654,
+ "learning_rate": 6.5731191712135954e-06,
+ "loss": 0.0588,
+ "step": 22864
+ },
+ {
+ "epoch": 62.30245231607629,
+ "grad_norm": 3.520888090133667,
+ "learning_rate": 6.572290125642531e-06,
+ "loss": 0.1743,
+ "step": 22865
+ },
+ {
+ "epoch": 62.305177111716624,
+ "grad_norm": 3.0653371810913086,
+ "learning_rate": 6.571461106766359e-06,
+ "loss": 0.0354,
+ "step": 22866
+ },
+ {
+ "epoch": 62.30790190735695,
+ "grad_norm": 3.277329683303833,
+ "learning_rate": 6.570632114591541e-06,
+ "loss": 0.0808,
+ "step": 22867
+ },
+ {
+ "epoch": 62.310626702997276,
+ "grad_norm": 3.780304193496704,
+ "learning_rate": 6.569803149124526e-06,
+ "loss": 0.1052,
+ "step": 22868
+ },
+ {
+ "epoch": 62.3133514986376,
+ "grad_norm": 5.893295764923096,
+ "learning_rate": 6.568974210371775e-06,
+ "loss": 0.0695,
+ "step": 22869
+ },
+ {
+ "epoch": 62.31607629427793,
+ "grad_norm": 3.770939826965332,
+ "learning_rate": 6.568145298339743e-06,
+ "loss": 0.2501,
+ "step": 22870
+ },
+ {
+ "epoch": 62.31880108991825,
+ "grad_norm": 5.348854064941406,
+ "learning_rate": 6.567316413034884e-06,
+ "loss": 0.1459,
+ "step": 22871
+ },
+ {
+ "epoch": 62.321525885558586,
+ "grad_norm": 4.396578311920166,
+ "learning_rate": 6.566487554463657e-06,
+ "loss": 0.0785,
+ "step": 22872
+ },
+ {
+ "epoch": 62.32425068119891,
+ "grad_norm": 3.6802093982696533,
+ "learning_rate": 6.5656587226325105e-06,
+ "loss": 0.0627,
+ "step": 22873
+ },
+ {
+ "epoch": 62.32697547683924,
+ "grad_norm": 6.617048740386963,
+ "learning_rate": 6.564829917547907e-06,
+ "loss": 0.0515,
+ "step": 22874
+ },
+ {
+ "epoch": 62.32970027247956,
+ "grad_norm": 2.9462718963623047,
+ "learning_rate": 6.564001139216294e-06,
+ "loss": 0.0632,
+ "step": 22875
+ },
+ {
+ "epoch": 62.33242506811989,
+ "grad_norm": 2.8858888149261475,
+ "learning_rate": 6.563172387644129e-06,
+ "loss": 0.0726,
+ "step": 22876
+ },
+ {
+ "epoch": 62.335149863760215,
+ "grad_norm": 4.954010963439941,
+ "learning_rate": 6.56234366283787e-06,
+ "loss": 0.1487,
+ "step": 22877
+ },
+ {
+ "epoch": 62.33787465940055,
+ "grad_norm": 3.1028778553009033,
+ "learning_rate": 6.561514964803966e-06,
+ "loss": 0.0567,
+ "step": 22878
+ },
+ {
+ "epoch": 62.34059945504087,
+ "grad_norm": 3.4563522338867188,
+ "learning_rate": 6.560686293548875e-06,
+ "loss": 0.0522,
+ "step": 22879
+ },
+ {
+ "epoch": 62.3433242506812,
+ "grad_norm": 4.651001930236816,
+ "learning_rate": 6.5598576490790465e-06,
+ "loss": 0.0906,
+ "step": 22880
+ },
+ {
+ "epoch": 62.346049046321525,
+ "grad_norm": 3.897664785385132,
+ "learning_rate": 6.559029031400937e-06,
+ "loss": 0.1486,
+ "step": 22881
+ },
+ {
+ "epoch": 62.34877384196185,
+ "grad_norm": 4.379997253417969,
+ "learning_rate": 6.558200440520999e-06,
+ "loss": 0.0798,
+ "step": 22882
+ },
+ {
+ "epoch": 62.35149863760218,
+ "grad_norm": 3.9950928688049316,
+ "learning_rate": 6.557371876445684e-06,
+ "loss": 0.0663,
+ "step": 22883
+ },
+ {
+ "epoch": 62.35422343324251,
+ "grad_norm": 4.069232940673828,
+ "learning_rate": 6.556543339181447e-06,
+ "loss": 0.1113,
+ "step": 22884
+ },
+ {
+ "epoch": 62.356948228882835,
+ "grad_norm": 3.1827847957611084,
+ "learning_rate": 6.555714828734739e-06,
+ "loss": 0.158,
+ "step": 22885
+ },
+ {
+ "epoch": 62.35967302452316,
+ "grad_norm": 5.421937942504883,
+ "learning_rate": 6.554886345112013e-06,
+ "loss": 0.1692,
+ "step": 22886
+ },
+ {
+ "epoch": 62.36239782016349,
+ "grad_norm": 7.863237380981445,
+ "learning_rate": 6.554057888319723e-06,
+ "loss": 0.0802,
+ "step": 22887
+ },
+ {
+ "epoch": 62.36512261580381,
+ "grad_norm": 3.065836191177368,
+ "learning_rate": 6.553229458364317e-06,
+ "loss": 0.062,
+ "step": 22888
+ },
+ {
+ "epoch": 62.36784741144414,
+ "grad_norm": 2.846912384033203,
+ "learning_rate": 6.552401055252251e-06,
+ "loss": 0.1029,
+ "step": 22889
+ },
+ {
+ "epoch": 62.37057220708447,
+ "grad_norm": 3.9938836097717285,
+ "learning_rate": 6.551572678989973e-06,
+ "loss": 0.0571,
+ "step": 22890
+ },
+ {
+ "epoch": 62.3732970027248,
+ "grad_norm": 3.762964963912964,
+ "learning_rate": 6.550744329583934e-06,
+ "loss": 0.1132,
+ "step": 22891
+ },
+ {
+ "epoch": 62.37602179836512,
+ "grad_norm": 2.934399127960205,
+ "learning_rate": 6.5499160070405906e-06,
+ "loss": 0.1613,
+ "step": 22892
+ },
+ {
+ "epoch": 62.37874659400545,
+ "grad_norm": 5.411092281341553,
+ "learning_rate": 6.549087711366386e-06,
+ "loss": 0.2198,
+ "step": 22893
+ },
+ {
+ "epoch": 62.381471389645775,
+ "grad_norm": 3.6235530376434326,
+ "learning_rate": 6.548259442567778e-06,
+ "loss": 0.2015,
+ "step": 22894
+ },
+ {
+ "epoch": 62.3841961852861,
+ "grad_norm": 3.070939302444458,
+ "learning_rate": 6.547431200651217e-06,
+ "loss": 0.0508,
+ "step": 22895
+ },
+ {
+ "epoch": 62.38692098092643,
+ "grad_norm": 3.4948794841766357,
+ "learning_rate": 6.546602985623147e-06,
+ "loss": 0.067,
+ "step": 22896
+ },
+ {
+ "epoch": 62.38964577656676,
+ "grad_norm": 3.767698287963867,
+ "learning_rate": 6.545774797490025e-06,
+ "loss": 0.084,
+ "step": 22897
+ },
+ {
+ "epoch": 62.392370572207085,
+ "grad_norm": 2.9165124893188477,
+ "learning_rate": 6.544946636258295e-06,
+ "loss": 0.076,
+ "step": 22898
+ },
+ {
+ "epoch": 62.39509536784741,
+ "grad_norm": 4.044775485992432,
+ "learning_rate": 6.544118501934411e-06,
+ "loss": 0.067,
+ "step": 22899
+ },
+ {
+ "epoch": 62.39782016348774,
+ "grad_norm": 4.254181385040283,
+ "learning_rate": 6.543290394524819e-06,
+ "loss": 0.1345,
+ "step": 22900
+ },
+ {
+ "epoch": 62.40054495912806,
+ "grad_norm": 4.1424174308776855,
+ "learning_rate": 6.542462314035973e-06,
+ "loss": 0.0813,
+ "step": 22901
+ },
+ {
+ "epoch": 62.403269754768395,
+ "grad_norm": 3.561481237411499,
+ "learning_rate": 6.541634260474317e-06,
+ "loss": 0.161,
+ "step": 22902
+ },
+ {
+ "epoch": 62.40599455040872,
+ "grad_norm": 4.19312047958374,
+ "learning_rate": 6.540806233846304e-06,
+ "loss": 0.1083,
+ "step": 22903
+ },
+ {
+ "epoch": 62.40871934604905,
+ "grad_norm": 3.018279552459717,
+ "learning_rate": 6.539978234158379e-06,
+ "loss": 0.1363,
+ "step": 22904
+ },
+ {
+ "epoch": 62.41144414168937,
+ "grad_norm": 3.0838325023651123,
+ "learning_rate": 6.539150261416993e-06,
+ "loss": 0.148,
+ "step": 22905
+ },
+ {
+ "epoch": 62.4141689373297,
+ "grad_norm": 4.2507195472717285,
+ "learning_rate": 6.538322315628593e-06,
+ "loss": 0.1253,
+ "step": 22906
+ },
+ {
+ "epoch": 62.416893732970024,
+ "grad_norm": 3.0164480209350586,
+ "learning_rate": 6.537494396799629e-06,
+ "loss": 0.1134,
+ "step": 22907
+ },
+ {
+ "epoch": 62.41961852861036,
+ "grad_norm": 3.5077004432678223,
+ "learning_rate": 6.536666504936544e-06,
+ "loss": 0.068,
+ "step": 22908
+ },
+ {
+ "epoch": 62.42234332425068,
+ "grad_norm": 3.6945509910583496,
+ "learning_rate": 6.53583864004579e-06,
+ "loss": 0.1392,
+ "step": 22909
+ },
+ {
+ "epoch": 62.42506811989101,
+ "grad_norm": 3.732836961746216,
+ "learning_rate": 6.53501080213381e-06,
+ "loss": 0.1401,
+ "step": 22910
+ },
+ {
+ "epoch": 62.427792915531334,
+ "grad_norm": 4.5331525802612305,
+ "learning_rate": 6.534182991207059e-06,
+ "loss": 0.0895,
+ "step": 22911
+ },
+ {
+ "epoch": 62.43051771117166,
+ "grad_norm": 2.5722134113311768,
+ "learning_rate": 6.533355207271976e-06,
+ "loss": 0.0633,
+ "step": 22912
+ },
+ {
+ "epoch": 62.433242506811986,
+ "grad_norm": 4.173740863800049,
+ "learning_rate": 6.532527450335016e-06,
+ "loss": 0.1205,
+ "step": 22913
+ },
+ {
+ "epoch": 62.43596730245232,
+ "grad_norm": 4.303950786590576,
+ "learning_rate": 6.531699720402616e-06,
+ "loss": 0.0599,
+ "step": 22914
+ },
+ {
+ "epoch": 62.438692098092645,
+ "grad_norm": 4.381292343139648,
+ "learning_rate": 6.530872017481232e-06,
+ "loss": 0.1366,
+ "step": 22915
+ },
+ {
+ "epoch": 62.44141689373297,
+ "grad_norm": 4.8696699142456055,
+ "learning_rate": 6.5300443415772995e-06,
+ "loss": 0.0825,
+ "step": 22916
+ },
+ {
+ "epoch": 62.444141689373296,
+ "grad_norm": 4.519044399261475,
+ "learning_rate": 6.529216692697273e-06,
+ "loss": 0.0635,
+ "step": 22917
+ },
+ {
+ "epoch": 62.44686648501362,
+ "grad_norm": 3.354917287826538,
+ "learning_rate": 6.528389070847594e-06,
+ "loss": 0.1498,
+ "step": 22918
+ },
+ {
+ "epoch": 62.44959128065395,
+ "grad_norm": 2.6892342567443848,
+ "learning_rate": 6.527561476034712e-06,
+ "loss": 0.0421,
+ "step": 22919
+ },
+ {
+ "epoch": 62.45231607629428,
+ "grad_norm": 11.079471588134766,
+ "learning_rate": 6.526733908265066e-06,
+ "loss": 0.1292,
+ "step": 22920
+ },
+ {
+ "epoch": 62.45504087193461,
+ "grad_norm": 3.2886509895324707,
+ "learning_rate": 6.525906367545108e-06,
+ "loss": 0.1325,
+ "step": 22921
+ },
+ {
+ "epoch": 62.45776566757493,
+ "grad_norm": 5.297695159912109,
+ "learning_rate": 6.525078853881275e-06,
+ "loss": 0.0459,
+ "step": 22922
+ },
+ {
+ "epoch": 62.46049046321526,
+ "grad_norm": 5.968097686767578,
+ "learning_rate": 6.524251367280019e-06,
+ "loss": 0.0914,
+ "step": 22923
+ },
+ {
+ "epoch": 62.463215258855584,
+ "grad_norm": 3.63021183013916,
+ "learning_rate": 6.5234239077477815e-06,
+ "loss": 0.1216,
+ "step": 22924
+ },
+ {
+ "epoch": 62.46594005449591,
+ "grad_norm": 7.625444412231445,
+ "learning_rate": 6.522596475291005e-06,
+ "loss": 0.2645,
+ "step": 22925
+ },
+ {
+ "epoch": 62.46866485013624,
+ "grad_norm": 2.5148627758026123,
+ "learning_rate": 6.521769069916136e-06,
+ "loss": 0.0398,
+ "step": 22926
+ },
+ {
+ "epoch": 62.47138964577657,
+ "grad_norm": 3.4624040126800537,
+ "learning_rate": 6.520941691629615e-06,
+ "loss": 0.0617,
+ "step": 22927
+ },
+ {
+ "epoch": 62.474114441416894,
+ "grad_norm": 4.036266803741455,
+ "learning_rate": 6.520114340437892e-06,
+ "loss": 0.1025,
+ "step": 22928
+ },
+ {
+ "epoch": 62.47683923705722,
+ "grad_norm": 4.457673072814941,
+ "learning_rate": 6.5192870163474045e-06,
+ "loss": 0.1141,
+ "step": 22929
+ },
+ {
+ "epoch": 62.479564032697546,
+ "grad_norm": 3.806377649307251,
+ "learning_rate": 6.518459719364601e-06,
+ "loss": 0.2224,
+ "step": 22930
+ },
+ {
+ "epoch": 62.48228882833787,
+ "grad_norm": 3.7779488563537598,
+ "learning_rate": 6.517632449495916e-06,
+ "loss": 0.0782,
+ "step": 22931
+ },
+ {
+ "epoch": 62.485013623978205,
+ "grad_norm": 3.29911732673645,
+ "learning_rate": 6.516805206747803e-06,
+ "loss": 0.0529,
+ "step": 22932
+ },
+ {
+ "epoch": 62.48773841961853,
+ "grad_norm": 3.861456871032715,
+ "learning_rate": 6.515977991126694e-06,
+ "loss": 0.1291,
+ "step": 22933
+ },
+ {
+ "epoch": 62.490463215258856,
+ "grad_norm": 2.820650815963745,
+ "learning_rate": 6.515150802639037e-06,
+ "loss": 0.1041,
+ "step": 22934
+ },
+ {
+ "epoch": 62.49318801089918,
+ "grad_norm": 3.721628427505493,
+ "learning_rate": 6.514323641291276e-06,
+ "loss": 0.072,
+ "step": 22935
+ },
+ {
+ "epoch": 62.49591280653951,
+ "grad_norm": 5.200292587280273,
+ "learning_rate": 6.5134965070898496e-06,
+ "loss": 0.165,
+ "step": 22936
+ },
+ {
+ "epoch": 62.49863760217983,
+ "grad_norm": 5.09596061706543,
+ "learning_rate": 6.512669400041201e-06,
+ "loss": 0.1449,
+ "step": 22937
+ },
+ {
+ "epoch": 62.50136239782017,
+ "grad_norm": 4.042686462402344,
+ "learning_rate": 6.5118423201517665e-06,
+ "loss": 0.1748,
+ "step": 22938
+ },
+ {
+ "epoch": 62.50408719346049,
+ "grad_norm": 3.972289562225342,
+ "learning_rate": 6.511015267427997e-06,
+ "loss": 0.0756,
+ "step": 22939
+ },
+ {
+ "epoch": 62.50681198910082,
+ "grad_norm": 3.087763547897339,
+ "learning_rate": 6.510188241876325e-06,
+ "loss": 0.0502,
+ "step": 22940
+ },
+ {
+ "epoch": 62.509536784741144,
+ "grad_norm": 3.365104913711548,
+ "learning_rate": 6.509361243503196e-06,
+ "loss": 0.1303,
+ "step": 22941
+ },
+ {
+ "epoch": 62.51226158038147,
+ "grad_norm": 2.906590700149536,
+ "learning_rate": 6.508534272315048e-06,
+ "loss": 0.1028,
+ "step": 22942
+ },
+ {
+ "epoch": 62.514986376021795,
+ "grad_norm": 3.973233938217163,
+ "learning_rate": 6.507707328318326e-06,
+ "loss": 0.0884,
+ "step": 22943
+ },
+ {
+ "epoch": 62.51771117166213,
+ "grad_norm": 2.7279627323150635,
+ "learning_rate": 6.50688041151946e-06,
+ "loss": 0.0567,
+ "step": 22944
+ },
+ {
+ "epoch": 62.520435967302454,
+ "grad_norm": 3.1076507568359375,
+ "learning_rate": 6.506053521924902e-06,
+ "loss": 0.1277,
+ "step": 22945
+ },
+ {
+ "epoch": 62.52316076294278,
+ "grad_norm": 2.818887710571289,
+ "learning_rate": 6.5052266595410874e-06,
+ "loss": 0.0497,
+ "step": 22946
+ },
+ {
+ "epoch": 62.525885558583106,
+ "grad_norm": 3.5251336097717285,
+ "learning_rate": 6.504399824374453e-06,
+ "loss": 0.1078,
+ "step": 22947
+ },
+ {
+ "epoch": 62.52861035422343,
+ "grad_norm": 4.230286121368408,
+ "learning_rate": 6.503573016431442e-06,
+ "loss": 0.1738,
+ "step": 22948
+ },
+ {
+ "epoch": 62.53133514986376,
+ "grad_norm": 5.084421634674072,
+ "learning_rate": 6.502746235718491e-06,
+ "loss": 0.0744,
+ "step": 22949
+ },
+ {
+ "epoch": 62.53405994550409,
+ "grad_norm": 4.893348693847656,
+ "learning_rate": 6.50191948224204e-06,
+ "loss": 0.2584,
+ "step": 22950
+ },
+ {
+ "epoch": 62.536784741144416,
+ "grad_norm": 2.828664779663086,
+ "learning_rate": 6.501092756008527e-06,
+ "loss": 0.0339,
+ "step": 22951
+ },
+ {
+ "epoch": 62.53950953678474,
+ "grad_norm": 3.1087496280670166,
+ "learning_rate": 6.500266057024392e-06,
+ "loss": 0.0791,
+ "step": 22952
+ },
+ {
+ "epoch": 62.54223433242507,
+ "grad_norm": 4.159045219421387,
+ "learning_rate": 6.499439385296071e-06,
+ "loss": 0.0734,
+ "step": 22953
+ },
+ {
+ "epoch": 62.54495912806539,
+ "grad_norm": 4.612759113311768,
+ "learning_rate": 6.498612740830006e-06,
+ "loss": 0.1996,
+ "step": 22954
+ },
+ {
+ "epoch": 62.54768392370572,
+ "grad_norm": 3.0963053703308105,
+ "learning_rate": 6.497786123632628e-06,
+ "loss": 0.2474,
+ "step": 22955
+ },
+ {
+ "epoch": 62.55040871934605,
+ "grad_norm": 3.6551713943481445,
+ "learning_rate": 6.4969595337103806e-06,
+ "loss": 0.1128,
+ "step": 22956
+ },
+ {
+ "epoch": 62.55313351498638,
+ "grad_norm": 4.4289469718933105,
+ "learning_rate": 6.496132971069702e-06,
+ "loss": 0.099,
+ "step": 22957
+ },
+ {
+ "epoch": 62.555858310626704,
+ "grad_norm": 4.449501991271973,
+ "learning_rate": 6.495306435717024e-06,
+ "loss": 0.1284,
+ "step": 22958
+ },
+ {
+ "epoch": 62.55858310626703,
+ "grad_norm": 3.4457151889801025,
+ "learning_rate": 6.49447992765879e-06,
+ "loss": 0.071,
+ "step": 22959
+ },
+ {
+ "epoch": 62.561307901907355,
+ "grad_norm": 3.6617636680603027,
+ "learning_rate": 6.49365344690143e-06,
+ "loss": 0.1488,
+ "step": 22960
+ },
+ {
+ "epoch": 62.56403269754768,
+ "grad_norm": 4.430767059326172,
+ "learning_rate": 6.492826993451386e-06,
+ "loss": 0.0816,
+ "step": 22961
+ },
+ {
+ "epoch": 62.566757493188014,
+ "grad_norm": 2.1721184253692627,
+ "learning_rate": 6.49200056731509e-06,
+ "loss": 0.049,
+ "step": 22962
+ },
+ {
+ "epoch": 62.56948228882834,
+ "grad_norm": 3.556936740875244,
+ "learning_rate": 6.491174168498981e-06,
+ "loss": 0.0695,
+ "step": 22963
+ },
+ {
+ "epoch": 62.572207084468666,
+ "grad_norm": 2.796623468399048,
+ "learning_rate": 6.490347797009498e-06,
+ "loss": 0.1317,
+ "step": 22964
+ },
+ {
+ "epoch": 62.57493188010899,
+ "grad_norm": 3.142650842666626,
+ "learning_rate": 6.489521452853071e-06,
+ "loss": 0.0619,
+ "step": 22965
+ },
+ {
+ "epoch": 62.57765667574932,
+ "grad_norm": 3.462892532348633,
+ "learning_rate": 6.488695136036141e-06,
+ "loss": 0.1504,
+ "step": 22966
+ },
+ {
+ "epoch": 62.58038147138964,
+ "grad_norm": 3.852605104446411,
+ "learning_rate": 6.487868846565136e-06,
+ "loss": 0.0701,
+ "step": 22967
+ },
+ {
+ "epoch": 62.583106267029976,
+ "grad_norm": 3.334852933883667,
+ "learning_rate": 6.487042584446499e-06,
+ "loss": 0.1001,
+ "step": 22968
+ },
+ {
+ "epoch": 62.5858310626703,
+ "grad_norm": 3.1268060207366943,
+ "learning_rate": 6.486216349686658e-06,
+ "loss": 0.0504,
+ "step": 22969
+ },
+ {
+ "epoch": 62.58855585831063,
+ "grad_norm": 3.4463112354278564,
+ "learning_rate": 6.485390142292054e-06,
+ "loss": 0.1764,
+ "step": 22970
+ },
+ {
+ "epoch": 62.59128065395095,
+ "grad_norm": 3.072113275527954,
+ "learning_rate": 6.484563962269117e-06,
+ "loss": 0.2094,
+ "step": 22971
+ },
+ {
+ "epoch": 62.59400544959128,
+ "grad_norm": 3.998873710632324,
+ "learning_rate": 6.483737809624284e-06,
+ "loss": 0.0854,
+ "step": 22972
+ },
+ {
+ "epoch": 62.596730245231605,
+ "grad_norm": 5.751617431640625,
+ "learning_rate": 6.482911684363985e-06,
+ "loss": 0.0551,
+ "step": 22973
+ },
+ {
+ "epoch": 62.59945504087194,
+ "grad_norm": 4.150777339935303,
+ "learning_rate": 6.48208558649466e-06,
+ "loss": 0.1185,
+ "step": 22974
+ },
+ {
+ "epoch": 62.60217983651226,
+ "grad_norm": 3.205233335494995,
+ "learning_rate": 6.481259516022735e-06,
+ "loss": 0.0503,
+ "step": 22975
+ },
+ {
+ "epoch": 62.60490463215259,
+ "grad_norm": 2.293523073196411,
+ "learning_rate": 6.480433472954653e-06,
+ "loss": 0.0456,
+ "step": 22976
+ },
+ {
+ "epoch": 62.607629427792915,
+ "grad_norm": 5.082372188568115,
+ "learning_rate": 6.479607457296837e-06,
+ "loss": 0.1792,
+ "step": 22977
+ },
+ {
+ "epoch": 62.61035422343324,
+ "grad_norm": 3.6771934032440186,
+ "learning_rate": 6.4787814690557264e-06,
+ "loss": 0.066,
+ "step": 22978
+ },
+ {
+ "epoch": 62.61307901907357,
+ "grad_norm": 5.0433125495910645,
+ "learning_rate": 6.47795550823775e-06,
+ "loss": 0.1291,
+ "step": 22979
+ },
+ {
+ "epoch": 62.6158038147139,
+ "grad_norm": 4.6060638427734375,
+ "learning_rate": 6.4771295748493455e-06,
+ "loss": 0.1177,
+ "step": 22980
+ },
+ {
+ "epoch": 62.618528610354225,
+ "grad_norm": 4.242333889007568,
+ "learning_rate": 6.476303668896941e-06,
+ "loss": 0.165,
+ "step": 22981
+ },
+ {
+ "epoch": 62.62125340599455,
+ "grad_norm": 3.4630861282348633,
+ "learning_rate": 6.475477790386974e-06,
+ "loss": 0.0747,
+ "step": 22982
+ },
+ {
+ "epoch": 62.62397820163488,
+ "grad_norm": 4.103496551513672,
+ "learning_rate": 6.474651939325869e-06,
+ "loss": 0.0476,
+ "step": 22983
+ },
+ {
+ "epoch": 62.6267029972752,
+ "grad_norm": 3.7876334190368652,
+ "learning_rate": 6.473826115720063e-06,
+ "loss": 0.0741,
+ "step": 22984
+ },
+ {
+ "epoch": 62.62942779291553,
+ "grad_norm": 3.482868194580078,
+ "learning_rate": 6.473000319575985e-06,
+ "loss": 0.0423,
+ "step": 22985
+ },
+ {
+ "epoch": 62.63215258855586,
+ "grad_norm": 3.449143648147583,
+ "learning_rate": 6.472174550900068e-06,
+ "loss": 0.1145,
+ "step": 22986
+ },
+ {
+ "epoch": 62.63487738419619,
+ "grad_norm": 3.775345802307129,
+ "learning_rate": 6.471348809698741e-06,
+ "loss": 0.0668,
+ "step": 22987
+ },
+ {
+ "epoch": 62.63760217983651,
+ "grad_norm": 4.094781875610352,
+ "learning_rate": 6.470523095978436e-06,
+ "loss": 0.0812,
+ "step": 22988
+ },
+ {
+ "epoch": 62.64032697547684,
+ "grad_norm": 3.8218133449554443,
+ "learning_rate": 6.469697409745583e-06,
+ "loss": 0.0597,
+ "step": 22989
+ },
+ {
+ "epoch": 62.643051771117165,
+ "grad_norm": 3.766822338104248,
+ "learning_rate": 6.468871751006614e-06,
+ "loss": 0.1651,
+ "step": 22990
+ },
+ {
+ "epoch": 62.64577656675749,
+ "grad_norm": 4.768446445465088,
+ "learning_rate": 6.468046119767956e-06,
+ "loss": 0.0915,
+ "step": 22991
+ },
+ {
+ "epoch": 62.64850136239782,
+ "grad_norm": 4.536155700683594,
+ "learning_rate": 6.4672205160360455e-06,
+ "loss": 0.09,
+ "step": 22992
+ },
+ {
+ "epoch": 62.65122615803815,
+ "grad_norm": 2.9946510791778564,
+ "learning_rate": 6.466394939817305e-06,
+ "loss": 0.0805,
+ "step": 22993
+ },
+ {
+ "epoch": 62.653950953678475,
+ "grad_norm": 5.23456335067749,
+ "learning_rate": 6.465569391118167e-06,
+ "loss": 0.0767,
+ "step": 22994
+ },
+ {
+ "epoch": 62.6566757493188,
+ "grad_norm": 4.049919605255127,
+ "learning_rate": 6.464743869945061e-06,
+ "loss": 0.1955,
+ "step": 22995
+ },
+ {
+ "epoch": 62.65940054495913,
+ "grad_norm": 3.183833599090576,
+ "learning_rate": 6.4639183763044124e-06,
+ "loss": 0.0743,
+ "step": 22996
+ },
+ {
+ "epoch": 62.66212534059945,
+ "grad_norm": 2.2236080169677734,
+ "learning_rate": 6.463092910202656e-06,
+ "loss": 0.0352,
+ "step": 22997
+ },
+ {
+ "epoch": 62.664850136239785,
+ "grad_norm": 4.320413112640381,
+ "learning_rate": 6.462267471646221e-06,
+ "loss": 0.0835,
+ "step": 22998
+ },
+ {
+ "epoch": 62.66757493188011,
+ "grad_norm": 4.502333641052246,
+ "learning_rate": 6.461442060641531e-06,
+ "loss": 0.0905,
+ "step": 22999
+ },
+ {
+ "epoch": 62.67029972752044,
+ "grad_norm": 3.6087913513183594,
+ "learning_rate": 6.460616677195017e-06,
+ "loss": 0.2139,
+ "step": 23000
+ },
+ {
+ "epoch": 62.67302452316076,
+ "grad_norm": 3.9240729808807373,
+ "learning_rate": 6.4597913213131054e-06,
+ "loss": 0.151,
+ "step": 23001
+ },
+ {
+ "epoch": 62.67574931880109,
+ "grad_norm": 3.8604400157928467,
+ "learning_rate": 6.458965993002228e-06,
+ "loss": 0.1207,
+ "step": 23002
+ },
+ {
+ "epoch": 62.678474114441414,
+ "grad_norm": 3.887859344482422,
+ "learning_rate": 6.458140692268806e-06,
+ "loss": 0.1225,
+ "step": 23003
+ },
+ {
+ "epoch": 62.68119891008175,
+ "grad_norm": 3.3446779251098633,
+ "learning_rate": 6.457315419119273e-06,
+ "loss": 0.1642,
+ "step": 23004
+ },
+ {
+ "epoch": 62.68392370572207,
+ "grad_norm": 3.9583802223205566,
+ "learning_rate": 6.45649017356005e-06,
+ "loss": 0.052,
+ "step": 23005
+ },
+ {
+ "epoch": 62.6866485013624,
+ "grad_norm": 4.6864142417907715,
+ "learning_rate": 6.4556649555975715e-06,
+ "loss": 0.0983,
+ "step": 23006
+ },
+ {
+ "epoch": 62.689373297002724,
+ "grad_norm": 4.684879779815674,
+ "learning_rate": 6.454839765238259e-06,
+ "loss": 0.1146,
+ "step": 23007
+ },
+ {
+ "epoch": 62.69209809264305,
+ "grad_norm": 1.921517014503479,
+ "learning_rate": 6.45401460248854e-06,
+ "loss": 0.0321,
+ "step": 23008
+ },
+ {
+ "epoch": 62.694822888283376,
+ "grad_norm": 3.720921754837036,
+ "learning_rate": 6.45318946735484e-06,
+ "loss": 0.0698,
+ "step": 23009
+ },
+ {
+ "epoch": 62.69754768392371,
+ "grad_norm": 5.4707512855529785,
+ "learning_rate": 6.452364359843588e-06,
+ "loss": 0.1797,
+ "step": 23010
+ },
+ {
+ "epoch": 62.700272479564035,
+ "grad_norm": 6.212604522705078,
+ "learning_rate": 6.451539279961206e-06,
+ "loss": 0.1189,
+ "step": 23011
+ },
+ {
+ "epoch": 62.70299727520436,
+ "grad_norm": 3.161020517349243,
+ "learning_rate": 6.450714227714126e-06,
+ "loss": 0.0461,
+ "step": 23012
+ },
+ {
+ "epoch": 62.705722070844686,
+ "grad_norm": 4.240825176239014,
+ "learning_rate": 6.449889203108762e-06,
+ "loss": 0.0928,
+ "step": 23013
+ },
+ {
+ "epoch": 62.70844686648501,
+ "grad_norm": 3.6804215908050537,
+ "learning_rate": 6.449064206151551e-06,
+ "loss": 0.0814,
+ "step": 23014
+ },
+ {
+ "epoch": 62.71117166212534,
+ "grad_norm": 3.9061172008514404,
+ "learning_rate": 6.448239236848914e-06,
+ "loss": 0.0518,
+ "step": 23015
+ },
+ {
+ "epoch": 62.71389645776567,
+ "grad_norm": 3.953368663787842,
+ "learning_rate": 6.447414295207275e-06,
+ "loss": 0.0742,
+ "step": 23016
+ },
+ {
+ "epoch": 62.716621253406,
+ "grad_norm": 3.946296215057373,
+ "learning_rate": 6.446589381233062e-06,
+ "loss": 0.1001,
+ "step": 23017
+ },
+ {
+ "epoch": 62.71934604904632,
+ "grad_norm": 2.48675799369812,
+ "learning_rate": 6.445764494932691e-06,
+ "loss": 0.0501,
+ "step": 23018
+ },
+ {
+ "epoch": 62.72207084468665,
+ "grad_norm": 5.315413475036621,
+ "learning_rate": 6.444939636312597e-06,
+ "loss": 0.0797,
+ "step": 23019
+ },
+ {
+ "epoch": 62.724795640326974,
+ "grad_norm": 3.369425058364868,
+ "learning_rate": 6.4441148053791956e-06,
+ "loss": 0.1928,
+ "step": 23020
+ },
+ {
+ "epoch": 62.7275204359673,
+ "grad_norm": 5.1165900230407715,
+ "learning_rate": 6.443290002138913e-06,
+ "loss": 0.1932,
+ "step": 23021
+ },
+ {
+ "epoch": 62.73024523160763,
+ "grad_norm": 3.6062586307525635,
+ "learning_rate": 6.442465226598177e-06,
+ "loss": 0.0462,
+ "step": 23022
+ },
+ {
+ "epoch": 62.73297002724796,
+ "grad_norm": 4.3308186531066895,
+ "learning_rate": 6.4416404787634045e-06,
+ "loss": 0.0815,
+ "step": 23023
+ },
+ {
+ "epoch": 62.735694822888284,
+ "grad_norm": 4.880808353424072,
+ "learning_rate": 6.440815758641023e-06,
+ "loss": 0.0867,
+ "step": 23024
+ },
+ {
+ "epoch": 62.73841961852861,
+ "grad_norm": 4.942392349243164,
+ "learning_rate": 6.439991066237452e-06,
+ "loss": 0.0578,
+ "step": 23025
+ },
+ {
+ "epoch": 62.741144414168936,
+ "grad_norm": 7.794327735900879,
+ "learning_rate": 6.4391664015591185e-06,
+ "loss": 0.1435,
+ "step": 23026
+ },
+ {
+ "epoch": 62.74386920980926,
+ "grad_norm": 5.124037265777588,
+ "learning_rate": 6.438341764612439e-06,
+ "loss": 0.0851,
+ "step": 23027
+ },
+ {
+ "epoch": 62.746594005449595,
+ "grad_norm": 3.0087430477142334,
+ "learning_rate": 6.437517155403843e-06,
+ "loss": 0.0451,
+ "step": 23028
+ },
+ {
+ "epoch": 62.74931880108992,
+ "grad_norm": 3.278937339782715,
+ "learning_rate": 6.4366925739397456e-06,
+ "loss": 0.0645,
+ "step": 23029
+ },
+ {
+ "epoch": 62.752043596730246,
+ "grad_norm": 4.432502746582031,
+ "learning_rate": 6.4358680202265696e-06,
+ "loss": 0.0653,
+ "step": 23030
+ },
+ {
+ "epoch": 62.75476839237057,
+ "grad_norm": 3.406248092651367,
+ "learning_rate": 6.435043494270743e-06,
+ "loss": 0.0725,
+ "step": 23031
+ },
+ {
+ "epoch": 62.7574931880109,
+ "grad_norm": 3.52441143989563,
+ "learning_rate": 6.434218996078683e-06,
+ "loss": 0.1595,
+ "step": 23032
+ },
+ {
+ "epoch": 62.76021798365122,
+ "grad_norm": 4.138480186462402,
+ "learning_rate": 6.43339452565681e-06,
+ "loss": 0.0607,
+ "step": 23033
+ },
+ {
+ "epoch": 62.762942779291556,
+ "grad_norm": 2.9758920669555664,
+ "learning_rate": 6.432570083011544e-06,
+ "loss": 0.028,
+ "step": 23034
+ },
+ {
+ "epoch": 62.76566757493188,
+ "grad_norm": 1.8794962167739868,
+ "learning_rate": 6.43174566814931e-06,
+ "loss": 0.0844,
+ "step": 23035
+ },
+ {
+ "epoch": 62.76839237057221,
+ "grad_norm": 3.843134880065918,
+ "learning_rate": 6.4309212810765245e-06,
+ "loss": 0.0503,
+ "step": 23036
+ },
+ {
+ "epoch": 62.771117166212534,
+ "grad_norm": 2.8406097888946533,
+ "learning_rate": 6.43009692179961e-06,
+ "loss": 0.0443,
+ "step": 23037
+ },
+ {
+ "epoch": 62.77384196185286,
+ "grad_norm": 3.2359085083007812,
+ "learning_rate": 6.429272590324984e-06,
+ "loss": 0.048,
+ "step": 23038
+ },
+ {
+ "epoch": 62.776566757493185,
+ "grad_norm": 4.195863246917725,
+ "learning_rate": 6.428448286659071e-06,
+ "loss": 0.1102,
+ "step": 23039
+ },
+ {
+ "epoch": 62.77929155313352,
+ "grad_norm": 4.652376651763916,
+ "learning_rate": 6.427624010808284e-06,
+ "loss": 0.0817,
+ "step": 23040
+ },
+ {
+ "epoch": 62.782016348773844,
+ "grad_norm": 4.894301414489746,
+ "learning_rate": 6.42679976277905e-06,
+ "loss": 0.1194,
+ "step": 23041
+ },
+ {
+ "epoch": 62.78474114441417,
+ "grad_norm": 3.5861191749572754,
+ "learning_rate": 6.425975542577783e-06,
+ "loss": 0.0572,
+ "step": 23042
+ },
+ {
+ "epoch": 62.787465940054496,
+ "grad_norm": 3.2628448009490967,
+ "learning_rate": 6.425151350210901e-06,
+ "loss": 0.1383,
+ "step": 23043
+ },
+ {
+ "epoch": 62.79019073569482,
+ "grad_norm": 3.143688678741455,
+ "learning_rate": 6.424327185684829e-06,
+ "loss": 0.0881,
+ "step": 23044
+ },
+ {
+ "epoch": 62.79291553133515,
+ "grad_norm": 3.5223324298858643,
+ "learning_rate": 6.423503049005979e-06,
+ "loss": 0.1007,
+ "step": 23045
+ },
+ {
+ "epoch": 62.79564032697548,
+ "grad_norm": 3.900768518447876,
+ "learning_rate": 6.422678940180775e-06,
+ "loss": 0.0517,
+ "step": 23046
+ },
+ {
+ "epoch": 62.798365122615806,
+ "grad_norm": 3.8422086238861084,
+ "learning_rate": 6.42185485921563e-06,
+ "loss": 0.2194,
+ "step": 23047
+ },
+ {
+ "epoch": 62.80108991825613,
+ "grad_norm": 11.169679641723633,
+ "learning_rate": 6.421030806116961e-06,
+ "loss": 0.0797,
+ "step": 23048
+ },
+ {
+ "epoch": 62.80381471389646,
+ "grad_norm": 2.756113052368164,
+ "learning_rate": 6.420206780891194e-06,
+ "loss": 0.1232,
+ "step": 23049
+ },
+ {
+ "epoch": 62.80653950953678,
+ "grad_norm": 4.002607822418213,
+ "learning_rate": 6.419382783544739e-06,
+ "loss": 0.0707,
+ "step": 23050
+ },
+ {
+ "epoch": 62.80926430517711,
+ "grad_norm": 2.948599100112915,
+ "learning_rate": 6.4185588140840195e-06,
+ "loss": 0.05,
+ "step": 23051
+ },
+ {
+ "epoch": 62.81198910081744,
+ "grad_norm": 2.4843387603759766,
+ "learning_rate": 6.417734872515444e-06,
+ "loss": 0.1476,
+ "step": 23052
+ },
+ {
+ "epoch": 62.81471389645777,
+ "grad_norm": 4.173250675201416,
+ "learning_rate": 6.416910958845437e-06,
+ "loss": 0.0786,
+ "step": 23053
+ },
+ {
+ "epoch": 62.817438692098094,
+ "grad_norm": 3.032074213027954,
+ "learning_rate": 6.41608707308041e-06,
+ "loss": 0.0606,
+ "step": 23054
+ },
+ {
+ "epoch": 62.82016348773842,
+ "grad_norm": 3.3955652713775635,
+ "learning_rate": 6.415263215226785e-06,
+ "loss": 0.0556,
+ "step": 23055
+ },
+ {
+ "epoch": 62.822888283378745,
+ "grad_norm": 4.590451717376709,
+ "learning_rate": 6.414439385290971e-06,
+ "loss": 0.1345,
+ "step": 23056
+ },
+ {
+ "epoch": 62.82561307901907,
+ "grad_norm": 3.456740379333496,
+ "learning_rate": 6.41361558327939e-06,
+ "loss": 0.1016,
+ "step": 23057
+ },
+ {
+ "epoch": 62.828337874659404,
+ "grad_norm": 3.6677567958831787,
+ "learning_rate": 6.412791809198453e-06,
+ "loss": 0.2228,
+ "step": 23058
+ },
+ {
+ "epoch": 62.83106267029973,
+ "grad_norm": 3.0606536865234375,
+ "learning_rate": 6.411968063054581e-06,
+ "loss": 0.1989,
+ "step": 23059
+ },
+ {
+ "epoch": 62.833787465940055,
+ "grad_norm": 3.7640984058380127,
+ "learning_rate": 6.411144344854183e-06,
+ "loss": 0.0694,
+ "step": 23060
+ },
+ {
+ "epoch": 62.83651226158038,
+ "grad_norm": 4.457794666290283,
+ "learning_rate": 6.410320654603681e-06,
+ "loss": 0.1596,
+ "step": 23061
+ },
+ {
+ "epoch": 62.83923705722071,
+ "grad_norm": 3.6370296478271484,
+ "learning_rate": 6.409496992309483e-06,
+ "loss": 0.0636,
+ "step": 23062
+ },
+ {
+ "epoch": 62.84196185286103,
+ "grad_norm": 3.8966104984283447,
+ "learning_rate": 6.408673357978009e-06,
+ "loss": 0.1126,
+ "step": 23063
+ },
+ {
+ "epoch": 62.844686648501366,
+ "grad_norm": 2.9331953525543213,
+ "learning_rate": 6.407849751615669e-06,
+ "loss": 0.0573,
+ "step": 23064
+ },
+ {
+ "epoch": 62.84741144414169,
+ "grad_norm": 4.1566643714904785,
+ "learning_rate": 6.407026173228878e-06,
+ "loss": 0.2003,
+ "step": 23065
+ },
+ {
+ "epoch": 62.85013623978202,
+ "grad_norm": 3.167177438735962,
+ "learning_rate": 6.406202622824054e-06,
+ "loss": 0.1327,
+ "step": 23066
+ },
+ {
+ "epoch": 62.85286103542234,
+ "grad_norm": 3.376971960067749,
+ "learning_rate": 6.40537910040761e-06,
+ "loss": 0.0528,
+ "step": 23067
+ },
+ {
+ "epoch": 62.85558583106267,
+ "grad_norm": 4.459584712982178,
+ "learning_rate": 6.404555605985956e-06,
+ "loss": 0.13,
+ "step": 23068
+ },
+ {
+ "epoch": 62.858310626702995,
+ "grad_norm": 2.184400796890259,
+ "learning_rate": 6.403732139565508e-06,
+ "loss": 0.1063,
+ "step": 23069
+ },
+ {
+ "epoch": 62.86103542234333,
+ "grad_norm": 3.7576041221618652,
+ "learning_rate": 6.402908701152677e-06,
+ "loss": 0.0779,
+ "step": 23070
+ },
+ {
+ "epoch": 62.86376021798365,
+ "grad_norm": 2.7387702465057373,
+ "learning_rate": 6.40208529075388e-06,
+ "loss": 0.0501,
+ "step": 23071
+ },
+ {
+ "epoch": 62.86648501362398,
+ "grad_norm": 3.7353484630584717,
+ "learning_rate": 6.401261908375525e-06,
+ "loss": 0.106,
+ "step": 23072
+ },
+ {
+ "epoch": 62.869209809264305,
+ "grad_norm": 3.082329750061035,
+ "learning_rate": 6.4004385540240266e-06,
+ "loss": 0.1467,
+ "step": 23073
+ },
+ {
+ "epoch": 62.87193460490463,
+ "grad_norm": 3.7303121089935303,
+ "learning_rate": 6.399615227705797e-06,
+ "loss": 0.1449,
+ "step": 23074
+ },
+ {
+ "epoch": 62.87465940054496,
+ "grad_norm": 4.027122497558594,
+ "learning_rate": 6.398791929427248e-06,
+ "loss": 0.1382,
+ "step": 23075
+ },
+ {
+ "epoch": 62.87738419618529,
+ "grad_norm": 6.679190158843994,
+ "learning_rate": 6.397968659194792e-06,
+ "loss": 0.0637,
+ "step": 23076
+ },
+ {
+ "epoch": 62.880108991825615,
+ "grad_norm": 3.6560263633728027,
+ "learning_rate": 6.397145417014841e-06,
+ "loss": 0.2501,
+ "step": 23077
+ },
+ {
+ "epoch": 62.88283378746594,
+ "grad_norm": 3.46293044090271,
+ "learning_rate": 6.3963222028938035e-06,
+ "loss": 0.1211,
+ "step": 23078
+ },
+ {
+ "epoch": 62.88555858310627,
+ "grad_norm": 3.248948097229004,
+ "learning_rate": 6.395499016838095e-06,
+ "loss": 0.1566,
+ "step": 23079
+ },
+ {
+ "epoch": 62.88828337874659,
+ "grad_norm": 3.2963860034942627,
+ "learning_rate": 6.394675858854121e-06,
+ "loss": 0.0635,
+ "step": 23080
+ },
+ {
+ "epoch": 62.89100817438692,
+ "grad_norm": 2.887035608291626,
+ "learning_rate": 6.393852728948299e-06,
+ "loss": 0.0419,
+ "step": 23081
+ },
+ {
+ "epoch": 62.89373297002725,
+ "grad_norm": 3.3246560096740723,
+ "learning_rate": 6.393029627127031e-06,
+ "loss": 0.1175,
+ "step": 23082
+ },
+ {
+ "epoch": 62.89645776566758,
+ "grad_norm": 3.9478142261505127,
+ "learning_rate": 6.392206553396734e-06,
+ "loss": 0.1017,
+ "step": 23083
+ },
+ {
+ "epoch": 62.8991825613079,
+ "grad_norm": 3.3078768253326416,
+ "learning_rate": 6.391383507763816e-06,
+ "loss": 0.0651,
+ "step": 23084
+ },
+ {
+ "epoch": 62.90190735694823,
+ "grad_norm": 2.7478339672088623,
+ "learning_rate": 6.39056049023469e-06,
+ "loss": 0.0435,
+ "step": 23085
+ },
+ {
+ "epoch": 62.904632152588555,
+ "grad_norm": 2.965304374694824,
+ "learning_rate": 6.3897375008157606e-06,
+ "loss": 0.0603,
+ "step": 23086
+ },
+ {
+ "epoch": 62.90735694822888,
+ "grad_norm": 3.521054744720459,
+ "learning_rate": 6.388914539513441e-06,
+ "loss": 0.0816,
+ "step": 23087
+ },
+ {
+ "epoch": 62.91008174386921,
+ "grad_norm": 3.507844924926758,
+ "learning_rate": 6.388091606334137e-06,
+ "loss": 0.257,
+ "step": 23088
+ },
+ {
+ "epoch": 62.91280653950954,
+ "grad_norm": 3.3088457584381104,
+ "learning_rate": 6.387268701284261e-06,
+ "loss": 0.1144,
+ "step": 23089
+ },
+ {
+ "epoch": 62.915531335149865,
+ "grad_norm": 3.2807881832122803,
+ "learning_rate": 6.386445824370218e-06,
+ "loss": 0.0795,
+ "step": 23090
+ },
+ {
+ "epoch": 62.91825613079019,
+ "grad_norm": 2.9147677421569824,
+ "learning_rate": 6.385622975598422e-06,
+ "loss": 0.0522,
+ "step": 23091
+ },
+ {
+ "epoch": 62.920980926430516,
+ "grad_norm": 2.9333882331848145,
+ "learning_rate": 6.384800154975274e-06,
+ "loss": 0.1078,
+ "step": 23092
+ },
+ {
+ "epoch": 62.92370572207084,
+ "grad_norm": 5.346883773803711,
+ "learning_rate": 6.38397736250719e-06,
+ "loss": 0.1202,
+ "step": 23093
+ },
+ {
+ "epoch": 62.926430517711175,
+ "grad_norm": 3.9388911724090576,
+ "learning_rate": 6.38315459820057e-06,
+ "loss": 0.0678,
+ "step": 23094
+ },
+ {
+ "epoch": 62.9291553133515,
+ "grad_norm": 3.2417473793029785,
+ "learning_rate": 6.382331862061828e-06,
+ "loss": 0.2092,
+ "step": 23095
+ },
+ {
+ "epoch": 62.93188010899183,
+ "grad_norm": 4.299763202667236,
+ "learning_rate": 6.381509154097367e-06,
+ "loss": 0.2748,
+ "step": 23096
+ },
+ {
+ "epoch": 62.93460490463215,
+ "grad_norm": 3.4272220134735107,
+ "learning_rate": 6.3806864743136e-06,
+ "loss": 0.1067,
+ "step": 23097
+ },
+ {
+ "epoch": 62.93732970027248,
+ "grad_norm": 2.880706310272217,
+ "learning_rate": 6.379863822716926e-06,
+ "loss": 0.0938,
+ "step": 23098
+ },
+ {
+ "epoch": 62.940054495912804,
+ "grad_norm": 3.2244069576263428,
+ "learning_rate": 6.379041199313756e-06,
+ "loss": 0.0526,
+ "step": 23099
+ },
+ {
+ "epoch": 62.94277929155314,
+ "grad_norm": 3.6588704586029053,
+ "learning_rate": 6.378218604110499e-06,
+ "loss": 0.1616,
+ "step": 23100
+ },
+ {
+ "epoch": 62.94550408719346,
+ "grad_norm": 3.856618642807007,
+ "learning_rate": 6.377396037113557e-06,
+ "loss": 0.1594,
+ "step": 23101
+ },
+ {
+ "epoch": 62.94822888283379,
+ "grad_norm": 2.894587516784668,
+ "learning_rate": 6.376573498329341e-06,
+ "loss": 0.0425,
+ "step": 23102
+ },
+ {
+ "epoch": 62.950953678474114,
+ "grad_norm": 3.4893734455108643,
+ "learning_rate": 6.375750987764251e-06,
+ "loss": 0.0518,
+ "step": 23103
+ },
+ {
+ "epoch": 62.95367847411444,
+ "grad_norm": 3.840693950653076,
+ "learning_rate": 6.374928505424698e-06,
+ "loss": 0.0658,
+ "step": 23104
+ },
+ {
+ "epoch": 62.956403269754766,
+ "grad_norm": 4.003078937530518,
+ "learning_rate": 6.374106051317084e-06,
+ "loss": 0.1181,
+ "step": 23105
+ },
+ {
+ "epoch": 62.95912806539509,
+ "grad_norm": 3.1735715866088867,
+ "learning_rate": 6.373283625447817e-06,
+ "loss": 0.0516,
+ "step": 23106
+ },
+ {
+ "epoch": 62.961852861035425,
+ "grad_norm": 2.5085859298706055,
+ "learning_rate": 6.372461227823297e-06,
+ "loss": 0.0466,
+ "step": 23107
+ },
+ {
+ "epoch": 62.96457765667575,
+ "grad_norm": 2.9543776512145996,
+ "learning_rate": 6.371638858449933e-06,
+ "loss": 0.0694,
+ "step": 23108
+ },
+ {
+ "epoch": 62.967302452316076,
+ "grad_norm": 2.8159821033477783,
+ "learning_rate": 6.370816517334132e-06,
+ "loss": 0.0855,
+ "step": 23109
+ },
+ {
+ "epoch": 62.9700272479564,
+ "grad_norm": 2.9434163570404053,
+ "learning_rate": 6.369994204482293e-06,
+ "loss": 0.0479,
+ "step": 23110
+ },
+ {
+ "epoch": 62.97275204359673,
+ "grad_norm": 3.5817837715148926,
+ "learning_rate": 6.369171919900823e-06,
+ "loss": 0.0796,
+ "step": 23111
+ },
+ {
+ "epoch": 62.97547683923706,
+ "grad_norm": 4.305360317230225,
+ "learning_rate": 6.368349663596123e-06,
+ "loss": 0.0885,
+ "step": 23112
+ },
+ {
+ "epoch": 62.97820163487739,
+ "grad_norm": 2.948730707168579,
+ "learning_rate": 6.367527435574602e-06,
+ "loss": 0.1264,
+ "step": 23113
+ },
+ {
+ "epoch": 62.98092643051771,
+ "grad_norm": 3.276205539703369,
+ "learning_rate": 6.366705235842658e-06,
+ "loss": 0.0605,
+ "step": 23114
+ },
+ {
+ "epoch": 62.98365122615804,
+ "grad_norm": 3.5483663082122803,
+ "learning_rate": 6.365883064406699e-06,
+ "loss": 0.0799,
+ "step": 23115
+ },
+ {
+ "epoch": 62.986376021798364,
+ "grad_norm": 3.094501495361328,
+ "learning_rate": 6.365060921273121e-06,
+ "loss": 0.0563,
+ "step": 23116
+ },
+ {
+ "epoch": 62.98910081743869,
+ "grad_norm": 3.6306135654449463,
+ "learning_rate": 6.364238806448335e-06,
+ "loss": 0.0665,
+ "step": 23117
+ },
+ {
+ "epoch": 62.991825613079016,
+ "grad_norm": 4.325113296508789,
+ "learning_rate": 6.3634167199387405e-06,
+ "loss": 0.1833,
+ "step": 23118
+ },
+ {
+ "epoch": 62.99455040871935,
+ "grad_norm": 4.262590408325195,
+ "learning_rate": 6.362594661750739e-06,
+ "loss": 0.2229,
+ "step": 23119
+ },
+ {
+ "epoch": 62.997275204359674,
+ "grad_norm": 4.426522731781006,
+ "learning_rate": 6.361772631890735e-06,
+ "loss": 0.0679,
+ "step": 23120
+ },
+ {
+ "epoch": 63.0,
+ "grad_norm": 3.957909345626831,
+ "learning_rate": 6.360950630365126e-06,
+ "loss": 0.0765,
+ "step": 23121
+ },
+ {
+ "epoch": 63.002724795640326,
+ "grad_norm": 2.1313045024871826,
+ "learning_rate": 6.360128657180318e-06,
+ "loss": 0.1728,
+ "step": 23122
+ },
+ {
+ "epoch": 63.00544959128065,
+ "grad_norm": 4.392509937286377,
+ "learning_rate": 6.3593067123427096e-06,
+ "loss": 0.128,
+ "step": 23123
+ },
+ {
+ "epoch": 63.00817438692098,
+ "grad_norm": 2.8958847522735596,
+ "learning_rate": 6.358484795858704e-06,
+ "loss": 0.0489,
+ "step": 23124
+ },
+ {
+ "epoch": 63.01089918256131,
+ "grad_norm": 3.2617640495300293,
+ "learning_rate": 6.357662907734701e-06,
+ "loss": 0.079,
+ "step": 23125
+ },
+ {
+ "epoch": 63.013623978201636,
+ "grad_norm": 3.2560315132141113,
+ "learning_rate": 6.356841047977104e-06,
+ "loss": 0.1265,
+ "step": 23126
+ },
+ {
+ "epoch": 63.01634877384196,
+ "grad_norm": 3.201209783554077,
+ "learning_rate": 6.35601921659231e-06,
+ "loss": 0.0574,
+ "step": 23127
+ },
+ {
+ "epoch": 63.01907356948229,
+ "grad_norm": 3.6940200328826904,
+ "learning_rate": 6.355197413586722e-06,
+ "loss": 0.0563,
+ "step": 23128
+ },
+ {
+ "epoch": 63.02179836512261,
+ "grad_norm": 3.270508050918579,
+ "learning_rate": 6.354375638966739e-06,
+ "loss": 0.0326,
+ "step": 23129
+ },
+ {
+ "epoch": 63.02452316076294,
+ "grad_norm": 4.936068534851074,
+ "learning_rate": 6.35355389273876e-06,
+ "loss": 0.0716,
+ "step": 23130
+ },
+ {
+ "epoch": 63.02724795640327,
+ "grad_norm": 4.696451187133789,
+ "learning_rate": 6.352732174909187e-06,
+ "loss": 0.11,
+ "step": 23131
+ },
+ {
+ "epoch": 63.0299727520436,
+ "grad_norm": 4.848161697387695,
+ "learning_rate": 6.351910485484417e-06,
+ "loss": 0.1006,
+ "step": 23132
+ },
+ {
+ "epoch": 63.032697547683924,
+ "grad_norm": 4.534578800201416,
+ "learning_rate": 6.351088824470853e-06,
+ "loss": 0.0653,
+ "step": 23133
+ },
+ {
+ "epoch": 63.03542234332425,
+ "grad_norm": 3.329862117767334,
+ "learning_rate": 6.3502671918748886e-06,
+ "loss": 0.2054,
+ "step": 23134
+ },
+ {
+ "epoch": 63.038147138964575,
+ "grad_norm": 2.6438238620758057,
+ "learning_rate": 6.349445587702927e-06,
+ "loss": 0.0395,
+ "step": 23135
+ },
+ {
+ "epoch": 63.0408719346049,
+ "grad_norm": 3.2166786193847656,
+ "learning_rate": 6.348624011961368e-06,
+ "loss": 0.0499,
+ "step": 23136
+ },
+ {
+ "epoch": 63.043596730245234,
+ "grad_norm": 3.3035888671875,
+ "learning_rate": 6.347802464656605e-06,
+ "loss": 0.2443,
+ "step": 23137
+ },
+ {
+ "epoch": 63.04632152588556,
+ "grad_norm": 2.5024590492248535,
+ "learning_rate": 6.3469809457950406e-06,
+ "loss": 0.0414,
+ "step": 23138
+ },
+ {
+ "epoch": 63.049046321525886,
+ "grad_norm": 4.230470657348633,
+ "learning_rate": 6.346159455383069e-06,
+ "loss": 0.0729,
+ "step": 23139
+ },
+ {
+ "epoch": 63.05177111716621,
+ "grad_norm": 3.702749013900757,
+ "learning_rate": 6.3453379934270945e-06,
+ "loss": 0.0662,
+ "step": 23140
+ },
+ {
+ "epoch": 63.05449591280654,
+ "grad_norm": 3.2805144786834717,
+ "learning_rate": 6.3445165599335044e-06,
+ "loss": 0.067,
+ "step": 23141
+ },
+ {
+ "epoch": 63.05722070844686,
+ "grad_norm": 3.6586036682128906,
+ "learning_rate": 6.343695154908707e-06,
+ "loss": 0.0644,
+ "step": 23142
+ },
+ {
+ "epoch": 63.059945504087196,
+ "grad_norm": 3.8456904888153076,
+ "learning_rate": 6.34287377835909e-06,
+ "loss": 0.0516,
+ "step": 23143
+ },
+ {
+ "epoch": 63.06267029972752,
+ "grad_norm": 3.517930746078491,
+ "learning_rate": 6.342052430291057e-06,
+ "loss": 0.0473,
+ "step": 23144
+ },
+ {
+ "epoch": 63.06539509536785,
+ "grad_norm": 2.3302736282348633,
+ "learning_rate": 6.341231110710999e-06,
+ "loss": 0.0396,
+ "step": 23145
+ },
+ {
+ "epoch": 63.06811989100817,
+ "grad_norm": 2.6586661338806152,
+ "learning_rate": 6.340409819625319e-06,
+ "loss": 0.0737,
+ "step": 23146
+ },
+ {
+ "epoch": 63.0708446866485,
+ "grad_norm": 3.8887076377868652,
+ "learning_rate": 6.339588557040406e-06,
+ "loss": 0.0706,
+ "step": 23147
+ },
+ {
+ "epoch": 63.073569482288825,
+ "grad_norm": 3.4590799808502197,
+ "learning_rate": 6.338767322962662e-06,
+ "loss": 0.084,
+ "step": 23148
+ },
+ {
+ "epoch": 63.07629427792916,
+ "grad_norm": 3.049461841583252,
+ "learning_rate": 6.337946117398479e-06,
+ "loss": 0.1283,
+ "step": 23149
+ },
+ {
+ "epoch": 63.079019073569484,
+ "grad_norm": 4.627965927124023,
+ "learning_rate": 6.3371249403542556e-06,
+ "loss": 0.0628,
+ "step": 23150
+ },
+ {
+ "epoch": 63.08174386920981,
+ "grad_norm": 6.178308486938477,
+ "learning_rate": 6.336303791836379e-06,
+ "loss": 0.0555,
+ "step": 23151
+ },
+ {
+ "epoch": 63.084468664850135,
+ "grad_norm": 3.0092344284057617,
+ "learning_rate": 6.335482671851256e-06,
+ "loss": 0.0935,
+ "step": 23152
+ },
+ {
+ "epoch": 63.08719346049046,
+ "grad_norm": 4.038009166717529,
+ "learning_rate": 6.334661580405274e-06,
+ "loss": 0.1331,
+ "step": 23153
+ },
+ {
+ "epoch": 63.08991825613079,
+ "grad_norm": 4.0561089515686035,
+ "learning_rate": 6.333840517504832e-06,
+ "loss": 0.0791,
+ "step": 23154
+ },
+ {
+ "epoch": 63.09264305177112,
+ "grad_norm": 3.6039934158325195,
+ "learning_rate": 6.333019483156322e-06,
+ "loss": 0.0545,
+ "step": 23155
+ },
+ {
+ "epoch": 63.095367847411445,
+ "grad_norm": 5.1222758293151855,
+ "learning_rate": 6.332198477366138e-06,
+ "loss": 0.1295,
+ "step": 23156
+ },
+ {
+ "epoch": 63.09809264305177,
+ "grad_norm": 3.006937026977539,
+ "learning_rate": 6.331377500140672e-06,
+ "loss": 0.1013,
+ "step": 23157
+ },
+ {
+ "epoch": 63.1008174386921,
+ "grad_norm": 2.899261474609375,
+ "learning_rate": 6.330556551486324e-06,
+ "loss": 0.0502,
+ "step": 23158
+ },
+ {
+ "epoch": 63.10354223433242,
+ "grad_norm": 2.8537375926971436,
+ "learning_rate": 6.329735631409479e-06,
+ "loss": 0.093,
+ "step": 23159
+ },
+ {
+ "epoch": 63.10626702997275,
+ "grad_norm": 5.385002613067627,
+ "learning_rate": 6.328914739916539e-06,
+ "loss": 0.1324,
+ "step": 23160
+ },
+ {
+ "epoch": 63.10899182561308,
+ "grad_norm": 3.247054100036621,
+ "learning_rate": 6.328093877013888e-06,
+ "loss": 0.0566,
+ "step": 23161
+ },
+ {
+ "epoch": 63.11171662125341,
+ "grad_norm": 4.962833404541016,
+ "learning_rate": 6.327273042707929e-06,
+ "loss": 0.0938,
+ "step": 23162
+ },
+ {
+ "epoch": 63.11444141689373,
+ "grad_norm": 3.9605371952056885,
+ "learning_rate": 6.3264522370050455e-06,
+ "loss": 0.1092,
+ "step": 23163
+ },
+ {
+ "epoch": 63.11716621253406,
+ "grad_norm": 5.63825798034668,
+ "learning_rate": 6.325631459911635e-06,
+ "loss": 0.1948,
+ "step": 23164
+ },
+ {
+ "epoch": 63.119891008174385,
+ "grad_norm": 8.609911918640137,
+ "learning_rate": 6.324810711434089e-06,
+ "loss": 0.0495,
+ "step": 23165
+ },
+ {
+ "epoch": 63.12261580381471,
+ "grad_norm": 2.54370379447937,
+ "learning_rate": 6.3239899915787985e-06,
+ "loss": 0.1144,
+ "step": 23166
+ },
+ {
+ "epoch": 63.12534059945504,
+ "grad_norm": 3.7156083583831787,
+ "learning_rate": 6.323169300352155e-06,
+ "loss": 0.0787,
+ "step": 23167
+ },
+ {
+ "epoch": 63.12806539509537,
+ "grad_norm": 2.9712140560150146,
+ "learning_rate": 6.322348637760547e-06,
+ "loss": 0.083,
+ "step": 23168
+ },
+ {
+ "epoch": 63.130790190735695,
+ "grad_norm": 3.4311819076538086,
+ "learning_rate": 6.321528003810375e-06,
+ "loss": 0.0789,
+ "step": 23169
+ },
+ {
+ "epoch": 63.13351498637602,
+ "grad_norm": 4.052380084991455,
+ "learning_rate": 6.320707398508021e-06,
+ "loss": 0.2009,
+ "step": 23170
+ },
+ {
+ "epoch": 63.13623978201635,
+ "grad_norm": 3.0860378742218018,
+ "learning_rate": 6.3198868218598805e-06,
+ "loss": 0.0515,
+ "step": 23171
+ },
+ {
+ "epoch": 63.13896457765667,
+ "grad_norm": 3.465501070022583,
+ "learning_rate": 6.319066273872345e-06,
+ "loss": 0.0596,
+ "step": 23172
+ },
+ {
+ "epoch": 63.141689373297005,
+ "grad_norm": 2.6912052631378174,
+ "learning_rate": 6.318245754551802e-06,
+ "loss": 0.1229,
+ "step": 23173
+ },
+ {
+ "epoch": 63.14441416893733,
+ "grad_norm": 4.115647792816162,
+ "learning_rate": 6.317425263904643e-06,
+ "loss": 0.288,
+ "step": 23174
+ },
+ {
+ "epoch": 63.14713896457766,
+ "grad_norm": 3.4655401706695557,
+ "learning_rate": 6.316604801937256e-06,
+ "loss": 0.1119,
+ "step": 23175
+ },
+ {
+ "epoch": 63.14986376021798,
+ "grad_norm": 3.3207101821899414,
+ "learning_rate": 6.315784368656034e-06,
+ "loss": 0.1297,
+ "step": 23176
+ },
+ {
+ "epoch": 63.15258855585831,
+ "grad_norm": 3.8398549556732178,
+ "learning_rate": 6.314963964067362e-06,
+ "loss": 0.1018,
+ "step": 23177
+ },
+ {
+ "epoch": 63.155313351498634,
+ "grad_norm": 2.4407057762145996,
+ "learning_rate": 6.314143588177636e-06,
+ "loss": 0.0443,
+ "step": 23178
+ },
+ {
+ "epoch": 63.15803814713897,
+ "grad_norm": 3.8973379135131836,
+ "learning_rate": 6.313323240993237e-06,
+ "loss": 0.1692,
+ "step": 23179
+ },
+ {
+ "epoch": 63.16076294277929,
+ "grad_norm": 3.2764265537261963,
+ "learning_rate": 6.312502922520562e-06,
+ "loss": 0.0479,
+ "step": 23180
+ },
+ {
+ "epoch": 63.16348773841962,
+ "grad_norm": 3.1338770389556885,
+ "learning_rate": 6.311682632765992e-06,
+ "loss": 0.0828,
+ "step": 23181
+ },
+ {
+ "epoch": 63.166212534059945,
+ "grad_norm": 3.19219708442688,
+ "learning_rate": 6.310862371735922e-06,
+ "loss": 0.1193,
+ "step": 23182
+ },
+ {
+ "epoch": 63.16893732970027,
+ "grad_norm": 2.779780626296997,
+ "learning_rate": 6.310042139436734e-06,
+ "loss": 0.0954,
+ "step": 23183
+ },
+ {
+ "epoch": 63.171662125340596,
+ "grad_norm": 2.7828152179718018,
+ "learning_rate": 6.309221935874822e-06,
+ "loss": 0.159,
+ "step": 23184
+ },
+ {
+ "epoch": 63.17438692098093,
+ "grad_norm": 4.583054542541504,
+ "learning_rate": 6.308401761056566e-06,
+ "loss": 0.1784,
+ "step": 23185
+ },
+ {
+ "epoch": 63.177111716621255,
+ "grad_norm": 4.487547874450684,
+ "learning_rate": 6.30758161498836e-06,
+ "loss": 0.056,
+ "step": 23186
+ },
+ {
+ "epoch": 63.17983651226158,
+ "grad_norm": 2.659743309020996,
+ "learning_rate": 6.306761497676594e-06,
+ "loss": 0.0419,
+ "step": 23187
+ },
+ {
+ "epoch": 63.182561307901906,
+ "grad_norm": 3.0457241535186768,
+ "learning_rate": 6.305941409127646e-06,
+ "loss": 0.155,
+ "step": 23188
+ },
+ {
+ "epoch": 63.18528610354223,
+ "grad_norm": 3.6640207767486572,
+ "learning_rate": 6.305121349347911e-06,
+ "loss": 0.1206,
+ "step": 23189
+ },
+ {
+ "epoch": 63.18801089918256,
+ "grad_norm": 4.56561803817749,
+ "learning_rate": 6.304301318343768e-06,
+ "loss": 0.0968,
+ "step": 23190
+ },
+ {
+ "epoch": 63.19073569482289,
+ "grad_norm": 2.028547763824463,
+ "learning_rate": 6.303481316121611e-06,
+ "loss": 0.0346,
+ "step": 23191
+ },
+ {
+ "epoch": 63.19346049046322,
+ "grad_norm": 2.4169869422912598,
+ "learning_rate": 6.302661342687822e-06,
+ "loss": 0.1654,
+ "step": 23192
+ },
+ {
+ "epoch": 63.19618528610354,
+ "grad_norm": 2.399566888809204,
+ "learning_rate": 6.3018413980487865e-06,
+ "loss": 0.0388,
+ "step": 23193
+ },
+ {
+ "epoch": 63.19891008174387,
+ "grad_norm": 3.032816171646118,
+ "learning_rate": 6.301021482210889e-06,
+ "loss": 0.1188,
+ "step": 23194
+ },
+ {
+ "epoch": 63.201634877384194,
+ "grad_norm": 2.597745895385742,
+ "learning_rate": 6.30020159518052e-06,
+ "loss": 0.0819,
+ "step": 23195
+ },
+ {
+ "epoch": 63.20435967302452,
+ "grad_norm": 4.5145440101623535,
+ "learning_rate": 6.2993817369640616e-06,
+ "loss": 0.0866,
+ "step": 23196
+ },
+ {
+ "epoch": 63.20708446866485,
+ "grad_norm": 2.7119181156158447,
+ "learning_rate": 6.2985619075678985e-06,
+ "loss": 0.113,
+ "step": 23197
+ },
+ {
+ "epoch": 63.20980926430518,
+ "grad_norm": 3.1414027214050293,
+ "learning_rate": 6.297742106998417e-06,
+ "loss": 0.0728,
+ "step": 23198
+ },
+ {
+ "epoch": 63.212534059945504,
+ "grad_norm": 3.252021312713623,
+ "learning_rate": 6.296922335262e-06,
+ "loss": 0.0826,
+ "step": 23199
+ },
+ {
+ "epoch": 63.21525885558583,
+ "grad_norm": 4.101782321929932,
+ "learning_rate": 6.296102592365035e-06,
+ "loss": 0.0869,
+ "step": 23200
+ },
+ {
+ "epoch": 63.217983651226156,
+ "grad_norm": 3.352304697036743,
+ "learning_rate": 6.2952828783139e-06,
+ "loss": 0.0724,
+ "step": 23201
+ },
+ {
+ "epoch": 63.22070844686648,
+ "grad_norm": 3.0583438873291016,
+ "learning_rate": 6.294463193114982e-06,
+ "loss": 0.1035,
+ "step": 23202
+ },
+ {
+ "epoch": 63.223433242506815,
+ "grad_norm": 2.796839714050293,
+ "learning_rate": 6.293643536774668e-06,
+ "loss": 0.0969,
+ "step": 23203
+ },
+ {
+ "epoch": 63.22615803814714,
+ "grad_norm": 4.15037727355957,
+ "learning_rate": 6.292823909299338e-06,
+ "loss": 0.1032,
+ "step": 23204
+ },
+ {
+ "epoch": 63.228882833787466,
+ "grad_norm": 2.8994171619415283,
+ "learning_rate": 6.2920043106953774e-06,
+ "loss": 0.0624,
+ "step": 23205
+ },
+ {
+ "epoch": 63.23160762942779,
+ "grad_norm": 2.9009017944335938,
+ "learning_rate": 6.291184740969168e-06,
+ "loss": 0.044,
+ "step": 23206
+ },
+ {
+ "epoch": 63.23433242506812,
+ "grad_norm": 3.7608728408813477,
+ "learning_rate": 6.290365200127091e-06,
+ "loss": 0.0563,
+ "step": 23207
+ },
+ {
+ "epoch": 63.237057220708444,
+ "grad_norm": 3.7963707447052,
+ "learning_rate": 6.289545688175531e-06,
+ "loss": 0.1759,
+ "step": 23208
+ },
+ {
+ "epoch": 63.23978201634878,
+ "grad_norm": 7.580491065979004,
+ "learning_rate": 6.2887262051208704e-06,
+ "loss": 0.1625,
+ "step": 23209
+ },
+ {
+ "epoch": 63.2425068119891,
+ "grad_norm": 3.113636016845703,
+ "learning_rate": 6.28790675096949e-06,
+ "loss": 0.0569,
+ "step": 23210
+ },
+ {
+ "epoch": 63.24523160762943,
+ "grad_norm": 4.224898338317871,
+ "learning_rate": 6.287087325727774e-06,
+ "loss": 0.0839,
+ "step": 23211
+ },
+ {
+ "epoch": 63.247956403269754,
+ "grad_norm": 3.5268211364746094,
+ "learning_rate": 6.286267929402099e-06,
+ "loss": 0.0683,
+ "step": 23212
+ },
+ {
+ "epoch": 63.25068119891008,
+ "grad_norm": 3.5836639404296875,
+ "learning_rate": 6.285448561998853e-06,
+ "loss": 0.0988,
+ "step": 23213
+ },
+ {
+ "epoch": 63.253405994550405,
+ "grad_norm": 2.8314950466156006,
+ "learning_rate": 6.284629223524412e-06,
+ "loss": 0.0655,
+ "step": 23214
+ },
+ {
+ "epoch": 63.25613079019074,
+ "grad_norm": 2.798389196395874,
+ "learning_rate": 6.283809913985162e-06,
+ "loss": 0.143,
+ "step": 23215
+ },
+ {
+ "epoch": 63.258855585831064,
+ "grad_norm": 3.1230967044830322,
+ "learning_rate": 6.282990633387477e-06,
+ "loss": 0.0964,
+ "step": 23216
+ },
+ {
+ "epoch": 63.26158038147139,
+ "grad_norm": 3.065552234649658,
+ "learning_rate": 6.282171381737742e-06,
+ "loss": 0.106,
+ "step": 23217
+ },
+ {
+ "epoch": 63.264305177111716,
+ "grad_norm": 4.310557842254639,
+ "learning_rate": 6.281352159042338e-06,
+ "loss": 0.0504,
+ "step": 23218
+ },
+ {
+ "epoch": 63.26702997275204,
+ "grad_norm": 3.7876176834106445,
+ "learning_rate": 6.280532965307643e-06,
+ "loss": 0.1395,
+ "step": 23219
+ },
+ {
+ "epoch": 63.26975476839237,
+ "grad_norm": 3.4245898723602295,
+ "learning_rate": 6.279713800540035e-06,
+ "loss": 0.1101,
+ "step": 23220
+ },
+ {
+ "epoch": 63.2724795640327,
+ "grad_norm": 4.20367431640625,
+ "learning_rate": 6.2788946647459e-06,
+ "loss": 0.0961,
+ "step": 23221
+ },
+ {
+ "epoch": 63.275204359673026,
+ "grad_norm": 3.2108347415924072,
+ "learning_rate": 6.278075557931611e-06,
+ "loss": 0.0642,
+ "step": 23222
+ },
+ {
+ "epoch": 63.27792915531335,
+ "grad_norm": 6.693216800689697,
+ "learning_rate": 6.277256480103553e-06,
+ "loss": 0.1121,
+ "step": 23223
+ },
+ {
+ "epoch": 63.28065395095368,
+ "grad_norm": 3.909276247024536,
+ "learning_rate": 6.276437431268098e-06,
+ "loss": 0.0429,
+ "step": 23224
+ },
+ {
+ "epoch": 63.283378746594,
+ "grad_norm": 3.625056028366089,
+ "learning_rate": 6.275618411431633e-06,
+ "loss": 0.1419,
+ "step": 23225
+ },
+ {
+ "epoch": 63.28610354223433,
+ "grad_norm": 3.083132266998291,
+ "learning_rate": 6.274799420600528e-06,
+ "loss": 0.0598,
+ "step": 23226
+ },
+ {
+ "epoch": 63.28882833787466,
+ "grad_norm": 3.109088897705078,
+ "learning_rate": 6.273980458781168e-06,
+ "loss": 0.0653,
+ "step": 23227
+ },
+ {
+ "epoch": 63.29155313351499,
+ "grad_norm": 6.317144870758057,
+ "learning_rate": 6.273161525979926e-06,
+ "loss": 0.0505,
+ "step": 23228
+ },
+ {
+ "epoch": 63.294277929155314,
+ "grad_norm": 4.329389572143555,
+ "learning_rate": 6.2723426222031845e-06,
+ "loss": 0.0939,
+ "step": 23229
+ },
+ {
+ "epoch": 63.29700272479564,
+ "grad_norm": 2.5851826667785645,
+ "learning_rate": 6.271523747457316e-06,
+ "loss": 0.0514,
+ "step": 23230
+ },
+ {
+ "epoch": 63.299727520435965,
+ "grad_norm": 2.7832398414611816,
+ "learning_rate": 6.270704901748703e-06,
+ "loss": 0.196,
+ "step": 23231
+ },
+ {
+ "epoch": 63.30245231607629,
+ "grad_norm": 3.224717378616333,
+ "learning_rate": 6.269886085083718e-06,
+ "loss": 0.0691,
+ "step": 23232
+ },
+ {
+ "epoch": 63.305177111716624,
+ "grad_norm": 2.864311933517456,
+ "learning_rate": 6.269067297468743e-06,
+ "loss": 0.056,
+ "step": 23233
+ },
+ {
+ "epoch": 63.30790190735695,
+ "grad_norm": 3.1728298664093018,
+ "learning_rate": 6.268248538910149e-06,
+ "loss": 0.1322,
+ "step": 23234
+ },
+ {
+ "epoch": 63.310626702997276,
+ "grad_norm": 3.160740852355957,
+ "learning_rate": 6.267429809414316e-06,
+ "loss": 0.0515,
+ "step": 23235
+ },
+ {
+ "epoch": 63.3133514986376,
+ "grad_norm": 2.3517680168151855,
+ "learning_rate": 6.266611108987619e-06,
+ "loss": 0.0548,
+ "step": 23236
+ },
+ {
+ "epoch": 63.31607629427793,
+ "grad_norm": 2.645186185836792,
+ "learning_rate": 6.265792437636433e-06,
+ "loss": 0.1263,
+ "step": 23237
+ },
+ {
+ "epoch": 63.31880108991825,
+ "grad_norm": 4.053886413574219,
+ "learning_rate": 6.264973795367136e-06,
+ "loss": 0.2391,
+ "step": 23238
+ },
+ {
+ "epoch": 63.321525885558586,
+ "grad_norm": 3.03579044342041,
+ "learning_rate": 6.264155182186105e-06,
+ "loss": 0.0501,
+ "step": 23239
+ },
+ {
+ "epoch": 63.32425068119891,
+ "grad_norm": 3.4309818744659424,
+ "learning_rate": 6.263336598099712e-06,
+ "loss": 0.0423,
+ "step": 23240
+ },
+ {
+ "epoch": 63.32697547683924,
+ "grad_norm": 4.73743200302124,
+ "learning_rate": 6.262518043114336e-06,
+ "loss": 0.1231,
+ "step": 23241
+ },
+ {
+ "epoch": 63.32970027247956,
+ "grad_norm": 4.359729290008545,
+ "learning_rate": 6.261699517236346e-06,
+ "loss": 0.0983,
+ "step": 23242
+ },
+ {
+ "epoch": 63.33242506811989,
+ "grad_norm": 4.368567943572998,
+ "learning_rate": 6.260881020472122e-06,
+ "loss": 0.1999,
+ "step": 23243
+ },
+ {
+ "epoch": 63.335149863760215,
+ "grad_norm": 4.852414608001709,
+ "learning_rate": 6.260062552828035e-06,
+ "loss": 0.0729,
+ "step": 23244
+ },
+ {
+ "epoch": 63.33787465940055,
+ "grad_norm": 3.412858724594116,
+ "learning_rate": 6.259244114310461e-06,
+ "loss": 0.0379,
+ "step": 23245
+ },
+ {
+ "epoch": 63.34059945504087,
+ "grad_norm": 2.490328550338745,
+ "learning_rate": 6.2584257049257724e-06,
+ "loss": 0.0409,
+ "step": 23246
+ },
+ {
+ "epoch": 63.3433242506812,
+ "grad_norm": 2.6413326263427734,
+ "learning_rate": 6.257607324680346e-06,
+ "loss": 0.0684,
+ "step": 23247
+ },
+ {
+ "epoch": 63.346049046321525,
+ "grad_norm": 3.239886999130249,
+ "learning_rate": 6.25678897358055e-06,
+ "loss": 0.0564,
+ "step": 23248
+ },
+ {
+ "epoch": 63.34877384196185,
+ "grad_norm": 8.035508155822754,
+ "learning_rate": 6.255970651632764e-06,
+ "loss": 0.1955,
+ "step": 23249
+ },
+ {
+ "epoch": 63.35149863760218,
+ "grad_norm": 3.526515245437622,
+ "learning_rate": 6.255152358843357e-06,
+ "loss": 0.0843,
+ "step": 23250
+ },
+ {
+ "epoch": 63.35422343324251,
+ "grad_norm": 3.029080629348755,
+ "learning_rate": 6.254334095218704e-06,
+ "loss": 0.2116,
+ "step": 23251
+ },
+ {
+ "epoch": 63.356948228882835,
+ "grad_norm": 3.12518572807312,
+ "learning_rate": 6.253515860765175e-06,
+ "loss": 0.1754,
+ "step": 23252
+ },
+ {
+ "epoch": 63.35967302452316,
+ "grad_norm": 4.568018913269043,
+ "learning_rate": 6.252697655489145e-06,
+ "loss": 0.1433,
+ "step": 23253
+ },
+ {
+ "epoch": 63.36239782016349,
+ "grad_norm": 5.089962959289551,
+ "learning_rate": 6.2518794793969815e-06,
+ "loss": 0.0689,
+ "step": 23254
+ },
+ {
+ "epoch": 63.36512261580381,
+ "grad_norm": 3.837120771408081,
+ "learning_rate": 6.251061332495062e-06,
+ "loss": 0.1469,
+ "step": 23255
+ },
+ {
+ "epoch": 63.36784741144414,
+ "grad_norm": 3.126713752746582,
+ "learning_rate": 6.2502432147897584e-06,
+ "loss": 0.0976,
+ "step": 23256
+ },
+ {
+ "epoch": 63.37057220708447,
+ "grad_norm": 2.7455477714538574,
+ "learning_rate": 6.249425126287439e-06,
+ "loss": 0.0451,
+ "step": 23257
+ },
+ {
+ "epoch": 63.3732970027248,
+ "grad_norm": 3.298961877822876,
+ "learning_rate": 6.248607066994473e-06,
+ "loss": 0.1045,
+ "step": 23258
+ },
+ {
+ "epoch": 63.37602179836512,
+ "grad_norm": 3.4833261966705322,
+ "learning_rate": 6.247789036917238e-06,
+ "loss": 0.0773,
+ "step": 23259
+ },
+ {
+ "epoch": 63.37874659400545,
+ "grad_norm": 3.407968044281006,
+ "learning_rate": 6.246971036062099e-06,
+ "loss": 0.0694,
+ "step": 23260
+ },
+ {
+ "epoch": 63.381471389645775,
+ "grad_norm": 3.166114568710327,
+ "learning_rate": 6.246153064435432e-06,
+ "loss": 0.0649,
+ "step": 23261
+ },
+ {
+ "epoch": 63.3841961852861,
+ "grad_norm": 3.347496271133423,
+ "learning_rate": 6.245335122043601e-06,
+ "loss": 0.0461,
+ "step": 23262
+ },
+ {
+ "epoch": 63.38692098092643,
+ "grad_norm": 2.5239617824554443,
+ "learning_rate": 6.244517208892982e-06,
+ "loss": 0.0366,
+ "step": 23263
+ },
+ {
+ "epoch": 63.38964577656676,
+ "grad_norm": 5.172435760498047,
+ "learning_rate": 6.243699324989941e-06,
+ "loss": 0.1966,
+ "step": 23264
+ },
+ {
+ "epoch": 63.392370572207085,
+ "grad_norm": 3.0878472328186035,
+ "learning_rate": 6.242881470340848e-06,
+ "loss": 0.1901,
+ "step": 23265
+ },
+ {
+ "epoch": 63.39509536784741,
+ "grad_norm": 3.729919910430908,
+ "learning_rate": 6.242063644952072e-06,
+ "loss": 0.214,
+ "step": 23266
+ },
+ {
+ "epoch": 63.39782016348774,
+ "grad_norm": 3.1580615043640137,
+ "learning_rate": 6.241245848829986e-06,
+ "loss": 0.1801,
+ "step": 23267
+ },
+ {
+ "epoch": 63.40054495912806,
+ "grad_norm": 4.145963191986084,
+ "learning_rate": 6.240428081980955e-06,
+ "loss": 0.0921,
+ "step": 23268
+ },
+ {
+ "epoch": 63.403269754768395,
+ "grad_norm": 4.048202037811279,
+ "learning_rate": 6.239610344411351e-06,
+ "loss": 0.1434,
+ "step": 23269
+ },
+ {
+ "epoch": 63.40599455040872,
+ "grad_norm": 3.7490174770355225,
+ "learning_rate": 6.238792636127537e-06,
+ "loss": 0.0401,
+ "step": 23270
+ },
+ {
+ "epoch": 63.40871934604905,
+ "grad_norm": 3.656370162963867,
+ "learning_rate": 6.2379749571358835e-06,
+ "loss": 0.1079,
+ "step": 23271
+ },
+ {
+ "epoch": 63.41144414168937,
+ "grad_norm": 2.9822680950164795,
+ "learning_rate": 6.237157307442765e-06,
+ "loss": 0.0524,
+ "step": 23272
+ },
+ {
+ "epoch": 63.4141689373297,
+ "grad_norm": 3.4221558570861816,
+ "learning_rate": 6.2363396870545425e-06,
+ "loss": 0.0777,
+ "step": 23273
+ },
+ {
+ "epoch": 63.416893732970024,
+ "grad_norm": 3.2517075538635254,
+ "learning_rate": 6.235522095977586e-06,
+ "loss": 0.043,
+ "step": 23274
+ },
+ {
+ "epoch": 63.41961852861036,
+ "grad_norm": 4.3678388595581055,
+ "learning_rate": 6.234704534218261e-06,
+ "loss": 0.0559,
+ "step": 23275
+ },
+ {
+ "epoch": 63.42234332425068,
+ "grad_norm": 2.94924259185791,
+ "learning_rate": 6.233887001782937e-06,
+ "loss": 0.0751,
+ "step": 23276
+ },
+ {
+ "epoch": 63.42506811989101,
+ "grad_norm": 3.8434195518493652,
+ "learning_rate": 6.233069498677979e-06,
+ "loss": 0.1142,
+ "step": 23277
+ },
+ {
+ "epoch": 63.427792915531334,
+ "grad_norm": 4.644426345825195,
+ "learning_rate": 6.232252024909755e-06,
+ "loss": 0.1899,
+ "step": 23278
+ },
+ {
+ "epoch": 63.43051771117166,
+ "grad_norm": 3.1543736457824707,
+ "learning_rate": 6.231434580484631e-06,
+ "loss": 0.117,
+ "step": 23279
+ },
+ {
+ "epoch": 63.433242506811986,
+ "grad_norm": 11.50169563293457,
+ "learning_rate": 6.230617165408974e-06,
+ "loss": 0.0844,
+ "step": 23280
+ },
+ {
+ "epoch": 63.43596730245232,
+ "grad_norm": 2.459075450897217,
+ "learning_rate": 6.229799779689147e-06,
+ "loss": 0.1937,
+ "step": 23281
+ },
+ {
+ "epoch": 63.438692098092645,
+ "grad_norm": 3.03531813621521,
+ "learning_rate": 6.228982423331519e-06,
+ "loss": 0.0462,
+ "step": 23282
+ },
+ {
+ "epoch": 63.44141689373297,
+ "grad_norm": 4.1016364097595215,
+ "learning_rate": 6.228165096342456e-06,
+ "loss": 0.1717,
+ "step": 23283
+ },
+ {
+ "epoch": 63.444141689373296,
+ "grad_norm": 3.0312306880950928,
+ "learning_rate": 6.227347798728319e-06,
+ "loss": 0.0757,
+ "step": 23284
+ },
+ {
+ "epoch": 63.44686648501362,
+ "grad_norm": 3.6765177249908447,
+ "learning_rate": 6.2265305304954796e-06,
+ "loss": 0.0562,
+ "step": 23285
+ },
+ {
+ "epoch": 63.44959128065395,
+ "grad_norm": 4.016444206237793,
+ "learning_rate": 6.225713291650295e-06,
+ "loss": 0.0948,
+ "step": 23286
+ },
+ {
+ "epoch": 63.45231607629428,
+ "grad_norm": 2.561192750930786,
+ "learning_rate": 6.224896082199137e-06,
+ "loss": 0.0612,
+ "step": 23287
+ },
+ {
+ "epoch": 63.45504087193461,
+ "grad_norm": 4.448768615722656,
+ "learning_rate": 6.224078902148365e-06,
+ "loss": 0.1659,
+ "step": 23288
+ },
+ {
+ "epoch": 63.45776566757493,
+ "grad_norm": 3.9424736499786377,
+ "learning_rate": 6.223261751504343e-06,
+ "loss": 0.0883,
+ "step": 23289
+ },
+ {
+ "epoch": 63.46049046321526,
+ "grad_norm": 2.7465972900390625,
+ "learning_rate": 6.222444630273439e-06,
+ "loss": 0.1047,
+ "step": 23290
+ },
+ {
+ "epoch": 63.463215258855584,
+ "grad_norm": 3.563305139541626,
+ "learning_rate": 6.221627538462015e-06,
+ "loss": 0.1321,
+ "step": 23291
+ },
+ {
+ "epoch": 63.46594005449591,
+ "grad_norm": 2.556574583053589,
+ "learning_rate": 6.2208104760764355e-06,
+ "loss": 0.0486,
+ "step": 23292
+ },
+ {
+ "epoch": 63.46866485013624,
+ "grad_norm": 3.7904469966888428,
+ "learning_rate": 6.21999344312306e-06,
+ "loss": 0.2267,
+ "step": 23293
+ },
+ {
+ "epoch": 63.47138964577657,
+ "grad_norm": 3.538381576538086,
+ "learning_rate": 6.219176439608256e-06,
+ "loss": 0.0865,
+ "step": 23294
+ },
+ {
+ "epoch": 63.474114441416894,
+ "grad_norm": 5.882189750671387,
+ "learning_rate": 6.218359465538383e-06,
+ "loss": 0.1995,
+ "step": 23295
+ },
+ {
+ "epoch": 63.47683923705722,
+ "grad_norm": 4.156144142150879,
+ "learning_rate": 6.217542520919806e-06,
+ "loss": 0.1735,
+ "step": 23296
+ },
+ {
+ "epoch": 63.479564032697546,
+ "grad_norm": 3.2747654914855957,
+ "learning_rate": 6.2167256057588845e-06,
+ "loss": 0.2048,
+ "step": 23297
+ },
+ {
+ "epoch": 63.48228882833787,
+ "grad_norm": 4.409388065338135,
+ "learning_rate": 6.215908720061983e-06,
+ "loss": 0.1567,
+ "step": 23298
+ },
+ {
+ "epoch": 63.485013623978205,
+ "grad_norm": 3.5134851932525635,
+ "learning_rate": 6.2150918638354614e-06,
+ "loss": 0.0733,
+ "step": 23299
+ },
+ {
+ "epoch": 63.48773841961853,
+ "grad_norm": 2.8112776279449463,
+ "learning_rate": 6.214275037085685e-06,
+ "loss": 0.0524,
+ "step": 23300
+ },
+ {
+ "epoch": 63.490463215258856,
+ "grad_norm": 2.8188395500183105,
+ "learning_rate": 6.21345823981901e-06,
+ "loss": 0.1395,
+ "step": 23301
+ },
+ {
+ "epoch": 63.49318801089918,
+ "grad_norm": 3.1712307929992676,
+ "learning_rate": 6.212641472041803e-06,
+ "loss": 0.047,
+ "step": 23302
+ },
+ {
+ "epoch": 63.49591280653951,
+ "grad_norm": 6.838955879211426,
+ "learning_rate": 6.211824733760421e-06,
+ "loss": 0.1084,
+ "step": 23303
+ },
+ {
+ "epoch": 63.49863760217983,
+ "grad_norm": 9.094196319580078,
+ "learning_rate": 6.211008024981224e-06,
+ "loss": 0.0401,
+ "step": 23304
+ },
+ {
+ "epoch": 63.50136239782017,
+ "grad_norm": 3.0622928142547607,
+ "learning_rate": 6.210191345710579e-06,
+ "loss": 0.0586,
+ "step": 23305
+ },
+ {
+ "epoch": 63.50408719346049,
+ "grad_norm": 2.8008289337158203,
+ "learning_rate": 6.209374695954835e-06,
+ "loss": 0.0498,
+ "step": 23306
+ },
+ {
+ "epoch": 63.50681198910082,
+ "grad_norm": 3.7828431129455566,
+ "learning_rate": 6.208558075720363e-06,
+ "loss": 0.1245,
+ "step": 23307
+ },
+ {
+ "epoch": 63.509536784741144,
+ "grad_norm": 2.386240243911743,
+ "learning_rate": 6.20774148501352e-06,
+ "loss": 0.0478,
+ "step": 23308
+ },
+ {
+ "epoch": 63.51226158038147,
+ "grad_norm": 3.705430030822754,
+ "learning_rate": 6.206924923840663e-06,
+ "loss": 0.0741,
+ "step": 23309
+ },
+ {
+ "epoch": 63.514986376021795,
+ "grad_norm": 4.189337253570557,
+ "learning_rate": 6.206108392208153e-06,
+ "loss": 0.1043,
+ "step": 23310
+ },
+ {
+ "epoch": 63.51771117166213,
+ "grad_norm": 5.269558906555176,
+ "learning_rate": 6.205291890122348e-06,
+ "loss": 0.1404,
+ "step": 23311
+ },
+ {
+ "epoch": 63.520435967302454,
+ "grad_norm": 2.9411356449127197,
+ "learning_rate": 6.204475417589609e-06,
+ "loss": 0.0504,
+ "step": 23312
+ },
+ {
+ "epoch": 63.52316076294278,
+ "grad_norm": 4.213926792144775,
+ "learning_rate": 6.203658974616291e-06,
+ "loss": 0.1546,
+ "step": 23313
+ },
+ {
+ "epoch": 63.525885558583106,
+ "grad_norm": 3.6228363513946533,
+ "learning_rate": 6.202842561208759e-06,
+ "loss": 0.0669,
+ "step": 23314
+ },
+ {
+ "epoch": 63.52861035422343,
+ "grad_norm": 3.2594707012176514,
+ "learning_rate": 6.2020261773733624e-06,
+ "loss": 0.1955,
+ "step": 23315
+ },
+ {
+ "epoch": 63.53133514986376,
+ "grad_norm": 4.12902307510376,
+ "learning_rate": 6.201209823116466e-06,
+ "loss": 0.1094,
+ "step": 23316
+ },
+ {
+ "epoch": 63.53405994550409,
+ "grad_norm": 4.914697647094727,
+ "learning_rate": 6.200393498444424e-06,
+ "loss": 0.0828,
+ "step": 23317
+ },
+ {
+ "epoch": 63.536784741144416,
+ "grad_norm": 3.1628105640411377,
+ "learning_rate": 6.199577203363597e-06,
+ "loss": 0.0857,
+ "step": 23318
+ },
+ {
+ "epoch": 63.53950953678474,
+ "grad_norm": 3.894613742828369,
+ "learning_rate": 6.198760937880339e-06,
+ "loss": 0.1076,
+ "step": 23319
+ },
+ {
+ "epoch": 63.54223433242507,
+ "grad_norm": 7.148128032684326,
+ "learning_rate": 6.197944702001009e-06,
+ "loss": 0.106,
+ "step": 23320
+ },
+ {
+ "epoch": 63.54495912806539,
+ "grad_norm": 2.830425977706909,
+ "learning_rate": 6.197128495731964e-06,
+ "loss": 0.089,
+ "step": 23321
+ },
+ {
+ "epoch": 63.54768392370572,
+ "grad_norm": 3.2133290767669678,
+ "learning_rate": 6.196312319079558e-06,
+ "loss": 0.0776,
+ "step": 23322
+ },
+ {
+ "epoch": 63.55040871934605,
+ "grad_norm": 2.6843209266662598,
+ "learning_rate": 6.195496172050146e-06,
+ "loss": 0.1461,
+ "step": 23323
+ },
+ {
+ "epoch": 63.55313351498638,
+ "grad_norm": 3.6621501445770264,
+ "learning_rate": 6.194680054650093e-06,
+ "loss": 0.0686,
+ "step": 23324
+ },
+ {
+ "epoch": 63.555858310626704,
+ "grad_norm": 3.502528667449951,
+ "learning_rate": 6.193863966885746e-06,
+ "loss": 0.0671,
+ "step": 23325
+ },
+ {
+ "epoch": 63.55858310626703,
+ "grad_norm": 3.7787718772888184,
+ "learning_rate": 6.193047908763468e-06,
+ "loss": 0.1247,
+ "step": 23326
+ },
+ {
+ "epoch": 63.561307901907355,
+ "grad_norm": 4.0733137130737305,
+ "learning_rate": 6.192231880289605e-06,
+ "loss": 0.1937,
+ "step": 23327
+ },
+ {
+ "epoch": 63.56403269754768,
+ "grad_norm": 4.627094745635986,
+ "learning_rate": 6.191415881470523e-06,
+ "loss": 0.1104,
+ "step": 23328
+ },
+ {
+ "epoch": 63.566757493188014,
+ "grad_norm": 4.041052341461182,
+ "learning_rate": 6.190599912312567e-06,
+ "loss": 0.0751,
+ "step": 23329
+ },
+ {
+ "epoch": 63.56948228882834,
+ "grad_norm": 4.6674089431762695,
+ "learning_rate": 6.189783972822101e-06,
+ "loss": 0.2169,
+ "step": 23330
+ },
+ {
+ "epoch": 63.572207084468666,
+ "grad_norm": 3.0642614364624023,
+ "learning_rate": 6.18896806300547e-06,
+ "loss": 0.1121,
+ "step": 23331
+ },
+ {
+ "epoch": 63.57493188010899,
+ "grad_norm": 2.9342877864837646,
+ "learning_rate": 6.188152182869037e-06,
+ "loss": 0.052,
+ "step": 23332
+ },
+ {
+ "epoch": 63.57765667574932,
+ "grad_norm": 7.390470027923584,
+ "learning_rate": 6.187336332419149e-06,
+ "loss": 0.0707,
+ "step": 23333
+ },
+ {
+ "epoch": 63.58038147138964,
+ "grad_norm": 3.899533271789551,
+ "learning_rate": 6.186520511662167e-06,
+ "loss": 0.0682,
+ "step": 23334
+ },
+ {
+ "epoch": 63.583106267029976,
+ "grad_norm": 2.7589640617370605,
+ "learning_rate": 6.185704720604435e-06,
+ "loss": 0.0457,
+ "step": 23335
+ },
+ {
+ "epoch": 63.5858310626703,
+ "grad_norm": 4.35020637512207,
+ "learning_rate": 6.184888959252317e-06,
+ "loss": 0.0815,
+ "step": 23336
+ },
+ {
+ "epoch": 63.58855585831063,
+ "grad_norm": 3.891713857650757,
+ "learning_rate": 6.184073227612158e-06,
+ "loss": 0.0616,
+ "step": 23337
+ },
+ {
+ "epoch": 63.59128065395095,
+ "grad_norm": 3.372689962387085,
+ "learning_rate": 6.183257525690316e-06,
+ "loss": 0.1289,
+ "step": 23338
+ },
+ {
+ "epoch": 63.59400544959128,
+ "grad_norm": 4.840092182159424,
+ "learning_rate": 6.182441853493139e-06,
+ "loss": 0.0915,
+ "step": 23339
+ },
+ {
+ "epoch": 63.596730245231605,
+ "grad_norm": 3.8786606788635254,
+ "learning_rate": 6.181626211026979e-06,
+ "loss": 0.1452,
+ "step": 23340
+ },
+ {
+ "epoch": 63.59945504087194,
+ "grad_norm": 4.334212779998779,
+ "learning_rate": 6.180810598298197e-06,
+ "loss": 0.1316,
+ "step": 23341
+ },
+ {
+ "epoch": 63.60217983651226,
+ "grad_norm": 3.7547287940979004,
+ "learning_rate": 6.179995015313136e-06,
+ "loss": 0.0625,
+ "step": 23342
+ },
+ {
+ "epoch": 63.60490463215259,
+ "grad_norm": 3.1574583053588867,
+ "learning_rate": 6.1791794620781535e-06,
+ "loss": 0.0625,
+ "step": 23343
+ },
+ {
+ "epoch": 63.607629427792915,
+ "grad_norm": 3.161449670791626,
+ "learning_rate": 6.178363938599596e-06,
+ "loss": 0.1815,
+ "step": 23344
+ },
+ {
+ "epoch": 63.61035422343324,
+ "grad_norm": 3.764359712600708,
+ "learning_rate": 6.1775484448838184e-06,
+ "loss": 0.0677,
+ "step": 23345
+ },
+ {
+ "epoch": 63.61307901907357,
+ "grad_norm": 2.69553804397583,
+ "learning_rate": 6.176732980937171e-06,
+ "loss": 0.0426,
+ "step": 23346
+ },
+ {
+ "epoch": 63.6158038147139,
+ "grad_norm": 2.6529035568237305,
+ "learning_rate": 6.175917546766003e-06,
+ "loss": 0.0488,
+ "step": 23347
+ },
+ {
+ "epoch": 63.618528610354225,
+ "grad_norm": 3.1602330207824707,
+ "learning_rate": 6.175102142376668e-06,
+ "loss": 0.1056,
+ "step": 23348
+ },
+ {
+ "epoch": 63.62125340599455,
+ "grad_norm": 3.942868947982788,
+ "learning_rate": 6.1742867677755115e-06,
+ "loss": 0.089,
+ "step": 23349
+ },
+ {
+ "epoch": 63.62397820163488,
+ "grad_norm": 3.5963327884674072,
+ "learning_rate": 6.173471422968889e-06,
+ "loss": 0.1397,
+ "step": 23350
+ },
+ {
+ "epoch": 63.6267029972752,
+ "grad_norm": 3.471452474594116,
+ "learning_rate": 6.172656107963146e-06,
+ "loss": 0.0894,
+ "step": 23351
+ },
+ {
+ "epoch": 63.62942779291553,
+ "grad_norm": 3.224921464920044,
+ "learning_rate": 6.171840822764636e-06,
+ "loss": 0.077,
+ "step": 23352
+ },
+ {
+ "epoch": 63.63215258855586,
+ "grad_norm": 4.43481969833374,
+ "learning_rate": 6.1710255673797045e-06,
+ "loss": 0.1299,
+ "step": 23353
+ },
+ {
+ "epoch": 63.63487738419619,
+ "grad_norm": 3.6068527698516846,
+ "learning_rate": 6.170210341814705e-06,
+ "loss": 0.0552,
+ "step": 23354
+ },
+ {
+ "epoch": 63.63760217983651,
+ "grad_norm": 3.184776782989502,
+ "learning_rate": 6.169395146075982e-06,
+ "loss": 0.1718,
+ "step": 23355
+ },
+ {
+ "epoch": 63.64032697547684,
+ "grad_norm": 3.762660026550293,
+ "learning_rate": 6.168579980169889e-06,
+ "loss": 0.1105,
+ "step": 23356
+ },
+ {
+ "epoch": 63.643051771117165,
+ "grad_norm": 3.6248199939727783,
+ "learning_rate": 6.167764844102766e-06,
+ "loss": 0.0953,
+ "step": 23357
+ },
+ {
+ "epoch": 63.64577656675749,
+ "grad_norm": 3.9380240440368652,
+ "learning_rate": 6.16694973788097e-06,
+ "loss": 0.1276,
+ "step": 23358
+ },
+ {
+ "epoch": 63.64850136239782,
+ "grad_norm": 3.3067786693573,
+ "learning_rate": 6.166134661510848e-06,
+ "loss": 0.2126,
+ "step": 23359
+ },
+ {
+ "epoch": 63.65122615803815,
+ "grad_norm": 3.041841506958008,
+ "learning_rate": 6.165319614998744e-06,
+ "loss": 0.0539,
+ "step": 23360
+ },
+ {
+ "epoch": 63.653950953678475,
+ "grad_norm": 3.897139549255371,
+ "learning_rate": 6.164504598351009e-06,
+ "loss": 0.0902,
+ "step": 23361
+ },
+ {
+ "epoch": 63.6566757493188,
+ "grad_norm": 4.920825004577637,
+ "learning_rate": 6.1636896115739864e-06,
+ "loss": 0.119,
+ "step": 23362
+ },
+ {
+ "epoch": 63.65940054495913,
+ "grad_norm": 5.995110511779785,
+ "learning_rate": 6.1628746546740295e-06,
+ "loss": 0.12,
+ "step": 23363
+ },
+ {
+ "epoch": 63.66212534059945,
+ "grad_norm": 2.7097299098968506,
+ "learning_rate": 6.162059727657477e-06,
+ "loss": 0.0461,
+ "step": 23364
+ },
+ {
+ "epoch": 63.664850136239785,
+ "grad_norm": 3.5396687984466553,
+ "learning_rate": 6.161244830530684e-06,
+ "loss": 0.0666,
+ "step": 23365
+ },
+ {
+ "epoch": 63.66757493188011,
+ "grad_norm": 3.118617057800293,
+ "learning_rate": 6.1604299632999885e-06,
+ "loss": 0.076,
+ "step": 23366
+ },
+ {
+ "epoch": 63.67029972752044,
+ "grad_norm": 2.875271797180176,
+ "learning_rate": 6.159615125971743e-06,
+ "loss": 0.0653,
+ "step": 23367
+ },
+ {
+ "epoch": 63.67302452316076,
+ "grad_norm": 3.1477246284484863,
+ "learning_rate": 6.158800318552292e-06,
+ "loss": 0.052,
+ "step": 23368
+ },
+ {
+ "epoch": 63.67574931880109,
+ "grad_norm": 2.3785343170166016,
+ "learning_rate": 6.157985541047979e-06,
+ "loss": 0.0805,
+ "step": 23369
+ },
+ {
+ "epoch": 63.678474114441414,
+ "grad_norm": 3.3399782180786133,
+ "learning_rate": 6.157170793465153e-06,
+ "loss": 0.0467,
+ "step": 23370
+ },
+ {
+ "epoch": 63.68119891008175,
+ "grad_norm": 3.1951773166656494,
+ "learning_rate": 6.156356075810154e-06,
+ "loss": 0.0588,
+ "step": 23371
+ },
+ {
+ "epoch": 63.68392370572207,
+ "grad_norm": 4.3294291496276855,
+ "learning_rate": 6.155541388089332e-06,
+ "loss": 0.0572,
+ "step": 23372
+ },
+ {
+ "epoch": 63.6866485013624,
+ "grad_norm": 3.3137307167053223,
+ "learning_rate": 6.15472673030903e-06,
+ "loss": 0.1471,
+ "step": 23373
+ },
+ {
+ "epoch": 63.689373297002724,
+ "grad_norm": 4.323788642883301,
+ "learning_rate": 6.1539121024755935e-06,
+ "loss": 0.0858,
+ "step": 23374
+ },
+ {
+ "epoch": 63.69209809264305,
+ "grad_norm": 8.91159439086914,
+ "learning_rate": 6.153097504595362e-06,
+ "loss": 0.1609,
+ "step": 23375
+ },
+ {
+ "epoch": 63.694822888283376,
+ "grad_norm": 3.2635562419891357,
+ "learning_rate": 6.152282936674685e-06,
+ "loss": 0.0982,
+ "step": 23376
+ },
+ {
+ "epoch": 63.69754768392371,
+ "grad_norm": 6.164497375488281,
+ "learning_rate": 6.151468398719906e-06,
+ "loss": 0.0945,
+ "step": 23377
+ },
+ {
+ "epoch": 63.700272479564035,
+ "grad_norm": 3.8145058155059814,
+ "learning_rate": 6.1506538907373655e-06,
+ "loss": 0.1023,
+ "step": 23378
+ },
+ {
+ "epoch": 63.70299727520436,
+ "grad_norm": 8.545085906982422,
+ "learning_rate": 6.149839412733411e-06,
+ "loss": 0.1553,
+ "step": 23379
+ },
+ {
+ "epoch": 63.705722070844686,
+ "grad_norm": 3.8043572902679443,
+ "learning_rate": 6.149024964714382e-06,
+ "loss": 0.0795,
+ "step": 23380
+ },
+ {
+ "epoch": 63.70844686648501,
+ "grad_norm": 5.421295642852783,
+ "learning_rate": 6.148210546686624e-06,
+ "loss": 0.1608,
+ "step": 23381
+ },
+ {
+ "epoch": 63.71117166212534,
+ "grad_norm": 4.151515007019043,
+ "learning_rate": 6.1473961586564756e-06,
+ "loss": 0.1208,
+ "step": 23382
+ },
+ {
+ "epoch": 63.71389645776567,
+ "grad_norm": 3.885204553604126,
+ "learning_rate": 6.146581800630285e-06,
+ "loss": 0.05,
+ "step": 23383
+ },
+ {
+ "epoch": 63.716621253406,
+ "grad_norm": 5.078805923461914,
+ "learning_rate": 6.145767472614389e-06,
+ "loss": 0.0525,
+ "step": 23384
+ },
+ {
+ "epoch": 63.71934604904632,
+ "grad_norm": 13.722284317016602,
+ "learning_rate": 6.144953174615133e-06,
+ "loss": 0.1069,
+ "step": 23385
+ },
+ {
+ "epoch": 63.72207084468665,
+ "grad_norm": 2.9433112144470215,
+ "learning_rate": 6.1441389066388565e-06,
+ "loss": 0.0536,
+ "step": 23386
+ },
+ {
+ "epoch": 63.724795640326974,
+ "grad_norm": 5.2005934715271,
+ "learning_rate": 6.143324668691904e-06,
+ "loss": 0.0922,
+ "step": 23387
+ },
+ {
+ "epoch": 63.7275204359673,
+ "grad_norm": 32.43373107910156,
+ "learning_rate": 6.142510460780613e-06,
+ "loss": 0.1307,
+ "step": 23388
+ },
+ {
+ "epoch": 63.73024523160763,
+ "grad_norm": 3.6497414112091064,
+ "learning_rate": 6.141696282911328e-06,
+ "loss": 0.1544,
+ "step": 23389
+ },
+ {
+ "epoch": 63.73297002724796,
+ "grad_norm": 2.5020391941070557,
+ "learning_rate": 6.140882135090387e-06,
+ "loss": 0.0819,
+ "step": 23390
+ },
+ {
+ "epoch": 63.735694822888284,
+ "grad_norm": 10.11089038848877,
+ "learning_rate": 6.14006801732413e-06,
+ "loss": 0.1541,
+ "step": 23391
+ },
+ {
+ "epoch": 63.73841961852861,
+ "grad_norm": 5.140850067138672,
+ "learning_rate": 6.139253929618898e-06,
+ "loss": 0.1014,
+ "step": 23392
+ },
+ {
+ "epoch": 63.741144414168936,
+ "grad_norm": 3.9001197814941406,
+ "learning_rate": 6.138439871981037e-06,
+ "loss": 0.075,
+ "step": 23393
+ },
+ {
+ "epoch": 63.74386920980926,
+ "grad_norm": 3.613224744796753,
+ "learning_rate": 6.137625844416879e-06,
+ "loss": 0.0802,
+ "step": 23394
+ },
+ {
+ "epoch": 63.746594005449595,
+ "grad_norm": 4.303200721740723,
+ "learning_rate": 6.136811846932769e-06,
+ "loss": 0.2148,
+ "step": 23395
+ },
+ {
+ "epoch": 63.74931880108992,
+ "grad_norm": 3.9668211936950684,
+ "learning_rate": 6.135997879535042e-06,
+ "loss": 0.1465,
+ "step": 23396
+ },
+ {
+ "epoch": 63.752043596730246,
+ "grad_norm": 6.469911098480225,
+ "learning_rate": 6.135183942230041e-06,
+ "loss": 0.0962,
+ "step": 23397
+ },
+ {
+ "epoch": 63.75476839237057,
+ "grad_norm": 2.9736506938934326,
+ "learning_rate": 6.1343700350241005e-06,
+ "loss": 0.1374,
+ "step": 23398
+ },
+ {
+ "epoch": 63.7574931880109,
+ "grad_norm": 4.08699369430542,
+ "learning_rate": 6.133556157923565e-06,
+ "loss": 0.2162,
+ "step": 23399
+ },
+ {
+ "epoch": 63.76021798365122,
+ "grad_norm": 10.112793922424316,
+ "learning_rate": 6.132742310934767e-06,
+ "loss": 0.1232,
+ "step": 23400
+ },
+ {
+ "epoch": 63.762942779291556,
+ "grad_norm": 2.8908116817474365,
+ "learning_rate": 6.131928494064049e-06,
+ "loss": 0.063,
+ "step": 23401
+ },
+ {
+ "epoch": 63.76566757493188,
+ "grad_norm": 3.213243007659912,
+ "learning_rate": 6.1311147073177455e-06,
+ "loss": 0.0645,
+ "step": 23402
+ },
+ {
+ "epoch": 63.76839237057221,
+ "grad_norm": 3.9643075466156006,
+ "learning_rate": 6.1303009507021995e-06,
+ "loss": 0.071,
+ "step": 23403
+ },
+ {
+ "epoch": 63.771117166212534,
+ "grad_norm": 4.139108180999756,
+ "learning_rate": 6.129487224223741e-06,
+ "loss": 0.0958,
+ "step": 23404
+ },
+ {
+ "epoch": 63.77384196185286,
+ "grad_norm": 2.657076835632324,
+ "learning_rate": 6.128673527888715e-06,
+ "loss": 0.1464,
+ "step": 23405
+ },
+ {
+ "epoch": 63.776566757493185,
+ "grad_norm": 4.322707176208496,
+ "learning_rate": 6.127859861703453e-06,
+ "loss": 0.0725,
+ "step": 23406
+ },
+ {
+ "epoch": 63.77929155313352,
+ "grad_norm": 4.337071418762207,
+ "learning_rate": 6.127046225674294e-06,
+ "loss": 0.0573,
+ "step": 23407
+ },
+ {
+ "epoch": 63.782016348773844,
+ "grad_norm": 3.0265305042266846,
+ "learning_rate": 6.126232619807575e-06,
+ "loss": 0.089,
+ "step": 23408
+ },
+ {
+ "epoch": 63.78474114441417,
+ "grad_norm": 4.078360080718994,
+ "learning_rate": 6.125419044109629e-06,
+ "loss": 0.1439,
+ "step": 23409
+ },
+ {
+ "epoch": 63.787465940054496,
+ "grad_norm": 3.665076971054077,
+ "learning_rate": 6.124605498586796e-06,
+ "loss": 0.0772,
+ "step": 23410
+ },
+ {
+ "epoch": 63.79019073569482,
+ "grad_norm": 3.631455183029175,
+ "learning_rate": 6.123791983245411e-06,
+ "loss": 0.2251,
+ "step": 23411
+ },
+ {
+ "epoch": 63.79291553133515,
+ "grad_norm": 4.092085838317871,
+ "learning_rate": 6.122978498091809e-06,
+ "loss": 0.1069,
+ "step": 23412
+ },
+ {
+ "epoch": 63.79564032697548,
+ "grad_norm": 3.549079656600952,
+ "learning_rate": 6.1221650431323285e-06,
+ "loss": 0.0529,
+ "step": 23413
+ },
+ {
+ "epoch": 63.798365122615806,
+ "grad_norm": 4.666623592376709,
+ "learning_rate": 6.121351618373299e-06,
+ "loss": 0.1635,
+ "step": 23414
+ },
+ {
+ "epoch": 63.80108991825613,
+ "grad_norm": 4.067806243896484,
+ "learning_rate": 6.12053822382106e-06,
+ "loss": 0.1598,
+ "step": 23415
+ },
+ {
+ "epoch": 63.80381471389646,
+ "grad_norm": 3.807265520095825,
+ "learning_rate": 6.119724859481943e-06,
+ "loss": 0.2297,
+ "step": 23416
+ },
+ {
+ "epoch": 63.80653950953678,
+ "grad_norm": 5.882267951965332,
+ "learning_rate": 6.1189115253622855e-06,
+ "loss": 0.0705,
+ "step": 23417
+ },
+ {
+ "epoch": 63.80926430517711,
+ "grad_norm": 4.377636909484863,
+ "learning_rate": 6.118098221468418e-06,
+ "loss": 0.0788,
+ "step": 23418
+ },
+ {
+ "epoch": 63.81198910081744,
+ "grad_norm": 4.685329914093018,
+ "learning_rate": 6.117284947806679e-06,
+ "loss": 0.1384,
+ "step": 23419
+ },
+ {
+ "epoch": 63.81471389645777,
+ "grad_norm": 3.047091007232666,
+ "learning_rate": 6.116471704383397e-06,
+ "loss": 0.0516,
+ "step": 23420
+ },
+ {
+ "epoch": 63.817438692098094,
+ "grad_norm": 5.363067626953125,
+ "learning_rate": 6.1156584912049126e-06,
+ "loss": 0.1065,
+ "step": 23421
+ },
+ {
+ "epoch": 63.82016348773842,
+ "grad_norm": 4.223793983459473,
+ "learning_rate": 6.114845308277551e-06,
+ "loss": 0.1137,
+ "step": 23422
+ },
+ {
+ "epoch": 63.822888283378745,
+ "grad_norm": 8.914681434631348,
+ "learning_rate": 6.114032155607651e-06,
+ "loss": 0.0651,
+ "step": 23423
+ },
+ {
+ "epoch": 63.82561307901907,
+ "grad_norm": 4.6169586181640625,
+ "learning_rate": 6.113219033201543e-06,
+ "loss": 0.0403,
+ "step": 23424
+ },
+ {
+ "epoch": 63.828337874659404,
+ "grad_norm": 4.677670955657959,
+ "learning_rate": 6.11240594106556e-06,
+ "loss": 0.1227,
+ "step": 23425
+ },
+ {
+ "epoch": 63.83106267029973,
+ "grad_norm": 4.268988132476807,
+ "learning_rate": 6.111592879206032e-06,
+ "loss": 0.0742,
+ "step": 23426
+ },
+ {
+ "epoch": 63.833787465940055,
+ "grad_norm": 3.756197690963745,
+ "learning_rate": 6.110779847629295e-06,
+ "loss": 0.1008,
+ "step": 23427
+ },
+ {
+ "epoch": 63.83651226158038,
+ "grad_norm": 3.9022650718688965,
+ "learning_rate": 6.109966846341681e-06,
+ "loss": 0.1418,
+ "step": 23428
+ },
+ {
+ "epoch": 63.83923705722071,
+ "grad_norm": 4.158533096313477,
+ "learning_rate": 6.109153875349518e-06,
+ "loss": 0.1343,
+ "step": 23429
+ },
+ {
+ "epoch": 63.84196185286103,
+ "grad_norm": 3.451460838317871,
+ "learning_rate": 6.1083409346591425e-06,
+ "loss": 0.1802,
+ "step": 23430
+ },
+ {
+ "epoch": 63.844686648501366,
+ "grad_norm": 2.8260531425476074,
+ "learning_rate": 6.1075280242768785e-06,
+ "loss": 0.0645,
+ "step": 23431
+ },
+ {
+ "epoch": 63.84741144414169,
+ "grad_norm": 3.1926558017730713,
+ "learning_rate": 6.106715144209063e-06,
+ "loss": 0.0895,
+ "step": 23432
+ },
+ {
+ "epoch": 63.85013623978202,
+ "grad_norm": 2.9613037109375,
+ "learning_rate": 6.105902294462026e-06,
+ "loss": 0.0688,
+ "step": 23433
+ },
+ {
+ "epoch": 63.85286103542234,
+ "grad_norm": 2.9341928958892822,
+ "learning_rate": 6.105089475042094e-06,
+ "loss": 0.0531,
+ "step": 23434
+ },
+ {
+ "epoch": 63.85558583106267,
+ "grad_norm": 3.9897468090057373,
+ "learning_rate": 6.104276685955603e-06,
+ "loss": 0.1707,
+ "step": 23435
+ },
+ {
+ "epoch": 63.858310626702995,
+ "grad_norm": 2.8880317211151123,
+ "learning_rate": 6.103463927208877e-06,
+ "loss": 0.1079,
+ "step": 23436
+ },
+ {
+ "epoch": 63.86103542234333,
+ "grad_norm": 3.641231060028076,
+ "learning_rate": 6.10265119880825e-06,
+ "loss": 0.0816,
+ "step": 23437
+ },
+ {
+ "epoch": 63.86376021798365,
+ "grad_norm": 4.001800537109375,
+ "learning_rate": 6.101838500760049e-06,
+ "loss": 0.1587,
+ "step": 23438
+ },
+ {
+ "epoch": 63.86648501362398,
+ "grad_norm": 3.740647554397583,
+ "learning_rate": 6.101025833070607e-06,
+ "loss": 0.0818,
+ "step": 23439
+ },
+ {
+ "epoch": 63.869209809264305,
+ "grad_norm": 3.308682441711426,
+ "learning_rate": 6.100213195746246e-06,
+ "loss": 0.0719,
+ "step": 23440
+ },
+ {
+ "epoch": 63.87193460490463,
+ "grad_norm": 3.250107765197754,
+ "learning_rate": 6.099400588793303e-06,
+ "loss": 0.2026,
+ "step": 23441
+ },
+ {
+ "epoch": 63.87465940054496,
+ "grad_norm": 3.7879693508148193,
+ "learning_rate": 6.0985880122181e-06,
+ "loss": 0.247,
+ "step": 23442
+ },
+ {
+ "epoch": 63.87738419618529,
+ "grad_norm": 4.270380020141602,
+ "learning_rate": 6.097775466026966e-06,
+ "loss": 0.186,
+ "step": 23443
+ },
+ {
+ "epoch": 63.880108991825615,
+ "grad_norm": 6.7312164306640625,
+ "learning_rate": 6.096962950226235e-06,
+ "loss": 0.059,
+ "step": 23444
+ },
+ {
+ "epoch": 63.88283378746594,
+ "grad_norm": 4.286167621612549,
+ "learning_rate": 6.096150464822229e-06,
+ "loss": 0.1302,
+ "step": 23445
+ },
+ {
+ "epoch": 63.88555858310627,
+ "grad_norm": 3.4437525272369385,
+ "learning_rate": 6.095338009821279e-06,
+ "loss": 0.0749,
+ "step": 23446
+ },
+ {
+ "epoch": 63.88828337874659,
+ "grad_norm": 3.741774559020996,
+ "learning_rate": 6.09452558522971e-06,
+ "loss": 0.0961,
+ "step": 23447
+ },
+ {
+ "epoch": 63.89100817438692,
+ "grad_norm": 4.192138195037842,
+ "learning_rate": 6.093713191053852e-06,
+ "loss": 0.1778,
+ "step": 23448
+ },
+ {
+ "epoch": 63.89373297002725,
+ "grad_norm": 4.225839614868164,
+ "learning_rate": 6.092900827300028e-06,
+ "loss": 0.0554,
+ "step": 23449
+ },
+ {
+ "epoch": 63.89645776566758,
+ "grad_norm": 2.9316306114196777,
+ "learning_rate": 6.0920884939745675e-06,
+ "loss": 0.0339,
+ "step": 23450
+ },
+ {
+ "epoch": 63.8991825613079,
+ "grad_norm": 4.158364295959473,
+ "learning_rate": 6.091276191083795e-06,
+ "loss": 0.1724,
+ "step": 23451
+ },
+ {
+ "epoch": 63.90190735694823,
+ "grad_norm": 2.9727489948272705,
+ "learning_rate": 6.090463918634039e-06,
+ "loss": 0.0573,
+ "step": 23452
+ },
+ {
+ "epoch": 63.904632152588555,
+ "grad_norm": 2.535248279571533,
+ "learning_rate": 6.089651676631623e-06,
+ "loss": 0.0386,
+ "step": 23453
+ },
+ {
+ "epoch": 63.90735694822888,
+ "grad_norm": 3.114696502685547,
+ "learning_rate": 6.088839465082873e-06,
+ "loss": 0.3108,
+ "step": 23454
+ },
+ {
+ "epoch": 63.91008174386921,
+ "grad_norm": 2.4612932205200195,
+ "learning_rate": 6.088027283994118e-06,
+ "loss": 0.0494,
+ "step": 23455
+ },
+ {
+ "epoch": 63.91280653950954,
+ "grad_norm": 2.5667924880981445,
+ "learning_rate": 6.087215133371678e-06,
+ "loss": 0.0502,
+ "step": 23456
+ },
+ {
+ "epoch": 63.915531335149865,
+ "grad_norm": 4.460409164428711,
+ "learning_rate": 6.086403013221883e-06,
+ "loss": 0.0899,
+ "step": 23457
+ },
+ {
+ "epoch": 63.91825613079019,
+ "grad_norm": 3.584872245788574,
+ "learning_rate": 6.085590923551053e-06,
+ "loss": 0.1044,
+ "step": 23458
+ },
+ {
+ "epoch": 63.920980926430516,
+ "grad_norm": 3.301926374435425,
+ "learning_rate": 6.084778864365517e-06,
+ "loss": 0.104,
+ "step": 23459
+ },
+ {
+ "epoch": 63.92370572207084,
+ "grad_norm": 3.8156473636627197,
+ "learning_rate": 6.083966835671595e-06,
+ "loss": 0.1698,
+ "step": 23460
+ },
+ {
+ "epoch": 63.926430517711175,
+ "grad_norm": 3.2632346153259277,
+ "learning_rate": 6.083154837475613e-06,
+ "loss": 0.0506,
+ "step": 23461
+ },
+ {
+ "epoch": 63.9291553133515,
+ "grad_norm": 2.7662084102630615,
+ "learning_rate": 6.082342869783897e-06,
+ "loss": 0.1222,
+ "step": 23462
+ },
+ {
+ "epoch": 63.93188010899183,
+ "grad_norm": 3.916504383087158,
+ "learning_rate": 6.081530932602768e-06,
+ "loss": 0.0466,
+ "step": 23463
+ },
+ {
+ "epoch": 63.93460490463215,
+ "grad_norm": 3.228099822998047,
+ "learning_rate": 6.0807190259385506e-06,
+ "loss": 0.0453,
+ "step": 23464
+ },
+ {
+ "epoch": 63.93732970027248,
+ "grad_norm": 2.837225914001465,
+ "learning_rate": 6.079907149797567e-06,
+ "loss": 0.0531,
+ "step": 23465
+ },
+ {
+ "epoch": 63.940054495912804,
+ "grad_norm": 5.713571071624756,
+ "learning_rate": 6.079095304186141e-06,
+ "loss": 0.152,
+ "step": 23466
+ },
+ {
+ "epoch": 63.94277929155314,
+ "grad_norm": 5.183123588562012,
+ "learning_rate": 6.078283489110593e-06,
+ "loss": 0.0838,
+ "step": 23467
+ },
+ {
+ "epoch": 63.94550408719346,
+ "grad_norm": 4.887022972106934,
+ "learning_rate": 6.077471704577249e-06,
+ "loss": 0.0654,
+ "step": 23468
+ },
+ {
+ "epoch": 63.94822888283379,
+ "grad_norm": 3.4347918033599854,
+ "learning_rate": 6.076659950592427e-06,
+ "loss": 0.0449,
+ "step": 23469
+ },
+ {
+ "epoch": 63.950953678474114,
+ "grad_norm": 3.740933656692505,
+ "learning_rate": 6.075848227162453e-06,
+ "loss": 0.0723,
+ "step": 23470
+ },
+ {
+ "epoch": 63.95367847411444,
+ "grad_norm": 4.064043998718262,
+ "learning_rate": 6.075036534293646e-06,
+ "loss": 0.095,
+ "step": 23471
+ },
+ {
+ "epoch": 63.956403269754766,
+ "grad_norm": 4.198511600494385,
+ "learning_rate": 6.074224871992329e-06,
+ "loss": 0.0793,
+ "step": 23472
+ },
+ {
+ "epoch": 63.95912806539509,
+ "grad_norm": 2.671219825744629,
+ "learning_rate": 6.0734132402648205e-06,
+ "loss": 0.22,
+ "step": 23473
+ },
+ {
+ "epoch": 63.961852861035425,
+ "grad_norm": 3.583232879638672,
+ "learning_rate": 6.0726016391174435e-06,
+ "loss": 0.1097,
+ "step": 23474
+ },
+ {
+ "epoch": 63.96457765667575,
+ "grad_norm": 4.212375640869141,
+ "learning_rate": 6.071790068556519e-06,
+ "loss": 0.0852,
+ "step": 23475
+ },
+ {
+ "epoch": 63.967302452316076,
+ "grad_norm": 3.3939666748046875,
+ "learning_rate": 6.070978528588369e-06,
+ "loss": 0.2639,
+ "step": 23476
+ },
+ {
+ "epoch": 63.9700272479564,
+ "grad_norm": 3.3759117126464844,
+ "learning_rate": 6.0701670192193085e-06,
+ "loss": 0.0426,
+ "step": 23477
+ },
+ {
+ "epoch": 63.97275204359673,
+ "grad_norm": 4.86347770690918,
+ "learning_rate": 6.06935554045566e-06,
+ "loss": 0.1106,
+ "step": 23478
+ },
+ {
+ "epoch": 63.97547683923706,
+ "grad_norm": 4.830080032348633,
+ "learning_rate": 6.068544092303744e-06,
+ "loss": 0.0797,
+ "step": 23479
+ },
+ {
+ "epoch": 63.97820163487739,
+ "grad_norm": 3.3038806915283203,
+ "learning_rate": 6.067732674769884e-06,
+ "loss": 0.0478,
+ "step": 23480
+ },
+ {
+ "epoch": 63.98092643051771,
+ "grad_norm": 3.3870160579681396,
+ "learning_rate": 6.0669212878603925e-06,
+ "loss": 0.047,
+ "step": 23481
+ },
+ {
+ "epoch": 63.98365122615804,
+ "grad_norm": 3.249441623687744,
+ "learning_rate": 6.066109931581594e-06,
+ "loss": 0.1047,
+ "step": 23482
+ },
+ {
+ "epoch": 63.986376021798364,
+ "grad_norm": 3.0960967540740967,
+ "learning_rate": 6.065298605939803e-06,
+ "loss": 0.0614,
+ "step": 23483
+ },
+ {
+ "epoch": 63.98910081743869,
+ "grad_norm": 4.144088268280029,
+ "learning_rate": 6.064487310941341e-06,
+ "loss": 0.1204,
+ "step": 23484
+ },
+ {
+ "epoch": 63.991825613079016,
+ "grad_norm": 3.5295004844665527,
+ "learning_rate": 6.063676046592523e-06,
+ "loss": 0.0812,
+ "step": 23485
+ },
+ {
+ "epoch": 63.99455040871935,
+ "grad_norm": 4.128300666809082,
+ "learning_rate": 6.062864812899672e-06,
+ "loss": 0.0623,
+ "step": 23486
+ },
+ {
+ "epoch": 63.997275204359674,
+ "grad_norm": 4.500547409057617,
+ "learning_rate": 6.0620536098690995e-06,
+ "loss": 0.1733,
+ "step": 23487
+ },
+ {
+ "epoch": 64.0,
+ "grad_norm": 2.8028404712677,
+ "learning_rate": 6.061242437507131e-06,
+ "loss": 0.097,
+ "step": 23488
+ },
+ {
+ "epoch": 64.00272479564033,
+ "grad_norm": 3.697244644165039,
+ "learning_rate": 6.0604312958200754e-06,
+ "loss": 0.1127,
+ "step": 23489
+ },
+ {
+ "epoch": 64.00544959128065,
+ "grad_norm": 2.81890869140625,
+ "learning_rate": 6.059620184814258e-06,
+ "loss": 0.0508,
+ "step": 23490
+ },
+ {
+ "epoch": 64.00817438692098,
+ "grad_norm": 4.149252414703369,
+ "learning_rate": 6.058809104495988e-06,
+ "loss": 0.1435,
+ "step": 23491
+ },
+ {
+ "epoch": 64.0108991825613,
+ "grad_norm": 4.215442657470703,
+ "learning_rate": 6.05799805487159e-06,
+ "loss": 0.1213,
+ "step": 23492
+ },
+ {
+ "epoch": 64.01362397820164,
+ "grad_norm": 5.0310845375061035,
+ "learning_rate": 6.057187035947373e-06,
+ "loss": 0.0664,
+ "step": 23493
+ },
+ {
+ "epoch": 64.01634877384195,
+ "grad_norm": 4.0117316246032715,
+ "learning_rate": 6.056376047729658e-06,
+ "loss": 0.057,
+ "step": 23494
+ },
+ {
+ "epoch": 64.01907356948229,
+ "grad_norm": 4.201609134674072,
+ "learning_rate": 6.055565090224756e-06,
+ "loss": 0.0598,
+ "step": 23495
+ },
+ {
+ "epoch": 64.02179836512262,
+ "grad_norm": 2.948737382888794,
+ "learning_rate": 6.054754163438989e-06,
+ "loss": 0.1505,
+ "step": 23496
+ },
+ {
+ "epoch": 64.02452316076294,
+ "grad_norm": 3.196985960006714,
+ "learning_rate": 6.053943267378668e-06,
+ "loss": 0.0358,
+ "step": 23497
+ },
+ {
+ "epoch": 64.02724795640327,
+ "grad_norm": 3.8606789112091064,
+ "learning_rate": 6.053132402050112e-06,
+ "loss": 0.1597,
+ "step": 23498
+ },
+ {
+ "epoch": 64.02997275204359,
+ "grad_norm": 2.8317203521728516,
+ "learning_rate": 6.052321567459634e-06,
+ "loss": 0.0381,
+ "step": 23499
+ },
+ {
+ "epoch": 64.03269754768392,
+ "grad_norm": 3.4053215980529785,
+ "learning_rate": 6.051510763613548e-06,
+ "loss": 0.1608,
+ "step": 23500
+ },
+ {
+ "epoch": 64.03542234332426,
+ "grad_norm": 2.6956491470336914,
+ "learning_rate": 6.0506999905181696e-06,
+ "loss": 0.066,
+ "step": 23501
+ },
+ {
+ "epoch": 64.03814713896458,
+ "grad_norm": 3.694140672683716,
+ "learning_rate": 6.049889248179812e-06,
+ "loss": 0.0862,
+ "step": 23502
+ },
+ {
+ "epoch": 64.04087193460491,
+ "grad_norm": 4.136013031005859,
+ "learning_rate": 6.049078536604789e-06,
+ "loss": 0.0517,
+ "step": 23503
+ },
+ {
+ "epoch": 64.04359673024523,
+ "grad_norm": 3.58744215965271,
+ "learning_rate": 6.048267855799417e-06,
+ "loss": 0.1088,
+ "step": 23504
+ },
+ {
+ "epoch": 64.04632152588556,
+ "grad_norm": 5.858720302581787,
+ "learning_rate": 6.047457205770006e-06,
+ "loss": 0.1104,
+ "step": 23505
+ },
+ {
+ "epoch": 64.04904632152588,
+ "grad_norm": 4.341165542602539,
+ "learning_rate": 6.046646586522873e-06,
+ "loss": 0.0937,
+ "step": 23506
+ },
+ {
+ "epoch": 64.05177111716621,
+ "grad_norm": 3.494215250015259,
+ "learning_rate": 6.045835998064326e-06,
+ "loss": 0.0948,
+ "step": 23507
+ },
+ {
+ "epoch": 64.05449591280654,
+ "grad_norm": 4.5636444091796875,
+ "learning_rate": 6.045025440400684e-06,
+ "loss": 0.0909,
+ "step": 23508
+ },
+ {
+ "epoch": 64.05722070844686,
+ "grad_norm": 3.3840458393096924,
+ "learning_rate": 6.044214913538255e-06,
+ "loss": 0.0815,
+ "step": 23509
+ },
+ {
+ "epoch": 64.0599455040872,
+ "grad_norm": 4.306269645690918,
+ "learning_rate": 6.043404417483356e-06,
+ "loss": 0.0694,
+ "step": 23510
+ },
+ {
+ "epoch": 64.06267029972751,
+ "grad_norm": 4.181427478790283,
+ "learning_rate": 6.0425939522422926e-06,
+ "loss": 0.0867,
+ "step": 23511
+ },
+ {
+ "epoch": 64.06539509536785,
+ "grad_norm": 4.496644496917725,
+ "learning_rate": 6.041783517821378e-06,
+ "loss": 0.0971,
+ "step": 23512
+ },
+ {
+ "epoch": 64.06811989100818,
+ "grad_norm": 2.958178997039795,
+ "learning_rate": 6.040973114226929e-06,
+ "loss": 0.0444,
+ "step": 23513
+ },
+ {
+ "epoch": 64.0708446866485,
+ "grad_norm": 2.571974277496338,
+ "learning_rate": 6.0401627414652545e-06,
+ "loss": 0.2193,
+ "step": 23514
+ },
+ {
+ "epoch": 64.07356948228883,
+ "grad_norm": 4.502200603485107,
+ "learning_rate": 6.039352399542665e-06,
+ "loss": 0.0657,
+ "step": 23515
+ },
+ {
+ "epoch": 64.07629427792915,
+ "grad_norm": 3.3185508251190186,
+ "learning_rate": 6.03854208846547e-06,
+ "loss": 0.0551,
+ "step": 23516
+ },
+ {
+ "epoch": 64.07901907356948,
+ "grad_norm": 3.644416093826294,
+ "learning_rate": 6.037731808239984e-06,
+ "loss": 0.0602,
+ "step": 23517
+ },
+ {
+ "epoch": 64.0817438692098,
+ "grad_norm": 3.460526466369629,
+ "learning_rate": 6.036921558872513e-06,
+ "loss": 0.0653,
+ "step": 23518
+ },
+ {
+ "epoch": 64.08446866485014,
+ "grad_norm": 4.2937703132629395,
+ "learning_rate": 6.03611134036937e-06,
+ "loss": 0.2086,
+ "step": 23519
+ },
+ {
+ "epoch": 64.08719346049047,
+ "grad_norm": 3.382347822189331,
+ "learning_rate": 6.035301152736866e-06,
+ "loss": 0.0655,
+ "step": 23520
+ },
+ {
+ "epoch": 64.08991825613079,
+ "grad_norm": 4.8122053146362305,
+ "learning_rate": 6.0344909959813055e-06,
+ "loss": 0.134,
+ "step": 23521
+ },
+ {
+ "epoch": 64.09264305177112,
+ "grad_norm": 8.842113494873047,
+ "learning_rate": 6.033680870109005e-06,
+ "loss": 0.0767,
+ "step": 23522
+ },
+ {
+ "epoch": 64.09536784741144,
+ "grad_norm": 4.6074628829956055,
+ "learning_rate": 6.032870775126268e-06,
+ "loss": 0.0574,
+ "step": 23523
+ },
+ {
+ "epoch": 64.09809264305177,
+ "grad_norm": 2.9115238189697266,
+ "learning_rate": 6.032060711039408e-06,
+ "loss": 0.0374,
+ "step": 23524
+ },
+ {
+ "epoch": 64.1008174386921,
+ "grad_norm": 4.844232082366943,
+ "learning_rate": 6.03125067785473e-06,
+ "loss": 0.1889,
+ "step": 23525
+ },
+ {
+ "epoch": 64.10354223433242,
+ "grad_norm": 3.5602612495422363,
+ "learning_rate": 6.030440675578544e-06,
+ "loss": 0.2008,
+ "step": 23526
+ },
+ {
+ "epoch": 64.10626702997276,
+ "grad_norm": 11.935846328735352,
+ "learning_rate": 6.0296307042171575e-06,
+ "loss": 0.1966,
+ "step": 23527
+ },
+ {
+ "epoch": 64.10899182561307,
+ "grad_norm": 3.367767572402954,
+ "learning_rate": 6.0288207637768815e-06,
+ "loss": 0.0498,
+ "step": 23528
+ },
+ {
+ "epoch": 64.11171662125341,
+ "grad_norm": 4.081257343292236,
+ "learning_rate": 6.028010854264017e-06,
+ "loss": 0.113,
+ "step": 23529
+ },
+ {
+ "epoch": 64.11444141689373,
+ "grad_norm": 3.3737878799438477,
+ "learning_rate": 6.027200975684879e-06,
+ "loss": 0.075,
+ "step": 23530
+ },
+ {
+ "epoch": 64.11716621253406,
+ "grad_norm": 3.344336748123169,
+ "learning_rate": 6.026391128045773e-06,
+ "loss": 0.1097,
+ "step": 23531
+ },
+ {
+ "epoch": 64.11989100817439,
+ "grad_norm": 4.564388751983643,
+ "learning_rate": 6.0255813113530036e-06,
+ "loss": 0.1994,
+ "step": 23532
+ },
+ {
+ "epoch": 64.12261580381471,
+ "grad_norm": 5.7605085372924805,
+ "learning_rate": 6.02477152561288e-06,
+ "loss": 0.0787,
+ "step": 23533
+ },
+ {
+ "epoch": 64.12534059945504,
+ "grad_norm": 4.184399604797363,
+ "learning_rate": 6.023961770831708e-06,
+ "loss": 0.2097,
+ "step": 23534
+ },
+ {
+ "epoch": 64.12806539509536,
+ "grad_norm": 4.196770668029785,
+ "learning_rate": 6.023152047015794e-06,
+ "loss": 0.0756,
+ "step": 23535
+ },
+ {
+ "epoch": 64.1307901907357,
+ "grad_norm": 4.043728351593018,
+ "learning_rate": 6.022342354171442e-06,
+ "loss": 0.1195,
+ "step": 23536
+ },
+ {
+ "epoch": 64.13351498637603,
+ "grad_norm": 3.506322145462036,
+ "learning_rate": 6.021532692304962e-06,
+ "loss": 0.0915,
+ "step": 23537
+ },
+ {
+ "epoch": 64.13623978201635,
+ "grad_norm": 3.506742477416992,
+ "learning_rate": 6.020723061422655e-06,
+ "loss": 0.0478,
+ "step": 23538
+ },
+ {
+ "epoch": 64.13896457765668,
+ "grad_norm": 3.656735420227051,
+ "learning_rate": 6.019913461530831e-06,
+ "loss": 0.0684,
+ "step": 23539
+ },
+ {
+ "epoch": 64.141689373297,
+ "grad_norm": 4.760861873626709,
+ "learning_rate": 6.019103892635791e-06,
+ "loss": 0.2306,
+ "step": 23540
+ },
+ {
+ "epoch": 64.14441416893733,
+ "grad_norm": 9.18626880645752,
+ "learning_rate": 6.018294354743842e-06,
+ "loss": 0.1383,
+ "step": 23541
+ },
+ {
+ "epoch": 64.14713896457765,
+ "grad_norm": 4.248356819152832,
+ "learning_rate": 6.01748484786129e-06,
+ "loss": 0.0574,
+ "step": 23542
+ },
+ {
+ "epoch": 64.14986376021798,
+ "grad_norm": 8.526737213134766,
+ "learning_rate": 6.016675371994436e-06,
+ "loss": 0.0503,
+ "step": 23543
+ },
+ {
+ "epoch": 64.15258855585832,
+ "grad_norm": 4.397159099578857,
+ "learning_rate": 6.015865927149588e-06,
+ "loss": 0.0593,
+ "step": 23544
+ },
+ {
+ "epoch": 64.15531335149863,
+ "grad_norm": 4.602883338928223,
+ "learning_rate": 6.015056513333046e-06,
+ "loss": 0.0727,
+ "step": 23545
+ },
+ {
+ "epoch": 64.15803814713897,
+ "grad_norm": 4.110457420349121,
+ "learning_rate": 6.014247130551117e-06,
+ "loss": 0.1262,
+ "step": 23546
+ },
+ {
+ "epoch": 64.16076294277929,
+ "grad_norm": 5.497186183929443,
+ "learning_rate": 6.013437778810101e-06,
+ "loss": 0.1247,
+ "step": 23547
+ },
+ {
+ "epoch": 64.16348773841962,
+ "grad_norm": 3.1408705711364746,
+ "learning_rate": 6.012628458116303e-06,
+ "loss": 0.0833,
+ "step": 23548
+ },
+ {
+ "epoch": 64.16621253405995,
+ "grad_norm": 3.999343156814575,
+ "learning_rate": 6.011819168476028e-06,
+ "loss": 0.2633,
+ "step": 23549
+ },
+ {
+ "epoch": 64.16893732970027,
+ "grad_norm": 3.464352607727051,
+ "learning_rate": 6.011009909895576e-06,
+ "loss": 0.0944,
+ "step": 23550
+ },
+ {
+ "epoch": 64.1716621253406,
+ "grad_norm": 2.916966438293457,
+ "learning_rate": 6.010200682381253e-06,
+ "loss": 0.0702,
+ "step": 23551
+ },
+ {
+ "epoch": 64.17438692098092,
+ "grad_norm": 4.517367362976074,
+ "learning_rate": 6.009391485939355e-06,
+ "loss": 0.0854,
+ "step": 23552
+ },
+ {
+ "epoch": 64.17711171662125,
+ "grad_norm": 3.6340513229370117,
+ "learning_rate": 6.008582320576191e-06,
+ "loss": 0.0675,
+ "step": 23553
+ },
+ {
+ "epoch": 64.17983651226157,
+ "grad_norm": 3.23189377784729,
+ "learning_rate": 6.0077731862980584e-06,
+ "loss": 0.0867,
+ "step": 23554
+ },
+ {
+ "epoch": 64.1825613079019,
+ "grad_norm": 5.061977863311768,
+ "learning_rate": 6.00696408311126e-06,
+ "loss": 0.0566,
+ "step": 23555
+ },
+ {
+ "epoch": 64.18528610354224,
+ "grad_norm": 4.160363674163818,
+ "learning_rate": 6.0061550110220954e-06,
+ "loss": 0.1581,
+ "step": 23556
+ },
+ {
+ "epoch": 64.18801089918256,
+ "grad_norm": 2.9718129634857178,
+ "learning_rate": 6.005345970036868e-06,
+ "loss": 0.0473,
+ "step": 23557
+ },
+ {
+ "epoch": 64.19073569482289,
+ "grad_norm": 3.0926907062530518,
+ "learning_rate": 6.004536960161877e-06,
+ "loss": 0.1364,
+ "step": 23558
+ },
+ {
+ "epoch": 64.19346049046321,
+ "grad_norm": 3.834367036819458,
+ "learning_rate": 6.003727981403427e-06,
+ "loss": 0.0651,
+ "step": 23559
+ },
+ {
+ "epoch": 64.19618528610354,
+ "grad_norm": 3.2685959339141846,
+ "learning_rate": 6.0029190337678104e-06,
+ "loss": 0.0539,
+ "step": 23560
+ },
+ {
+ "epoch": 64.19891008174388,
+ "grad_norm": 4.632725715637207,
+ "learning_rate": 6.002110117261334e-06,
+ "loss": 0.3755,
+ "step": 23561
+ },
+ {
+ "epoch": 64.2016348773842,
+ "grad_norm": 2.591708183288574,
+ "learning_rate": 6.001301231890293e-06,
+ "loss": 0.044,
+ "step": 23562
+ },
+ {
+ "epoch": 64.20435967302453,
+ "grad_norm": 4.842454433441162,
+ "learning_rate": 6.0004923776609925e-06,
+ "loss": 0.1532,
+ "step": 23563
+ },
+ {
+ "epoch": 64.20708446866485,
+ "grad_norm": 4.658775806427002,
+ "learning_rate": 5.999683554579723e-06,
+ "loss": 0.0782,
+ "step": 23564
+ },
+ {
+ "epoch": 64.20980926430518,
+ "grad_norm": 5.350197792053223,
+ "learning_rate": 5.998874762652793e-06,
+ "loss": 0.1631,
+ "step": 23565
+ },
+ {
+ "epoch": 64.2125340599455,
+ "grad_norm": 5.568068027496338,
+ "learning_rate": 5.998066001886498e-06,
+ "loss": 0.1451,
+ "step": 23566
+ },
+ {
+ "epoch": 64.21525885558583,
+ "grad_norm": 5.235050678253174,
+ "learning_rate": 5.997257272287136e-06,
+ "loss": 0.0705,
+ "step": 23567
+ },
+ {
+ "epoch": 64.21798365122616,
+ "grad_norm": 2.4079315662384033,
+ "learning_rate": 5.9964485738610045e-06,
+ "loss": 0.1124,
+ "step": 23568
+ },
+ {
+ "epoch": 64.22070844686648,
+ "grad_norm": 4.350709438323975,
+ "learning_rate": 5.995639906614406e-06,
+ "loss": 0.0596,
+ "step": 23569
+ },
+ {
+ "epoch": 64.22343324250681,
+ "grad_norm": 2.903782606124878,
+ "learning_rate": 5.994831270553632e-06,
+ "loss": 0.0631,
+ "step": 23570
+ },
+ {
+ "epoch": 64.22615803814713,
+ "grad_norm": 2.8252782821655273,
+ "learning_rate": 5.994022665684985e-06,
+ "loss": 0.0819,
+ "step": 23571
+ },
+ {
+ "epoch": 64.22888283378747,
+ "grad_norm": 3.7527451515197754,
+ "learning_rate": 5.993214092014758e-06,
+ "loss": 0.073,
+ "step": 23572
+ },
+ {
+ "epoch": 64.2316076294278,
+ "grad_norm": 2.4014880657196045,
+ "learning_rate": 5.992405549549253e-06,
+ "loss": 0.0374,
+ "step": 23573
+ },
+ {
+ "epoch": 64.23433242506812,
+ "grad_norm": 3.990499258041382,
+ "learning_rate": 5.991597038294763e-06,
+ "loss": 0.0882,
+ "step": 23574
+ },
+ {
+ "epoch": 64.23705722070845,
+ "grad_norm": 3.87880277633667,
+ "learning_rate": 5.9907885582575875e-06,
+ "loss": 0.1614,
+ "step": 23575
+ },
+ {
+ "epoch": 64.23978201634877,
+ "grad_norm": 15.022882461547852,
+ "learning_rate": 5.989980109444021e-06,
+ "loss": 0.114,
+ "step": 23576
+ },
+ {
+ "epoch": 64.2425068119891,
+ "grad_norm": 7.59397029876709,
+ "learning_rate": 5.98917169186036e-06,
+ "loss": 0.1435,
+ "step": 23577
+ },
+ {
+ "epoch": 64.24523160762942,
+ "grad_norm": 3.6357462406158447,
+ "learning_rate": 5.988363305512901e-06,
+ "loss": 0.0959,
+ "step": 23578
+ },
+ {
+ "epoch": 64.24795640326975,
+ "grad_norm": 3.291400194168091,
+ "learning_rate": 5.987554950407941e-06,
+ "loss": 0.0752,
+ "step": 23579
+ },
+ {
+ "epoch": 64.25068119891009,
+ "grad_norm": 3.1410319805145264,
+ "learning_rate": 5.986746626551772e-06,
+ "loss": 0.0426,
+ "step": 23580
+ },
+ {
+ "epoch": 64.2534059945504,
+ "grad_norm": 3.742543935775757,
+ "learning_rate": 5.985938333950689e-06,
+ "loss": 0.0794,
+ "step": 23581
+ },
+ {
+ "epoch": 64.25613079019074,
+ "grad_norm": 4.182135105133057,
+ "learning_rate": 5.985130072610993e-06,
+ "loss": 0.171,
+ "step": 23582
+ },
+ {
+ "epoch": 64.25885558583106,
+ "grad_norm": 3.4071569442749023,
+ "learning_rate": 5.984321842538973e-06,
+ "loss": 0.0514,
+ "step": 23583
+ },
+ {
+ "epoch": 64.26158038147139,
+ "grad_norm": 4.205199241638184,
+ "learning_rate": 5.9835136437409235e-06,
+ "loss": 0.151,
+ "step": 23584
+ },
+ {
+ "epoch": 64.26430517711172,
+ "grad_norm": 3.668665885925293,
+ "learning_rate": 5.982705476223145e-06,
+ "loss": 0.0614,
+ "step": 23585
+ },
+ {
+ "epoch": 64.26702997275204,
+ "grad_norm": 4.014118194580078,
+ "learning_rate": 5.981897339991923e-06,
+ "loss": 0.0442,
+ "step": 23586
+ },
+ {
+ "epoch": 64.26975476839237,
+ "grad_norm": 4.413239002227783,
+ "learning_rate": 5.981089235053559e-06,
+ "loss": 0.0809,
+ "step": 23587
+ },
+ {
+ "epoch": 64.2724795640327,
+ "grad_norm": 3.7972803115844727,
+ "learning_rate": 5.980281161414339e-06,
+ "loss": 0.0749,
+ "step": 23588
+ },
+ {
+ "epoch": 64.27520435967303,
+ "grad_norm": 2.0995733737945557,
+ "learning_rate": 5.9794731190805635e-06,
+ "loss": 0.1192,
+ "step": 23589
+ },
+ {
+ "epoch": 64.27792915531334,
+ "grad_norm": 2.1572067737579346,
+ "learning_rate": 5.978665108058519e-06,
+ "loss": 0.1144,
+ "step": 23590
+ },
+ {
+ "epoch": 64.28065395095368,
+ "grad_norm": 3.133448362350464,
+ "learning_rate": 5.977857128354503e-06,
+ "loss": 0.0576,
+ "step": 23591
+ },
+ {
+ "epoch": 64.28337874659401,
+ "grad_norm": 3.8053882122039795,
+ "learning_rate": 5.977049179974804e-06,
+ "loss": 0.1044,
+ "step": 23592
+ },
+ {
+ "epoch": 64.28610354223433,
+ "grad_norm": 3.0806984901428223,
+ "learning_rate": 5.976241262925719e-06,
+ "loss": 0.0541,
+ "step": 23593
+ },
+ {
+ "epoch": 64.28882833787466,
+ "grad_norm": 3.3876729011535645,
+ "learning_rate": 5.975433377213537e-06,
+ "loss": 0.075,
+ "step": 23594
+ },
+ {
+ "epoch": 64.29155313351498,
+ "grad_norm": 3.0282328128814697,
+ "learning_rate": 5.974625522844551e-06,
+ "loss": 0.1608,
+ "step": 23595
+ },
+ {
+ "epoch": 64.29427792915531,
+ "grad_norm": 3.436739444732666,
+ "learning_rate": 5.9738176998250484e-06,
+ "loss": 0.1862,
+ "step": 23596
+ },
+ {
+ "epoch": 64.29700272479565,
+ "grad_norm": 3.1355998516082764,
+ "learning_rate": 5.973009908161328e-06,
+ "loss": 0.0927,
+ "step": 23597
+ },
+ {
+ "epoch": 64.29972752043597,
+ "grad_norm": 3.6452877521514893,
+ "learning_rate": 5.972202147859671e-06,
+ "loss": 0.0777,
+ "step": 23598
+ },
+ {
+ "epoch": 64.3024523160763,
+ "grad_norm": 3.05553936958313,
+ "learning_rate": 5.971394418926379e-06,
+ "loss": 0.1025,
+ "step": 23599
+ },
+ {
+ "epoch": 64.30517711171662,
+ "grad_norm": 4.310255527496338,
+ "learning_rate": 5.970586721367737e-06,
+ "loss": 0.1987,
+ "step": 23600
+ },
+ {
+ "epoch": 64.30790190735695,
+ "grad_norm": 3.7769877910614014,
+ "learning_rate": 5.969779055190035e-06,
+ "loss": 0.0601,
+ "step": 23601
+ },
+ {
+ "epoch": 64.31062670299727,
+ "grad_norm": 3.2985124588012695,
+ "learning_rate": 5.968971420399565e-06,
+ "loss": 0.054,
+ "step": 23602
+ },
+ {
+ "epoch": 64.3133514986376,
+ "grad_norm": 2.882575750350952,
+ "learning_rate": 5.968163817002616e-06,
+ "loss": 0.0957,
+ "step": 23603
+ },
+ {
+ "epoch": 64.31607629427793,
+ "grad_norm": 3.0860962867736816,
+ "learning_rate": 5.967356245005478e-06,
+ "loss": 0.0546,
+ "step": 23604
+ },
+ {
+ "epoch": 64.31880108991825,
+ "grad_norm": 2.7559969425201416,
+ "learning_rate": 5.966548704414436e-06,
+ "loss": 0.0598,
+ "step": 23605
+ },
+ {
+ "epoch": 64.32152588555859,
+ "grad_norm": 3.6411938667297363,
+ "learning_rate": 5.965741195235786e-06,
+ "loss": 0.0511,
+ "step": 23606
+ },
+ {
+ "epoch": 64.3242506811989,
+ "grad_norm": 3.7164576053619385,
+ "learning_rate": 5.964933717475814e-06,
+ "loss": 0.1375,
+ "step": 23607
+ },
+ {
+ "epoch": 64.32697547683924,
+ "grad_norm": 2.882533073425293,
+ "learning_rate": 5.964126271140807e-06,
+ "loss": 0.1998,
+ "step": 23608
+ },
+ {
+ "epoch": 64.32970027247957,
+ "grad_norm": 4.589282512664795,
+ "learning_rate": 5.963318856237057e-06,
+ "loss": 0.194,
+ "step": 23609
+ },
+ {
+ "epoch": 64.33242506811989,
+ "grad_norm": 3.3938426971435547,
+ "learning_rate": 5.962511472770847e-06,
+ "loss": 0.0724,
+ "step": 23610
+ },
+ {
+ "epoch": 64.33514986376022,
+ "grad_norm": 4.910046100616455,
+ "learning_rate": 5.96170412074847e-06,
+ "loss": 0.1615,
+ "step": 23611
+ },
+ {
+ "epoch": 64.33787465940054,
+ "grad_norm": 4.328702449798584,
+ "learning_rate": 5.96089680017621e-06,
+ "loss": 0.1349,
+ "step": 23612
+ },
+ {
+ "epoch": 64.34059945504087,
+ "grad_norm": 3.49149751663208,
+ "learning_rate": 5.960089511060357e-06,
+ "loss": 0.3481,
+ "step": 23613
+ },
+ {
+ "epoch": 64.34332425068119,
+ "grad_norm": 3.5896120071411133,
+ "learning_rate": 5.959282253407195e-06,
+ "loss": 0.1556,
+ "step": 23614
+ },
+ {
+ "epoch": 64.34604904632153,
+ "grad_norm": 3.272707939147949,
+ "learning_rate": 5.958475027223009e-06,
+ "loss": 0.0618,
+ "step": 23615
+ },
+ {
+ "epoch": 64.34877384196186,
+ "grad_norm": 2.840674877166748,
+ "learning_rate": 5.9576678325140956e-06,
+ "loss": 0.0625,
+ "step": 23616
+ },
+ {
+ "epoch": 64.35149863760218,
+ "grad_norm": 5.62224817276001,
+ "learning_rate": 5.9568606692867325e-06,
+ "loss": 0.0908,
+ "step": 23617
+ },
+ {
+ "epoch": 64.35422343324251,
+ "grad_norm": 4.2583417892456055,
+ "learning_rate": 5.95605353754721e-06,
+ "loss": 0.1116,
+ "step": 23618
+ },
+ {
+ "epoch": 64.35694822888283,
+ "grad_norm": 2.7511730194091797,
+ "learning_rate": 5.955246437301811e-06,
+ "loss": 0.302,
+ "step": 23619
+ },
+ {
+ "epoch": 64.35967302452316,
+ "grad_norm": 4.065578937530518,
+ "learning_rate": 5.954439368556826e-06,
+ "loss": 0.0696,
+ "step": 23620
+ },
+ {
+ "epoch": 64.3623978201635,
+ "grad_norm": 3.425901412963867,
+ "learning_rate": 5.953632331318533e-06,
+ "loss": 0.0741,
+ "step": 23621
+ },
+ {
+ "epoch": 64.36512261580381,
+ "grad_norm": 3.6608924865722656,
+ "learning_rate": 5.952825325593223e-06,
+ "loss": 0.066,
+ "step": 23622
+ },
+ {
+ "epoch": 64.36784741144415,
+ "grad_norm": 3.296431541442871,
+ "learning_rate": 5.952018351387178e-06,
+ "loss": 0.1276,
+ "step": 23623
+ },
+ {
+ "epoch": 64.37057220708446,
+ "grad_norm": 3.9703187942504883,
+ "learning_rate": 5.951211408706685e-06,
+ "loss": 0.0704,
+ "step": 23624
+ },
+ {
+ "epoch": 64.3732970027248,
+ "grad_norm": 3.351677417755127,
+ "learning_rate": 5.9504044975580265e-06,
+ "loss": 0.1034,
+ "step": 23625
+ },
+ {
+ "epoch": 64.37602179836512,
+ "grad_norm": 4.483058452606201,
+ "learning_rate": 5.9495976179474876e-06,
+ "loss": 0.049,
+ "step": 23626
+ },
+ {
+ "epoch": 64.37874659400545,
+ "grad_norm": 2.7362608909606934,
+ "learning_rate": 5.948790769881352e-06,
+ "loss": 0.1589,
+ "step": 23627
+ },
+ {
+ "epoch": 64.38147138964578,
+ "grad_norm": 2.8398773670196533,
+ "learning_rate": 5.947983953365902e-06,
+ "loss": 0.0986,
+ "step": 23628
+ },
+ {
+ "epoch": 64.3841961852861,
+ "grad_norm": 11.262439727783203,
+ "learning_rate": 5.947177168407425e-06,
+ "loss": 0.0562,
+ "step": 23629
+ },
+ {
+ "epoch": 64.38692098092643,
+ "grad_norm": 5.799773693084717,
+ "learning_rate": 5.9463704150122e-06,
+ "loss": 0.1101,
+ "step": 23630
+ },
+ {
+ "epoch": 64.38964577656675,
+ "grad_norm": 4.184062957763672,
+ "learning_rate": 5.945563693186514e-06,
+ "loss": 0.1407,
+ "step": 23631
+ },
+ {
+ "epoch": 64.39237057220708,
+ "grad_norm": 3.3891074657440186,
+ "learning_rate": 5.9447570029366456e-06,
+ "loss": 0.128,
+ "step": 23632
+ },
+ {
+ "epoch": 64.39509536784742,
+ "grad_norm": 4.880205154418945,
+ "learning_rate": 5.943950344268876e-06,
+ "loss": 0.2385,
+ "step": 23633
+ },
+ {
+ "epoch": 64.39782016348774,
+ "grad_norm": 2.8757264614105225,
+ "learning_rate": 5.943143717189495e-06,
+ "loss": 0.0491,
+ "step": 23634
+ },
+ {
+ "epoch": 64.40054495912807,
+ "grad_norm": 3.768073797225952,
+ "learning_rate": 5.942337121704779e-06,
+ "loss": 0.2386,
+ "step": 23635
+ },
+ {
+ "epoch": 64.40326975476839,
+ "grad_norm": 3.859701156616211,
+ "learning_rate": 5.941530557821012e-06,
+ "loss": 0.2186,
+ "step": 23636
+ },
+ {
+ "epoch": 64.40599455040872,
+ "grad_norm": 2.6606013774871826,
+ "learning_rate": 5.940724025544473e-06,
+ "loss": 0.0503,
+ "step": 23637
+ },
+ {
+ "epoch": 64.40871934604904,
+ "grad_norm": 2.6012561321258545,
+ "learning_rate": 5.939917524881446e-06,
+ "loss": 0.0692,
+ "step": 23638
+ },
+ {
+ "epoch": 64.41144414168937,
+ "grad_norm": 3.684028387069702,
+ "learning_rate": 5.939111055838209e-06,
+ "loss": 0.1585,
+ "step": 23639
+ },
+ {
+ "epoch": 64.4141689373297,
+ "grad_norm": 4.496323585510254,
+ "learning_rate": 5.9383046184210465e-06,
+ "loss": 0.1435,
+ "step": 23640
+ },
+ {
+ "epoch": 64.41689373297002,
+ "grad_norm": 4.281190395355225,
+ "learning_rate": 5.937498212636235e-06,
+ "loss": 0.1141,
+ "step": 23641
+ },
+ {
+ "epoch": 64.41961852861036,
+ "grad_norm": 3.095984935760498,
+ "learning_rate": 5.936691838490058e-06,
+ "loss": 0.1678,
+ "step": 23642
+ },
+ {
+ "epoch": 64.42234332425068,
+ "grad_norm": 4.5127129554748535,
+ "learning_rate": 5.935885495988794e-06,
+ "loss": 0.0855,
+ "step": 23643
+ },
+ {
+ "epoch": 64.42506811989101,
+ "grad_norm": 2.6886441707611084,
+ "learning_rate": 5.935079185138722e-06,
+ "loss": 0.0443,
+ "step": 23644
+ },
+ {
+ "epoch": 64.42779291553134,
+ "grad_norm": 3.247974395751953,
+ "learning_rate": 5.934272905946123e-06,
+ "loss": 0.0949,
+ "step": 23645
+ },
+ {
+ "epoch": 64.43051771117166,
+ "grad_norm": 3.4779772758483887,
+ "learning_rate": 5.933466658417277e-06,
+ "loss": 0.0816,
+ "step": 23646
+ },
+ {
+ "epoch": 64.433242506812,
+ "grad_norm": 4.464017868041992,
+ "learning_rate": 5.932660442558459e-06,
+ "loss": 0.0907,
+ "step": 23647
+ },
+ {
+ "epoch": 64.43596730245231,
+ "grad_norm": 4.169822692871094,
+ "learning_rate": 5.931854258375953e-06,
+ "loss": 0.1062,
+ "step": 23648
+ },
+ {
+ "epoch": 64.43869209809264,
+ "grad_norm": 2.2529373168945312,
+ "learning_rate": 5.931048105876034e-06,
+ "loss": 0.0909,
+ "step": 23649
+ },
+ {
+ "epoch": 64.44141689373296,
+ "grad_norm": 5.601505279541016,
+ "learning_rate": 5.930241985064978e-06,
+ "loss": 0.1398,
+ "step": 23650
+ },
+ {
+ "epoch": 64.4441416893733,
+ "grad_norm": 3.7766969203948975,
+ "learning_rate": 5.92943589594907e-06,
+ "loss": 0.0856,
+ "step": 23651
+ },
+ {
+ "epoch": 64.44686648501363,
+ "grad_norm": 8.199073791503906,
+ "learning_rate": 5.928629838534586e-06,
+ "loss": 0.1029,
+ "step": 23652
+ },
+ {
+ "epoch": 64.44959128065395,
+ "grad_norm": 4.182126998901367,
+ "learning_rate": 5.9278238128277975e-06,
+ "loss": 0.0928,
+ "step": 23653
+ },
+ {
+ "epoch": 64.45231607629428,
+ "grad_norm": 5.7247443199157715,
+ "learning_rate": 5.92701781883499e-06,
+ "loss": 0.0868,
+ "step": 23654
+ },
+ {
+ "epoch": 64.4550408719346,
+ "grad_norm": 4.4931206703186035,
+ "learning_rate": 5.926211856562434e-06,
+ "loss": 0.0469,
+ "step": 23655
+ },
+ {
+ "epoch": 64.45776566757493,
+ "grad_norm": 3.3259570598602295,
+ "learning_rate": 5.925405926016412e-06,
+ "loss": 0.0708,
+ "step": 23656
+ },
+ {
+ "epoch": 64.46049046321527,
+ "grad_norm": 3.7143845558166504,
+ "learning_rate": 5.924600027203194e-06,
+ "loss": 0.0705,
+ "step": 23657
+ },
+ {
+ "epoch": 64.46321525885558,
+ "grad_norm": 4.819847583770752,
+ "learning_rate": 5.923794160129064e-06,
+ "loss": 0.0793,
+ "step": 23658
+ },
+ {
+ "epoch": 64.46594005449592,
+ "grad_norm": 3.607992649078369,
+ "learning_rate": 5.92298832480029e-06,
+ "loss": 0.055,
+ "step": 23659
+ },
+ {
+ "epoch": 64.46866485013624,
+ "grad_norm": 4.808532238006592,
+ "learning_rate": 5.9221825212231545e-06,
+ "loss": 0.1354,
+ "step": 23660
+ },
+ {
+ "epoch": 64.47138964577657,
+ "grad_norm": 5.646035671234131,
+ "learning_rate": 5.921376749403928e-06,
+ "loss": 0.168,
+ "step": 23661
+ },
+ {
+ "epoch": 64.47411444141689,
+ "grad_norm": 3.122415781021118,
+ "learning_rate": 5.92057100934889e-06,
+ "loss": 0.0751,
+ "step": 23662
+ },
+ {
+ "epoch": 64.47683923705722,
+ "grad_norm": 3.0227866172790527,
+ "learning_rate": 5.919765301064311e-06,
+ "loss": 0.0569,
+ "step": 23663
+ },
+ {
+ "epoch": 64.47956403269755,
+ "grad_norm": 3.958361864089966,
+ "learning_rate": 5.9189596245564715e-06,
+ "loss": 0.0974,
+ "step": 23664
+ },
+ {
+ "epoch": 64.48228882833787,
+ "grad_norm": 2.760798215866089,
+ "learning_rate": 5.918153979831641e-06,
+ "loss": 0.0459,
+ "step": 23665
+ },
+ {
+ "epoch": 64.4850136239782,
+ "grad_norm": 4.043485164642334,
+ "learning_rate": 5.917348366896099e-06,
+ "loss": 0.0965,
+ "step": 23666
+ },
+ {
+ "epoch": 64.48773841961852,
+ "grad_norm": 3.1446847915649414,
+ "learning_rate": 5.9165427857561096e-06,
+ "loss": 0.0407,
+ "step": 23667
+ },
+ {
+ "epoch": 64.49046321525886,
+ "grad_norm": 2.5701584815979004,
+ "learning_rate": 5.915737236417957e-06,
+ "loss": 0.049,
+ "step": 23668
+ },
+ {
+ "epoch": 64.49318801089919,
+ "grad_norm": 6.109796047210693,
+ "learning_rate": 5.914931718887915e-06,
+ "loss": 0.1148,
+ "step": 23669
+ },
+ {
+ "epoch": 64.49591280653951,
+ "grad_norm": 3.7845213413238525,
+ "learning_rate": 5.9141262331722505e-06,
+ "loss": 0.0693,
+ "step": 23670
+ },
+ {
+ "epoch": 64.49863760217984,
+ "grad_norm": 2.7459239959716797,
+ "learning_rate": 5.913320779277239e-06,
+ "loss": 0.0453,
+ "step": 23671
+ },
+ {
+ "epoch": 64.50136239782016,
+ "grad_norm": 3.674323320388794,
+ "learning_rate": 5.912515357209154e-06,
+ "loss": 0.0809,
+ "step": 23672
+ },
+ {
+ "epoch": 64.50408719346049,
+ "grad_norm": 13.672555923461914,
+ "learning_rate": 5.911709966974269e-06,
+ "loss": 0.1282,
+ "step": 23673
+ },
+ {
+ "epoch": 64.50681198910081,
+ "grad_norm": 4.414234638214111,
+ "learning_rate": 5.910904608578855e-06,
+ "loss": 0.083,
+ "step": 23674
+ },
+ {
+ "epoch": 64.50953678474114,
+ "grad_norm": 3.071168899536133,
+ "learning_rate": 5.910099282029182e-06,
+ "loss": 0.1563,
+ "step": 23675
+ },
+ {
+ "epoch": 64.51226158038148,
+ "grad_norm": 3.6425254344940186,
+ "learning_rate": 5.909293987331528e-06,
+ "loss": 0.1284,
+ "step": 23676
+ },
+ {
+ "epoch": 64.5149863760218,
+ "grad_norm": 4.040872097015381,
+ "learning_rate": 5.908488724492157e-06,
+ "loss": 0.0854,
+ "step": 23677
+ },
+ {
+ "epoch": 64.51771117166213,
+ "grad_norm": 3.6724729537963867,
+ "learning_rate": 5.907683493517348e-06,
+ "loss": 0.1106,
+ "step": 23678
+ },
+ {
+ "epoch": 64.52043596730245,
+ "grad_norm": 4.090834140777588,
+ "learning_rate": 5.906878294413365e-06,
+ "loss": 0.1218,
+ "step": 23679
+ },
+ {
+ "epoch": 64.52316076294278,
+ "grad_norm": 3.1486189365386963,
+ "learning_rate": 5.906073127186485e-06,
+ "loss": 0.0427,
+ "step": 23680
+ },
+ {
+ "epoch": 64.52588555858311,
+ "grad_norm": 3.0365872383117676,
+ "learning_rate": 5.905267991842972e-06,
+ "loss": 0.0673,
+ "step": 23681
+ },
+ {
+ "epoch": 64.52861035422343,
+ "grad_norm": 5.883402347564697,
+ "learning_rate": 5.904462888389104e-06,
+ "loss": 0.1758,
+ "step": 23682
+ },
+ {
+ "epoch": 64.53133514986376,
+ "grad_norm": 4.505124092102051,
+ "learning_rate": 5.903657816831143e-06,
+ "loss": 0.0527,
+ "step": 23683
+ },
+ {
+ "epoch": 64.53405994550408,
+ "grad_norm": 4.534233570098877,
+ "learning_rate": 5.902852777175363e-06,
+ "loss": 0.1013,
+ "step": 23684
+ },
+ {
+ "epoch": 64.53678474114442,
+ "grad_norm": 3.4307634830474854,
+ "learning_rate": 5.9020477694280375e-06,
+ "loss": 0.0566,
+ "step": 23685
+ },
+ {
+ "epoch": 64.53950953678473,
+ "grad_norm": 3.6816563606262207,
+ "learning_rate": 5.9012427935954295e-06,
+ "loss": 0.1486,
+ "step": 23686
+ },
+ {
+ "epoch": 64.54223433242507,
+ "grad_norm": 4.910661220550537,
+ "learning_rate": 5.900437849683813e-06,
+ "loss": 0.0868,
+ "step": 23687
+ },
+ {
+ "epoch": 64.5449591280654,
+ "grad_norm": 4.9586310386657715,
+ "learning_rate": 5.899632937699453e-06,
+ "loss": 0.0842,
+ "step": 23688
+ },
+ {
+ "epoch": 64.54768392370572,
+ "grad_norm": 5.120810508728027,
+ "learning_rate": 5.89882805764862e-06,
+ "loss": 0.0779,
+ "step": 23689
+ },
+ {
+ "epoch": 64.55040871934605,
+ "grad_norm": 3.6106836795806885,
+ "learning_rate": 5.898023209537582e-06,
+ "loss": 0.1112,
+ "step": 23690
+ },
+ {
+ "epoch": 64.55313351498637,
+ "grad_norm": 4.148248672485352,
+ "learning_rate": 5.897218393372609e-06,
+ "loss": 0.0957,
+ "step": 23691
+ },
+ {
+ "epoch": 64.5558583106267,
+ "grad_norm": 6.041697025299072,
+ "learning_rate": 5.896413609159964e-06,
+ "loss": 0.0736,
+ "step": 23692
+ },
+ {
+ "epoch": 64.55858310626704,
+ "grad_norm": 5.618400573730469,
+ "learning_rate": 5.8956088569059185e-06,
+ "loss": 0.0865,
+ "step": 23693
+ },
+ {
+ "epoch": 64.56130790190736,
+ "grad_norm": 3.0874156951904297,
+ "learning_rate": 5.89480413661674e-06,
+ "loss": 0.0391,
+ "step": 23694
+ },
+ {
+ "epoch": 64.56403269754769,
+ "grad_norm": 3.1987128257751465,
+ "learning_rate": 5.893999448298695e-06,
+ "loss": 0.149,
+ "step": 23695
+ },
+ {
+ "epoch": 64.566757493188,
+ "grad_norm": 3.7000083923339844,
+ "learning_rate": 5.893194791958051e-06,
+ "loss": 0.059,
+ "step": 23696
+ },
+ {
+ "epoch": 64.56948228882834,
+ "grad_norm": 3.5692005157470703,
+ "learning_rate": 5.892390167601072e-06,
+ "loss": 0.0889,
+ "step": 23697
+ },
+ {
+ "epoch": 64.57220708446866,
+ "grad_norm": 4.626175403594971,
+ "learning_rate": 5.891585575234028e-06,
+ "loss": 0.0917,
+ "step": 23698
+ },
+ {
+ "epoch": 64.57493188010899,
+ "grad_norm": 3.606637477874756,
+ "learning_rate": 5.89078101486318e-06,
+ "loss": 0.0576,
+ "step": 23699
+ },
+ {
+ "epoch": 64.57765667574932,
+ "grad_norm": 3.872769355773926,
+ "learning_rate": 5.889976486494802e-06,
+ "loss": 0.0773,
+ "step": 23700
+ },
+ {
+ "epoch": 64.58038147138964,
+ "grad_norm": 2.6828160285949707,
+ "learning_rate": 5.889171990135149e-06,
+ "loss": 0.0369,
+ "step": 23701
+ },
+ {
+ "epoch": 64.58310626702998,
+ "grad_norm": 4.715063095092773,
+ "learning_rate": 5.8883675257904936e-06,
+ "loss": 0.0663,
+ "step": 23702
+ },
+ {
+ "epoch": 64.5858310626703,
+ "grad_norm": 4.230589389801025,
+ "learning_rate": 5.887563093467103e-06,
+ "loss": 0.1712,
+ "step": 23703
+ },
+ {
+ "epoch": 64.58855585831063,
+ "grad_norm": 3.561528444290161,
+ "learning_rate": 5.886758693171236e-06,
+ "loss": 0.0678,
+ "step": 23704
+ },
+ {
+ "epoch": 64.59128065395096,
+ "grad_norm": 2.2918155193328857,
+ "learning_rate": 5.885954324909162e-06,
+ "loss": 0.0359,
+ "step": 23705
+ },
+ {
+ "epoch": 64.59400544959128,
+ "grad_norm": 3.7067036628723145,
+ "learning_rate": 5.885149988687141e-06,
+ "loss": 0.1517,
+ "step": 23706
+ },
+ {
+ "epoch": 64.59673024523161,
+ "grad_norm": 3.9828476905822754,
+ "learning_rate": 5.8843456845114426e-06,
+ "loss": 0.0573,
+ "step": 23707
+ },
+ {
+ "epoch": 64.59945504087193,
+ "grad_norm": 2.729644775390625,
+ "learning_rate": 5.883541412388325e-06,
+ "loss": 0.0392,
+ "step": 23708
+ },
+ {
+ "epoch": 64.60217983651226,
+ "grad_norm": 3.2439920902252197,
+ "learning_rate": 5.8827371723240555e-06,
+ "loss": 0.0729,
+ "step": 23709
+ },
+ {
+ "epoch": 64.60490463215258,
+ "grad_norm": 2.972121000289917,
+ "learning_rate": 5.881932964324895e-06,
+ "loss": 0.0569,
+ "step": 23710
+ },
+ {
+ "epoch": 64.60762942779292,
+ "grad_norm": 3.8448119163513184,
+ "learning_rate": 5.88112878839711e-06,
+ "loss": 0.0483,
+ "step": 23711
+ },
+ {
+ "epoch": 64.61035422343325,
+ "grad_norm": 3.6391313076019287,
+ "learning_rate": 5.88032464454696e-06,
+ "loss": 0.0694,
+ "step": 23712
+ },
+ {
+ "epoch": 64.61307901907357,
+ "grad_norm": 7.126327037811279,
+ "learning_rate": 5.879520532780709e-06,
+ "loss": 0.1552,
+ "step": 23713
+ },
+ {
+ "epoch": 64.6158038147139,
+ "grad_norm": 2.7950947284698486,
+ "learning_rate": 5.87871645310462e-06,
+ "loss": 0.0911,
+ "step": 23714
+ },
+ {
+ "epoch": 64.61852861035422,
+ "grad_norm": 2.5468971729278564,
+ "learning_rate": 5.877912405524954e-06,
+ "loss": 0.0395,
+ "step": 23715
+ },
+ {
+ "epoch": 64.62125340599455,
+ "grad_norm": 4.573666095733643,
+ "learning_rate": 5.8771083900479744e-06,
+ "loss": 0.1448,
+ "step": 23716
+ },
+ {
+ "epoch": 64.62397820163488,
+ "grad_norm": 3.492250680923462,
+ "learning_rate": 5.876304406679941e-06,
+ "loss": 0.0556,
+ "step": 23717
+ },
+ {
+ "epoch": 64.6267029972752,
+ "grad_norm": 12.995576858520508,
+ "learning_rate": 5.875500455427119e-06,
+ "loss": 0.1026,
+ "step": 23718
+ },
+ {
+ "epoch": 64.62942779291554,
+ "grad_norm": 3.482884168624878,
+ "learning_rate": 5.874696536295761e-06,
+ "loss": 0.0827,
+ "step": 23719
+ },
+ {
+ "epoch": 64.63215258855585,
+ "grad_norm": 3.9052515029907227,
+ "learning_rate": 5.873892649292136e-06,
+ "loss": 0.0709,
+ "step": 23720
+ },
+ {
+ "epoch": 64.63487738419619,
+ "grad_norm": 2.956522226333618,
+ "learning_rate": 5.873088794422505e-06,
+ "loss": 0.0453,
+ "step": 23721
+ },
+ {
+ "epoch": 64.6376021798365,
+ "grad_norm": 3.4227848052978516,
+ "learning_rate": 5.872284971693123e-06,
+ "loss": 0.061,
+ "step": 23722
+ },
+ {
+ "epoch": 64.64032697547684,
+ "grad_norm": 2.823970317840576,
+ "learning_rate": 5.871481181110255e-06,
+ "loss": 0.0748,
+ "step": 23723
+ },
+ {
+ "epoch": 64.64305177111717,
+ "grad_norm": 3.349766731262207,
+ "learning_rate": 5.870677422680156e-06,
+ "loss": 0.0453,
+ "step": 23724
+ },
+ {
+ "epoch": 64.64577656675749,
+ "grad_norm": 4.023482799530029,
+ "learning_rate": 5.8698736964090904e-06,
+ "loss": 0.096,
+ "step": 23725
+ },
+ {
+ "epoch": 64.64850136239782,
+ "grad_norm": 3.8858907222747803,
+ "learning_rate": 5.8690700023033145e-06,
+ "loss": 0.1997,
+ "step": 23726
+ },
+ {
+ "epoch": 64.65122615803814,
+ "grad_norm": 3.495682954788208,
+ "learning_rate": 5.86826634036909e-06,
+ "loss": 0.0511,
+ "step": 23727
+ },
+ {
+ "epoch": 64.65395095367847,
+ "grad_norm": 4.163297176361084,
+ "learning_rate": 5.867462710612672e-06,
+ "loss": 0.0771,
+ "step": 23728
+ },
+ {
+ "epoch": 64.65667574931881,
+ "grad_norm": 3.787161111831665,
+ "learning_rate": 5.866659113040324e-06,
+ "loss": 0.2429,
+ "step": 23729
+ },
+ {
+ "epoch": 64.65940054495913,
+ "grad_norm": 4.401248455047607,
+ "learning_rate": 5.8658555476582994e-06,
+ "loss": 0.1871,
+ "step": 23730
+ },
+ {
+ "epoch": 64.66212534059946,
+ "grad_norm": 3.2518022060394287,
+ "learning_rate": 5.865052014472861e-06,
+ "loss": 0.0604,
+ "step": 23731
+ },
+ {
+ "epoch": 64.66485013623978,
+ "grad_norm": 3.5951952934265137,
+ "learning_rate": 5.8642485134902625e-06,
+ "loss": 0.0658,
+ "step": 23732
+ },
+ {
+ "epoch": 64.66757493188011,
+ "grad_norm": 2.5962295532226562,
+ "learning_rate": 5.863445044716764e-06,
+ "loss": 0.0431,
+ "step": 23733
+ },
+ {
+ "epoch": 64.67029972752043,
+ "grad_norm": 2.7388525009155273,
+ "learning_rate": 5.862641608158623e-06,
+ "loss": 0.0415,
+ "step": 23734
+ },
+ {
+ "epoch": 64.67302452316076,
+ "grad_norm": 2.9878427982330322,
+ "learning_rate": 5.861838203822096e-06,
+ "loss": 0.0564,
+ "step": 23735
+ },
+ {
+ "epoch": 64.6757493188011,
+ "grad_norm": 3.394355297088623,
+ "learning_rate": 5.861034831713435e-06,
+ "loss": 0.0978,
+ "step": 23736
+ },
+ {
+ "epoch": 64.67847411444141,
+ "grad_norm": 2.9823338985443115,
+ "learning_rate": 5.860231491838906e-06,
+ "loss": 0.084,
+ "step": 23737
+ },
+ {
+ "epoch": 64.68119891008175,
+ "grad_norm": 2.810248851776123,
+ "learning_rate": 5.859428184204761e-06,
+ "loss": 0.2109,
+ "step": 23738
+ },
+ {
+ "epoch": 64.68392370572207,
+ "grad_norm": 3.4153311252593994,
+ "learning_rate": 5.858624908817257e-06,
+ "loss": 0.092,
+ "step": 23739
+ },
+ {
+ "epoch": 64.6866485013624,
+ "grad_norm": 4.189194679260254,
+ "learning_rate": 5.857821665682646e-06,
+ "loss": 0.1303,
+ "step": 23740
+ },
+ {
+ "epoch": 64.68937329700273,
+ "grad_norm": 3.2839243412017822,
+ "learning_rate": 5.857018454807189e-06,
+ "loss": 0.041,
+ "step": 23741
+ },
+ {
+ "epoch": 64.69209809264305,
+ "grad_norm": 4.326436996459961,
+ "learning_rate": 5.856215276197137e-06,
+ "loss": 0.1038,
+ "step": 23742
+ },
+ {
+ "epoch": 64.69482288828338,
+ "grad_norm": 4.688022613525391,
+ "learning_rate": 5.855412129858749e-06,
+ "loss": 0.1052,
+ "step": 23743
+ },
+ {
+ "epoch": 64.6975476839237,
+ "grad_norm": 3.6603691577911377,
+ "learning_rate": 5.854609015798277e-06,
+ "loss": 0.0609,
+ "step": 23744
+ },
+ {
+ "epoch": 64.70027247956403,
+ "grad_norm": 3.4955921173095703,
+ "learning_rate": 5.8538059340219774e-06,
+ "loss": 0.0596,
+ "step": 23745
+ },
+ {
+ "epoch": 64.70299727520435,
+ "grad_norm": 3.845290184020996,
+ "learning_rate": 5.853002884536103e-06,
+ "loss": 0.0873,
+ "step": 23746
+ },
+ {
+ "epoch": 64.70572207084469,
+ "grad_norm": 3.763108968734741,
+ "learning_rate": 5.852199867346909e-06,
+ "loss": 0.1474,
+ "step": 23747
+ },
+ {
+ "epoch": 64.70844686648502,
+ "grad_norm": 4.986370086669922,
+ "learning_rate": 5.851396882460648e-06,
+ "loss": 0.2225,
+ "step": 23748
+ },
+ {
+ "epoch": 64.71117166212534,
+ "grad_norm": 3.1233103275299072,
+ "learning_rate": 5.850593929883577e-06,
+ "loss": 0.076,
+ "step": 23749
+ },
+ {
+ "epoch": 64.71389645776567,
+ "grad_norm": 4.560542583465576,
+ "learning_rate": 5.8497910096219435e-06,
+ "loss": 0.1405,
+ "step": 23750
+ },
+ {
+ "epoch": 64.71662125340599,
+ "grad_norm": 3.0604021549224854,
+ "learning_rate": 5.848988121682006e-06,
+ "loss": 0.0767,
+ "step": 23751
+ },
+ {
+ "epoch": 64.71934604904632,
+ "grad_norm": 23.736257553100586,
+ "learning_rate": 5.848185266070016e-06,
+ "loss": 0.1333,
+ "step": 23752
+ },
+ {
+ "epoch": 64.72207084468666,
+ "grad_norm": 4.732005596160889,
+ "learning_rate": 5.847382442792222e-06,
+ "loss": 0.0737,
+ "step": 23753
+ },
+ {
+ "epoch": 64.72479564032697,
+ "grad_norm": 3.6705281734466553,
+ "learning_rate": 5.8465796518548824e-06,
+ "loss": 0.0856,
+ "step": 23754
+ },
+ {
+ "epoch": 64.7275204359673,
+ "grad_norm": 3.666384220123291,
+ "learning_rate": 5.845776893264247e-06,
+ "loss": 0.1425,
+ "step": 23755
+ },
+ {
+ "epoch": 64.73024523160763,
+ "grad_norm": 4.7612175941467285,
+ "learning_rate": 5.844974167026567e-06,
+ "loss": 0.1459,
+ "step": 23756
+ },
+ {
+ "epoch": 64.73297002724796,
+ "grad_norm": 3.4738609790802,
+ "learning_rate": 5.8441714731480944e-06,
+ "loss": 0.2016,
+ "step": 23757
+ },
+ {
+ "epoch": 64.73569482288828,
+ "grad_norm": 4.037792682647705,
+ "learning_rate": 5.843368811635081e-06,
+ "loss": 0.0613,
+ "step": 23758
+ },
+ {
+ "epoch": 64.73841961852861,
+ "grad_norm": 3.863607406616211,
+ "learning_rate": 5.842566182493779e-06,
+ "loss": 0.1571,
+ "step": 23759
+ },
+ {
+ "epoch": 64.74114441416894,
+ "grad_norm": 3.6390492916107178,
+ "learning_rate": 5.8417635857304355e-06,
+ "loss": 0.2208,
+ "step": 23760
+ },
+ {
+ "epoch": 64.74386920980926,
+ "grad_norm": 2.9504313468933105,
+ "learning_rate": 5.840961021351305e-06,
+ "loss": 0.1737,
+ "step": 23761
+ },
+ {
+ "epoch": 64.7465940054496,
+ "grad_norm": 4.13885498046875,
+ "learning_rate": 5.840158489362635e-06,
+ "loss": 0.0879,
+ "step": 23762
+ },
+ {
+ "epoch": 64.74931880108991,
+ "grad_norm": 3.5123114585876465,
+ "learning_rate": 5.839355989770678e-06,
+ "loss": 0.0843,
+ "step": 23763
+ },
+ {
+ "epoch": 64.75204359673025,
+ "grad_norm": 3.2950191497802734,
+ "learning_rate": 5.8385535225816805e-06,
+ "loss": 0.0929,
+ "step": 23764
+ },
+ {
+ "epoch": 64.75476839237058,
+ "grad_norm": 3.906742572784424,
+ "learning_rate": 5.8377510878018975e-06,
+ "loss": 0.0736,
+ "step": 23765
+ },
+ {
+ "epoch": 64.7574931880109,
+ "grad_norm": 2.814589500427246,
+ "learning_rate": 5.836948685437573e-06,
+ "loss": 0.0522,
+ "step": 23766
+ },
+ {
+ "epoch": 64.76021798365123,
+ "grad_norm": 12.155994415283203,
+ "learning_rate": 5.836146315494956e-06,
+ "loss": 0.0752,
+ "step": 23767
+ },
+ {
+ "epoch": 64.76294277929155,
+ "grad_norm": 3.8262643814086914,
+ "learning_rate": 5.835343977980301e-06,
+ "loss": 0.1724,
+ "step": 23768
+ },
+ {
+ "epoch": 64.76566757493188,
+ "grad_norm": 5.280486106872559,
+ "learning_rate": 5.834541672899852e-06,
+ "loss": 0.1184,
+ "step": 23769
+ },
+ {
+ "epoch": 64.7683923705722,
+ "grad_norm": 5.157360076904297,
+ "learning_rate": 5.8337394002598565e-06,
+ "loss": 0.0717,
+ "step": 23770
+ },
+ {
+ "epoch": 64.77111716621253,
+ "grad_norm": 2.7944915294647217,
+ "learning_rate": 5.832937160066567e-06,
+ "loss": 0.1283,
+ "step": 23771
+ },
+ {
+ "epoch": 64.77384196185287,
+ "grad_norm": 4.003580570220947,
+ "learning_rate": 5.832134952326225e-06,
+ "loss": 0.0931,
+ "step": 23772
+ },
+ {
+ "epoch": 64.77656675749319,
+ "grad_norm": 5.369149208068848,
+ "learning_rate": 5.831332777045087e-06,
+ "loss": 0.0656,
+ "step": 23773
+ },
+ {
+ "epoch": 64.77929155313352,
+ "grad_norm": 4.331752777099609,
+ "learning_rate": 5.830530634229393e-06,
+ "loss": 0.0937,
+ "step": 23774
+ },
+ {
+ "epoch": 64.78201634877384,
+ "grad_norm": 4.510578155517578,
+ "learning_rate": 5.829728523885394e-06,
+ "loss": 0.2126,
+ "step": 23775
+ },
+ {
+ "epoch": 64.78474114441417,
+ "grad_norm": 3.1642606258392334,
+ "learning_rate": 5.82892644601933e-06,
+ "loss": 0.0441,
+ "step": 23776
+ },
+ {
+ "epoch": 64.7874659400545,
+ "grad_norm": 3.814603805541992,
+ "learning_rate": 5.828124400637456e-06,
+ "loss": 0.0558,
+ "step": 23777
+ },
+ {
+ "epoch": 64.79019073569482,
+ "grad_norm": 3.7792811393737793,
+ "learning_rate": 5.827322387746018e-06,
+ "loss": 0.1459,
+ "step": 23778
+ },
+ {
+ "epoch": 64.79291553133515,
+ "grad_norm": 2.392956256866455,
+ "learning_rate": 5.826520407351252e-06,
+ "loss": 0.0369,
+ "step": 23779
+ },
+ {
+ "epoch": 64.79564032697547,
+ "grad_norm": 4.206678867340088,
+ "learning_rate": 5.8257184594594155e-06,
+ "loss": 0.0805,
+ "step": 23780
+ },
+ {
+ "epoch": 64.7983651226158,
+ "grad_norm": 3.7099359035491943,
+ "learning_rate": 5.824916544076749e-06,
+ "loss": 0.0595,
+ "step": 23781
+ },
+ {
+ "epoch": 64.80108991825612,
+ "grad_norm": 3.81819486618042,
+ "learning_rate": 5.824114661209498e-06,
+ "loss": 0.1998,
+ "step": 23782
+ },
+ {
+ "epoch": 64.80381471389646,
+ "grad_norm": 2.6584384441375732,
+ "learning_rate": 5.823312810863904e-06,
+ "loss": 0.0494,
+ "step": 23783
+ },
+ {
+ "epoch": 64.80653950953679,
+ "grad_norm": 5.343811511993408,
+ "learning_rate": 5.82251099304622e-06,
+ "loss": 0.0862,
+ "step": 23784
+ },
+ {
+ "epoch": 64.80926430517711,
+ "grad_norm": 3.189709424972534,
+ "learning_rate": 5.821709207762684e-06,
+ "loss": 0.0693,
+ "step": 23785
+ },
+ {
+ "epoch": 64.81198910081744,
+ "grad_norm": 4.335069179534912,
+ "learning_rate": 5.8209074550195445e-06,
+ "loss": 0.0996,
+ "step": 23786
+ },
+ {
+ "epoch": 64.81471389645776,
+ "grad_norm": 2.99347186088562,
+ "learning_rate": 5.8201057348230384e-06,
+ "loss": 0.1596,
+ "step": 23787
+ },
+ {
+ "epoch": 64.8174386920981,
+ "grad_norm": 3.288522243499756,
+ "learning_rate": 5.819304047179415e-06,
+ "loss": 0.1391,
+ "step": 23788
+ },
+ {
+ "epoch": 64.82016348773843,
+ "grad_norm": 5.136707305908203,
+ "learning_rate": 5.81850239209492e-06,
+ "loss": 0.0824,
+ "step": 23789
+ },
+ {
+ "epoch": 64.82288828337875,
+ "grad_norm": 3.021090030670166,
+ "learning_rate": 5.8177007695757935e-06,
+ "loss": 0.0393,
+ "step": 23790
+ },
+ {
+ "epoch": 64.82561307901908,
+ "grad_norm": 3.8290157318115234,
+ "learning_rate": 5.816899179628279e-06,
+ "loss": 0.0666,
+ "step": 23791
+ },
+ {
+ "epoch": 64.8283378746594,
+ "grad_norm": 2.9695990085601807,
+ "learning_rate": 5.816097622258616e-06,
+ "loss": 0.0864,
+ "step": 23792
+ },
+ {
+ "epoch": 64.83106267029973,
+ "grad_norm": 3.0893306732177734,
+ "learning_rate": 5.815296097473053e-06,
+ "loss": 0.0979,
+ "step": 23793
+ },
+ {
+ "epoch": 64.83378746594005,
+ "grad_norm": 5.386440277099609,
+ "learning_rate": 5.814494605277831e-06,
+ "loss": 0.1461,
+ "step": 23794
+ },
+ {
+ "epoch": 64.83651226158038,
+ "grad_norm": 3.264275074005127,
+ "learning_rate": 5.813693145679189e-06,
+ "loss": 0.048,
+ "step": 23795
+ },
+ {
+ "epoch": 64.83923705722071,
+ "grad_norm": 6.261340141296387,
+ "learning_rate": 5.8128917186833655e-06,
+ "loss": 0.1283,
+ "step": 23796
+ },
+ {
+ "epoch": 64.84196185286103,
+ "grad_norm": 3.908447027206421,
+ "learning_rate": 5.812090324296611e-06,
+ "loss": 0.0849,
+ "step": 23797
+ },
+ {
+ "epoch": 64.84468664850137,
+ "grad_norm": 4.705367565155029,
+ "learning_rate": 5.811288962525163e-06,
+ "loss": 0.0543,
+ "step": 23798
+ },
+ {
+ "epoch": 64.84741144414168,
+ "grad_norm": 4.353753566741943,
+ "learning_rate": 5.810487633375261e-06,
+ "loss": 0.077,
+ "step": 23799
+ },
+ {
+ "epoch": 64.85013623978202,
+ "grad_norm": 3.5391647815704346,
+ "learning_rate": 5.8096863368531435e-06,
+ "loss": 0.0938,
+ "step": 23800
+ },
+ {
+ "epoch": 64.85286103542235,
+ "grad_norm": 3.7956371307373047,
+ "learning_rate": 5.808885072965057e-06,
+ "loss": 0.0657,
+ "step": 23801
+ },
+ {
+ "epoch": 64.85558583106267,
+ "grad_norm": 3.606250762939453,
+ "learning_rate": 5.808083841717238e-06,
+ "loss": 0.0892,
+ "step": 23802
+ },
+ {
+ "epoch": 64.858310626703,
+ "grad_norm": 4.2467546463012695,
+ "learning_rate": 5.807282643115924e-06,
+ "loss": 0.0761,
+ "step": 23803
+ },
+ {
+ "epoch": 64.86103542234332,
+ "grad_norm": 3.940117359161377,
+ "learning_rate": 5.8064814771673625e-06,
+ "loss": 0.0849,
+ "step": 23804
+ },
+ {
+ "epoch": 64.86376021798365,
+ "grad_norm": 3.2259116172790527,
+ "learning_rate": 5.805680343877783e-06,
+ "loss": 0.146,
+ "step": 23805
+ },
+ {
+ "epoch": 64.86648501362397,
+ "grad_norm": 3.804685592651367,
+ "learning_rate": 5.804879243253435e-06,
+ "loss": 0.0772,
+ "step": 23806
+ },
+ {
+ "epoch": 64.8692098092643,
+ "grad_norm": 4.051899433135986,
+ "learning_rate": 5.804078175300551e-06,
+ "loss": 0.0817,
+ "step": 23807
+ },
+ {
+ "epoch": 64.87193460490464,
+ "grad_norm": 2.5785562992095947,
+ "learning_rate": 5.80327714002537e-06,
+ "loss": 0.1555,
+ "step": 23808
+ },
+ {
+ "epoch": 64.87465940054496,
+ "grad_norm": 3.2376959323883057,
+ "learning_rate": 5.802476137434132e-06,
+ "loss": 0.0874,
+ "step": 23809
+ },
+ {
+ "epoch": 64.87738419618529,
+ "grad_norm": 3.2956013679504395,
+ "learning_rate": 5.801675167533078e-06,
+ "loss": 0.0406,
+ "step": 23810
+ },
+ {
+ "epoch": 64.88010899182561,
+ "grad_norm": 3.075345277786255,
+ "learning_rate": 5.80087423032844e-06,
+ "loss": 0.035,
+ "step": 23811
+ },
+ {
+ "epoch": 64.88283378746594,
+ "grad_norm": 4.006364822387695,
+ "learning_rate": 5.800073325826456e-06,
+ "loss": 0.2162,
+ "step": 23812
+ },
+ {
+ "epoch": 64.88555858310627,
+ "grad_norm": 4.077402114868164,
+ "learning_rate": 5.799272454033369e-06,
+ "loss": 0.0608,
+ "step": 23813
+ },
+ {
+ "epoch": 64.88828337874659,
+ "grad_norm": 4.445973873138428,
+ "learning_rate": 5.7984716149554136e-06,
+ "loss": 0.1193,
+ "step": 23814
+ },
+ {
+ "epoch": 64.89100817438693,
+ "grad_norm": 4.7350358963012695,
+ "learning_rate": 5.797670808598826e-06,
+ "loss": 0.0419,
+ "step": 23815
+ },
+ {
+ "epoch": 64.89373297002724,
+ "grad_norm": 4.542581558227539,
+ "learning_rate": 5.796870034969837e-06,
+ "loss": 0.058,
+ "step": 23816
+ },
+ {
+ "epoch": 64.89645776566758,
+ "grad_norm": 3.4470760822296143,
+ "learning_rate": 5.796069294074696e-06,
+ "loss": 0.1338,
+ "step": 23817
+ },
+ {
+ "epoch": 64.8991825613079,
+ "grad_norm": 6.367007255554199,
+ "learning_rate": 5.795268585919629e-06,
+ "loss": 0.0696,
+ "step": 23818
+ },
+ {
+ "epoch": 64.90190735694823,
+ "grad_norm": 4.687518119812012,
+ "learning_rate": 5.794467910510877e-06,
+ "loss": 0.0515,
+ "step": 23819
+ },
+ {
+ "epoch": 64.90463215258856,
+ "grad_norm": 3.0287528038024902,
+ "learning_rate": 5.793667267854668e-06,
+ "loss": 0.1559,
+ "step": 23820
+ },
+ {
+ "epoch": 64.90735694822888,
+ "grad_norm": 4.91618537902832,
+ "learning_rate": 5.792866657957248e-06,
+ "loss": 0.1055,
+ "step": 23821
+ },
+ {
+ "epoch": 64.91008174386921,
+ "grad_norm": 4.167760372161865,
+ "learning_rate": 5.792066080824843e-06,
+ "loss": 0.1429,
+ "step": 23822
+ },
+ {
+ "epoch": 64.91280653950953,
+ "grad_norm": 5.756951808929443,
+ "learning_rate": 5.791265536463696e-06,
+ "loss": 0.1086,
+ "step": 23823
+ },
+ {
+ "epoch": 64.91553133514986,
+ "grad_norm": 3.9203407764434814,
+ "learning_rate": 5.790465024880033e-06,
+ "loss": 0.2407,
+ "step": 23824
+ },
+ {
+ "epoch": 64.9182561307902,
+ "grad_norm": 3.6706271171569824,
+ "learning_rate": 5.7896645460800986e-06,
+ "loss": 0.0792,
+ "step": 23825
+ },
+ {
+ "epoch": 64.92098092643052,
+ "grad_norm": 2.9809834957122803,
+ "learning_rate": 5.7888641000701195e-06,
+ "loss": 0.0855,
+ "step": 23826
+ },
+ {
+ "epoch": 64.92370572207085,
+ "grad_norm": 2.1346495151519775,
+ "learning_rate": 5.788063686856331e-06,
+ "loss": 0.0711,
+ "step": 23827
+ },
+ {
+ "epoch": 64.92643051771117,
+ "grad_norm": 3.736856460571289,
+ "learning_rate": 5.7872633064449635e-06,
+ "loss": 0.1116,
+ "step": 23828
+ },
+ {
+ "epoch": 64.9291553133515,
+ "grad_norm": 3.1223020553588867,
+ "learning_rate": 5.786462958842258e-06,
+ "loss": 0.1157,
+ "step": 23829
+ },
+ {
+ "epoch": 64.93188010899182,
+ "grad_norm": 3.967301368713379,
+ "learning_rate": 5.785662644054444e-06,
+ "loss": 0.0643,
+ "step": 23830
+ },
+ {
+ "epoch": 64.93460490463215,
+ "grad_norm": 2.076726198196411,
+ "learning_rate": 5.784862362087752e-06,
+ "loss": 0.0399,
+ "step": 23831
+ },
+ {
+ "epoch": 64.93732970027249,
+ "grad_norm": 3.1352274417877197,
+ "learning_rate": 5.7840621129484135e-06,
+ "loss": 0.137,
+ "step": 23832
+ },
+ {
+ "epoch": 64.9400544959128,
+ "grad_norm": 3.6743693351745605,
+ "learning_rate": 5.783261896642667e-06,
+ "loss": 0.0588,
+ "step": 23833
+ },
+ {
+ "epoch": 64.94277929155314,
+ "grad_norm": 3.836276054382324,
+ "learning_rate": 5.7824617131767415e-06,
+ "loss": 0.1027,
+ "step": 23834
+ },
+ {
+ "epoch": 64.94550408719346,
+ "grad_norm": 3.9120116233825684,
+ "learning_rate": 5.7816615625568684e-06,
+ "loss": 0.1289,
+ "step": 23835
+ },
+ {
+ "epoch": 64.94822888283379,
+ "grad_norm": 3.290968894958496,
+ "learning_rate": 5.780861444789275e-06,
+ "loss": 0.1574,
+ "step": 23836
+ },
+ {
+ "epoch": 64.95095367847412,
+ "grad_norm": 4.4691338539123535,
+ "learning_rate": 5.780061359880201e-06,
+ "loss": 0.0539,
+ "step": 23837
+ },
+ {
+ "epoch": 64.95367847411444,
+ "grad_norm": 3.319869041442871,
+ "learning_rate": 5.779261307835873e-06,
+ "loss": 0.1171,
+ "step": 23838
+ },
+ {
+ "epoch": 64.95640326975477,
+ "grad_norm": 3.370058298110962,
+ "learning_rate": 5.778461288662519e-06,
+ "loss": 0.0974,
+ "step": 23839
+ },
+ {
+ "epoch": 64.95912806539509,
+ "grad_norm": 3.132575035095215,
+ "learning_rate": 5.777661302366375e-06,
+ "loss": 0.041,
+ "step": 23840
+ },
+ {
+ "epoch": 64.96185286103542,
+ "grad_norm": 3.5255424976348877,
+ "learning_rate": 5.7768613489536664e-06,
+ "loss": 0.2366,
+ "step": 23841
+ },
+ {
+ "epoch": 64.96457765667574,
+ "grad_norm": 6.005019664764404,
+ "learning_rate": 5.776061428430631e-06,
+ "loss": 0.0631,
+ "step": 23842
+ },
+ {
+ "epoch": 64.96730245231608,
+ "grad_norm": 3.278092384338379,
+ "learning_rate": 5.77526154080349e-06,
+ "loss": 0.055,
+ "step": 23843
+ },
+ {
+ "epoch": 64.97002724795641,
+ "grad_norm": 4.543281555175781,
+ "learning_rate": 5.774461686078474e-06,
+ "loss": 0.0932,
+ "step": 23844
+ },
+ {
+ "epoch": 64.97275204359673,
+ "grad_norm": 3.6716113090515137,
+ "learning_rate": 5.773661864261818e-06,
+ "loss": 0.0464,
+ "step": 23845
+ },
+ {
+ "epoch": 64.97547683923706,
+ "grad_norm": 4.8436408042907715,
+ "learning_rate": 5.772862075359748e-06,
+ "loss": 0.0997,
+ "step": 23846
+ },
+ {
+ "epoch": 64.97820163487738,
+ "grad_norm": 6.906503200531006,
+ "learning_rate": 5.772062319378491e-06,
+ "loss": 0.0867,
+ "step": 23847
+ },
+ {
+ "epoch": 64.98092643051771,
+ "grad_norm": 3.953674077987671,
+ "learning_rate": 5.771262596324273e-06,
+ "loss": 0.2447,
+ "step": 23848
+ },
+ {
+ "epoch": 64.98365122615803,
+ "grad_norm": 4.3087687492370605,
+ "learning_rate": 5.77046290620333e-06,
+ "loss": 0.0432,
+ "step": 23849
+ },
+ {
+ "epoch": 64.98637602179836,
+ "grad_norm": 3.8011410236358643,
+ "learning_rate": 5.7696632490218865e-06,
+ "loss": 0.1285,
+ "step": 23850
+ },
+ {
+ "epoch": 64.9891008174387,
+ "grad_norm": 2.6955769062042236,
+ "learning_rate": 5.768863624786167e-06,
+ "loss": 0.0968,
+ "step": 23851
+ },
+ {
+ "epoch": 64.99182561307902,
+ "grad_norm": 3.028332233428955,
+ "learning_rate": 5.768064033502401e-06,
+ "loss": 0.2483,
+ "step": 23852
+ },
+ {
+ "epoch": 64.99455040871935,
+ "grad_norm": 3.8396477699279785,
+ "learning_rate": 5.767264475176817e-06,
+ "loss": 0.0473,
+ "step": 23853
+ },
+ {
+ "epoch": 64.99727520435967,
+ "grad_norm": 7.509429454803467,
+ "learning_rate": 5.766464949815642e-06,
+ "loss": 0.0472,
+ "step": 23854
+ },
+ {
+ "epoch": 65.0,
+ "grad_norm": 4.404361248016357,
+ "learning_rate": 5.765665457425102e-06,
+ "loss": 0.1461,
+ "step": 23855
+ },
+ {
+ "epoch": 65.00272479564033,
+ "grad_norm": 3.704347610473633,
+ "learning_rate": 5.76486599801142e-06,
+ "loss": 0.1096,
+ "step": 23856
+ },
+ {
+ "epoch": 65.00544959128065,
+ "grad_norm": 3.681830644607544,
+ "learning_rate": 5.7640665715808244e-06,
+ "loss": 0.0545,
+ "step": 23857
+ },
+ {
+ "epoch": 65.00817438692098,
+ "grad_norm": 2.457608461380005,
+ "learning_rate": 5.763267178139544e-06,
+ "loss": 0.0389,
+ "step": 23858
+ },
+ {
+ "epoch": 65.0108991825613,
+ "grad_norm": 4.0209221839904785,
+ "learning_rate": 5.7624678176938055e-06,
+ "loss": 0.0727,
+ "step": 23859
+ },
+ {
+ "epoch": 65.01362397820164,
+ "grad_norm": 4.337145805358887,
+ "learning_rate": 5.76166849024983e-06,
+ "loss": 0.0531,
+ "step": 23860
+ },
+ {
+ "epoch": 65.01634877384195,
+ "grad_norm": 3.689896821975708,
+ "learning_rate": 5.760869195813841e-06,
+ "loss": 0.0878,
+ "step": 23861
+ },
+ {
+ "epoch": 65.01907356948229,
+ "grad_norm": 2.472669839859009,
+ "learning_rate": 5.760069934392068e-06,
+ "loss": 0.0407,
+ "step": 23862
+ },
+ {
+ "epoch": 65.02179836512262,
+ "grad_norm": 2.7535672187805176,
+ "learning_rate": 5.759270705990736e-06,
+ "loss": 0.1648,
+ "step": 23863
+ },
+ {
+ "epoch": 65.02452316076294,
+ "grad_norm": 3.401129722595215,
+ "learning_rate": 5.758471510616066e-06,
+ "loss": 0.0941,
+ "step": 23864
+ },
+ {
+ "epoch": 65.02724795640327,
+ "grad_norm": 3.3423852920532227,
+ "learning_rate": 5.75767234827428e-06,
+ "loss": 0.1656,
+ "step": 23865
+ },
+ {
+ "epoch": 65.02997275204359,
+ "grad_norm": 8.871487617492676,
+ "learning_rate": 5.756873218971609e-06,
+ "loss": 0.1037,
+ "step": 23866
+ },
+ {
+ "epoch": 65.03269754768392,
+ "grad_norm": 3.4835875034332275,
+ "learning_rate": 5.756074122714272e-06,
+ "loss": 0.0955,
+ "step": 23867
+ },
+ {
+ "epoch": 65.03542234332426,
+ "grad_norm": 4.024458408355713,
+ "learning_rate": 5.755275059508492e-06,
+ "loss": 0.1101,
+ "step": 23868
+ },
+ {
+ "epoch": 65.03814713896458,
+ "grad_norm": 6.285836219787598,
+ "learning_rate": 5.754476029360494e-06,
+ "loss": 0.0603,
+ "step": 23869
+ },
+ {
+ "epoch": 65.04087193460491,
+ "grad_norm": 2.6335160732269287,
+ "learning_rate": 5.753677032276501e-06,
+ "loss": 0.027,
+ "step": 23870
+ },
+ {
+ "epoch": 65.04359673024523,
+ "grad_norm": 7.402361869812012,
+ "learning_rate": 5.752878068262735e-06,
+ "loss": 0.0817,
+ "step": 23871
+ },
+ {
+ "epoch": 65.04632152588556,
+ "grad_norm": 3.73759388923645,
+ "learning_rate": 5.7520791373254135e-06,
+ "loss": 0.2076,
+ "step": 23872
+ },
+ {
+ "epoch": 65.04904632152588,
+ "grad_norm": 4.1924967765808105,
+ "learning_rate": 5.751280239470768e-06,
+ "loss": 0.1566,
+ "step": 23873
+ },
+ {
+ "epoch": 65.05177111716621,
+ "grad_norm": 3.7623181343078613,
+ "learning_rate": 5.750481374705011e-06,
+ "loss": 0.0936,
+ "step": 23874
+ },
+ {
+ "epoch": 65.05449591280654,
+ "grad_norm": 3.846261978149414,
+ "learning_rate": 5.749682543034371e-06,
+ "loss": 0.0799,
+ "step": 23875
+ },
+ {
+ "epoch": 65.05722070844686,
+ "grad_norm": 3.157371997833252,
+ "learning_rate": 5.748883744465067e-06,
+ "loss": 0.0922,
+ "step": 23876
+ },
+ {
+ "epoch": 65.0599455040872,
+ "grad_norm": 3.514310836791992,
+ "learning_rate": 5.748084979003317e-06,
+ "loss": 0.0944,
+ "step": 23877
+ },
+ {
+ "epoch": 65.06267029972751,
+ "grad_norm": 3.686051607131958,
+ "learning_rate": 5.7472862466553455e-06,
+ "loss": 0.0584,
+ "step": 23878
+ },
+ {
+ "epoch": 65.06539509536785,
+ "grad_norm": 3.2389907836914062,
+ "learning_rate": 5.746487547427375e-06,
+ "loss": 0.031,
+ "step": 23879
+ },
+ {
+ "epoch": 65.06811989100818,
+ "grad_norm": 4.23587703704834,
+ "learning_rate": 5.74568888132562e-06,
+ "loss": 0.0866,
+ "step": 23880
+ },
+ {
+ "epoch": 65.0708446866485,
+ "grad_norm": 3.1292333602905273,
+ "learning_rate": 5.744890248356301e-06,
+ "loss": 0.1782,
+ "step": 23881
+ },
+ {
+ "epoch": 65.07356948228883,
+ "grad_norm": 6.11333703994751,
+ "learning_rate": 5.744091648525642e-06,
+ "loss": 0.1356,
+ "step": 23882
+ },
+ {
+ "epoch": 65.07629427792915,
+ "grad_norm": 3.8605904579162598,
+ "learning_rate": 5.743293081839862e-06,
+ "loss": 0.1539,
+ "step": 23883
+ },
+ {
+ "epoch": 65.07901907356948,
+ "grad_norm": 3.3380041122436523,
+ "learning_rate": 5.742494548305177e-06,
+ "loss": 0.0656,
+ "step": 23884
+ },
+ {
+ "epoch": 65.0817438692098,
+ "grad_norm": 2.9059176445007324,
+ "learning_rate": 5.741696047927805e-06,
+ "loss": 0.1074,
+ "step": 23885
+ },
+ {
+ "epoch": 65.08446866485014,
+ "grad_norm": 4.149163246154785,
+ "learning_rate": 5.74089758071397e-06,
+ "loss": 0.1008,
+ "step": 23886
+ },
+ {
+ "epoch": 65.08719346049047,
+ "grad_norm": 5.573852062225342,
+ "learning_rate": 5.740099146669888e-06,
+ "loss": 0.1068,
+ "step": 23887
+ },
+ {
+ "epoch": 65.08991825613079,
+ "grad_norm": 2.9669737815856934,
+ "learning_rate": 5.739300745801777e-06,
+ "loss": 0.0586,
+ "step": 23888
+ },
+ {
+ "epoch": 65.09264305177112,
+ "grad_norm": 5.7165207862854,
+ "learning_rate": 5.73850237811585e-06,
+ "loss": 0.1362,
+ "step": 23889
+ },
+ {
+ "epoch": 65.09536784741144,
+ "grad_norm": 3.295400619506836,
+ "learning_rate": 5.737704043618333e-06,
+ "loss": 0.1248,
+ "step": 23890
+ },
+ {
+ "epoch": 65.09809264305177,
+ "grad_norm": 3.5518786907196045,
+ "learning_rate": 5.7369057423154376e-06,
+ "loss": 0.1259,
+ "step": 23891
+ },
+ {
+ "epoch": 65.1008174386921,
+ "grad_norm": 3.840667486190796,
+ "learning_rate": 5.736107474213385e-06,
+ "loss": 0.0872,
+ "step": 23892
+ },
+ {
+ "epoch": 65.10354223433242,
+ "grad_norm": 2.7150371074676514,
+ "learning_rate": 5.735309239318387e-06,
+ "loss": 0.0492,
+ "step": 23893
+ },
+ {
+ "epoch": 65.10626702997276,
+ "grad_norm": 4.040241718292236,
+ "learning_rate": 5.734511037636667e-06,
+ "loss": 0.102,
+ "step": 23894
+ },
+ {
+ "epoch": 65.10899182561307,
+ "grad_norm": 3.0391008853912354,
+ "learning_rate": 5.7337128691744395e-06,
+ "loss": 0.1093,
+ "step": 23895
+ },
+ {
+ "epoch": 65.11171662125341,
+ "grad_norm": 3.4439523220062256,
+ "learning_rate": 5.732914733937917e-06,
+ "loss": 0.1107,
+ "step": 23896
+ },
+ {
+ "epoch": 65.11444141689373,
+ "grad_norm": 2.2255547046661377,
+ "learning_rate": 5.732116631933313e-06,
+ "loss": 0.064,
+ "step": 23897
+ },
+ {
+ "epoch": 65.11716621253406,
+ "grad_norm": 2.6797420978546143,
+ "learning_rate": 5.731318563166852e-06,
+ "loss": 0.1443,
+ "step": 23898
+ },
+ {
+ "epoch": 65.11989100817439,
+ "grad_norm": 2.8840904235839844,
+ "learning_rate": 5.7305205276447454e-06,
+ "loss": 0.0928,
+ "step": 23899
+ },
+ {
+ "epoch": 65.12261580381471,
+ "grad_norm": 5.082234859466553,
+ "learning_rate": 5.729722525373206e-06,
+ "loss": 0.1268,
+ "step": 23900
+ },
+ {
+ "epoch": 65.12534059945504,
+ "grad_norm": 4.612484931945801,
+ "learning_rate": 5.728924556358446e-06,
+ "loss": 0.1005,
+ "step": 23901
+ },
+ {
+ "epoch": 65.12806539509536,
+ "grad_norm": 7.932746410369873,
+ "learning_rate": 5.72812662060669e-06,
+ "loss": 0.0973,
+ "step": 23902
+ },
+ {
+ "epoch": 65.1307901907357,
+ "grad_norm": 3.5816659927368164,
+ "learning_rate": 5.727328718124146e-06,
+ "loss": 0.0798,
+ "step": 23903
+ },
+ {
+ "epoch": 65.13351498637603,
+ "grad_norm": 4.132866382598877,
+ "learning_rate": 5.726530848917027e-06,
+ "loss": 0.0699,
+ "step": 23904
+ },
+ {
+ "epoch": 65.13623978201635,
+ "grad_norm": 3.856076240539551,
+ "learning_rate": 5.725733012991545e-06,
+ "loss": 0.1263,
+ "step": 23905
+ },
+ {
+ "epoch": 65.13896457765668,
+ "grad_norm": 2.9017820358276367,
+ "learning_rate": 5.724935210353921e-06,
+ "loss": 0.0398,
+ "step": 23906
+ },
+ {
+ "epoch": 65.141689373297,
+ "grad_norm": 4.9340362548828125,
+ "learning_rate": 5.724137441010363e-06,
+ "loss": 0.0603,
+ "step": 23907
+ },
+ {
+ "epoch": 65.14441416893733,
+ "grad_norm": 3.251796245574951,
+ "learning_rate": 5.723339704967081e-06,
+ "loss": 0.1711,
+ "step": 23908
+ },
+ {
+ "epoch": 65.14713896457765,
+ "grad_norm": 3.3560702800750732,
+ "learning_rate": 5.722542002230293e-06,
+ "loss": 0.0489,
+ "step": 23909
+ },
+ {
+ "epoch": 65.14986376021798,
+ "grad_norm": 2.926656723022461,
+ "learning_rate": 5.721744332806214e-06,
+ "loss": 0.1059,
+ "step": 23910
+ },
+ {
+ "epoch": 65.15258855585832,
+ "grad_norm": 3.202542781829834,
+ "learning_rate": 5.720946696701053e-06,
+ "loss": 0.0916,
+ "step": 23911
+ },
+ {
+ "epoch": 65.15531335149863,
+ "grad_norm": 2.3384954929351807,
+ "learning_rate": 5.720149093921019e-06,
+ "loss": 0.0805,
+ "step": 23912
+ },
+ {
+ "epoch": 65.15803814713897,
+ "grad_norm": 3.166487693786621,
+ "learning_rate": 5.719351524472326e-06,
+ "loss": 0.0754,
+ "step": 23913
+ },
+ {
+ "epoch": 65.16076294277929,
+ "grad_norm": 3.3758294582366943,
+ "learning_rate": 5.718553988361186e-06,
+ "loss": 0.0535,
+ "step": 23914
+ },
+ {
+ "epoch": 65.16348773841962,
+ "grad_norm": 3.6121857166290283,
+ "learning_rate": 5.717756485593811e-06,
+ "loss": 0.1576,
+ "step": 23915
+ },
+ {
+ "epoch": 65.16621253405995,
+ "grad_norm": 3.9699673652648926,
+ "learning_rate": 5.71695901617641e-06,
+ "loss": 0.1821,
+ "step": 23916
+ },
+ {
+ "epoch": 65.16893732970027,
+ "grad_norm": 5.422703266143799,
+ "learning_rate": 5.716161580115192e-06,
+ "loss": 0.0867,
+ "step": 23917
+ },
+ {
+ "epoch": 65.1716621253406,
+ "grad_norm": 3.7113823890686035,
+ "learning_rate": 5.715364177416371e-06,
+ "loss": 0.074,
+ "step": 23918
+ },
+ {
+ "epoch": 65.17438692098092,
+ "grad_norm": 3.7007954120635986,
+ "learning_rate": 5.714566808086159e-06,
+ "loss": 0.06,
+ "step": 23919
+ },
+ {
+ "epoch": 65.17711171662125,
+ "grad_norm": 2.973315954208374,
+ "learning_rate": 5.713769472130761e-06,
+ "loss": 0.0549,
+ "step": 23920
+ },
+ {
+ "epoch": 65.17983651226157,
+ "grad_norm": 3.80631685256958,
+ "learning_rate": 5.712972169556384e-06,
+ "loss": 0.1644,
+ "step": 23921
+ },
+ {
+ "epoch": 65.1825613079019,
+ "grad_norm": 3.6280059814453125,
+ "learning_rate": 5.712174900369247e-06,
+ "loss": 0.0815,
+ "step": 23922
+ },
+ {
+ "epoch": 65.18528610354224,
+ "grad_norm": 3.664151191711426,
+ "learning_rate": 5.7113776645755525e-06,
+ "loss": 0.0644,
+ "step": 23923
+ },
+ {
+ "epoch": 65.18801089918256,
+ "grad_norm": 3.0507638454437256,
+ "learning_rate": 5.710580462181512e-06,
+ "loss": 0.0471,
+ "step": 23924
+ },
+ {
+ "epoch": 65.19073569482289,
+ "grad_norm": 3.5027029514312744,
+ "learning_rate": 5.709783293193329e-06,
+ "loss": 0.0435,
+ "step": 23925
+ },
+ {
+ "epoch": 65.19346049046321,
+ "grad_norm": 3.2568349838256836,
+ "learning_rate": 5.708986157617215e-06,
+ "loss": 0.1404,
+ "step": 23926
+ },
+ {
+ "epoch": 65.19618528610354,
+ "grad_norm": 3.2480835914611816,
+ "learning_rate": 5.708189055459382e-06,
+ "loss": 0.1218,
+ "step": 23927
+ },
+ {
+ "epoch": 65.19891008174388,
+ "grad_norm": 3.107895612716675,
+ "learning_rate": 5.707391986726035e-06,
+ "loss": 0.1223,
+ "step": 23928
+ },
+ {
+ "epoch": 65.2016348773842,
+ "grad_norm": 3.600494146347046,
+ "learning_rate": 5.706594951423381e-06,
+ "loss": 0.1503,
+ "step": 23929
+ },
+ {
+ "epoch": 65.20435967302453,
+ "grad_norm": 2.3023030757904053,
+ "learning_rate": 5.705797949557624e-06,
+ "loss": 0.0413,
+ "step": 23930
+ },
+ {
+ "epoch": 65.20708446866485,
+ "grad_norm": 5.529454231262207,
+ "learning_rate": 5.705000981134979e-06,
+ "loss": 0.1598,
+ "step": 23931
+ },
+ {
+ "epoch": 65.20980926430518,
+ "grad_norm": 3.8024990558624268,
+ "learning_rate": 5.704204046161647e-06,
+ "loss": 0.0639,
+ "step": 23932
+ },
+ {
+ "epoch": 65.2125340599455,
+ "grad_norm": 2.6368520259857178,
+ "learning_rate": 5.703407144643831e-06,
+ "loss": 0.0415,
+ "step": 23933
+ },
+ {
+ "epoch": 65.21525885558583,
+ "grad_norm": 3.5451037883758545,
+ "learning_rate": 5.702610276587747e-06,
+ "loss": 0.0826,
+ "step": 23934
+ },
+ {
+ "epoch": 65.21798365122616,
+ "grad_norm": 3.3370540142059326,
+ "learning_rate": 5.701813441999596e-06,
+ "loss": 0.1027,
+ "step": 23935
+ },
+ {
+ "epoch": 65.22070844686648,
+ "grad_norm": 3.4198203086853027,
+ "learning_rate": 5.701016640885582e-06,
+ "loss": 0.1539,
+ "step": 23936
+ },
+ {
+ "epoch": 65.22343324250681,
+ "grad_norm": 2.761240243911743,
+ "learning_rate": 5.700219873251909e-06,
+ "loss": 0.0561,
+ "step": 23937
+ },
+ {
+ "epoch": 65.22615803814713,
+ "grad_norm": 3.3922760486602783,
+ "learning_rate": 5.699423139104789e-06,
+ "loss": 0.058,
+ "step": 23938
+ },
+ {
+ "epoch": 65.22888283378747,
+ "grad_norm": 4.2228875160217285,
+ "learning_rate": 5.698626438450423e-06,
+ "loss": 0.0668,
+ "step": 23939
+ },
+ {
+ "epoch": 65.2316076294278,
+ "grad_norm": 2.832742691040039,
+ "learning_rate": 5.697829771295017e-06,
+ "loss": 0.0572,
+ "step": 23940
+ },
+ {
+ "epoch": 65.23433242506812,
+ "grad_norm": 3.4886770248413086,
+ "learning_rate": 5.69703313764477e-06,
+ "loss": 0.1091,
+ "step": 23941
+ },
+ {
+ "epoch": 65.23705722070845,
+ "grad_norm": 3.390244722366333,
+ "learning_rate": 5.69623653750589e-06,
+ "loss": 0.0806,
+ "step": 23942
+ },
+ {
+ "epoch": 65.23978201634877,
+ "grad_norm": 2.5988874435424805,
+ "learning_rate": 5.695439970884585e-06,
+ "loss": 0.0569,
+ "step": 23943
+ },
+ {
+ "epoch": 65.2425068119891,
+ "grad_norm": 3.5327260494232178,
+ "learning_rate": 5.694643437787055e-06,
+ "loss": 0.0625,
+ "step": 23944
+ },
+ {
+ "epoch": 65.24523160762942,
+ "grad_norm": 3.5905511379241943,
+ "learning_rate": 5.693846938219505e-06,
+ "loss": 0.1286,
+ "step": 23945
+ },
+ {
+ "epoch": 65.24795640326975,
+ "grad_norm": 3.403218984603882,
+ "learning_rate": 5.693050472188131e-06,
+ "loss": 0.2239,
+ "step": 23946
+ },
+ {
+ "epoch": 65.25068119891009,
+ "grad_norm": 5.678621768951416,
+ "learning_rate": 5.692254039699146e-06,
+ "loss": 0.0844,
+ "step": 23947
+ },
+ {
+ "epoch": 65.2534059945504,
+ "grad_norm": 4.893455505371094,
+ "learning_rate": 5.691457640758746e-06,
+ "loss": 0.1923,
+ "step": 23948
+ },
+ {
+ "epoch": 65.25613079019074,
+ "grad_norm": 4.162020683288574,
+ "learning_rate": 5.690661275373137e-06,
+ "loss": 0.0803,
+ "step": 23949
+ },
+ {
+ "epoch": 65.25885558583106,
+ "grad_norm": 3.102487564086914,
+ "learning_rate": 5.689864943548514e-06,
+ "loss": 0.1249,
+ "step": 23950
+ },
+ {
+ "epoch": 65.26158038147139,
+ "grad_norm": 4.126766681671143,
+ "learning_rate": 5.68906864529109e-06,
+ "loss": 0.0503,
+ "step": 23951
+ },
+ {
+ "epoch": 65.26430517711172,
+ "grad_norm": 3.4668099880218506,
+ "learning_rate": 5.688272380607058e-06,
+ "loss": 0.0627,
+ "step": 23952
+ },
+ {
+ "epoch": 65.26702997275204,
+ "grad_norm": 4.390965938568115,
+ "learning_rate": 5.68747614950262e-06,
+ "loss": 0.1044,
+ "step": 23953
+ },
+ {
+ "epoch": 65.26975476839237,
+ "grad_norm": 3.341416597366333,
+ "learning_rate": 5.686679951983982e-06,
+ "loss": 0.2101,
+ "step": 23954
+ },
+ {
+ "epoch": 65.2724795640327,
+ "grad_norm": 3.0021090507507324,
+ "learning_rate": 5.6858837880573426e-06,
+ "loss": 0.1412,
+ "step": 23955
+ },
+ {
+ "epoch": 65.27520435967303,
+ "grad_norm": 3.424797534942627,
+ "learning_rate": 5.685087657728902e-06,
+ "loss": 0.0528,
+ "step": 23956
+ },
+ {
+ "epoch": 65.27792915531334,
+ "grad_norm": 5.805532932281494,
+ "learning_rate": 5.6842915610048545e-06,
+ "loss": 0.0576,
+ "step": 23957
+ },
+ {
+ "epoch": 65.28065395095368,
+ "grad_norm": 3.436185836791992,
+ "learning_rate": 5.683495497891409e-06,
+ "loss": 0.0781,
+ "step": 23958
+ },
+ {
+ "epoch": 65.28337874659401,
+ "grad_norm": 3.735299825668335,
+ "learning_rate": 5.682699468394763e-06,
+ "loss": 0.0649,
+ "step": 23959
+ },
+ {
+ "epoch": 65.28610354223433,
+ "grad_norm": 5.107840061187744,
+ "learning_rate": 5.6819034725211096e-06,
+ "loss": 0.0715,
+ "step": 23960
+ },
+ {
+ "epoch": 65.28882833787466,
+ "grad_norm": 3.0492615699768066,
+ "learning_rate": 5.681107510276658e-06,
+ "loss": 0.0492,
+ "step": 23961
+ },
+ {
+ "epoch": 65.29155313351498,
+ "grad_norm": 2.9003193378448486,
+ "learning_rate": 5.680311581667597e-06,
+ "loss": 0.0675,
+ "step": 23962
+ },
+ {
+ "epoch": 65.29427792915531,
+ "grad_norm": 4.069297790527344,
+ "learning_rate": 5.6795156867001345e-06,
+ "loss": 0.0813,
+ "step": 23963
+ },
+ {
+ "epoch": 65.29700272479565,
+ "grad_norm": 6.263089179992676,
+ "learning_rate": 5.678719825380466e-06,
+ "loss": 0.0683,
+ "step": 23964
+ },
+ {
+ "epoch": 65.29972752043597,
+ "grad_norm": 2.939884662628174,
+ "learning_rate": 5.677923997714787e-06,
+ "loss": 0.1354,
+ "step": 23965
+ },
+ {
+ "epoch": 65.3024523160763,
+ "grad_norm": 15.638578414916992,
+ "learning_rate": 5.677128203709294e-06,
+ "loss": 0.081,
+ "step": 23966
+ },
+ {
+ "epoch": 65.30517711171662,
+ "grad_norm": 3.349811315536499,
+ "learning_rate": 5.676332443370189e-06,
+ "loss": 0.2152,
+ "step": 23967
+ },
+ {
+ "epoch": 65.30790190735695,
+ "grad_norm": 2.394726037979126,
+ "learning_rate": 5.675536716703671e-06,
+ "loss": 0.0341,
+ "step": 23968
+ },
+ {
+ "epoch": 65.31062670299727,
+ "grad_norm": 5.335820198059082,
+ "learning_rate": 5.674741023715933e-06,
+ "loss": 0.1909,
+ "step": 23969
+ },
+ {
+ "epoch": 65.3133514986376,
+ "grad_norm": 3.1315112113952637,
+ "learning_rate": 5.673945364413167e-06,
+ "loss": 0.0595,
+ "step": 23970
+ },
+ {
+ "epoch": 65.31607629427793,
+ "grad_norm": 3.580753803253174,
+ "learning_rate": 5.67314973880158e-06,
+ "loss": 0.0642,
+ "step": 23971
+ },
+ {
+ "epoch": 65.31880108991825,
+ "grad_norm": 3.06107759475708,
+ "learning_rate": 5.672354146887364e-06,
+ "loss": 0.1235,
+ "step": 23972
+ },
+ {
+ "epoch": 65.32152588555859,
+ "grad_norm": 3.051346778869629,
+ "learning_rate": 5.671558588676715e-06,
+ "loss": 0.0778,
+ "step": 23973
+ },
+ {
+ "epoch": 65.3242506811989,
+ "grad_norm": 4.6618781089782715,
+ "learning_rate": 5.6707630641758235e-06,
+ "loss": 0.057,
+ "step": 23974
+ },
+ {
+ "epoch": 65.32697547683924,
+ "grad_norm": 3.14992094039917,
+ "learning_rate": 5.6699675733908955e-06,
+ "loss": 0.1994,
+ "step": 23975
+ },
+ {
+ "epoch": 65.32970027247957,
+ "grad_norm": 5.335004806518555,
+ "learning_rate": 5.6691721163281185e-06,
+ "loss": 0.11,
+ "step": 23976
+ },
+ {
+ "epoch": 65.33242506811989,
+ "grad_norm": 3.9652626514434814,
+ "learning_rate": 5.668376692993687e-06,
+ "loss": 0.0529,
+ "step": 23977
+ },
+ {
+ "epoch": 65.33514986376022,
+ "grad_norm": 2.6379270553588867,
+ "learning_rate": 5.6675813033937985e-06,
+ "loss": 0.0925,
+ "step": 23978
+ },
+ {
+ "epoch": 65.33787465940054,
+ "grad_norm": 3.380904197692871,
+ "learning_rate": 5.666785947534651e-06,
+ "loss": 0.0937,
+ "step": 23979
+ },
+ {
+ "epoch": 65.34059945504087,
+ "grad_norm": 2.9610610008239746,
+ "learning_rate": 5.6659906254224355e-06,
+ "loss": 0.0366,
+ "step": 23980
+ },
+ {
+ "epoch": 65.34332425068119,
+ "grad_norm": 4.081940174102783,
+ "learning_rate": 5.665195337063345e-06,
+ "loss": 0.0642,
+ "step": 23981
+ },
+ {
+ "epoch": 65.34604904632153,
+ "grad_norm": 3.9273087978363037,
+ "learning_rate": 5.664400082463569e-06,
+ "loss": 0.2661,
+ "step": 23982
+ },
+ {
+ "epoch": 65.34877384196186,
+ "grad_norm": 4.0738115310668945,
+ "learning_rate": 5.663604861629311e-06,
+ "loss": 0.0475,
+ "step": 23983
+ },
+ {
+ "epoch": 65.35149863760218,
+ "grad_norm": 2.5269320011138916,
+ "learning_rate": 5.662809674566759e-06,
+ "loss": 0.0425,
+ "step": 23984
+ },
+ {
+ "epoch": 65.35422343324251,
+ "grad_norm": 3.172858238220215,
+ "learning_rate": 5.662014521282104e-06,
+ "loss": 0.1479,
+ "step": 23985
+ },
+ {
+ "epoch": 65.35694822888283,
+ "grad_norm": 3.7630107402801514,
+ "learning_rate": 5.661219401781537e-06,
+ "loss": 0.1608,
+ "step": 23986
+ },
+ {
+ "epoch": 65.35967302452316,
+ "grad_norm": 2.8426389694213867,
+ "learning_rate": 5.660424316071258e-06,
+ "loss": 0.0597,
+ "step": 23987
+ },
+ {
+ "epoch": 65.3623978201635,
+ "grad_norm": 3.6083157062530518,
+ "learning_rate": 5.6596292641574535e-06,
+ "loss": 0.077,
+ "step": 23988
+ },
+ {
+ "epoch": 65.36512261580381,
+ "grad_norm": 3.9012110233306885,
+ "learning_rate": 5.658834246046319e-06,
+ "loss": 0.077,
+ "step": 23989
+ },
+ {
+ "epoch": 65.36784741144415,
+ "grad_norm": 5.432197570800781,
+ "learning_rate": 5.658039261744037e-06,
+ "loss": 0.0528,
+ "step": 23990
+ },
+ {
+ "epoch": 65.37057220708446,
+ "grad_norm": 4.274069786071777,
+ "learning_rate": 5.657244311256811e-06,
+ "loss": 0.0567,
+ "step": 23991
+ },
+ {
+ "epoch": 65.3732970027248,
+ "grad_norm": 2.6049606800079346,
+ "learning_rate": 5.656449394590826e-06,
+ "loss": 0.0566,
+ "step": 23992
+ },
+ {
+ "epoch": 65.37602179836512,
+ "grad_norm": 3.093290328979492,
+ "learning_rate": 5.655654511752274e-06,
+ "loss": 0.0436,
+ "step": 23993
+ },
+ {
+ "epoch": 65.37874659400545,
+ "grad_norm": 5.726058483123779,
+ "learning_rate": 5.654859662747337e-06,
+ "loss": 0.0719,
+ "step": 23994
+ },
+ {
+ "epoch": 65.38147138964578,
+ "grad_norm": 4.21392822265625,
+ "learning_rate": 5.6540648475822215e-06,
+ "loss": 0.1087,
+ "step": 23995
+ },
+ {
+ "epoch": 65.3841961852861,
+ "grad_norm": 7.224810600280762,
+ "learning_rate": 5.653270066263108e-06,
+ "loss": 0.2051,
+ "step": 23996
+ },
+ {
+ "epoch": 65.38692098092643,
+ "grad_norm": 2.78900408744812,
+ "learning_rate": 5.6524753187961865e-06,
+ "loss": 0.0409,
+ "step": 23997
+ },
+ {
+ "epoch": 65.38964577656675,
+ "grad_norm": 2.8519763946533203,
+ "learning_rate": 5.6516806051876435e-06,
+ "loss": 0.2213,
+ "step": 23998
+ },
+ {
+ "epoch": 65.39237057220708,
+ "grad_norm": 2.725651502609253,
+ "learning_rate": 5.650885925443678e-06,
+ "loss": 0.1322,
+ "step": 23999
+ },
+ {
+ "epoch": 65.39509536784742,
+ "grad_norm": 2.827827215194702,
+ "learning_rate": 5.650091279570471e-06,
+ "loss": 0.0543,
+ "step": 24000
+ },
+ {
+ "epoch": 65.39782016348774,
+ "grad_norm": 3.800290584564209,
+ "learning_rate": 5.649296667574215e-06,
+ "loss": 0.0997,
+ "step": 24001
+ },
+ {
+ "epoch": 65.40054495912807,
+ "grad_norm": 2.7473745346069336,
+ "learning_rate": 5.6485020894610905e-06,
+ "loss": 0.0733,
+ "step": 24002
+ },
+ {
+ "epoch": 65.40326975476839,
+ "grad_norm": 3.0474374294281006,
+ "learning_rate": 5.647707545237298e-06,
+ "loss": 0.0391,
+ "step": 24003
+ },
+ {
+ "epoch": 65.40599455040872,
+ "grad_norm": 2.3979551792144775,
+ "learning_rate": 5.646913034909016e-06,
+ "loss": 0.0303,
+ "step": 24004
+ },
+ {
+ "epoch": 65.40871934604904,
+ "grad_norm": 5.561906814575195,
+ "learning_rate": 5.646118558482438e-06,
+ "loss": 0.0617,
+ "step": 24005
+ },
+ {
+ "epoch": 65.41144414168937,
+ "grad_norm": 4.902659893035889,
+ "learning_rate": 5.645324115963742e-06,
+ "loss": 0.0445,
+ "step": 24006
+ },
+ {
+ "epoch": 65.4141689373297,
+ "grad_norm": 3.7582004070281982,
+ "learning_rate": 5.644529707359128e-06,
+ "loss": 0.1675,
+ "step": 24007
+ },
+ {
+ "epoch": 65.41689373297002,
+ "grad_norm": 2.687662124633789,
+ "learning_rate": 5.643735332674776e-06,
+ "loss": 0.0862,
+ "step": 24008
+ },
+ {
+ "epoch": 65.41961852861036,
+ "grad_norm": 7.281131744384766,
+ "learning_rate": 5.6429409919168724e-06,
+ "loss": 0.1605,
+ "step": 24009
+ },
+ {
+ "epoch": 65.42234332425068,
+ "grad_norm": 4.193109035491943,
+ "learning_rate": 5.6421466850915986e-06,
+ "loss": 0.115,
+ "step": 24010
+ },
+ {
+ "epoch": 65.42506811989101,
+ "grad_norm": 2.208326578140259,
+ "learning_rate": 5.641352412205148e-06,
+ "loss": 0.1176,
+ "step": 24011
+ },
+ {
+ "epoch": 65.42779291553134,
+ "grad_norm": 2.9011576175689697,
+ "learning_rate": 5.640558173263708e-06,
+ "loss": 0.0433,
+ "step": 24012
+ },
+ {
+ "epoch": 65.43051771117166,
+ "grad_norm": 3.144461154937744,
+ "learning_rate": 5.6397639682734616e-06,
+ "loss": 0.115,
+ "step": 24013
+ },
+ {
+ "epoch": 65.433242506812,
+ "grad_norm": 8.688531875610352,
+ "learning_rate": 5.638969797240592e-06,
+ "loss": 0.1619,
+ "step": 24014
+ },
+ {
+ "epoch": 65.43596730245231,
+ "grad_norm": 3.3656513690948486,
+ "learning_rate": 5.638175660171281e-06,
+ "loss": 0.0642,
+ "step": 24015
+ },
+ {
+ "epoch": 65.43869209809264,
+ "grad_norm": 3.899275302886963,
+ "learning_rate": 5.637381557071724e-06,
+ "loss": 0.1298,
+ "step": 24016
+ },
+ {
+ "epoch": 65.44141689373296,
+ "grad_norm": 3.7607948780059814,
+ "learning_rate": 5.636587487948096e-06,
+ "loss": 0.153,
+ "step": 24017
+ },
+ {
+ "epoch": 65.4441416893733,
+ "grad_norm": 3.140089750289917,
+ "learning_rate": 5.635793452806582e-06,
+ "loss": 0.106,
+ "step": 24018
+ },
+ {
+ "epoch": 65.44686648501363,
+ "grad_norm": 3.5234313011169434,
+ "learning_rate": 5.634999451653372e-06,
+ "loss": 0.0493,
+ "step": 24019
+ },
+ {
+ "epoch": 65.44959128065395,
+ "grad_norm": 3.7180094718933105,
+ "learning_rate": 5.6342054844946446e-06,
+ "loss": 0.0855,
+ "step": 24020
+ },
+ {
+ "epoch": 65.45231607629428,
+ "grad_norm": 2.1237192153930664,
+ "learning_rate": 5.633411551336585e-06,
+ "loss": 0.0274,
+ "step": 24021
+ },
+ {
+ "epoch": 65.4550408719346,
+ "grad_norm": 5.453552722930908,
+ "learning_rate": 5.6326176521853725e-06,
+ "loss": 0.1127,
+ "step": 24022
+ },
+ {
+ "epoch": 65.45776566757493,
+ "grad_norm": 4.5644965171813965,
+ "learning_rate": 5.631823787047196e-06,
+ "loss": 0.0522,
+ "step": 24023
+ },
+ {
+ "epoch": 65.46049046321527,
+ "grad_norm": 4.731208801269531,
+ "learning_rate": 5.631029955928236e-06,
+ "loss": 0.0849,
+ "step": 24024
+ },
+ {
+ "epoch": 65.46321525885558,
+ "grad_norm": 3.8543739318847656,
+ "learning_rate": 5.630236158834675e-06,
+ "loss": 0.0694,
+ "step": 24025
+ },
+ {
+ "epoch": 65.46594005449592,
+ "grad_norm": 6.913013935089111,
+ "learning_rate": 5.629442395772688e-06,
+ "loss": 0.0746,
+ "step": 24026
+ },
+ {
+ "epoch": 65.46866485013624,
+ "grad_norm": 3.2953193187713623,
+ "learning_rate": 5.628648666748467e-06,
+ "loss": 0.0407,
+ "step": 24027
+ },
+ {
+ "epoch": 65.47138964577657,
+ "grad_norm": 5.9116411209106445,
+ "learning_rate": 5.627854971768187e-06,
+ "loss": 0.0566,
+ "step": 24028
+ },
+ {
+ "epoch": 65.47411444141689,
+ "grad_norm": 2.8418362140655518,
+ "learning_rate": 5.627061310838035e-06,
+ "loss": 0.0636,
+ "step": 24029
+ },
+ {
+ "epoch": 65.47683923705722,
+ "grad_norm": 3.1597983837127686,
+ "learning_rate": 5.626267683964188e-06,
+ "loss": 0.2027,
+ "step": 24030
+ },
+ {
+ "epoch": 65.47956403269755,
+ "grad_norm": 4.115743637084961,
+ "learning_rate": 5.625474091152825e-06,
+ "loss": 0.0791,
+ "step": 24031
+ },
+ {
+ "epoch": 65.48228882833787,
+ "grad_norm": 2.599477767944336,
+ "learning_rate": 5.624680532410134e-06,
+ "loss": 0.0422,
+ "step": 24032
+ },
+ {
+ "epoch": 65.4850136239782,
+ "grad_norm": 3.156306028366089,
+ "learning_rate": 5.623887007742288e-06,
+ "loss": 0.0869,
+ "step": 24033
+ },
+ {
+ "epoch": 65.48773841961852,
+ "grad_norm": 3.8809096813201904,
+ "learning_rate": 5.623093517155469e-06,
+ "loss": 0.083,
+ "step": 24034
+ },
+ {
+ "epoch": 65.49046321525886,
+ "grad_norm": 3.6313915252685547,
+ "learning_rate": 5.622300060655854e-06,
+ "loss": 0.0614,
+ "step": 24035
+ },
+ {
+ "epoch": 65.49318801089919,
+ "grad_norm": 4.227549076080322,
+ "learning_rate": 5.62150663824963e-06,
+ "loss": 0.1316,
+ "step": 24036
+ },
+ {
+ "epoch": 65.49591280653951,
+ "grad_norm": 2.85221529006958,
+ "learning_rate": 5.620713249942968e-06,
+ "loss": 0.0393,
+ "step": 24037
+ },
+ {
+ "epoch": 65.49863760217984,
+ "grad_norm": 9.981179237365723,
+ "learning_rate": 5.619919895742054e-06,
+ "loss": 0.1113,
+ "step": 24038
+ },
+ {
+ "epoch": 65.50136239782016,
+ "grad_norm": 2.98490309715271,
+ "learning_rate": 5.619126575653058e-06,
+ "loss": 0.0444,
+ "step": 24039
+ },
+ {
+ "epoch": 65.50408719346049,
+ "grad_norm": 3.901944875717163,
+ "learning_rate": 5.618333289682165e-06,
+ "loss": 0.1477,
+ "step": 24040
+ },
+ {
+ "epoch": 65.50681198910081,
+ "grad_norm": 3.7826104164123535,
+ "learning_rate": 5.617540037835553e-06,
+ "loss": 0.115,
+ "step": 24041
+ },
+ {
+ "epoch": 65.50953678474114,
+ "grad_norm": 3.9240939617156982,
+ "learning_rate": 5.616746820119394e-06,
+ "loss": 0.0512,
+ "step": 24042
+ },
+ {
+ "epoch": 65.51226158038148,
+ "grad_norm": 3.282703399658203,
+ "learning_rate": 5.615953636539875e-06,
+ "loss": 0.0468,
+ "step": 24043
+ },
+ {
+ "epoch": 65.5149863760218,
+ "grad_norm": 3.200434446334839,
+ "learning_rate": 5.6151604871031665e-06,
+ "loss": 0.0706,
+ "step": 24044
+ },
+ {
+ "epoch": 65.51771117166213,
+ "grad_norm": 2.988568067550659,
+ "learning_rate": 5.6143673718154466e-06,
+ "loss": 0.1459,
+ "step": 24045
+ },
+ {
+ "epoch": 65.52043596730245,
+ "grad_norm": 3.289043426513672,
+ "learning_rate": 5.6135742906828894e-06,
+ "loss": 0.0495,
+ "step": 24046
+ },
+ {
+ "epoch": 65.52316076294278,
+ "grad_norm": 3.8344788551330566,
+ "learning_rate": 5.612781243711673e-06,
+ "loss": 0.0881,
+ "step": 24047
+ },
+ {
+ "epoch": 65.52588555858311,
+ "grad_norm": 3.664890766143799,
+ "learning_rate": 5.611988230907981e-06,
+ "loss": 0.0843,
+ "step": 24048
+ },
+ {
+ "epoch": 65.52861035422343,
+ "grad_norm": 3.223095417022705,
+ "learning_rate": 5.611195252277983e-06,
+ "loss": 0.0946,
+ "step": 24049
+ },
+ {
+ "epoch": 65.53133514986376,
+ "grad_norm": 3.1708548069000244,
+ "learning_rate": 5.610402307827855e-06,
+ "loss": 0.1086,
+ "step": 24050
+ },
+ {
+ "epoch": 65.53405994550408,
+ "grad_norm": 4.720671653747559,
+ "learning_rate": 5.609609397563768e-06,
+ "loss": 0.1158,
+ "step": 24051
+ },
+ {
+ "epoch": 65.53678474114442,
+ "grad_norm": 3.3979437351226807,
+ "learning_rate": 5.6088165214919064e-06,
+ "loss": 0.1681,
+ "step": 24052
+ },
+ {
+ "epoch": 65.53950953678473,
+ "grad_norm": 2.8669590950012207,
+ "learning_rate": 5.6080236796184395e-06,
+ "loss": 0.0421,
+ "step": 24053
+ },
+ {
+ "epoch": 65.54223433242507,
+ "grad_norm": 3.282972574234009,
+ "learning_rate": 5.607230871949543e-06,
+ "loss": 0.0595,
+ "step": 24054
+ },
+ {
+ "epoch": 65.5449591280654,
+ "grad_norm": 5.365381240844727,
+ "learning_rate": 5.606438098491388e-06,
+ "loss": 0.2275,
+ "step": 24055
+ },
+ {
+ "epoch": 65.54768392370572,
+ "grad_norm": 4.928396224975586,
+ "learning_rate": 5.605645359250155e-06,
+ "loss": 0.3508,
+ "step": 24056
+ },
+ {
+ "epoch": 65.55040871934605,
+ "grad_norm": 2.4006850719451904,
+ "learning_rate": 5.604852654232015e-06,
+ "loss": 0.042,
+ "step": 24057
+ },
+ {
+ "epoch": 65.55313351498637,
+ "grad_norm": 3.378596544265747,
+ "learning_rate": 5.604059983443139e-06,
+ "loss": 0.0603,
+ "step": 24058
+ },
+ {
+ "epoch": 65.5558583106267,
+ "grad_norm": 3.948317527770996,
+ "learning_rate": 5.6032673468897015e-06,
+ "loss": 0.1374,
+ "step": 24059
+ },
+ {
+ "epoch": 65.55858310626704,
+ "grad_norm": 3.6100611686706543,
+ "learning_rate": 5.602474744577879e-06,
+ "loss": 0.1618,
+ "step": 24060
+ },
+ {
+ "epoch": 65.56130790190736,
+ "grad_norm": 3.3356940746307373,
+ "learning_rate": 5.6016821765138405e-06,
+ "loss": 0.1528,
+ "step": 24061
+ },
+ {
+ "epoch": 65.56403269754769,
+ "grad_norm": 3.4731838703155518,
+ "learning_rate": 5.600889642703758e-06,
+ "loss": 0.0455,
+ "step": 24062
+ },
+ {
+ "epoch": 65.566757493188,
+ "grad_norm": 3.523421287536621,
+ "learning_rate": 5.6000971431538045e-06,
+ "loss": 0.063,
+ "step": 24063
+ },
+ {
+ "epoch": 65.56948228882834,
+ "grad_norm": 2.8029582500457764,
+ "learning_rate": 5.599304677870157e-06,
+ "loss": 0.0412,
+ "step": 24064
+ },
+ {
+ "epoch": 65.57220708446866,
+ "grad_norm": 3.948566198348999,
+ "learning_rate": 5.598512246858982e-06,
+ "loss": 0.0912,
+ "step": 24065
+ },
+ {
+ "epoch": 65.57493188010899,
+ "grad_norm": 3.1863033771514893,
+ "learning_rate": 5.5977198501264514e-06,
+ "loss": 0.1724,
+ "step": 24066
+ },
+ {
+ "epoch": 65.57765667574932,
+ "grad_norm": 3.802523374557495,
+ "learning_rate": 5.5969274876787334e-06,
+ "loss": 0.0417,
+ "step": 24067
+ },
+ {
+ "epoch": 65.58038147138964,
+ "grad_norm": 3.8693065643310547,
+ "learning_rate": 5.5961351595220084e-06,
+ "loss": 0.0874,
+ "step": 24068
+ },
+ {
+ "epoch": 65.58310626702998,
+ "grad_norm": 2.525731325149536,
+ "learning_rate": 5.595342865662439e-06,
+ "loss": 0.0332,
+ "step": 24069
+ },
+ {
+ "epoch": 65.5858310626703,
+ "grad_norm": 2.4688730239868164,
+ "learning_rate": 5.594550606106198e-06,
+ "loss": 0.0323,
+ "step": 24070
+ },
+ {
+ "epoch": 65.58855585831063,
+ "grad_norm": 3.272493362426758,
+ "learning_rate": 5.593758380859452e-06,
+ "loss": 0.053,
+ "step": 24071
+ },
+ {
+ "epoch": 65.59128065395096,
+ "grad_norm": 3.4990341663360596,
+ "learning_rate": 5.5929661899283775e-06,
+ "loss": 0.1053,
+ "step": 24072
+ },
+ {
+ "epoch": 65.59400544959128,
+ "grad_norm": 4.865126609802246,
+ "learning_rate": 5.59217403331914e-06,
+ "loss": 0.1447,
+ "step": 24073
+ },
+ {
+ "epoch": 65.59673024523161,
+ "grad_norm": 3.6281673908233643,
+ "learning_rate": 5.5913819110379095e-06,
+ "loss": 0.275,
+ "step": 24074
+ },
+ {
+ "epoch": 65.59945504087193,
+ "grad_norm": 2.552403211593628,
+ "learning_rate": 5.5905898230908506e-06,
+ "loss": 0.0828,
+ "step": 24075
+ },
+ {
+ "epoch": 65.60217983651226,
+ "grad_norm": 3.726198434829712,
+ "learning_rate": 5.5897977694841396e-06,
+ "loss": 0.0527,
+ "step": 24076
+ },
+ {
+ "epoch": 65.60490463215258,
+ "grad_norm": 3.713240623474121,
+ "learning_rate": 5.589005750223944e-06,
+ "loss": 0.0471,
+ "step": 24077
+ },
+ {
+ "epoch": 65.60762942779292,
+ "grad_norm": 3.081360101699829,
+ "learning_rate": 5.588213765316427e-06,
+ "loss": 0.0417,
+ "step": 24078
+ },
+ {
+ "epoch": 65.61035422343325,
+ "grad_norm": 4.682824611663818,
+ "learning_rate": 5.587421814767757e-06,
+ "loss": 0.1321,
+ "step": 24079
+ },
+ {
+ "epoch": 65.61307901907357,
+ "grad_norm": 7.3144402503967285,
+ "learning_rate": 5.586629898584103e-06,
+ "loss": 0.103,
+ "step": 24080
+ },
+ {
+ "epoch": 65.6158038147139,
+ "grad_norm": 3.2913010120391846,
+ "learning_rate": 5.5858380167716375e-06,
+ "loss": 0.1756,
+ "step": 24081
+ },
+ {
+ "epoch": 65.61852861035422,
+ "grad_norm": 3.0218420028686523,
+ "learning_rate": 5.585046169336524e-06,
+ "loss": 0.0964,
+ "step": 24082
+ },
+ {
+ "epoch": 65.62125340599455,
+ "grad_norm": 3.8760106563568115,
+ "learning_rate": 5.584254356284924e-06,
+ "loss": 0.1442,
+ "step": 24083
+ },
+ {
+ "epoch": 65.62397820163488,
+ "grad_norm": 3.4273133277893066,
+ "learning_rate": 5.583462577623013e-06,
+ "loss": 0.056,
+ "step": 24084
+ },
+ {
+ "epoch": 65.6267029972752,
+ "grad_norm": 3.849010705947876,
+ "learning_rate": 5.5826708333569536e-06,
+ "loss": 0.0884,
+ "step": 24085
+ },
+ {
+ "epoch": 65.62942779291554,
+ "grad_norm": 4.020907878875732,
+ "learning_rate": 5.58187912349291e-06,
+ "loss": 0.079,
+ "step": 24086
+ },
+ {
+ "epoch": 65.63215258855585,
+ "grad_norm": 3.489081382751465,
+ "learning_rate": 5.581087448037048e-06,
+ "loss": 0.1209,
+ "step": 24087
+ },
+ {
+ "epoch": 65.63487738419619,
+ "grad_norm": 3.759430170059204,
+ "learning_rate": 5.580295806995538e-06,
+ "loss": 0.1076,
+ "step": 24088
+ },
+ {
+ "epoch": 65.6376021798365,
+ "grad_norm": 5.0124192237854,
+ "learning_rate": 5.5795042003745416e-06,
+ "loss": 0.0612,
+ "step": 24089
+ },
+ {
+ "epoch": 65.64032697547684,
+ "grad_norm": 3.5506246089935303,
+ "learning_rate": 5.578712628180225e-06,
+ "loss": 0.0413,
+ "step": 24090
+ },
+ {
+ "epoch": 65.64305177111717,
+ "grad_norm": 4.744014263153076,
+ "learning_rate": 5.577921090418747e-06,
+ "loss": 0.0588,
+ "step": 24091
+ },
+ {
+ "epoch": 65.64577656675749,
+ "grad_norm": 5.604671478271484,
+ "learning_rate": 5.577129587096282e-06,
+ "loss": 0.148,
+ "step": 24092
+ },
+ {
+ "epoch": 65.64850136239782,
+ "grad_norm": 3.916191816329956,
+ "learning_rate": 5.576338118218989e-06,
+ "loss": 0.1333,
+ "step": 24093
+ },
+ {
+ "epoch": 65.65122615803814,
+ "grad_norm": 3.4078290462493896,
+ "learning_rate": 5.575546683793034e-06,
+ "loss": 0.1086,
+ "step": 24094
+ },
+ {
+ "epoch": 65.65395095367847,
+ "grad_norm": 3.0936272144317627,
+ "learning_rate": 5.574755283824573e-06,
+ "loss": 0.3191,
+ "step": 24095
+ },
+ {
+ "epoch": 65.65667574931881,
+ "grad_norm": 3.2433664798736572,
+ "learning_rate": 5.5739639183197805e-06,
+ "loss": 0.0491,
+ "step": 24096
+ },
+ {
+ "epoch": 65.65940054495913,
+ "grad_norm": 3.436826705932617,
+ "learning_rate": 5.57317258728481e-06,
+ "loss": 0.0872,
+ "step": 24097
+ },
+ {
+ "epoch": 65.66212534059946,
+ "grad_norm": 3.36426043510437,
+ "learning_rate": 5.572381290725833e-06,
+ "loss": 0.0732,
+ "step": 24098
+ },
+ {
+ "epoch": 65.66485013623978,
+ "grad_norm": 3.7712724208831787,
+ "learning_rate": 5.571590028649008e-06,
+ "loss": 0.0706,
+ "step": 24099
+ },
+ {
+ "epoch": 65.66757493188011,
+ "grad_norm": 2.650465726852417,
+ "learning_rate": 5.570798801060493e-06,
+ "loss": 0.0863,
+ "step": 24100
+ },
+ {
+ "epoch": 65.67029972752043,
+ "grad_norm": 3.8432295322418213,
+ "learning_rate": 5.570007607966459e-06,
+ "loss": 0.1962,
+ "step": 24101
+ },
+ {
+ "epoch": 65.67302452316076,
+ "grad_norm": 3.3361594676971436,
+ "learning_rate": 5.569216449373063e-06,
+ "loss": 0.0664,
+ "step": 24102
+ },
+ {
+ "epoch": 65.6757493188011,
+ "grad_norm": 2.96706485748291,
+ "learning_rate": 5.568425325286466e-06,
+ "loss": 0.0439,
+ "step": 24103
+ },
+ {
+ "epoch": 65.67847411444141,
+ "grad_norm": 4.701183795928955,
+ "learning_rate": 5.567634235712827e-06,
+ "loss": 0.0799,
+ "step": 24104
+ },
+ {
+ "epoch": 65.68119891008175,
+ "grad_norm": 2.7475826740264893,
+ "learning_rate": 5.566843180658313e-06,
+ "loss": 0.0347,
+ "step": 24105
+ },
+ {
+ "epoch": 65.68392370572207,
+ "grad_norm": 3.762141227722168,
+ "learning_rate": 5.566052160129083e-06,
+ "loss": 0.0479,
+ "step": 24106
+ },
+ {
+ "epoch": 65.6866485013624,
+ "grad_norm": 4.1154465675354,
+ "learning_rate": 5.565261174131291e-06,
+ "loss": 0.084,
+ "step": 24107
+ },
+ {
+ "epoch": 65.68937329700273,
+ "grad_norm": 2.481872320175171,
+ "learning_rate": 5.5644702226711055e-06,
+ "loss": 0.0817,
+ "step": 24108
+ },
+ {
+ "epoch": 65.69209809264305,
+ "grad_norm": 4.318648338317871,
+ "learning_rate": 5.563679305754685e-06,
+ "loss": 0.1184,
+ "step": 24109
+ },
+ {
+ "epoch": 65.69482288828338,
+ "grad_norm": 4.170182704925537,
+ "learning_rate": 5.5628884233881865e-06,
+ "loss": 0.1345,
+ "step": 24110
+ },
+ {
+ "epoch": 65.6975476839237,
+ "grad_norm": 3.049823522567749,
+ "learning_rate": 5.562097575577765e-06,
+ "loss": 0.0576,
+ "step": 24111
+ },
+ {
+ "epoch": 65.70027247956403,
+ "grad_norm": 3.304457664489746,
+ "learning_rate": 5.56130676232959e-06,
+ "loss": 0.1247,
+ "step": 24112
+ },
+ {
+ "epoch": 65.70299727520435,
+ "grad_norm": 2.9516074657440186,
+ "learning_rate": 5.5605159836498145e-06,
+ "loss": 0.0471,
+ "step": 24113
+ },
+ {
+ "epoch": 65.70572207084469,
+ "grad_norm": 2.629530906677246,
+ "learning_rate": 5.559725239544595e-06,
+ "loss": 0.0428,
+ "step": 24114
+ },
+ {
+ "epoch": 65.70844686648502,
+ "grad_norm": 3.6818525791168213,
+ "learning_rate": 5.558934530020095e-06,
+ "loss": 0.08,
+ "step": 24115
+ },
+ {
+ "epoch": 65.71117166212534,
+ "grad_norm": 6.104763507843018,
+ "learning_rate": 5.558143855082466e-06,
+ "loss": 0.1501,
+ "step": 24116
+ },
+ {
+ "epoch": 65.71389645776567,
+ "grad_norm": 3.2225263118743896,
+ "learning_rate": 5.557353214737875e-06,
+ "loss": 0.0893,
+ "step": 24117
+ },
+ {
+ "epoch": 65.71662125340599,
+ "grad_norm": 6.144196510314941,
+ "learning_rate": 5.556562608992473e-06,
+ "loss": 0.2236,
+ "step": 24118
+ },
+ {
+ "epoch": 65.71934604904632,
+ "grad_norm": 2.8399598598480225,
+ "learning_rate": 5.555772037852418e-06,
+ "loss": 0.0458,
+ "step": 24119
+ },
+ {
+ "epoch": 65.72207084468666,
+ "grad_norm": 3.0409440994262695,
+ "learning_rate": 5.554981501323864e-06,
+ "loss": 0.0571,
+ "step": 24120
+ },
+ {
+ "epoch": 65.72479564032697,
+ "grad_norm": 3.4222543239593506,
+ "learning_rate": 5.554190999412975e-06,
+ "loss": 0.0918,
+ "step": 24121
+ },
+ {
+ "epoch": 65.7275204359673,
+ "grad_norm": 3.6440134048461914,
+ "learning_rate": 5.553400532125903e-06,
+ "loss": 0.1618,
+ "step": 24122
+ },
+ {
+ "epoch": 65.73024523160763,
+ "grad_norm": 4.814828872680664,
+ "learning_rate": 5.552610099468805e-06,
+ "loss": 0.1118,
+ "step": 24123
+ },
+ {
+ "epoch": 65.73297002724796,
+ "grad_norm": 3.9907937049865723,
+ "learning_rate": 5.551819701447832e-06,
+ "loss": 0.1719,
+ "step": 24124
+ },
+ {
+ "epoch": 65.73569482288828,
+ "grad_norm": 3.5386910438537598,
+ "learning_rate": 5.5510293380691494e-06,
+ "loss": 0.1005,
+ "step": 24125
+ },
+ {
+ "epoch": 65.73841961852861,
+ "grad_norm": 3.8201828002929688,
+ "learning_rate": 5.550239009338905e-06,
+ "loss": 0.0532,
+ "step": 24126
+ },
+ {
+ "epoch": 65.74114441416894,
+ "grad_norm": 3.731848955154419,
+ "learning_rate": 5.549448715263252e-06,
+ "loss": 0.1585,
+ "step": 24127
+ },
+ {
+ "epoch": 65.74386920980926,
+ "grad_norm": 4.082111358642578,
+ "learning_rate": 5.548658455848355e-06,
+ "loss": 0.1388,
+ "step": 24128
+ },
+ {
+ "epoch": 65.7465940054496,
+ "grad_norm": 2.539555072784424,
+ "learning_rate": 5.547868231100362e-06,
+ "loss": 0.1853,
+ "step": 24129
+ },
+ {
+ "epoch": 65.74931880108991,
+ "grad_norm": 2.4366369247436523,
+ "learning_rate": 5.547078041025429e-06,
+ "loss": 0.0285,
+ "step": 24130
+ },
+ {
+ "epoch": 65.75204359673025,
+ "grad_norm": 8.254321098327637,
+ "learning_rate": 5.546287885629702e-06,
+ "loss": 0.0883,
+ "step": 24131
+ },
+ {
+ "epoch": 65.75476839237058,
+ "grad_norm": 3.6452460289001465,
+ "learning_rate": 5.545497764919345e-06,
+ "loss": 0.0628,
+ "step": 24132
+ },
+ {
+ "epoch": 65.7574931880109,
+ "grad_norm": 4.926702976226807,
+ "learning_rate": 5.544707678900509e-06,
+ "loss": 0.0799,
+ "step": 24133
+ },
+ {
+ "epoch": 65.76021798365123,
+ "grad_norm": 5.784377098083496,
+ "learning_rate": 5.543917627579347e-06,
+ "loss": 0.2102,
+ "step": 24134
+ },
+ {
+ "epoch": 65.76294277929155,
+ "grad_norm": 3.480914831161499,
+ "learning_rate": 5.543127610962012e-06,
+ "loss": 0.0499,
+ "step": 24135
+ },
+ {
+ "epoch": 65.76566757493188,
+ "grad_norm": 3.3300530910491943,
+ "learning_rate": 5.5423376290546526e-06,
+ "loss": 0.0835,
+ "step": 24136
+ },
+ {
+ "epoch": 65.7683923705722,
+ "grad_norm": 2.075978994369507,
+ "learning_rate": 5.541547681863426e-06,
+ "loss": 0.0348,
+ "step": 24137
+ },
+ {
+ "epoch": 65.77111716621253,
+ "grad_norm": 3.2094852924346924,
+ "learning_rate": 5.5407577693944835e-06,
+ "loss": 0.1015,
+ "step": 24138
+ },
+ {
+ "epoch": 65.77384196185287,
+ "grad_norm": 2.8756561279296875,
+ "learning_rate": 5.539967891653976e-06,
+ "loss": 0.0686,
+ "step": 24139
+ },
+ {
+ "epoch": 65.77656675749319,
+ "grad_norm": 2.7848398685455322,
+ "learning_rate": 5.539178048648051e-06,
+ "loss": 0.086,
+ "step": 24140
+ },
+ {
+ "epoch": 65.77929155313352,
+ "grad_norm": 4.2184014320373535,
+ "learning_rate": 5.538388240382868e-06,
+ "loss": 0.0904,
+ "step": 24141
+ },
+ {
+ "epoch": 65.78201634877384,
+ "grad_norm": 3.6957924365997314,
+ "learning_rate": 5.537598466864574e-06,
+ "loss": 0.1328,
+ "step": 24142
+ },
+ {
+ "epoch": 65.78474114441417,
+ "grad_norm": 3.270751714706421,
+ "learning_rate": 5.536808728099318e-06,
+ "loss": 0.0708,
+ "step": 24143
+ },
+ {
+ "epoch": 65.7874659400545,
+ "grad_norm": 3.877631425857544,
+ "learning_rate": 5.536019024093251e-06,
+ "loss": 0.0816,
+ "step": 24144
+ },
+ {
+ "epoch": 65.79019073569482,
+ "grad_norm": 2.9125187397003174,
+ "learning_rate": 5.535229354852525e-06,
+ "loss": 0.0552,
+ "step": 24145
+ },
+ {
+ "epoch": 65.79291553133515,
+ "grad_norm": 3.9231040477752686,
+ "learning_rate": 5.534439720383291e-06,
+ "loss": 0.1446,
+ "step": 24146
+ },
+ {
+ "epoch": 65.79564032697547,
+ "grad_norm": 5.722751617431641,
+ "learning_rate": 5.533650120691696e-06,
+ "loss": 0.0868,
+ "step": 24147
+ },
+ {
+ "epoch": 65.7983651226158,
+ "grad_norm": 4.944255352020264,
+ "learning_rate": 5.532860555783885e-06,
+ "loss": 0.0679,
+ "step": 24148
+ },
+ {
+ "epoch": 65.80108991825612,
+ "grad_norm": 2.7896859645843506,
+ "learning_rate": 5.5320710256660146e-06,
+ "loss": 0.0466,
+ "step": 24149
+ },
+ {
+ "epoch": 65.80381471389646,
+ "grad_norm": 4.166999816894531,
+ "learning_rate": 5.531281530344235e-06,
+ "loss": 0.0665,
+ "step": 24150
+ },
+ {
+ "epoch": 65.80653950953679,
+ "grad_norm": 3.6034128665924072,
+ "learning_rate": 5.530492069824689e-06,
+ "loss": 0.1082,
+ "step": 24151
+ },
+ {
+ "epoch": 65.80926430517711,
+ "grad_norm": 3.5304007530212402,
+ "learning_rate": 5.529702644113524e-06,
+ "loss": 0.1821,
+ "step": 24152
+ },
+ {
+ "epoch": 65.81198910081744,
+ "grad_norm": 3.4963839054107666,
+ "learning_rate": 5.528913253216896e-06,
+ "loss": 0.0515,
+ "step": 24153
+ },
+ {
+ "epoch": 65.81471389645776,
+ "grad_norm": 3.477022409439087,
+ "learning_rate": 5.528123897140946e-06,
+ "loss": 0.1316,
+ "step": 24154
+ },
+ {
+ "epoch": 65.8174386920981,
+ "grad_norm": 5.340469837188721,
+ "learning_rate": 5.5273345758918225e-06,
+ "loss": 0.214,
+ "step": 24155
+ },
+ {
+ "epoch": 65.82016348773843,
+ "grad_norm": 3.8314285278320312,
+ "learning_rate": 5.526545289475671e-06,
+ "loss": 0.1361,
+ "step": 24156
+ },
+ {
+ "epoch": 65.82288828337875,
+ "grad_norm": 4.120553970336914,
+ "learning_rate": 5.525756037898645e-06,
+ "loss": 0.1485,
+ "step": 24157
+ },
+ {
+ "epoch": 65.82561307901908,
+ "grad_norm": 3.0257270336151123,
+ "learning_rate": 5.524966821166886e-06,
+ "loss": 0.1318,
+ "step": 24158
+ },
+ {
+ "epoch": 65.8283378746594,
+ "grad_norm": 4.530957221984863,
+ "learning_rate": 5.524177639286543e-06,
+ "loss": 0.1526,
+ "step": 24159
+ },
+ {
+ "epoch": 65.83106267029973,
+ "grad_norm": 3.710131883621216,
+ "learning_rate": 5.523388492263755e-06,
+ "loss": 0.0539,
+ "step": 24160
+ },
+ {
+ "epoch": 65.83378746594005,
+ "grad_norm": 5.359655857086182,
+ "learning_rate": 5.522599380104677e-06,
+ "loss": 0.0565,
+ "step": 24161
+ },
+ {
+ "epoch": 65.83651226158038,
+ "grad_norm": 4.823092937469482,
+ "learning_rate": 5.521810302815453e-06,
+ "loss": 0.0942,
+ "step": 24162
+ },
+ {
+ "epoch": 65.83923705722071,
+ "grad_norm": 4.227487564086914,
+ "learning_rate": 5.521021260402224e-06,
+ "loss": 0.0418,
+ "step": 24163
+ },
+ {
+ "epoch": 65.84196185286103,
+ "grad_norm": 2.779810905456543,
+ "learning_rate": 5.520232252871134e-06,
+ "loss": 0.0756,
+ "step": 24164
+ },
+ {
+ "epoch": 65.84468664850137,
+ "grad_norm": 3.6005938053131104,
+ "learning_rate": 5.519443280228335e-06,
+ "loss": 0.0895,
+ "step": 24165
+ },
+ {
+ "epoch": 65.84741144414168,
+ "grad_norm": 2.7258284091949463,
+ "learning_rate": 5.5186543424799636e-06,
+ "loss": 0.152,
+ "step": 24166
+ },
+ {
+ "epoch": 65.85013623978202,
+ "grad_norm": 4.038546562194824,
+ "learning_rate": 5.517865439632173e-06,
+ "loss": 0.1054,
+ "step": 24167
+ },
+ {
+ "epoch": 65.85286103542235,
+ "grad_norm": 2.302922248840332,
+ "learning_rate": 5.517076571691096e-06,
+ "loss": 0.08,
+ "step": 24168
+ },
+ {
+ "epoch": 65.85558583106267,
+ "grad_norm": 3.5228846073150635,
+ "learning_rate": 5.516287738662887e-06,
+ "loss": 0.0398,
+ "step": 24169
+ },
+ {
+ "epoch": 65.858310626703,
+ "grad_norm": 2.2264459133148193,
+ "learning_rate": 5.515498940553685e-06,
+ "loss": 0.0675,
+ "step": 24170
+ },
+ {
+ "epoch": 65.86103542234332,
+ "grad_norm": 3.608992576599121,
+ "learning_rate": 5.514710177369634e-06,
+ "loss": 0.0973,
+ "step": 24171
+ },
+ {
+ "epoch": 65.86376021798365,
+ "grad_norm": 2.6364173889160156,
+ "learning_rate": 5.513921449116871e-06,
+ "loss": 0.0377,
+ "step": 24172
+ },
+ {
+ "epoch": 65.86648501362397,
+ "grad_norm": 3.437800645828247,
+ "learning_rate": 5.5131327558015466e-06,
+ "loss": 0.0947,
+ "step": 24173
+ },
+ {
+ "epoch": 65.8692098092643,
+ "grad_norm": 3.5913867950439453,
+ "learning_rate": 5.512344097429801e-06,
+ "loss": 0.1357,
+ "step": 24174
+ },
+ {
+ "epoch": 65.87193460490464,
+ "grad_norm": 6.768052577972412,
+ "learning_rate": 5.511555474007775e-06,
+ "loss": 0.1138,
+ "step": 24175
+ },
+ {
+ "epoch": 65.87465940054496,
+ "grad_norm": 3.4739911556243896,
+ "learning_rate": 5.510766885541606e-06,
+ "loss": 0.0492,
+ "step": 24176
+ },
+ {
+ "epoch": 65.87738419618529,
+ "grad_norm": 4.011838912963867,
+ "learning_rate": 5.509978332037444e-06,
+ "loss": 0.1477,
+ "step": 24177
+ },
+ {
+ "epoch": 65.88010899182561,
+ "grad_norm": 4.0436692237854,
+ "learning_rate": 5.509189813501427e-06,
+ "loss": 0.0764,
+ "step": 24178
+ },
+ {
+ "epoch": 65.88283378746594,
+ "grad_norm": 3.490626335144043,
+ "learning_rate": 5.508401329939695e-06,
+ "loss": 0.0556,
+ "step": 24179
+ },
+ {
+ "epoch": 65.88555858310627,
+ "grad_norm": 4.4941487312316895,
+ "learning_rate": 5.507612881358384e-06,
+ "loss": 0.2727,
+ "step": 24180
+ },
+ {
+ "epoch": 65.88828337874659,
+ "grad_norm": 7.636957168579102,
+ "learning_rate": 5.506824467763645e-06,
+ "loss": 0.0851,
+ "step": 24181
+ },
+ {
+ "epoch": 65.89100817438693,
+ "grad_norm": 3.2159922122955322,
+ "learning_rate": 5.506036089161611e-06,
+ "loss": 0.0683,
+ "step": 24182
+ },
+ {
+ "epoch": 65.89373297002724,
+ "grad_norm": 3.8589589595794678,
+ "learning_rate": 5.505247745558419e-06,
+ "loss": 0.0811,
+ "step": 24183
+ },
+ {
+ "epoch": 65.89645776566758,
+ "grad_norm": 3.433084726333618,
+ "learning_rate": 5.504459436960218e-06,
+ "loss": 0.0632,
+ "step": 24184
+ },
+ {
+ "epoch": 65.8991825613079,
+ "grad_norm": 3.2560300827026367,
+ "learning_rate": 5.5036711633731375e-06,
+ "loss": 0.06,
+ "step": 24185
+ },
+ {
+ "epoch": 65.90190735694823,
+ "grad_norm": 3.7079596519470215,
+ "learning_rate": 5.502882924803326e-06,
+ "loss": 0.0864,
+ "step": 24186
+ },
+ {
+ "epoch": 65.90463215258856,
+ "grad_norm": 3.2791967391967773,
+ "learning_rate": 5.502094721256916e-06,
+ "loss": 0.0716,
+ "step": 24187
+ },
+ {
+ "epoch": 65.90735694822888,
+ "grad_norm": 3.8873748779296875,
+ "learning_rate": 5.501306552740049e-06,
+ "loss": 0.0429,
+ "step": 24188
+ },
+ {
+ "epoch": 65.91008174386921,
+ "grad_norm": 3.6260781288146973,
+ "learning_rate": 5.500518419258858e-06,
+ "loss": 0.1358,
+ "step": 24189
+ },
+ {
+ "epoch": 65.91280653950953,
+ "grad_norm": 3.118328332901001,
+ "learning_rate": 5.499730320819487e-06,
+ "loss": 0.0476,
+ "step": 24190
+ },
+ {
+ "epoch": 65.91553133514986,
+ "grad_norm": 2.7150537967681885,
+ "learning_rate": 5.498942257428073e-06,
+ "loss": 0.0793,
+ "step": 24191
+ },
+ {
+ "epoch": 65.9182561307902,
+ "grad_norm": 3.9062442779541016,
+ "learning_rate": 5.498154229090748e-06,
+ "loss": 0.0791,
+ "step": 24192
+ },
+ {
+ "epoch": 65.92098092643052,
+ "grad_norm": 3.698467493057251,
+ "learning_rate": 5.497366235813656e-06,
+ "loss": 0.1608,
+ "step": 24193
+ },
+ {
+ "epoch": 65.92370572207085,
+ "grad_norm": 4.635098457336426,
+ "learning_rate": 5.496578277602931e-06,
+ "loss": 0.0595,
+ "step": 24194
+ },
+ {
+ "epoch": 65.92643051771117,
+ "grad_norm": 3.7649402618408203,
+ "learning_rate": 5.49579035446471e-06,
+ "loss": 0.1043,
+ "step": 24195
+ },
+ {
+ "epoch": 65.9291553133515,
+ "grad_norm": 2.6555700302124023,
+ "learning_rate": 5.495002466405124e-06,
+ "loss": 0.0343,
+ "step": 24196
+ },
+ {
+ "epoch": 65.93188010899182,
+ "grad_norm": 4.743636131286621,
+ "learning_rate": 5.4942146134303175e-06,
+ "loss": 0.0989,
+ "step": 24197
+ },
+ {
+ "epoch": 65.93460490463215,
+ "grad_norm": 2.9609110355377197,
+ "learning_rate": 5.493426795546424e-06,
+ "loss": 0.1368,
+ "step": 24198
+ },
+ {
+ "epoch": 65.93732970027249,
+ "grad_norm": 2.9740395545959473,
+ "learning_rate": 5.492639012759576e-06,
+ "loss": 0.1373,
+ "step": 24199
+ },
+ {
+ "epoch": 65.9400544959128,
+ "grad_norm": 4.133841514587402,
+ "learning_rate": 5.491851265075907e-06,
+ "loss": 0.0728,
+ "step": 24200
+ },
+ {
+ "epoch": 65.94277929155314,
+ "grad_norm": 3.930466651916504,
+ "learning_rate": 5.491063552501557e-06,
+ "loss": 0.1177,
+ "step": 24201
+ },
+ {
+ "epoch": 65.94550408719346,
+ "grad_norm": 3.093852996826172,
+ "learning_rate": 5.4902758750426596e-06,
+ "loss": 0.1674,
+ "step": 24202
+ },
+ {
+ "epoch": 65.94822888283379,
+ "grad_norm": 9.726191520690918,
+ "learning_rate": 5.489488232705351e-06,
+ "loss": 0.0435,
+ "step": 24203
+ },
+ {
+ "epoch": 65.95095367847412,
+ "grad_norm": 3.5312047004699707,
+ "learning_rate": 5.488700625495762e-06,
+ "loss": 0.1013,
+ "step": 24204
+ },
+ {
+ "epoch": 65.95367847411444,
+ "grad_norm": 3.8236422538757324,
+ "learning_rate": 5.487913053420023e-06,
+ "loss": 0.0735,
+ "step": 24205
+ },
+ {
+ "epoch": 65.95640326975477,
+ "grad_norm": 4.338160037994385,
+ "learning_rate": 5.487125516484276e-06,
+ "loss": 0.1414,
+ "step": 24206
+ },
+ {
+ "epoch": 65.95912806539509,
+ "grad_norm": 2.083596706390381,
+ "learning_rate": 5.486338014694651e-06,
+ "loss": 0.0296,
+ "step": 24207
+ },
+ {
+ "epoch": 65.96185286103542,
+ "grad_norm": 2.7186203002929688,
+ "learning_rate": 5.485550548057279e-06,
+ "loss": 0.0425,
+ "step": 24208
+ },
+ {
+ "epoch": 65.96457765667574,
+ "grad_norm": 4.528669834136963,
+ "learning_rate": 5.4847631165782914e-06,
+ "loss": 0.0521,
+ "step": 24209
+ },
+ {
+ "epoch": 65.96730245231608,
+ "grad_norm": 2.236259698867798,
+ "learning_rate": 5.483975720263827e-06,
+ "loss": 0.0689,
+ "step": 24210
+ },
+ {
+ "epoch": 65.97002724795641,
+ "grad_norm": 5.090316295623779,
+ "learning_rate": 5.4831883591200145e-06,
+ "loss": 0.1475,
+ "step": 24211
+ },
+ {
+ "epoch": 65.97275204359673,
+ "grad_norm": 3.0475664138793945,
+ "learning_rate": 5.482401033152984e-06,
+ "loss": 0.1759,
+ "step": 24212
+ },
+ {
+ "epoch": 65.97547683923706,
+ "grad_norm": 5.212029457092285,
+ "learning_rate": 5.481613742368868e-06,
+ "loss": 0.2215,
+ "step": 24213
+ },
+ {
+ "epoch": 65.97820163487738,
+ "grad_norm": 3.1095752716064453,
+ "learning_rate": 5.4808264867738e-06,
+ "loss": 0.0509,
+ "step": 24214
+ },
+ {
+ "epoch": 65.98092643051771,
+ "grad_norm": 3.6840479373931885,
+ "learning_rate": 5.480039266373911e-06,
+ "loss": 0.0353,
+ "step": 24215
+ },
+ {
+ "epoch": 65.98365122615803,
+ "grad_norm": 2.972705841064453,
+ "learning_rate": 5.479252081175326e-06,
+ "loss": 0.1874,
+ "step": 24216
+ },
+ {
+ "epoch": 65.98637602179836,
+ "grad_norm": 3.9125068187713623,
+ "learning_rate": 5.478464931184186e-06,
+ "loss": 0.0907,
+ "step": 24217
+ },
+ {
+ "epoch": 65.9891008174387,
+ "grad_norm": 3.8430469036102295,
+ "learning_rate": 5.477677816406611e-06,
+ "loss": 0.1185,
+ "step": 24218
+ },
+ {
+ "epoch": 65.99182561307902,
+ "grad_norm": 13.997435569763184,
+ "learning_rate": 5.4768907368487375e-06,
+ "loss": 0.0862,
+ "step": 24219
+ },
+ {
+ "epoch": 65.99455040871935,
+ "grad_norm": 5.113949775695801,
+ "learning_rate": 5.4761036925166946e-06,
+ "loss": 0.1009,
+ "step": 24220
+ },
+ {
+ "epoch": 65.99727520435967,
+ "grad_norm": 2.952927589416504,
+ "learning_rate": 5.475316683416607e-06,
+ "loss": 0.0448,
+ "step": 24221
+ },
+ {
+ "epoch": 66.0,
+ "grad_norm": 2.908334493637085,
+ "learning_rate": 5.4745297095546125e-06,
+ "loss": 0.1382,
+ "step": 24222
+ },
+ {
+ "epoch": 66.00272479564033,
+ "grad_norm": 4.744135856628418,
+ "learning_rate": 5.4737427709368326e-06,
+ "loss": 0.067,
+ "step": 24223
+ },
+ {
+ "epoch": 66.00544959128065,
+ "grad_norm": 3.928037166595459,
+ "learning_rate": 5.472955867569399e-06,
+ "loss": 0.0739,
+ "step": 24224
+ },
+ {
+ "epoch": 66.00817438692098,
+ "grad_norm": 4.2218427658081055,
+ "learning_rate": 5.472168999458436e-06,
+ "loss": 0.1286,
+ "step": 24225
+ },
+ {
+ "epoch": 66.0108991825613,
+ "grad_norm": 3.494382381439209,
+ "learning_rate": 5.4713821666100794e-06,
+ "loss": 0.0475,
+ "step": 24226
+ },
+ {
+ "epoch": 66.01362397820164,
+ "grad_norm": 3.000708818435669,
+ "learning_rate": 5.470595369030453e-06,
+ "loss": 0.0377,
+ "step": 24227
+ },
+ {
+ "epoch": 66.01634877384195,
+ "grad_norm": 3.6476948261260986,
+ "learning_rate": 5.4698086067256826e-06,
+ "loss": 0.0524,
+ "step": 24228
+ },
+ {
+ "epoch": 66.01907356948229,
+ "grad_norm": 3.2138516902923584,
+ "learning_rate": 5.469021879701895e-06,
+ "loss": 0.1095,
+ "step": 24229
+ },
+ {
+ "epoch": 66.02179836512262,
+ "grad_norm": 2.9181294441223145,
+ "learning_rate": 5.468235187965221e-06,
+ "loss": 0.0985,
+ "step": 24230
+ },
+ {
+ "epoch": 66.02452316076294,
+ "grad_norm": 2.7947864532470703,
+ "learning_rate": 5.467448531521786e-06,
+ "loss": 0.1065,
+ "step": 24231
+ },
+ {
+ "epoch": 66.02724795640327,
+ "grad_norm": 3.4363908767700195,
+ "learning_rate": 5.466661910377717e-06,
+ "loss": 0.0713,
+ "step": 24232
+ },
+ {
+ "epoch": 66.02997275204359,
+ "grad_norm": 5.255629539489746,
+ "learning_rate": 5.465875324539134e-06,
+ "loss": 0.2178,
+ "step": 24233
+ },
+ {
+ "epoch": 66.03269754768392,
+ "grad_norm": 2.9164540767669678,
+ "learning_rate": 5.465088774012172e-06,
+ "loss": 0.0578,
+ "step": 24234
+ },
+ {
+ "epoch": 66.03542234332426,
+ "grad_norm": 2.8132989406585693,
+ "learning_rate": 5.464302258802949e-06,
+ "loss": 0.0379,
+ "step": 24235
+ },
+ {
+ "epoch": 66.03814713896458,
+ "grad_norm": 3.0949575901031494,
+ "learning_rate": 5.463515778917598e-06,
+ "loss": 0.0759,
+ "step": 24236
+ },
+ {
+ "epoch": 66.04087193460491,
+ "grad_norm": 4.194434642791748,
+ "learning_rate": 5.462729334362238e-06,
+ "loss": 0.1513,
+ "step": 24237
+ },
+ {
+ "epoch": 66.04359673024523,
+ "grad_norm": 7.156740188598633,
+ "learning_rate": 5.461942925142998e-06,
+ "loss": 0.1032,
+ "step": 24238
+ },
+ {
+ "epoch": 66.04632152588556,
+ "grad_norm": 3.326951742172241,
+ "learning_rate": 5.4611565512660005e-06,
+ "loss": 0.0777,
+ "step": 24239
+ },
+ {
+ "epoch": 66.04904632152588,
+ "grad_norm": 4.344686508178711,
+ "learning_rate": 5.46037021273737e-06,
+ "loss": 0.0969,
+ "step": 24240
+ },
+ {
+ "epoch": 66.05177111716621,
+ "grad_norm": 3.5357677936553955,
+ "learning_rate": 5.459583909563226e-06,
+ "loss": 0.0591,
+ "step": 24241
+ },
+ {
+ "epoch": 66.05449591280654,
+ "grad_norm": 5.435465335845947,
+ "learning_rate": 5.4587976417497e-06,
+ "loss": 0.182,
+ "step": 24242
+ },
+ {
+ "epoch": 66.05722070844686,
+ "grad_norm": 2.5353848934173584,
+ "learning_rate": 5.458011409302913e-06,
+ "loss": 0.0453,
+ "step": 24243
+ },
+ {
+ "epoch": 66.0599455040872,
+ "grad_norm": 4.735696315765381,
+ "learning_rate": 5.457225212228987e-06,
+ "loss": 0.0537,
+ "step": 24244
+ },
+ {
+ "epoch": 66.06267029972751,
+ "grad_norm": 3.0745997428894043,
+ "learning_rate": 5.456439050534039e-06,
+ "loss": 0.0733,
+ "step": 24245
+ },
+ {
+ "epoch": 66.06539509536785,
+ "grad_norm": 3.17090106010437,
+ "learning_rate": 5.455652924224203e-06,
+ "loss": 0.1197,
+ "step": 24246
+ },
+ {
+ "epoch": 66.06811989100818,
+ "grad_norm": 3.086277961730957,
+ "learning_rate": 5.4548668333055954e-06,
+ "loss": 0.0427,
+ "step": 24247
+ },
+ {
+ "epoch": 66.0708446866485,
+ "grad_norm": 3.164388418197632,
+ "learning_rate": 5.454080777784338e-06,
+ "loss": 0.1118,
+ "step": 24248
+ },
+ {
+ "epoch": 66.07356948228883,
+ "grad_norm": 3.5116429328918457,
+ "learning_rate": 5.453294757666549e-06,
+ "loss": 0.0553,
+ "step": 24249
+ },
+ {
+ "epoch": 66.07629427792915,
+ "grad_norm": 2.788637638092041,
+ "learning_rate": 5.45250877295836e-06,
+ "loss": 0.0515,
+ "step": 24250
+ },
+ {
+ "epoch": 66.07901907356948,
+ "grad_norm": 2.9801645278930664,
+ "learning_rate": 5.451722823665885e-06,
+ "loss": 0.1824,
+ "step": 24251
+ },
+ {
+ "epoch": 66.0817438692098,
+ "grad_norm": 2.963919162750244,
+ "learning_rate": 5.4509369097952425e-06,
+ "loss": 0.111,
+ "step": 24252
+ },
+ {
+ "epoch": 66.08446866485014,
+ "grad_norm": 3.0374701023101807,
+ "learning_rate": 5.45015103135256e-06,
+ "loss": 0.0937,
+ "step": 24253
+ },
+ {
+ "epoch": 66.08719346049047,
+ "grad_norm": 3.2187795639038086,
+ "learning_rate": 5.449365188343952e-06,
+ "loss": 0.1229,
+ "step": 24254
+ },
+ {
+ "epoch": 66.08991825613079,
+ "grad_norm": 2.594090461730957,
+ "learning_rate": 5.448579380775545e-06,
+ "loss": 0.0431,
+ "step": 24255
+ },
+ {
+ "epoch": 66.09264305177112,
+ "grad_norm": 4.707623481750488,
+ "learning_rate": 5.447793608653456e-06,
+ "loss": 0.049,
+ "step": 24256
+ },
+ {
+ "epoch": 66.09536784741144,
+ "grad_norm": 3.289013385772705,
+ "learning_rate": 5.447007871983799e-06,
+ "loss": 0.0673,
+ "step": 24257
+ },
+ {
+ "epoch": 66.09809264305177,
+ "grad_norm": 3.820110321044922,
+ "learning_rate": 5.446222170772703e-06,
+ "loss": 0.053,
+ "step": 24258
+ },
+ {
+ "epoch": 66.1008174386921,
+ "grad_norm": 2.688070774078369,
+ "learning_rate": 5.44543650502628e-06,
+ "loss": 0.0321,
+ "step": 24259
+ },
+ {
+ "epoch": 66.10354223433242,
+ "grad_norm": 3.359084129333496,
+ "learning_rate": 5.444650874750654e-06,
+ "loss": 0.1136,
+ "step": 24260
+ },
+ {
+ "epoch": 66.10626702997276,
+ "grad_norm": 2.812195062637329,
+ "learning_rate": 5.443865279951934e-06,
+ "loss": 0.0778,
+ "step": 24261
+ },
+ {
+ "epoch": 66.10899182561307,
+ "grad_norm": 2.4813084602355957,
+ "learning_rate": 5.443079720636251e-06,
+ "loss": 0.1395,
+ "step": 24262
+ },
+ {
+ "epoch": 66.11171662125341,
+ "grad_norm": 4.899084568023682,
+ "learning_rate": 5.4422941968097145e-06,
+ "loss": 0.0998,
+ "step": 24263
+ },
+ {
+ "epoch": 66.11444141689373,
+ "grad_norm": 2.6284587383270264,
+ "learning_rate": 5.441508708478444e-06,
+ "loss": 0.1984,
+ "step": 24264
+ },
+ {
+ "epoch": 66.11716621253406,
+ "grad_norm": 3.3272786140441895,
+ "learning_rate": 5.440723255648553e-06,
+ "loss": 0.0589,
+ "step": 24265
+ },
+ {
+ "epoch": 66.11989100817439,
+ "grad_norm": 2.6776010990142822,
+ "learning_rate": 5.439937838326168e-06,
+ "loss": 0.0539,
+ "step": 24266
+ },
+ {
+ "epoch": 66.12261580381471,
+ "grad_norm": 2.8808488845825195,
+ "learning_rate": 5.439152456517398e-06,
+ "loss": 0.083,
+ "step": 24267
+ },
+ {
+ "epoch": 66.12534059945504,
+ "grad_norm": 2.9243571758270264,
+ "learning_rate": 5.438367110228364e-06,
+ "loss": 0.0718,
+ "step": 24268
+ },
+ {
+ "epoch": 66.12806539509536,
+ "grad_norm": 2.8457818031311035,
+ "learning_rate": 5.437581799465174e-06,
+ "loss": 0.1266,
+ "step": 24269
+ },
+ {
+ "epoch": 66.1307901907357,
+ "grad_norm": 3.4168143272399902,
+ "learning_rate": 5.436796524233953e-06,
+ "loss": 0.1344,
+ "step": 24270
+ },
+ {
+ "epoch": 66.13351498637603,
+ "grad_norm": 4.4502482414245605,
+ "learning_rate": 5.436011284540816e-06,
+ "loss": 0.0456,
+ "step": 24271
+ },
+ {
+ "epoch": 66.13623978201635,
+ "grad_norm": 3.203949451446533,
+ "learning_rate": 5.435226080391876e-06,
+ "loss": 0.1046,
+ "step": 24272
+ },
+ {
+ "epoch": 66.13896457765668,
+ "grad_norm": 5.92611026763916,
+ "learning_rate": 5.43444091179325e-06,
+ "loss": 0.0545,
+ "step": 24273
+ },
+ {
+ "epoch": 66.141689373297,
+ "grad_norm": 2.4659831523895264,
+ "learning_rate": 5.433655778751046e-06,
+ "loss": 0.1484,
+ "step": 24274
+ },
+ {
+ "epoch": 66.14441416893733,
+ "grad_norm": 2.714594841003418,
+ "learning_rate": 5.432870681271387e-06,
+ "loss": 0.1633,
+ "step": 24275
+ },
+ {
+ "epoch": 66.14713896457765,
+ "grad_norm": 5.0077056884765625,
+ "learning_rate": 5.432085619360385e-06,
+ "loss": 0.1349,
+ "step": 24276
+ },
+ {
+ "epoch": 66.14986376021798,
+ "grad_norm": 3.6828205585479736,
+ "learning_rate": 5.431300593024154e-06,
+ "loss": 0.0866,
+ "step": 24277
+ },
+ {
+ "epoch": 66.15258855585832,
+ "grad_norm": 3.1793949604034424,
+ "learning_rate": 5.430515602268802e-06,
+ "loss": 0.104,
+ "step": 24278
+ },
+ {
+ "epoch": 66.15531335149863,
+ "grad_norm": 3.393775701522827,
+ "learning_rate": 5.429730647100452e-06,
+ "loss": 0.185,
+ "step": 24279
+ },
+ {
+ "epoch": 66.15803814713897,
+ "grad_norm": 2.9456627368927,
+ "learning_rate": 5.428945727525212e-06,
+ "loss": 0.0303,
+ "step": 24280
+ },
+ {
+ "epoch": 66.16076294277929,
+ "grad_norm": 7.299849510192871,
+ "learning_rate": 5.428160843549192e-06,
+ "loss": 0.1888,
+ "step": 24281
+ },
+ {
+ "epoch": 66.16348773841962,
+ "grad_norm": 3.188413143157959,
+ "learning_rate": 5.427375995178512e-06,
+ "loss": 0.0408,
+ "step": 24282
+ },
+ {
+ "epoch": 66.16621253405995,
+ "grad_norm": 3.6501407623291016,
+ "learning_rate": 5.426591182419281e-06,
+ "loss": 0.2349,
+ "step": 24283
+ },
+ {
+ "epoch": 66.16893732970027,
+ "grad_norm": 4.452661514282227,
+ "learning_rate": 5.425806405277609e-06,
+ "loss": 0.2183,
+ "step": 24284
+ },
+ {
+ "epoch": 66.1716621253406,
+ "grad_norm": 3.6181628704071045,
+ "learning_rate": 5.425021663759607e-06,
+ "loss": 0.0525,
+ "step": 24285
+ },
+ {
+ "epoch": 66.17438692098092,
+ "grad_norm": 3.887105703353882,
+ "learning_rate": 5.424236957871389e-06,
+ "loss": 0.1238,
+ "step": 24286
+ },
+ {
+ "epoch": 66.17711171662125,
+ "grad_norm": 2.744150161743164,
+ "learning_rate": 5.423452287619071e-06,
+ "loss": 0.0421,
+ "step": 24287
+ },
+ {
+ "epoch": 66.17983651226157,
+ "grad_norm": 5.4936981201171875,
+ "learning_rate": 5.4226676530087575e-06,
+ "loss": 0.0257,
+ "step": 24288
+ },
+ {
+ "epoch": 66.1825613079019,
+ "grad_norm": 2.7765650749206543,
+ "learning_rate": 5.421883054046562e-06,
+ "loss": 0.0715,
+ "step": 24289
+ },
+ {
+ "epoch": 66.18528610354224,
+ "grad_norm": 3.0034921169281006,
+ "learning_rate": 5.42109849073859e-06,
+ "loss": 0.0443,
+ "step": 24290
+ },
+ {
+ "epoch": 66.18801089918256,
+ "grad_norm": 2.518137216567993,
+ "learning_rate": 5.42031396309096e-06,
+ "loss": 0.116,
+ "step": 24291
+ },
+ {
+ "epoch": 66.19073569482289,
+ "grad_norm": 2.664363145828247,
+ "learning_rate": 5.4195294711097766e-06,
+ "loss": 0.0469,
+ "step": 24292
+ },
+ {
+ "epoch": 66.19346049046321,
+ "grad_norm": 2.527747631072998,
+ "learning_rate": 5.41874501480115e-06,
+ "loss": 0.0589,
+ "step": 24293
+ },
+ {
+ "epoch": 66.19618528610354,
+ "grad_norm": 4.242908954620361,
+ "learning_rate": 5.417960594171187e-06,
+ "loss": 0.0872,
+ "step": 24294
+ },
+ {
+ "epoch": 66.19891008174388,
+ "grad_norm": 2.8034889698028564,
+ "learning_rate": 5.417176209226003e-06,
+ "loss": 0.0412,
+ "step": 24295
+ },
+ {
+ "epoch": 66.2016348773842,
+ "grad_norm": 2.995678663253784,
+ "learning_rate": 5.4163918599717015e-06,
+ "loss": 0.0459,
+ "step": 24296
+ },
+ {
+ "epoch": 66.20435967302453,
+ "grad_norm": 2.9752919673919678,
+ "learning_rate": 5.415607546414394e-06,
+ "loss": 0.1032,
+ "step": 24297
+ },
+ {
+ "epoch": 66.20708446866485,
+ "grad_norm": 3.64369535446167,
+ "learning_rate": 5.414823268560184e-06,
+ "loss": 0.1894,
+ "step": 24298
+ },
+ {
+ "epoch": 66.20980926430518,
+ "grad_norm": 6.802177906036377,
+ "learning_rate": 5.414039026415187e-06,
+ "loss": 0.0524,
+ "step": 24299
+ },
+ {
+ "epoch": 66.2125340599455,
+ "grad_norm": 3.8642148971557617,
+ "learning_rate": 5.413254819985505e-06,
+ "loss": 0.0839,
+ "step": 24300
+ },
+ {
+ "epoch": 66.21525885558583,
+ "grad_norm": 3.5432136058807373,
+ "learning_rate": 5.412470649277244e-06,
+ "loss": 0.0668,
+ "step": 24301
+ },
+ {
+ "epoch": 66.21798365122616,
+ "grad_norm": 2.77707839012146,
+ "learning_rate": 5.411686514296517e-06,
+ "loss": 0.0738,
+ "step": 24302
+ },
+ {
+ "epoch": 66.22070844686648,
+ "grad_norm": 2.6112751960754395,
+ "learning_rate": 5.410902415049428e-06,
+ "loss": 0.0455,
+ "step": 24303
+ },
+ {
+ "epoch": 66.22343324250681,
+ "grad_norm": 2.9880340099334717,
+ "learning_rate": 5.410118351542079e-06,
+ "loss": 0.089,
+ "step": 24304
+ },
+ {
+ "epoch": 66.22615803814713,
+ "grad_norm": 4.272844314575195,
+ "learning_rate": 5.409334323780586e-06,
+ "loss": 0.0798,
+ "step": 24305
+ },
+ {
+ "epoch": 66.22888283378747,
+ "grad_norm": 3.6603877544403076,
+ "learning_rate": 5.408550331771045e-06,
+ "loss": 0.2148,
+ "step": 24306
+ },
+ {
+ "epoch": 66.2316076294278,
+ "grad_norm": 2.74448561668396,
+ "learning_rate": 5.40776637551957e-06,
+ "loss": 0.0391,
+ "step": 24307
+ },
+ {
+ "epoch": 66.23433242506812,
+ "grad_norm": 13.26368522644043,
+ "learning_rate": 5.4069824550322614e-06,
+ "loss": 0.1095,
+ "step": 24308
+ },
+ {
+ "epoch": 66.23705722070845,
+ "grad_norm": 3.366335391998291,
+ "learning_rate": 5.406198570315227e-06,
+ "loss": 0.073,
+ "step": 24309
+ },
+ {
+ "epoch": 66.23978201634877,
+ "grad_norm": 3.413801431655884,
+ "learning_rate": 5.405414721374567e-06,
+ "loss": 0.0339,
+ "step": 24310
+ },
+ {
+ "epoch": 66.2425068119891,
+ "grad_norm": 3.139404535293579,
+ "learning_rate": 5.404630908216391e-06,
+ "loss": 0.109,
+ "step": 24311
+ },
+ {
+ "epoch": 66.24523160762942,
+ "grad_norm": 3.3953793048858643,
+ "learning_rate": 5.4038471308468046e-06,
+ "loss": 0.0455,
+ "step": 24312
+ },
+ {
+ "epoch": 66.24795640326975,
+ "grad_norm": 4.085725784301758,
+ "learning_rate": 5.403063389271906e-06,
+ "loss": 0.1498,
+ "step": 24313
+ },
+ {
+ "epoch": 66.25068119891009,
+ "grad_norm": 3.603846311569214,
+ "learning_rate": 5.4022796834978e-06,
+ "loss": 0.1901,
+ "step": 24314
+ },
+ {
+ "epoch": 66.2534059945504,
+ "grad_norm": 3.5509657859802246,
+ "learning_rate": 5.401496013530594e-06,
+ "loss": 0.138,
+ "step": 24315
+ },
+ {
+ "epoch": 66.25613079019074,
+ "grad_norm": 3.6874115467071533,
+ "learning_rate": 5.400712379376389e-06,
+ "loss": 0.1103,
+ "step": 24316
+ },
+ {
+ "epoch": 66.25885558583106,
+ "grad_norm": 3.6496448516845703,
+ "learning_rate": 5.399928781041289e-06,
+ "loss": 0.1321,
+ "step": 24317
+ },
+ {
+ "epoch": 66.26158038147139,
+ "grad_norm": 3.424882650375366,
+ "learning_rate": 5.399145218531392e-06,
+ "loss": 0.0404,
+ "step": 24318
+ },
+ {
+ "epoch": 66.26430517711172,
+ "grad_norm": 2.8604648113250732,
+ "learning_rate": 5.398361691852807e-06,
+ "loss": 0.0482,
+ "step": 24319
+ },
+ {
+ "epoch": 66.26702997275204,
+ "grad_norm": 3.9597084522247314,
+ "learning_rate": 5.397578201011633e-06,
+ "loss": 0.2066,
+ "step": 24320
+ },
+ {
+ "epoch": 66.26975476839237,
+ "grad_norm": 3.7965893745422363,
+ "learning_rate": 5.396794746013969e-06,
+ "loss": 0.1034,
+ "step": 24321
+ },
+ {
+ "epoch": 66.2724795640327,
+ "grad_norm": 2.308955192565918,
+ "learning_rate": 5.396011326865918e-06,
+ "loss": 0.0803,
+ "step": 24322
+ },
+ {
+ "epoch": 66.27520435967303,
+ "grad_norm": 3.434704303741455,
+ "learning_rate": 5.395227943573588e-06,
+ "loss": 0.0408,
+ "step": 24323
+ },
+ {
+ "epoch": 66.27792915531334,
+ "grad_norm": 12.772610664367676,
+ "learning_rate": 5.394444596143074e-06,
+ "loss": 0.0785,
+ "step": 24324
+ },
+ {
+ "epoch": 66.28065395095368,
+ "grad_norm": 4.06698751449585,
+ "learning_rate": 5.393661284580476e-06,
+ "loss": 0.2114,
+ "step": 24325
+ },
+ {
+ "epoch": 66.28337874659401,
+ "grad_norm": 4.142553806304932,
+ "learning_rate": 5.392878008891893e-06,
+ "loss": 0.0809,
+ "step": 24326
+ },
+ {
+ "epoch": 66.28610354223433,
+ "grad_norm": 4.444906711578369,
+ "learning_rate": 5.3920947690834315e-06,
+ "loss": 0.2025,
+ "step": 24327
+ },
+ {
+ "epoch": 66.28882833787466,
+ "grad_norm": 4.779823303222656,
+ "learning_rate": 5.391311565161188e-06,
+ "loss": 0.0845,
+ "step": 24328
+ },
+ {
+ "epoch": 66.29155313351498,
+ "grad_norm": 3.2991936206817627,
+ "learning_rate": 5.39052839713126e-06,
+ "loss": 0.2644,
+ "step": 24329
+ },
+ {
+ "epoch": 66.29427792915531,
+ "grad_norm": 6.251668453216553,
+ "learning_rate": 5.389745264999746e-06,
+ "loss": 0.0719,
+ "step": 24330
+ },
+ {
+ "epoch": 66.29700272479565,
+ "grad_norm": 2.9856066703796387,
+ "learning_rate": 5.388962168772751e-06,
+ "loss": 0.0553,
+ "step": 24331
+ },
+ {
+ "epoch": 66.29972752043597,
+ "grad_norm": 6.136131286621094,
+ "learning_rate": 5.388179108456371e-06,
+ "loss": 0.1126,
+ "step": 24332
+ },
+ {
+ "epoch": 66.3024523160763,
+ "grad_norm": 3.4155325889587402,
+ "learning_rate": 5.387396084056704e-06,
+ "loss": 0.1678,
+ "step": 24333
+ },
+ {
+ "epoch": 66.30517711171662,
+ "grad_norm": 2.889922618865967,
+ "learning_rate": 5.386613095579842e-06,
+ "loss": 0.0481,
+ "step": 24334
+ },
+ {
+ "epoch": 66.30790190735695,
+ "grad_norm": 2.9885833263397217,
+ "learning_rate": 5.385830143031894e-06,
+ "loss": 0.0802,
+ "step": 24335
+ },
+ {
+ "epoch": 66.31062670299727,
+ "grad_norm": 3.7668232917785645,
+ "learning_rate": 5.385047226418953e-06,
+ "loss": 0.0485,
+ "step": 24336
+ },
+ {
+ "epoch": 66.3133514986376,
+ "grad_norm": 2.5551421642303467,
+ "learning_rate": 5.384264345747114e-06,
+ "loss": 0.0465,
+ "step": 24337
+ },
+ {
+ "epoch": 66.31607629427793,
+ "grad_norm": 2.507850408554077,
+ "learning_rate": 5.383481501022472e-06,
+ "loss": 0.034,
+ "step": 24338
+ },
+ {
+ "epoch": 66.31880108991825,
+ "grad_norm": 4.48660945892334,
+ "learning_rate": 5.382698692251128e-06,
+ "loss": 0.052,
+ "step": 24339
+ },
+ {
+ "epoch": 66.32152588555859,
+ "grad_norm": 3.4189884662628174,
+ "learning_rate": 5.381915919439182e-06,
+ "loss": 0.2075,
+ "step": 24340
+ },
+ {
+ "epoch": 66.3242506811989,
+ "grad_norm": 3.596912384033203,
+ "learning_rate": 5.381133182592726e-06,
+ "loss": 0.0506,
+ "step": 24341
+ },
+ {
+ "epoch": 66.32697547683924,
+ "grad_norm": 2.990658760070801,
+ "learning_rate": 5.380350481717853e-06,
+ "loss": 0.1349,
+ "step": 24342
+ },
+ {
+ "epoch": 66.32970027247957,
+ "grad_norm": 3.235776901245117,
+ "learning_rate": 5.379567816820664e-06,
+ "loss": 0.0529,
+ "step": 24343
+ },
+ {
+ "epoch": 66.33242506811989,
+ "grad_norm": 5.018767356872559,
+ "learning_rate": 5.378785187907254e-06,
+ "loss": 0.1797,
+ "step": 24344
+ },
+ {
+ "epoch": 66.33514986376022,
+ "grad_norm": 2.745403528213501,
+ "learning_rate": 5.378002594983715e-06,
+ "loss": 0.034,
+ "step": 24345
+ },
+ {
+ "epoch": 66.33787465940054,
+ "grad_norm": 3.718411684036255,
+ "learning_rate": 5.377220038056139e-06,
+ "loss": 0.0623,
+ "step": 24346
+ },
+ {
+ "epoch": 66.34059945504087,
+ "grad_norm": 2.6147892475128174,
+ "learning_rate": 5.376437517130629e-06,
+ "loss": 0.0675,
+ "step": 24347
+ },
+ {
+ "epoch": 66.34332425068119,
+ "grad_norm": 3.535597324371338,
+ "learning_rate": 5.375655032213275e-06,
+ "loss": 0.1465,
+ "step": 24348
+ },
+ {
+ "epoch": 66.34604904632153,
+ "grad_norm": 3.055279493331909,
+ "learning_rate": 5.374872583310171e-06,
+ "loss": 0.127,
+ "step": 24349
+ },
+ {
+ "epoch": 66.34877384196186,
+ "grad_norm": 3.0705902576446533,
+ "learning_rate": 5.3740901704274065e-06,
+ "loss": 0.1877,
+ "step": 24350
+ },
+ {
+ "epoch": 66.35149863760218,
+ "grad_norm": 3.3683879375457764,
+ "learning_rate": 5.373307793571081e-06,
+ "loss": 0.1183,
+ "step": 24351
+ },
+ {
+ "epoch": 66.35422343324251,
+ "grad_norm": 3.221919059753418,
+ "learning_rate": 5.372525452747288e-06,
+ "loss": 0.0942,
+ "step": 24352
+ },
+ {
+ "epoch": 66.35694822888283,
+ "grad_norm": 3.9317526817321777,
+ "learning_rate": 5.3717431479621164e-06,
+ "loss": 0.1732,
+ "step": 24353
+ },
+ {
+ "epoch": 66.35967302452316,
+ "grad_norm": 4.337979793548584,
+ "learning_rate": 5.370960879221656e-06,
+ "loss": 0.038,
+ "step": 24354
+ },
+ {
+ "epoch": 66.3623978201635,
+ "grad_norm": 3.9914824962615967,
+ "learning_rate": 5.370178646532004e-06,
+ "loss": 0.0724,
+ "step": 24355
+ },
+ {
+ "epoch": 66.36512261580381,
+ "grad_norm": 3.8431718349456787,
+ "learning_rate": 5.369396449899256e-06,
+ "loss": 0.1155,
+ "step": 24356
+ },
+ {
+ "epoch": 66.36784741144415,
+ "grad_norm": 4.0201239585876465,
+ "learning_rate": 5.368614289329499e-06,
+ "loss": 0.0864,
+ "step": 24357
+ },
+ {
+ "epoch": 66.37057220708446,
+ "grad_norm": 8.328060150146484,
+ "learning_rate": 5.367832164828823e-06,
+ "loss": 0.1455,
+ "step": 24358
+ },
+ {
+ "epoch": 66.3732970027248,
+ "grad_norm": 3.160085678100586,
+ "learning_rate": 5.367050076403319e-06,
+ "loss": 0.0564,
+ "step": 24359
+ },
+ {
+ "epoch": 66.37602179836512,
+ "grad_norm": 2.751584529876709,
+ "learning_rate": 5.366268024059085e-06,
+ "loss": 0.0621,
+ "step": 24360
+ },
+ {
+ "epoch": 66.37874659400545,
+ "grad_norm": 3.876132011413574,
+ "learning_rate": 5.365486007802206e-06,
+ "loss": 0.0941,
+ "step": 24361
+ },
+ {
+ "epoch": 66.38147138964578,
+ "grad_norm": 2.637402057647705,
+ "learning_rate": 5.3647040276387695e-06,
+ "loss": 0.133,
+ "step": 24362
+ },
+ {
+ "epoch": 66.3841961852861,
+ "grad_norm": 3.3070435523986816,
+ "learning_rate": 5.363922083574869e-06,
+ "loss": 0.0534,
+ "step": 24363
+ },
+ {
+ "epoch": 66.38692098092643,
+ "grad_norm": 6.5956830978393555,
+ "learning_rate": 5.363140175616596e-06,
+ "loss": 0.1527,
+ "step": 24364
+ },
+ {
+ "epoch": 66.38964577656675,
+ "grad_norm": 3.4426121711730957,
+ "learning_rate": 5.362358303770039e-06,
+ "loss": 0.1852,
+ "step": 24365
+ },
+ {
+ "epoch": 66.39237057220708,
+ "grad_norm": 4.032536029815674,
+ "learning_rate": 5.36157646804128e-06,
+ "loss": 0.0495,
+ "step": 24366
+ },
+ {
+ "epoch": 66.39509536784742,
+ "grad_norm": 3.3472368717193604,
+ "learning_rate": 5.360794668436421e-06,
+ "loss": 0.1474,
+ "step": 24367
+ },
+ {
+ "epoch": 66.39782016348774,
+ "grad_norm": 6.354490756988525,
+ "learning_rate": 5.360012904961542e-06,
+ "loss": 0.0648,
+ "step": 24368
+ },
+ {
+ "epoch": 66.40054495912807,
+ "grad_norm": 3.3422086238861084,
+ "learning_rate": 5.359231177622735e-06,
+ "loss": 0.1479,
+ "step": 24369
+ },
+ {
+ "epoch": 66.40326975476839,
+ "grad_norm": 4.014708042144775,
+ "learning_rate": 5.358449486426081e-06,
+ "loss": 0.0974,
+ "step": 24370
+ },
+ {
+ "epoch": 66.40599455040872,
+ "grad_norm": 2.181469678878784,
+ "learning_rate": 5.357667831377676e-06,
+ "loss": 0.0366,
+ "step": 24371
+ },
+ {
+ "epoch": 66.40871934604904,
+ "grad_norm": 6.039536952972412,
+ "learning_rate": 5.356886212483603e-06,
+ "loss": 0.3392,
+ "step": 24372
+ },
+ {
+ "epoch": 66.41144414168937,
+ "grad_norm": 3.6809701919555664,
+ "learning_rate": 5.356104629749952e-06,
+ "loss": 0.1699,
+ "step": 24373
+ },
+ {
+ "epoch": 66.4141689373297,
+ "grad_norm": 4.135191440582275,
+ "learning_rate": 5.355323083182811e-06,
+ "loss": 0.1575,
+ "step": 24374
+ },
+ {
+ "epoch": 66.41689373297002,
+ "grad_norm": 2.894618272781372,
+ "learning_rate": 5.354541572788259e-06,
+ "loss": 0.0403,
+ "step": 24375
+ },
+ {
+ "epoch": 66.41961852861036,
+ "grad_norm": 3.449108123779297,
+ "learning_rate": 5.353760098572393e-06,
+ "loss": 0.0643,
+ "step": 24376
+ },
+ {
+ "epoch": 66.42234332425068,
+ "grad_norm": 5.413773059844971,
+ "learning_rate": 5.3529786605412925e-06,
+ "loss": 0.133,
+ "step": 24377
+ },
+ {
+ "epoch": 66.42506811989101,
+ "grad_norm": 2.243168592453003,
+ "learning_rate": 5.352197258701044e-06,
+ "loss": 0.0437,
+ "step": 24378
+ },
+ {
+ "epoch": 66.42779291553134,
+ "grad_norm": 4.364460468292236,
+ "learning_rate": 5.351415893057732e-06,
+ "loss": 0.1098,
+ "step": 24379
+ },
+ {
+ "epoch": 66.43051771117166,
+ "grad_norm": 2.627695083618164,
+ "learning_rate": 5.350634563617445e-06,
+ "loss": 0.041,
+ "step": 24380
+ },
+ {
+ "epoch": 66.433242506812,
+ "grad_norm": 7.7000627517700195,
+ "learning_rate": 5.3498532703862685e-06,
+ "loss": 0.1024,
+ "step": 24381
+ },
+ {
+ "epoch": 66.43596730245231,
+ "grad_norm": 3.704960823059082,
+ "learning_rate": 5.349072013370285e-06,
+ "loss": 0.1359,
+ "step": 24382
+ },
+ {
+ "epoch": 66.43869209809264,
+ "grad_norm": 3.626906156539917,
+ "learning_rate": 5.348290792575572e-06,
+ "loss": 0.1797,
+ "step": 24383
+ },
+ {
+ "epoch": 66.44141689373296,
+ "grad_norm": 4.711760997772217,
+ "learning_rate": 5.347509608008228e-06,
+ "loss": 0.0528,
+ "step": 24384
+ },
+ {
+ "epoch": 66.4441416893733,
+ "grad_norm": 3.4660227298736572,
+ "learning_rate": 5.346728459674327e-06,
+ "loss": 0.1244,
+ "step": 24385
+ },
+ {
+ "epoch": 66.44686648501363,
+ "grad_norm": 3.4487414360046387,
+ "learning_rate": 5.3459473475799565e-06,
+ "loss": 0.0642,
+ "step": 24386
+ },
+ {
+ "epoch": 66.44959128065395,
+ "grad_norm": 16.17318344116211,
+ "learning_rate": 5.345166271731195e-06,
+ "loss": 0.0778,
+ "step": 24387
+ },
+ {
+ "epoch": 66.45231607629428,
+ "grad_norm": 5.871947288513184,
+ "learning_rate": 5.344385232134131e-06,
+ "loss": 0.0867,
+ "step": 24388
+ },
+ {
+ "epoch": 66.4550408719346,
+ "grad_norm": 2.7655997276306152,
+ "learning_rate": 5.343604228794845e-06,
+ "loss": 0.0538,
+ "step": 24389
+ },
+ {
+ "epoch": 66.45776566757493,
+ "grad_norm": 2.9549553394317627,
+ "learning_rate": 5.342823261719417e-06,
+ "loss": 0.0427,
+ "step": 24390
+ },
+ {
+ "epoch": 66.46049046321527,
+ "grad_norm": 2.7028307914733887,
+ "learning_rate": 5.34204233091393e-06,
+ "loss": 0.0329,
+ "step": 24391
+ },
+ {
+ "epoch": 66.46321525885558,
+ "grad_norm": 2.3739640712738037,
+ "learning_rate": 5.341261436384472e-06,
+ "loss": 0.0387,
+ "step": 24392
+ },
+ {
+ "epoch": 66.46594005449592,
+ "grad_norm": 4.051398754119873,
+ "learning_rate": 5.34048057813712e-06,
+ "loss": 0.1547,
+ "step": 24393
+ },
+ {
+ "epoch": 66.46866485013624,
+ "grad_norm": 3.3245432376861572,
+ "learning_rate": 5.339699756177954e-06,
+ "loss": 0.0516,
+ "step": 24394
+ },
+ {
+ "epoch": 66.47138964577657,
+ "grad_norm": 2.757563352584839,
+ "learning_rate": 5.338918970513054e-06,
+ "loss": 0.1485,
+ "step": 24395
+ },
+ {
+ "epoch": 66.47411444141689,
+ "grad_norm": 2.9744319915771484,
+ "learning_rate": 5.338138221148506e-06,
+ "loss": 0.0963,
+ "step": 24396
+ },
+ {
+ "epoch": 66.47683923705722,
+ "grad_norm": 4.11489200592041,
+ "learning_rate": 5.337357508090388e-06,
+ "loss": 0.0836,
+ "step": 24397
+ },
+ {
+ "epoch": 66.47956403269755,
+ "grad_norm": 3.1040594577789307,
+ "learning_rate": 5.336576831344781e-06,
+ "loss": 0.0741,
+ "step": 24398
+ },
+ {
+ "epoch": 66.48228882833787,
+ "grad_norm": 5.489741325378418,
+ "learning_rate": 5.335796190917758e-06,
+ "loss": 0.0545,
+ "step": 24399
+ },
+ {
+ "epoch": 66.4850136239782,
+ "grad_norm": 3.4695920944213867,
+ "learning_rate": 5.335015586815408e-06,
+ "loss": 0.0577,
+ "step": 24400
+ },
+ {
+ "epoch": 66.48773841961852,
+ "grad_norm": 3.547744035720825,
+ "learning_rate": 5.3342350190438075e-06,
+ "loss": 0.0754,
+ "step": 24401
+ },
+ {
+ "epoch": 66.49046321525886,
+ "grad_norm": 3.535972833633423,
+ "learning_rate": 5.333454487609033e-06,
+ "loss": 0.0663,
+ "step": 24402
+ },
+ {
+ "epoch": 66.49318801089919,
+ "grad_norm": 4.044013977050781,
+ "learning_rate": 5.332673992517162e-06,
+ "loss": 0.2245,
+ "step": 24403
+ },
+ {
+ "epoch": 66.49591280653951,
+ "grad_norm": 3.093130111694336,
+ "learning_rate": 5.3318935337742795e-06,
+ "loss": 0.0305,
+ "step": 24404
+ },
+ {
+ "epoch": 66.49863760217984,
+ "grad_norm": 3.9721336364746094,
+ "learning_rate": 5.331113111386459e-06,
+ "loss": 0.0535,
+ "step": 24405
+ },
+ {
+ "epoch": 66.50136239782016,
+ "grad_norm": 4.23530387878418,
+ "learning_rate": 5.330332725359781e-06,
+ "loss": 0.0688,
+ "step": 24406
+ },
+ {
+ "epoch": 66.50408719346049,
+ "grad_norm": 4.098939418792725,
+ "learning_rate": 5.329552375700313e-06,
+ "loss": 0.0821,
+ "step": 24407
+ },
+ {
+ "epoch": 66.50681198910081,
+ "grad_norm": 7.238304615020752,
+ "learning_rate": 5.328772062414147e-06,
+ "loss": 0.1316,
+ "step": 24408
+ },
+ {
+ "epoch": 66.50953678474114,
+ "grad_norm": 2.327904224395752,
+ "learning_rate": 5.327991785507356e-06,
+ "loss": 0.0501,
+ "step": 24409
+ },
+ {
+ "epoch": 66.51226158038148,
+ "grad_norm": 3.332578659057617,
+ "learning_rate": 5.327211544986013e-06,
+ "loss": 0.1043,
+ "step": 24410
+ },
+ {
+ "epoch": 66.5149863760218,
+ "grad_norm": 3.3954625129699707,
+ "learning_rate": 5.326431340856193e-06,
+ "loss": 0.0434,
+ "step": 24411
+ },
+ {
+ "epoch": 66.51771117166213,
+ "grad_norm": 5.331161975860596,
+ "learning_rate": 5.3256511731239805e-06,
+ "loss": 0.1002,
+ "step": 24412
+ },
+ {
+ "epoch": 66.52043596730245,
+ "grad_norm": 3.658219337463379,
+ "learning_rate": 5.324871041795444e-06,
+ "loss": 0.2241,
+ "step": 24413
+ },
+ {
+ "epoch": 66.52316076294278,
+ "grad_norm": 4.608555793762207,
+ "learning_rate": 5.3240909468766625e-06,
+ "loss": 0.1769,
+ "step": 24414
+ },
+ {
+ "epoch": 66.52588555858311,
+ "grad_norm": 4.825925827026367,
+ "learning_rate": 5.323310888373705e-06,
+ "loss": 0.1014,
+ "step": 24415
+ },
+ {
+ "epoch": 66.52861035422343,
+ "grad_norm": 2.0899970531463623,
+ "learning_rate": 5.322530866292658e-06,
+ "loss": 0.0331,
+ "step": 24416
+ },
+ {
+ "epoch": 66.53133514986376,
+ "grad_norm": 3.315011501312256,
+ "learning_rate": 5.321750880639589e-06,
+ "loss": 0.0739,
+ "step": 24417
+ },
+ {
+ "epoch": 66.53405994550408,
+ "grad_norm": 3.0963010787963867,
+ "learning_rate": 5.320970931420572e-06,
+ "loss": 0.0825,
+ "step": 24418
+ },
+ {
+ "epoch": 66.53678474114442,
+ "grad_norm": 14.82800579071045,
+ "learning_rate": 5.3201910186416805e-06,
+ "loss": 0.138,
+ "step": 24419
+ },
+ {
+ "epoch": 66.53950953678473,
+ "grad_norm": 3.478710174560547,
+ "learning_rate": 5.3194111423089945e-06,
+ "loss": 0.0681,
+ "step": 24420
+ },
+ {
+ "epoch": 66.54223433242507,
+ "grad_norm": 3.069889783859253,
+ "learning_rate": 5.318631302428584e-06,
+ "loss": 0.1064,
+ "step": 24421
+ },
+ {
+ "epoch": 66.5449591280654,
+ "grad_norm": 4.537165641784668,
+ "learning_rate": 5.317851499006522e-06,
+ "loss": 0.2001,
+ "step": 24422
+ },
+ {
+ "epoch": 66.54768392370572,
+ "grad_norm": 3.5059680938720703,
+ "learning_rate": 5.317071732048877e-06,
+ "loss": 0.1032,
+ "step": 24423
+ },
+ {
+ "epoch": 66.55040871934605,
+ "grad_norm": 2.677603244781494,
+ "learning_rate": 5.316292001561729e-06,
+ "loss": 0.0401,
+ "step": 24424
+ },
+ {
+ "epoch": 66.55313351498637,
+ "grad_norm": 2.9905624389648438,
+ "learning_rate": 5.315512307551149e-06,
+ "loss": 0.0424,
+ "step": 24425
+ },
+ {
+ "epoch": 66.5558583106267,
+ "grad_norm": 3.9608407020568848,
+ "learning_rate": 5.314732650023211e-06,
+ "loss": 0.1701,
+ "step": 24426
+ },
+ {
+ "epoch": 66.55858310626704,
+ "grad_norm": 2.984921455383301,
+ "learning_rate": 5.3139530289839835e-06,
+ "loss": 0.0934,
+ "step": 24427
+ },
+ {
+ "epoch": 66.56130790190736,
+ "grad_norm": 3.228469133377075,
+ "learning_rate": 5.313173444439535e-06,
+ "loss": 0.1571,
+ "step": 24428
+ },
+ {
+ "epoch": 66.56403269754769,
+ "grad_norm": 2.8808178901672363,
+ "learning_rate": 5.312393896395944e-06,
+ "loss": 0.1158,
+ "step": 24429
+ },
+ {
+ "epoch": 66.566757493188,
+ "grad_norm": 2.9934260845184326,
+ "learning_rate": 5.311614384859281e-06,
+ "loss": 0.0521,
+ "step": 24430
+ },
+ {
+ "epoch": 66.56948228882834,
+ "grad_norm": 2.9923391342163086,
+ "learning_rate": 5.310834909835607e-06,
+ "loss": 0.0424,
+ "step": 24431
+ },
+ {
+ "epoch": 66.57220708446866,
+ "grad_norm": 3.9207231998443604,
+ "learning_rate": 5.310055471331006e-06,
+ "loss": 0.1289,
+ "step": 24432
+ },
+ {
+ "epoch": 66.57493188010899,
+ "grad_norm": 3.5021450519561768,
+ "learning_rate": 5.309276069351541e-06,
+ "loss": 0.1068,
+ "step": 24433
+ },
+ {
+ "epoch": 66.57765667574932,
+ "grad_norm": 5.448784828186035,
+ "learning_rate": 5.308496703903283e-06,
+ "loss": 0.197,
+ "step": 24434
+ },
+ {
+ "epoch": 66.58038147138964,
+ "grad_norm": 3.25518798828125,
+ "learning_rate": 5.307717374992298e-06,
+ "loss": 0.0947,
+ "step": 24435
+ },
+ {
+ "epoch": 66.58310626702998,
+ "grad_norm": 4.407520294189453,
+ "learning_rate": 5.306938082624663e-06,
+ "loss": 0.0852,
+ "step": 24436
+ },
+ {
+ "epoch": 66.5858310626703,
+ "grad_norm": 3.608776092529297,
+ "learning_rate": 5.306158826806443e-06,
+ "loss": 0.1135,
+ "step": 24437
+ },
+ {
+ "epoch": 66.58855585831063,
+ "grad_norm": 3.587841749191284,
+ "learning_rate": 5.305379607543708e-06,
+ "loss": 0.1764,
+ "step": 24438
+ },
+ {
+ "epoch": 66.59128065395096,
+ "grad_norm": 3.5023584365844727,
+ "learning_rate": 5.30460042484252e-06,
+ "loss": 0.0544,
+ "step": 24439
+ },
+ {
+ "epoch": 66.59400544959128,
+ "grad_norm": 3.0952892303466797,
+ "learning_rate": 5.303821278708958e-06,
+ "loss": 0.047,
+ "step": 24440
+ },
+ {
+ "epoch": 66.59673024523161,
+ "grad_norm": 3.8683419227600098,
+ "learning_rate": 5.303042169149079e-06,
+ "loss": 0.1697,
+ "step": 24441
+ },
+ {
+ "epoch": 66.59945504087193,
+ "grad_norm": 3.4120495319366455,
+ "learning_rate": 5.302263096168963e-06,
+ "loss": 0.0438,
+ "step": 24442
+ },
+ {
+ "epoch": 66.60217983651226,
+ "grad_norm": 3.191737651824951,
+ "learning_rate": 5.301484059774668e-06,
+ "loss": 0.054,
+ "step": 24443
+ },
+ {
+ "epoch": 66.60490463215258,
+ "grad_norm": 4.179776191711426,
+ "learning_rate": 5.300705059972262e-06,
+ "loss": 0.1406,
+ "step": 24444
+ },
+ {
+ "epoch": 66.60762942779292,
+ "grad_norm": 4.180954933166504,
+ "learning_rate": 5.299926096767818e-06,
+ "loss": 0.0562,
+ "step": 24445
+ },
+ {
+ "epoch": 66.61035422343325,
+ "grad_norm": 2.867324113845825,
+ "learning_rate": 5.299147170167397e-06,
+ "loss": 0.0586,
+ "step": 24446
+ },
+ {
+ "epoch": 66.61307901907357,
+ "grad_norm": 3.289529323577881,
+ "learning_rate": 5.298368280177066e-06,
+ "loss": 0.0632,
+ "step": 24447
+ },
+ {
+ "epoch": 66.6158038147139,
+ "grad_norm": 2.871412992477417,
+ "learning_rate": 5.297589426802889e-06,
+ "loss": 0.1184,
+ "step": 24448
+ },
+ {
+ "epoch": 66.61852861035422,
+ "grad_norm": 3.8014256954193115,
+ "learning_rate": 5.296810610050937e-06,
+ "loss": 0.1684,
+ "step": 24449
+ },
+ {
+ "epoch": 66.62125340599455,
+ "grad_norm": 2.6733717918395996,
+ "learning_rate": 5.296031829927274e-06,
+ "loss": 0.0539,
+ "step": 24450
+ },
+ {
+ "epoch": 66.62397820163488,
+ "grad_norm": 3.6280720233917236,
+ "learning_rate": 5.2952530864379595e-06,
+ "loss": 0.0939,
+ "step": 24451
+ },
+ {
+ "epoch": 66.6267029972752,
+ "grad_norm": 3.6763455867767334,
+ "learning_rate": 5.294474379589065e-06,
+ "loss": 0.1457,
+ "step": 24452
+ },
+ {
+ "epoch": 66.62942779291554,
+ "grad_norm": 3.1730730533599854,
+ "learning_rate": 5.293695709386655e-06,
+ "loss": 0.1938,
+ "step": 24453
+ },
+ {
+ "epoch": 66.63215258855585,
+ "grad_norm": 3.2582757472991943,
+ "learning_rate": 5.292917075836789e-06,
+ "loss": 0.1068,
+ "step": 24454
+ },
+ {
+ "epoch": 66.63487738419619,
+ "grad_norm": 3.7654495239257812,
+ "learning_rate": 5.29213847894553e-06,
+ "loss": 0.0986,
+ "step": 24455
+ },
+ {
+ "epoch": 66.6376021798365,
+ "grad_norm": 3.281188488006592,
+ "learning_rate": 5.29135991871895e-06,
+ "loss": 0.1427,
+ "step": 24456
+ },
+ {
+ "epoch": 66.64032697547684,
+ "grad_norm": 2.386540651321411,
+ "learning_rate": 5.290581395163106e-06,
+ "loss": 0.0582,
+ "step": 24457
+ },
+ {
+ "epoch": 66.64305177111717,
+ "grad_norm": 2.81923246383667,
+ "learning_rate": 5.289802908284063e-06,
+ "loss": 0.0411,
+ "step": 24458
+ },
+ {
+ "epoch": 66.64577656675749,
+ "grad_norm": 4.507114410400391,
+ "learning_rate": 5.289024458087879e-06,
+ "loss": 0.2048,
+ "step": 24459
+ },
+ {
+ "epoch": 66.64850136239782,
+ "grad_norm": 2.605423927307129,
+ "learning_rate": 5.288246044580623e-06,
+ "loss": 0.1153,
+ "step": 24460
+ },
+ {
+ "epoch": 66.65122615803814,
+ "grad_norm": 3.0955703258514404,
+ "learning_rate": 5.287467667768357e-06,
+ "loss": 0.0473,
+ "step": 24461
+ },
+ {
+ "epoch": 66.65395095367847,
+ "grad_norm": 3.8462536334991455,
+ "learning_rate": 5.286689327657142e-06,
+ "loss": 0.0389,
+ "step": 24462
+ },
+ {
+ "epoch": 66.65667574931881,
+ "grad_norm": 2.484198808670044,
+ "learning_rate": 5.285911024253039e-06,
+ "loss": 0.0515,
+ "step": 24463
+ },
+ {
+ "epoch": 66.65940054495913,
+ "grad_norm": 3.103261709213257,
+ "learning_rate": 5.2851327575621035e-06,
+ "loss": 0.079,
+ "step": 24464
+ },
+ {
+ "epoch": 66.66212534059946,
+ "grad_norm": 2.198317766189575,
+ "learning_rate": 5.284354527590407e-06,
+ "loss": 0.0314,
+ "step": 24465
+ },
+ {
+ "epoch": 66.66485013623978,
+ "grad_norm": 3.7459402084350586,
+ "learning_rate": 5.283576334344007e-06,
+ "loss": 0.0921,
+ "step": 24466
+ },
+ {
+ "epoch": 66.66757493188011,
+ "grad_norm": 1.9179775714874268,
+ "learning_rate": 5.2827981778289625e-06,
+ "loss": 0.0278,
+ "step": 24467
+ },
+ {
+ "epoch": 66.67029972752043,
+ "grad_norm": 4.033474445343018,
+ "learning_rate": 5.2820200580513295e-06,
+ "loss": 0.0628,
+ "step": 24468
+ },
+ {
+ "epoch": 66.67302452316076,
+ "grad_norm": 5.211009979248047,
+ "learning_rate": 5.281241975017176e-06,
+ "loss": 0.0908,
+ "step": 24469
+ },
+ {
+ "epoch": 66.6757493188011,
+ "grad_norm": 4.247863292694092,
+ "learning_rate": 5.280463928732557e-06,
+ "loss": 0.1162,
+ "step": 24470
+ },
+ {
+ "epoch": 66.67847411444141,
+ "grad_norm": 4.005177974700928,
+ "learning_rate": 5.279685919203537e-06,
+ "loss": 0.1159,
+ "step": 24471
+ },
+ {
+ "epoch": 66.68119891008175,
+ "grad_norm": 2.956925630569458,
+ "learning_rate": 5.278907946436164e-06,
+ "loss": 0.043,
+ "step": 24472
+ },
+ {
+ "epoch": 66.68392370572207,
+ "grad_norm": 3.3972792625427246,
+ "learning_rate": 5.278130010436509e-06,
+ "loss": 0.0568,
+ "step": 24473
+ },
+ {
+ "epoch": 66.6866485013624,
+ "grad_norm": 3.1583309173583984,
+ "learning_rate": 5.277352111210625e-06,
+ "loss": 0.123,
+ "step": 24474
+ },
+ {
+ "epoch": 66.68937329700273,
+ "grad_norm": 3.8960046768188477,
+ "learning_rate": 5.276574248764567e-06,
+ "loss": 0.0637,
+ "step": 24475
+ },
+ {
+ "epoch": 66.69209809264305,
+ "grad_norm": 3.651273250579834,
+ "learning_rate": 5.275796423104396e-06,
+ "loss": 0.0694,
+ "step": 24476
+ },
+ {
+ "epoch": 66.69482288828338,
+ "grad_norm": 4.14750862121582,
+ "learning_rate": 5.275018634236176e-06,
+ "loss": 0.0897,
+ "step": 24477
+ },
+ {
+ "epoch": 66.6975476839237,
+ "grad_norm": 3.3199069499969482,
+ "learning_rate": 5.274240882165958e-06,
+ "loss": 0.1153,
+ "step": 24478
+ },
+ {
+ "epoch": 66.70027247956403,
+ "grad_norm": 6.15848970413208,
+ "learning_rate": 5.2734631668998e-06,
+ "loss": 0.1701,
+ "step": 24479
+ },
+ {
+ "epoch": 66.70299727520435,
+ "grad_norm": 4.8711771965026855,
+ "learning_rate": 5.272685488443754e-06,
+ "loss": 0.1102,
+ "step": 24480
+ },
+ {
+ "epoch": 66.70572207084469,
+ "grad_norm": 3.2478652000427246,
+ "learning_rate": 5.271907846803885e-06,
+ "loss": 0.0948,
+ "step": 24481
+ },
+ {
+ "epoch": 66.70844686648502,
+ "grad_norm": 3.449075222015381,
+ "learning_rate": 5.271130241986246e-06,
+ "loss": 0.1392,
+ "step": 24482
+ },
+ {
+ "epoch": 66.71117166212534,
+ "grad_norm": 9.120984077453613,
+ "learning_rate": 5.270352673996893e-06,
+ "loss": 0.1362,
+ "step": 24483
+ },
+ {
+ "epoch": 66.71389645776567,
+ "grad_norm": 3.307509422302246,
+ "learning_rate": 5.269575142841876e-06,
+ "loss": 0.0432,
+ "step": 24484
+ },
+ {
+ "epoch": 66.71662125340599,
+ "grad_norm": 4.888644218444824,
+ "learning_rate": 5.268797648527262e-06,
+ "loss": 0.1129,
+ "step": 24485
+ },
+ {
+ "epoch": 66.71934604904632,
+ "grad_norm": 3.402113676071167,
+ "learning_rate": 5.268020191059098e-06,
+ "loss": 0.0675,
+ "step": 24486
+ },
+ {
+ "epoch": 66.72207084468666,
+ "grad_norm": 3.7245945930480957,
+ "learning_rate": 5.26724277044344e-06,
+ "loss": 0.1126,
+ "step": 24487
+ },
+ {
+ "epoch": 66.72479564032697,
+ "grad_norm": 3.6874537467956543,
+ "learning_rate": 5.266465386686339e-06,
+ "loss": 0.1886,
+ "step": 24488
+ },
+ {
+ "epoch": 66.7275204359673,
+ "grad_norm": 2.0126962661743164,
+ "learning_rate": 5.2656880397938585e-06,
+ "loss": 0.0286,
+ "step": 24489
+ },
+ {
+ "epoch": 66.73024523160763,
+ "grad_norm": 2.6054625511169434,
+ "learning_rate": 5.264910729772046e-06,
+ "loss": 0.0982,
+ "step": 24490
+ },
+ {
+ "epoch": 66.73297002724796,
+ "grad_norm": 3.2242088317871094,
+ "learning_rate": 5.264133456626956e-06,
+ "loss": 0.0863,
+ "step": 24491
+ },
+ {
+ "epoch": 66.73569482288828,
+ "grad_norm": 4.689243316650391,
+ "learning_rate": 5.2633562203646395e-06,
+ "loss": 0.0804,
+ "step": 24492
+ },
+ {
+ "epoch": 66.73841961852861,
+ "grad_norm": 3.8238258361816406,
+ "learning_rate": 5.262579020991152e-06,
+ "loss": 0.0925,
+ "step": 24493
+ },
+ {
+ "epoch": 66.74114441416894,
+ "grad_norm": 3.351555347442627,
+ "learning_rate": 5.26180185851255e-06,
+ "loss": 0.0536,
+ "step": 24494
+ },
+ {
+ "epoch": 66.74386920980926,
+ "grad_norm": 2.875150442123413,
+ "learning_rate": 5.261024732934883e-06,
+ "loss": 0.0337,
+ "step": 24495
+ },
+ {
+ "epoch": 66.7465940054496,
+ "grad_norm": 3.38814377784729,
+ "learning_rate": 5.260247644264199e-06,
+ "loss": 0.0902,
+ "step": 24496
+ },
+ {
+ "epoch": 66.74931880108991,
+ "grad_norm": 3.024885892868042,
+ "learning_rate": 5.259470592506558e-06,
+ "loss": 0.0865,
+ "step": 24497
+ },
+ {
+ "epoch": 66.75204359673025,
+ "grad_norm": 3.5949912071228027,
+ "learning_rate": 5.258693577668007e-06,
+ "loss": 0.0386,
+ "step": 24498
+ },
+ {
+ "epoch": 66.75476839237058,
+ "grad_norm": 3.1890130043029785,
+ "learning_rate": 5.257916599754598e-06,
+ "loss": 0.067,
+ "step": 24499
+ },
+ {
+ "epoch": 66.7574931880109,
+ "grad_norm": 2.889885663986206,
+ "learning_rate": 5.257139658772378e-06,
+ "loss": 0.0655,
+ "step": 24500
+ },
+ {
+ "epoch": 66.76021798365123,
+ "grad_norm": 3.1376566886901855,
+ "learning_rate": 5.256362754727405e-06,
+ "loss": 0.0897,
+ "step": 24501
+ },
+ {
+ "epoch": 66.76294277929155,
+ "grad_norm": 3.6445372104644775,
+ "learning_rate": 5.255585887625727e-06,
+ "loss": 0.1373,
+ "step": 24502
+ },
+ {
+ "epoch": 66.76566757493188,
+ "grad_norm": 4.082334041595459,
+ "learning_rate": 5.254809057473393e-06,
+ "loss": 0.1015,
+ "step": 24503
+ },
+ {
+ "epoch": 66.7683923705722,
+ "grad_norm": 3.480103015899658,
+ "learning_rate": 5.25403226427645e-06,
+ "loss": 0.0553,
+ "step": 24504
+ },
+ {
+ "epoch": 66.77111716621253,
+ "grad_norm": 3.3684353828430176,
+ "learning_rate": 5.253255508040954e-06,
+ "loss": 0.1454,
+ "step": 24505
+ },
+ {
+ "epoch": 66.77384196185287,
+ "grad_norm": 4.273370742797852,
+ "learning_rate": 5.252478788772952e-06,
+ "loss": 0.1254,
+ "step": 24506
+ },
+ {
+ "epoch": 66.77656675749319,
+ "grad_norm": 3.679145336151123,
+ "learning_rate": 5.251702106478491e-06,
+ "loss": 0.0507,
+ "step": 24507
+ },
+ {
+ "epoch": 66.77929155313352,
+ "grad_norm": 3.5244994163513184,
+ "learning_rate": 5.2509254611636196e-06,
+ "loss": 0.0618,
+ "step": 24508
+ },
+ {
+ "epoch": 66.78201634877384,
+ "grad_norm": 3.312422037124634,
+ "learning_rate": 5.25014885283439e-06,
+ "loss": 0.0723,
+ "step": 24509
+ },
+ {
+ "epoch": 66.78474114441417,
+ "grad_norm": 3.9562501907348633,
+ "learning_rate": 5.249372281496845e-06,
+ "loss": 0.0454,
+ "step": 24510
+ },
+ {
+ "epoch": 66.7874659400545,
+ "grad_norm": 3.1592650413513184,
+ "learning_rate": 5.248595747157039e-06,
+ "loss": 0.1629,
+ "step": 24511
+ },
+ {
+ "epoch": 66.79019073569482,
+ "grad_norm": 3.199082851409912,
+ "learning_rate": 5.247819249821018e-06,
+ "loss": 0.1506,
+ "step": 24512
+ },
+ {
+ "epoch": 66.79291553133515,
+ "grad_norm": 4.939488887786865,
+ "learning_rate": 5.247042789494823e-06,
+ "loss": 0.0471,
+ "step": 24513
+ },
+ {
+ "epoch": 66.79564032697547,
+ "grad_norm": 2.8808956146240234,
+ "learning_rate": 5.2462663661845094e-06,
+ "loss": 0.165,
+ "step": 24514
+ },
+ {
+ "epoch": 66.7983651226158,
+ "grad_norm": 4.536468982696533,
+ "learning_rate": 5.24548997989612e-06,
+ "loss": 0.0878,
+ "step": 24515
+ },
+ {
+ "epoch": 66.80108991825612,
+ "grad_norm": 4.296672821044922,
+ "learning_rate": 5.244713630635698e-06,
+ "loss": 0.0772,
+ "step": 24516
+ },
+ {
+ "epoch": 66.80381471389646,
+ "grad_norm": 4.1772918701171875,
+ "learning_rate": 5.243937318409298e-06,
+ "loss": 0.0558,
+ "step": 24517
+ },
+ {
+ "epoch": 66.80653950953679,
+ "grad_norm": 4.366561412811279,
+ "learning_rate": 5.24316104322296e-06,
+ "loss": 0.137,
+ "step": 24518
+ },
+ {
+ "epoch": 66.80926430517711,
+ "grad_norm": 4.326655387878418,
+ "learning_rate": 5.242384805082731e-06,
+ "loss": 0.0469,
+ "step": 24519
+ },
+ {
+ "epoch": 66.81198910081744,
+ "grad_norm": 3.3069229125976562,
+ "learning_rate": 5.241608603994652e-06,
+ "loss": 0.1111,
+ "step": 24520
+ },
+ {
+ "epoch": 66.81471389645776,
+ "grad_norm": 2.7045812606811523,
+ "learning_rate": 5.240832439964776e-06,
+ "loss": 0.0447,
+ "step": 24521
+ },
+ {
+ "epoch": 66.8174386920981,
+ "grad_norm": 3.258586883544922,
+ "learning_rate": 5.240056312999145e-06,
+ "loss": 0.0619,
+ "step": 24522
+ },
+ {
+ "epoch": 66.82016348773843,
+ "grad_norm": 7.099562168121338,
+ "learning_rate": 5.2392802231037996e-06,
+ "loss": 0.0847,
+ "step": 24523
+ },
+ {
+ "epoch": 66.82288828337875,
+ "grad_norm": 3.2443881034851074,
+ "learning_rate": 5.238504170284785e-06,
+ "loss": 0.0578,
+ "step": 24524
+ },
+ {
+ "epoch": 66.82561307901908,
+ "grad_norm": 3.9697070121765137,
+ "learning_rate": 5.23772815454815e-06,
+ "loss": 0.0736,
+ "step": 24525
+ },
+ {
+ "epoch": 66.8283378746594,
+ "grad_norm": 3.475645065307617,
+ "learning_rate": 5.236952175899934e-06,
+ "loss": 0.1062,
+ "step": 24526
+ },
+ {
+ "epoch": 66.83106267029973,
+ "grad_norm": 2.467761993408203,
+ "learning_rate": 5.236176234346179e-06,
+ "loss": 0.0557,
+ "step": 24527
+ },
+ {
+ "epoch": 66.83378746594005,
+ "grad_norm": 3.229022264480591,
+ "learning_rate": 5.2354003298929325e-06,
+ "loss": 0.0567,
+ "step": 24528
+ },
+ {
+ "epoch": 66.83651226158038,
+ "grad_norm": 3.237917900085449,
+ "learning_rate": 5.234624462546232e-06,
+ "loss": 0.0458,
+ "step": 24529
+ },
+ {
+ "epoch": 66.83923705722071,
+ "grad_norm": 6.592916965484619,
+ "learning_rate": 5.2338486323121266e-06,
+ "loss": 0.0707,
+ "step": 24530
+ },
+ {
+ "epoch": 66.84196185286103,
+ "grad_norm": 4.381230354309082,
+ "learning_rate": 5.233072839196653e-06,
+ "loss": 0.1391,
+ "step": 24531
+ },
+ {
+ "epoch": 66.84468664850137,
+ "grad_norm": 3.1076245307922363,
+ "learning_rate": 5.2322970832058565e-06,
+ "loss": 0.1147,
+ "step": 24532
+ },
+ {
+ "epoch": 66.84741144414168,
+ "grad_norm": 4.884410858154297,
+ "learning_rate": 5.231521364345772e-06,
+ "loss": 0.0573,
+ "step": 24533
+ },
+ {
+ "epoch": 66.85013623978202,
+ "grad_norm": 2.974672317504883,
+ "learning_rate": 5.23074568262245e-06,
+ "loss": 0.0595,
+ "step": 24534
+ },
+ {
+ "epoch": 66.85286103542235,
+ "grad_norm": 4.428715705871582,
+ "learning_rate": 5.229970038041927e-06,
+ "loss": 0.0556,
+ "step": 24535
+ },
+ {
+ "epoch": 66.85558583106267,
+ "grad_norm": 3.121584892272949,
+ "learning_rate": 5.229194430610243e-06,
+ "loss": 0.0516,
+ "step": 24536
+ },
+ {
+ "epoch": 66.858310626703,
+ "grad_norm": 3.397125005722046,
+ "learning_rate": 5.228418860333437e-06,
+ "loss": 0.1241,
+ "step": 24537
+ },
+ {
+ "epoch": 66.86103542234332,
+ "grad_norm": 1.7952107191085815,
+ "learning_rate": 5.227643327217555e-06,
+ "loss": 0.028,
+ "step": 24538
+ },
+ {
+ "epoch": 66.86376021798365,
+ "grad_norm": 3.0323386192321777,
+ "learning_rate": 5.226867831268632e-06,
+ "loss": 0.0469,
+ "step": 24539
+ },
+ {
+ "epoch": 66.86648501362397,
+ "grad_norm": 2.748408317565918,
+ "learning_rate": 5.226092372492706e-06,
+ "loss": 0.195,
+ "step": 24540
+ },
+ {
+ "epoch": 66.8692098092643,
+ "grad_norm": 2.3647797107696533,
+ "learning_rate": 5.2253169508958225e-06,
+ "loss": 0.0453,
+ "step": 24541
+ },
+ {
+ "epoch": 66.87193460490464,
+ "grad_norm": 2.489013671875,
+ "learning_rate": 5.224541566484016e-06,
+ "loss": 0.1354,
+ "step": 24542
+ },
+ {
+ "epoch": 66.87465940054496,
+ "grad_norm": 3.8515937328338623,
+ "learning_rate": 5.223766219263327e-06,
+ "loss": 0.0982,
+ "step": 24543
+ },
+ {
+ "epoch": 66.87738419618529,
+ "grad_norm": 3.0182557106018066,
+ "learning_rate": 5.222990909239789e-06,
+ "loss": 0.0692,
+ "step": 24544
+ },
+ {
+ "epoch": 66.88010899182561,
+ "grad_norm": 6.353591442108154,
+ "learning_rate": 5.222215636419443e-06,
+ "loss": 0.1967,
+ "step": 24545
+ },
+ {
+ "epoch": 66.88283378746594,
+ "grad_norm": 3.788677215576172,
+ "learning_rate": 5.221440400808333e-06,
+ "loss": 0.1314,
+ "step": 24546
+ },
+ {
+ "epoch": 66.88555858310627,
+ "grad_norm": 3.978733539581299,
+ "learning_rate": 5.220665202412492e-06,
+ "loss": 0.0494,
+ "step": 24547
+ },
+ {
+ "epoch": 66.88828337874659,
+ "grad_norm": 3.4406204223632812,
+ "learning_rate": 5.219890041237955e-06,
+ "loss": 0.1857,
+ "step": 24548
+ },
+ {
+ "epoch": 66.89100817438693,
+ "grad_norm": 2.2609307765960693,
+ "learning_rate": 5.219114917290757e-06,
+ "loss": 0.0295,
+ "step": 24549
+ },
+ {
+ "epoch": 66.89373297002724,
+ "grad_norm": 3.813671112060547,
+ "learning_rate": 5.2183398305769424e-06,
+ "loss": 0.0544,
+ "step": 24550
+ },
+ {
+ "epoch": 66.89645776566758,
+ "grad_norm": 4.5922651290893555,
+ "learning_rate": 5.217564781102543e-06,
+ "loss": 0.1875,
+ "step": 24551
+ },
+ {
+ "epoch": 66.8991825613079,
+ "grad_norm": 2.906663179397583,
+ "learning_rate": 5.216789768873596e-06,
+ "loss": 0.2047,
+ "step": 24552
+ },
+ {
+ "epoch": 66.90190735694823,
+ "grad_norm": 2.953495979309082,
+ "learning_rate": 5.2160147938961315e-06,
+ "loss": 0.194,
+ "step": 24553
+ },
+ {
+ "epoch": 66.90463215258856,
+ "grad_norm": 3.020416021347046,
+ "learning_rate": 5.215239856176194e-06,
+ "loss": 0.1086,
+ "step": 24554
+ },
+ {
+ "epoch": 66.90735694822888,
+ "grad_norm": 3.5891289710998535,
+ "learning_rate": 5.214464955719814e-06,
+ "loss": 0.0599,
+ "step": 24555
+ },
+ {
+ "epoch": 66.91008174386921,
+ "grad_norm": 3.024014472961426,
+ "learning_rate": 5.213690092533028e-06,
+ "loss": 0.0953,
+ "step": 24556
+ },
+ {
+ "epoch": 66.91280653950953,
+ "grad_norm": 3.2397093772888184,
+ "learning_rate": 5.212915266621865e-06,
+ "loss": 0.0469,
+ "step": 24557
+ },
+ {
+ "epoch": 66.91553133514986,
+ "grad_norm": 3.362849712371826,
+ "learning_rate": 5.212140477992367e-06,
+ "loss": 0.0468,
+ "step": 24558
+ },
+ {
+ "epoch": 66.9182561307902,
+ "grad_norm": 3.0881080627441406,
+ "learning_rate": 5.2113657266505655e-06,
+ "loss": 0.0532,
+ "step": 24559
+ },
+ {
+ "epoch": 66.92098092643052,
+ "grad_norm": 4.1464924812316895,
+ "learning_rate": 5.210591012602495e-06,
+ "loss": 0.1187,
+ "step": 24560
+ },
+ {
+ "epoch": 66.92370572207085,
+ "grad_norm": 2.5345964431762695,
+ "learning_rate": 5.209816335854181e-06,
+ "loss": 0.0411,
+ "step": 24561
+ },
+ {
+ "epoch": 66.92643051771117,
+ "grad_norm": 3.098723888397217,
+ "learning_rate": 5.209041696411665e-06,
+ "loss": 0.0441,
+ "step": 24562
+ },
+ {
+ "epoch": 66.9291553133515,
+ "grad_norm": 2.8344247341156006,
+ "learning_rate": 5.208267094280981e-06,
+ "loss": 0.0478,
+ "step": 24563
+ },
+ {
+ "epoch": 66.93188010899182,
+ "grad_norm": 4.4746198654174805,
+ "learning_rate": 5.20749252946816e-06,
+ "loss": 0.0524,
+ "step": 24564
+ },
+ {
+ "epoch": 66.93460490463215,
+ "grad_norm": 3.8244478702545166,
+ "learning_rate": 5.206718001979228e-06,
+ "loss": 0.1104,
+ "step": 24565
+ },
+ {
+ "epoch": 66.93732970027249,
+ "grad_norm": 3.324032783508301,
+ "learning_rate": 5.2059435118202264e-06,
+ "loss": 0.0759,
+ "step": 24566
+ },
+ {
+ "epoch": 66.9400544959128,
+ "grad_norm": 3.023571729660034,
+ "learning_rate": 5.205169058997181e-06,
+ "loss": 0.0383,
+ "step": 24567
+ },
+ {
+ "epoch": 66.94277929155314,
+ "grad_norm": 4.425686359405518,
+ "learning_rate": 5.204394643516127e-06,
+ "loss": 0.2514,
+ "step": 24568
+ },
+ {
+ "epoch": 66.94550408719346,
+ "grad_norm": 3.483464479446411,
+ "learning_rate": 5.203620265383087e-06,
+ "loss": 0.0343,
+ "step": 24569
+ },
+ {
+ "epoch": 66.94822888283379,
+ "grad_norm": 2.8341145515441895,
+ "learning_rate": 5.202845924604103e-06,
+ "loss": 0.1197,
+ "step": 24570
+ },
+ {
+ "epoch": 66.95095367847412,
+ "grad_norm": 4.877206325531006,
+ "learning_rate": 5.2020716211852e-06,
+ "loss": 0.0781,
+ "step": 24571
+ },
+ {
+ "epoch": 66.95367847411444,
+ "grad_norm": 3.90977144241333,
+ "learning_rate": 5.201297355132411e-06,
+ "loss": 0.1366,
+ "step": 24572
+ },
+ {
+ "epoch": 66.95640326975477,
+ "grad_norm": 2.614654779434204,
+ "learning_rate": 5.200523126451757e-06,
+ "loss": 0.1078,
+ "step": 24573
+ },
+ {
+ "epoch": 66.95912806539509,
+ "grad_norm": 3.2511801719665527,
+ "learning_rate": 5.19974893514928e-06,
+ "loss": 0.0475,
+ "step": 24574
+ },
+ {
+ "epoch": 66.96185286103542,
+ "grad_norm": 2.8034374713897705,
+ "learning_rate": 5.198974781231003e-06,
+ "loss": 0.0693,
+ "step": 24575
+ },
+ {
+ "epoch": 66.96457765667574,
+ "grad_norm": 3.829230308532715,
+ "learning_rate": 5.1982006647029555e-06,
+ "loss": 0.1439,
+ "step": 24576
+ },
+ {
+ "epoch": 66.96730245231608,
+ "grad_norm": 4.487547397613525,
+ "learning_rate": 5.197426585571163e-06,
+ "loss": 0.0636,
+ "step": 24577
+ },
+ {
+ "epoch": 66.97002724795641,
+ "grad_norm": 2.5402772426605225,
+ "learning_rate": 5.196652543841663e-06,
+ "loss": 0.1121,
+ "step": 24578
+ },
+ {
+ "epoch": 66.97275204359673,
+ "grad_norm": 3.519968271255493,
+ "learning_rate": 5.195878539520474e-06,
+ "loss": 0.0806,
+ "step": 24579
+ },
+ {
+ "epoch": 66.97547683923706,
+ "grad_norm": 3.5499627590179443,
+ "learning_rate": 5.195104572613631e-06,
+ "loss": 0.0921,
+ "step": 24580
+ },
+ {
+ "epoch": 66.97820163487738,
+ "grad_norm": 2.5481748580932617,
+ "learning_rate": 5.194330643127155e-06,
+ "loss": 0.0316,
+ "step": 24581
+ },
+ {
+ "epoch": 66.98092643051771,
+ "grad_norm": 3.4201138019561768,
+ "learning_rate": 5.193556751067082e-06,
+ "loss": 0.0729,
+ "step": 24582
+ },
+ {
+ "epoch": 66.98365122615803,
+ "grad_norm": 3.4435765743255615,
+ "learning_rate": 5.192782896439434e-06,
+ "loss": 0.0584,
+ "step": 24583
+ },
+ {
+ "epoch": 66.98637602179836,
+ "grad_norm": 3.1900954246520996,
+ "learning_rate": 5.192009079250239e-06,
+ "loss": 0.0371,
+ "step": 24584
+ },
+ {
+ "epoch": 66.9891008174387,
+ "grad_norm": 3.2524049282073975,
+ "learning_rate": 5.191235299505517e-06,
+ "loss": 0.0588,
+ "step": 24585
+ },
+ {
+ "epoch": 66.99182561307902,
+ "grad_norm": 3.2355782985687256,
+ "learning_rate": 5.190461557211306e-06,
+ "loss": 0.0612,
+ "step": 24586
+ },
+ {
+ "epoch": 66.99455040871935,
+ "grad_norm": 2.7511208057403564,
+ "learning_rate": 5.189687852373624e-06,
+ "loss": 0.0517,
+ "step": 24587
+ },
+ {
+ "epoch": 66.99727520435967,
+ "grad_norm": 4.004414081573486,
+ "learning_rate": 5.188914184998497e-06,
+ "loss": 0.0823,
+ "step": 24588
+ },
+ {
+ "epoch": 67.0,
+ "grad_norm": 2.313328504562378,
+ "learning_rate": 5.18814055509195e-06,
+ "loss": 0.0428,
+ "step": 24589
+ },
+ {
+ "epoch": 67.00272479564033,
+ "grad_norm": 3.8177289962768555,
+ "learning_rate": 5.187366962660012e-06,
+ "loss": 0.1239,
+ "step": 24590
+ },
+ {
+ "epoch": 67.00544959128065,
+ "grad_norm": 2.535372018814087,
+ "learning_rate": 5.186593407708706e-06,
+ "loss": 0.0375,
+ "step": 24591
+ },
+ {
+ "epoch": 67.00817438692098,
+ "grad_norm": 4.38206148147583,
+ "learning_rate": 5.185819890244055e-06,
+ "loss": 0.1362,
+ "step": 24592
+ },
+ {
+ "epoch": 67.0108991825613,
+ "grad_norm": 4.015827178955078,
+ "learning_rate": 5.185046410272079e-06,
+ "loss": 0.1009,
+ "step": 24593
+ },
+ {
+ "epoch": 67.01362397820164,
+ "grad_norm": 2.929131031036377,
+ "learning_rate": 5.184272967798811e-06,
+ "loss": 0.0477,
+ "step": 24594
+ },
+ {
+ "epoch": 67.01634877384195,
+ "grad_norm": 2.9919931888580322,
+ "learning_rate": 5.183499562830272e-06,
+ "loss": 0.0428,
+ "step": 24595
+ },
+ {
+ "epoch": 67.01907356948229,
+ "grad_norm": 3.2489945888519287,
+ "learning_rate": 5.182726195372478e-06,
+ "loss": 0.1985,
+ "step": 24596
+ },
+ {
+ "epoch": 67.02179836512262,
+ "grad_norm": 4.685133934020996,
+ "learning_rate": 5.181952865431461e-06,
+ "loss": 0.1397,
+ "step": 24597
+ },
+ {
+ "epoch": 67.02452316076294,
+ "grad_norm": 4.398831367492676,
+ "learning_rate": 5.1811795730132365e-06,
+ "loss": 0.0388,
+ "step": 24598
+ },
+ {
+ "epoch": 67.02724795640327,
+ "grad_norm": 5.002074241638184,
+ "learning_rate": 5.180406318123834e-06,
+ "loss": 0.1359,
+ "step": 24599
+ },
+ {
+ "epoch": 67.02997275204359,
+ "grad_norm": 3.0800745487213135,
+ "learning_rate": 5.1796331007692725e-06,
+ "loss": 0.1064,
+ "step": 24600
+ },
+ {
+ "epoch": 67.03269754768392,
+ "grad_norm": 3.5149998664855957,
+ "learning_rate": 5.1788599209555726e-06,
+ "loss": 0.0646,
+ "step": 24601
+ },
+ {
+ "epoch": 67.03542234332426,
+ "grad_norm": 2.087890863418579,
+ "learning_rate": 5.1780867786887535e-06,
+ "loss": 0.0303,
+ "step": 24602
+ },
+ {
+ "epoch": 67.03814713896458,
+ "grad_norm": 5.657195568084717,
+ "learning_rate": 5.177313673974842e-06,
+ "loss": 0.2395,
+ "step": 24603
+ },
+ {
+ "epoch": 67.04087193460491,
+ "grad_norm": 3.764268159866333,
+ "learning_rate": 5.176540606819857e-06,
+ "loss": 0.082,
+ "step": 24604
+ },
+ {
+ "epoch": 67.04359673024523,
+ "grad_norm": 3.439305543899536,
+ "learning_rate": 5.175767577229815e-06,
+ "loss": 0.1406,
+ "step": 24605
+ },
+ {
+ "epoch": 67.04632152588556,
+ "grad_norm": 2.306802988052368,
+ "learning_rate": 5.174994585210744e-06,
+ "loss": 0.0339,
+ "step": 24606
+ },
+ {
+ "epoch": 67.04904632152588,
+ "grad_norm": 6.121353626251221,
+ "learning_rate": 5.174221630768659e-06,
+ "loss": 0.1512,
+ "step": 24607
+ },
+ {
+ "epoch": 67.05177111716621,
+ "grad_norm": 2.480057716369629,
+ "learning_rate": 5.1734487139095815e-06,
+ "loss": 0.0481,
+ "step": 24608
+ },
+ {
+ "epoch": 67.05449591280654,
+ "grad_norm": 3.2592272758483887,
+ "learning_rate": 5.172675834639524e-06,
+ "loss": 0.2128,
+ "step": 24609
+ },
+ {
+ "epoch": 67.05722070844686,
+ "grad_norm": 2.563528299331665,
+ "learning_rate": 5.171902992964518e-06,
+ "loss": 0.0392,
+ "step": 24610
+ },
+ {
+ "epoch": 67.0599455040872,
+ "grad_norm": 4.097001552581787,
+ "learning_rate": 5.1711301888905765e-06,
+ "loss": 0.1128,
+ "step": 24611
+ },
+ {
+ "epoch": 67.06267029972751,
+ "grad_norm": 6.103743553161621,
+ "learning_rate": 5.170357422423715e-06,
+ "loss": 0.1939,
+ "step": 24612
+ },
+ {
+ "epoch": 67.06539509536785,
+ "grad_norm": 3.189117908477783,
+ "learning_rate": 5.169584693569953e-06,
+ "loss": 0.2665,
+ "step": 24613
+ },
+ {
+ "epoch": 67.06811989100818,
+ "grad_norm": 5.12296724319458,
+ "learning_rate": 5.168812002335309e-06,
+ "loss": 0.1065,
+ "step": 24614
+ },
+ {
+ "epoch": 67.0708446866485,
+ "grad_norm": 2.6996898651123047,
+ "learning_rate": 5.168039348725806e-06,
+ "loss": 0.0581,
+ "step": 24615
+ },
+ {
+ "epoch": 67.07356948228883,
+ "grad_norm": 2.8209614753723145,
+ "learning_rate": 5.167266732747455e-06,
+ "loss": 0.0461,
+ "step": 24616
+ },
+ {
+ "epoch": 67.07629427792915,
+ "grad_norm": 6.042128562927246,
+ "learning_rate": 5.166494154406279e-06,
+ "loss": 0.091,
+ "step": 24617
+ },
+ {
+ "epoch": 67.07901907356948,
+ "grad_norm": 3.844276189804077,
+ "learning_rate": 5.165721613708283e-06,
+ "loss": 0.0579,
+ "step": 24618
+ },
+ {
+ "epoch": 67.0817438692098,
+ "grad_norm": 3.6185991764068604,
+ "learning_rate": 5.164949110659498e-06,
+ "loss": 0.0936,
+ "step": 24619
+ },
+ {
+ "epoch": 67.08446866485014,
+ "grad_norm": 3.4355180263519287,
+ "learning_rate": 5.164176645265932e-06,
+ "loss": 0.1002,
+ "step": 24620
+ },
+ {
+ "epoch": 67.08719346049047,
+ "grad_norm": 4.071255683898926,
+ "learning_rate": 5.163404217533604e-06,
+ "loss": 0.0682,
+ "step": 24621
+ },
+ {
+ "epoch": 67.08991825613079,
+ "grad_norm": 2.856973171234131,
+ "learning_rate": 5.162631827468525e-06,
+ "loss": 0.1088,
+ "step": 24622
+ },
+ {
+ "epoch": 67.09264305177112,
+ "grad_norm": 3.257694721221924,
+ "learning_rate": 5.161859475076716e-06,
+ "loss": 0.1017,
+ "step": 24623
+ },
+ {
+ "epoch": 67.09536784741144,
+ "grad_norm": 3.8397223949432373,
+ "learning_rate": 5.16108716036419e-06,
+ "loss": 0.0921,
+ "step": 24624
+ },
+ {
+ "epoch": 67.09809264305177,
+ "grad_norm": 3.522420644760132,
+ "learning_rate": 5.160314883336958e-06,
+ "loss": 0.1487,
+ "step": 24625
+ },
+ {
+ "epoch": 67.1008174386921,
+ "grad_norm": 3.160970687866211,
+ "learning_rate": 5.159542644001041e-06,
+ "loss": 0.1618,
+ "step": 24626
+ },
+ {
+ "epoch": 67.10354223433242,
+ "grad_norm": 2.8199210166931152,
+ "learning_rate": 5.158770442362451e-06,
+ "loss": 0.0673,
+ "step": 24627
+ },
+ {
+ "epoch": 67.10626702997276,
+ "grad_norm": 3.246110439300537,
+ "learning_rate": 5.1579982784272005e-06,
+ "loss": 0.047,
+ "step": 24628
+ },
+ {
+ "epoch": 67.10899182561307,
+ "grad_norm": 7.186903953552246,
+ "learning_rate": 5.1572261522013e-06,
+ "loss": 0.1531,
+ "step": 24629
+ },
+ {
+ "epoch": 67.11171662125341,
+ "grad_norm": 3.513388156890869,
+ "learning_rate": 5.15645406369077e-06,
+ "loss": 0.1825,
+ "step": 24630
+ },
+ {
+ "epoch": 67.11444141689373,
+ "grad_norm": 2.9456865787506104,
+ "learning_rate": 5.155682012901616e-06,
+ "loss": 0.065,
+ "step": 24631
+ },
+ {
+ "epoch": 67.11716621253406,
+ "grad_norm": 4.3389892578125,
+ "learning_rate": 5.1549099998398585e-06,
+ "loss": 0.0904,
+ "step": 24632
+ },
+ {
+ "epoch": 67.11989100817439,
+ "grad_norm": 4.458559036254883,
+ "learning_rate": 5.154138024511506e-06,
+ "loss": 0.0767,
+ "step": 24633
+ },
+ {
+ "epoch": 67.12261580381471,
+ "grad_norm": 2.301032781600952,
+ "learning_rate": 5.153366086922567e-06,
+ "loss": 0.0394,
+ "step": 24634
+ },
+ {
+ "epoch": 67.12534059945504,
+ "grad_norm": 3.2916994094848633,
+ "learning_rate": 5.152594187079061e-06,
+ "loss": 0.0484,
+ "step": 24635
+ },
+ {
+ "epoch": 67.12806539509536,
+ "grad_norm": 2.459163188934326,
+ "learning_rate": 5.151822324986995e-06,
+ "loss": 0.0345,
+ "step": 24636
+ },
+ {
+ "epoch": 67.1307901907357,
+ "grad_norm": 2.8928542137145996,
+ "learning_rate": 5.151050500652379e-06,
+ "loss": 0.0373,
+ "step": 24637
+ },
+ {
+ "epoch": 67.13351498637603,
+ "grad_norm": 3.3529112339019775,
+ "learning_rate": 5.150278714081224e-06,
+ "loss": 0.0641,
+ "step": 24638
+ },
+ {
+ "epoch": 67.13623978201635,
+ "grad_norm": 3.647813558578491,
+ "learning_rate": 5.149506965279545e-06,
+ "loss": 0.0754,
+ "step": 24639
+ },
+ {
+ "epoch": 67.13896457765668,
+ "grad_norm": 2.7385573387145996,
+ "learning_rate": 5.148735254253351e-06,
+ "loss": 0.109,
+ "step": 24640
+ },
+ {
+ "epoch": 67.141689373297,
+ "grad_norm": 7.747296333312988,
+ "learning_rate": 5.14796358100865e-06,
+ "loss": 0.0454,
+ "step": 24641
+ },
+ {
+ "epoch": 67.14441416893733,
+ "grad_norm": 2.8267595767974854,
+ "learning_rate": 5.1471919455514484e-06,
+ "loss": 0.0412,
+ "step": 24642
+ },
+ {
+ "epoch": 67.14713896457765,
+ "grad_norm": 2.8402023315429688,
+ "learning_rate": 5.146420347887764e-06,
+ "loss": 0.0709,
+ "step": 24643
+ },
+ {
+ "epoch": 67.14986376021798,
+ "grad_norm": 3.3954174518585205,
+ "learning_rate": 5.145648788023601e-06,
+ "loss": 0.1491,
+ "step": 24644
+ },
+ {
+ "epoch": 67.15258855585832,
+ "grad_norm": 3.405459403991699,
+ "learning_rate": 5.144877265964969e-06,
+ "loss": 0.0631,
+ "step": 24645
+ },
+ {
+ "epoch": 67.15531335149863,
+ "grad_norm": 4.721367835998535,
+ "learning_rate": 5.144105781717874e-06,
+ "loss": 0.1033,
+ "step": 24646
+ },
+ {
+ "epoch": 67.15803814713897,
+ "grad_norm": 3.2868051528930664,
+ "learning_rate": 5.14333433528833e-06,
+ "loss": 0.1403,
+ "step": 24647
+ },
+ {
+ "epoch": 67.16076294277929,
+ "grad_norm": 3.087031364440918,
+ "learning_rate": 5.142562926682338e-06,
+ "loss": 0.1066,
+ "step": 24648
+ },
+ {
+ "epoch": 67.16348773841962,
+ "grad_norm": 2.8686745166778564,
+ "learning_rate": 5.141791555905913e-06,
+ "loss": 0.0997,
+ "step": 24649
+ },
+ {
+ "epoch": 67.16621253405995,
+ "grad_norm": 3.295128583908081,
+ "learning_rate": 5.141020222965056e-06,
+ "loss": 0.1319,
+ "step": 24650
+ },
+ {
+ "epoch": 67.16893732970027,
+ "grad_norm": 2.890428304672241,
+ "learning_rate": 5.140248927865781e-06,
+ "loss": 0.045,
+ "step": 24651
+ },
+ {
+ "epoch": 67.1716621253406,
+ "grad_norm": 4.1570963859558105,
+ "learning_rate": 5.139477670614091e-06,
+ "loss": 0.0606,
+ "step": 24652
+ },
+ {
+ "epoch": 67.17438692098092,
+ "grad_norm": 3.9590163230895996,
+ "learning_rate": 5.138706451215991e-06,
+ "loss": 0.1766,
+ "step": 24653
+ },
+ {
+ "epoch": 67.17711171662125,
+ "grad_norm": 3.9261727333068848,
+ "learning_rate": 5.137935269677485e-06,
+ "loss": 0.0771,
+ "step": 24654
+ },
+ {
+ "epoch": 67.17983651226157,
+ "grad_norm": 2.083590030670166,
+ "learning_rate": 5.137164126004588e-06,
+ "loss": 0.0306,
+ "step": 24655
+ },
+ {
+ "epoch": 67.1825613079019,
+ "grad_norm": 3.423569440841675,
+ "learning_rate": 5.136393020203298e-06,
+ "loss": 0.1249,
+ "step": 24656
+ },
+ {
+ "epoch": 67.18528610354224,
+ "grad_norm": 2.2648110389709473,
+ "learning_rate": 5.1356219522796255e-06,
+ "loss": 0.0422,
+ "step": 24657
+ },
+ {
+ "epoch": 67.18801089918256,
+ "grad_norm": 4.222996711730957,
+ "learning_rate": 5.134850922239567e-06,
+ "loss": 0.0985,
+ "step": 24658
+ },
+ {
+ "epoch": 67.19073569482289,
+ "grad_norm": 4.955621242523193,
+ "learning_rate": 5.134079930089138e-06,
+ "loss": 0.0536,
+ "step": 24659
+ },
+ {
+ "epoch": 67.19346049046321,
+ "grad_norm": 3.551360607147217,
+ "learning_rate": 5.1333089758343364e-06,
+ "loss": 0.0671,
+ "step": 24660
+ },
+ {
+ "epoch": 67.19618528610354,
+ "grad_norm": 3.71524977684021,
+ "learning_rate": 5.1325380594811694e-06,
+ "loss": 0.1959,
+ "step": 24661
+ },
+ {
+ "epoch": 67.19891008174388,
+ "grad_norm": 3.1517035961151123,
+ "learning_rate": 5.131767181035634e-06,
+ "loss": 0.1292,
+ "step": 24662
+ },
+ {
+ "epoch": 67.2016348773842,
+ "grad_norm": 3.6539742946624756,
+ "learning_rate": 5.130996340503744e-06,
+ "loss": 0.039,
+ "step": 24663
+ },
+ {
+ "epoch": 67.20435967302453,
+ "grad_norm": 3.0689525604248047,
+ "learning_rate": 5.130225537891498e-06,
+ "loss": 0.0363,
+ "step": 24664
+ },
+ {
+ "epoch": 67.20708446866485,
+ "grad_norm": 2.8991730213165283,
+ "learning_rate": 5.129454773204894e-06,
+ "loss": 0.1223,
+ "step": 24665
+ },
+ {
+ "epoch": 67.20980926430518,
+ "grad_norm": 3.562687635421753,
+ "learning_rate": 5.1286840464499435e-06,
+ "loss": 0.1406,
+ "step": 24666
+ },
+ {
+ "epoch": 67.2125340599455,
+ "grad_norm": 3.347503423690796,
+ "learning_rate": 5.127913357632641e-06,
+ "loss": 0.0408,
+ "step": 24667
+ },
+ {
+ "epoch": 67.21525885558583,
+ "grad_norm": 3.359271287918091,
+ "learning_rate": 5.127142706758996e-06,
+ "loss": 0.0752,
+ "step": 24668
+ },
+ {
+ "epoch": 67.21798365122616,
+ "grad_norm": 6.227237224578857,
+ "learning_rate": 5.1263720938350085e-06,
+ "loss": 0.0484,
+ "step": 24669
+ },
+ {
+ "epoch": 67.22070844686648,
+ "grad_norm": 2.8463234901428223,
+ "learning_rate": 5.125601518866672e-06,
+ "loss": 0.0459,
+ "step": 24670
+ },
+ {
+ "epoch": 67.22343324250681,
+ "grad_norm": 5.320071220397949,
+ "learning_rate": 5.12483098186e-06,
+ "loss": 0.1143,
+ "step": 24671
+ },
+ {
+ "epoch": 67.22615803814713,
+ "grad_norm": 3.1932263374328613,
+ "learning_rate": 5.124060482820986e-06,
+ "loss": 0.199,
+ "step": 24672
+ },
+ {
+ "epoch": 67.22888283378747,
+ "grad_norm": 15.600347518920898,
+ "learning_rate": 5.123290021755634e-06,
+ "loss": 0.1381,
+ "step": 24673
+ },
+ {
+ "epoch": 67.2316076294278,
+ "grad_norm": 3.40120267868042,
+ "learning_rate": 5.122519598669935e-06,
+ "loss": 0.1106,
+ "step": 24674
+ },
+ {
+ "epoch": 67.23433242506812,
+ "grad_norm": 3.6226260662078857,
+ "learning_rate": 5.121749213569903e-06,
+ "loss": 0.1756,
+ "step": 24675
+ },
+ {
+ "epoch": 67.23705722070845,
+ "grad_norm": 2.6622533798217773,
+ "learning_rate": 5.1209788664615304e-06,
+ "loss": 0.043,
+ "step": 24676
+ },
+ {
+ "epoch": 67.23978201634877,
+ "grad_norm": 2.5700666904449463,
+ "learning_rate": 5.1202085573508175e-06,
+ "loss": 0.0453,
+ "step": 24677
+ },
+ {
+ "epoch": 67.2425068119891,
+ "grad_norm": 2.4242546558380127,
+ "learning_rate": 5.119438286243759e-06,
+ "loss": 0.0648,
+ "step": 24678
+ },
+ {
+ "epoch": 67.24523160762942,
+ "grad_norm": 3.5825319290161133,
+ "learning_rate": 5.118668053146363e-06,
+ "loss": 0.0793,
+ "step": 24679
+ },
+ {
+ "epoch": 67.24795640326975,
+ "grad_norm": 3.02204966545105,
+ "learning_rate": 5.117897858064622e-06,
+ "loss": 0.0814,
+ "step": 24680
+ },
+ {
+ "epoch": 67.25068119891009,
+ "grad_norm": 4.157834529876709,
+ "learning_rate": 5.117127701004535e-06,
+ "loss": 0.187,
+ "step": 24681
+ },
+ {
+ "epoch": 67.2534059945504,
+ "grad_norm": 5.315064907073975,
+ "learning_rate": 5.116357581972098e-06,
+ "loss": 0.1216,
+ "step": 24682
+ },
+ {
+ "epoch": 67.25613079019074,
+ "grad_norm": 5.192597389221191,
+ "learning_rate": 5.115587500973309e-06,
+ "loss": 0.116,
+ "step": 24683
+ },
+ {
+ "epoch": 67.25885558583106,
+ "grad_norm": 3.724283456802368,
+ "learning_rate": 5.114817458014172e-06,
+ "loss": 0.0807,
+ "step": 24684
+ },
+ {
+ "epoch": 67.26158038147139,
+ "grad_norm": 3.5205814838409424,
+ "learning_rate": 5.11404745310068e-06,
+ "loss": 0.0721,
+ "step": 24685
+ },
+ {
+ "epoch": 67.26430517711172,
+ "grad_norm": 5.1249680519104,
+ "learning_rate": 5.113277486238829e-06,
+ "loss": 0.1646,
+ "step": 24686
+ },
+ {
+ "epoch": 67.26702997275204,
+ "grad_norm": 3.207024335861206,
+ "learning_rate": 5.112507557434612e-06,
+ "loss": 0.1413,
+ "step": 24687
+ },
+ {
+ "epoch": 67.26975476839237,
+ "grad_norm": 4.9466376304626465,
+ "learning_rate": 5.111737666694032e-06,
+ "loss": 0.1088,
+ "step": 24688
+ },
+ {
+ "epoch": 67.2724795640327,
+ "grad_norm": 2.8702213764190674,
+ "learning_rate": 5.110967814023083e-06,
+ "loss": 0.0437,
+ "step": 24689
+ },
+ {
+ "epoch": 67.27520435967303,
+ "grad_norm": 3.057664394378662,
+ "learning_rate": 5.110197999427753e-06,
+ "loss": 0.0659,
+ "step": 24690
+ },
+ {
+ "epoch": 67.27792915531334,
+ "grad_norm": 2.8249452114105225,
+ "learning_rate": 5.10942822291405e-06,
+ "loss": 0.061,
+ "step": 24691
+ },
+ {
+ "epoch": 67.28065395095368,
+ "grad_norm": 3.631533622741699,
+ "learning_rate": 5.108658484487961e-06,
+ "loss": 0.1307,
+ "step": 24692
+ },
+ {
+ "epoch": 67.28337874659401,
+ "grad_norm": 3.4069125652313232,
+ "learning_rate": 5.107888784155484e-06,
+ "loss": 0.0955,
+ "step": 24693
+ },
+ {
+ "epoch": 67.28610354223433,
+ "grad_norm": 2.5948667526245117,
+ "learning_rate": 5.107119121922606e-06,
+ "loss": 0.1235,
+ "step": 24694
+ },
+ {
+ "epoch": 67.28882833787466,
+ "grad_norm": 3.14793062210083,
+ "learning_rate": 5.106349497795331e-06,
+ "loss": 0.0542,
+ "step": 24695
+ },
+ {
+ "epoch": 67.29155313351498,
+ "grad_norm": 4.083686828613281,
+ "learning_rate": 5.105579911779649e-06,
+ "loss": 0.0805,
+ "step": 24696
+ },
+ {
+ "epoch": 67.29427792915531,
+ "grad_norm": 3.630496025085449,
+ "learning_rate": 5.104810363881554e-06,
+ "loss": 0.1727,
+ "step": 24697
+ },
+ {
+ "epoch": 67.29700272479565,
+ "grad_norm": 3.330587387084961,
+ "learning_rate": 5.104040854107033e-06,
+ "loss": 0.0753,
+ "step": 24698
+ },
+ {
+ "epoch": 67.29972752043597,
+ "grad_norm": 3.055983543395996,
+ "learning_rate": 5.103271382462085e-06,
+ "loss": 0.1081,
+ "step": 24699
+ },
+ {
+ "epoch": 67.3024523160763,
+ "grad_norm": 3.5617239475250244,
+ "learning_rate": 5.102501948952705e-06,
+ "loss": 0.062,
+ "step": 24700
+ },
+ {
+ "epoch": 67.30517711171662,
+ "grad_norm": 2.897954225540161,
+ "learning_rate": 5.101732553584883e-06,
+ "loss": 0.0431,
+ "step": 24701
+ },
+ {
+ "epoch": 67.30790190735695,
+ "grad_norm": 4.210009574890137,
+ "learning_rate": 5.10096319636461e-06,
+ "loss": 0.1356,
+ "step": 24702
+ },
+ {
+ "epoch": 67.31062670299727,
+ "grad_norm": 2.9569778442382812,
+ "learning_rate": 5.100193877297874e-06,
+ "loss": 0.0798,
+ "step": 24703
+ },
+ {
+ "epoch": 67.3133514986376,
+ "grad_norm": 2.7195286750793457,
+ "learning_rate": 5.099424596390674e-06,
+ "loss": 0.0687,
+ "step": 24704
+ },
+ {
+ "epoch": 67.31607629427793,
+ "grad_norm": 3.508420944213867,
+ "learning_rate": 5.098655353648998e-06,
+ "loss": 0.1061,
+ "step": 24705
+ },
+ {
+ "epoch": 67.31880108991825,
+ "grad_norm": 4.016233444213867,
+ "learning_rate": 5.097886149078836e-06,
+ "loss": 0.1569,
+ "step": 24706
+ },
+ {
+ "epoch": 67.32152588555859,
+ "grad_norm": 3.3125321865081787,
+ "learning_rate": 5.097116982686175e-06,
+ "loss": 0.071,
+ "step": 24707
+ },
+ {
+ "epoch": 67.3242506811989,
+ "grad_norm": 2.6926913261413574,
+ "learning_rate": 5.0963478544770125e-06,
+ "loss": 0.0903,
+ "step": 24708
+ },
+ {
+ "epoch": 67.32697547683924,
+ "grad_norm": 3.0416789054870605,
+ "learning_rate": 5.095578764457336e-06,
+ "loss": 0.074,
+ "step": 24709
+ },
+ {
+ "epoch": 67.32970027247957,
+ "grad_norm": 3.1462037563323975,
+ "learning_rate": 5.0948097126331355e-06,
+ "loss": 0.0857,
+ "step": 24710
+ },
+ {
+ "epoch": 67.33242506811989,
+ "grad_norm": 2.979736804962158,
+ "learning_rate": 5.094040699010393e-06,
+ "loss": 0.0531,
+ "step": 24711
+ },
+ {
+ "epoch": 67.33514986376022,
+ "grad_norm": 4.241286277770996,
+ "learning_rate": 5.093271723595108e-06,
+ "loss": 0.1427,
+ "step": 24712
+ },
+ {
+ "epoch": 67.33787465940054,
+ "grad_norm": 3.185534715652466,
+ "learning_rate": 5.092502786393265e-06,
+ "loss": 0.1253,
+ "step": 24713
+ },
+ {
+ "epoch": 67.34059945504087,
+ "grad_norm": 3.9344115257263184,
+ "learning_rate": 5.091733887410849e-06,
+ "loss": 0.0438,
+ "step": 24714
+ },
+ {
+ "epoch": 67.34332425068119,
+ "grad_norm": 2.4539952278137207,
+ "learning_rate": 5.090965026653856e-06,
+ "loss": 0.0662,
+ "step": 24715
+ },
+ {
+ "epoch": 67.34604904632153,
+ "grad_norm": 4.353048801422119,
+ "learning_rate": 5.090196204128268e-06,
+ "loss": 0.1334,
+ "step": 24716
+ },
+ {
+ "epoch": 67.34877384196186,
+ "grad_norm": 2.635066509246826,
+ "learning_rate": 5.08942741984007e-06,
+ "loss": 0.0972,
+ "step": 24717
+ },
+ {
+ "epoch": 67.35149863760218,
+ "grad_norm": 3.0731635093688965,
+ "learning_rate": 5.088658673795257e-06,
+ "loss": 0.0495,
+ "step": 24718
+ },
+ {
+ "epoch": 67.35422343324251,
+ "grad_norm": 3.688865900039673,
+ "learning_rate": 5.08788996599981e-06,
+ "loss": 0.0424,
+ "step": 24719
+ },
+ {
+ "epoch": 67.35694822888283,
+ "grad_norm": 4.1209917068481445,
+ "learning_rate": 5.0871212964597205e-06,
+ "loss": 0.1023,
+ "step": 24720
+ },
+ {
+ "epoch": 67.35967302452316,
+ "grad_norm": 2.7736964225769043,
+ "learning_rate": 5.086352665180971e-06,
+ "loss": 0.0804,
+ "step": 24721
+ },
+ {
+ "epoch": 67.3623978201635,
+ "grad_norm": 3.80026912689209,
+ "learning_rate": 5.085584072169551e-06,
+ "loss": 0.066,
+ "step": 24722
+ },
+ {
+ "epoch": 67.36512261580381,
+ "grad_norm": 2.247812032699585,
+ "learning_rate": 5.08481551743144e-06,
+ "loss": 0.0544,
+ "step": 24723
+ },
+ {
+ "epoch": 67.36784741144415,
+ "grad_norm": 6.78448486328125,
+ "learning_rate": 5.0840470009726295e-06,
+ "loss": 0.0496,
+ "step": 24724
+ },
+ {
+ "epoch": 67.37057220708446,
+ "grad_norm": 4.081532955169678,
+ "learning_rate": 5.083278522799104e-06,
+ "loss": 0.0775,
+ "step": 24725
+ },
+ {
+ "epoch": 67.3732970027248,
+ "grad_norm": 3.0944600105285645,
+ "learning_rate": 5.082510082916847e-06,
+ "loss": 0.1056,
+ "step": 24726
+ },
+ {
+ "epoch": 67.37602179836512,
+ "grad_norm": 3.0897984504699707,
+ "learning_rate": 5.08174168133184e-06,
+ "loss": 0.0694,
+ "step": 24727
+ },
+ {
+ "epoch": 67.37874659400545,
+ "grad_norm": 2.751068115234375,
+ "learning_rate": 5.080973318050073e-06,
+ "loss": 0.051,
+ "step": 24728
+ },
+ {
+ "epoch": 67.38147138964578,
+ "grad_norm": 2.8970413208007812,
+ "learning_rate": 5.080204993077529e-06,
+ "loss": 0.0439,
+ "step": 24729
+ },
+ {
+ "epoch": 67.3841961852861,
+ "grad_norm": 3.559302806854248,
+ "learning_rate": 5.0794367064201885e-06,
+ "loss": 0.1568,
+ "step": 24730
+ },
+ {
+ "epoch": 67.38692098092643,
+ "grad_norm": 15.17588996887207,
+ "learning_rate": 5.078668458084035e-06,
+ "loss": 0.2251,
+ "step": 24731
+ },
+ {
+ "epoch": 67.38964577656675,
+ "grad_norm": 2.577274799346924,
+ "learning_rate": 5.077900248075055e-06,
+ "loss": 0.121,
+ "step": 24732
+ },
+ {
+ "epoch": 67.39237057220708,
+ "grad_norm": 5.998250961303711,
+ "learning_rate": 5.07713207639923e-06,
+ "loss": 0.1262,
+ "step": 24733
+ },
+ {
+ "epoch": 67.39509536784742,
+ "grad_norm": 3.9774091243743896,
+ "learning_rate": 5.0763639430625385e-06,
+ "loss": 0.0612,
+ "step": 24734
+ },
+ {
+ "epoch": 67.39782016348774,
+ "grad_norm": 3.52544903755188,
+ "learning_rate": 5.0755958480709665e-06,
+ "loss": 0.0651,
+ "step": 24735
+ },
+ {
+ "epoch": 67.40054495912807,
+ "grad_norm": 3.4941420555114746,
+ "learning_rate": 5.074827791430499e-06,
+ "loss": 0.0568,
+ "step": 24736
+ },
+ {
+ "epoch": 67.40326975476839,
+ "grad_norm": 2.9969611167907715,
+ "learning_rate": 5.0740597731471134e-06,
+ "loss": 0.1178,
+ "step": 24737
+ },
+ {
+ "epoch": 67.40599455040872,
+ "grad_norm": 2.392972946166992,
+ "learning_rate": 5.073291793226791e-06,
+ "loss": 0.0384,
+ "step": 24738
+ },
+ {
+ "epoch": 67.40871934604904,
+ "grad_norm": 3.2726314067840576,
+ "learning_rate": 5.072523851675512e-06,
+ "loss": 0.0531,
+ "step": 24739
+ },
+ {
+ "epoch": 67.41144414168937,
+ "grad_norm": 4.787219047546387,
+ "learning_rate": 5.071755948499262e-06,
+ "loss": 0.0365,
+ "step": 24740
+ },
+ {
+ "epoch": 67.4141689373297,
+ "grad_norm": 7.6623663902282715,
+ "learning_rate": 5.070988083704016e-06,
+ "loss": 0.167,
+ "step": 24741
+ },
+ {
+ "epoch": 67.41689373297002,
+ "grad_norm": 3.5750341415405273,
+ "learning_rate": 5.070220257295758e-06,
+ "loss": 0.1,
+ "step": 24742
+ },
+ {
+ "epoch": 67.41961852861036,
+ "grad_norm": 3.042717933654785,
+ "learning_rate": 5.0694524692804625e-06,
+ "loss": 0.0564,
+ "step": 24743
+ },
+ {
+ "epoch": 67.42234332425068,
+ "grad_norm": 3.4299728870391846,
+ "learning_rate": 5.068684719664116e-06,
+ "loss": 0.1737,
+ "step": 24744
+ },
+ {
+ "epoch": 67.42506811989101,
+ "grad_norm": 3.153731107711792,
+ "learning_rate": 5.067917008452693e-06,
+ "loss": 0.0827,
+ "step": 24745
+ },
+ {
+ "epoch": 67.42779291553134,
+ "grad_norm": 3.2509191036224365,
+ "learning_rate": 5.067149335652175e-06,
+ "loss": 0.1035,
+ "step": 24746
+ },
+ {
+ "epoch": 67.43051771117166,
+ "grad_norm": 3.6034340858459473,
+ "learning_rate": 5.066381701268535e-06,
+ "loss": 0.114,
+ "step": 24747
+ },
+ {
+ "epoch": 67.433242506812,
+ "grad_norm": 10.852611541748047,
+ "learning_rate": 5.065614105307759e-06,
+ "loss": 0.0402,
+ "step": 24748
+ },
+ {
+ "epoch": 67.43596730245231,
+ "grad_norm": 4.52252197265625,
+ "learning_rate": 5.064846547775821e-06,
+ "loss": 0.1277,
+ "step": 24749
+ },
+ {
+ "epoch": 67.43869209809264,
+ "grad_norm": 4.758501052856445,
+ "learning_rate": 5.0640790286787e-06,
+ "loss": 0.2125,
+ "step": 24750
+ },
+ {
+ "epoch": 67.44141689373296,
+ "grad_norm": 3.4215078353881836,
+ "learning_rate": 5.0633115480223695e-06,
+ "loss": 0.0479,
+ "step": 24751
+ },
+ {
+ "epoch": 67.4441416893733,
+ "grad_norm": 3.988860845565796,
+ "learning_rate": 5.062544105812807e-06,
+ "loss": 0.1015,
+ "step": 24752
+ },
+ {
+ "epoch": 67.44686648501363,
+ "grad_norm": 3.772794008255005,
+ "learning_rate": 5.061776702055998e-06,
+ "loss": 0.0599,
+ "step": 24753
+ },
+ {
+ "epoch": 67.44959128065395,
+ "grad_norm": 4.0554280281066895,
+ "learning_rate": 5.0610093367579135e-06,
+ "loss": 0.1243,
+ "step": 24754
+ },
+ {
+ "epoch": 67.45231607629428,
+ "grad_norm": 2.8715896606445312,
+ "learning_rate": 5.060242009924525e-06,
+ "loss": 0.0636,
+ "step": 24755
+ },
+ {
+ "epoch": 67.4550408719346,
+ "grad_norm": 3.2675414085388184,
+ "learning_rate": 5.059474721561817e-06,
+ "loss": 0.0614,
+ "step": 24756
+ },
+ {
+ "epoch": 67.45776566757493,
+ "grad_norm": 2.7207672595977783,
+ "learning_rate": 5.058707471675761e-06,
+ "loss": 0.0383,
+ "step": 24757
+ },
+ {
+ "epoch": 67.46049046321527,
+ "grad_norm": 3.1995835304260254,
+ "learning_rate": 5.0579402602723315e-06,
+ "loss": 0.0915,
+ "step": 24758
+ },
+ {
+ "epoch": 67.46321525885558,
+ "grad_norm": 3.2084741592407227,
+ "learning_rate": 5.057173087357501e-06,
+ "loss": 0.0684,
+ "step": 24759
+ },
+ {
+ "epoch": 67.46594005449592,
+ "grad_norm": 3.7472259998321533,
+ "learning_rate": 5.05640595293725e-06,
+ "loss": 0.1285,
+ "step": 24760
+ },
+ {
+ "epoch": 67.46866485013624,
+ "grad_norm": 3.2161805629730225,
+ "learning_rate": 5.055638857017551e-06,
+ "loss": 0.0553,
+ "step": 24761
+ },
+ {
+ "epoch": 67.47138964577657,
+ "grad_norm": 3.6380856037139893,
+ "learning_rate": 5.054871799604377e-06,
+ "loss": 0.1469,
+ "step": 24762
+ },
+ {
+ "epoch": 67.47411444141689,
+ "grad_norm": 3.3077454566955566,
+ "learning_rate": 5.054104780703699e-06,
+ "loss": 0.0768,
+ "step": 24763
+ },
+ {
+ "epoch": 67.47683923705722,
+ "grad_norm": 3.4313948154449463,
+ "learning_rate": 5.053337800321498e-06,
+ "loss": 0.1028,
+ "step": 24764
+ },
+ {
+ "epoch": 67.47956403269755,
+ "grad_norm": 2.646376132965088,
+ "learning_rate": 5.052570858463743e-06,
+ "loss": 0.0306,
+ "step": 24765
+ },
+ {
+ "epoch": 67.48228882833787,
+ "grad_norm": 3.7639083862304688,
+ "learning_rate": 5.051803955136406e-06,
+ "loss": 0.0776,
+ "step": 24766
+ },
+ {
+ "epoch": 67.4850136239782,
+ "grad_norm": 2.773786783218384,
+ "learning_rate": 5.051037090345457e-06,
+ "loss": 0.0363,
+ "step": 24767
+ },
+ {
+ "epoch": 67.48773841961852,
+ "grad_norm": 2.877821683883667,
+ "learning_rate": 5.050270264096873e-06,
+ "loss": 0.0494,
+ "step": 24768
+ },
+ {
+ "epoch": 67.49046321525886,
+ "grad_norm": 3.5250706672668457,
+ "learning_rate": 5.049503476396627e-06,
+ "loss": 0.0428,
+ "step": 24769
+ },
+ {
+ "epoch": 67.49318801089919,
+ "grad_norm": 3.0568342208862305,
+ "learning_rate": 5.048736727250689e-06,
+ "loss": 0.1221,
+ "step": 24770
+ },
+ {
+ "epoch": 67.49591280653951,
+ "grad_norm": 3.014346122741699,
+ "learning_rate": 5.047970016665031e-06,
+ "loss": 0.0739,
+ "step": 24771
+ },
+ {
+ "epoch": 67.49863760217984,
+ "grad_norm": 3.089616537094116,
+ "learning_rate": 5.0472033446456195e-06,
+ "loss": 0.1213,
+ "step": 24772
+ },
+ {
+ "epoch": 67.50136239782016,
+ "grad_norm": 3.176083564758301,
+ "learning_rate": 5.046436711198431e-06,
+ "loss": 0.0425,
+ "step": 24773
+ },
+ {
+ "epoch": 67.50408719346049,
+ "grad_norm": 3.830902576446533,
+ "learning_rate": 5.045670116329435e-06,
+ "loss": 0.0919,
+ "step": 24774
+ },
+ {
+ "epoch": 67.50681198910081,
+ "grad_norm": 3.097994565963745,
+ "learning_rate": 5.0449035600446005e-06,
+ "loss": 0.0678,
+ "step": 24775
+ },
+ {
+ "epoch": 67.50953678474114,
+ "grad_norm": 5.094249725341797,
+ "learning_rate": 5.044137042349895e-06,
+ "loss": 0.099,
+ "step": 24776
+ },
+ {
+ "epoch": 67.51226158038148,
+ "grad_norm": 3.530489921569824,
+ "learning_rate": 5.043370563251293e-06,
+ "loss": 0.207,
+ "step": 24777
+ },
+ {
+ "epoch": 67.5149863760218,
+ "grad_norm": 3.2964890003204346,
+ "learning_rate": 5.0426041227547616e-06,
+ "loss": 0.2278,
+ "step": 24778
+ },
+ {
+ "epoch": 67.51771117166213,
+ "grad_norm": 2.7340049743652344,
+ "learning_rate": 5.041837720866266e-06,
+ "loss": 0.0463,
+ "step": 24779
+ },
+ {
+ "epoch": 67.52043596730245,
+ "grad_norm": 3.1398894786834717,
+ "learning_rate": 5.041071357591782e-06,
+ "loss": 0.0496,
+ "step": 24780
+ },
+ {
+ "epoch": 67.52316076294278,
+ "grad_norm": 2.630547285079956,
+ "learning_rate": 5.040305032937276e-06,
+ "loss": 0.1534,
+ "step": 24781
+ },
+ {
+ "epoch": 67.52588555858311,
+ "grad_norm": 2.391430377960205,
+ "learning_rate": 5.039538746908714e-06,
+ "loss": 0.0404,
+ "step": 24782
+ },
+ {
+ "epoch": 67.52861035422343,
+ "grad_norm": 3.8539505004882812,
+ "learning_rate": 5.038772499512061e-06,
+ "loss": 0.2649,
+ "step": 24783
+ },
+ {
+ "epoch": 67.53133514986376,
+ "grad_norm": 3.411309003829956,
+ "learning_rate": 5.038006290753292e-06,
+ "loss": 0.0927,
+ "step": 24784
+ },
+ {
+ "epoch": 67.53405994550408,
+ "grad_norm": 3.26887845993042,
+ "learning_rate": 5.037240120638367e-06,
+ "loss": 0.1387,
+ "step": 24785
+ },
+ {
+ "epoch": 67.53678474114442,
+ "grad_norm": 3.015413999557495,
+ "learning_rate": 5.0364739891732584e-06,
+ "loss": 0.1044,
+ "step": 24786
+ },
+ {
+ "epoch": 67.53950953678473,
+ "grad_norm": 2.9222254753112793,
+ "learning_rate": 5.0357078963639325e-06,
+ "loss": 0.1054,
+ "step": 24787
+ },
+ {
+ "epoch": 67.54223433242507,
+ "grad_norm": 5.172916412353516,
+ "learning_rate": 5.034941842216349e-06,
+ "loss": 0.1323,
+ "step": 24788
+ },
+ {
+ "epoch": 67.5449591280654,
+ "grad_norm": 4.501311302185059,
+ "learning_rate": 5.034175826736483e-06,
+ "loss": 0.139,
+ "step": 24789
+ },
+ {
+ "epoch": 67.54768392370572,
+ "grad_norm": 4.1948418617248535,
+ "learning_rate": 5.033409849930295e-06,
+ "loss": 0.0798,
+ "step": 24790
+ },
+ {
+ "epoch": 67.55040871934605,
+ "grad_norm": 2.8324954509735107,
+ "learning_rate": 5.032643911803752e-06,
+ "loss": 0.1167,
+ "step": 24791
+ },
+ {
+ "epoch": 67.55313351498637,
+ "grad_norm": 8.362939834594727,
+ "learning_rate": 5.031878012362813e-06,
+ "loss": 0.087,
+ "step": 24792
+ },
+ {
+ "epoch": 67.5558583106267,
+ "grad_norm": 2.408095598220825,
+ "learning_rate": 5.031112151613453e-06,
+ "loss": 0.0604,
+ "step": 24793
+ },
+ {
+ "epoch": 67.55858310626704,
+ "grad_norm": 3.738321304321289,
+ "learning_rate": 5.030346329561632e-06,
+ "loss": 0.0899,
+ "step": 24794
+ },
+ {
+ "epoch": 67.56130790190736,
+ "grad_norm": 2.8952131271362305,
+ "learning_rate": 5.029580546213313e-06,
+ "loss": 0.0963,
+ "step": 24795
+ },
+ {
+ "epoch": 67.56403269754769,
+ "grad_norm": 3.862053632736206,
+ "learning_rate": 5.0288148015744576e-06,
+ "loss": 0.0682,
+ "step": 24796
+ },
+ {
+ "epoch": 67.566757493188,
+ "grad_norm": 3.8780133724212646,
+ "learning_rate": 5.028049095651036e-06,
+ "loss": 0.0962,
+ "step": 24797
+ },
+ {
+ "epoch": 67.56948228882834,
+ "grad_norm": 2.654364824295044,
+ "learning_rate": 5.027283428449008e-06,
+ "loss": 0.0397,
+ "step": 24798
+ },
+ {
+ "epoch": 67.57220708446866,
+ "grad_norm": 2.4831955432891846,
+ "learning_rate": 5.0265177999743335e-06,
+ "loss": 0.0322,
+ "step": 24799
+ },
+ {
+ "epoch": 67.57493188010899,
+ "grad_norm": 3.551032304763794,
+ "learning_rate": 5.025752210232982e-06,
+ "loss": 0.1826,
+ "step": 24800
+ },
+ {
+ "epoch": 67.57765667574932,
+ "grad_norm": 3.573977470397949,
+ "learning_rate": 5.0249866592309115e-06,
+ "loss": 0.0409,
+ "step": 24801
+ },
+ {
+ "epoch": 67.58038147138964,
+ "grad_norm": 2.2330880165100098,
+ "learning_rate": 5.024221146974084e-06,
+ "loss": 0.0276,
+ "step": 24802
+ },
+ {
+ "epoch": 67.58310626702998,
+ "grad_norm": 3.4516408443450928,
+ "learning_rate": 5.02345567346846e-06,
+ "loss": 0.0809,
+ "step": 24803
+ },
+ {
+ "epoch": 67.5858310626703,
+ "grad_norm": 2.8857977390289307,
+ "learning_rate": 5.022690238720002e-06,
+ "loss": 0.0433,
+ "step": 24804
+ },
+ {
+ "epoch": 67.58855585831063,
+ "grad_norm": 2.741292953491211,
+ "learning_rate": 5.021924842734678e-06,
+ "loss": 0.0724,
+ "step": 24805
+ },
+ {
+ "epoch": 67.59128065395096,
+ "grad_norm": 2.7073473930358887,
+ "learning_rate": 5.021159485518441e-06,
+ "loss": 0.0375,
+ "step": 24806
+ },
+ {
+ "epoch": 67.59400544959128,
+ "grad_norm": 5.090786457061768,
+ "learning_rate": 5.020394167077254e-06,
+ "loss": 0.1652,
+ "step": 24807
+ },
+ {
+ "epoch": 67.59673024523161,
+ "grad_norm": 3.7017996311187744,
+ "learning_rate": 5.019628887417073e-06,
+ "loss": 0.0454,
+ "step": 24808
+ },
+ {
+ "epoch": 67.59945504087193,
+ "grad_norm": 2.341773748397827,
+ "learning_rate": 5.0188636465438654e-06,
+ "loss": 0.0507,
+ "step": 24809
+ },
+ {
+ "epoch": 67.60217983651226,
+ "grad_norm": 2.2711684703826904,
+ "learning_rate": 5.018098444463588e-06,
+ "loss": 0.0479,
+ "step": 24810
+ },
+ {
+ "epoch": 67.60490463215258,
+ "grad_norm": 2.489880323410034,
+ "learning_rate": 5.0173332811822e-06,
+ "loss": 0.0304,
+ "step": 24811
+ },
+ {
+ "epoch": 67.60762942779292,
+ "grad_norm": 5.754882335662842,
+ "learning_rate": 5.016568156705657e-06,
+ "loss": 0.1992,
+ "step": 24812
+ },
+ {
+ "epoch": 67.61035422343325,
+ "grad_norm": 3.56738018989563,
+ "learning_rate": 5.015803071039923e-06,
+ "loss": 0.079,
+ "step": 24813
+ },
+ {
+ "epoch": 67.61307901907357,
+ "grad_norm": 6.180990695953369,
+ "learning_rate": 5.015038024190954e-06,
+ "loss": 0.0558,
+ "step": 24814
+ },
+ {
+ "epoch": 67.6158038147139,
+ "grad_norm": 3.8189873695373535,
+ "learning_rate": 5.014273016164711e-06,
+ "loss": 0.0851,
+ "step": 24815
+ },
+ {
+ "epoch": 67.61852861035422,
+ "grad_norm": 4.0965681076049805,
+ "learning_rate": 5.013508046967142e-06,
+ "loss": 0.1865,
+ "step": 24816
+ },
+ {
+ "epoch": 67.62125340599455,
+ "grad_norm": 3.53777813911438,
+ "learning_rate": 5.012743116604217e-06,
+ "loss": 0.0459,
+ "step": 24817
+ },
+ {
+ "epoch": 67.62397820163488,
+ "grad_norm": 3.362224817276001,
+ "learning_rate": 5.011978225081889e-06,
+ "loss": 0.069,
+ "step": 24818
+ },
+ {
+ "epoch": 67.6267029972752,
+ "grad_norm": 3.1568098068237305,
+ "learning_rate": 5.011213372406114e-06,
+ "loss": 0.0637,
+ "step": 24819
+ },
+ {
+ "epoch": 67.62942779291554,
+ "grad_norm": 2.6528587341308594,
+ "learning_rate": 5.010448558582841e-06,
+ "loss": 0.0515,
+ "step": 24820
+ },
+ {
+ "epoch": 67.63215258855585,
+ "grad_norm": 3.075692653656006,
+ "learning_rate": 5.00968378361804e-06,
+ "loss": 0.0959,
+ "step": 24821
+ },
+ {
+ "epoch": 67.63487738419619,
+ "grad_norm": 3.195258617401123,
+ "learning_rate": 5.008919047517663e-06,
+ "loss": 0.0471,
+ "step": 24822
+ },
+ {
+ "epoch": 67.6376021798365,
+ "grad_norm": 3.759169340133667,
+ "learning_rate": 5.008154350287663e-06,
+ "loss": 0.0691,
+ "step": 24823
+ },
+ {
+ "epoch": 67.64032697547684,
+ "grad_norm": 4.912634372711182,
+ "learning_rate": 5.007389691933992e-06,
+ "loss": 0.037,
+ "step": 24824
+ },
+ {
+ "epoch": 67.64305177111717,
+ "grad_norm": 3.0033481121063232,
+ "learning_rate": 5.006625072462615e-06,
+ "loss": 0.0449,
+ "step": 24825
+ },
+ {
+ "epoch": 67.64577656675749,
+ "grad_norm": 2.47558856010437,
+ "learning_rate": 5.005860491879479e-06,
+ "loss": 0.0442,
+ "step": 24826
+ },
+ {
+ "epoch": 67.64850136239782,
+ "grad_norm": 3.771505832672119,
+ "learning_rate": 5.005095950190541e-06,
+ "loss": 0.0826,
+ "step": 24827
+ },
+ {
+ "epoch": 67.65122615803814,
+ "grad_norm": 4.252354621887207,
+ "learning_rate": 5.004331447401754e-06,
+ "loss": 0.0824,
+ "step": 24828
+ },
+ {
+ "epoch": 67.65395095367847,
+ "grad_norm": 3.3859550952911377,
+ "learning_rate": 5.003566983519073e-06,
+ "loss": 0.1013,
+ "step": 24829
+ },
+ {
+ "epoch": 67.65667574931881,
+ "grad_norm": 2.417128562927246,
+ "learning_rate": 5.002802558548454e-06,
+ "loss": 0.0727,
+ "step": 24830
+ },
+ {
+ "epoch": 67.65940054495913,
+ "grad_norm": 3.090529441833496,
+ "learning_rate": 5.002038172495847e-06,
+ "loss": 0.0413,
+ "step": 24831
+ },
+ {
+ "epoch": 67.66212534059946,
+ "grad_norm": 2.4321982860565186,
+ "learning_rate": 5.001273825367201e-06,
+ "loss": 0.1191,
+ "step": 24832
+ },
+ {
+ "epoch": 67.66485013623978,
+ "grad_norm": 4.1490983963012695,
+ "learning_rate": 5.0005095171684794e-06,
+ "loss": 0.0716,
+ "step": 24833
+ },
+ {
+ "epoch": 67.66757493188011,
+ "grad_norm": 5.533572196960449,
+ "learning_rate": 4.999745247905627e-06,
+ "loss": 0.2342,
+ "step": 24834
+ },
+ {
+ "epoch": 67.67029972752043,
+ "grad_norm": 2.7488348484039307,
+ "learning_rate": 4.998981017584598e-06,
+ "loss": 0.0645,
+ "step": 24835
+ },
+ {
+ "epoch": 67.67302452316076,
+ "grad_norm": 4.481891632080078,
+ "learning_rate": 4.99821682621134e-06,
+ "loss": 0.1657,
+ "step": 24836
+ },
+ {
+ "epoch": 67.6757493188011,
+ "grad_norm": 4.825045108795166,
+ "learning_rate": 4.9974526737918095e-06,
+ "loss": 0.1055,
+ "step": 24837
+ },
+ {
+ "epoch": 67.67847411444141,
+ "grad_norm": 3.8038241863250732,
+ "learning_rate": 4.996688560331961e-06,
+ "loss": 0.1125,
+ "step": 24838
+ },
+ {
+ "epoch": 67.68119891008175,
+ "grad_norm": 4.075389862060547,
+ "learning_rate": 4.995924485837739e-06,
+ "loss": 0.1495,
+ "step": 24839
+ },
+ {
+ "epoch": 67.68392370572207,
+ "grad_norm": 2.7468202114105225,
+ "learning_rate": 4.995160450315093e-06,
+ "loss": 0.0668,
+ "step": 24840
+ },
+ {
+ "epoch": 67.6866485013624,
+ "grad_norm": 3.0879342555999756,
+ "learning_rate": 4.99439645376998e-06,
+ "loss": 0.0592,
+ "step": 24841
+ },
+ {
+ "epoch": 67.68937329700273,
+ "grad_norm": 3.7090606689453125,
+ "learning_rate": 4.993632496208346e-06,
+ "loss": 0.2208,
+ "step": 24842
+ },
+ {
+ "epoch": 67.69209809264305,
+ "grad_norm": 2.401188373565674,
+ "learning_rate": 4.992868577636142e-06,
+ "loss": 0.0285,
+ "step": 24843
+ },
+ {
+ "epoch": 67.69482288828338,
+ "grad_norm": 5.189709663391113,
+ "learning_rate": 4.992104698059312e-06,
+ "loss": 0.0577,
+ "step": 24844
+ },
+ {
+ "epoch": 67.6975476839237,
+ "grad_norm": 2.323056221008301,
+ "learning_rate": 4.991340857483813e-06,
+ "loss": 0.047,
+ "step": 24845
+ },
+ {
+ "epoch": 67.70027247956403,
+ "grad_norm": 4.279284477233887,
+ "learning_rate": 4.9905770559155905e-06,
+ "loss": 0.0586,
+ "step": 24846
+ },
+ {
+ "epoch": 67.70299727520435,
+ "grad_norm": 2.025045871734619,
+ "learning_rate": 4.989813293360593e-06,
+ "loss": 0.0442,
+ "step": 24847
+ },
+ {
+ "epoch": 67.70572207084469,
+ "grad_norm": 3.212538480758667,
+ "learning_rate": 4.989049569824763e-06,
+ "loss": 0.0544,
+ "step": 24848
+ },
+ {
+ "epoch": 67.70844686648502,
+ "grad_norm": 3.816307783126831,
+ "learning_rate": 4.988285885314059e-06,
+ "loss": 0.044,
+ "step": 24849
+ },
+ {
+ "epoch": 67.71117166212534,
+ "grad_norm": 3.193031072616577,
+ "learning_rate": 4.987522239834422e-06,
+ "loss": 0.27,
+ "step": 24850
+ },
+ {
+ "epoch": 67.71389645776567,
+ "grad_norm": 3.969139814376831,
+ "learning_rate": 4.9867586333918015e-06,
+ "loss": 0.0459,
+ "step": 24851
+ },
+ {
+ "epoch": 67.71662125340599,
+ "grad_norm": 2.8488636016845703,
+ "learning_rate": 4.985995065992139e-06,
+ "loss": 0.0686,
+ "step": 24852
+ },
+ {
+ "epoch": 67.71934604904632,
+ "grad_norm": 4.406191349029541,
+ "learning_rate": 4.985231537641391e-06,
+ "loss": 0.1313,
+ "step": 24853
+ },
+ {
+ "epoch": 67.72207084468666,
+ "grad_norm": 2.194641590118408,
+ "learning_rate": 4.984468048345493e-06,
+ "loss": 0.0321,
+ "step": 24854
+ },
+ {
+ "epoch": 67.72479564032697,
+ "grad_norm": 3.4836697578430176,
+ "learning_rate": 4.983704598110401e-06,
+ "loss": 0.0835,
+ "step": 24855
+ },
+ {
+ "epoch": 67.7275204359673,
+ "grad_norm": 3.131699562072754,
+ "learning_rate": 4.982941186942055e-06,
+ "loss": 0.1429,
+ "step": 24856
+ },
+ {
+ "epoch": 67.73024523160763,
+ "grad_norm": 4.213091850280762,
+ "learning_rate": 4.982177814846398e-06,
+ "loss": 0.0812,
+ "step": 24857
+ },
+ {
+ "epoch": 67.73297002724796,
+ "grad_norm": 2.6906919479370117,
+ "learning_rate": 4.981414481829383e-06,
+ "loss": 0.0538,
+ "step": 24858
+ },
+ {
+ "epoch": 67.73569482288828,
+ "grad_norm": 4.27742862701416,
+ "learning_rate": 4.980651187896951e-06,
+ "loss": 0.2144,
+ "step": 24859
+ },
+ {
+ "epoch": 67.73841961852861,
+ "grad_norm": 2.63991117477417,
+ "learning_rate": 4.979887933055045e-06,
+ "loss": 0.0729,
+ "step": 24860
+ },
+ {
+ "epoch": 67.74114441416894,
+ "grad_norm": 3.841693878173828,
+ "learning_rate": 4.979124717309607e-06,
+ "loss": 0.0735,
+ "step": 24861
+ },
+ {
+ "epoch": 67.74386920980926,
+ "grad_norm": 2.9286797046661377,
+ "learning_rate": 4.978361540666587e-06,
+ "loss": 0.0447,
+ "step": 24862
+ },
+ {
+ "epoch": 67.7465940054496,
+ "grad_norm": 4.95592737197876,
+ "learning_rate": 4.977598403131927e-06,
+ "loss": 0.1634,
+ "step": 24863
+ },
+ {
+ "epoch": 67.74931880108991,
+ "grad_norm": 4.124266624450684,
+ "learning_rate": 4.976835304711565e-06,
+ "loss": 0.1666,
+ "step": 24864
+ },
+ {
+ "epoch": 67.75204359673025,
+ "grad_norm": 2.6184325218200684,
+ "learning_rate": 4.976072245411451e-06,
+ "loss": 0.0387,
+ "step": 24865
+ },
+ {
+ "epoch": 67.75476839237058,
+ "grad_norm": 3.3357319831848145,
+ "learning_rate": 4.9753092252375245e-06,
+ "loss": 0.0702,
+ "step": 24866
+ },
+ {
+ "epoch": 67.7574931880109,
+ "grad_norm": 3.164846897125244,
+ "learning_rate": 4.974546244195729e-06,
+ "loss": 0.0592,
+ "step": 24867
+ },
+ {
+ "epoch": 67.76021798365123,
+ "grad_norm": 2.907390832901001,
+ "learning_rate": 4.973783302292001e-06,
+ "loss": 0.1629,
+ "step": 24868
+ },
+ {
+ "epoch": 67.76294277929155,
+ "grad_norm": 3.3718841075897217,
+ "learning_rate": 4.973020399532291e-06,
+ "loss": 0.0482,
+ "step": 24869
+ },
+ {
+ "epoch": 67.76566757493188,
+ "grad_norm": 3.1799652576446533,
+ "learning_rate": 4.972257535922537e-06,
+ "loss": 0.1327,
+ "step": 24870
+ },
+ {
+ "epoch": 67.7683923705722,
+ "grad_norm": 3.9311981201171875,
+ "learning_rate": 4.971494711468675e-06,
+ "loss": 0.1101,
+ "step": 24871
+ },
+ {
+ "epoch": 67.77111716621253,
+ "grad_norm": 3.581341028213501,
+ "learning_rate": 4.970731926176654e-06,
+ "loss": 0.1398,
+ "step": 24872
+ },
+ {
+ "epoch": 67.77384196185287,
+ "grad_norm": 2.3169612884521484,
+ "learning_rate": 4.969969180052407e-06,
+ "loss": 0.0444,
+ "step": 24873
+ },
+ {
+ "epoch": 67.77656675749319,
+ "grad_norm": 2.0783934593200684,
+ "learning_rate": 4.969206473101883e-06,
+ "loss": 0.0263,
+ "step": 24874
+ },
+ {
+ "epoch": 67.77929155313352,
+ "grad_norm": 3.9229013919830322,
+ "learning_rate": 4.9684438053310155e-06,
+ "loss": 0.0502,
+ "step": 24875
+ },
+ {
+ "epoch": 67.78201634877384,
+ "grad_norm": 3.068594455718994,
+ "learning_rate": 4.967681176745747e-06,
+ "loss": 0.0882,
+ "step": 24876
+ },
+ {
+ "epoch": 67.78474114441417,
+ "grad_norm": 3.4225618839263916,
+ "learning_rate": 4.966918587352011e-06,
+ "loss": 0.0911,
+ "step": 24877
+ },
+ {
+ "epoch": 67.7874659400545,
+ "grad_norm": 4.238270282745361,
+ "learning_rate": 4.966156037155755e-06,
+ "loss": 0.1074,
+ "step": 24878
+ },
+ {
+ "epoch": 67.79019073569482,
+ "grad_norm": 4.291094779968262,
+ "learning_rate": 4.965393526162914e-06,
+ "loss": 0.0818,
+ "step": 24879
+ },
+ {
+ "epoch": 67.79291553133515,
+ "grad_norm": 3.67020583152771,
+ "learning_rate": 4.964631054379426e-06,
+ "loss": 0.1277,
+ "step": 24880
+ },
+ {
+ "epoch": 67.79564032697547,
+ "grad_norm": 5.443231105804443,
+ "learning_rate": 4.963868621811227e-06,
+ "loss": 0.1818,
+ "step": 24881
+ },
+ {
+ "epoch": 67.7983651226158,
+ "grad_norm": 3.1344242095947266,
+ "learning_rate": 4.963106228464258e-06,
+ "loss": 0.0418,
+ "step": 24882
+ },
+ {
+ "epoch": 67.80108991825612,
+ "grad_norm": 4.302298069000244,
+ "learning_rate": 4.962343874344457e-06,
+ "loss": 0.0737,
+ "step": 24883
+ },
+ {
+ "epoch": 67.80381471389646,
+ "grad_norm": 3.8121414184570312,
+ "learning_rate": 4.96158155945776e-06,
+ "loss": 0.0838,
+ "step": 24884
+ },
+ {
+ "epoch": 67.80653950953679,
+ "grad_norm": 3.3013153076171875,
+ "learning_rate": 4.9608192838100995e-06,
+ "loss": 0.0715,
+ "step": 24885
+ },
+ {
+ "epoch": 67.80926430517711,
+ "grad_norm": 3.171365261077881,
+ "learning_rate": 4.96005704740742e-06,
+ "loss": 0.0612,
+ "step": 24886
+ },
+ {
+ "epoch": 67.81198910081744,
+ "grad_norm": 5.323923587799072,
+ "learning_rate": 4.959294850255655e-06,
+ "loss": 0.0807,
+ "step": 24887
+ },
+ {
+ "epoch": 67.81471389645776,
+ "grad_norm": 3.057110071182251,
+ "learning_rate": 4.958532692360735e-06,
+ "loss": 0.0941,
+ "step": 24888
+ },
+ {
+ "epoch": 67.8174386920981,
+ "grad_norm": 2.6628201007843018,
+ "learning_rate": 4.9577705737286e-06,
+ "loss": 0.0561,
+ "step": 24889
+ },
+ {
+ "epoch": 67.82016348773843,
+ "grad_norm": 2.3849899768829346,
+ "learning_rate": 4.957008494365189e-06,
+ "loss": 0.102,
+ "step": 24890
+ },
+ {
+ "epoch": 67.82288828337875,
+ "grad_norm": 3.0842764377593994,
+ "learning_rate": 4.956246454276433e-06,
+ "loss": 0.054,
+ "step": 24891
+ },
+ {
+ "epoch": 67.82561307901908,
+ "grad_norm": 3.459657907485962,
+ "learning_rate": 4.955484453468269e-06,
+ "loss": 0.0528,
+ "step": 24892
+ },
+ {
+ "epoch": 67.8283378746594,
+ "grad_norm": 2.9648995399475098,
+ "learning_rate": 4.954722491946624e-06,
+ "loss": 0.0465,
+ "step": 24893
+ },
+ {
+ "epoch": 67.83106267029973,
+ "grad_norm": 4.292356491088867,
+ "learning_rate": 4.953960569717443e-06,
+ "loss": 0.0527,
+ "step": 24894
+ },
+ {
+ "epoch": 67.83378746594005,
+ "grad_norm": 2.9318783283233643,
+ "learning_rate": 4.953198686786655e-06,
+ "loss": 0.0459,
+ "step": 24895
+ },
+ {
+ "epoch": 67.83651226158038,
+ "grad_norm": 3.5212247371673584,
+ "learning_rate": 4.952436843160192e-06,
+ "loss": 0.0832,
+ "step": 24896
+ },
+ {
+ "epoch": 67.83923705722071,
+ "grad_norm": 3.3984742164611816,
+ "learning_rate": 4.951675038843985e-06,
+ "loss": 0.1136,
+ "step": 24897
+ },
+ {
+ "epoch": 67.84196185286103,
+ "grad_norm": 3.9382457733154297,
+ "learning_rate": 4.950913273843975e-06,
+ "loss": 0.094,
+ "step": 24898
+ },
+ {
+ "epoch": 67.84468664850137,
+ "grad_norm": 3.3440463542938232,
+ "learning_rate": 4.950151548166089e-06,
+ "loss": 0.0428,
+ "step": 24899
+ },
+ {
+ "epoch": 67.84741144414168,
+ "grad_norm": 3.871778964996338,
+ "learning_rate": 4.949389861816259e-06,
+ "loss": 0.0615,
+ "step": 24900
+ },
+ {
+ "epoch": 67.85013623978202,
+ "grad_norm": 2.4289021492004395,
+ "learning_rate": 4.948628214800417e-06,
+ "loss": 0.0303,
+ "step": 24901
+ },
+ {
+ "epoch": 67.85286103542235,
+ "grad_norm": 3.30828857421875,
+ "learning_rate": 4.947866607124499e-06,
+ "loss": 0.0544,
+ "step": 24902
+ },
+ {
+ "epoch": 67.85558583106267,
+ "grad_norm": 2.7102503776550293,
+ "learning_rate": 4.947105038794432e-06,
+ "loss": 0.0484,
+ "step": 24903
+ },
+ {
+ "epoch": 67.858310626703,
+ "grad_norm": 2.3424482345581055,
+ "learning_rate": 4.946343509816149e-06,
+ "loss": 0.0498,
+ "step": 24904
+ },
+ {
+ "epoch": 67.86103542234332,
+ "grad_norm": 2.4523189067840576,
+ "learning_rate": 4.945582020195576e-06,
+ "loss": 0.0594,
+ "step": 24905
+ },
+ {
+ "epoch": 67.86376021798365,
+ "grad_norm": 3.603227376937866,
+ "learning_rate": 4.944820569938649e-06,
+ "loss": 0.044,
+ "step": 24906
+ },
+ {
+ "epoch": 67.86648501362397,
+ "grad_norm": 2.3260836601257324,
+ "learning_rate": 4.9440591590512984e-06,
+ "loss": 0.0662,
+ "step": 24907
+ },
+ {
+ "epoch": 67.8692098092643,
+ "grad_norm": 3.8470189571380615,
+ "learning_rate": 4.9432977875394536e-06,
+ "loss": 0.1546,
+ "step": 24908
+ },
+ {
+ "epoch": 67.87193460490464,
+ "grad_norm": 3.7191038131713867,
+ "learning_rate": 4.942536455409039e-06,
+ "loss": 0.1139,
+ "step": 24909
+ },
+ {
+ "epoch": 67.87465940054496,
+ "grad_norm": 4.3344221115112305,
+ "learning_rate": 4.941775162665992e-06,
+ "loss": 0.0525,
+ "step": 24910
+ },
+ {
+ "epoch": 67.87738419618529,
+ "grad_norm": 2.6456716060638428,
+ "learning_rate": 4.941013909316236e-06,
+ "loss": 0.2204,
+ "step": 24911
+ },
+ {
+ "epoch": 67.88010899182561,
+ "grad_norm": 2.9865050315856934,
+ "learning_rate": 4.940252695365701e-06,
+ "loss": 0.0631,
+ "step": 24912
+ },
+ {
+ "epoch": 67.88283378746594,
+ "grad_norm": 6.068676948547363,
+ "learning_rate": 4.939491520820312e-06,
+ "loss": 0.0772,
+ "step": 24913
+ },
+ {
+ "epoch": 67.88555858310627,
+ "grad_norm": 3.0810790061950684,
+ "learning_rate": 4.938730385686004e-06,
+ "loss": 0.0483,
+ "step": 24914
+ },
+ {
+ "epoch": 67.88828337874659,
+ "grad_norm": 2.9013748168945312,
+ "learning_rate": 4.937969289968701e-06,
+ "loss": 0.0996,
+ "step": 24915
+ },
+ {
+ "epoch": 67.89100817438693,
+ "grad_norm": 4.394800662994385,
+ "learning_rate": 4.93720823367433e-06,
+ "loss": 0.1282,
+ "step": 24916
+ },
+ {
+ "epoch": 67.89373297002724,
+ "grad_norm": 2.896500587463379,
+ "learning_rate": 4.936447216808814e-06,
+ "loss": 0.0702,
+ "step": 24917
+ },
+ {
+ "epoch": 67.89645776566758,
+ "grad_norm": 2.685396909713745,
+ "learning_rate": 4.935686239378088e-06,
+ "loss": 0.0863,
+ "step": 24918
+ },
+ {
+ "epoch": 67.8991825613079,
+ "grad_norm": 2.7011332511901855,
+ "learning_rate": 4.934925301388075e-06,
+ "loss": 0.0324,
+ "step": 24919
+ },
+ {
+ "epoch": 67.90190735694823,
+ "grad_norm": 3.0609073638916016,
+ "learning_rate": 4.9341644028447014e-06,
+ "loss": 0.0397,
+ "step": 24920
+ },
+ {
+ "epoch": 67.90463215258856,
+ "grad_norm": 2.5676541328430176,
+ "learning_rate": 4.933403543753887e-06,
+ "loss": 0.0358,
+ "step": 24921
+ },
+ {
+ "epoch": 67.90735694822888,
+ "grad_norm": 2.9928839206695557,
+ "learning_rate": 4.9326427241215666e-06,
+ "loss": 0.0719,
+ "step": 24922
+ },
+ {
+ "epoch": 67.91008174386921,
+ "grad_norm": 2.7477798461914062,
+ "learning_rate": 4.9318819439536596e-06,
+ "loss": 0.0999,
+ "step": 24923
+ },
+ {
+ "epoch": 67.91280653950953,
+ "grad_norm": 4.223602294921875,
+ "learning_rate": 4.931121203256095e-06,
+ "loss": 0.0801,
+ "step": 24924
+ },
+ {
+ "epoch": 67.91553133514986,
+ "grad_norm": 2.8641223907470703,
+ "learning_rate": 4.9303605020347965e-06,
+ "loss": 0.1024,
+ "step": 24925
+ },
+ {
+ "epoch": 67.9182561307902,
+ "grad_norm": 3.264960527420044,
+ "learning_rate": 4.929599840295683e-06,
+ "loss": 0.0905,
+ "step": 24926
+ },
+ {
+ "epoch": 67.92098092643052,
+ "grad_norm": 3.5409579277038574,
+ "learning_rate": 4.928839218044687e-06,
+ "loss": 0.087,
+ "step": 24927
+ },
+ {
+ "epoch": 67.92370572207085,
+ "grad_norm": 3.775388717651367,
+ "learning_rate": 4.928078635287726e-06,
+ "loss": 0.0643,
+ "step": 24928
+ },
+ {
+ "epoch": 67.92643051771117,
+ "grad_norm": 3.0450453758239746,
+ "learning_rate": 4.927318092030723e-06,
+ "loss": 0.0672,
+ "step": 24929
+ },
+ {
+ "epoch": 67.9291553133515,
+ "grad_norm": 4.1666669845581055,
+ "learning_rate": 4.9265575882796076e-06,
+ "loss": 0.0853,
+ "step": 24930
+ },
+ {
+ "epoch": 67.93188010899182,
+ "grad_norm": 3.8314664363861084,
+ "learning_rate": 4.925797124040298e-06,
+ "loss": 0.232,
+ "step": 24931
+ },
+ {
+ "epoch": 67.93460490463215,
+ "grad_norm": 4.507056713104248,
+ "learning_rate": 4.925036699318717e-06,
+ "loss": 0.0599,
+ "step": 24932
+ },
+ {
+ "epoch": 67.93732970027249,
+ "grad_norm": 3.821880578994751,
+ "learning_rate": 4.9242763141207825e-06,
+ "loss": 0.1515,
+ "step": 24933
+ },
+ {
+ "epoch": 67.9400544959128,
+ "grad_norm": 2.9991466999053955,
+ "learning_rate": 4.9235159684524256e-06,
+ "loss": 0.1734,
+ "step": 24934
+ },
+ {
+ "epoch": 67.94277929155314,
+ "grad_norm": 2.7332661151885986,
+ "learning_rate": 4.922755662319563e-06,
+ "loss": 0.0352,
+ "step": 24935
+ },
+ {
+ "epoch": 67.94550408719346,
+ "grad_norm": 4.4129252433776855,
+ "learning_rate": 4.9219953957281154e-06,
+ "loss": 0.0785,
+ "step": 24936
+ },
+ {
+ "epoch": 67.94822888283379,
+ "grad_norm": 2.548818588256836,
+ "learning_rate": 4.9212351686839995e-06,
+ "loss": 0.0363,
+ "step": 24937
+ },
+ {
+ "epoch": 67.95095367847412,
+ "grad_norm": 5.2256646156311035,
+ "learning_rate": 4.920474981193146e-06,
+ "loss": 0.1432,
+ "step": 24938
+ },
+ {
+ "epoch": 67.95367847411444,
+ "grad_norm": 3.511392116546631,
+ "learning_rate": 4.9197148332614685e-06,
+ "loss": 0.0745,
+ "step": 24939
+ },
+ {
+ "epoch": 67.95640326975477,
+ "grad_norm": 2.386901378631592,
+ "learning_rate": 4.9189547248948856e-06,
+ "loss": 0.0296,
+ "step": 24940
+ },
+ {
+ "epoch": 67.95912806539509,
+ "grad_norm": 3.104686975479126,
+ "learning_rate": 4.918194656099323e-06,
+ "loss": 0.0769,
+ "step": 24941
+ },
+ {
+ "epoch": 67.96185286103542,
+ "grad_norm": 3.6968278884887695,
+ "learning_rate": 4.917434626880694e-06,
+ "loss": 0.1325,
+ "step": 24942
+ },
+ {
+ "epoch": 67.96457765667574,
+ "grad_norm": 2.0700976848602295,
+ "learning_rate": 4.916674637244924e-06,
+ "loss": 0.0848,
+ "step": 24943
+ },
+ {
+ "epoch": 67.96730245231608,
+ "grad_norm": 2.490745782852173,
+ "learning_rate": 4.915914687197928e-06,
+ "loss": 0.0805,
+ "step": 24944
+ },
+ {
+ "epoch": 67.97002724795641,
+ "grad_norm": 3.9408082962036133,
+ "learning_rate": 4.915154776745624e-06,
+ "loss": 0.0811,
+ "step": 24945
+ },
+ {
+ "epoch": 67.97275204359673,
+ "grad_norm": 3.8298580646514893,
+ "learning_rate": 4.914394905893928e-06,
+ "loss": 0.2028,
+ "step": 24946
+ },
+ {
+ "epoch": 67.97547683923706,
+ "grad_norm": 8.07292652130127,
+ "learning_rate": 4.913635074648765e-06,
+ "loss": 0.0823,
+ "step": 24947
+ },
+ {
+ "epoch": 67.97820163487738,
+ "grad_norm": 2.2788009643554688,
+ "learning_rate": 4.912875283016047e-06,
+ "loss": 0.0249,
+ "step": 24948
+ },
+ {
+ "epoch": 67.98092643051771,
+ "grad_norm": 3.7298474311828613,
+ "learning_rate": 4.9121155310016946e-06,
+ "loss": 0.1421,
+ "step": 24949
+ },
+ {
+ "epoch": 67.98365122615803,
+ "grad_norm": 5.163436412811279,
+ "learning_rate": 4.911355818611618e-06,
+ "loss": 0.153,
+ "step": 24950
+ },
+ {
+ "epoch": 67.98637602179836,
+ "grad_norm": 3.9633572101593018,
+ "learning_rate": 4.9105961458517415e-06,
+ "loss": 0.1678,
+ "step": 24951
+ },
+ {
+ "epoch": 67.9891008174387,
+ "grad_norm": 4.479075908660889,
+ "learning_rate": 4.909836512727978e-06,
+ "loss": 0.1247,
+ "step": 24952
+ },
+ {
+ "epoch": 67.99182561307902,
+ "grad_norm": 3.044597625732422,
+ "learning_rate": 4.909076919246242e-06,
+ "loss": 0.1124,
+ "step": 24953
+ },
+ {
+ "epoch": 67.99455040871935,
+ "grad_norm": 3.070491313934326,
+ "learning_rate": 4.908317365412454e-06,
+ "loss": 0.1288,
+ "step": 24954
+ },
+ {
+ "epoch": 67.99727520435967,
+ "grad_norm": 3.2853972911834717,
+ "learning_rate": 4.9075578512325266e-06,
+ "loss": 0.1325,
+ "step": 24955
+ },
+ {
+ "epoch": 68.0,
+ "grad_norm": 4.042403221130371,
+ "learning_rate": 4.9067983767123736e-06,
+ "loss": 0.1736,
+ "step": 24956
+ },
+ {
+ "epoch": 68.00272479564033,
+ "grad_norm": 2.7494149208068848,
+ "learning_rate": 4.906038941857908e-06,
+ "loss": 0.0768,
+ "step": 24957
+ },
+ {
+ "epoch": 68.00544959128065,
+ "grad_norm": 3.2249743938446045,
+ "learning_rate": 4.905279546675047e-06,
+ "loss": 0.0774,
+ "step": 24958
+ },
+ {
+ "epoch": 68.00817438692098,
+ "grad_norm": 2.04597806930542,
+ "learning_rate": 4.904520191169709e-06,
+ "loss": 0.0732,
+ "step": 24959
+ },
+ {
+ "epoch": 68.0108991825613,
+ "grad_norm": 3.357067584991455,
+ "learning_rate": 4.903760875347804e-06,
+ "loss": 0.0507,
+ "step": 24960
+ },
+ {
+ "epoch": 68.01362397820164,
+ "grad_norm": 3.263263702392578,
+ "learning_rate": 4.9030015992152445e-06,
+ "loss": 0.0539,
+ "step": 24961
+ },
+ {
+ "epoch": 68.01634877384195,
+ "grad_norm": 3.323880672454834,
+ "learning_rate": 4.902242362777942e-06,
+ "loss": 0.1754,
+ "step": 24962
+ },
+ {
+ "epoch": 68.01907356948229,
+ "grad_norm": 3.205150604248047,
+ "learning_rate": 4.901483166041815e-06,
+ "loss": 0.1094,
+ "step": 24963
+ },
+ {
+ "epoch": 68.02179836512262,
+ "grad_norm": 3.1998703479766846,
+ "learning_rate": 4.900724009012773e-06,
+ "loss": 0.0441,
+ "step": 24964
+ },
+ {
+ "epoch": 68.02452316076294,
+ "grad_norm": 9.504284858703613,
+ "learning_rate": 4.899964891696728e-06,
+ "loss": 0.1081,
+ "step": 24965
+ },
+ {
+ "epoch": 68.02724795640327,
+ "grad_norm": 3.5057647228240967,
+ "learning_rate": 4.899205814099589e-06,
+ "loss": 0.083,
+ "step": 24966
+ },
+ {
+ "epoch": 68.02997275204359,
+ "grad_norm": 8.63381290435791,
+ "learning_rate": 4.898446776227274e-06,
+ "loss": 0.1381,
+ "step": 24967
+ },
+ {
+ "epoch": 68.03269754768392,
+ "grad_norm": 3.1937215328216553,
+ "learning_rate": 4.897687778085693e-06,
+ "loss": 0.136,
+ "step": 24968
+ },
+ {
+ "epoch": 68.03542234332426,
+ "grad_norm": 2.3671205043792725,
+ "learning_rate": 4.896928819680753e-06,
+ "loss": 0.0353,
+ "step": 24969
+ },
+ {
+ "epoch": 68.03814713896458,
+ "grad_norm": 6.201351642608643,
+ "learning_rate": 4.896169901018365e-06,
+ "loss": 0.0942,
+ "step": 24970
+ },
+ {
+ "epoch": 68.04087193460491,
+ "grad_norm": 3.7104909420013428,
+ "learning_rate": 4.8954110221044435e-06,
+ "loss": 0.0563,
+ "step": 24971
+ },
+ {
+ "epoch": 68.04359673024523,
+ "grad_norm": 2.5792465209960938,
+ "learning_rate": 4.894652182944899e-06,
+ "loss": 0.122,
+ "step": 24972
+ },
+ {
+ "epoch": 68.04632152588556,
+ "grad_norm": 2.297308921813965,
+ "learning_rate": 4.893893383545633e-06,
+ "loss": 0.1426,
+ "step": 24973
+ },
+ {
+ "epoch": 68.04904632152588,
+ "grad_norm": 3.3279075622558594,
+ "learning_rate": 4.893134623912567e-06,
+ "loss": 0.122,
+ "step": 24974
+ },
+ {
+ "epoch": 68.05177111716621,
+ "grad_norm": 2.6865179538726807,
+ "learning_rate": 4.892375904051599e-06,
+ "loss": 0.1871,
+ "step": 24975
+ },
+ {
+ "epoch": 68.05449591280654,
+ "grad_norm": 3.0044872760772705,
+ "learning_rate": 4.891617223968648e-06,
+ "loss": 0.0392,
+ "step": 24976
+ },
+ {
+ "epoch": 68.05722070844686,
+ "grad_norm": 4.275487422943115,
+ "learning_rate": 4.890858583669616e-06,
+ "loss": 0.1134,
+ "step": 24977
+ },
+ {
+ "epoch": 68.0599455040872,
+ "grad_norm": 3.2748069763183594,
+ "learning_rate": 4.89009998316041e-06,
+ "loss": 0.117,
+ "step": 24978
+ },
+ {
+ "epoch": 68.06267029972751,
+ "grad_norm": 3.3147456645965576,
+ "learning_rate": 4.889341422446945e-06,
+ "loss": 0.1342,
+ "step": 24979
+ },
+ {
+ "epoch": 68.06539509536785,
+ "grad_norm": 3.7245795726776123,
+ "learning_rate": 4.888582901535124e-06,
+ "loss": 0.2111,
+ "step": 24980
+ },
+ {
+ "epoch": 68.06811989100818,
+ "grad_norm": 2.658000946044922,
+ "learning_rate": 4.887824420430854e-06,
+ "loss": 0.1104,
+ "step": 24981
+ },
+ {
+ "epoch": 68.0708446866485,
+ "grad_norm": 2.3336551189422607,
+ "learning_rate": 4.887065979140041e-06,
+ "loss": 0.0396,
+ "step": 24982
+ },
+ {
+ "epoch": 68.07356948228883,
+ "grad_norm": 3.099041700363159,
+ "learning_rate": 4.886307577668596e-06,
+ "loss": 0.1679,
+ "step": 24983
+ },
+ {
+ "epoch": 68.07629427792915,
+ "grad_norm": 3.471858024597168,
+ "learning_rate": 4.885549216022424e-06,
+ "loss": 0.0494,
+ "step": 24984
+ },
+ {
+ "epoch": 68.07901907356948,
+ "grad_norm": 4.856651782989502,
+ "learning_rate": 4.8847908942074295e-06,
+ "loss": 0.0645,
+ "step": 24985
+ },
+ {
+ "epoch": 68.0817438692098,
+ "grad_norm": 2.4537742137908936,
+ "learning_rate": 4.884032612229515e-06,
+ "loss": 0.0337,
+ "step": 24986
+ },
+ {
+ "epoch": 68.08446866485014,
+ "grad_norm": 3.4039788246154785,
+ "learning_rate": 4.8832743700945936e-06,
+ "loss": 0.0667,
+ "step": 24987
+ },
+ {
+ "epoch": 68.08719346049047,
+ "grad_norm": 3.9975268840789795,
+ "learning_rate": 4.882516167808568e-06,
+ "loss": 0.0868,
+ "step": 24988
+ },
+ {
+ "epoch": 68.08991825613079,
+ "grad_norm": 3.4598822593688965,
+ "learning_rate": 4.881758005377339e-06,
+ "loss": 0.0667,
+ "step": 24989
+ },
+ {
+ "epoch": 68.09264305177112,
+ "grad_norm": 3.3750131130218506,
+ "learning_rate": 4.880999882806813e-06,
+ "loss": 0.0661,
+ "step": 24990
+ },
+ {
+ "epoch": 68.09536784741144,
+ "grad_norm": 2.525282382965088,
+ "learning_rate": 4.880241800102897e-06,
+ "loss": 0.0454,
+ "step": 24991
+ },
+ {
+ "epoch": 68.09809264305177,
+ "grad_norm": 3.315260648727417,
+ "learning_rate": 4.87948375727149e-06,
+ "loss": 0.3172,
+ "step": 24992
+ },
+ {
+ "epoch": 68.1008174386921,
+ "grad_norm": 2.868989944458008,
+ "learning_rate": 4.878725754318503e-06,
+ "loss": 0.0721,
+ "step": 24993
+ },
+ {
+ "epoch": 68.10354223433242,
+ "grad_norm": 5.609745025634766,
+ "learning_rate": 4.877967791249831e-06,
+ "loss": 0.1983,
+ "step": 24994
+ },
+ {
+ "epoch": 68.10626702997276,
+ "grad_norm": 2.8073129653930664,
+ "learning_rate": 4.877209868071384e-06,
+ "loss": 0.0581,
+ "step": 24995
+ },
+ {
+ "epoch": 68.10899182561307,
+ "grad_norm": 3.576669692993164,
+ "learning_rate": 4.876451984789062e-06,
+ "loss": 0.1892,
+ "step": 24996
+ },
+ {
+ "epoch": 68.11171662125341,
+ "grad_norm": 3.127253770828247,
+ "learning_rate": 4.8756941414087675e-06,
+ "loss": 0.156,
+ "step": 24997
+ },
+ {
+ "epoch": 68.11444141689373,
+ "grad_norm": 2.397226572036743,
+ "learning_rate": 4.874936337936399e-06,
+ "loss": 0.0437,
+ "step": 24998
+ },
+ {
+ "epoch": 68.11716621253406,
+ "grad_norm": 2.780616283416748,
+ "learning_rate": 4.874178574377863e-06,
+ "loss": 0.0316,
+ "step": 24999
+ },
+ {
+ "epoch": 68.11989100817439,
+ "grad_norm": 3.2752492427825928,
+ "learning_rate": 4.8734208507390615e-06,
+ "loss": 0.0516,
+ "step": 25000
+ },
+ {
+ "epoch": 68.12261580381471,
+ "grad_norm": 3.1068167686462402,
+ "learning_rate": 4.872663167025893e-06,
+ "loss": 0.0899,
+ "step": 25001
+ },
+ {
+ "epoch": 68.12534059945504,
+ "grad_norm": 3.745326280593872,
+ "learning_rate": 4.8719055232442535e-06,
+ "loss": 0.0589,
+ "step": 25002
+ },
+ {
+ "epoch": 68.12806539509536,
+ "grad_norm": 2.551170825958252,
+ "learning_rate": 4.871147919400053e-06,
+ "loss": 0.048,
+ "step": 25003
+ },
+ {
+ "epoch": 68.1307901907357,
+ "grad_norm": 2.6059932708740234,
+ "learning_rate": 4.8703903554991885e-06,
+ "loss": 0.0439,
+ "step": 25004
+ },
+ {
+ "epoch": 68.13351498637603,
+ "grad_norm": 2.7945291996002197,
+ "learning_rate": 4.869632831547559e-06,
+ "loss": 0.0345,
+ "step": 25005
+ },
+ {
+ "epoch": 68.13623978201635,
+ "grad_norm": 4.376722812652588,
+ "learning_rate": 4.868875347551059e-06,
+ "loss": 0.0386,
+ "step": 25006
+ },
+ {
+ "epoch": 68.13896457765668,
+ "grad_norm": 2.1037650108337402,
+ "learning_rate": 4.868117903515596e-06,
+ "loss": 0.0377,
+ "step": 25007
+ },
+ {
+ "epoch": 68.141689373297,
+ "grad_norm": 3.319108009338379,
+ "learning_rate": 4.867360499447066e-06,
+ "loss": 0.05,
+ "step": 25008
+ },
+ {
+ "epoch": 68.14441416893733,
+ "grad_norm": 2.9765584468841553,
+ "learning_rate": 4.866603135351365e-06,
+ "loss": 0.1211,
+ "step": 25009
+ },
+ {
+ "epoch": 68.14713896457765,
+ "grad_norm": 2.914546251296997,
+ "learning_rate": 4.8658458112343955e-06,
+ "loss": 0.0883,
+ "step": 25010
+ },
+ {
+ "epoch": 68.14986376021798,
+ "grad_norm": 2.722857713699341,
+ "learning_rate": 4.8650885271020495e-06,
+ "loss": 0.1046,
+ "step": 25011
+ },
+ {
+ "epoch": 68.15258855585832,
+ "grad_norm": 3.4026708602905273,
+ "learning_rate": 4.864331282960234e-06,
+ "loss": 0.0672,
+ "step": 25012
+ },
+ {
+ "epoch": 68.15531335149863,
+ "grad_norm": 2.9237442016601562,
+ "learning_rate": 4.86357407881484e-06,
+ "loss": 0.0826,
+ "step": 25013
+ },
+ {
+ "epoch": 68.15803814713897,
+ "grad_norm": 3.331533670425415,
+ "learning_rate": 4.862816914671763e-06,
+ "loss": 0.1254,
+ "step": 25014
+ },
+ {
+ "epoch": 68.16076294277929,
+ "grad_norm": 3.147104024887085,
+ "learning_rate": 4.862059790536906e-06,
+ "loss": 0.0859,
+ "step": 25015
+ },
+ {
+ "epoch": 68.16348773841962,
+ "grad_norm": 2.5917232036590576,
+ "learning_rate": 4.861302706416162e-06,
+ "loss": 0.0624,
+ "step": 25016
+ },
+ {
+ "epoch": 68.16621253405995,
+ "grad_norm": 4.823266983032227,
+ "learning_rate": 4.860545662315427e-06,
+ "loss": 0.0767,
+ "step": 25017
+ },
+ {
+ "epoch": 68.16893732970027,
+ "grad_norm": 3.8482394218444824,
+ "learning_rate": 4.859788658240593e-06,
+ "loss": 0.1534,
+ "step": 25018
+ },
+ {
+ "epoch": 68.1716621253406,
+ "grad_norm": 4.588294506072998,
+ "learning_rate": 4.859031694197563e-06,
+ "loss": 0.0899,
+ "step": 25019
+ },
+ {
+ "epoch": 68.17438692098092,
+ "grad_norm": 2.63802170753479,
+ "learning_rate": 4.858274770192229e-06,
+ "loss": 0.1056,
+ "step": 25020
+ },
+ {
+ "epoch": 68.17711171662125,
+ "grad_norm": 2.652108669281006,
+ "learning_rate": 4.8575178862304865e-06,
+ "loss": 0.044,
+ "step": 25021
+ },
+ {
+ "epoch": 68.17983651226157,
+ "grad_norm": 4.528519630432129,
+ "learning_rate": 4.856761042318224e-06,
+ "loss": 0.1687,
+ "step": 25022
+ },
+ {
+ "epoch": 68.1825613079019,
+ "grad_norm": 5.335216999053955,
+ "learning_rate": 4.856004238461346e-06,
+ "loss": 0.0651,
+ "step": 25023
+ },
+ {
+ "epoch": 68.18528610354224,
+ "grad_norm": 3.355959892272949,
+ "learning_rate": 4.8552474746657405e-06,
+ "loss": 0.1393,
+ "step": 25024
+ },
+ {
+ "epoch": 68.18801089918256,
+ "grad_norm": 3.15427303314209,
+ "learning_rate": 4.854490750937303e-06,
+ "loss": 0.1628,
+ "step": 25025
+ },
+ {
+ "epoch": 68.19073569482289,
+ "grad_norm": 3.5091757774353027,
+ "learning_rate": 4.853734067281922e-06,
+ "loss": 0.0499,
+ "step": 25026
+ },
+ {
+ "epoch": 68.19346049046321,
+ "grad_norm": 3.323369264602661,
+ "learning_rate": 4.852977423705494e-06,
+ "loss": 0.0527,
+ "step": 25027
+ },
+ {
+ "epoch": 68.19618528610354,
+ "grad_norm": 4.669510841369629,
+ "learning_rate": 4.852220820213915e-06,
+ "loss": 0.0706,
+ "step": 25028
+ },
+ {
+ "epoch": 68.19891008174388,
+ "grad_norm": 5.563045978546143,
+ "learning_rate": 4.851464256813076e-06,
+ "loss": 0.1015,
+ "step": 25029
+ },
+ {
+ "epoch": 68.2016348773842,
+ "grad_norm": 3.3602840900421143,
+ "learning_rate": 4.850707733508868e-06,
+ "loss": 0.0472,
+ "step": 25030
+ },
+ {
+ "epoch": 68.20435967302453,
+ "grad_norm": 3.2086257934570312,
+ "learning_rate": 4.8499512503071775e-06,
+ "loss": 0.073,
+ "step": 25031
+ },
+ {
+ "epoch": 68.20708446866485,
+ "grad_norm": 4.109739780426025,
+ "learning_rate": 4.849194807213905e-06,
+ "loss": 0.1155,
+ "step": 25032
+ },
+ {
+ "epoch": 68.20980926430518,
+ "grad_norm": 5.412731170654297,
+ "learning_rate": 4.848438404234937e-06,
+ "loss": 0.158,
+ "step": 25033
+ },
+ {
+ "epoch": 68.2125340599455,
+ "grad_norm": 2.9590957164764404,
+ "learning_rate": 4.847682041376166e-06,
+ "loss": 0.042,
+ "step": 25034
+ },
+ {
+ "epoch": 68.21525885558583,
+ "grad_norm": 2.1525983810424805,
+ "learning_rate": 4.846925718643478e-06,
+ "loss": 0.067,
+ "step": 25035
+ },
+ {
+ "epoch": 68.21798365122616,
+ "grad_norm": 3.3515589237213135,
+ "learning_rate": 4.846169436042769e-06,
+ "loss": 0.0527,
+ "step": 25036
+ },
+ {
+ "epoch": 68.22070844686648,
+ "grad_norm": 2.3968660831451416,
+ "learning_rate": 4.845413193579927e-06,
+ "loss": 0.04,
+ "step": 25037
+ },
+ {
+ "epoch": 68.22343324250681,
+ "grad_norm": 2.7044997215270996,
+ "learning_rate": 4.844656991260838e-06,
+ "loss": 0.0377,
+ "step": 25038
+ },
+ {
+ "epoch": 68.22615803814713,
+ "grad_norm": 3.2693943977355957,
+ "learning_rate": 4.843900829091398e-06,
+ "loss": 0.1073,
+ "step": 25039
+ },
+ {
+ "epoch": 68.22888283378747,
+ "grad_norm": 3.2461183071136475,
+ "learning_rate": 4.8431447070774916e-06,
+ "loss": 0.1183,
+ "step": 25040
+ },
+ {
+ "epoch": 68.2316076294278,
+ "grad_norm": 5.564183235168457,
+ "learning_rate": 4.842388625225009e-06,
+ "loss": 0.1141,
+ "step": 25041
+ },
+ {
+ "epoch": 68.23433242506812,
+ "grad_norm": 6.375480651855469,
+ "learning_rate": 4.841632583539835e-06,
+ "loss": 0.0521,
+ "step": 25042
+ },
+ {
+ "epoch": 68.23705722070845,
+ "grad_norm": 2.3081696033477783,
+ "learning_rate": 4.840876582027863e-06,
+ "loss": 0.0383,
+ "step": 25043
+ },
+ {
+ "epoch": 68.23978201634877,
+ "grad_norm": 3.0546491146087646,
+ "learning_rate": 4.840120620694974e-06,
+ "loss": 0.112,
+ "step": 25044
+ },
+ {
+ "epoch": 68.2425068119891,
+ "grad_norm": 2.5620908737182617,
+ "learning_rate": 4.839364699547064e-06,
+ "loss": 0.1705,
+ "step": 25045
+ },
+ {
+ "epoch": 68.24523160762942,
+ "grad_norm": 3.5948729515075684,
+ "learning_rate": 4.8386088185900145e-06,
+ "loss": 0.1684,
+ "step": 25046
+ },
+ {
+ "epoch": 68.24795640326975,
+ "grad_norm": 3.0221545696258545,
+ "learning_rate": 4.837852977829711e-06,
+ "loss": 0.1146,
+ "step": 25047
+ },
+ {
+ "epoch": 68.25068119891009,
+ "grad_norm": 6.115458965301514,
+ "learning_rate": 4.837097177272045e-06,
+ "loss": 0.0545,
+ "step": 25048
+ },
+ {
+ "epoch": 68.2534059945504,
+ "grad_norm": 3.122903823852539,
+ "learning_rate": 4.836341416922901e-06,
+ "loss": 0.1152,
+ "step": 25049
+ },
+ {
+ "epoch": 68.25613079019074,
+ "grad_norm": 3.8173673152923584,
+ "learning_rate": 4.835585696788163e-06,
+ "loss": 0.1432,
+ "step": 25050
+ },
+ {
+ "epoch": 68.25885558583106,
+ "grad_norm": 2.7445411682128906,
+ "learning_rate": 4.834830016873715e-06,
+ "loss": 0.0638,
+ "step": 25051
+ },
+ {
+ "epoch": 68.26158038147139,
+ "grad_norm": 3.772977590560913,
+ "learning_rate": 4.834074377185447e-06,
+ "loss": 0.0469,
+ "step": 25052
+ },
+ {
+ "epoch": 68.26430517711172,
+ "grad_norm": 3.452272891998291,
+ "learning_rate": 4.833318777729243e-06,
+ "loss": 0.1427,
+ "step": 25053
+ },
+ {
+ "epoch": 68.26702997275204,
+ "grad_norm": 2.9316632747650146,
+ "learning_rate": 4.832563218510984e-06,
+ "loss": 0.0623,
+ "step": 25054
+ },
+ {
+ "epoch": 68.26975476839237,
+ "grad_norm": 3.105860948562622,
+ "learning_rate": 4.831807699536554e-06,
+ "loss": 0.0934,
+ "step": 25055
+ },
+ {
+ "epoch": 68.2724795640327,
+ "grad_norm": 3.162024974822998,
+ "learning_rate": 4.831052220811843e-06,
+ "loss": 0.0623,
+ "step": 25056
+ },
+ {
+ "epoch": 68.27520435967303,
+ "grad_norm": 3.763082504272461,
+ "learning_rate": 4.8302967823427296e-06,
+ "loss": 0.0968,
+ "step": 25057
+ },
+ {
+ "epoch": 68.27792915531334,
+ "grad_norm": 4.577455043792725,
+ "learning_rate": 4.8295413841350995e-06,
+ "loss": 0.1031,
+ "step": 25058
+ },
+ {
+ "epoch": 68.28065395095368,
+ "grad_norm": 3.669177532196045,
+ "learning_rate": 4.8287860261948305e-06,
+ "loss": 0.1281,
+ "step": 25059
+ },
+ {
+ "epoch": 68.28337874659401,
+ "grad_norm": 2.364025831222534,
+ "learning_rate": 4.828030708527814e-06,
+ "loss": 0.0313,
+ "step": 25060
+ },
+ {
+ "epoch": 68.28610354223433,
+ "grad_norm": 2.397878885269165,
+ "learning_rate": 4.827275431139924e-06,
+ "loss": 0.0421,
+ "step": 25061
+ },
+ {
+ "epoch": 68.28882833787466,
+ "grad_norm": 2.458519458770752,
+ "learning_rate": 4.82652019403705e-06,
+ "loss": 0.0901,
+ "step": 25062
+ },
+ {
+ "epoch": 68.29155313351498,
+ "grad_norm": 2.9947876930236816,
+ "learning_rate": 4.825764997225066e-06,
+ "loss": 0.1044,
+ "step": 25063
+ },
+ {
+ "epoch": 68.29427792915531,
+ "grad_norm": 2.8236539363861084,
+ "learning_rate": 4.825009840709862e-06,
+ "loss": 0.0447,
+ "step": 25064
+ },
+ {
+ "epoch": 68.29700272479565,
+ "grad_norm": 2.933349847793579,
+ "learning_rate": 4.8242547244973144e-06,
+ "loss": 0.0408,
+ "step": 25065
+ },
+ {
+ "epoch": 68.29972752043597,
+ "grad_norm": 4.040036678314209,
+ "learning_rate": 4.823499648593305e-06,
+ "loss": 0.0641,
+ "step": 25066
+ },
+ {
+ "epoch": 68.3024523160763,
+ "grad_norm": 4.4302239418029785,
+ "learning_rate": 4.82274461300371e-06,
+ "loss": 0.0918,
+ "step": 25067
+ },
+ {
+ "epoch": 68.30517711171662,
+ "grad_norm": 3.477489709854126,
+ "learning_rate": 4.821989617734416e-06,
+ "loss": 0.0495,
+ "step": 25068
+ },
+ {
+ "epoch": 68.30790190735695,
+ "grad_norm": 3.266461133956909,
+ "learning_rate": 4.821234662791302e-06,
+ "loss": 0.0541,
+ "step": 25069
+ },
+ {
+ "epoch": 68.31062670299727,
+ "grad_norm": 2.8733971118927,
+ "learning_rate": 4.820479748180245e-06,
+ "loss": 0.0477,
+ "step": 25070
+ },
+ {
+ "epoch": 68.3133514986376,
+ "grad_norm": 2.9562008380889893,
+ "learning_rate": 4.81972487390712e-06,
+ "loss": 0.0463,
+ "step": 25071
+ },
+ {
+ "epoch": 68.31607629427793,
+ "grad_norm": 2.757918119430542,
+ "learning_rate": 4.818970039977816e-06,
+ "loss": 0.1046,
+ "step": 25072
+ },
+ {
+ "epoch": 68.31880108991825,
+ "grad_norm": 3.5135529041290283,
+ "learning_rate": 4.818215246398206e-06,
+ "loss": 0.0466,
+ "step": 25073
+ },
+ {
+ "epoch": 68.32152588555859,
+ "grad_norm": 15.699817657470703,
+ "learning_rate": 4.81746049317417e-06,
+ "loss": 0.0823,
+ "step": 25074
+ },
+ {
+ "epoch": 68.3242506811989,
+ "grad_norm": 3.147193431854248,
+ "learning_rate": 4.81670578031158e-06,
+ "loss": 0.0471,
+ "step": 25075
+ },
+ {
+ "epoch": 68.32697547683924,
+ "grad_norm": 3.7153866291046143,
+ "learning_rate": 4.815951107816322e-06,
+ "loss": 0.0506,
+ "step": 25076
+ },
+ {
+ "epoch": 68.32970027247957,
+ "grad_norm": 4.23006534576416,
+ "learning_rate": 4.815196475694271e-06,
+ "loss": 0.0737,
+ "step": 25077
+ },
+ {
+ "epoch": 68.33242506811989,
+ "grad_norm": 3.3838913440704346,
+ "learning_rate": 4.814441883951299e-06,
+ "loss": 0.0731,
+ "step": 25078
+ },
+ {
+ "epoch": 68.33514986376022,
+ "grad_norm": 5.721966743469238,
+ "learning_rate": 4.813687332593287e-06,
+ "loss": 0.0741,
+ "step": 25079
+ },
+ {
+ "epoch": 68.33787465940054,
+ "grad_norm": 4.798506736755371,
+ "learning_rate": 4.812932821626113e-06,
+ "loss": 0.2038,
+ "step": 25080
+ },
+ {
+ "epoch": 68.34059945504087,
+ "grad_norm": 7.884695053100586,
+ "learning_rate": 4.812178351055653e-06,
+ "loss": 0.0779,
+ "step": 25081
+ },
+ {
+ "epoch": 68.34332425068119,
+ "grad_norm": 2.769942283630371,
+ "learning_rate": 4.811423920887781e-06,
+ "loss": 0.0533,
+ "step": 25082
+ },
+ {
+ "epoch": 68.34604904632153,
+ "grad_norm": 2.734086751937866,
+ "learning_rate": 4.810669531128368e-06,
+ "loss": 0.0589,
+ "step": 25083
+ },
+ {
+ "epoch": 68.34877384196186,
+ "grad_norm": 2.627162456512451,
+ "learning_rate": 4.809915181783298e-06,
+ "loss": 0.064,
+ "step": 25084
+ },
+ {
+ "epoch": 68.35149863760218,
+ "grad_norm": 3.023695468902588,
+ "learning_rate": 4.809160872858442e-06,
+ "loss": 0.0705,
+ "step": 25085
+ },
+ {
+ "epoch": 68.35422343324251,
+ "grad_norm": 3.268885374069214,
+ "learning_rate": 4.8084066043596724e-06,
+ "loss": 0.0597,
+ "step": 25086
+ },
+ {
+ "epoch": 68.35694822888283,
+ "grad_norm": 3.398163080215454,
+ "learning_rate": 4.807652376292863e-06,
+ "loss": 0.0813,
+ "step": 25087
+ },
+ {
+ "epoch": 68.35967302452316,
+ "grad_norm": 3.454350709915161,
+ "learning_rate": 4.806898188663892e-06,
+ "loss": 0.2177,
+ "step": 25088
+ },
+ {
+ "epoch": 68.3623978201635,
+ "grad_norm": 4.0141143798828125,
+ "learning_rate": 4.806144041478632e-06,
+ "loss": 0.1013,
+ "step": 25089
+ },
+ {
+ "epoch": 68.36512261580381,
+ "grad_norm": 8.191872596740723,
+ "learning_rate": 4.8053899347429545e-06,
+ "loss": 0.2007,
+ "step": 25090
+ },
+ {
+ "epoch": 68.36784741144415,
+ "grad_norm": 2.948700189590454,
+ "learning_rate": 4.804635868462729e-06,
+ "loss": 0.0463,
+ "step": 25091
+ },
+ {
+ "epoch": 68.37057220708446,
+ "grad_norm": 4.066028594970703,
+ "learning_rate": 4.803881842643837e-06,
+ "loss": 0.1249,
+ "step": 25092
+ },
+ {
+ "epoch": 68.3732970027248,
+ "grad_norm": 2.9195990562438965,
+ "learning_rate": 4.803127857292145e-06,
+ "loss": 0.0515,
+ "step": 25093
+ },
+ {
+ "epoch": 68.37602179836512,
+ "grad_norm": 3.255952835083008,
+ "learning_rate": 4.802373912413526e-06,
+ "loss": 0.062,
+ "step": 25094
+ },
+ {
+ "epoch": 68.37874659400545,
+ "grad_norm": 2.8404171466827393,
+ "learning_rate": 4.801620008013849e-06,
+ "loss": 0.0496,
+ "step": 25095
+ },
+ {
+ "epoch": 68.38147138964578,
+ "grad_norm": 3.142814874649048,
+ "learning_rate": 4.800866144098987e-06,
+ "loss": 0.1768,
+ "step": 25096
+ },
+ {
+ "epoch": 68.3841961852861,
+ "grad_norm": 2.899886131286621,
+ "learning_rate": 4.800112320674816e-06,
+ "loss": 0.0634,
+ "step": 25097
+ },
+ {
+ "epoch": 68.38692098092643,
+ "grad_norm": 2.8207359313964844,
+ "learning_rate": 4.799358537747203e-06,
+ "loss": 0.0508,
+ "step": 25098
+ },
+ {
+ "epoch": 68.38964577656675,
+ "grad_norm": 3.2844810485839844,
+ "learning_rate": 4.798604795322018e-06,
+ "loss": 0.2419,
+ "step": 25099
+ },
+ {
+ "epoch": 68.39237057220708,
+ "grad_norm": 3.1961586475372314,
+ "learning_rate": 4.797851093405128e-06,
+ "loss": 0.0828,
+ "step": 25100
+ },
+ {
+ "epoch": 68.39509536784742,
+ "grad_norm": 2.9002537727355957,
+ "learning_rate": 4.79709743200241e-06,
+ "loss": 0.033,
+ "step": 25101
+ },
+ {
+ "epoch": 68.39782016348774,
+ "grad_norm": 2.4350409507751465,
+ "learning_rate": 4.7963438111197306e-06,
+ "loss": 0.0447,
+ "step": 25102
+ },
+ {
+ "epoch": 68.40054495912807,
+ "grad_norm": 3.0927481651306152,
+ "learning_rate": 4.795590230762953e-06,
+ "loss": 0.0529,
+ "step": 25103
+ },
+ {
+ "epoch": 68.40326975476839,
+ "grad_norm": 2.9737613201141357,
+ "learning_rate": 4.794836690937955e-06,
+ "loss": 0.0373,
+ "step": 25104
+ },
+ {
+ "epoch": 68.40599455040872,
+ "grad_norm": 3.585712432861328,
+ "learning_rate": 4.794083191650603e-06,
+ "loss": 0.1791,
+ "step": 25105
+ },
+ {
+ "epoch": 68.40871934604904,
+ "grad_norm": 2.8583109378814697,
+ "learning_rate": 4.793329732906762e-06,
+ "loss": 0.0605,
+ "step": 25106
+ },
+ {
+ "epoch": 68.41144414168937,
+ "grad_norm": 3.3776392936706543,
+ "learning_rate": 4.792576314712297e-06,
+ "loss": 0.0766,
+ "step": 25107
+ },
+ {
+ "epoch": 68.4141689373297,
+ "grad_norm": 3.646101951599121,
+ "learning_rate": 4.7918229370730855e-06,
+ "loss": 0.07,
+ "step": 25108
+ },
+ {
+ "epoch": 68.41689373297002,
+ "grad_norm": 4.175693035125732,
+ "learning_rate": 4.7910695999949885e-06,
+ "loss": 0.0617,
+ "step": 25109
+ },
+ {
+ "epoch": 68.41961852861036,
+ "grad_norm": 3.119385242462158,
+ "learning_rate": 4.790316303483874e-06,
+ "loss": 0.0679,
+ "step": 25110
+ },
+ {
+ "epoch": 68.42234332425068,
+ "grad_norm": 3.341418504714966,
+ "learning_rate": 4.7895630475456054e-06,
+ "loss": 0.0559,
+ "step": 25111
+ },
+ {
+ "epoch": 68.42506811989101,
+ "grad_norm": 2.7829813957214355,
+ "learning_rate": 4.788809832186051e-06,
+ "loss": 0.0468,
+ "step": 25112
+ },
+ {
+ "epoch": 68.42779291553134,
+ "grad_norm": 4.060194969177246,
+ "learning_rate": 4.788056657411082e-06,
+ "loss": 0.0869,
+ "step": 25113
+ },
+ {
+ "epoch": 68.43051771117166,
+ "grad_norm": 2.6804492473602295,
+ "learning_rate": 4.787303523226561e-06,
+ "loss": 0.2156,
+ "step": 25114
+ },
+ {
+ "epoch": 68.433242506812,
+ "grad_norm": 5.664914608001709,
+ "learning_rate": 4.786550429638352e-06,
+ "loss": 0.1709,
+ "step": 25115
+ },
+ {
+ "epoch": 68.43596730245231,
+ "grad_norm": 2.7411012649536133,
+ "learning_rate": 4.785797376652315e-06,
+ "loss": 0.0668,
+ "step": 25116
+ },
+ {
+ "epoch": 68.43869209809264,
+ "grad_norm": 3.996340036392212,
+ "learning_rate": 4.785044364274325e-06,
+ "loss": 0.1414,
+ "step": 25117
+ },
+ {
+ "epoch": 68.44141689373296,
+ "grad_norm": 2.0779170989990234,
+ "learning_rate": 4.784291392510242e-06,
+ "loss": 0.0569,
+ "step": 25118
+ },
+ {
+ "epoch": 68.4441416893733,
+ "grad_norm": 2.0381622314453125,
+ "learning_rate": 4.78353846136593e-06,
+ "loss": 0.0256,
+ "step": 25119
+ },
+ {
+ "epoch": 68.44686648501363,
+ "grad_norm": 6.922408580780029,
+ "learning_rate": 4.782785570847248e-06,
+ "loss": 0.0789,
+ "step": 25120
+ },
+ {
+ "epoch": 68.44959128065395,
+ "grad_norm": 4.676624774932861,
+ "learning_rate": 4.782032720960068e-06,
+ "loss": 0.0395,
+ "step": 25121
+ },
+ {
+ "epoch": 68.45231607629428,
+ "grad_norm": 3.942620277404785,
+ "learning_rate": 4.781279911710249e-06,
+ "loss": 0.0855,
+ "step": 25122
+ },
+ {
+ "epoch": 68.4550408719346,
+ "grad_norm": 2.670901298522949,
+ "learning_rate": 4.780527143103655e-06,
+ "loss": 0.1506,
+ "step": 25123
+ },
+ {
+ "epoch": 68.45776566757493,
+ "grad_norm": 3.5805327892303467,
+ "learning_rate": 4.779774415146143e-06,
+ "loss": 0.1134,
+ "step": 25124
+ },
+ {
+ "epoch": 68.46049046321527,
+ "grad_norm": 3.4640166759490967,
+ "learning_rate": 4.779021727843585e-06,
+ "loss": 0.0546,
+ "step": 25125
+ },
+ {
+ "epoch": 68.46321525885558,
+ "grad_norm": 2.886509895324707,
+ "learning_rate": 4.7782690812018365e-06,
+ "loss": 0.1032,
+ "step": 25126
+ },
+ {
+ "epoch": 68.46594005449592,
+ "grad_norm": 3.5943520069122314,
+ "learning_rate": 4.777516475226757e-06,
+ "loss": 0.0892,
+ "step": 25127
+ },
+ {
+ "epoch": 68.46866485013624,
+ "grad_norm": 7.02865743637085,
+ "learning_rate": 4.776763909924215e-06,
+ "loss": 0.0359,
+ "step": 25128
+ },
+ {
+ "epoch": 68.47138964577657,
+ "grad_norm": 4.470008850097656,
+ "learning_rate": 4.776011385300066e-06,
+ "loss": 0.1249,
+ "step": 25129
+ },
+ {
+ "epoch": 68.47411444141689,
+ "grad_norm": 3.266449213027954,
+ "learning_rate": 4.77525890136017e-06,
+ "loss": 0.0592,
+ "step": 25130
+ },
+ {
+ "epoch": 68.47683923705722,
+ "grad_norm": 2.963853120803833,
+ "learning_rate": 4.774506458110393e-06,
+ "loss": 0.1043,
+ "step": 25131
+ },
+ {
+ "epoch": 68.47956403269755,
+ "grad_norm": 6.4120073318481445,
+ "learning_rate": 4.773754055556588e-06,
+ "loss": 0.0614,
+ "step": 25132
+ },
+ {
+ "epoch": 68.48228882833787,
+ "grad_norm": 4.997405529022217,
+ "learning_rate": 4.773001693704622e-06,
+ "loss": 0.0437,
+ "step": 25133
+ },
+ {
+ "epoch": 68.4850136239782,
+ "grad_norm": 3.729607343673706,
+ "learning_rate": 4.77224937256035e-06,
+ "loss": 0.1769,
+ "step": 25134
+ },
+ {
+ "epoch": 68.48773841961852,
+ "grad_norm": 3.7368216514587402,
+ "learning_rate": 4.7714970921296325e-06,
+ "loss": 0.1098,
+ "step": 25135
+ },
+ {
+ "epoch": 68.49046321525886,
+ "grad_norm": 3.899833917617798,
+ "learning_rate": 4.770744852418322e-06,
+ "loss": 0.0862,
+ "step": 25136
+ },
+ {
+ "epoch": 68.49318801089919,
+ "grad_norm": 3.8085601329803467,
+ "learning_rate": 4.769992653432287e-06,
+ "loss": 0.1327,
+ "step": 25137
+ },
+ {
+ "epoch": 68.49591280653951,
+ "grad_norm": 2.893799304962158,
+ "learning_rate": 4.7692404951773815e-06,
+ "loss": 0.0662,
+ "step": 25138
+ },
+ {
+ "epoch": 68.49863760217984,
+ "grad_norm": 2.687007427215576,
+ "learning_rate": 4.768488377659462e-06,
+ "loss": 0.0639,
+ "step": 25139
+ },
+ {
+ "epoch": 68.50136239782016,
+ "grad_norm": 3.9088146686553955,
+ "learning_rate": 4.767736300884384e-06,
+ "loss": 0.1024,
+ "step": 25140
+ },
+ {
+ "epoch": 68.50408719346049,
+ "grad_norm": 3.08231520652771,
+ "learning_rate": 4.766984264858009e-06,
+ "loss": 0.0434,
+ "step": 25141
+ },
+ {
+ "epoch": 68.50681198910081,
+ "grad_norm": 2.6814839839935303,
+ "learning_rate": 4.766232269586193e-06,
+ "loss": 0.1448,
+ "step": 25142
+ },
+ {
+ "epoch": 68.50953678474114,
+ "grad_norm": 2.983130693435669,
+ "learning_rate": 4.7654803150747915e-06,
+ "loss": 0.1021,
+ "step": 25143
+ },
+ {
+ "epoch": 68.51226158038148,
+ "grad_norm": 3.5604686737060547,
+ "learning_rate": 4.764728401329658e-06,
+ "loss": 0.1013,
+ "step": 25144
+ },
+ {
+ "epoch": 68.5149863760218,
+ "grad_norm": 4.0818281173706055,
+ "learning_rate": 4.763976528356654e-06,
+ "loss": 0.0871,
+ "step": 25145
+ },
+ {
+ "epoch": 68.51771117166213,
+ "grad_norm": 2.9919230937957764,
+ "learning_rate": 4.763224696161633e-06,
+ "loss": 0.0374,
+ "step": 25146
+ },
+ {
+ "epoch": 68.52043596730245,
+ "grad_norm": 3.354459524154663,
+ "learning_rate": 4.7624729047504455e-06,
+ "loss": 0.0532,
+ "step": 25147
+ },
+ {
+ "epoch": 68.52316076294278,
+ "grad_norm": 6.059757709503174,
+ "learning_rate": 4.76172115412895e-06,
+ "loss": 0.1336,
+ "step": 25148
+ },
+ {
+ "epoch": 68.52588555858311,
+ "grad_norm": 3.0966076850891113,
+ "learning_rate": 4.760969444303006e-06,
+ "loss": 0.1218,
+ "step": 25149
+ },
+ {
+ "epoch": 68.52861035422343,
+ "grad_norm": 3.0650575160980225,
+ "learning_rate": 4.7602177752784625e-06,
+ "loss": 0.1357,
+ "step": 25150
+ },
+ {
+ "epoch": 68.53133514986376,
+ "grad_norm": 3.5466384887695312,
+ "learning_rate": 4.7594661470611745e-06,
+ "loss": 0.0509,
+ "step": 25151
+ },
+ {
+ "epoch": 68.53405994550408,
+ "grad_norm": 10.345356941223145,
+ "learning_rate": 4.7587145596569925e-06,
+ "loss": 0.0422,
+ "step": 25152
+ },
+ {
+ "epoch": 68.53678474114442,
+ "grad_norm": 4.462990760803223,
+ "learning_rate": 4.757963013071777e-06,
+ "loss": 0.04,
+ "step": 25153
+ },
+ {
+ "epoch": 68.53950953678473,
+ "grad_norm": 5.018280029296875,
+ "learning_rate": 4.7572115073113755e-06,
+ "loss": 0.1542,
+ "step": 25154
+ },
+ {
+ "epoch": 68.54223433242507,
+ "grad_norm": 3.254812717437744,
+ "learning_rate": 4.756460042381642e-06,
+ "loss": 0.0706,
+ "step": 25155
+ },
+ {
+ "epoch": 68.5449591280654,
+ "grad_norm": 3.239781141281128,
+ "learning_rate": 4.755708618288426e-06,
+ "loss": 0.0707,
+ "step": 25156
+ },
+ {
+ "epoch": 68.54768392370572,
+ "grad_norm": 2.7286837100982666,
+ "learning_rate": 4.7549572350375864e-06,
+ "loss": 0.0435,
+ "step": 25157
+ },
+ {
+ "epoch": 68.55040871934605,
+ "grad_norm": 3.584249258041382,
+ "learning_rate": 4.75420589263497e-06,
+ "loss": 0.0806,
+ "step": 25158
+ },
+ {
+ "epoch": 68.55313351498637,
+ "grad_norm": 4.158878803253174,
+ "learning_rate": 4.753454591086431e-06,
+ "loss": 0.1047,
+ "step": 25159
+ },
+ {
+ "epoch": 68.5558583106267,
+ "grad_norm": 3.319026231765747,
+ "learning_rate": 4.7527033303978135e-06,
+ "loss": 0.047,
+ "step": 25160
+ },
+ {
+ "epoch": 68.55858310626704,
+ "grad_norm": 4.47884464263916,
+ "learning_rate": 4.751952110574977e-06,
+ "loss": 0.0943,
+ "step": 25161
+ },
+ {
+ "epoch": 68.56130790190736,
+ "grad_norm": 3.4570767879486084,
+ "learning_rate": 4.75120093162377e-06,
+ "loss": 0.0436,
+ "step": 25162
+ },
+ {
+ "epoch": 68.56403269754769,
+ "grad_norm": 2.990640878677368,
+ "learning_rate": 4.75044979355004e-06,
+ "loss": 0.0877,
+ "step": 25163
+ },
+ {
+ "epoch": 68.566757493188,
+ "grad_norm": 3.3707058429718018,
+ "learning_rate": 4.749698696359635e-06,
+ "loss": 0.0883,
+ "step": 25164
+ },
+ {
+ "epoch": 68.56948228882834,
+ "grad_norm": 5.598540306091309,
+ "learning_rate": 4.748947640058407e-06,
+ "loss": 0.07,
+ "step": 25165
+ },
+ {
+ "epoch": 68.57220708446866,
+ "grad_norm": 3.6774098873138428,
+ "learning_rate": 4.74819662465221e-06,
+ "loss": 0.1686,
+ "step": 25166
+ },
+ {
+ "epoch": 68.57493188010899,
+ "grad_norm": 2.633655309677124,
+ "learning_rate": 4.747445650146888e-06,
+ "loss": 0.0332,
+ "step": 25167
+ },
+ {
+ "epoch": 68.57765667574932,
+ "grad_norm": 2.769691228866577,
+ "learning_rate": 4.746694716548288e-06,
+ "loss": 0.1756,
+ "step": 25168
+ },
+ {
+ "epoch": 68.58038147138964,
+ "grad_norm": 3.9401910305023193,
+ "learning_rate": 4.745943823862263e-06,
+ "loss": 0.1578,
+ "step": 25169
+ },
+ {
+ "epoch": 68.58310626702998,
+ "grad_norm": 2.708097457885742,
+ "learning_rate": 4.745192972094659e-06,
+ "loss": 0.0359,
+ "step": 25170
+ },
+ {
+ "epoch": 68.5858310626703,
+ "grad_norm": 3.1952457427978516,
+ "learning_rate": 4.744442161251323e-06,
+ "loss": 0.1823,
+ "step": 25171
+ },
+ {
+ "epoch": 68.58855585831063,
+ "grad_norm": 2.921765089035034,
+ "learning_rate": 4.743691391338096e-06,
+ "loss": 0.2089,
+ "step": 25172
+ },
+ {
+ "epoch": 68.59128065395096,
+ "grad_norm": 2.713057279586792,
+ "learning_rate": 4.742940662360839e-06,
+ "loss": 0.0447,
+ "step": 25173
+ },
+ {
+ "epoch": 68.59400544959128,
+ "grad_norm": 2.8322789669036865,
+ "learning_rate": 4.742189974325389e-06,
+ "loss": 0.096,
+ "step": 25174
+ },
+ {
+ "epoch": 68.59673024523161,
+ "grad_norm": 6.807580471038818,
+ "learning_rate": 4.741439327237594e-06,
+ "loss": 0.0619,
+ "step": 25175
+ },
+ {
+ "epoch": 68.59945504087193,
+ "grad_norm": 3.18601393699646,
+ "learning_rate": 4.740688721103297e-06,
+ "loss": 0.1193,
+ "step": 25176
+ },
+ {
+ "epoch": 68.60217983651226,
+ "grad_norm": 3.1044204235076904,
+ "learning_rate": 4.739938155928351e-06,
+ "loss": 0.2166,
+ "step": 25177
+ },
+ {
+ "epoch": 68.60490463215258,
+ "grad_norm": 3.3225605487823486,
+ "learning_rate": 4.739187631718597e-06,
+ "loss": 0.0378,
+ "step": 25178
+ },
+ {
+ "epoch": 68.60762942779292,
+ "grad_norm": 3.8188860416412354,
+ "learning_rate": 4.73843714847988e-06,
+ "loss": 0.1016,
+ "step": 25179
+ },
+ {
+ "epoch": 68.61035422343325,
+ "grad_norm": 3.6552019119262695,
+ "learning_rate": 4.737686706218042e-06,
+ "loss": 0.0608,
+ "step": 25180
+ },
+ {
+ "epoch": 68.61307901907357,
+ "grad_norm": 2.598064661026001,
+ "learning_rate": 4.736936304938929e-06,
+ "loss": 0.1276,
+ "step": 25181
+ },
+ {
+ "epoch": 68.6158038147139,
+ "grad_norm": 6.786052227020264,
+ "learning_rate": 4.736185944648393e-06,
+ "loss": 0.0641,
+ "step": 25182
+ },
+ {
+ "epoch": 68.61852861035422,
+ "grad_norm": 5.362548828125,
+ "learning_rate": 4.73543562535227e-06,
+ "loss": 0.0602,
+ "step": 25183
+ },
+ {
+ "epoch": 68.62125340599455,
+ "grad_norm": 3.872605085372925,
+ "learning_rate": 4.734685347056405e-06,
+ "loss": 0.1098,
+ "step": 25184
+ },
+ {
+ "epoch": 68.62397820163488,
+ "grad_norm": 3.679784059524536,
+ "learning_rate": 4.7339351097666375e-06,
+ "loss": 0.0483,
+ "step": 25185
+ },
+ {
+ "epoch": 68.6267029972752,
+ "grad_norm": 3.1309032440185547,
+ "learning_rate": 4.733184913488817e-06,
+ "loss": 0.042,
+ "step": 25186
+ },
+ {
+ "epoch": 68.62942779291554,
+ "grad_norm": 4.85702657699585,
+ "learning_rate": 4.732434758228784e-06,
+ "loss": 0.1734,
+ "step": 25187
+ },
+ {
+ "epoch": 68.63215258855585,
+ "grad_norm": 4.458306789398193,
+ "learning_rate": 4.731684643992375e-06,
+ "loss": 0.059,
+ "step": 25188
+ },
+ {
+ "epoch": 68.63487738419619,
+ "grad_norm": 2.068485975265503,
+ "learning_rate": 4.730934570785441e-06,
+ "loss": 0.0292,
+ "step": 25189
+ },
+ {
+ "epoch": 68.6376021798365,
+ "grad_norm": 3.625941753387451,
+ "learning_rate": 4.730184538613818e-06,
+ "loss": 0.1159,
+ "step": 25190
+ },
+ {
+ "epoch": 68.64032697547684,
+ "grad_norm": 3.8161723613739014,
+ "learning_rate": 4.729434547483349e-06,
+ "loss": 0.1458,
+ "step": 25191
+ },
+ {
+ "epoch": 68.64305177111717,
+ "grad_norm": 4.030821323394775,
+ "learning_rate": 4.72868459739987e-06,
+ "loss": 0.1822,
+ "step": 25192
+ },
+ {
+ "epoch": 68.64577656675749,
+ "grad_norm": 3.8183062076568604,
+ "learning_rate": 4.727934688369229e-06,
+ "loss": 0.0592,
+ "step": 25193
+ },
+ {
+ "epoch": 68.64850136239782,
+ "grad_norm": 2.4527411460876465,
+ "learning_rate": 4.727184820397263e-06,
+ "loss": 0.0386,
+ "step": 25194
+ },
+ {
+ "epoch": 68.65122615803814,
+ "grad_norm": 2.4861347675323486,
+ "learning_rate": 4.7264349934898124e-06,
+ "loss": 0.1229,
+ "step": 25195
+ },
+ {
+ "epoch": 68.65395095367847,
+ "grad_norm": 3.8023078441619873,
+ "learning_rate": 4.725685207652712e-06,
+ "loss": 0.081,
+ "step": 25196
+ },
+ {
+ "epoch": 68.65667574931881,
+ "grad_norm": 3.4263360500335693,
+ "learning_rate": 4.724935462891811e-06,
+ "loss": 0.0855,
+ "step": 25197
+ },
+ {
+ "epoch": 68.65940054495913,
+ "grad_norm": 3.7822086811065674,
+ "learning_rate": 4.724185759212937e-06,
+ "loss": 0.0851,
+ "step": 25198
+ },
+ {
+ "epoch": 68.66212534059946,
+ "grad_norm": 3.5324831008911133,
+ "learning_rate": 4.723436096621939e-06,
+ "loss": 0.0527,
+ "step": 25199
+ },
+ {
+ "epoch": 68.66485013623978,
+ "grad_norm": 3.150998830795288,
+ "learning_rate": 4.722686475124652e-06,
+ "loss": 0.0605,
+ "step": 25200
+ },
+ {
+ "epoch": 68.66757493188011,
+ "grad_norm": 4.413564682006836,
+ "learning_rate": 4.7219368947269074e-06,
+ "loss": 0.0959,
+ "step": 25201
+ },
+ {
+ "epoch": 68.67029972752043,
+ "grad_norm": 2.7410242557525635,
+ "learning_rate": 4.721187355434553e-06,
+ "loss": 0.0351,
+ "step": 25202
+ },
+ {
+ "epoch": 68.67302452316076,
+ "grad_norm": 5.757294178009033,
+ "learning_rate": 4.720437857253421e-06,
+ "loss": 0.232,
+ "step": 25203
+ },
+ {
+ "epoch": 68.6757493188011,
+ "grad_norm": 4.090802192687988,
+ "learning_rate": 4.719688400189349e-06,
+ "loss": 0.0994,
+ "step": 25204
+ },
+ {
+ "epoch": 68.67847411444141,
+ "grad_norm": 3.794888973236084,
+ "learning_rate": 4.718938984248171e-06,
+ "loss": 0.0756,
+ "step": 25205
+ },
+ {
+ "epoch": 68.68119891008175,
+ "grad_norm": 3.559938907623291,
+ "learning_rate": 4.71818960943573e-06,
+ "loss": 0.1147,
+ "step": 25206
+ },
+ {
+ "epoch": 68.68392370572207,
+ "grad_norm": 5.694897174835205,
+ "learning_rate": 4.717440275757858e-06,
+ "loss": 0.083,
+ "step": 25207
+ },
+ {
+ "epoch": 68.6866485013624,
+ "grad_norm": 3.655093193054199,
+ "learning_rate": 4.71669098322039e-06,
+ "loss": 0.0837,
+ "step": 25208
+ },
+ {
+ "epoch": 68.68937329700273,
+ "grad_norm": 4.3597235679626465,
+ "learning_rate": 4.7159417318291604e-06,
+ "loss": 0.0904,
+ "step": 25209
+ },
+ {
+ "epoch": 68.69209809264305,
+ "grad_norm": 3.2580018043518066,
+ "learning_rate": 4.715192521590009e-06,
+ "loss": 0.0925,
+ "step": 25210
+ },
+ {
+ "epoch": 68.69482288828338,
+ "grad_norm": 2.5528197288513184,
+ "learning_rate": 4.7144433525087685e-06,
+ "loss": 0.1412,
+ "step": 25211
+ },
+ {
+ "epoch": 68.6975476839237,
+ "grad_norm": 2.148444175720215,
+ "learning_rate": 4.71369422459127e-06,
+ "loss": 0.0908,
+ "step": 25212
+ },
+ {
+ "epoch": 68.70027247956403,
+ "grad_norm": 2.996722936630249,
+ "learning_rate": 4.712945137843353e-06,
+ "loss": 0.135,
+ "step": 25213
+ },
+ {
+ "epoch": 68.70299727520435,
+ "grad_norm": 3.0027120113372803,
+ "learning_rate": 4.712196092270851e-06,
+ "loss": 0.087,
+ "step": 25214
+ },
+ {
+ "epoch": 68.70572207084469,
+ "grad_norm": 3.3666679859161377,
+ "learning_rate": 4.711447087879595e-06,
+ "loss": 0.0638,
+ "step": 25215
+ },
+ {
+ "epoch": 68.70844686648502,
+ "grad_norm": 3.1055893898010254,
+ "learning_rate": 4.710698124675415e-06,
+ "loss": 0.1127,
+ "step": 25216
+ },
+ {
+ "epoch": 68.71117166212534,
+ "grad_norm": 2.238966703414917,
+ "learning_rate": 4.709949202664147e-06,
+ "loss": 0.0344,
+ "step": 25217
+ },
+ {
+ "epoch": 68.71389645776567,
+ "grad_norm": 2.6818714141845703,
+ "learning_rate": 4.709200321851629e-06,
+ "loss": 0.0261,
+ "step": 25218
+ },
+ {
+ "epoch": 68.71662125340599,
+ "grad_norm": 3.0138466358184814,
+ "learning_rate": 4.708451482243688e-06,
+ "loss": 0.0363,
+ "step": 25219
+ },
+ {
+ "epoch": 68.71934604904632,
+ "grad_norm": 3.702580451965332,
+ "learning_rate": 4.707702683846157e-06,
+ "loss": 0.1585,
+ "step": 25220
+ },
+ {
+ "epoch": 68.72207084468666,
+ "grad_norm": 3.066445827484131,
+ "learning_rate": 4.706953926664863e-06,
+ "loss": 0.0378,
+ "step": 25221
+ },
+ {
+ "epoch": 68.72479564032697,
+ "grad_norm": 2.9520070552825928,
+ "learning_rate": 4.706205210705645e-06,
+ "loss": 0.059,
+ "step": 25222
+ },
+ {
+ "epoch": 68.7275204359673,
+ "grad_norm": 10.24441146850586,
+ "learning_rate": 4.705456535974332e-06,
+ "loss": 0.052,
+ "step": 25223
+ },
+ {
+ "epoch": 68.73024523160763,
+ "grad_norm": 3.098729372024536,
+ "learning_rate": 4.704707902476752e-06,
+ "loss": 0.0672,
+ "step": 25224
+ },
+ {
+ "epoch": 68.73297002724796,
+ "grad_norm": 2.529139995574951,
+ "learning_rate": 4.703959310218733e-06,
+ "loss": 0.0333,
+ "step": 25225
+ },
+ {
+ "epoch": 68.73569482288828,
+ "grad_norm": 6.588604927062988,
+ "learning_rate": 4.703210759206112e-06,
+ "loss": 0.0867,
+ "step": 25226
+ },
+ {
+ "epoch": 68.73841961852861,
+ "grad_norm": 3.233839511871338,
+ "learning_rate": 4.702462249444714e-06,
+ "loss": 0.1194,
+ "step": 25227
+ },
+ {
+ "epoch": 68.74114441416894,
+ "grad_norm": 4.281998634338379,
+ "learning_rate": 4.7017137809403716e-06,
+ "loss": 0.1756,
+ "step": 25228
+ },
+ {
+ "epoch": 68.74386920980926,
+ "grad_norm": 4.349316596984863,
+ "learning_rate": 4.700965353698907e-06,
+ "loss": 0.0985,
+ "step": 25229
+ },
+ {
+ "epoch": 68.7465940054496,
+ "grad_norm": 3.625556707382202,
+ "learning_rate": 4.700216967726157e-06,
+ "loss": 0.1254,
+ "step": 25230
+ },
+ {
+ "epoch": 68.74931880108991,
+ "grad_norm": 5.871299743652344,
+ "learning_rate": 4.699468623027948e-06,
+ "loss": 0.0972,
+ "step": 25231
+ },
+ {
+ "epoch": 68.75204359673025,
+ "grad_norm": 3.9378881454467773,
+ "learning_rate": 4.698720319610105e-06,
+ "loss": 0.1128,
+ "step": 25232
+ },
+ {
+ "epoch": 68.75476839237058,
+ "grad_norm": 2.4924910068511963,
+ "learning_rate": 4.69797205747845e-06,
+ "loss": 0.0284,
+ "step": 25233
+ },
+ {
+ "epoch": 68.7574931880109,
+ "grad_norm": 5.077095985412598,
+ "learning_rate": 4.6972238366388265e-06,
+ "loss": 0.0569,
+ "step": 25234
+ },
+ {
+ "epoch": 68.76021798365123,
+ "grad_norm": 3.356592893600464,
+ "learning_rate": 4.696475657097054e-06,
+ "loss": 0.0822,
+ "step": 25235
+ },
+ {
+ "epoch": 68.76294277929155,
+ "grad_norm": 4.1355881690979,
+ "learning_rate": 4.6957275188589565e-06,
+ "loss": 0.0346,
+ "step": 25236
+ },
+ {
+ "epoch": 68.76566757493188,
+ "grad_norm": 4.216447353363037,
+ "learning_rate": 4.69497942193036e-06,
+ "loss": 0.0641,
+ "step": 25237
+ },
+ {
+ "epoch": 68.7683923705722,
+ "grad_norm": 4.259905815124512,
+ "learning_rate": 4.694231366317096e-06,
+ "loss": 0.0797,
+ "step": 25238
+ },
+ {
+ "epoch": 68.77111716621253,
+ "grad_norm": 2.423780918121338,
+ "learning_rate": 4.693483352024988e-06,
+ "loss": 0.036,
+ "step": 25239
+ },
+ {
+ "epoch": 68.77384196185287,
+ "grad_norm": 3.8292150497436523,
+ "learning_rate": 4.6927353790598595e-06,
+ "loss": 0.0732,
+ "step": 25240
+ },
+ {
+ "epoch": 68.77656675749319,
+ "grad_norm": 4.539219856262207,
+ "learning_rate": 4.691987447427535e-06,
+ "loss": 0.1038,
+ "step": 25241
+ },
+ {
+ "epoch": 68.77929155313352,
+ "grad_norm": 2.4098050594329834,
+ "learning_rate": 4.691239557133844e-06,
+ "loss": 0.031,
+ "step": 25242
+ },
+ {
+ "epoch": 68.78201634877384,
+ "grad_norm": 3.4923839569091797,
+ "learning_rate": 4.690491708184609e-06,
+ "loss": 0.1443,
+ "step": 25243
+ },
+ {
+ "epoch": 68.78474114441417,
+ "grad_norm": 2.1044909954071045,
+ "learning_rate": 4.689743900585654e-06,
+ "loss": 0.0782,
+ "step": 25244
+ },
+ {
+ "epoch": 68.7874659400545,
+ "grad_norm": 3.4952354431152344,
+ "learning_rate": 4.688996134342798e-06,
+ "loss": 0.082,
+ "step": 25245
+ },
+ {
+ "epoch": 68.79019073569482,
+ "grad_norm": 4.9752912521362305,
+ "learning_rate": 4.688248409461873e-06,
+ "loss": 0.1302,
+ "step": 25246
+ },
+ {
+ "epoch": 68.79291553133515,
+ "grad_norm": 3.041003942489624,
+ "learning_rate": 4.687500725948699e-06,
+ "loss": 0.0425,
+ "step": 25247
+ },
+ {
+ "epoch": 68.79564032697547,
+ "grad_norm": 3.128225564956665,
+ "learning_rate": 4.686753083809098e-06,
+ "loss": 0.2146,
+ "step": 25248
+ },
+ {
+ "epoch": 68.7983651226158,
+ "grad_norm": 3.4257009029388428,
+ "learning_rate": 4.68600548304889e-06,
+ "loss": 0.084,
+ "step": 25249
+ },
+ {
+ "epoch": 68.80108991825612,
+ "grad_norm": 3.7465832233428955,
+ "learning_rate": 4.685257923673899e-06,
+ "loss": 0.2516,
+ "step": 25250
+ },
+ {
+ "epoch": 68.80381471389646,
+ "grad_norm": 2.69468092918396,
+ "learning_rate": 4.6845104056899525e-06,
+ "loss": 0.0383,
+ "step": 25251
+ },
+ {
+ "epoch": 68.80653950953679,
+ "grad_norm": 2.782733917236328,
+ "learning_rate": 4.683762929102868e-06,
+ "loss": 0.036,
+ "step": 25252
+ },
+ {
+ "epoch": 68.80926430517711,
+ "grad_norm": 12.41683578491211,
+ "learning_rate": 4.683015493918463e-06,
+ "loss": 0.0443,
+ "step": 25253
+ },
+ {
+ "epoch": 68.81198910081744,
+ "grad_norm": 3.2941360473632812,
+ "learning_rate": 4.682268100142567e-06,
+ "loss": 0.1425,
+ "step": 25254
+ },
+ {
+ "epoch": 68.81471389645776,
+ "grad_norm": 3.0366806983947754,
+ "learning_rate": 4.681520747780994e-06,
+ "loss": 0.0552,
+ "step": 25255
+ },
+ {
+ "epoch": 68.8174386920981,
+ "grad_norm": 5.389036655426025,
+ "learning_rate": 4.680773436839566e-06,
+ "loss": 0.0725,
+ "step": 25256
+ },
+ {
+ "epoch": 68.82016348773843,
+ "grad_norm": 4.012606620788574,
+ "learning_rate": 4.680026167324101e-06,
+ "loss": 0.144,
+ "step": 25257
+ },
+ {
+ "epoch": 68.82288828337875,
+ "grad_norm": 3.0946478843688965,
+ "learning_rate": 4.6792789392404246e-06,
+ "loss": 0.0747,
+ "step": 25258
+ },
+ {
+ "epoch": 68.82561307901908,
+ "grad_norm": 3.341019630432129,
+ "learning_rate": 4.678531752594352e-06,
+ "loss": 0.0629,
+ "step": 25259
+ },
+ {
+ "epoch": 68.8283378746594,
+ "grad_norm": 2.997502565383911,
+ "learning_rate": 4.677784607391703e-06,
+ "loss": 0.0772,
+ "step": 25260
+ },
+ {
+ "epoch": 68.83106267029973,
+ "grad_norm": 2.483455181121826,
+ "learning_rate": 4.677037503638293e-06,
+ "loss": 0.1807,
+ "step": 25261
+ },
+ {
+ "epoch": 68.83378746594005,
+ "grad_norm": 3.285806179046631,
+ "learning_rate": 4.6762904413399465e-06,
+ "loss": 0.1326,
+ "step": 25262
+ },
+ {
+ "epoch": 68.83651226158038,
+ "grad_norm": 4.679166793823242,
+ "learning_rate": 4.675543420502479e-06,
+ "loss": 0.0922,
+ "step": 25263
+ },
+ {
+ "epoch": 68.83923705722071,
+ "grad_norm": 2.4225618839263916,
+ "learning_rate": 4.674796441131708e-06,
+ "loss": 0.0405,
+ "step": 25264
+ },
+ {
+ "epoch": 68.84196185286103,
+ "grad_norm": 2.8314013481140137,
+ "learning_rate": 4.6740495032334475e-06,
+ "loss": 0.0441,
+ "step": 25265
+ },
+ {
+ "epoch": 68.84468664850137,
+ "grad_norm": 3.1308062076568604,
+ "learning_rate": 4.673302606813521e-06,
+ "loss": 0.0679,
+ "step": 25266
+ },
+ {
+ "epoch": 68.84741144414168,
+ "grad_norm": 2.5626614093780518,
+ "learning_rate": 4.67255575187774e-06,
+ "loss": 0.1095,
+ "step": 25267
+ },
+ {
+ "epoch": 68.85013623978202,
+ "grad_norm": 4.718066215515137,
+ "learning_rate": 4.671808938431927e-06,
+ "loss": 0.1733,
+ "step": 25268
+ },
+ {
+ "epoch": 68.85286103542235,
+ "grad_norm": 2.801140785217285,
+ "learning_rate": 4.671062166481893e-06,
+ "loss": 0.115,
+ "step": 25269
+ },
+ {
+ "epoch": 68.85558583106267,
+ "grad_norm": 3.2998874187469482,
+ "learning_rate": 4.670315436033452e-06,
+ "loss": 0.0647,
+ "step": 25270
+ },
+ {
+ "epoch": 68.858310626703,
+ "grad_norm": 2.5194222927093506,
+ "learning_rate": 4.669568747092427e-06,
+ "loss": 0.0493,
+ "step": 25271
+ },
+ {
+ "epoch": 68.86103542234332,
+ "grad_norm": 2.6707797050476074,
+ "learning_rate": 4.668822099664629e-06,
+ "loss": 0.0793,
+ "step": 25272
+ },
+ {
+ "epoch": 68.86376021798365,
+ "grad_norm": 3.8744704723358154,
+ "learning_rate": 4.668075493755873e-06,
+ "loss": 0.029,
+ "step": 25273
+ },
+ {
+ "epoch": 68.86648501362397,
+ "grad_norm": 3.476962089538574,
+ "learning_rate": 4.667328929371969e-06,
+ "loss": 0.1315,
+ "step": 25274
+ },
+ {
+ "epoch": 68.8692098092643,
+ "grad_norm": 3.791701078414917,
+ "learning_rate": 4.66658240651874e-06,
+ "loss": 0.0587,
+ "step": 25275
+ },
+ {
+ "epoch": 68.87193460490464,
+ "grad_norm": 2.206984758377075,
+ "learning_rate": 4.665835925201995e-06,
+ "loss": 0.0261,
+ "step": 25276
+ },
+ {
+ "epoch": 68.87465940054496,
+ "grad_norm": 7.005254745483398,
+ "learning_rate": 4.665089485427546e-06,
+ "loss": 0.0725,
+ "step": 25277
+ },
+ {
+ "epoch": 68.87738419618529,
+ "grad_norm": 2.7205026149749756,
+ "learning_rate": 4.664343087201211e-06,
+ "loss": 0.0532,
+ "step": 25278
+ },
+ {
+ "epoch": 68.88010899182561,
+ "grad_norm": 4.036895751953125,
+ "learning_rate": 4.6635967305288e-06,
+ "loss": 0.048,
+ "step": 25279
+ },
+ {
+ "epoch": 68.88283378746594,
+ "grad_norm": 2.835393190383911,
+ "learning_rate": 4.662850415416127e-06,
+ "loss": 0.1298,
+ "step": 25280
+ },
+ {
+ "epoch": 68.88555858310627,
+ "grad_norm": 3.6264708042144775,
+ "learning_rate": 4.6621041418689985e-06,
+ "loss": 0.0497,
+ "step": 25281
+ },
+ {
+ "epoch": 68.88828337874659,
+ "grad_norm": 2.5192103385925293,
+ "learning_rate": 4.661357909893235e-06,
+ "loss": 0.0923,
+ "step": 25282
+ },
+ {
+ "epoch": 68.89100817438693,
+ "grad_norm": 5.387713432312012,
+ "learning_rate": 4.660611719494644e-06,
+ "loss": 0.1054,
+ "step": 25283
+ },
+ {
+ "epoch": 68.89373297002724,
+ "grad_norm": 3.527350902557373,
+ "learning_rate": 4.6598655706790344e-06,
+ "loss": 0.0993,
+ "step": 25284
+ },
+ {
+ "epoch": 68.89645776566758,
+ "grad_norm": 4.775354862213135,
+ "learning_rate": 4.659119463452223e-06,
+ "loss": 0.055,
+ "step": 25285
+ },
+ {
+ "epoch": 68.8991825613079,
+ "grad_norm": 5.509058475494385,
+ "learning_rate": 4.658373397820013e-06,
+ "loss": 0.059,
+ "step": 25286
+ },
+ {
+ "epoch": 68.90190735694823,
+ "grad_norm": 3.4188144207000732,
+ "learning_rate": 4.657627373788224e-06,
+ "loss": 0.0444,
+ "step": 25287
+ },
+ {
+ "epoch": 68.90463215258856,
+ "grad_norm": 2.3662898540496826,
+ "learning_rate": 4.65688139136266e-06,
+ "loss": 0.0293,
+ "step": 25288
+ },
+ {
+ "epoch": 68.90735694822888,
+ "grad_norm": 4.150286674499512,
+ "learning_rate": 4.656135450549132e-06,
+ "loss": 0.1194,
+ "step": 25289
+ },
+ {
+ "epoch": 68.91008174386921,
+ "grad_norm": 3.394137144088745,
+ "learning_rate": 4.655389551353445e-06,
+ "loss": 0.0794,
+ "step": 25290
+ },
+ {
+ "epoch": 68.91280653950953,
+ "grad_norm": 3.964113235473633,
+ "learning_rate": 4.654643693781417e-06,
+ "loss": 0.22,
+ "step": 25291
+ },
+ {
+ "epoch": 68.91553133514986,
+ "grad_norm": 2.2684898376464844,
+ "learning_rate": 4.653897877838851e-06,
+ "loss": 0.0394,
+ "step": 25292
+ },
+ {
+ "epoch": 68.9182561307902,
+ "grad_norm": 2.652017593383789,
+ "learning_rate": 4.6531521035315566e-06,
+ "loss": 0.0661,
+ "step": 25293
+ },
+ {
+ "epoch": 68.92098092643052,
+ "grad_norm": 3.710247278213501,
+ "learning_rate": 4.652406370865338e-06,
+ "loss": 0.0798,
+ "step": 25294
+ },
+ {
+ "epoch": 68.92370572207085,
+ "grad_norm": 4.017529487609863,
+ "learning_rate": 4.65166067984601e-06,
+ "loss": 0.0678,
+ "step": 25295
+ },
+ {
+ "epoch": 68.92643051771117,
+ "grad_norm": 3.1239895820617676,
+ "learning_rate": 4.650915030479376e-06,
+ "loss": 0.1691,
+ "step": 25296
+ },
+ {
+ "epoch": 68.9291553133515,
+ "grad_norm": 2.6684730052948,
+ "learning_rate": 4.65016942277124e-06,
+ "loss": 0.278,
+ "step": 25297
+ },
+ {
+ "epoch": 68.93188010899182,
+ "grad_norm": 1.8895353078842163,
+ "learning_rate": 4.6494238567274175e-06,
+ "loss": 0.0257,
+ "step": 25298
+ },
+ {
+ "epoch": 68.93460490463215,
+ "grad_norm": 3.6534266471862793,
+ "learning_rate": 4.648678332353709e-06,
+ "loss": 0.0791,
+ "step": 25299
+ },
+ {
+ "epoch": 68.93732970027249,
+ "grad_norm": 3.0218663215637207,
+ "learning_rate": 4.64793284965592e-06,
+ "loss": 0.0404,
+ "step": 25300
+ },
+ {
+ "epoch": 68.9400544959128,
+ "grad_norm": 2.994173049926758,
+ "learning_rate": 4.647187408639855e-06,
+ "loss": 0.0413,
+ "step": 25301
+ },
+ {
+ "epoch": 68.94277929155314,
+ "grad_norm": 3.136317491531372,
+ "learning_rate": 4.646442009311323e-06,
+ "loss": 0.0766,
+ "step": 25302
+ },
+ {
+ "epoch": 68.94550408719346,
+ "grad_norm": 3.6843063831329346,
+ "learning_rate": 4.645696651676131e-06,
+ "loss": 0.1817,
+ "step": 25303
+ },
+ {
+ "epoch": 68.94822888283379,
+ "grad_norm": 4.230409145355225,
+ "learning_rate": 4.644951335740081e-06,
+ "loss": 0.1955,
+ "step": 25304
+ },
+ {
+ "epoch": 68.95095367847412,
+ "grad_norm": 3.020812749862671,
+ "learning_rate": 4.644206061508979e-06,
+ "loss": 0.1499,
+ "step": 25305
+ },
+ {
+ "epoch": 68.95367847411444,
+ "grad_norm": 3.0145413875579834,
+ "learning_rate": 4.643460828988623e-06,
+ "loss": 0.0394,
+ "step": 25306
+ },
+ {
+ "epoch": 68.95640326975477,
+ "grad_norm": 2.7844457626342773,
+ "learning_rate": 4.642715638184825e-06,
+ "loss": 0.0361,
+ "step": 25307
+ },
+ {
+ "epoch": 68.95912806539509,
+ "grad_norm": 3.670297861099243,
+ "learning_rate": 4.641970489103386e-06,
+ "loss": 0.0626,
+ "step": 25308
+ },
+ {
+ "epoch": 68.96185286103542,
+ "grad_norm": 3.8738906383514404,
+ "learning_rate": 4.641225381750109e-06,
+ "loss": 0.0491,
+ "step": 25309
+ },
+ {
+ "epoch": 68.96457765667574,
+ "grad_norm": 4.277965068817139,
+ "learning_rate": 4.640480316130791e-06,
+ "loss": 0.1066,
+ "step": 25310
+ },
+ {
+ "epoch": 68.96730245231608,
+ "grad_norm": 2.212169647216797,
+ "learning_rate": 4.639735292251244e-06,
+ "loss": 0.0364,
+ "step": 25311
+ },
+ {
+ "epoch": 68.97002724795641,
+ "grad_norm": 2.7719273567199707,
+ "learning_rate": 4.638990310117266e-06,
+ "loss": 0.0607,
+ "step": 25312
+ },
+ {
+ "epoch": 68.97275204359673,
+ "grad_norm": 4.156070232391357,
+ "learning_rate": 4.638245369734659e-06,
+ "loss": 0.056,
+ "step": 25313
+ },
+ {
+ "epoch": 68.97547683923706,
+ "grad_norm": 2.888261079788208,
+ "learning_rate": 4.637500471109222e-06,
+ "loss": 0.0426,
+ "step": 25314
+ },
+ {
+ "epoch": 68.97820163487738,
+ "grad_norm": 2.8456966876983643,
+ "learning_rate": 4.6367556142467605e-06,
+ "loss": 0.0748,
+ "step": 25315
+ },
+ {
+ "epoch": 68.98092643051771,
+ "grad_norm": 3.2775473594665527,
+ "learning_rate": 4.636010799153074e-06,
+ "loss": 0.0408,
+ "step": 25316
+ },
+ {
+ "epoch": 68.98365122615803,
+ "grad_norm": 3.8727123737335205,
+ "learning_rate": 4.635266025833964e-06,
+ "loss": 0.0355,
+ "step": 25317
+ },
+ {
+ "epoch": 68.98637602179836,
+ "grad_norm": 3.1337437629699707,
+ "learning_rate": 4.6345212942952255e-06,
+ "loss": 0.0447,
+ "step": 25318
+ },
+ {
+ "epoch": 68.9891008174387,
+ "grad_norm": 3.4043190479278564,
+ "learning_rate": 4.6337766045426625e-06,
+ "loss": 0.0977,
+ "step": 25319
+ },
+ {
+ "epoch": 68.99182561307902,
+ "grad_norm": 2.9682180881500244,
+ "learning_rate": 4.633031956582077e-06,
+ "loss": 0.0658,
+ "step": 25320
+ },
+ {
+ "epoch": 68.99455040871935,
+ "grad_norm": 2.725248336791992,
+ "learning_rate": 4.6322873504192675e-06,
+ "loss": 0.0964,
+ "step": 25321
+ },
+ {
+ "epoch": 68.99727520435967,
+ "grad_norm": 2.6156909465789795,
+ "learning_rate": 4.631542786060027e-06,
+ "loss": 0.069,
+ "step": 25322
+ },
+ {
+ "epoch": 69.0,
+ "grad_norm": 3.5765891075134277,
+ "learning_rate": 4.630798263510162e-06,
+ "loss": 0.1748,
+ "step": 25323
+ },
+ {
+ "epoch": 69.00272479564033,
+ "grad_norm": 2.973284959793091,
+ "learning_rate": 4.630053782775467e-06,
+ "loss": 0.0512,
+ "step": 25324
+ },
+ {
+ "epoch": 69.00544959128065,
+ "grad_norm": 2.2170028686523438,
+ "learning_rate": 4.629309343861741e-06,
+ "loss": 0.0336,
+ "step": 25325
+ },
+ {
+ "epoch": 69.00817438692098,
+ "grad_norm": 2.648892641067505,
+ "learning_rate": 4.628564946774777e-06,
+ "loss": 0.0665,
+ "step": 25326
+ },
+ {
+ "epoch": 69.0108991825613,
+ "grad_norm": 3.3921704292297363,
+ "learning_rate": 4.62782059152038e-06,
+ "loss": 0.1104,
+ "step": 25327
+ },
+ {
+ "epoch": 69.01362397820164,
+ "grad_norm": 2.8230392932891846,
+ "learning_rate": 4.627076278104343e-06,
+ "loss": 0.0478,
+ "step": 25328
+ },
+ {
+ "epoch": 69.01634877384195,
+ "grad_norm": 2.938129186630249,
+ "learning_rate": 4.626332006532464e-06,
+ "loss": 0.0954,
+ "step": 25329
+ },
+ {
+ "epoch": 69.01907356948229,
+ "grad_norm": 4.370748996734619,
+ "learning_rate": 4.625587776810534e-06,
+ "loss": 0.0938,
+ "step": 25330
+ },
+ {
+ "epoch": 69.02179836512262,
+ "grad_norm": 2.6737706661224365,
+ "learning_rate": 4.624843588944357e-06,
+ "loss": 0.0499,
+ "step": 25331
+ },
+ {
+ "epoch": 69.02452316076294,
+ "grad_norm": 3.3993330001831055,
+ "learning_rate": 4.624099442939726e-06,
+ "loss": 0.0714,
+ "step": 25332
+ },
+ {
+ "epoch": 69.02724795640327,
+ "grad_norm": 2.5821268558502197,
+ "learning_rate": 4.623355338802434e-06,
+ "loss": 0.081,
+ "step": 25333
+ },
+ {
+ "epoch": 69.02997275204359,
+ "grad_norm": 3.2227485179901123,
+ "learning_rate": 4.622611276538276e-06,
+ "loss": 0.0677,
+ "step": 25334
+ },
+ {
+ "epoch": 69.03269754768392,
+ "grad_norm": 2.1117255687713623,
+ "learning_rate": 4.62186725615305e-06,
+ "loss": 0.0333,
+ "step": 25335
+ },
+ {
+ "epoch": 69.03542234332426,
+ "grad_norm": 3.1656744480133057,
+ "learning_rate": 4.621123277652546e-06,
+ "loss": 0.037,
+ "step": 25336
+ },
+ {
+ "epoch": 69.03814713896458,
+ "grad_norm": 4.241729736328125,
+ "learning_rate": 4.620379341042564e-06,
+ "loss": 0.1225,
+ "step": 25337
+ },
+ {
+ "epoch": 69.04087193460491,
+ "grad_norm": 4.0763349533081055,
+ "learning_rate": 4.619635446328895e-06,
+ "loss": 0.0599,
+ "step": 25338
+ },
+ {
+ "epoch": 69.04359673024523,
+ "grad_norm": 4.741207599639893,
+ "learning_rate": 4.618891593517328e-06,
+ "loss": 0.1084,
+ "step": 25339
+ },
+ {
+ "epoch": 69.04632152588556,
+ "grad_norm": 3.7330992221832275,
+ "learning_rate": 4.618147782613663e-06,
+ "loss": 0.0644,
+ "step": 25340
+ },
+ {
+ "epoch": 69.04904632152588,
+ "grad_norm": 2.286592721939087,
+ "learning_rate": 4.617404013623692e-06,
+ "loss": 0.0336,
+ "step": 25341
+ },
+ {
+ "epoch": 69.05177111716621,
+ "grad_norm": 2.8393232822418213,
+ "learning_rate": 4.616660286553199e-06,
+ "loss": 0.061,
+ "step": 25342
+ },
+ {
+ "epoch": 69.05449591280654,
+ "grad_norm": 2.792849540710449,
+ "learning_rate": 4.615916601407988e-06,
+ "loss": 0.1103,
+ "step": 25343
+ },
+ {
+ "epoch": 69.05722070844686,
+ "grad_norm": 3.050400972366333,
+ "learning_rate": 4.615172958193845e-06,
+ "loss": 0.0836,
+ "step": 25344
+ },
+ {
+ "epoch": 69.0599455040872,
+ "grad_norm": 3.8424429893493652,
+ "learning_rate": 4.614429356916561e-06,
+ "loss": 0.1374,
+ "step": 25345
+ },
+ {
+ "epoch": 69.06267029972751,
+ "grad_norm": 3.551499128341675,
+ "learning_rate": 4.613685797581925e-06,
+ "loss": 0.0867,
+ "step": 25346
+ },
+ {
+ "epoch": 69.06539509536785,
+ "grad_norm": 5.33734655380249,
+ "learning_rate": 4.612942280195734e-06,
+ "loss": 0.0901,
+ "step": 25347
+ },
+ {
+ "epoch": 69.06811989100818,
+ "grad_norm": 2.7843034267425537,
+ "learning_rate": 4.612198804763775e-06,
+ "loss": 0.077,
+ "step": 25348
+ },
+ {
+ "epoch": 69.0708446866485,
+ "grad_norm": 3.4353561401367188,
+ "learning_rate": 4.611455371291837e-06,
+ "loss": 0.1888,
+ "step": 25349
+ },
+ {
+ "epoch": 69.07356948228883,
+ "grad_norm": 3.2494888305664062,
+ "learning_rate": 4.6107119797857096e-06,
+ "loss": 0.0602,
+ "step": 25350
+ },
+ {
+ "epoch": 69.07629427792915,
+ "grad_norm": 2.899702548980713,
+ "learning_rate": 4.609968630251187e-06,
+ "loss": 0.056,
+ "step": 25351
+ },
+ {
+ "epoch": 69.07901907356948,
+ "grad_norm": 2.1720457077026367,
+ "learning_rate": 4.6092253226940546e-06,
+ "loss": 0.0361,
+ "step": 25352
+ },
+ {
+ "epoch": 69.0817438692098,
+ "grad_norm": 2.9516775608062744,
+ "learning_rate": 4.608482057120099e-06,
+ "loss": 0.116,
+ "step": 25353
+ },
+ {
+ "epoch": 69.08446866485014,
+ "grad_norm": 2.660510540008545,
+ "learning_rate": 4.6077388335351144e-06,
+ "loss": 0.0417,
+ "step": 25354
+ },
+ {
+ "epoch": 69.08719346049047,
+ "grad_norm": 5.641421318054199,
+ "learning_rate": 4.6069956519448836e-06,
+ "loss": 0.0838,
+ "step": 25355
+ },
+ {
+ "epoch": 69.08991825613079,
+ "grad_norm": 3.240388870239258,
+ "learning_rate": 4.606252512355199e-06,
+ "loss": 0.0466,
+ "step": 25356
+ },
+ {
+ "epoch": 69.09264305177112,
+ "grad_norm": 3.065953254699707,
+ "learning_rate": 4.605509414771847e-06,
+ "loss": 0.185,
+ "step": 25357
+ },
+ {
+ "epoch": 69.09536784741144,
+ "grad_norm": 2.6469898223876953,
+ "learning_rate": 4.6047663592006155e-06,
+ "loss": 0.0436,
+ "step": 25358
+ },
+ {
+ "epoch": 69.09809264305177,
+ "grad_norm": 3.0340006351470947,
+ "learning_rate": 4.6040233456472845e-06,
+ "loss": 0.042,
+ "step": 25359
+ },
+ {
+ "epoch": 69.1008174386921,
+ "grad_norm": 3.9148831367492676,
+ "learning_rate": 4.60328037411765e-06,
+ "loss": 0.0393,
+ "step": 25360
+ },
+ {
+ "epoch": 69.10354223433242,
+ "grad_norm": 3.3091955184936523,
+ "learning_rate": 4.602537444617495e-06,
+ "loss": 0.1229,
+ "step": 25361
+ },
+ {
+ "epoch": 69.10626702997276,
+ "grad_norm": 2.4060099124908447,
+ "learning_rate": 4.601794557152602e-06,
+ "loss": 0.1009,
+ "step": 25362
+ },
+ {
+ "epoch": 69.10899182561307,
+ "grad_norm": 5.231338977813721,
+ "learning_rate": 4.60105171172876e-06,
+ "loss": 0.0999,
+ "step": 25363
+ },
+ {
+ "epoch": 69.11171662125341,
+ "grad_norm": 2.4197018146514893,
+ "learning_rate": 4.6003089083517545e-06,
+ "loss": 0.029,
+ "step": 25364
+ },
+ {
+ "epoch": 69.11444141689373,
+ "grad_norm": 4.155883312225342,
+ "learning_rate": 4.599566147027371e-06,
+ "loss": 0.1456,
+ "step": 25365
+ },
+ {
+ "epoch": 69.11716621253406,
+ "grad_norm": 10.01461124420166,
+ "learning_rate": 4.598823427761387e-06,
+ "loss": 0.0622,
+ "step": 25366
+ },
+ {
+ "epoch": 69.11989100817439,
+ "grad_norm": 3.3596034049987793,
+ "learning_rate": 4.598080750559597e-06,
+ "loss": 0.0503,
+ "step": 25367
+ },
+ {
+ "epoch": 69.12261580381471,
+ "grad_norm": 2.7877581119537354,
+ "learning_rate": 4.597338115427781e-06,
+ "loss": 0.0411,
+ "step": 25368
+ },
+ {
+ "epoch": 69.12534059945504,
+ "grad_norm": 2.8343818187713623,
+ "learning_rate": 4.596595522371721e-06,
+ "loss": 0.0636,
+ "step": 25369
+ },
+ {
+ "epoch": 69.12806539509536,
+ "grad_norm": 4.523220062255859,
+ "learning_rate": 4.595852971397197e-06,
+ "loss": 0.0883,
+ "step": 25370
+ },
+ {
+ "epoch": 69.1307901907357,
+ "grad_norm": 2.302170991897583,
+ "learning_rate": 4.595110462509996e-06,
+ "loss": 0.0339,
+ "step": 25371
+ },
+ {
+ "epoch": 69.13351498637603,
+ "grad_norm": 2.4652061462402344,
+ "learning_rate": 4.594367995715905e-06,
+ "loss": 0.1065,
+ "step": 25372
+ },
+ {
+ "epoch": 69.13623978201635,
+ "grad_norm": 2.82228946685791,
+ "learning_rate": 4.593625571020702e-06,
+ "loss": 0.0816,
+ "step": 25373
+ },
+ {
+ "epoch": 69.13896457765668,
+ "grad_norm": 2.334242105484009,
+ "learning_rate": 4.592883188430169e-06,
+ "loss": 0.0354,
+ "step": 25374
+ },
+ {
+ "epoch": 69.141689373297,
+ "grad_norm": 2.4624836444854736,
+ "learning_rate": 4.592140847950085e-06,
+ "loss": 0.0329,
+ "step": 25375
+ },
+ {
+ "epoch": 69.14441416893733,
+ "grad_norm": 2.9783990383148193,
+ "learning_rate": 4.591398549586237e-06,
+ "loss": 0.1948,
+ "step": 25376
+ },
+ {
+ "epoch": 69.14713896457765,
+ "grad_norm": 3.096959114074707,
+ "learning_rate": 4.5906562933444024e-06,
+ "loss": 0.1198,
+ "step": 25377
+ },
+ {
+ "epoch": 69.14986376021798,
+ "grad_norm": 3.8093245029449463,
+ "learning_rate": 4.589914079230363e-06,
+ "loss": 0.0987,
+ "step": 25378
+ },
+ {
+ "epoch": 69.15258855585832,
+ "grad_norm": 2.3881402015686035,
+ "learning_rate": 4.589171907249895e-06,
+ "loss": 0.0416,
+ "step": 25379
+ },
+ {
+ "epoch": 69.15531335149863,
+ "grad_norm": 4.455782413482666,
+ "learning_rate": 4.588429777408785e-06,
+ "loss": 0.1728,
+ "step": 25380
+ },
+ {
+ "epoch": 69.15803814713897,
+ "grad_norm": 9.765618324279785,
+ "learning_rate": 4.587687689712811e-06,
+ "loss": 0.0506,
+ "step": 25381
+ },
+ {
+ "epoch": 69.16076294277929,
+ "grad_norm": 3.4322943687438965,
+ "learning_rate": 4.586945644167751e-06,
+ "loss": 0.0459,
+ "step": 25382
+ },
+ {
+ "epoch": 69.16348773841962,
+ "grad_norm": 4.60107421875,
+ "learning_rate": 4.586203640779379e-06,
+ "loss": 0.188,
+ "step": 25383
+ },
+ {
+ "epoch": 69.16621253405995,
+ "grad_norm": 1.8150352239608765,
+ "learning_rate": 4.5854616795534835e-06,
+ "loss": 0.0265,
+ "step": 25384
+ },
+ {
+ "epoch": 69.16893732970027,
+ "grad_norm": 3.624239444732666,
+ "learning_rate": 4.584719760495838e-06,
+ "loss": 0.0658,
+ "step": 25385
+ },
+ {
+ "epoch": 69.1716621253406,
+ "grad_norm": 2.3626153469085693,
+ "learning_rate": 4.583977883612218e-06,
+ "loss": 0.0668,
+ "step": 25386
+ },
+ {
+ "epoch": 69.17438692098092,
+ "grad_norm": 2.6876978874206543,
+ "learning_rate": 4.583236048908406e-06,
+ "loss": 0.1338,
+ "step": 25387
+ },
+ {
+ "epoch": 69.17711171662125,
+ "grad_norm": 3.021451711654663,
+ "learning_rate": 4.582494256390174e-06,
+ "loss": 0.0364,
+ "step": 25388
+ },
+ {
+ "epoch": 69.17983651226157,
+ "grad_norm": 3.472978353500366,
+ "learning_rate": 4.581752506063306e-06,
+ "loss": 0.0623,
+ "step": 25389
+ },
+ {
+ "epoch": 69.1825613079019,
+ "grad_norm": 3.0560572147369385,
+ "learning_rate": 4.581010797933576e-06,
+ "loss": 0.077,
+ "step": 25390
+ },
+ {
+ "epoch": 69.18528610354224,
+ "grad_norm": 2.9825806617736816,
+ "learning_rate": 4.580269132006755e-06,
+ "loss": 0.0321,
+ "step": 25391
+ },
+ {
+ "epoch": 69.18801089918256,
+ "grad_norm": 3.3844103813171387,
+ "learning_rate": 4.579527508288627e-06,
+ "loss": 0.0364,
+ "step": 25392
+ },
+ {
+ "epoch": 69.19073569482289,
+ "grad_norm": 2.671772003173828,
+ "learning_rate": 4.578785926784966e-06,
+ "loss": 0.0554,
+ "step": 25393
+ },
+ {
+ "epoch": 69.19346049046321,
+ "grad_norm": 2.484617233276367,
+ "learning_rate": 4.578044387501544e-06,
+ "loss": 0.0392,
+ "step": 25394
+ },
+ {
+ "epoch": 69.19618528610354,
+ "grad_norm": 3.5257954597473145,
+ "learning_rate": 4.577302890444134e-06,
+ "loss": 0.0505,
+ "step": 25395
+ },
+ {
+ "epoch": 69.19891008174388,
+ "grad_norm": 3.391948699951172,
+ "learning_rate": 4.57656143561852e-06,
+ "loss": 0.0438,
+ "step": 25396
+ },
+ {
+ "epoch": 69.2016348773842,
+ "grad_norm": 4.001677513122559,
+ "learning_rate": 4.575820023030469e-06,
+ "loss": 0.1583,
+ "step": 25397
+ },
+ {
+ "epoch": 69.20435967302453,
+ "grad_norm": 2.1667492389678955,
+ "learning_rate": 4.575078652685758e-06,
+ "loss": 0.0436,
+ "step": 25398
+ },
+ {
+ "epoch": 69.20708446866485,
+ "grad_norm": 3.1260199546813965,
+ "learning_rate": 4.574337324590156e-06,
+ "loss": 0.1362,
+ "step": 25399
+ },
+ {
+ "epoch": 69.20980926430518,
+ "grad_norm": 2.11391282081604,
+ "learning_rate": 4.573596038749444e-06,
+ "loss": 0.2222,
+ "step": 25400
+ },
+ {
+ "epoch": 69.2125340599455,
+ "grad_norm": 2.815260648727417,
+ "learning_rate": 4.572854795169392e-06,
+ "loss": 0.0791,
+ "step": 25401
+ },
+ {
+ "epoch": 69.21525885558583,
+ "grad_norm": 3.2800514698028564,
+ "learning_rate": 4.572113593855771e-06,
+ "loss": 0.0716,
+ "step": 25402
+ },
+ {
+ "epoch": 69.21798365122616,
+ "grad_norm": 2.0049800872802734,
+ "learning_rate": 4.571372434814352e-06,
+ "loss": 0.0353,
+ "step": 25403
+ },
+ {
+ "epoch": 69.22070844686648,
+ "grad_norm": 4.266651630401611,
+ "learning_rate": 4.570631318050913e-06,
+ "loss": 0.1376,
+ "step": 25404
+ },
+ {
+ "epoch": 69.22343324250681,
+ "grad_norm": 4.971512794494629,
+ "learning_rate": 4.569890243571219e-06,
+ "loss": 0.0445,
+ "step": 25405
+ },
+ {
+ "epoch": 69.22615803814713,
+ "grad_norm": 3.709139347076416,
+ "learning_rate": 4.569149211381049e-06,
+ "loss": 0.0814,
+ "step": 25406
+ },
+ {
+ "epoch": 69.22888283378747,
+ "grad_norm": 3.2884321212768555,
+ "learning_rate": 4.568408221486166e-06,
+ "loss": 0.1194,
+ "step": 25407
+ },
+ {
+ "epoch": 69.2316076294278,
+ "grad_norm": 2.227508306503296,
+ "learning_rate": 4.567667273892349e-06,
+ "loss": 0.0274,
+ "step": 25408
+ },
+ {
+ "epoch": 69.23433242506812,
+ "grad_norm": 3.514317750930786,
+ "learning_rate": 4.566926368605364e-06,
+ "loss": 0.0488,
+ "step": 25409
+ },
+ {
+ "epoch": 69.23705722070845,
+ "grad_norm": 7.666079521179199,
+ "learning_rate": 4.566185505630981e-06,
+ "loss": 0.2268,
+ "step": 25410
+ },
+ {
+ "epoch": 69.23978201634877,
+ "grad_norm": 3.4058709144592285,
+ "learning_rate": 4.565444684974968e-06,
+ "loss": 0.1507,
+ "step": 25411
+ },
+ {
+ "epoch": 69.2425068119891,
+ "grad_norm": 3.5763678550720215,
+ "learning_rate": 4.5647039066431e-06,
+ "loss": 0.0785,
+ "step": 25412
+ },
+ {
+ "epoch": 69.24523160762942,
+ "grad_norm": 2.9784834384918213,
+ "learning_rate": 4.563963170641143e-06,
+ "loss": 0.1684,
+ "step": 25413
+ },
+ {
+ "epoch": 69.24795640326975,
+ "grad_norm": 2.819248676300049,
+ "learning_rate": 4.563222476974866e-06,
+ "loss": 0.1865,
+ "step": 25414
+ },
+ {
+ "epoch": 69.25068119891009,
+ "grad_norm": 3.5395994186401367,
+ "learning_rate": 4.562481825650034e-06,
+ "loss": 0.0434,
+ "step": 25415
+ },
+ {
+ "epoch": 69.2534059945504,
+ "grad_norm": 4.175273418426514,
+ "learning_rate": 4.561741216672422e-06,
+ "loss": 0.0573,
+ "step": 25416
+ },
+ {
+ "epoch": 69.25613079019074,
+ "grad_norm": 3.1356163024902344,
+ "learning_rate": 4.5610006500477935e-06,
+ "loss": 0.0513,
+ "step": 25417
+ },
+ {
+ "epoch": 69.25885558583106,
+ "grad_norm": 2.5869336128234863,
+ "learning_rate": 4.560260125781918e-06,
+ "loss": 0.0385,
+ "step": 25418
+ },
+ {
+ "epoch": 69.26158038147139,
+ "grad_norm": 2.9099714756011963,
+ "learning_rate": 4.559519643880556e-06,
+ "loss": 0.0331,
+ "step": 25419
+ },
+ {
+ "epoch": 69.26430517711172,
+ "grad_norm": 3.585111141204834,
+ "learning_rate": 4.5587792043494865e-06,
+ "loss": 0.095,
+ "step": 25420
+ },
+ {
+ "epoch": 69.26702997275204,
+ "grad_norm": 3.7343595027923584,
+ "learning_rate": 4.558038807194468e-06,
+ "loss": 0.1624,
+ "step": 25421
+ },
+ {
+ "epoch": 69.26975476839237,
+ "grad_norm": 5.514522552490234,
+ "learning_rate": 4.557298452421264e-06,
+ "loss": 0.0472,
+ "step": 25422
+ },
+ {
+ "epoch": 69.2724795640327,
+ "grad_norm": 4.171028137207031,
+ "learning_rate": 4.556558140035648e-06,
+ "loss": 0.1025,
+ "step": 25423
+ },
+ {
+ "epoch": 69.27520435967303,
+ "grad_norm": 3.00070858001709,
+ "learning_rate": 4.555817870043379e-06,
+ "loss": 0.1122,
+ "step": 25424
+ },
+ {
+ "epoch": 69.27792915531334,
+ "grad_norm": 3.1932849884033203,
+ "learning_rate": 4.55507764245023e-06,
+ "loss": 0.0466,
+ "step": 25425
+ },
+ {
+ "epoch": 69.28065395095368,
+ "grad_norm": 3.068021535873413,
+ "learning_rate": 4.554337457261959e-06,
+ "loss": 0.0559,
+ "step": 25426
+ },
+ {
+ "epoch": 69.28337874659401,
+ "grad_norm": 3.2480483055114746,
+ "learning_rate": 4.55359731448433e-06,
+ "loss": 0.0857,
+ "step": 25427
+ },
+ {
+ "epoch": 69.28610354223433,
+ "grad_norm": 3.1276259422302246,
+ "learning_rate": 4.552857214123115e-06,
+ "loss": 0.0659,
+ "step": 25428
+ },
+ {
+ "epoch": 69.28882833787466,
+ "grad_norm": 4.520638942718506,
+ "learning_rate": 4.5521171561840696e-06,
+ "loss": 0.0964,
+ "step": 25429
+ },
+ {
+ "epoch": 69.29155313351498,
+ "grad_norm": 4.583598613739014,
+ "learning_rate": 4.551377140672962e-06,
+ "loss": 0.111,
+ "step": 25430
+ },
+ {
+ "epoch": 69.29427792915531,
+ "grad_norm": 1.993520975112915,
+ "learning_rate": 4.55063716759555e-06,
+ "loss": 0.0574,
+ "step": 25431
+ },
+ {
+ "epoch": 69.29700272479565,
+ "grad_norm": 4.2229790687561035,
+ "learning_rate": 4.549897236957605e-06,
+ "loss": 0.0444,
+ "step": 25432
+ },
+ {
+ "epoch": 69.29972752043597,
+ "grad_norm": 3.21101450920105,
+ "learning_rate": 4.549157348764883e-06,
+ "loss": 0.053,
+ "step": 25433
+ },
+ {
+ "epoch": 69.3024523160763,
+ "grad_norm": 3.129916191101074,
+ "learning_rate": 4.548417503023149e-06,
+ "loss": 0.0939,
+ "step": 25434
+ },
+ {
+ "epoch": 69.30517711171662,
+ "grad_norm": 3.284067153930664,
+ "learning_rate": 4.5476776997381615e-06,
+ "loss": 0.0561,
+ "step": 25435
+ },
+ {
+ "epoch": 69.30790190735695,
+ "grad_norm": 2.7819948196411133,
+ "learning_rate": 4.5469379389156865e-06,
+ "loss": 0.0524,
+ "step": 25436
+ },
+ {
+ "epoch": 69.31062670299727,
+ "grad_norm": 2.6426141262054443,
+ "learning_rate": 4.546198220561484e-06,
+ "loss": 0.061,
+ "step": 25437
+ },
+ {
+ "epoch": 69.3133514986376,
+ "grad_norm": 3.2954511642456055,
+ "learning_rate": 4.545458544681315e-06,
+ "loss": 0.0492,
+ "step": 25438
+ },
+ {
+ "epoch": 69.31607629427793,
+ "grad_norm": 3.160815954208374,
+ "learning_rate": 4.544718911280934e-06,
+ "loss": 0.1001,
+ "step": 25439
+ },
+ {
+ "epoch": 69.31880108991825,
+ "grad_norm": 3.6648552417755127,
+ "learning_rate": 4.5439793203661075e-06,
+ "loss": 0.066,
+ "step": 25440
+ },
+ {
+ "epoch": 69.32152588555859,
+ "grad_norm": 2.691915273666382,
+ "learning_rate": 4.543239771942599e-06,
+ "loss": 0.0614,
+ "step": 25441
+ },
+ {
+ "epoch": 69.3242506811989,
+ "grad_norm": 4.521756172180176,
+ "learning_rate": 4.542500266016162e-06,
+ "loss": 0.1956,
+ "step": 25442
+ },
+ {
+ "epoch": 69.32697547683924,
+ "grad_norm": 2.222311496734619,
+ "learning_rate": 4.541760802592558e-06,
+ "loss": 0.0263,
+ "step": 25443
+ },
+ {
+ "epoch": 69.32970027247957,
+ "grad_norm": 3.0697567462921143,
+ "learning_rate": 4.541021381677541e-06,
+ "loss": 0.1766,
+ "step": 25444
+ },
+ {
+ "epoch": 69.33242506811989,
+ "grad_norm": 3.325167417526245,
+ "learning_rate": 4.540282003276879e-06,
+ "loss": 0.1471,
+ "step": 25445
+ },
+ {
+ "epoch": 69.33514986376022,
+ "grad_norm": 2.820826292037964,
+ "learning_rate": 4.5395426673963235e-06,
+ "loss": 0.1574,
+ "step": 25446
+ },
+ {
+ "epoch": 69.33787465940054,
+ "grad_norm": 2.6701645851135254,
+ "learning_rate": 4.5388033740416344e-06,
+ "loss": 0.059,
+ "step": 25447
+ },
+ {
+ "epoch": 69.34059945504087,
+ "grad_norm": 3.161954164505005,
+ "learning_rate": 4.538064123218565e-06,
+ "loss": 0.0481,
+ "step": 25448
+ },
+ {
+ "epoch": 69.34332425068119,
+ "grad_norm": 3.1632397174835205,
+ "learning_rate": 4.53732491493288e-06,
+ "loss": 0.1351,
+ "step": 25449
+ },
+ {
+ "epoch": 69.34604904632153,
+ "grad_norm": 2.487396240234375,
+ "learning_rate": 4.536585749190334e-06,
+ "loss": 0.0715,
+ "step": 25450
+ },
+ {
+ "epoch": 69.34877384196186,
+ "grad_norm": 4.762503147125244,
+ "learning_rate": 4.535846625996677e-06,
+ "loss": 0.0933,
+ "step": 25451
+ },
+ {
+ "epoch": 69.35149863760218,
+ "grad_norm": 2.5551226139068604,
+ "learning_rate": 4.5351075453576755e-06,
+ "loss": 0.1213,
+ "step": 25452
+ },
+ {
+ "epoch": 69.35422343324251,
+ "grad_norm": 3.0940890312194824,
+ "learning_rate": 4.53436850727908e-06,
+ "loss": 0.0664,
+ "step": 25453
+ },
+ {
+ "epoch": 69.35694822888283,
+ "grad_norm": 3.4480948448181152,
+ "learning_rate": 4.533629511766646e-06,
+ "loss": 0.176,
+ "step": 25454
+ },
+ {
+ "epoch": 69.35967302452316,
+ "grad_norm": 3.455458164215088,
+ "learning_rate": 4.5328905588261274e-06,
+ "loss": 0.0783,
+ "step": 25455
+ },
+ {
+ "epoch": 69.3623978201635,
+ "grad_norm": 2.989150047302246,
+ "learning_rate": 4.53215164846328e-06,
+ "loss": 0.0788,
+ "step": 25456
+ },
+ {
+ "epoch": 69.36512261580381,
+ "grad_norm": 3.5107991695404053,
+ "learning_rate": 4.531412780683864e-06,
+ "loss": 0.128,
+ "step": 25457
+ },
+ {
+ "epoch": 69.36784741144415,
+ "grad_norm": 2.281085729598999,
+ "learning_rate": 4.530673955493629e-06,
+ "loss": 0.0885,
+ "step": 25458
+ },
+ {
+ "epoch": 69.37057220708446,
+ "grad_norm": 2.156769037246704,
+ "learning_rate": 4.529935172898327e-06,
+ "loss": 0.0369,
+ "step": 25459
+ },
+ {
+ "epoch": 69.3732970027248,
+ "grad_norm": 3.0936028957366943,
+ "learning_rate": 4.529196432903713e-06,
+ "loss": 0.0468,
+ "step": 25460
+ },
+ {
+ "epoch": 69.37602179836512,
+ "grad_norm": 2.3070435523986816,
+ "learning_rate": 4.528457735515544e-06,
+ "loss": 0.0441,
+ "step": 25461
+ },
+ {
+ "epoch": 69.37874659400545,
+ "grad_norm": 5.0418925285339355,
+ "learning_rate": 4.5277190807395695e-06,
+ "loss": 0.0459,
+ "step": 25462
+ },
+ {
+ "epoch": 69.38147138964578,
+ "grad_norm": 4.551960468292236,
+ "learning_rate": 4.526980468581543e-06,
+ "loss": 0.0971,
+ "step": 25463
+ },
+ {
+ "epoch": 69.3841961852861,
+ "grad_norm": 2.7737889289855957,
+ "learning_rate": 4.526241899047213e-06,
+ "loss": 0.038,
+ "step": 25464
+ },
+ {
+ "epoch": 69.38692098092643,
+ "grad_norm": 2.7282233238220215,
+ "learning_rate": 4.525503372142339e-06,
+ "loss": 0.0535,
+ "step": 25465
+ },
+ {
+ "epoch": 69.38964577656675,
+ "grad_norm": 2.7730906009674072,
+ "learning_rate": 4.524764887872668e-06,
+ "loss": 0.0842,
+ "step": 25466
+ },
+ {
+ "epoch": 69.39237057220708,
+ "grad_norm": 2.8168158531188965,
+ "learning_rate": 4.524026446243952e-06,
+ "loss": 0.0758,
+ "step": 25467
+ },
+ {
+ "epoch": 69.39509536784742,
+ "grad_norm": 3.4718661308288574,
+ "learning_rate": 4.523288047261938e-06,
+ "loss": 0.1124,
+ "step": 25468
+ },
+ {
+ "epoch": 69.39782016348774,
+ "grad_norm": 3.580873966217041,
+ "learning_rate": 4.522549690932384e-06,
+ "loss": 0.1165,
+ "step": 25469
+ },
+ {
+ "epoch": 69.40054495912807,
+ "grad_norm": 2.9290521144866943,
+ "learning_rate": 4.521811377261036e-06,
+ "loss": 0.0466,
+ "step": 25470
+ },
+ {
+ "epoch": 69.40326975476839,
+ "grad_norm": 3.4112048149108887,
+ "learning_rate": 4.521073106253643e-06,
+ "loss": 0.048,
+ "step": 25471
+ },
+ {
+ "epoch": 69.40599455040872,
+ "grad_norm": 2.107800006866455,
+ "learning_rate": 4.5203348779159585e-06,
+ "loss": 0.0748,
+ "step": 25472
+ },
+ {
+ "epoch": 69.40871934604904,
+ "grad_norm": 3.148745059967041,
+ "learning_rate": 4.51959669225373e-06,
+ "loss": 0.057,
+ "step": 25473
+ },
+ {
+ "epoch": 69.41144414168937,
+ "grad_norm": 4.197068691253662,
+ "learning_rate": 4.518858549272702e-06,
+ "loss": 0.0384,
+ "step": 25474
+ },
+ {
+ "epoch": 69.4141689373297,
+ "grad_norm": 4.478817462921143,
+ "learning_rate": 4.518120448978631e-06,
+ "loss": 0.058,
+ "step": 25475
+ },
+ {
+ "epoch": 69.41689373297002,
+ "grad_norm": 3.8297202587127686,
+ "learning_rate": 4.517382391377258e-06,
+ "loss": 0.0664,
+ "step": 25476
+ },
+ {
+ "epoch": 69.41961852861036,
+ "grad_norm": 4.742251873016357,
+ "learning_rate": 4.516644376474339e-06,
+ "loss": 0.1049,
+ "step": 25477
+ },
+ {
+ "epoch": 69.42234332425068,
+ "grad_norm": 2.337071180343628,
+ "learning_rate": 4.515906404275615e-06,
+ "loss": 0.0331,
+ "step": 25478
+ },
+ {
+ "epoch": 69.42506811989101,
+ "grad_norm": 3.4373509883880615,
+ "learning_rate": 4.515168474786837e-06,
+ "loss": 0.0445,
+ "step": 25479
+ },
+ {
+ "epoch": 69.42779291553134,
+ "grad_norm": 3.0513668060302734,
+ "learning_rate": 4.514430588013746e-06,
+ "loss": 0.1766,
+ "step": 25480
+ },
+ {
+ "epoch": 69.43051771117166,
+ "grad_norm": 3.0420408248901367,
+ "learning_rate": 4.513692743962097e-06,
+ "loss": 0.0719,
+ "step": 25481
+ },
+ {
+ "epoch": 69.433242506812,
+ "grad_norm": 2.7636256217956543,
+ "learning_rate": 4.512954942637633e-06,
+ "loss": 0.0361,
+ "step": 25482
+ },
+ {
+ "epoch": 69.43596730245231,
+ "grad_norm": 2.655750036239624,
+ "learning_rate": 4.512217184046098e-06,
+ "loss": 0.0628,
+ "step": 25483
+ },
+ {
+ "epoch": 69.43869209809264,
+ "grad_norm": 2.935687780380249,
+ "learning_rate": 4.511479468193236e-06,
+ "loss": 0.1653,
+ "step": 25484
+ },
+ {
+ "epoch": 69.44141689373296,
+ "grad_norm": 2.878584623336792,
+ "learning_rate": 4.5107417950848e-06,
+ "loss": 0.0874,
+ "step": 25485
+ },
+ {
+ "epoch": 69.4441416893733,
+ "grad_norm": 3.644692897796631,
+ "learning_rate": 4.510004164726529e-06,
+ "loss": 0.2839,
+ "step": 25486
+ },
+ {
+ "epoch": 69.44686648501363,
+ "grad_norm": 2.3344852924346924,
+ "learning_rate": 4.509266577124169e-06,
+ "loss": 0.0359,
+ "step": 25487
+ },
+ {
+ "epoch": 69.44959128065395,
+ "grad_norm": 2.944648265838623,
+ "learning_rate": 4.508529032283461e-06,
+ "loss": 0.0493,
+ "step": 25488
+ },
+ {
+ "epoch": 69.45231607629428,
+ "grad_norm": 3.3743457794189453,
+ "learning_rate": 4.507791530210155e-06,
+ "loss": 0.074,
+ "step": 25489
+ },
+ {
+ "epoch": 69.4550408719346,
+ "grad_norm": 2.828557252883911,
+ "learning_rate": 4.507054070909992e-06,
+ "loss": 0.0324,
+ "step": 25490
+ },
+ {
+ "epoch": 69.45776566757493,
+ "grad_norm": 2.988844871520996,
+ "learning_rate": 4.506316654388712e-06,
+ "loss": 0.0744,
+ "step": 25491
+ },
+ {
+ "epoch": 69.46049046321527,
+ "grad_norm": 3.0800795555114746,
+ "learning_rate": 4.50557928065206e-06,
+ "loss": 0.0557,
+ "step": 25492
+ },
+ {
+ "epoch": 69.46321525885558,
+ "grad_norm": 3.5992672443389893,
+ "learning_rate": 4.5048419497057835e-06,
+ "loss": 0.0938,
+ "step": 25493
+ },
+ {
+ "epoch": 69.46594005449592,
+ "grad_norm": 4.743727684020996,
+ "learning_rate": 4.504104661555623e-06,
+ "loss": 0.056,
+ "step": 25494
+ },
+ {
+ "epoch": 69.46866485013624,
+ "grad_norm": 3.1263489723205566,
+ "learning_rate": 4.503367416207316e-06,
+ "loss": 0.0294,
+ "step": 25495
+ },
+ {
+ "epoch": 69.47138964577657,
+ "grad_norm": 4.683835506439209,
+ "learning_rate": 4.502630213666605e-06,
+ "loss": 0.0782,
+ "step": 25496
+ },
+ {
+ "epoch": 69.47411444141689,
+ "grad_norm": 2.891843557357788,
+ "learning_rate": 4.501893053939236e-06,
+ "loss": 0.0497,
+ "step": 25497
+ },
+ {
+ "epoch": 69.47683923705722,
+ "grad_norm": 3.1541855335235596,
+ "learning_rate": 4.501155937030946e-06,
+ "loss": 0.0846,
+ "step": 25498
+ },
+ {
+ "epoch": 69.47956403269755,
+ "grad_norm": 3.3001279830932617,
+ "learning_rate": 4.500418862947478e-06,
+ "loss": 0.0539,
+ "step": 25499
+ },
+ {
+ "epoch": 69.48228882833787,
+ "grad_norm": 2.4647982120513916,
+ "learning_rate": 4.4996818316945655e-06,
+ "loss": 0.0347,
+ "step": 25500
+ },
+ {
+ "epoch": 69.4850136239782,
+ "grad_norm": 6.2668609619140625,
+ "learning_rate": 4.498944843277959e-06,
+ "loss": 0.112,
+ "step": 25501
+ },
+ {
+ "epoch": 69.48773841961852,
+ "grad_norm": 4.0989203453063965,
+ "learning_rate": 4.498207897703393e-06,
+ "loss": 0.0499,
+ "step": 25502
+ },
+ {
+ "epoch": 69.49046321525886,
+ "grad_norm": 3.043545961380005,
+ "learning_rate": 4.497470994976606e-06,
+ "loss": 0.1422,
+ "step": 25503
+ },
+ {
+ "epoch": 69.49318801089919,
+ "grad_norm": 2.963949680328369,
+ "learning_rate": 4.496734135103334e-06,
+ "loss": 0.1138,
+ "step": 25504
+ },
+ {
+ "epoch": 69.49591280653951,
+ "grad_norm": 2.8195641040802,
+ "learning_rate": 4.4959973180893235e-06,
+ "loss": 0.0539,
+ "step": 25505
+ },
+ {
+ "epoch": 69.49863760217984,
+ "grad_norm": 3.33978533744812,
+ "learning_rate": 4.49526054394031e-06,
+ "loss": 0.0545,
+ "step": 25506
+ },
+ {
+ "epoch": 69.50136239782016,
+ "grad_norm": 2.9912805557250977,
+ "learning_rate": 4.4945238126620286e-06,
+ "loss": 0.0379,
+ "step": 25507
+ },
+ {
+ "epoch": 69.50408719346049,
+ "grad_norm": 4.629179000854492,
+ "learning_rate": 4.493787124260215e-06,
+ "loss": 0.054,
+ "step": 25508
+ },
+ {
+ "epoch": 69.50681198910081,
+ "grad_norm": 4.750308036804199,
+ "learning_rate": 4.49305047874061e-06,
+ "loss": 0.1869,
+ "step": 25509
+ },
+ {
+ "epoch": 69.50953678474114,
+ "grad_norm": 3.1100518703460693,
+ "learning_rate": 4.492313876108955e-06,
+ "loss": 0.0395,
+ "step": 25510
+ },
+ {
+ "epoch": 69.51226158038148,
+ "grad_norm": 3.0238888263702393,
+ "learning_rate": 4.491577316370982e-06,
+ "loss": 0.0413,
+ "step": 25511
+ },
+ {
+ "epoch": 69.5149863760218,
+ "grad_norm": 3.627363681793213,
+ "learning_rate": 4.490840799532428e-06,
+ "loss": 0.1171,
+ "step": 25512
+ },
+ {
+ "epoch": 69.51771117166213,
+ "grad_norm": 3.2774410247802734,
+ "learning_rate": 4.490104325599024e-06,
+ "loss": 0.0684,
+ "step": 25513
+ },
+ {
+ "epoch": 69.52043596730245,
+ "grad_norm": 3.144773483276367,
+ "learning_rate": 4.489367894576514e-06,
+ "loss": 0.0516,
+ "step": 25514
+ },
+ {
+ "epoch": 69.52316076294278,
+ "grad_norm": 4.020216464996338,
+ "learning_rate": 4.4886315064706295e-06,
+ "loss": 0.1232,
+ "step": 25515
+ },
+ {
+ "epoch": 69.52588555858311,
+ "grad_norm": 3.6075801849365234,
+ "learning_rate": 4.487895161287102e-06,
+ "loss": 0.0765,
+ "step": 25516
+ },
+ {
+ "epoch": 69.52861035422343,
+ "grad_norm": 3.4577956199645996,
+ "learning_rate": 4.487158859031674e-06,
+ "loss": 0.0423,
+ "step": 25517
+ },
+ {
+ "epoch": 69.53133514986376,
+ "grad_norm": 4.301992893218994,
+ "learning_rate": 4.486422599710074e-06,
+ "loss": 0.1098,
+ "step": 25518
+ },
+ {
+ "epoch": 69.53405994550408,
+ "grad_norm": 2.895936965942383,
+ "learning_rate": 4.4856863833280384e-06,
+ "loss": 0.0528,
+ "step": 25519
+ },
+ {
+ "epoch": 69.53678474114442,
+ "grad_norm": 2.136328935623169,
+ "learning_rate": 4.484950209891296e-06,
+ "loss": 0.035,
+ "step": 25520
+ },
+ {
+ "epoch": 69.53950953678473,
+ "grad_norm": 4.753259658813477,
+ "learning_rate": 4.484214079405587e-06,
+ "loss": 0.1188,
+ "step": 25521
+ },
+ {
+ "epoch": 69.54223433242507,
+ "grad_norm": 3.827326536178589,
+ "learning_rate": 4.483477991876642e-06,
+ "loss": 0.1702,
+ "step": 25522
+ },
+ {
+ "epoch": 69.5449591280654,
+ "grad_norm": 3.497188091278076,
+ "learning_rate": 4.482741947310192e-06,
+ "loss": 0.088,
+ "step": 25523
+ },
+ {
+ "epoch": 69.54768392370572,
+ "grad_norm": 6.807163715362549,
+ "learning_rate": 4.482005945711965e-06,
+ "loss": 0.1857,
+ "step": 25524
+ },
+ {
+ "epoch": 69.55040871934605,
+ "grad_norm": 3.836564540863037,
+ "learning_rate": 4.4812699870877e-06,
+ "loss": 0.0589,
+ "step": 25525
+ },
+ {
+ "epoch": 69.55313351498637,
+ "grad_norm": 48.24660110473633,
+ "learning_rate": 4.480534071443131e-06,
+ "loss": 0.1138,
+ "step": 25526
+ },
+ {
+ "epoch": 69.5558583106267,
+ "grad_norm": 3.2530205249786377,
+ "learning_rate": 4.479798198783984e-06,
+ "loss": 0.0359,
+ "step": 25527
+ },
+ {
+ "epoch": 69.55858310626704,
+ "grad_norm": 3.3195722103118896,
+ "learning_rate": 4.479062369115992e-06,
+ "loss": 0.0471,
+ "step": 25528
+ },
+ {
+ "epoch": 69.56130790190736,
+ "grad_norm": 3.158198356628418,
+ "learning_rate": 4.4783265824448795e-06,
+ "loss": 0.0878,
+ "step": 25529
+ },
+ {
+ "epoch": 69.56403269754769,
+ "grad_norm": 2.6671762466430664,
+ "learning_rate": 4.477590838776386e-06,
+ "loss": 0.0351,
+ "step": 25530
+ },
+ {
+ "epoch": 69.566757493188,
+ "grad_norm": 3.4229178428649902,
+ "learning_rate": 4.4768551381162375e-06,
+ "loss": 0.1534,
+ "step": 25531
+ },
+ {
+ "epoch": 69.56948228882834,
+ "grad_norm": 7.585022926330566,
+ "learning_rate": 4.476119480470163e-06,
+ "loss": 0.1878,
+ "step": 25532
+ },
+ {
+ "epoch": 69.57220708446866,
+ "grad_norm": 3.3582346439361572,
+ "learning_rate": 4.475383865843889e-06,
+ "loss": 0.0483,
+ "step": 25533
+ },
+ {
+ "epoch": 69.57493188010899,
+ "grad_norm": 3.0538430213928223,
+ "learning_rate": 4.474648294243151e-06,
+ "loss": 0.2468,
+ "step": 25534
+ },
+ {
+ "epoch": 69.57765667574932,
+ "grad_norm": 5.0180792808532715,
+ "learning_rate": 4.473912765673676e-06,
+ "loss": 0.1554,
+ "step": 25535
+ },
+ {
+ "epoch": 69.58038147138964,
+ "grad_norm": 2.2239420413970947,
+ "learning_rate": 4.473177280141185e-06,
+ "loss": 0.0411,
+ "step": 25536
+ },
+ {
+ "epoch": 69.58310626702998,
+ "grad_norm": 2.517350435256958,
+ "learning_rate": 4.4724418376514155e-06,
+ "loss": 0.132,
+ "step": 25537
+ },
+ {
+ "epoch": 69.5858310626703,
+ "grad_norm": 3.0453567504882812,
+ "learning_rate": 4.47170643821009e-06,
+ "loss": 0.0819,
+ "step": 25538
+ },
+ {
+ "epoch": 69.58855585831063,
+ "grad_norm": 2.4413506984710693,
+ "learning_rate": 4.470971081822938e-06,
+ "loss": 0.0421,
+ "step": 25539
+ },
+ {
+ "epoch": 69.59128065395096,
+ "grad_norm": 4.459550857543945,
+ "learning_rate": 4.470235768495682e-06,
+ "loss": 0.1374,
+ "step": 25540
+ },
+ {
+ "epoch": 69.59400544959128,
+ "grad_norm": 3.1329100131988525,
+ "learning_rate": 4.469500498234055e-06,
+ "loss": 0.0528,
+ "step": 25541
+ },
+ {
+ "epoch": 69.59673024523161,
+ "grad_norm": 2.6712231636047363,
+ "learning_rate": 4.468765271043777e-06,
+ "loss": 0.0397,
+ "step": 25542
+ },
+ {
+ "epoch": 69.59945504087193,
+ "grad_norm": 3.0572385787963867,
+ "learning_rate": 4.4680300869305795e-06,
+ "loss": 0.0921,
+ "step": 25543
+ },
+ {
+ "epoch": 69.60217983651226,
+ "grad_norm": 2.4251370429992676,
+ "learning_rate": 4.467294945900186e-06,
+ "loss": 0.0479,
+ "step": 25544
+ },
+ {
+ "epoch": 69.60490463215258,
+ "grad_norm": 2.989567279815674,
+ "learning_rate": 4.466559847958318e-06,
+ "loss": 0.1138,
+ "step": 25545
+ },
+ {
+ "epoch": 69.60762942779292,
+ "grad_norm": 3.232569456100464,
+ "learning_rate": 4.465824793110708e-06,
+ "loss": 0.1992,
+ "step": 25546
+ },
+ {
+ "epoch": 69.61035422343325,
+ "grad_norm": 4.112090110778809,
+ "learning_rate": 4.4650897813630755e-06,
+ "loss": 0.0689,
+ "step": 25547
+ },
+ {
+ "epoch": 69.61307901907357,
+ "grad_norm": 2.628995895385742,
+ "learning_rate": 4.464354812721147e-06,
+ "loss": 0.0612,
+ "step": 25548
+ },
+ {
+ "epoch": 69.6158038147139,
+ "grad_norm": 3.160435199737549,
+ "learning_rate": 4.46361988719064e-06,
+ "loss": 0.0529,
+ "step": 25549
+ },
+ {
+ "epoch": 69.61852861035422,
+ "grad_norm": 3.192359685897827,
+ "learning_rate": 4.462885004777287e-06,
+ "loss": 0.1992,
+ "step": 25550
+ },
+ {
+ "epoch": 69.62125340599455,
+ "grad_norm": 4.834630966186523,
+ "learning_rate": 4.462150165486807e-06,
+ "loss": 0.0504,
+ "step": 25551
+ },
+ {
+ "epoch": 69.62397820163488,
+ "grad_norm": 3.1146316528320312,
+ "learning_rate": 4.461415369324924e-06,
+ "loss": 0.1613,
+ "step": 25552
+ },
+ {
+ "epoch": 69.6267029972752,
+ "grad_norm": 3.7600176334381104,
+ "learning_rate": 4.460680616297356e-06,
+ "loss": 0.1573,
+ "step": 25553
+ },
+ {
+ "epoch": 69.62942779291554,
+ "grad_norm": 3.2461941242218018,
+ "learning_rate": 4.459945906409832e-06,
+ "loss": 0.1423,
+ "step": 25554
+ },
+ {
+ "epoch": 69.63215258855585,
+ "grad_norm": 3.6472384929656982,
+ "learning_rate": 4.459211239668073e-06,
+ "loss": 0.0822,
+ "step": 25555
+ },
+ {
+ "epoch": 69.63487738419619,
+ "grad_norm": 2.415484666824341,
+ "learning_rate": 4.458476616077797e-06,
+ "loss": 0.1135,
+ "step": 25556
+ },
+ {
+ "epoch": 69.6376021798365,
+ "grad_norm": 17.882747650146484,
+ "learning_rate": 4.457742035644723e-06,
+ "loss": 0.1495,
+ "step": 25557
+ },
+ {
+ "epoch": 69.64032697547684,
+ "grad_norm": 3.5511679649353027,
+ "learning_rate": 4.4570074983745806e-06,
+ "loss": 0.1856,
+ "step": 25558
+ },
+ {
+ "epoch": 69.64305177111717,
+ "grad_norm": 4.503655433654785,
+ "learning_rate": 4.456273004273084e-06,
+ "loss": 0.0797,
+ "step": 25559
+ },
+ {
+ "epoch": 69.64577656675749,
+ "grad_norm": 2.438267469406128,
+ "learning_rate": 4.4555385533459515e-06,
+ "loss": 0.1115,
+ "step": 25560
+ },
+ {
+ "epoch": 69.64850136239782,
+ "grad_norm": 3.1369853019714355,
+ "learning_rate": 4.454804145598907e-06,
+ "loss": 0.1224,
+ "step": 25561
+ },
+ {
+ "epoch": 69.65122615803814,
+ "grad_norm": 3.708622455596924,
+ "learning_rate": 4.4540697810376724e-06,
+ "loss": 0.1498,
+ "step": 25562
+ },
+ {
+ "epoch": 69.65395095367847,
+ "grad_norm": 3.237105131149292,
+ "learning_rate": 4.453335459667964e-06,
+ "loss": 0.0391,
+ "step": 25563
+ },
+ {
+ "epoch": 69.65667574931881,
+ "grad_norm": 3.6461849212646484,
+ "learning_rate": 4.4526011814955e-06,
+ "loss": 0.046,
+ "step": 25564
+ },
+ {
+ "epoch": 69.65940054495913,
+ "grad_norm": 2.78324031829834,
+ "learning_rate": 4.451866946525997e-06,
+ "loss": 0.0709,
+ "step": 25565
+ },
+ {
+ "epoch": 69.66212534059946,
+ "grad_norm": 3.4655065536499023,
+ "learning_rate": 4.451132754765179e-06,
+ "loss": 0.1083,
+ "step": 25566
+ },
+ {
+ "epoch": 69.66485013623978,
+ "grad_norm": 3.751417875289917,
+ "learning_rate": 4.450398606218759e-06,
+ "loss": 0.1404,
+ "step": 25567
+ },
+ {
+ "epoch": 69.66757493188011,
+ "grad_norm": 2.905965566635132,
+ "learning_rate": 4.449664500892456e-06,
+ "loss": 0.154,
+ "step": 25568
+ },
+ {
+ "epoch": 69.67029972752043,
+ "grad_norm": 3.733325481414795,
+ "learning_rate": 4.448930438791986e-06,
+ "loss": 0.1691,
+ "step": 25569
+ },
+ {
+ "epoch": 69.67302452316076,
+ "grad_norm": 2.9593799114227295,
+ "learning_rate": 4.448196419923068e-06,
+ "loss": 0.0616,
+ "step": 25570
+ },
+ {
+ "epoch": 69.6757493188011,
+ "grad_norm": 3.1292717456817627,
+ "learning_rate": 4.447462444291421e-06,
+ "loss": 0.0477,
+ "step": 25571
+ },
+ {
+ "epoch": 69.67847411444141,
+ "grad_norm": 2.4466569423675537,
+ "learning_rate": 4.446728511902755e-06,
+ "loss": 0.0267,
+ "step": 25572
+ },
+ {
+ "epoch": 69.68119891008175,
+ "grad_norm": 3.170085906982422,
+ "learning_rate": 4.445994622762786e-06,
+ "loss": 0.0603,
+ "step": 25573
+ },
+ {
+ "epoch": 69.68392370572207,
+ "grad_norm": 3.642721652984619,
+ "learning_rate": 4.445260776877235e-06,
+ "loss": 0.1093,
+ "step": 25574
+ },
+ {
+ "epoch": 69.6866485013624,
+ "grad_norm": 2.6193416118621826,
+ "learning_rate": 4.444526974251815e-06,
+ "loss": 0.1013,
+ "step": 25575
+ },
+ {
+ "epoch": 69.68937329700273,
+ "grad_norm": 2.3695764541625977,
+ "learning_rate": 4.443793214892241e-06,
+ "loss": 0.1401,
+ "step": 25576
+ },
+ {
+ "epoch": 69.69209809264305,
+ "grad_norm": 2.5913591384887695,
+ "learning_rate": 4.443059498804217e-06,
+ "loss": 0.0389,
+ "step": 25577
+ },
+ {
+ "epoch": 69.69482288828338,
+ "grad_norm": 2.943362236022949,
+ "learning_rate": 4.442325825993475e-06,
+ "loss": 0.1036,
+ "step": 25578
+ },
+ {
+ "epoch": 69.6975476839237,
+ "grad_norm": 3.2677478790283203,
+ "learning_rate": 4.441592196465722e-06,
+ "loss": 0.1509,
+ "step": 25579
+ },
+ {
+ "epoch": 69.70027247956403,
+ "grad_norm": 4.0697503089904785,
+ "learning_rate": 4.440858610226668e-06,
+ "loss": 0.0494,
+ "step": 25580
+ },
+ {
+ "epoch": 69.70299727520435,
+ "grad_norm": 2.5456671714782715,
+ "learning_rate": 4.440125067282026e-06,
+ "loss": 0.1437,
+ "step": 25581
+ },
+ {
+ "epoch": 69.70572207084469,
+ "grad_norm": 2.466583251953125,
+ "learning_rate": 4.439391567637514e-06,
+ "loss": 0.0759,
+ "step": 25582
+ },
+ {
+ "epoch": 69.70844686648502,
+ "grad_norm": 3.052860736846924,
+ "learning_rate": 4.438658111298842e-06,
+ "loss": 0.0524,
+ "step": 25583
+ },
+ {
+ "epoch": 69.71117166212534,
+ "grad_norm": 5.271154880523682,
+ "learning_rate": 4.437924698271721e-06,
+ "loss": 0.0925,
+ "step": 25584
+ },
+ {
+ "epoch": 69.71389645776567,
+ "grad_norm": 3.734518051147461,
+ "learning_rate": 4.437191328561861e-06,
+ "loss": 0.1157,
+ "step": 25585
+ },
+ {
+ "epoch": 69.71662125340599,
+ "grad_norm": 2.750703811645508,
+ "learning_rate": 4.436458002174978e-06,
+ "loss": 0.1127,
+ "step": 25586
+ },
+ {
+ "epoch": 69.71934604904632,
+ "grad_norm": 2.8358259201049805,
+ "learning_rate": 4.435724719116781e-06,
+ "loss": 0.1227,
+ "step": 25587
+ },
+ {
+ "epoch": 69.72207084468666,
+ "grad_norm": 3.0903167724609375,
+ "learning_rate": 4.434991479392983e-06,
+ "loss": 0.0764,
+ "step": 25588
+ },
+ {
+ "epoch": 69.72479564032697,
+ "grad_norm": 3.4187843799591064,
+ "learning_rate": 4.434258283009287e-06,
+ "loss": 0.0634,
+ "step": 25589
+ },
+ {
+ "epoch": 69.7275204359673,
+ "grad_norm": 3.107501745223999,
+ "learning_rate": 4.433525129971412e-06,
+ "loss": 0.028,
+ "step": 25590
+ },
+ {
+ "epoch": 69.73024523160763,
+ "grad_norm": 8.434030532836914,
+ "learning_rate": 4.432792020285065e-06,
+ "loss": 0.0943,
+ "step": 25591
+ },
+ {
+ "epoch": 69.73297002724796,
+ "grad_norm": 2.6484265327453613,
+ "learning_rate": 4.432058953955954e-06,
+ "loss": 0.0498,
+ "step": 25592
+ },
+ {
+ "epoch": 69.73569482288828,
+ "grad_norm": 4.696080684661865,
+ "learning_rate": 4.4313259309897835e-06,
+ "loss": 0.1324,
+ "step": 25593
+ },
+ {
+ "epoch": 69.73841961852861,
+ "grad_norm": 3.7561469078063965,
+ "learning_rate": 4.430592951392269e-06,
+ "loss": 0.1034,
+ "step": 25594
+ },
+ {
+ "epoch": 69.74114441416894,
+ "grad_norm": 3.9254508018493652,
+ "learning_rate": 4.42986001516912e-06,
+ "loss": 0.1331,
+ "step": 25595
+ },
+ {
+ "epoch": 69.74386920980926,
+ "grad_norm": 3.06659197807312,
+ "learning_rate": 4.429127122326044e-06,
+ "loss": 0.042,
+ "step": 25596
+ },
+ {
+ "epoch": 69.7465940054496,
+ "grad_norm": 3.235938787460327,
+ "learning_rate": 4.428394272868746e-06,
+ "loss": 0.06,
+ "step": 25597
+ },
+ {
+ "epoch": 69.74931880108991,
+ "grad_norm": 4.666807651519775,
+ "learning_rate": 4.427661466802929e-06,
+ "loss": 0.0695,
+ "step": 25598
+ },
+ {
+ "epoch": 69.75204359673025,
+ "grad_norm": 3.2119932174682617,
+ "learning_rate": 4.4269287041343105e-06,
+ "loss": 0.0961,
+ "step": 25599
+ },
+ {
+ "epoch": 69.75476839237058,
+ "grad_norm": 2.497992753982544,
+ "learning_rate": 4.42619598486859e-06,
+ "loss": 0.0415,
+ "step": 25600
+ },
+ {
+ "epoch": 69.7574931880109,
+ "grad_norm": 3.476628303527832,
+ "learning_rate": 4.425463309011473e-06,
+ "loss": 0.1269,
+ "step": 25601
+ },
+ {
+ "epoch": 69.76021798365123,
+ "grad_norm": 2.7838804721832275,
+ "learning_rate": 4.4247306765686726e-06,
+ "loss": 0.0975,
+ "step": 25602
+ },
+ {
+ "epoch": 69.76294277929155,
+ "grad_norm": 3.8740968704223633,
+ "learning_rate": 4.42399808754589e-06,
+ "loss": 0.0683,
+ "step": 25603
+ },
+ {
+ "epoch": 69.76566757493188,
+ "grad_norm": 3.0945353507995605,
+ "learning_rate": 4.42326554194883e-06,
+ "loss": 0.1353,
+ "step": 25604
+ },
+ {
+ "epoch": 69.7683923705722,
+ "grad_norm": 2.226154088973999,
+ "learning_rate": 4.422533039783196e-06,
+ "loss": 0.0273,
+ "step": 25605
+ },
+ {
+ "epoch": 69.77111716621253,
+ "grad_norm": 4.142420768737793,
+ "learning_rate": 4.421800581054698e-06,
+ "loss": 0.1002,
+ "step": 25606
+ },
+ {
+ "epoch": 69.77384196185287,
+ "grad_norm": 3.0412681102752686,
+ "learning_rate": 4.421068165769038e-06,
+ "loss": 0.0761,
+ "step": 25607
+ },
+ {
+ "epoch": 69.77656675749319,
+ "grad_norm": 3.305342435836792,
+ "learning_rate": 4.420335793931919e-06,
+ "loss": 0.0297,
+ "step": 25608
+ },
+ {
+ "epoch": 69.77929155313352,
+ "grad_norm": 3.126786708831787,
+ "learning_rate": 4.419603465549042e-06,
+ "loss": 0.0981,
+ "step": 25609
+ },
+ {
+ "epoch": 69.78201634877384,
+ "grad_norm": 2.439060688018799,
+ "learning_rate": 4.418871180626118e-06,
+ "loss": 0.0776,
+ "step": 25610
+ },
+ {
+ "epoch": 69.78474114441417,
+ "grad_norm": 3.507622003555298,
+ "learning_rate": 4.41813893916884e-06,
+ "loss": 0.0572,
+ "step": 25611
+ },
+ {
+ "epoch": 69.7874659400545,
+ "grad_norm": 1.6027233600616455,
+ "learning_rate": 4.417406741182921e-06,
+ "loss": 0.0211,
+ "step": 25612
+ },
+ {
+ "epoch": 69.79019073569482,
+ "grad_norm": 2.8347413539886475,
+ "learning_rate": 4.416674586674059e-06,
+ "loss": 0.0736,
+ "step": 25613
+ },
+ {
+ "epoch": 69.79291553133515,
+ "grad_norm": 2.759368896484375,
+ "learning_rate": 4.415942475647952e-06,
+ "loss": 0.0456,
+ "step": 25614
+ },
+ {
+ "epoch": 69.79564032697547,
+ "grad_norm": 4.204044818878174,
+ "learning_rate": 4.415210408110308e-06,
+ "loss": 0.0493,
+ "step": 25615
+ },
+ {
+ "epoch": 69.7983651226158,
+ "grad_norm": 3.0013973712921143,
+ "learning_rate": 4.414478384066827e-06,
+ "loss": 0.1487,
+ "step": 25616
+ },
+ {
+ "epoch": 69.80108991825612,
+ "grad_norm": 2.776397943496704,
+ "learning_rate": 4.413746403523208e-06,
+ "loss": 0.0492,
+ "step": 25617
+ },
+ {
+ "epoch": 69.80381471389646,
+ "grad_norm": 3.0675408840179443,
+ "learning_rate": 4.413014466485148e-06,
+ "loss": 0.2052,
+ "step": 25618
+ },
+ {
+ "epoch": 69.80653950953679,
+ "grad_norm": 2.969741106033325,
+ "learning_rate": 4.412282572958356e-06,
+ "loss": 0.0487,
+ "step": 25619
+ },
+ {
+ "epoch": 69.80926430517711,
+ "grad_norm": 2.379892587661743,
+ "learning_rate": 4.411550722948527e-06,
+ "loss": 0.1333,
+ "step": 25620
+ },
+ {
+ "epoch": 69.81198910081744,
+ "grad_norm": 2.675790548324585,
+ "learning_rate": 4.410818916461362e-06,
+ "loss": 0.0952,
+ "step": 25621
+ },
+ {
+ "epoch": 69.81471389645776,
+ "grad_norm": 3.693694591522217,
+ "learning_rate": 4.410087153502554e-06,
+ "loss": 0.0805,
+ "step": 25622
+ },
+ {
+ "epoch": 69.8174386920981,
+ "grad_norm": 2.791461944580078,
+ "learning_rate": 4.409355434077812e-06,
+ "loss": 0.1232,
+ "step": 25623
+ },
+ {
+ "epoch": 69.82016348773843,
+ "grad_norm": 3.2176051139831543,
+ "learning_rate": 4.408623758192829e-06,
+ "loss": 0.0851,
+ "step": 25624
+ },
+ {
+ "epoch": 69.82288828337875,
+ "grad_norm": 3.1415207386016846,
+ "learning_rate": 4.4078921258533026e-06,
+ "loss": 0.0891,
+ "step": 25625
+ },
+ {
+ "epoch": 69.82561307901908,
+ "grad_norm": 3.862701416015625,
+ "learning_rate": 4.407160537064934e-06,
+ "loss": 0.0749,
+ "step": 25626
+ },
+ {
+ "epoch": 69.8283378746594,
+ "grad_norm": 5.554037570953369,
+ "learning_rate": 4.40642899183342e-06,
+ "loss": 0.147,
+ "step": 25627
+ },
+ {
+ "epoch": 69.83106267029973,
+ "grad_norm": 3.3573391437530518,
+ "learning_rate": 4.4056974901644565e-06,
+ "loss": 0.0807,
+ "step": 25628
+ },
+ {
+ "epoch": 69.83378746594005,
+ "grad_norm": 2.9982717037200928,
+ "learning_rate": 4.404966032063738e-06,
+ "loss": 0.0752,
+ "step": 25629
+ },
+ {
+ "epoch": 69.83651226158038,
+ "grad_norm": 10.977214813232422,
+ "learning_rate": 4.404234617536964e-06,
+ "loss": 0.1221,
+ "step": 25630
+ },
+ {
+ "epoch": 69.83923705722071,
+ "grad_norm": 3.395043134689331,
+ "learning_rate": 4.403503246589834e-06,
+ "loss": 0.1199,
+ "step": 25631
+ },
+ {
+ "epoch": 69.84196185286103,
+ "grad_norm": 2.596799612045288,
+ "learning_rate": 4.402771919228041e-06,
+ "loss": 0.0495,
+ "step": 25632
+ },
+ {
+ "epoch": 69.84468664850137,
+ "grad_norm": 3.859687566757202,
+ "learning_rate": 4.402040635457279e-06,
+ "loss": 0.0637,
+ "step": 25633
+ },
+ {
+ "epoch": 69.84741144414168,
+ "grad_norm": 4.322866439819336,
+ "learning_rate": 4.401309395283241e-06,
+ "loss": 0.107,
+ "step": 25634
+ },
+ {
+ "epoch": 69.85013623978202,
+ "grad_norm": 3.5606908798217773,
+ "learning_rate": 4.400578198711629e-06,
+ "loss": 0.1245,
+ "step": 25635
+ },
+ {
+ "epoch": 69.85286103542235,
+ "grad_norm": 2.4128639698028564,
+ "learning_rate": 4.399847045748134e-06,
+ "loss": 0.0301,
+ "step": 25636
+ },
+ {
+ "epoch": 69.85558583106267,
+ "grad_norm": 3.8043482303619385,
+ "learning_rate": 4.39911593639845e-06,
+ "loss": 0.0649,
+ "step": 25637
+ },
+ {
+ "epoch": 69.858310626703,
+ "grad_norm": 2.828317165374756,
+ "learning_rate": 4.398384870668267e-06,
+ "loss": 0.2023,
+ "step": 25638
+ },
+ {
+ "epoch": 69.86103542234332,
+ "grad_norm": 3.3704493045806885,
+ "learning_rate": 4.397653848563287e-06,
+ "loss": 0.0682,
+ "step": 25639
+ },
+ {
+ "epoch": 69.86376021798365,
+ "grad_norm": 3.1510908603668213,
+ "learning_rate": 4.396922870089197e-06,
+ "loss": 0.0609,
+ "step": 25640
+ },
+ {
+ "epoch": 69.86648501362397,
+ "grad_norm": 3.364135265350342,
+ "learning_rate": 4.396191935251694e-06,
+ "loss": 0.1387,
+ "step": 25641
+ },
+ {
+ "epoch": 69.8692098092643,
+ "grad_norm": 3.898624897003174,
+ "learning_rate": 4.395461044056462e-06,
+ "loss": 0.0904,
+ "step": 25642
+ },
+ {
+ "epoch": 69.87193460490464,
+ "grad_norm": 3.5249741077423096,
+ "learning_rate": 4.394730196509203e-06,
+ "loss": 0.0581,
+ "step": 25643
+ },
+ {
+ "epoch": 69.87465940054496,
+ "grad_norm": 5.282028675079346,
+ "learning_rate": 4.393999392615604e-06,
+ "loss": 0.0977,
+ "step": 25644
+ },
+ {
+ "epoch": 69.87738419618529,
+ "grad_norm": 3.129587173461914,
+ "learning_rate": 4.393268632381354e-06,
+ "loss": 0.039,
+ "step": 25645
+ },
+ {
+ "epoch": 69.88010899182561,
+ "grad_norm": 3.003549814224243,
+ "learning_rate": 4.392537915812148e-06,
+ "loss": 0.1757,
+ "step": 25646
+ },
+ {
+ "epoch": 69.88283378746594,
+ "grad_norm": 2.8321433067321777,
+ "learning_rate": 4.391807242913679e-06,
+ "loss": 0.0421,
+ "step": 25647
+ },
+ {
+ "epoch": 69.88555858310627,
+ "grad_norm": 3.6392486095428467,
+ "learning_rate": 4.391076613691636e-06,
+ "loss": 0.0545,
+ "step": 25648
+ },
+ {
+ "epoch": 69.88828337874659,
+ "grad_norm": 3.471306562423706,
+ "learning_rate": 4.390346028151708e-06,
+ "loss": 0.0431,
+ "step": 25649
+ },
+ {
+ "epoch": 69.89100817438693,
+ "grad_norm": 3.0239179134368896,
+ "learning_rate": 4.38961548629958e-06,
+ "loss": 0.0341,
+ "step": 25650
+ },
+ {
+ "epoch": 69.89373297002724,
+ "grad_norm": 7.585079669952393,
+ "learning_rate": 4.38888498814095e-06,
+ "loss": 0.1591,
+ "step": 25651
+ },
+ {
+ "epoch": 69.89645776566758,
+ "grad_norm": 4.792723655700684,
+ "learning_rate": 4.388154533681502e-06,
+ "loss": 0.1317,
+ "step": 25652
+ },
+ {
+ "epoch": 69.8991825613079,
+ "grad_norm": 3.157466173171997,
+ "learning_rate": 4.387424122926927e-06,
+ "loss": 0.0898,
+ "step": 25653
+ },
+ {
+ "epoch": 69.90190735694823,
+ "grad_norm": 2.9385287761688232,
+ "learning_rate": 4.386693755882909e-06,
+ "loss": 0.0555,
+ "step": 25654
+ },
+ {
+ "epoch": 69.90463215258856,
+ "grad_norm": 3.342075824737549,
+ "learning_rate": 4.385963432555142e-06,
+ "loss": 0.073,
+ "step": 25655
+ },
+ {
+ "epoch": 69.90735694822888,
+ "grad_norm": 3.559858798980713,
+ "learning_rate": 4.385233152949312e-06,
+ "loss": 0.101,
+ "step": 25656
+ },
+ {
+ "epoch": 69.91008174386921,
+ "grad_norm": 4.819878578186035,
+ "learning_rate": 4.3845029170711055e-06,
+ "loss": 0.0646,
+ "step": 25657
+ },
+ {
+ "epoch": 69.91280653950953,
+ "grad_norm": 2.4177775382995605,
+ "learning_rate": 4.383772724926205e-06,
+ "loss": 0.1697,
+ "step": 25658
+ },
+ {
+ "epoch": 69.91553133514986,
+ "grad_norm": 3.4610695838928223,
+ "learning_rate": 4.383042576520306e-06,
+ "loss": 0.1073,
+ "step": 25659
+ },
+ {
+ "epoch": 69.9182561307902,
+ "grad_norm": 4.215226173400879,
+ "learning_rate": 4.38231247185909e-06,
+ "loss": 0.1097,
+ "step": 25660
+ },
+ {
+ "epoch": 69.92098092643052,
+ "grad_norm": 2.705392837524414,
+ "learning_rate": 4.381582410948244e-06,
+ "loss": 0.1132,
+ "step": 25661
+ },
+ {
+ "epoch": 69.92370572207085,
+ "grad_norm": 2.679771900177002,
+ "learning_rate": 4.380852393793451e-06,
+ "loss": 0.0356,
+ "step": 25662
+ },
+ {
+ "epoch": 69.92643051771117,
+ "grad_norm": 3.200523614883423,
+ "learning_rate": 4.380122420400397e-06,
+ "loss": 0.0553,
+ "step": 25663
+ },
+ {
+ "epoch": 69.9291553133515,
+ "grad_norm": 2.936349630355835,
+ "learning_rate": 4.379392490774773e-06,
+ "loss": 0.1744,
+ "step": 25664
+ },
+ {
+ "epoch": 69.93188010899182,
+ "grad_norm": 4.008108139038086,
+ "learning_rate": 4.378662604922259e-06,
+ "loss": 0.1185,
+ "step": 25665
+ },
+ {
+ "epoch": 69.93460490463215,
+ "grad_norm": 5.427388668060303,
+ "learning_rate": 4.3779327628485365e-06,
+ "loss": 0.112,
+ "step": 25666
+ },
+ {
+ "epoch": 69.93732970027249,
+ "grad_norm": 2.4391846656799316,
+ "learning_rate": 4.377202964559296e-06,
+ "loss": 0.1328,
+ "step": 25667
+ },
+ {
+ "epoch": 69.9400544959128,
+ "grad_norm": 2.8574271202087402,
+ "learning_rate": 4.376473210060219e-06,
+ "loss": 0.042,
+ "step": 25668
+ },
+ {
+ "epoch": 69.94277929155314,
+ "grad_norm": 2.2506847381591797,
+ "learning_rate": 4.375743499356987e-06,
+ "loss": 0.0739,
+ "step": 25669
+ },
+ {
+ "epoch": 69.94550408719346,
+ "grad_norm": 3.2817273139953613,
+ "learning_rate": 4.375013832455279e-06,
+ "loss": 0.1347,
+ "step": 25670
+ },
+ {
+ "epoch": 69.94822888283379,
+ "grad_norm": 3.0046727657318115,
+ "learning_rate": 4.374284209360787e-06,
+ "loss": 0.0601,
+ "step": 25671
+ },
+ {
+ "epoch": 69.95095367847412,
+ "grad_norm": 4.249406814575195,
+ "learning_rate": 4.373554630079187e-06,
+ "loss": 0.095,
+ "step": 25672
+ },
+ {
+ "epoch": 69.95367847411444,
+ "grad_norm": 3.763875722885132,
+ "learning_rate": 4.3728250946161644e-06,
+ "loss": 0.0977,
+ "step": 25673
+ },
+ {
+ "epoch": 69.95640326975477,
+ "grad_norm": 3.7556955814361572,
+ "learning_rate": 4.372095602977394e-06,
+ "loss": 0.067,
+ "step": 25674
+ },
+ {
+ "epoch": 69.95912806539509,
+ "grad_norm": 3.5178794860839844,
+ "learning_rate": 4.371366155168566e-06,
+ "loss": 0.0613,
+ "step": 25675
+ },
+ {
+ "epoch": 69.96185286103542,
+ "grad_norm": 3.5529630184173584,
+ "learning_rate": 4.370636751195357e-06,
+ "loss": 0.0539,
+ "step": 25676
+ },
+ {
+ "epoch": 69.96457765667574,
+ "grad_norm": 3.3359811305999756,
+ "learning_rate": 4.369907391063448e-06,
+ "loss": 0.1426,
+ "step": 25677
+ },
+ {
+ "epoch": 69.96730245231608,
+ "grad_norm": 2.9579179286956787,
+ "learning_rate": 4.369178074778516e-06,
+ "loss": 0.1469,
+ "step": 25678
+ },
+ {
+ "epoch": 69.97002724795641,
+ "grad_norm": 3.1833534240722656,
+ "learning_rate": 4.368448802346247e-06,
+ "loss": 0.0935,
+ "step": 25679
+ },
+ {
+ "epoch": 69.97275204359673,
+ "grad_norm": 3.3022069931030273,
+ "learning_rate": 4.367719573772313e-06,
+ "loss": 0.0816,
+ "step": 25680
+ },
+ {
+ "epoch": 69.97547683923706,
+ "grad_norm": 3.098957061767578,
+ "learning_rate": 4.366990389062402e-06,
+ "loss": 0.0598,
+ "step": 25681
+ },
+ {
+ "epoch": 69.97820163487738,
+ "grad_norm": 3.772223711013794,
+ "learning_rate": 4.366261248222189e-06,
+ "loss": 0.0484,
+ "step": 25682
+ },
+ {
+ "epoch": 69.98092643051771,
+ "grad_norm": 2.9102935791015625,
+ "learning_rate": 4.3655321512573475e-06,
+ "loss": 0.0849,
+ "step": 25683
+ },
+ {
+ "epoch": 69.98365122615803,
+ "grad_norm": 4.268817901611328,
+ "learning_rate": 4.364803098173566e-06,
+ "loss": 0.0833,
+ "step": 25684
+ },
+ {
+ "epoch": 69.98637602179836,
+ "grad_norm": 2.0717179775238037,
+ "learning_rate": 4.364074088976514e-06,
+ "loss": 0.031,
+ "step": 25685
+ },
+ {
+ "epoch": 69.9891008174387,
+ "grad_norm": 2.721580743789673,
+ "learning_rate": 4.363345123671873e-06,
+ "loss": 0.0813,
+ "step": 25686
+ },
+ {
+ "epoch": 69.99182561307902,
+ "grad_norm": 5.713351726531982,
+ "learning_rate": 4.362616202265315e-06,
+ "loss": 0.0604,
+ "step": 25687
+ },
+ {
+ "epoch": 69.99455040871935,
+ "grad_norm": 5.006141662597656,
+ "learning_rate": 4.3618873247625235e-06,
+ "loss": 0.0677,
+ "step": 25688
+ },
+ {
+ "epoch": 69.99727520435967,
+ "grad_norm": 4.068763732910156,
+ "learning_rate": 4.361158491169173e-06,
+ "loss": 0.1026,
+ "step": 25689
+ },
+ {
+ "epoch": 70.0,
+ "grad_norm": 3.37605881690979,
+ "learning_rate": 4.360429701490935e-06,
+ "loss": 0.0605,
+ "step": 25690
+ },
+ {
+ "epoch": 70.00272479564033,
+ "grad_norm": 2.612733840942383,
+ "learning_rate": 4.359700955733492e-06,
+ "loss": 0.0424,
+ "step": 25691
+ },
+ {
+ "epoch": 70.00544959128065,
+ "grad_norm": 3.462092161178589,
+ "learning_rate": 4.358972253902517e-06,
+ "loss": 0.1157,
+ "step": 25692
+ },
+ {
+ "epoch": 70.00817438692098,
+ "grad_norm": 2.9180169105529785,
+ "learning_rate": 4.358243596003684e-06,
+ "loss": 0.0549,
+ "step": 25693
+ },
+ {
+ "epoch": 70.0108991825613,
+ "grad_norm": 3.7692203521728516,
+ "learning_rate": 4.357514982042664e-06,
+ "loss": 0.1095,
+ "step": 25694
+ },
+ {
+ "epoch": 70.01362397820164,
+ "grad_norm": 3.2022128105163574,
+ "learning_rate": 4.3567864120251406e-06,
+ "loss": 0.1199,
+ "step": 25695
+ },
+ {
+ "epoch": 70.01634877384195,
+ "grad_norm": 5.526648044586182,
+ "learning_rate": 4.356057885956782e-06,
+ "loss": 0.1713,
+ "step": 25696
+ },
+ {
+ "epoch": 70.01907356948229,
+ "grad_norm": 2.456502914428711,
+ "learning_rate": 4.35532940384326e-06,
+ "loss": 0.0632,
+ "step": 25697
+ },
+ {
+ "epoch": 70.02179836512262,
+ "grad_norm": 3.7020177841186523,
+ "learning_rate": 4.354600965690255e-06,
+ "loss": 0.1594,
+ "step": 25698
+ },
+ {
+ "epoch": 70.02452316076294,
+ "grad_norm": 3.0396926403045654,
+ "learning_rate": 4.353872571503431e-06,
+ "loss": 0.1524,
+ "step": 25699
+ },
+ {
+ "epoch": 70.02724795640327,
+ "grad_norm": 3.463225841522217,
+ "learning_rate": 4.353144221288471e-06,
+ "loss": 0.0591,
+ "step": 25700
+ },
+ {
+ "epoch": 70.02997275204359,
+ "grad_norm": 2.843632698059082,
+ "learning_rate": 4.352415915051042e-06,
+ "loss": 0.0925,
+ "step": 25701
+ },
+ {
+ "epoch": 70.03269754768392,
+ "grad_norm": 2.684150457382202,
+ "learning_rate": 4.351687652796815e-06,
+ "loss": 0.08,
+ "step": 25702
+ },
+ {
+ "epoch": 70.03542234332426,
+ "grad_norm": 2.7099454402923584,
+ "learning_rate": 4.3509594345314585e-06,
+ "loss": 0.0472,
+ "step": 25703
+ },
+ {
+ "epoch": 70.03814713896458,
+ "grad_norm": 2.846945285797119,
+ "learning_rate": 4.350231260260653e-06,
+ "loss": 0.0433,
+ "step": 25704
+ },
+ {
+ "epoch": 70.04087193460491,
+ "grad_norm": 2.798208475112915,
+ "learning_rate": 4.349503129990065e-06,
+ "loss": 0.0679,
+ "step": 25705
+ },
+ {
+ "epoch": 70.04359673024523,
+ "grad_norm": 3.0003740787506104,
+ "learning_rate": 4.348775043725364e-06,
+ "loss": 0.0504,
+ "step": 25706
+ },
+ {
+ "epoch": 70.04632152588556,
+ "grad_norm": 3.941540479660034,
+ "learning_rate": 4.348047001472217e-06,
+ "loss": 0.0373,
+ "step": 25707
+ },
+ {
+ "epoch": 70.04904632152588,
+ "grad_norm": 3.7867789268493652,
+ "learning_rate": 4.347319003236302e-06,
+ "loss": 0.1158,
+ "step": 25708
+ },
+ {
+ "epoch": 70.05177111716621,
+ "grad_norm": 3.8642520904541016,
+ "learning_rate": 4.346591049023286e-06,
+ "loss": 0.1307,
+ "step": 25709
+ },
+ {
+ "epoch": 70.05449591280654,
+ "grad_norm": 3.514848470687866,
+ "learning_rate": 4.34586313883883e-06,
+ "loss": 0.0669,
+ "step": 25710
+ },
+ {
+ "epoch": 70.05722070844686,
+ "grad_norm": 2.442347526550293,
+ "learning_rate": 4.345135272688617e-06,
+ "loss": 0.0349,
+ "step": 25711
+ },
+ {
+ "epoch": 70.0599455040872,
+ "grad_norm": 2.755409002304077,
+ "learning_rate": 4.3444074505783075e-06,
+ "loss": 0.0613,
+ "step": 25712
+ },
+ {
+ "epoch": 70.06267029972751,
+ "grad_norm": 3.864417791366577,
+ "learning_rate": 4.34367967251357e-06,
+ "loss": 0.0722,
+ "step": 25713
+ },
+ {
+ "epoch": 70.06539509536785,
+ "grad_norm": 1.9272481203079224,
+ "learning_rate": 4.342951938500069e-06,
+ "loss": 0.0521,
+ "step": 25714
+ },
+ {
+ "epoch": 70.06811989100818,
+ "grad_norm": 4.0011887550354,
+ "learning_rate": 4.342224248543479e-06,
+ "loss": 0.0657,
+ "step": 25715
+ },
+ {
+ "epoch": 70.0708446866485,
+ "grad_norm": 2.9652342796325684,
+ "learning_rate": 4.341496602649465e-06,
+ "loss": 0.0505,
+ "step": 25716
+ },
+ {
+ "epoch": 70.07356948228883,
+ "grad_norm": 2.233431577682495,
+ "learning_rate": 4.340769000823695e-06,
+ "loss": 0.0522,
+ "step": 25717
+ },
+ {
+ "epoch": 70.07629427792915,
+ "grad_norm": 2.004546880722046,
+ "learning_rate": 4.340041443071833e-06,
+ "loss": 0.0246,
+ "step": 25718
+ },
+ {
+ "epoch": 70.07901907356948,
+ "grad_norm": 2.3655498027801514,
+ "learning_rate": 4.339313929399543e-06,
+ "loss": 0.0996,
+ "step": 25719
+ },
+ {
+ "epoch": 70.0817438692098,
+ "grad_norm": 4.205402851104736,
+ "learning_rate": 4.338586459812498e-06,
+ "loss": 0.0624,
+ "step": 25720
+ },
+ {
+ "epoch": 70.08446866485014,
+ "grad_norm": 3.3054966926574707,
+ "learning_rate": 4.337859034316358e-06,
+ "loss": 0.1,
+ "step": 25721
+ },
+ {
+ "epoch": 70.08719346049047,
+ "grad_norm": 2.6024978160858154,
+ "learning_rate": 4.337131652916792e-06,
+ "loss": 0.0862,
+ "step": 25722
+ },
+ {
+ "epoch": 70.08991825613079,
+ "grad_norm": 3.2785117626190186,
+ "learning_rate": 4.3364043156194566e-06,
+ "loss": 0.0414,
+ "step": 25723
+ },
+ {
+ "epoch": 70.09264305177112,
+ "grad_norm": 2.1956186294555664,
+ "learning_rate": 4.335677022430027e-06,
+ "loss": 0.0895,
+ "step": 25724
+ },
+ {
+ "epoch": 70.09536784741144,
+ "grad_norm": 2.7542428970336914,
+ "learning_rate": 4.334949773354161e-06,
+ "loss": 0.0884,
+ "step": 25725
+ },
+ {
+ "epoch": 70.09809264305177,
+ "grad_norm": 8.024162292480469,
+ "learning_rate": 4.334222568397526e-06,
+ "loss": 0.0363,
+ "step": 25726
+ },
+ {
+ "epoch": 70.1008174386921,
+ "grad_norm": 2.9970154762268066,
+ "learning_rate": 4.333495407565777e-06,
+ "loss": 0.2539,
+ "step": 25727
+ },
+ {
+ "epoch": 70.10354223433242,
+ "grad_norm": 2.9449198246002197,
+ "learning_rate": 4.33276829086459e-06,
+ "loss": 0.1015,
+ "step": 25728
+ },
+ {
+ "epoch": 70.10626702997276,
+ "grad_norm": 2.850621461868286,
+ "learning_rate": 4.332041218299619e-06,
+ "loss": 0.1877,
+ "step": 25729
+ },
+ {
+ "epoch": 70.10899182561307,
+ "grad_norm": 3.671219825744629,
+ "learning_rate": 4.331314189876528e-06,
+ "loss": 0.0564,
+ "step": 25730
+ },
+ {
+ "epoch": 70.11171662125341,
+ "grad_norm": 3.8866076469421387,
+ "learning_rate": 4.330587205600978e-06,
+ "loss": 0.0603,
+ "step": 25731
+ },
+ {
+ "epoch": 70.11444141689373,
+ "grad_norm": 3.623387575149536,
+ "learning_rate": 4.329860265478631e-06,
+ "loss": 0.1453,
+ "step": 25732
+ },
+ {
+ "epoch": 70.11716621253406,
+ "grad_norm": 5.383785724639893,
+ "learning_rate": 4.329133369515155e-06,
+ "loss": 0.0817,
+ "step": 25733
+ },
+ {
+ "epoch": 70.11989100817439,
+ "grad_norm": 3.942452907562256,
+ "learning_rate": 4.328406517716205e-06,
+ "loss": 0.188,
+ "step": 25734
+ },
+ {
+ "epoch": 70.12261580381471,
+ "grad_norm": 4.4679951667785645,
+ "learning_rate": 4.327679710087438e-06,
+ "loss": 0.1185,
+ "step": 25735
+ },
+ {
+ "epoch": 70.12534059945504,
+ "grad_norm": 3.4070608615875244,
+ "learning_rate": 4.326952946634523e-06,
+ "loss": 0.1402,
+ "step": 25736
+ },
+ {
+ "epoch": 70.12806539509536,
+ "grad_norm": 4.057241916656494,
+ "learning_rate": 4.326226227363116e-06,
+ "loss": 0.1239,
+ "step": 25737
+ },
+ {
+ "epoch": 70.1307901907357,
+ "grad_norm": 3.2047441005706787,
+ "learning_rate": 4.325499552278877e-06,
+ "loss": 0.0428,
+ "step": 25738
+ },
+ {
+ "epoch": 70.13351498637603,
+ "grad_norm": 3.029756546020508,
+ "learning_rate": 4.32477292138746e-06,
+ "loss": 0.1284,
+ "step": 25739
+ },
+ {
+ "epoch": 70.13623978201635,
+ "grad_norm": 3.8635129928588867,
+ "learning_rate": 4.324046334694534e-06,
+ "loss": 0.0568,
+ "step": 25740
+ },
+ {
+ "epoch": 70.13896457765668,
+ "grad_norm": 4.335892200469971,
+ "learning_rate": 4.3233197922057515e-06,
+ "loss": 0.0934,
+ "step": 25741
+ },
+ {
+ "epoch": 70.141689373297,
+ "grad_norm": 2.3393070697784424,
+ "learning_rate": 4.322593293926771e-06,
+ "loss": 0.1254,
+ "step": 25742
+ },
+ {
+ "epoch": 70.14441416893733,
+ "grad_norm": 4.349730968475342,
+ "learning_rate": 4.321866839863249e-06,
+ "loss": 0.0705,
+ "step": 25743
+ },
+ {
+ "epoch": 70.14713896457765,
+ "grad_norm": 5.032073020935059,
+ "learning_rate": 4.321140430020848e-06,
+ "loss": 0.0822,
+ "step": 25744
+ },
+ {
+ "epoch": 70.14986376021798,
+ "grad_norm": 2.0033092498779297,
+ "learning_rate": 4.320414064405223e-06,
+ "loss": 0.0285,
+ "step": 25745
+ },
+ {
+ "epoch": 70.15258855585832,
+ "grad_norm": 3.244332790374756,
+ "learning_rate": 4.319687743022031e-06,
+ "loss": 0.0398,
+ "step": 25746
+ },
+ {
+ "epoch": 70.15531335149863,
+ "grad_norm": 4.38469123840332,
+ "learning_rate": 4.318961465876924e-06,
+ "loss": 0.1832,
+ "step": 25747
+ },
+ {
+ "epoch": 70.15803814713897,
+ "grad_norm": 2.730025053024292,
+ "learning_rate": 4.318235232975565e-06,
+ "loss": 0.0361,
+ "step": 25748
+ },
+ {
+ "epoch": 70.16076294277929,
+ "grad_norm": 2.532407522201538,
+ "learning_rate": 4.317509044323605e-06,
+ "loss": 0.0421,
+ "step": 25749
+ },
+ {
+ "epoch": 70.16348773841962,
+ "grad_norm": 3.7165937423706055,
+ "learning_rate": 4.316782899926704e-06,
+ "loss": 0.045,
+ "step": 25750
+ },
+ {
+ "epoch": 70.16621253405995,
+ "grad_norm": 2.5522847175598145,
+ "learning_rate": 4.316056799790512e-06,
+ "loss": 0.0396,
+ "step": 25751
+ },
+ {
+ "epoch": 70.16893732970027,
+ "grad_norm": 2.729966163635254,
+ "learning_rate": 4.31533074392069e-06,
+ "loss": 0.0488,
+ "step": 25752
+ },
+ {
+ "epoch": 70.1716621253406,
+ "grad_norm": 2.9957115650177,
+ "learning_rate": 4.314604732322889e-06,
+ "loss": 0.049,
+ "step": 25753
+ },
+ {
+ "epoch": 70.17438692098092,
+ "grad_norm": 3.1514878273010254,
+ "learning_rate": 4.313878765002763e-06,
+ "loss": 0.0741,
+ "step": 25754
+ },
+ {
+ "epoch": 70.17711171662125,
+ "grad_norm": 2.544762134552002,
+ "learning_rate": 4.313152841965964e-06,
+ "loss": 0.0594,
+ "step": 25755
+ },
+ {
+ "epoch": 70.17983651226157,
+ "grad_norm": 2.818070888519287,
+ "learning_rate": 4.31242696321815e-06,
+ "loss": 0.0461,
+ "step": 25756
+ },
+ {
+ "epoch": 70.1825613079019,
+ "grad_norm": 2.1443002223968506,
+ "learning_rate": 4.311701128764974e-06,
+ "loss": 0.1193,
+ "step": 25757
+ },
+ {
+ "epoch": 70.18528610354224,
+ "grad_norm": 5.600152969360352,
+ "learning_rate": 4.310975338612084e-06,
+ "loss": 0.1201,
+ "step": 25758
+ },
+ {
+ "epoch": 70.18801089918256,
+ "grad_norm": 3.2574639320373535,
+ "learning_rate": 4.310249592765133e-06,
+ "loss": 0.0676,
+ "step": 25759
+ },
+ {
+ "epoch": 70.19073569482289,
+ "grad_norm": 2.508854627609253,
+ "learning_rate": 4.309523891229777e-06,
+ "loss": 0.0537,
+ "step": 25760
+ },
+ {
+ "epoch": 70.19346049046321,
+ "grad_norm": 2.628046751022339,
+ "learning_rate": 4.3087982340116665e-06,
+ "loss": 0.0623,
+ "step": 25761
+ },
+ {
+ "epoch": 70.19618528610354,
+ "grad_norm": 3.702197551727295,
+ "learning_rate": 4.308072621116453e-06,
+ "loss": 0.1033,
+ "step": 25762
+ },
+ {
+ "epoch": 70.19891008174388,
+ "grad_norm": 2.7948198318481445,
+ "learning_rate": 4.307347052549781e-06,
+ "loss": 0.0927,
+ "step": 25763
+ },
+ {
+ "epoch": 70.2016348773842,
+ "grad_norm": 4.994749069213867,
+ "learning_rate": 4.306621528317312e-06,
+ "loss": 0.041,
+ "step": 25764
+ },
+ {
+ "epoch": 70.20435967302453,
+ "grad_norm": 2.5164976119995117,
+ "learning_rate": 4.305896048424691e-06,
+ "loss": 0.0393,
+ "step": 25765
+ },
+ {
+ "epoch": 70.20708446866485,
+ "grad_norm": 3.661639451980591,
+ "learning_rate": 4.305170612877565e-06,
+ "loss": 0.048,
+ "step": 25766
+ },
+ {
+ "epoch": 70.20980926430518,
+ "grad_norm": 3.312103033065796,
+ "learning_rate": 4.304445221681592e-06,
+ "loss": 0.0444,
+ "step": 25767
+ },
+ {
+ "epoch": 70.2125340599455,
+ "grad_norm": 2.6454432010650635,
+ "learning_rate": 4.3037198748424105e-06,
+ "loss": 0.0386,
+ "step": 25768
+ },
+ {
+ "epoch": 70.21525885558583,
+ "grad_norm": 2.856839656829834,
+ "learning_rate": 4.30299457236568e-06,
+ "loss": 0.0964,
+ "step": 25769
+ },
+ {
+ "epoch": 70.21798365122616,
+ "grad_norm": 3.4453814029693604,
+ "learning_rate": 4.302269314257044e-06,
+ "loss": 0.0806,
+ "step": 25770
+ },
+ {
+ "epoch": 70.22070844686648,
+ "grad_norm": 3.521606206893921,
+ "learning_rate": 4.301544100522151e-06,
+ "loss": 0.0744,
+ "step": 25771
+ },
+ {
+ "epoch": 70.22343324250681,
+ "grad_norm": 3.4696497917175293,
+ "learning_rate": 4.300818931166645e-06,
+ "loss": 0.0745,
+ "step": 25772
+ },
+ {
+ "epoch": 70.22615803814713,
+ "grad_norm": 4.244225978851318,
+ "learning_rate": 4.3000938061961825e-06,
+ "loss": 0.0535,
+ "step": 25773
+ },
+ {
+ "epoch": 70.22888283378747,
+ "grad_norm": 2.9358582496643066,
+ "learning_rate": 4.299368725616405e-06,
+ "loss": 0.0884,
+ "step": 25774
+ },
+ {
+ "epoch": 70.2316076294278,
+ "grad_norm": 3.3426084518432617,
+ "learning_rate": 4.298643689432958e-06,
+ "loss": 0.0664,
+ "step": 25775
+ },
+ {
+ "epoch": 70.23433242506812,
+ "grad_norm": 3.7609598636627197,
+ "learning_rate": 4.297918697651493e-06,
+ "loss": 0.1675,
+ "step": 25776
+ },
+ {
+ "epoch": 70.23705722070845,
+ "grad_norm": 3.2763009071350098,
+ "learning_rate": 4.297193750277654e-06,
+ "loss": 0.1055,
+ "step": 25777
+ },
+ {
+ "epoch": 70.23978201634877,
+ "grad_norm": 3.5721278190612793,
+ "learning_rate": 4.296468847317086e-06,
+ "loss": 0.0665,
+ "step": 25778
+ },
+ {
+ "epoch": 70.2425068119891,
+ "grad_norm": 3.158398151397705,
+ "learning_rate": 4.2957439887754325e-06,
+ "loss": 0.0466,
+ "step": 25779
+ },
+ {
+ "epoch": 70.24523160762942,
+ "grad_norm": 2.066787004470825,
+ "learning_rate": 4.295019174658344e-06,
+ "loss": 0.154,
+ "step": 25780
+ },
+ {
+ "epoch": 70.24795640326975,
+ "grad_norm": 3.3044679164886475,
+ "learning_rate": 4.294294404971464e-06,
+ "loss": 0.1755,
+ "step": 25781
+ },
+ {
+ "epoch": 70.25068119891009,
+ "grad_norm": 5.466963291168213,
+ "learning_rate": 4.293569679720434e-06,
+ "loss": 0.1676,
+ "step": 25782
+ },
+ {
+ "epoch": 70.2534059945504,
+ "grad_norm": 3.4783709049224854,
+ "learning_rate": 4.2928449989108964e-06,
+ "loss": 0.0965,
+ "step": 25783
+ },
+ {
+ "epoch": 70.25613079019074,
+ "grad_norm": 2.85040283203125,
+ "learning_rate": 4.292120362548499e-06,
+ "loss": 0.0299,
+ "step": 25784
+ },
+ {
+ "epoch": 70.25885558583106,
+ "grad_norm": 2.3949267864227295,
+ "learning_rate": 4.291395770638888e-06,
+ "loss": 0.0344,
+ "step": 25785
+ },
+ {
+ "epoch": 70.26158038147139,
+ "grad_norm": 2.427435874938965,
+ "learning_rate": 4.290671223187701e-06,
+ "loss": 0.1092,
+ "step": 25786
+ },
+ {
+ "epoch": 70.26430517711172,
+ "grad_norm": 2.70589542388916,
+ "learning_rate": 4.289946720200585e-06,
+ "loss": 0.1229,
+ "step": 25787
+ },
+ {
+ "epoch": 70.26702997275204,
+ "grad_norm": 2.6562418937683105,
+ "learning_rate": 4.289222261683176e-06,
+ "loss": 0.0531,
+ "step": 25788
+ },
+ {
+ "epoch": 70.26975476839237,
+ "grad_norm": 2.682788848876953,
+ "learning_rate": 4.2884978476411235e-06,
+ "loss": 0.0811,
+ "step": 25789
+ },
+ {
+ "epoch": 70.2724795640327,
+ "grad_norm": 3.2893130779266357,
+ "learning_rate": 4.287773478080066e-06,
+ "loss": 0.0965,
+ "step": 25790
+ },
+ {
+ "epoch": 70.27520435967303,
+ "grad_norm": 2.856510639190674,
+ "learning_rate": 4.287049153005644e-06,
+ "loss": 0.13,
+ "step": 25791
+ },
+ {
+ "epoch": 70.27792915531334,
+ "grad_norm": 4.285785675048828,
+ "learning_rate": 4.286324872423497e-06,
+ "loss": 0.1433,
+ "step": 25792
+ },
+ {
+ "epoch": 70.28065395095368,
+ "grad_norm": 2.9691834449768066,
+ "learning_rate": 4.2856006363392726e-06,
+ "loss": 0.1299,
+ "step": 25793
+ },
+ {
+ "epoch": 70.28337874659401,
+ "grad_norm": 2.4945054054260254,
+ "learning_rate": 4.284876444758604e-06,
+ "loss": 0.0714,
+ "step": 25794
+ },
+ {
+ "epoch": 70.28610354223433,
+ "grad_norm": 3.0490522384643555,
+ "learning_rate": 4.284152297687136e-06,
+ "loss": 0.0664,
+ "step": 25795
+ },
+ {
+ "epoch": 70.28882833787466,
+ "grad_norm": 4.4501729011535645,
+ "learning_rate": 4.2834281951305e-06,
+ "loss": 0.1,
+ "step": 25796
+ },
+ {
+ "epoch": 70.29155313351498,
+ "grad_norm": 1.6889508962631226,
+ "learning_rate": 4.2827041370943465e-06,
+ "loss": 0.0254,
+ "step": 25797
+ },
+ {
+ "epoch": 70.29427792915531,
+ "grad_norm": 3.197612762451172,
+ "learning_rate": 4.2819801235843086e-06,
+ "loss": 0.066,
+ "step": 25798
+ },
+ {
+ "epoch": 70.29700272479565,
+ "grad_norm": 2.619960308074951,
+ "learning_rate": 4.2812561546060215e-06,
+ "loss": 0.0985,
+ "step": 25799
+ },
+ {
+ "epoch": 70.29972752043597,
+ "grad_norm": 2.725442409515381,
+ "learning_rate": 4.280532230165132e-06,
+ "loss": 0.107,
+ "step": 25800
+ },
+ {
+ "epoch": 70.3024523160763,
+ "grad_norm": 3.8378942012786865,
+ "learning_rate": 4.2798083502672695e-06,
+ "loss": 0.062,
+ "step": 25801
+ },
+ {
+ "epoch": 70.30517711171662,
+ "grad_norm": 2.5743367671966553,
+ "learning_rate": 4.2790845149180784e-06,
+ "loss": 0.0678,
+ "step": 25802
+ },
+ {
+ "epoch": 70.30790190735695,
+ "grad_norm": 2.618525266647339,
+ "learning_rate": 4.278360724123194e-06,
+ "loss": 0.0742,
+ "step": 25803
+ },
+ {
+ "epoch": 70.31062670299727,
+ "grad_norm": 2.9353785514831543,
+ "learning_rate": 4.277636977888248e-06,
+ "loss": 0.039,
+ "step": 25804
+ },
+ {
+ "epoch": 70.3133514986376,
+ "grad_norm": 3.842531204223633,
+ "learning_rate": 4.276913276218885e-06,
+ "loss": 0.0964,
+ "step": 25805
+ },
+ {
+ "epoch": 70.31607629427793,
+ "grad_norm": 4.603367805480957,
+ "learning_rate": 4.2761896191207365e-06,
+ "loss": 0.0517,
+ "step": 25806
+ },
+ {
+ "epoch": 70.31880108991825,
+ "grad_norm": 2.459416151046753,
+ "learning_rate": 4.275466006599439e-06,
+ "loss": 0.0362,
+ "step": 25807
+ },
+ {
+ "epoch": 70.32152588555859,
+ "grad_norm": 3.6822526454925537,
+ "learning_rate": 4.2747424386606255e-06,
+ "loss": 0.0474,
+ "step": 25808
+ },
+ {
+ "epoch": 70.3242506811989,
+ "grad_norm": 3.025571823120117,
+ "learning_rate": 4.2740189153099355e-06,
+ "loss": 0.1482,
+ "step": 25809
+ },
+ {
+ "epoch": 70.32697547683924,
+ "grad_norm": 3.692002296447754,
+ "learning_rate": 4.2732954365530034e-06,
+ "loss": 0.1535,
+ "step": 25810
+ },
+ {
+ "epoch": 70.32970027247957,
+ "grad_norm": 2.6477317810058594,
+ "learning_rate": 4.2725720023954605e-06,
+ "loss": 0.0352,
+ "step": 25811
+ },
+ {
+ "epoch": 70.33242506811989,
+ "grad_norm": 2.575512647628784,
+ "learning_rate": 4.27184861284294e-06,
+ "loss": 0.1223,
+ "step": 25812
+ },
+ {
+ "epoch": 70.33514986376022,
+ "grad_norm": 13.949918746948242,
+ "learning_rate": 4.271125267901083e-06,
+ "loss": 0.0697,
+ "step": 25813
+ },
+ {
+ "epoch": 70.33787465940054,
+ "grad_norm": 2.2304110527038574,
+ "learning_rate": 4.2704019675755155e-06,
+ "loss": 0.039,
+ "step": 25814
+ },
+ {
+ "epoch": 70.34059945504087,
+ "grad_norm": 3.124695062637329,
+ "learning_rate": 4.269678711871875e-06,
+ "loss": 0.0675,
+ "step": 25815
+ },
+ {
+ "epoch": 70.34332425068119,
+ "grad_norm": 6.387601852416992,
+ "learning_rate": 4.268955500795788e-06,
+ "loss": 0.0655,
+ "step": 25816
+ },
+ {
+ "epoch": 70.34604904632153,
+ "grad_norm": 2.7448737621307373,
+ "learning_rate": 4.268232334352895e-06,
+ "loss": 0.0449,
+ "step": 25817
+ },
+ {
+ "epoch": 70.34877384196186,
+ "grad_norm": 2.030609369277954,
+ "learning_rate": 4.267509212548821e-06,
+ "loss": 0.0385,
+ "step": 25818
+ },
+ {
+ "epoch": 70.35149863760218,
+ "grad_norm": 2.8909125328063965,
+ "learning_rate": 4.266786135389203e-06,
+ "loss": 0.1641,
+ "step": 25819
+ },
+ {
+ "epoch": 70.35422343324251,
+ "grad_norm": 6.593447208404541,
+ "learning_rate": 4.2660631028796665e-06,
+ "loss": 0.1597,
+ "step": 25820
+ },
+ {
+ "epoch": 70.35694822888283,
+ "grad_norm": 2.1756784915924072,
+ "learning_rate": 4.26534011502585e-06,
+ "loss": 0.0674,
+ "step": 25821
+ },
+ {
+ "epoch": 70.35967302452316,
+ "grad_norm": 3.2333314418792725,
+ "learning_rate": 4.264617171833381e-06,
+ "loss": 0.2454,
+ "step": 25822
+ },
+ {
+ "epoch": 70.3623978201635,
+ "grad_norm": 2.5491182804107666,
+ "learning_rate": 4.263894273307888e-06,
+ "loss": 0.1337,
+ "step": 25823
+ },
+ {
+ "epoch": 70.36512261580381,
+ "grad_norm": 3.0634193420410156,
+ "learning_rate": 4.263171419454998e-06,
+ "loss": 0.0298,
+ "step": 25824
+ },
+ {
+ "epoch": 70.36784741144415,
+ "grad_norm": 3.094879150390625,
+ "learning_rate": 4.262448610280348e-06,
+ "loss": 0.0624,
+ "step": 25825
+ },
+ {
+ "epoch": 70.37057220708446,
+ "grad_norm": 1.936737060546875,
+ "learning_rate": 4.261725845789564e-06,
+ "loss": 0.0263,
+ "step": 25826
+ },
+ {
+ "epoch": 70.3732970027248,
+ "grad_norm": 5.852288246154785,
+ "learning_rate": 4.261003125988275e-06,
+ "loss": 0.0854,
+ "step": 25827
+ },
+ {
+ "epoch": 70.37602179836512,
+ "grad_norm": 2.6277921199798584,
+ "learning_rate": 4.260280450882104e-06,
+ "loss": 0.1037,
+ "step": 25828
+ },
+ {
+ "epoch": 70.37874659400545,
+ "grad_norm": 4.712032318115234,
+ "learning_rate": 4.259557820476689e-06,
+ "loss": 0.0596,
+ "step": 25829
+ },
+ {
+ "epoch": 70.38147138964578,
+ "grad_norm": 2.8652727603912354,
+ "learning_rate": 4.258835234777652e-06,
+ "loss": 0.0579,
+ "step": 25830
+ },
+ {
+ "epoch": 70.3841961852861,
+ "grad_norm": 2.4967751502990723,
+ "learning_rate": 4.2581126937906215e-06,
+ "loss": 0.0493,
+ "step": 25831
+ },
+ {
+ "epoch": 70.38692098092643,
+ "grad_norm": 3.6561508178710938,
+ "learning_rate": 4.257390197521221e-06,
+ "loss": 0.14,
+ "step": 25832
+ },
+ {
+ "epoch": 70.38964577656675,
+ "grad_norm": 5.42636251449585,
+ "learning_rate": 4.256667745975084e-06,
+ "loss": 0.1609,
+ "step": 25833
+ },
+ {
+ "epoch": 70.39237057220708,
+ "grad_norm": 3.0732507705688477,
+ "learning_rate": 4.255945339157834e-06,
+ "loss": 0.0536,
+ "step": 25834
+ },
+ {
+ "epoch": 70.39509536784742,
+ "grad_norm": 3.269412040710449,
+ "learning_rate": 4.255222977075094e-06,
+ "loss": 0.126,
+ "step": 25835
+ },
+ {
+ "epoch": 70.39782016348774,
+ "grad_norm": 2.7422266006469727,
+ "learning_rate": 4.254500659732496e-06,
+ "loss": 0.0561,
+ "step": 25836
+ },
+ {
+ "epoch": 70.40054495912807,
+ "grad_norm": 3.6423215866088867,
+ "learning_rate": 4.253778387135658e-06,
+ "loss": 0.1019,
+ "step": 25837
+ },
+ {
+ "epoch": 70.40326975476839,
+ "grad_norm": 3.569866418838501,
+ "learning_rate": 4.253056159290212e-06,
+ "loss": 0.0896,
+ "step": 25838
+ },
+ {
+ "epoch": 70.40599455040872,
+ "grad_norm": 3.734497308731079,
+ "learning_rate": 4.2523339762017805e-06,
+ "loss": 0.0434,
+ "step": 25839
+ },
+ {
+ "epoch": 70.40871934604904,
+ "grad_norm": 3.439307689666748,
+ "learning_rate": 4.2516118378759826e-06,
+ "loss": 0.1112,
+ "step": 25840
+ },
+ {
+ "epoch": 70.41144414168937,
+ "grad_norm": 3.146479368209839,
+ "learning_rate": 4.250889744318452e-06,
+ "loss": 0.0579,
+ "step": 25841
+ },
+ {
+ "epoch": 70.4141689373297,
+ "grad_norm": 3.413196086883545,
+ "learning_rate": 4.2501676955348045e-06,
+ "loss": 0.0801,
+ "step": 25842
+ },
+ {
+ "epoch": 70.41689373297002,
+ "grad_norm": 3.2361388206481934,
+ "learning_rate": 4.249445691530668e-06,
+ "loss": 0.0838,
+ "step": 25843
+ },
+ {
+ "epoch": 70.41961852861036,
+ "grad_norm": 3.2097456455230713,
+ "learning_rate": 4.24872373231166e-06,
+ "loss": 0.0547,
+ "step": 25844
+ },
+ {
+ "epoch": 70.42234332425068,
+ "grad_norm": 6.420253276824951,
+ "learning_rate": 4.248001817883408e-06,
+ "loss": 0.0391,
+ "step": 25845
+ },
+ {
+ "epoch": 70.42506811989101,
+ "grad_norm": 3.8383002281188965,
+ "learning_rate": 4.247279948251534e-06,
+ "loss": 0.1797,
+ "step": 25846
+ },
+ {
+ "epoch": 70.42779291553134,
+ "grad_norm": 3.0335421562194824,
+ "learning_rate": 4.246558123421658e-06,
+ "loss": 0.1228,
+ "step": 25847
+ },
+ {
+ "epoch": 70.43051771117166,
+ "grad_norm": 3.270625114440918,
+ "learning_rate": 4.2458363433994e-06,
+ "loss": 0.0631,
+ "step": 25848
+ },
+ {
+ "epoch": 70.433242506812,
+ "grad_norm": 2.877497673034668,
+ "learning_rate": 4.245114608190385e-06,
+ "loss": 0.1059,
+ "step": 25849
+ },
+ {
+ "epoch": 70.43596730245231,
+ "grad_norm": 3.6067934036254883,
+ "learning_rate": 4.244392917800234e-06,
+ "loss": 0.1098,
+ "step": 25850
+ },
+ {
+ "epoch": 70.43869209809264,
+ "grad_norm": 2.9734182357788086,
+ "learning_rate": 4.243671272234564e-06,
+ "loss": 0.0341,
+ "step": 25851
+ },
+ {
+ "epoch": 70.44141689373296,
+ "grad_norm": 2.876863718032837,
+ "learning_rate": 4.242949671498995e-06,
+ "loss": 0.0609,
+ "step": 25852
+ },
+ {
+ "epoch": 70.4441416893733,
+ "grad_norm": 2.675910472869873,
+ "learning_rate": 4.242228115599147e-06,
+ "loss": 0.0461,
+ "step": 25853
+ },
+ {
+ "epoch": 70.44686648501363,
+ "grad_norm": 2.7128145694732666,
+ "learning_rate": 4.2415066045406465e-06,
+ "loss": 0.0781,
+ "step": 25854
+ },
+ {
+ "epoch": 70.44959128065395,
+ "grad_norm": 3.816506862640381,
+ "learning_rate": 4.2407851383291055e-06,
+ "loss": 0.1031,
+ "step": 25855
+ },
+ {
+ "epoch": 70.45231607629428,
+ "grad_norm": 3.5927624702453613,
+ "learning_rate": 4.240063716970145e-06,
+ "loss": 0.1814,
+ "step": 25856
+ },
+ {
+ "epoch": 70.4550408719346,
+ "grad_norm": 2.925413131713867,
+ "learning_rate": 4.23934234046938e-06,
+ "loss": 0.1628,
+ "step": 25857
+ },
+ {
+ "epoch": 70.45776566757493,
+ "grad_norm": 3.3901381492614746,
+ "learning_rate": 4.2386210088324355e-06,
+ "loss": 0.0498,
+ "step": 25858
+ },
+ {
+ "epoch": 70.46049046321527,
+ "grad_norm": 2.0617852210998535,
+ "learning_rate": 4.2378997220649235e-06,
+ "loss": 0.0362,
+ "step": 25859
+ },
+ {
+ "epoch": 70.46321525885558,
+ "grad_norm": 3.5812828540802,
+ "learning_rate": 4.23717848017246e-06,
+ "loss": 0.047,
+ "step": 25860
+ },
+ {
+ "epoch": 70.46594005449592,
+ "grad_norm": 2.932439088821411,
+ "learning_rate": 4.236457283160669e-06,
+ "loss": 0.0564,
+ "step": 25861
+ },
+ {
+ "epoch": 70.46866485013624,
+ "grad_norm": 2.2549376487731934,
+ "learning_rate": 4.235736131035163e-06,
+ "loss": 0.0869,
+ "step": 25862
+ },
+ {
+ "epoch": 70.47138964577657,
+ "grad_norm": 1.828937292098999,
+ "learning_rate": 4.235015023801558e-06,
+ "loss": 0.0252,
+ "step": 25863
+ },
+ {
+ "epoch": 70.47411444141689,
+ "grad_norm": 4.041618347167969,
+ "learning_rate": 4.234293961465467e-06,
+ "loss": 0.0933,
+ "step": 25864
+ },
+ {
+ "epoch": 70.47683923705722,
+ "grad_norm": 2.6297528743743896,
+ "learning_rate": 4.233572944032514e-06,
+ "loss": 0.143,
+ "step": 25865
+ },
+ {
+ "epoch": 70.47956403269755,
+ "grad_norm": 2.1373395919799805,
+ "learning_rate": 4.232851971508308e-06,
+ "loss": 0.0629,
+ "step": 25866
+ },
+ {
+ "epoch": 70.48228882833787,
+ "grad_norm": 3.39882230758667,
+ "learning_rate": 4.232131043898465e-06,
+ "loss": 0.1496,
+ "step": 25867
+ },
+ {
+ "epoch": 70.4850136239782,
+ "grad_norm": 2.437934398651123,
+ "learning_rate": 4.231410161208598e-06,
+ "loss": 0.0359,
+ "step": 25868
+ },
+ {
+ "epoch": 70.48773841961852,
+ "grad_norm": 2.1555838584899902,
+ "learning_rate": 4.230689323444322e-06,
+ "loss": 0.1669,
+ "step": 25869
+ },
+ {
+ "epoch": 70.49046321525886,
+ "grad_norm": 2.7060513496398926,
+ "learning_rate": 4.229968530611255e-06,
+ "loss": 0.1156,
+ "step": 25870
+ },
+ {
+ "epoch": 70.49318801089919,
+ "grad_norm": 2.6989705562591553,
+ "learning_rate": 4.229247782715007e-06,
+ "loss": 0.0523,
+ "step": 25871
+ },
+ {
+ "epoch": 70.49591280653951,
+ "grad_norm": 2.2723169326782227,
+ "learning_rate": 4.228527079761192e-06,
+ "loss": 0.0348,
+ "step": 25872
+ },
+ {
+ "epoch": 70.49863760217984,
+ "grad_norm": 3.039783477783203,
+ "learning_rate": 4.2278064217554194e-06,
+ "loss": 0.0844,
+ "step": 25873
+ },
+ {
+ "epoch": 70.50136239782016,
+ "grad_norm": 2.909681558609009,
+ "learning_rate": 4.2270858087033075e-06,
+ "loss": 0.0731,
+ "step": 25874
+ },
+ {
+ "epoch": 70.50408719346049,
+ "grad_norm": 3.2307498455047607,
+ "learning_rate": 4.226365240610465e-06,
+ "loss": 0.0416,
+ "step": 25875
+ },
+ {
+ "epoch": 70.50681198910081,
+ "grad_norm": 3.36785626411438,
+ "learning_rate": 4.225644717482506e-06,
+ "loss": 0.1876,
+ "step": 25876
+ },
+ {
+ "epoch": 70.50953678474114,
+ "grad_norm": 3.2695765495300293,
+ "learning_rate": 4.224924239325035e-06,
+ "loss": 0.0391,
+ "step": 25877
+ },
+ {
+ "epoch": 70.51226158038148,
+ "grad_norm": 2.80440092086792,
+ "learning_rate": 4.224203806143672e-06,
+ "loss": 0.0435,
+ "step": 25878
+ },
+ {
+ "epoch": 70.5149863760218,
+ "grad_norm": 3.8948888778686523,
+ "learning_rate": 4.223483417944024e-06,
+ "loss": 0.149,
+ "step": 25879
+ },
+ {
+ "epoch": 70.51771117166213,
+ "grad_norm": 1.9615836143493652,
+ "learning_rate": 4.2227630747317e-06,
+ "loss": 0.0629,
+ "step": 25880
+ },
+ {
+ "epoch": 70.52043596730245,
+ "grad_norm": 2.87920880317688,
+ "learning_rate": 4.22204277651231e-06,
+ "loss": 0.0539,
+ "step": 25881
+ },
+ {
+ "epoch": 70.52316076294278,
+ "grad_norm": 2.286112070083618,
+ "learning_rate": 4.221322523291467e-06,
+ "loss": 0.0665,
+ "step": 25882
+ },
+ {
+ "epoch": 70.52588555858311,
+ "grad_norm": 2.731645107269287,
+ "learning_rate": 4.2206023150747785e-06,
+ "loss": 0.1524,
+ "step": 25883
+ },
+ {
+ "epoch": 70.52861035422343,
+ "grad_norm": 3.801405906677246,
+ "learning_rate": 4.21988215186785e-06,
+ "loss": 0.1102,
+ "step": 25884
+ },
+ {
+ "epoch": 70.53133514986376,
+ "grad_norm": 3.687263250350952,
+ "learning_rate": 4.2191620336762965e-06,
+ "loss": 0.1469,
+ "step": 25885
+ },
+ {
+ "epoch": 70.53405994550408,
+ "grad_norm": 2.582698106765747,
+ "learning_rate": 4.218441960505723e-06,
+ "loss": 0.1292,
+ "step": 25886
+ },
+ {
+ "epoch": 70.53678474114442,
+ "grad_norm": 5.0590410232543945,
+ "learning_rate": 4.217721932361734e-06,
+ "loss": 0.0522,
+ "step": 25887
+ },
+ {
+ "epoch": 70.53950953678473,
+ "grad_norm": 2.432004451751709,
+ "learning_rate": 4.217001949249944e-06,
+ "loss": 0.0542,
+ "step": 25888
+ },
+ {
+ "epoch": 70.54223433242507,
+ "grad_norm": 2.6614952087402344,
+ "learning_rate": 4.216282011175953e-06,
+ "loss": 0.1065,
+ "step": 25889
+ },
+ {
+ "epoch": 70.5449591280654,
+ "grad_norm": 3.007277011871338,
+ "learning_rate": 4.2155621181453745e-06,
+ "loss": 0.0856,
+ "step": 25890
+ },
+ {
+ "epoch": 70.54768392370572,
+ "grad_norm": 3.1674139499664307,
+ "learning_rate": 4.214842270163813e-06,
+ "loss": 0.1291,
+ "step": 25891
+ },
+ {
+ "epoch": 70.55040871934605,
+ "grad_norm": 3.7338919639587402,
+ "learning_rate": 4.214122467236873e-06,
+ "loss": 0.151,
+ "step": 25892
+ },
+ {
+ "epoch": 70.55313351498637,
+ "grad_norm": 3.014159679412842,
+ "learning_rate": 4.213402709370158e-06,
+ "loss": 0.1756,
+ "step": 25893
+ },
+ {
+ "epoch": 70.5558583106267,
+ "grad_norm": 2.431577444076538,
+ "learning_rate": 4.21268299656928e-06,
+ "loss": 0.1085,
+ "step": 25894
+ },
+ {
+ "epoch": 70.55858310626704,
+ "grad_norm": 2.7618846893310547,
+ "learning_rate": 4.211963328839841e-06,
+ "loss": 0.0823,
+ "step": 25895
+ },
+ {
+ "epoch": 70.56130790190736,
+ "grad_norm": 4.54824686050415,
+ "learning_rate": 4.2112437061874445e-06,
+ "loss": 0.0673,
+ "step": 25896
+ },
+ {
+ "epoch": 70.56403269754769,
+ "grad_norm": 3.0391998291015625,
+ "learning_rate": 4.210524128617692e-06,
+ "loss": 0.0446,
+ "step": 25897
+ },
+ {
+ "epoch": 70.566757493188,
+ "grad_norm": 2.9395833015441895,
+ "learning_rate": 4.209804596136195e-06,
+ "loss": 0.091,
+ "step": 25898
+ },
+ {
+ "epoch": 70.56948228882834,
+ "grad_norm": 3.116922616958618,
+ "learning_rate": 4.209085108748554e-06,
+ "loss": 0.0931,
+ "step": 25899
+ },
+ {
+ "epoch": 70.57220708446866,
+ "grad_norm": 5.059455394744873,
+ "learning_rate": 4.208365666460371e-06,
+ "loss": 0.0735,
+ "step": 25900
+ },
+ {
+ "epoch": 70.57493188010899,
+ "grad_norm": 2.790809392929077,
+ "learning_rate": 4.207646269277247e-06,
+ "loss": 0.0394,
+ "step": 25901
+ },
+ {
+ "epoch": 70.57765667574932,
+ "grad_norm": 3.0464560985565186,
+ "learning_rate": 4.206926917204791e-06,
+ "loss": 0.0437,
+ "step": 25902
+ },
+ {
+ "epoch": 70.58038147138964,
+ "grad_norm": 2.7532222270965576,
+ "learning_rate": 4.2062076102486016e-06,
+ "loss": 0.1169,
+ "step": 25903
+ },
+ {
+ "epoch": 70.58310626702998,
+ "grad_norm": 2.997598886489868,
+ "learning_rate": 4.2054883484142765e-06,
+ "loss": 0.0469,
+ "step": 25904
+ },
+ {
+ "epoch": 70.5858310626703,
+ "grad_norm": 2.8382644653320312,
+ "learning_rate": 4.204769131707422e-06,
+ "loss": 0.0505,
+ "step": 25905
+ },
+ {
+ "epoch": 70.58855585831063,
+ "grad_norm": 4.03818416595459,
+ "learning_rate": 4.204049960133643e-06,
+ "loss": 0.1391,
+ "step": 25906
+ },
+ {
+ "epoch": 70.59128065395096,
+ "grad_norm": 3.1195859909057617,
+ "learning_rate": 4.203330833698536e-06,
+ "loss": 0.0954,
+ "step": 25907
+ },
+ {
+ "epoch": 70.59400544959128,
+ "grad_norm": 2.6667582988739014,
+ "learning_rate": 4.202611752407703e-06,
+ "loss": 0.0805,
+ "step": 25908
+ },
+ {
+ "epoch": 70.59673024523161,
+ "grad_norm": 3.4228203296661377,
+ "learning_rate": 4.201892716266738e-06,
+ "loss": 0.0639,
+ "step": 25909
+ },
+ {
+ "epoch": 70.59945504087193,
+ "grad_norm": 2.626016855239868,
+ "learning_rate": 4.2011737252812505e-06,
+ "loss": 0.1139,
+ "step": 25910
+ },
+ {
+ "epoch": 70.60217983651226,
+ "grad_norm": 3.4347877502441406,
+ "learning_rate": 4.200454779456834e-06,
+ "loss": 0.0523,
+ "step": 25911
+ },
+ {
+ "epoch": 70.60490463215258,
+ "grad_norm": 3.0663342475891113,
+ "learning_rate": 4.199735878799091e-06,
+ "loss": 0.2209,
+ "step": 25912
+ },
+ {
+ "epoch": 70.60762942779292,
+ "grad_norm": 3.306182384490967,
+ "learning_rate": 4.199017023313613e-06,
+ "loss": 0.0766,
+ "step": 25913
+ },
+ {
+ "epoch": 70.61035422343325,
+ "grad_norm": 4.746140956878662,
+ "learning_rate": 4.198298213006008e-06,
+ "loss": 0.0685,
+ "step": 25914
+ },
+ {
+ "epoch": 70.61307901907357,
+ "grad_norm": 3.576681613922119,
+ "learning_rate": 4.19757944788187e-06,
+ "loss": 0.0785,
+ "step": 25915
+ },
+ {
+ "epoch": 70.6158038147139,
+ "grad_norm": 2.961754083633423,
+ "learning_rate": 4.196860727946796e-06,
+ "loss": 0.0369,
+ "step": 25916
+ },
+ {
+ "epoch": 70.61852861035422,
+ "grad_norm": 2.2688803672790527,
+ "learning_rate": 4.19614205320638e-06,
+ "loss": 0.0481,
+ "step": 25917
+ },
+ {
+ "epoch": 70.62125340599455,
+ "grad_norm": 2.811814785003662,
+ "learning_rate": 4.1954234236662275e-06,
+ "loss": 0.0391,
+ "step": 25918
+ },
+ {
+ "epoch": 70.62397820163488,
+ "grad_norm": 4.069333553314209,
+ "learning_rate": 4.19470483933193e-06,
+ "loss": 0.1037,
+ "step": 25919
+ },
+ {
+ "epoch": 70.6267029972752,
+ "grad_norm": 2.943814992904663,
+ "learning_rate": 4.193986300209084e-06,
+ "loss": 0.0365,
+ "step": 25920
+ },
+ {
+ "epoch": 70.62942779291554,
+ "grad_norm": 6.791131496429443,
+ "learning_rate": 4.193267806303283e-06,
+ "loss": 0.0644,
+ "step": 25921
+ },
+ {
+ "epoch": 70.63215258855585,
+ "grad_norm": 4.604465007781982,
+ "learning_rate": 4.192549357620125e-06,
+ "loss": 0.0799,
+ "step": 25922
+ },
+ {
+ "epoch": 70.63487738419619,
+ "grad_norm": 2.72743821144104,
+ "learning_rate": 4.19183095416521e-06,
+ "loss": 0.0838,
+ "step": 25923
+ },
+ {
+ "epoch": 70.6376021798365,
+ "grad_norm": 2.7363224029541016,
+ "learning_rate": 4.191112595944128e-06,
+ "loss": 0.043,
+ "step": 25924
+ },
+ {
+ "epoch": 70.64032697547684,
+ "grad_norm": 2.6797404289245605,
+ "learning_rate": 4.19039428296247e-06,
+ "loss": 0.0378,
+ "step": 25925
+ },
+ {
+ "epoch": 70.64305177111717,
+ "grad_norm": 2.8015358448028564,
+ "learning_rate": 4.189676015225838e-06,
+ "loss": 0.0956,
+ "step": 25926
+ },
+ {
+ "epoch": 70.64577656675749,
+ "grad_norm": 2.488412380218506,
+ "learning_rate": 4.188957792739824e-06,
+ "loss": 0.074,
+ "step": 25927
+ },
+ {
+ "epoch": 70.64850136239782,
+ "grad_norm": 2.5805211067199707,
+ "learning_rate": 4.188239615510018e-06,
+ "loss": 0.0305,
+ "step": 25928
+ },
+ {
+ "epoch": 70.65122615803814,
+ "grad_norm": 2.696093797683716,
+ "learning_rate": 4.1875214835420116e-06,
+ "loss": 0.0352,
+ "step": 25929
+ },
+ {
+ "epoch": 70.65395095367847,
+ "grad_norm": 3.0278303623199463,
+ "learning_rate": 4.186803396841405e-06,
+ "loss": 0.1216,
+ "step": 25930
+ },
+ {
+ "epoch": 70.65667574931881,
+ "grad_norm": 3.1114132404327393,
+ "learning_rate": 4.186085355413785e-06,
+ "loss": 0.0631,
+ "step": 25931
+ },
+ {
+ "epoch": 70.65940054495913,
+ "grad_norm": 3.6098079681396484,
+ "learning_rate": 4.185367359264746e-06,
+ "loss": 0.0503,
+ "step": 25932
+ },
+ {
+ "epoch": 70.66212534059946,
+ "grad_norm": 3.1527180671691895,
+ "learning_rate": 4.184649408399876e-06,
+ "loss": 0.069,
+ "step": 25933
+ },
+ {
+ "epoch": 70.66485013623978,
+ "grad_norm": 4.23618745803833,
+ "learning_rate": 4.183931502824772e-06,
+ "loss": 0.053,
+ "step": 25934
+ },
+ {
+ "epoch": 70.66757493188011,
+ "grad_norm": 3.9020419120788574,
+ "learning_rate": 4.183213642545022e-06,
+ "loss": 0.0759,
+ "step": 25935
+ },
+ {
+ "epoch": 70.67029972752043,
+ "grad_norm": 2.308504819869995,
+ "learning_rate": 4.182495827566217e-06,
+ "loss": 0.046,
+ "step": 25936
+ },
+ {
+ "epoch": 70.67302452316076,
+ "grad_norm": 1.9191436767578125,
+ "learning_rate": 4.181778057893944e-06,
+ "loss": 0.0359,
+ "step": 25937
+ },
+ {
+ "epoch": 70.6757493188011,
+ "grad_norm": 3.608513832092285,
+ "learning_rate": 4.1810603335337964e-06,
+ "loss": 0.0914,
+ "step": 25938
+ },
+ {
+ "epoch": 70.67847411444141,
+ "grad_norm": 3.003201961517334,
+ "learning_rate": 4.180342654491368e-06,
+ "loss": 0.0913,
+ "step": 25939
+ },
+ {
+ "epoch": 70.68119891008175,
+ "grad_norm": 3.0630545616149902,
+ "learning_rate": 4.179625020772242e-06,
+ "loss": 0.0898,
+ "step": 25940
+ },
+ {
+ "epoch": 70.68392370572207,
+ "grad_norm": 2.7549078464508057,
+ "learning_rate": 4.17890743238201e-06,
+ "loss": 0.1082,
+ "step": 25941
+ },
+ {
+ "epoch": 70.6866485013624,
+ "grad_norm": 3.135922431945801,
+ "learning_rate": 4.178189889326255e-06,
+ "loss": 0.1457,
+ "step": 25942
+ },
+ {
+ "epoch": 70.68937329700273,
+ "grad_norm": 3.149646043777466,
+ "learning_rate": 4.177472391610574e-06,
+ "loss": 0.1164,
+ "step": 25943
+ },
+ {
+ "epoch": 70.69209809264305,
+ "grad_norm": 2.631542444229126,
+ "learning_rate": 4.176754939240552e-06,
+ "loss": 0.0353,
+ "step": 25944
+ },
+ {
+ "epoch": 70.69482288828338,
+ "grad_norm": 3.2081425189971924,
+ "learning_rate": 4.176037532221772e-06,
+ "loss": 0.097,
+ "step": 25945
+ },
+ {
+ "epoch": 70.6975476839237,
+ "grad_norm": 3.6365292072296143,
+ "learning_rate": 4.175320170559823e-06,
+ "loss": 0.041,
+ "step": 25946
+ },
+ {
+ "epoch": 70.70027247956403,
+ "grad_norm": 2.3372373580932617,
+ "learning_rate": 4.174602854260297e-06,
+ "loss": 0.0653,
+ "step": 25947
+ },
+ {
+ "epoch": 70.70299727520435,
+ "grad_norm": 2.405831813812256,
+ "learning_rate": 4.173885583328775e-06,
+ "loss": 0.0461,
+ "step": 25948
+ },
+ {
+ "epoch": 70.70572207084469,
+ "grad_norm": 2.79573392868042,
+ "learning_rate": 4.173168357770842e-06,
+ "loss": 0.0835,
+ "step": 25949
+ },
+ {
+ "epoch": 70.70844686648502,
+ "grad_norm": 2.502190351486206,
+ "learning_rate": 4.172451177592089e-06,
+ "loss": 0.0775,
+ "step": 25950
+ },
+ {
+ "epoch": 70.71117166212534,
+ "grad_norm": 3.4877779483795166,
+ "learning_rate": 4.171734042798099e-06,
+ "loss": 0.075,
+ "step": 25951
+ },
+ {
+ "epoch": 70.71389645776567,
+ "grad_norm": 2.578361749649048,
+ "learning_rate": 4.171016953394457e-06,
+ "loss": 0.0379,
+ "step": 25952
+ },
+ {
+ "epoch": 70.71662125340599,
+ "grad_norm": 2.6028637886047363,
+ "learning_rate": 4.1702999093867435e-06,
+ "loss": 0.0482,
+ "step": 25953
+ },
+ {
+ "epoch": 70.71934604904632,
+ "grad_norm": 3.591414451599121,
+ "learning_rate": 4.169582910780551e-06,
+ "loss": 0.0986,
+ "step": 25954
+ },
+ {
+ "epoch": 70.72207084468666,
+ "grad_norm": 3.5944488048553467,
+ "learning_rate": 4.1688659575814535e-06,
+ "loss": 0.0641,
+ "step": 25955
+ },
+ {
+ "epoch": 70.72479564032697,
+ "grad_norm": 2.303833484649658,
+ "learning_rate": 4.168149049795046e-06,
+ "loss": 0.0593,
+ "step": 25956
+ },
+ {
+ "epoch": 70.7275204359673,
+ "grad_norm": 2.972484827041626,
+ "learning_rate": 4.1674321874269055e-06,
+ "loss": 0.0712,
+ "step": 25957
+ },
+ {
+ "epoch": 70.73024523160763,
+ "grad_norm": 3.417473793029785,
+ "learning_rate": 4.166715370482611e-06,
+ "loss": 0.0587,
+ "step": 25958
+ },
+ {
+ "epoch": 70.73297002724796,
+ "grad_norm": 3.3364315032958984,
+ "learning_rate": 4.165998598967754e-06,
+ "loss": 0.0787,
+ "step": 25959
+ },
+ {
+ "epoch": 70.73569482288828,
+ "grad_norm": 3.5824971199035645,
+ "learning_rate": 4.165281872887912e-06,
+ "loss": 0.0763,
+ "step": 25960
+ },
+ {
+ "epoch": 70.73841961852861,
+ "grad_norm": 2.5481116771698,
+ "learning_rate": 4.164565192248667e-06,
+ "loss": 0.0489,
+ "step": 25961
+ },
+ {
+ "epoch": 70.74114441416894,
+ "grad_norm": 3.1502392292022705,
+ "learning_rate": 4.163848557055596e-06,
+ "loss": 0.1133,
+ "step": 25962
+ },
+ {
+ "epoch": 70.74386920980926,
+ "grad_norm": 2.2232277393341064,
+ "learning_rate": 4.163131967314289e-06,
+ "loss": 0.0336,
+ "step": 25963
+ },
+ {
+ "epoch": 70.7465940054496,
+ "grad_norm": 2.860795259475708,
+ "learning_rate": 4.162415423030321e-06,
+ "loss": 0.0461,
+ "step": 25964
+ },
+ {
+ "epoch": 70.74931880108991,
+ "grad_norm": 2.332071542739868,
+ "learning_rate": 4.161698924209275e-06,
+ "loss": 0.0678,
+ "step": 25965
+ },
+ {
+ "epoch": 70.75204359673025,
+ "grad_norm": 3.48745059967041,
+ "learning_rate": 4.160982470856727e-06,
+ "loss": 0.1695,
+ "step": 25966
+ },
+ {
+ "epoch": 70.75476839237058,
+ "grad_norm": 3.1752967834472656,
+ "learning_rate": 4.160266062978262e-06,
+ "loss": 0.1834,
+ "step": 25967
+ },
+ {
+ "epoch": 70.7574931880109,
+ "grad_norm": 3.0846974849700928,
+ "learning_rate": 4.159549700579459e-06,
+ "loss": 0.0219,
+ "step": 25968
+ },
+ {
+ "epoch": 70.76021798365123,
+ "grad_norm": 3.33652925491333,
+ "learning_rate": 4.158833383665892e-06,
+ "loss": 0.0914,
+ "step": 25969
+ },
+ {
+ "epoch": 70.76294277929155,
+ "grad_norm": 2.3236277103424072,
+ "learning_rate": 4.158117112243141e-06,
+ "loss": 0.0824,
+ "step": 25970
+ },
+ {
+ "epoch": 70.76566757493188,
+ "grad_norm": 4.714158058166504,
+ "learning_rate": 4.157400886316788e-06,
+ "loss": 0.1673,
+ "step": 25971
+ },
+ {
+ "epoch": 70.7683923705722,
+ "grad_norm": 2.822706460952759,
+ "learning_rate": 4.15668470589241e-06,
+ "loss": 0.0381,
+ "step": 25972
+ },
+ {
+ "epoch": 70.77111716621253,
+ "grad_norm": 3.422696113586426,
+ "learning_rate": 4.15596857097558e-06,
+ "loss": 0.0576,
+ "step": 25973
+ },
+ {
+ "epoch": 70.77384196185287,
+ "grad_norm": 2.4212465286254883,
+ "learning_rate": 4.155252481571878e-06,
+ "loss": 0.0307,
+ "step": 25974
+ },
+ {
+ "epoch": 70.77656675749319,
+ "grad_norm": 2.283277988433838,
+ "learning_rate": 4.154536437686886e-06,
+ "loss": 0.0396,
+ "step": 25975
+ },
+ {
+ "epoch": 70.77929155313352,
+ "grad_norm": 2.959416151046753,
+ "learning_rate": 4.153820439326175e-06,
+ "loss": 0.0521,
+ "step": 25976
+ },
+ {
+ "epoch": 70.78201634877384,
+ "grad_norm": 2.2339015007019043,
+ "learning_rate": 4.153104486495323e-06,
+ "loss": 0.0343,
+ "step": 25977
+ },
+ {
+ "epoch": 70.78474114441417,
+ "grad_norm": 2.94073748588562,
+ "learning_rate": 4.152388579199901e-06,
+ "loss": 0.0439,
+ "step": 25978
+ },
+ {
+ "epoch": 70.7874659400545,
+ "grad_norm": 3.225032329559326,
+ "learning_rate": 4.151672717445493e-06,
+ "loss": 0.1102,
+ "step": 25979
+ },
+ {
+ "epoch": 70.79019073569482,
+ "grad_norm": 3.0006580352783203,
+ "learning_rate": 4.150956901237668e-06,
+ "loss": 0.1253,
+ "step": 25980
+ },
+ {
+ "epoch": 70.79291553133515,
+ "grad_norm": 3.542045831680298,
+ "learning_rate": 4.1502411305820035e-06,
+ "loss": 0.0784,
+ "step": 25981
+ },
+ {
+ "epoch": 70.79564032697547,
+ "grad_norm": 3.6604087352752686,
+ "learning_rate": 4.1495254054840696e-06,
+ "loss": 0.2117,
+ "step": 25982
+ },
+ {
+ "epoch": 70.7983651226158,
+ "grad_norm": 2.596848249435425,
+ "learning_rate": 4.1488097259494464e-06,
+ "loss": 0.0434,
+ "step": 25983
+ },
+ {
+ "epoch": 70.80108991825612,
+ "grad_norm": 2.6084728240966797,
+ "learning_rate": 4.148094091983705e-06,
+ "loss": 0.1646,
+ "step": 25984
+ },
+ {
+ "epoch": 70.80381471389646,
+ "grad_norm": 3.3621985912323,
+ "learning_rate": 4.147378503592418e-06,
+ "loss": 0.1964,
+ "step": 25985
+ },
+ {
+ "epoch": 70.80653950953679,
+ "grad_norm": 3.769082546234131,
+ "learning_rate": 4.146662960781156e-06,
+ "loss": 0.0913,
+ "step": 25986
+ },
+ {
+ "epoch": 70.80926430517711,
+ "grad_norm": 2.646458864212036,
+ "learning_rate": 4.145947463555499e-06,
+ "loss": 0.0423,
+ "step": 25987
+ },
+ {
+ "epoch": 70.81198910081744,
+ "grad_norm": 4.7483391761779785,
+ "learning_rate": 4.1452320119210136e-06,
+ "loss": 0.0302,
+ "step": 25988
+ },
+ {
+ "epoch": 70.81471389645776,
+ "grad_norm": 3.348487138748169,
+ "learning_rate": 4.144516605883272e-06,
+ "loss": 0.0766,
+ "step": 25989
+ },
+ {
+ "epoch": 70.8174386920981,
+ "grad_norm": 3.6103594303131104,
+ "learning_rate": 4.14380124544784e-06,
+ "loss": 0.1516,
+ "step": 25990
+ },
+ {
+ "epoch": 70.82016348773843,
+ "grad_norm": 3.0230557918548584,
+ "learning_rate": 4.143085930620303e-06,
+ "loss": 0.1126,
+ "step": 25991
+ },
+ {
+ "epoch": 70.82288828337875,
+ "grad_norm": 5.467724800109863,
+ "learning_rate": 4.142370661406224e-06,
+ "loss": 0.0657,
+ "step": 25992
+ },
+ {
+ "epoch": 70.82561307901908,
+ "grad_norm": 3.4226467609405518,
+ "learning_rate": 4.141655437811174e-06,
+ "loss": 0.1201,
+ "step": 25993
+ },
+ {
+ "epoch": 70.8283378746594,
+ "grad_norm": 3.245389223098755,
+ "learning_rate": 4.140940259840719e-06,
+ "loss": 0.1575,
+ "step": 25994
+ },
+ {
+ "epoch": 70.83106267029973,
+ "grad_norm": 2.476825475692749,
+ "learning_rate": 4.140225127500437e-06,
+ "loss": 0.0518,
+ "step": 25995
+ },
+ {
+ "epoch": 70.83378746594005,
+ "grad_norm": 3.047578811645508,
+ "learning_rate": 4.139510040795892e-06,
+ "loss": 0.0637,
+ "step": 25996
+ },
+ {
+ "epoch": 70.83651226158038,
+ "grad_norm": 2.880866765975952,
+ "learning_rate": 4.138794999732655e-06,
+ "loss": 0.0289,
+ "step": 25997
+ },
+ {
+ "epoch": 70.83923705722071,
+ "grad_norm": 3.4764673709869385,
+ "learning_rate": 4.138080004316289e-06,
+ "loss": 0.079,
+ "step": 25998
+ },
+ {
+ "epoch": 70.84196185286103,
+ "grad_norm": 3.865513324737549,
+ "learning_rate": 4.137365054552372e-06,
+ "loss": 0.1019,
+ "step": 25999
+ },
+ {
+ "epoch": 70.84468664850137,
+ "grad_norm": 2.4694693088531494,
+ "learning_rate": 4.136650150446468e-06,
+ "loss": 0.0377,
+ "step": 26000
+ },
+ {
+ "epoch": 70.84741144414168,
+ "grad_norm": 3.7884268760681152,
+ "learning_rate": 4.135935292004143e-06,
+ "loss": 0.1641,
+ "step": 26001
+ },
+ {
+ "epoch": 70.85013623978202,
+ "grad_norm": 2.340000629425049,
+ "learning_rate": 4.135220479230961e-06,
+ "loss": 0.076,
+ "step": 26002
+ },
+ {
+ "epoch": 70.85286103542235,
+ "grad_norm": 2.3376033306121826,
+ "learning_rate": 4.134505712132498e-06,
+ "loss": 0.0408,
+ "step": 26003
+ },
+ {
+ "epoch": 70.85558583106267,
+ "grad_norm": 2.3368735313415527,
+ "learning_rate": 4.133790990714316e-06,
+ "loss": 0.0497,
+ "step": 26004
+ },
+ {
+ "epoch": 70.858310626703,
+ "grad_norm": 3.3468737602233887,
+ "learning_rate": 4.133076314981979e-06,
+ "loss": 0.1053,
+ "step": 26005
+ },
+ {
+ "epoch": 70.86103542234332,
+ "grad_norm": 2.214991569519043,
+ "learning_rate": 4.132361684941053e-06,
+ "loss": 0.0491,
+ "step": 26006
+ },
+ {
+ "epoch": 70.86376021798365,
+ "grad_norm": 2.790736675262451,
+ "learning_rate": 4.131647100597105e-06,
+ "loss": 0.0403,
+ "step": 26007
+ },
+ {
+ "epoch": 70.86648501362397,
+ "grad_norm": 3.3679144382476807,
+ "learning_rate": 4.130932561955704e-06,
+ "loss": 0.158,
+ "step": 26008
+ },
+ {
+ "epoch": 70.8692098092643,
+ "grad_norm": 2.829746723175049,
+ "learning_rate": 4.13021806902241e-06,
+ "loss": 0.0355,
+ "step": 26009
+ },
+ {
+ "epoch": 70.87193460490464,
+ "grad_norm": 3.5523321628570557,
+ "learning_rate": 4.12950362180279e-06,
+ "loss": 0.0962,
+ "step": 26010
+ },
+ {
+ "epoch": 70.87465940054496,
+ "grad_norm": 2.690026044845581,
+ "learning_rate": 4.128789220302404e-06,
+ "loss": 0.0773,
+ "step": 26011
+ },
+ {
+ "epoch": 70.87738419618529,
+ "grad_norm": 2.1563637256622314,
+ "learning_rate": 4.128074864526821e-06,
+ "loss": 0.0261,
+ "step": 26012
+ },
+ {
+ "epoch": 70.88010899182561,
+ "grad_norm": 3.8262779712677,
+ "learning_rate": 4.127360554481602e-06,
+ "loss": 0.1447,
+ "step": 26013
+ },
+ {
+ "epoch": 70.88283378746594,
+ "grad_norm": 2.838820695877075,
+ "learning_rate": 4.126646290172307e-06,
+ "loss": 0.0839,
+ "step": 26014
+ },
+ {
+ "epoch": 70.88555858310627,
+ "grad_norm": 2.9895541667938232,
+ "learning_rate": 4.125932071604505e-06,
+ "loss": 0.0793,
+ "step": 26015
+ },
+ {
+ "epoch": 70.88828337874659,
+ "grad_norm": 5.860555171966553,
+ "learning_rate": 4.125217898783756e-06,
+ "loss": 0.0819,
+ "step": 26016
+ },
+ {
+ "epoch": 70.89100817438693,
+ "grad_norm": 3.254020929336548,
+ "learning_rate": 4.124503771715619e-06,
+ "loss": 0.0414,
+ "step": 26017
+ },
+ {
+ "epoch": 70.89373297002724,
+ "grad_norm": 3.3897457122802734,
+ "learning_rate": 4.123789690405655e-06,
+ "loss": 0.0878,
+ "step": 26018
+ },
+ {
+ "epoch": 70.89645776566758,
+ "grad_norm": 4.130880832672119,
+ "learning_rate": 4.1230756548594305e-06,
+ "loss": 0.0962,
+ "step": 26019
+ },
+ {
+ "epoch": 70.8991825613079,
+ "grad_norm": 2.7152228355407715,
+ "learning_rate": 4.122361665082505e-06,
+ "loss": 0.0319,
+ "step": 26020
+ },
+ {
+ "epoch": 70.90190735694823,
+ "grad_norm": 2.5247933864593506,
+ "learning_rate": 4.121647721080436e-06,
+ "loss": 0.0282,
+ "step": 26021
+ },
+ {
+ "epoch": 70.90463215258856,
+ "grad_norm": 3.517009973526001,
+ "learning_rate": 4.120933822858784e-06,
+ "loss": 0.127,
+ "step": 26022
+ },
+ {
+ "epoch": 70.90735694822888,
+ "grad_norm": 2.396376132965088,
+ "learning_rate": 4.120219970423112e-06,
+ "loss": 0.205,
+ "step": 26023
+ },
+ {
+ "epoch": 70.91008174386921,
+ "grad_norm": 3.3002827167510986,
+ "learning_rate": 4.119506163778974e-06,
+ "loss": 0.0691,
+ "step": 26024
+ },
+ {
+ "epoch": 70.91280653950953,
+ "grad_norm": 3.1291379928588867,
+ "learning_rate": 4.1187924029319374e-06,
+ "loss": 0.0411,
+ "step": 26025
+ },
+ {
+ "epoch": 70.91553133514986,
+ "grad_norm": 5.469636917114258,
+ "learning_rate": 4.118078687887556e-06,
+ "loss": 0.055,
+ "step": 26026
+ },
+ {
+ "epoch": 70.9182561307902,
+ "grad_norm": 2.640181064605713,
+ "learning_rate": 4.117365018651385e-06,
+ "loss": 0.0946,
+ "step": 26027
+ },
+ {
+ "epoch": 70.92098092643052,
+ "grad_norm": 3.6619114875793457,
+ "learning_rate": 4.1166513952289885e-06,
+ "loss": 0.0475,
+ "step": 26028
+ },
+ {
+ "epoch": 70.92370572207085,
+ "grad_norm": 3.9255616664886475,
+ "learning_rate": 4.115937817625923e-06,
+ "loss": 0.1015,
+ "step": 26029
+ },
+ {
+ "epoch": 70.92643051771117,
+ "grad_norm": 2.6056079864501953,
+ "learning_rate": 4.1152242858477435e-06,
+ "loss": 0.2065,
+ "step": 26030
+ },
+ {
+ "epoch": 70.9291553133515,
+ "grad_norm": 3.3639891147613525,
+ "learning_rate": 4.114510799900003e-06,
+ "loss": 0.0343,
+ "step": 26031
+ },
+ {
+ "epoch": 70.93188010899182,
+ "grad_norm": 3.2747297286987305,
+ "learning_rate": 4.113797359788269e-06,
+ "loss": 0.055,
+ "step": 26032
+ },
+ {
+ "epoch": 70.93460490463215,
+ "grad_norm": 2.6767966747283936,
+ "learning_rate": 4.11308396551809e-06,
+ "loss": 0.0361,
+ "step": 26033
+ },
+ {
+ "epoch": 70.93732970027249,
+ "grad_norm": 3.1328749656677246,
+ "learning_rate": 4.11237061709502e-06,
+ "loss": 0.0398,
+ "step": 26034
+ },
+ {
+ "epoch": 70.9400544959128,
+ "grad_norm": 3.5282037258148193,
+ "learning_rate": 4.111657314524623e-06,
+ "loss": 0.069,
+ "step": 26035
+ },
+ {
+ "epoch": 70.94277929155314,
+ "grad_norm": 2.897711992263794,
+ "learning_rate": 4.110944057812449e-06,
+ "loss": 0.0635,
+ "step": 26036
+ },
+ {
+ "epoch": 70.94550408719346,
+ "grad_norm": 2.598701238632202,
+ "learning_rate": 4.110230846964053e-06,
+ "loss": 0.082,
+ "step": 26037
+ },
+ {
+ "epoch": 70.94822888283379,
+ "grad_norm": 3.073129653930664,
+ "learning_rate": 4.109517681984986e-06,
+ "loss": 0.0628,
+ "step": 26038
+ },
+ {
+ "epoch": 70.95095367847412,
+ "grad_norm": 2.4614381790161133,
+ "learning_rate": 4.108804562880809e-06,
+ "loss": 0.0339,
+ "step": 26039
+ },
+ {
+ "epoch": 70.95367847411444,
+ "grad_norm": 4.100926876068115,
+ "learning_rate": 4.108091489657072e-06,
+ "loss": 0.1,
+ "step": 26040
+ },
+ {
+ "epoch": 70.95640326975477,
+ "grad_norm": 5.091050624847412,
+ "learning_rate": 4.107378462319327e-06,
+ "loss": 0.1347,
+ "step": 26041
+ },
+ {
+ "epoch": 70.95912806539509,
+ "grad_norm": 12.523394584655762,
+ "learning_rate": 4.106665480873131e-06,
+ "loss": 0.0619,
+ "step": 26042
+ },
+ {
+ "epoch": 70.96185286103542,
+ "grad_norm": 4.1175103187561035,
+ "learning_rate": 4.105952545324031e-06,
+ "loss": 0.1031,
+ "step": 26043
+ },
+ {
+ "epoch": 70.96457765667574,
+ "grad_norm": 3.6107232570648193,
+ "learning_rate": 4.105239655677586e-06,
+ "loss": 0.1041,
+ "step": 26044
+ },
+ {
+ "epoch": 70.96730245231608,
+ "grad_norm": 3.0365426540374756,
+ "learning_rate": 4.104526811939347e-06,
+ "loss": 0.0681,
+ "step": 26045
+ },
+ {
+ "epoch": 70.97002724795641,
+ "grad_norm": 2.794994592666626,
+ "learning_rate": 4.103814014114862e-06,
+ "loss": 0.0465,
+ "step": 26046
+ },
+ {
+ "epoch": 70.97275204359673,
+ "grad_norm": 5.480357646942139,
+ "learning_rate": 4.10310126220968e-06,
+ "loss": 0.1777,
+ "step": 26047
+ },
+ {
+ "epoch": 70.97547683923706,
+ "grad_norm": 4.1183061599731445,
+ "learning_rate": 4.102388556229358e-06,
+ "loss": 0.1387,
+ "step": 26048
+ },
+ {
+ "epoch": 70.97820163487738,
+ "grad_norm": 2.9127626419067383,
+ "learning_rate": 4.101675896179446e-06,
+ "loss": 0.0362,
+ "step": 26049
+ },
+ {
+ "epoch": 70.98092643051771,
+ "grad_norm": 3.8233654499053955,
+ "learning_rate": 4.100963282065492e-06,
+ "loss": 0.25,
+ "step": 26050
+ },
+ {
+ "epoch": 70.98365122615803,
+ "grad_norm": 2.501060724258423,
+ "learning_rate": 4.100250713893043e-06,
+ "loss": 0.0319,
+ "step": 26051
+ },
+ {
+ "epoch": 70.98637602179836,
+ "grad_norm": 4.0335516929626465,
+ "learning_rate": 4.099538191667654e-06,
+ "loss": 0.0705,
+ "step": 26052
+ },
+ {
+ "epoch": 70.9891008174387,
+ "grad_norm": 2.2477872371673584,
+ "learning_rate": 4.098825715394872e-06,
+ "loss": 0.0394,
+ "step": 26053
+ },
+ {
+ "epoch": 70.99182561307902,
+ "grad_norm": 2.850425958633423,
+ "learning_rate": 4.098113285080245e-06,
+ "loss": 0.0631,
+ "step": 26054
+ },
+ {
+ "epoch": 70.99455040871935,
+ "grad_norm": 3.4741532802581787,
+ "learning_rate": 4.097400900729319e-06,
+ "loss": 0.2365,
+ "step": 26055
+ },
+ {
+ "epoch": 70.99727520435967,
+ "grad_norm": 3.390138864517212,
+ "learning_rate": 4.0966885623476485e-06,
+ "loss": 0.0896,
+ "step": 26056
+ },
+ {
+ "epoch": 71.0,
+ "grad_norm": 7.1555657386779785,
+ "learning_rate": 4.095976269940777e-06,
+ "loss": 0.1655,
+ "step": 26057
+ },
+ {
+ "epoch": 71.00272479564033,
+ "grad_norm": 2.8527214527130127,
+ "learning_rate": 4.095264023514248e-06,
+ "loss": 0.0885,
+ "step": 26058
+ },
+ {
+ "epoch": 71.00544959128065,
+ "grad_norm": 3.099708318710327,
+ "learning_rate": 4.094551823073614e-06,
+ "loss": 0.1058,
+ "step": 26059
+ },
+ {
+ "epoch": 71.00817438692098,
+ "grad_norm": 1.9717785120010376,
+ "learning_rate": 4.093839668624423e-06,
+ "loss": 0.0329,
+ "step": 26060
+ },
+ {
+ "epoch": 71.0108991825613,
+ "grad_norm": 2.0244579315185547,
+ "learning_rate": 4.0931275601722194e-06,
+ "loss": 0.0348,
+ "step": 26061
+ },
+ {
+ "epoch": 71.01362397820164,
+ "grad_norm": 2.797454595565796,
+ "learning_rate": 4.092415497722547e-06,
+ "loss": 0.0442,
+ "step": 26062
+ },
+ {
+ "epoch": 71.01634877384195,
+ "grad_norm": 3.133096694946289,
+ "learning_rate": 4.091703481280951e-06,
+ "loss": 0.0616,
+ "step": 26063
+ },
+ {
+ "epoch": 71.01907356948229,
+ "grad_norm": 3.9310803413391113,
+ "learning_rate": 4.090991510852979e-06,
+ "loss": 0.1391,
+ "step": 26064
+ },
+ {
+ "epoch": 71.02179836512262,
+ "grad_norm": 4.202494144439697,
+ "learning_rate": 4.090279586444177e-06,
+ "loss": 0.0672,
+ "step": 26065
+ },
+ {
+ "epoch": 71.02452316076294,
+ "grad_norm": 4.340561389923096,
+ "learning_rate": 4.089567708060087e-06,
+ "loss": 0.0555,
+ "step": 26066
+ },
+ {
+ "epoch": 71.02724795640327,
+ "grad_norm": 3.2145681381225586,
+ "learning_rate": 4.08885587570625e-06,
+ "loss": 0.0755,
+ "step": 26067
+ },
+ {
+ "epoch": 71.02997275204359,
+ "grad_norm": 2.5824227333068848,
+ "learning_rate": 4.088144089388216e-06,
+ "loss": 0.1028,
+ "step": 26068
+ },
+ {
+ "epoch": 71.03269754768392,
+ "grad_norm": 3.8116767406463623,
+ "learning_rate": 4.087432349111527e-06,
+ "loss": 0.0409,
+ "step": 26069
+ },
+ {
+ "epoch": 71.03542234332426,
+ "grad_norm": 2.5581002235412598,
+ "learning_rate": 4.086720654881723e-06,
+ "loss": 0.0396,
+ "step": 26070
+ },
+ {
+ "epoch": 71.03814713896458,
+ "grad_norm": 2.855933427810669,
+ "learning_rate": 4.086009006704345e-06,
+ "loss": 0.0517,
+ "step": 26071
+ },
+ {
+ "epoch": 71.04087193460491,
+ "grad_norm": 2.431560516357422,
+ "learning_rate": 4.085297404584942e-06,
+ "loss": 0.0293,
+ "step": 26072
+ },
+ {
+ "epoch": 71.04359673024523,
+ "grad_norm": 2.369784355163574,
+ "learning_rate": 4.0845858485290535e-06,
+ "loss": 0.0846,
+ "step": 26073
+ },
+ {
+ "epoch": 71.04632152588556,
+ "grad_norm": 2.523799419403076,
+ "learning_rate": 4.0838743385422195e-06,
+ "loss": 0.039,
+ "step": 26074
+ },
+ {
+ "epoch": 71.04904632152588,
+ "grad_norm": 2.0205631256103516,
+ "learning_rate": 4.083162874629978e-06,
+ "loss": 0.0347,
+ "step": 26075
+ },
+ {
+ "epoch": 71.05177111716621,
+ "grad_norm": 2.60185170173645,
+ "learning_rate": 4.082451456797873e-06,
+ "loss": 0.0305,
+ "step": 26076
+ },
+ {
+ "epoch": 71.05449591280654,
+ "grad_norm": 3.9647903442382812,
+ "learning_rate": 4.08174008505145e-06,
+ "loss": 0.1401,
+ "step": 26077
+ },
+ {
+ "epoch": 71.05722070844686,
+ "grad_norm": 4.09466028213501,
+ "learning_rate": 4.081028759396245e-06,
+ "loss": 0.0725,
+ "step": 26078
+ },
+ {
+ "epoch": 71.0599455040872,
+ "grad_norm": 3.022454261779785,
+ "learning_rate": 4.080317479837793e-06,
+ "loss": 0.0576,
+ "step": 26079
+ },
+ {
+ "epoch": 71.06267029972751,
+ "grad_norm": 4.466739654541016,
+ "learning_rate": 4.079606246381642e-06,
+ "loss": 0.0723,
+ "step": 26080
+ },
+ {
+ "epoch": 71.06539509536785,
+ "grad_norm": 3.1590499877929688,
+ "learning_rate": 4.0788950590333265e-06,
+ "loss": 0.0515,
+ "step": 26081
+ },
+ {
+ "epoch": 71.06811989100818,
+ "grad_norm": 2.5963423252105713,
+ "learning_rate": 4.078183917798386e-06,
+ "loss": 0.0456,
+ "step": 26082
+ },
+ {
+ "epoch": 71.0708446866485,
+ "grad_norm": 3.6453804969787598,
+ "learning_rate": 4.0774728226823556e-06,
+ "loss": 0.0561,
+ "step": 26083
+ },
+ {
+ "epoch": 71.07356948228883,
+ "grad_norm": 3.618593215942383,
+ "learning_rate": 4.07676177369078e-06,
+ "loss": 0.083,
+ "step": 26084
+ },
+ {
+ "epoch": 71.07629427792915,
+ "grad_norm": 2.215276002883911,
+ "learning_rate": 4.076050770829192e-06,
+ "loss": 0.0389,
+ "step": 26085
+ },
+ {
+ "epoch": 71.07901907356948,
+ "grad_norm": 3.5353288650512695,
+ "learning_rate": 4.075339814103131e-06,
+ "loss": 0.0706,
+ "step": 26086
+ },
+ {
+ "epoch": 71.0817438692098,
+ "grad_norm": 2.7013566493988037,
+ "learning_rate": 4.074628903518129e-06,
+ "loss": 0.0413,
+ "step": 26087
+ },
+ {
+ "epoch": 71.08446866485014,
+ "grad_norm": 2.762425422668457,
+ "learning_rate": 4.073918039079729e-06,
+ "loss": 0.0934,
+ "step": 26088
+ },
+ {
+ "epoch": 71.08719346049047,
+ "grad_norm": 3.5204782485961914,
+ "learning_rate": 4.073207220793465e-06,
+ "loss": 0.0751,
+ "step": 26089
+ },
+ {
+ "epoch": 71.08991825613079,
+ "grad_norm": 3.8314247131347656,
+ "learning_rate": 4.072496448664872e-06,
+ "loss": 0.1176,
+ "step": 26090
+ },
+ {
+ "epoch": 71.09264305177112,
+ "grad_norm": 1.8714334964752197,
+ "learning_rate": 4.071785722699484e-06,
+ "loss": 0.0521,
+ "step": 26091
+ },
+ {
+ "epoch": 71.09536784741144,
+ "grad_norm": 3.3808674812316895,
+ "learning_rate": 4.07107504290284e-06,
+ "loss": 0.0588,
+ "step": 26092
+ },
+ {
+ "epoch": 71.09809264305177,
+ "grad_norm": 2.3348703384399414,
+ "learning_rate": 4.0703644092804695e-06,
+ "loss": 0.1567,
+ "step": 26093
+ },
+ {
+ "epoch": 71.1008174386921,
+ "grad_norm": 2.7863707542419434,
+ "learning_rate": 4.069653821837913e-06,
+ "loss": 0.0605,
+ "step": 26094
+ },
+ {
+ "epoch": 71.10354223433242,
+ "grad_norm": 3.885864019393921,
+ "learning_rate": 4.068943280580704e-06,
+ "loss": 0.1171,
+ "step": 26095
+ },
+ {
+ "epoch": 71.10626702997276,
+ "grad_norm": 3.8391263484954834,
+ "learning_rate": 4.068232785514368e-06,
+ "loss": 0.0768,
+ "step": 26096
+ },
+ {
+ "epoch": 71.10899182561307,
+ "grad_norm": 6.129915237426758,
+ "learning_rate": 4.067522336644448e-06,
+ "loss": 0.0483,
+ "step": 26097
+ },
+ {
+ "epoch": 71.11171662125341,
+ "grad_norm": 4.418376445770264,
+ "learning_rate": 4.0668119339764746e-06,
+ "loss": 0.0855,
+ "step": 26098
+ },
+ {
+ "epoch": 71.11444141689373,
+ "grad_norm": 2.6548573970794678,
+ "learning_rate": 4.066101577515974e-06,
+ "loss": 0.0302,
+ "step": 26099
+ },
+ {
+ "epoch": 71.11716621253406,
+ "grad_norm": 3.826864004135132,
+ "learning_rate": 4.065391267268487e-06,
+ "loss": 0.087,
+ "step": 26100
+ },
+ {
+ "epoch": 71.11989100817439,
+ "grad_norm": 2.5251123905181885,
+ "learning_rate": 4.064681003239543e-06,
+ "loss": 0.1032,
+ "step": 26101
+ },
+ {
+ "epoch": 71.12261580381471,
+ "grad_norm": 2.869708776473999,
+ "learning_rate": 4.063970785434671e-06,
+ "loss": 0.1286,
+ "step": 26102
+ },
+ {
+ "epoch": 71.12534059945504,
+ "grad_norm": 3.617197275161743,
+ "learning_rate": 4.0632606138594e-06,
+ "loss": 0.0651,
+ "step": 26103
+ },
+ {
+ "epoch": 71.12806539509536,
+ "grad_norm": 1.9999364614486694,
+ "learning_rate": 4.062550488519268e-06,
+ "loss": 0.0355,
+ "step": 26104
+ },
+ {
+ "epoch": 71.1307901907357,
+ "grad_norm": 3.306886672973633,
+ "learning_rate": 4.0618404094198016e-06,
+ "loss": 0.0713,
+ "step": 26105
+ },
+ {
+ "epoch": 71.13351498637603,
+ "grad_norm": 3.030975103378296,
+ "learning_rate": 4.061130376566531e-06,
+ "loss": 0.0258,
+ "step": 26106
+ },
+ {
+ "epoch": 71.13623978201635,
+ "grad_norm": 2.435028076171875,
+ "learning_rate": 4.060420389964983e-06,
+ "loss": 0.04,
+ "step": 26107
+ },
+ {
+ "epoch": 71.13896457765668,
+ "grad_norm": 2.20660400390625,
+ "learning_rate": 4.059710449620693e-06,
+ "loss": 0.1839,
+ "step": 26108
+ },
+ {
+ "epoch": 71.141689373297,
+ "grad_norm": 4.439379692077637,
+ "learning_rate": 4.0590005555391865e-06,
+ "loss": 0.1027,
+ "step": 26109
+ },
+ {
+ "epoch": 71.14441416893733,
+ "grad_norm": 3.1821601390838623,
+ "learning_rate": 4.0582907077259894e-06,
+ "loss": 0.1882,
+ "step": 26110
+ },
+ {
+ "epoch": 71.14713896457765,
+ "grad_norm": 3.6115283966064453,
+ "learning_rate": 4.057580906186637e-06,
+ "loss": 0.0664,
+ "step": 26111
+ },
+ {
+ "epoch": 71.14986376021798,
+ "grad_norm": 3.003767728805542,
+ "learning_rate": 4.056871150926649e-06,
+ "loss": 0.0875,
+ "step": 26112
+ },
+ {
+ "epoch": 71.15258855585832,
+ "grad_norm": 3.3359696865081787,
+ "learning_rate": 4.056161441951561e-06,
+ "loss": 0.0916,
+ "step": 26113
+ },
+ {
+ "epoch": 71.15531335149863,
+ "grad_norm": 2.4242122173309326,
+ "learning_rate": 4.055451779266896e-06,
+ "loss": 0.105,
+ "step": 26114
+ },
+ {
+ "epoch": 71.15803814713897,
+ "grad_norm": 2.911146402359009,
+ "learning_rate": 4.0547421628781815e-06,
+ "loss": 0.0528,
+ "step": 26115
+ },
+ {
+ "epoch": 71.16076294277929,
+ "grad_norm": 3.8165996074676514,
+ "learning_rate": 4.05403259279094e-06,
+ "loss": 0.1203,
+ "step": 26116
+ },
+ {
+ "epoch": 71.16348773841962,
+ "grad_norm": 2.963271379470825,
+ "learning_rate": 4.053323069010704e-06,
+ "loss": 0.0522,
+ "step": 26117
+ },
+ {
+ "epoch": 71.16621253405995,
+ "grad_norm": 2.903336763381958,
+ "learning_rate": 4.052613591542998e-06,
+ "loss": 0.0382,
+ "step": 26118
+ },
+ {
+ "epoch": 71.16893732970027,
+ "grad_norm": 2.796835422515869,
+ "learning_rate": 4.051904160393345e-06,
+ "loss": 0.128,
+ "step": 26119
+ },
+ {
+ "epoch": 71.1716621253406,
+ "grad_norm": 2.7993125915527344,
+ "learning_rate": 4.051194775567268e-06,
+ "loss": 0.0348,
+ "step": 26120
+ },
+ {
+ "epoch": 71.17438692098092,
+ "grad_norm": 3.7094621658325195,
+ "learning_rate": 4.050485437070297e-06,
+ "loss": 0.0987,
+ "step": 26121
+ },
+ {
+ "epoch": 71.17711171662125,
+ "grad_norm": 2.9672060012817383,
+ "learning_rate": 4.049776144907955e-06,
+ "loss": 0.0529,
+ "step": 26122
+ },
+ {
+ "epoch": 71.17983651226157,
+ "grad_norm": 2.5991804599761963,
+ "learning_rate": 4.0490668990857615e-06,
+ "loss": 0.0952,
+ "step": 26123
+ },
+ {
+ "epoch": 71.1825613079019,
+ "grad_norm": 3.1416094303131104,
+ "learning_rate": 4.048357699609246e-06,
+ "loss": 0.1398,
+ "step": 26124
+ },
+ {
+ "epoch": 71.18528610354224,
+ "grad_norm": 2.1139564514160156,
+ "learning_rate": 4.047648546483931e-06,
+ "loss": 0.0409,
+ "step": 26125
+ },
+ {
+ "epoch": 71.18801089918256,
+ "grad_norm": 2.8843088150024414,
+ "learning_rate": 4.046939439715336e-06,
+ "loss": 0.0394,
+ "step": 26126
+ },
+ {
+ "epoch": 71.19073569482289,
+ "grad_norm": 3.3568787574768066,
+ "learning_rate": 4.046230379308982e-06,
+ "loss": 0.1828,
+ "step": 26127
+ },
+ {
+ "epoch": 71.19346049046321,
+ "grad_norm": 2.49369215965271,
+ "learning_rate": 4.045521365270394e-06,
+ "loss": 0.1426,
+ "step": 26128
+ },
+ {
+ "epoch": 71.19618528610354,
+ "grad_norm": 2.4332704544067383,
+ "learning_rate": 4.044812397605098e-06,
+ "loss": 0.0322,
+ "step": 26129
+ },
+ {
+ "epoch": 71.19891008174388,
+ "grad_norm": 4.03870153427124,
+ "learning_rate": 4.044103476318612e-06,
+ "loss": 0.0394,
+ "step": 26130
+ },
+ {
+ "epoch": 71.2016348773842,
+ "grad_norm": 2.979018211364746,
+ "learning_rate": 4.043394601416455e-06,
+ "loss": 0.0368,
+ "step": 26131
+ },
+ {
+ "epoch": 71.20435967302453,
+ "grad_norm": 2.245609760284424,
+ "learning_rate": 4.042685772904146e-06,
+ "loss": 0.0373,
+ "step": 26132
+ },
+ {
+ "epoch": 71.20708446866485,
+ "grad_norm": 3.806074857711792,
+ "learning_rate": 4.041976990787212e-06,
+ "loss": 0.0623,
+ "step": 26133
+ },
+ {
+ "epoch": 71.20980926430518,
+ "grad_norm": 2.555792808532715,
+ "learning_rate": 4.041268255071169e-06,
+ "loss": 0.1072,
+ "step": 26134
+ },
+ {
+ "epoch": 71.2125340599455,
+ "grad_norm": 3.141249179840088,
+ "learning_rate": 4.040559565761537e-06,
+ "loss": 0.0808,
+ "step": 26135
+ },
+ {
+ "epoch": 71.21525885558583,
+ "grad_norm": 3.3116321563720703,
+ "learning_rate": 4.039850922863833e-06,
+ "loss": 0.1353,
+ "step": 26136
+ },
+ {
+ "epoch": 71.21798365122616,
+ "grad_norm": 3.131275177001953,
+ "learning_rate": 4.03914232638358e-06,
+ "loss": 0.0482,
+ "step": 26137
+ },
+ {
+ "epoch": 71.22070844686648,
+ "grad_norm": 2.9546279907226562,
+ "learning_rate": 4.038433776326297e-06,
+ "loss": 0.0392,
+ "step": 26138
+ },
+ {
+ "epoch": 71.22343324250681,
+ "grad_norm": 2.3739166259765625,
+ "learning_rate": 4.037725272697498e-06,
+ "loss": 0.1232,
+ "step": 26139
+ },
+ {
+ "epoch": 71.22615803814713,
+ "grad_norm": 2.883281707763672,
+ "learning_rate": 4.0370168155027e-06,
+ "loss": 0.0467,
+ "step": 26140
+ },
+ {
+ "epoch": 71.22888283378747,
+ "grad_norm": 3.404445171356201,
+ "learning_rate": 4.036308404747426e-06,
+ "loss": 0.1129,
+ "step": 26141
+ },
+ {
+ "epoch": 71.2316076294278,
+ "grad_norm": 3.4998667240142822,
+ "learning_rate": 4.035600040437191e-06,
+ "loss": 0.0872,
+ "step": 26142
+ },
+ {
+ "epoch": 71.23433242506812,
+ "grad_norm": 18.2752742767334,
+ "learning_rate": 4.034891722577511e-06,
+ "loss": 0.0834,
+ "step": 26143
+ },
+ {
+ "epoch": 71.23705722070845,
+ "grad_norm": 3.492717981338501,
+ "learning_rate": 4.034183451173897e-06,
+ "loss": 0.0403,
+ "step": 26144
+ },
+ {
+ "epoch": 71.23978201634877,
+ "grad_norm": 2.7523624897003174,
+ "learning_rate": 4.033475226231872e-06,
+ "loss": 0.0685,
+ "step": 26145
+ },
+ {
+ "epoch": 71.2425068119891,
+ "grad_norm": 3.1481869220733643,
+ "learning_rate": 4.032767047756954e-06,
+ "loss": 0.0726,
+ "step": 26146
+ },
+ {
+ "epoch": 71.24523160762942,
+ "grad_norm": 2.7452948093414307,
+ "learning_rate": 4.032058915754653e-06,
+ "loss": 0.1341,
+ "step": 26147
+ },
+ {
+ "epoch": 71.24795640326975,
+ "grad_norm": 3.3518741130828857,
+ "learning_rate": 4.031350830230482e-06,
+ "loss": 0.0424,
+ "step": 26148
+ },
+ {
+ "epoch": 71.25068119891009,
+ "grad_norm": 3.4906837940216064,
+ "learning_rate": 4.0306427911899614e-06,
+ "loss": 0.1093,
+ "step": 26149
+ },
+ {
+ "epoch": 71.2534059945504,
+ "grad_norm": 2.8083479404449463,
+ "learning_rate": 4.029934798638603e-06,
+ "loss": 0.1589,
+ "step": 26150
+ },
+ {
+ "epoch": 71.25613079019074,
+ "grad_norm": 4.763759136199951,
+ "learning_rate": 4.02922685258192e-06,
+ "loss": 0.0315,
+ "step": 26151
+ },
+ {
+ "epoch": 71.25885558583106,
+ "grad_norm": 2.4466710090637207,
+ "learning_rate": 4.028518953025423e-06,
+ "loss": 0.0445,
+ "step": 26152
+ },
+ {
+ "epoch": 71.26158038147139,
+ "grad_norm": 3.23868465423584,
+ "learning_rate": 4.027811099974632e-06,
+ "loss": 0.0849,
+ "step": 26153
+ },
+ {
+ "epoch": 71.26430517711172,
+ "grad_norm": 2.836198329925537,
+ "learning_rate": 4.0271032934350555e-06,
+ "loss": 0.0887,
+ "step": 26154
+ },
+ {
+ "epoch": 71.26702997275204,
+ "grad_norm": 2.9903182983398438,
+ "learning_rate": 4.026395533412206e-06,
+ "loss": 0.0384,
+ "step": 26155
+ },
+ {
+ "epoch": 71.26975476839237,
+ "grad_norm": 2.2511773109436035,
+ "learning_rate": 4.025687819911593e-06,
+ "loss": 0.0327,
+ "step": 26156
+ },
+ {
+ "epoch": 71.2724795640327,
+ "grad_norm": 2.0673069953918457,
+ "learning_rate": 4.024980152938735e-06,
+ "loss": 0.0277,
+ "step": 26157
+ },
+ {
+ "epoch": 71.27520435967303,
+ "grad_norm": 2.301643133163452,
+ "learning_rate": 4.0242725324991375e-06,
+ "loss": 0.0329,
+ "step": 26158
+ },
+ {
+ "epoch": 71.27792915531334,
+ "grad_norm": 3.1151835918426514,
+ "learning_rate": 4.023564958598314e-06,
+ "loss": 0.0521,
+ "step": 26159
+ },
+ {
+ "epoch": 71.28065395095368,
+ "grad_norm": 2.144178628921509,
+ "learning_rate": 4.0228574312417715e-06,
+ "loss": 0.0312,
+ "step": 26160
+ },
+ {
+ "epoch": 71.28337874659401,
+ "grad_norm": 3.044750452041626,
+ "learning_rate": 4.022149950435026e-06,
+ "loss": 0.0292,
+ "step": 26161
+ },
+ {
+ "epoch": 71.28610354223433,
+ "grad_norm": 3.113910436630249,
+ "learning_rate": 4.02144251618358e-06,
+ "loss": 0.1339,
+ "step": 26162
+ },
+ {
+ "epoch": 71.28882833787466,
+ "grad_norm": 3.3358335494995117,
+ "learning_rate": 4.020735128492952e-06,
+ "loss": 0.1451,
+ "step": 26163
+ },
+ {
+ "epoch": 71.29155313351498,
+ "grad_norm": 3.408358097076416,
+ "learning_rate": 4.020027787368642e-06,
+ "loss": 0.1037,
+ "step": 26164
+ },
+ {
+ "epoch": 71.29427792915531,
+ "grad_norm": 3.093109130859375,
+ "learning_rate": 4.019320492816167e-06,
+ "loss": 0.0286,
+ "step": 26165
+ },
+ {
+ "epoch": 71.29700272479565,
+ "grad_norm": 3.21688175201416,
+ "learning_rate": 4.018613244841031e-06,
+ "loss": 0.1308,
+ "step": 26166
+ },
+ {
+ "epoch": 71.29972752043597,
+ "grad_norm": 2.772951364517212,
+ "learning_rate": 4.017906043448744e-06,
+ "loss": 0.0465,
+ "step": 26167
+ },
+ {
+ "epoch": 71.3024523160763,
+ "grad_norm": 2.1212408542633057,
+ "learning_rate": 4.017198888644807e-06,
+ "loss": 0.0362,
+ "step": 26168
+ },
+ {
+ "epoch": 71.30517711171662,
+ "grad_norm": 2.960747480392456,
+ "learning_rate": 4.016491780434737e-06,
+ "loss": 0.1397,
+ "step": 26169
+ },
+ {
+ "epoch": 71.30790190735695,
+ "grad_norm": 2.8554725646972656,
+ "learning_rate": 4.015784718824036e-06,
+ "loss": 0.0732,
+ "step": 26170
+ },
+ {
+ "epoch": 71.31062670299727,
+ "grad_norm": 3.2245540618896484,
+ "learning_rate": 4.015077703818211e-06,
+ "loss": 0.0425,
+ "step": 26171
+ },
+ {
+ "epoch": 71.3133514986376,
+ "grad_norm": 7.894142150878906,
+ "learning_rate": 4.014370735422765e-06,
+ "loss": 0.2433,
+ "step": 26172
+ },
+ {
+ "epoch": 71.31607629427793,
+ "grad_norm": 2.4632678031921387,
+ "learning_rate": 4.013663813643211e-06,
+ "loss": 0.05,
+ "step": 26173
+ },
+ {
+ "epoch": 71.31880108991825,
+ "grad_norm": 2.931635856628418,
+ "learning_rate": 4.012956938485049e-06,
+ "loss": 0.0764,
+ "step": 26174
+ },
+ {
+ "epoch": 71.32152588555859,
+ "grad_norm": 2.721539258956909,
+ "learning_rate": 4.012250109953787e-06,
+ "loss": 0.0351,
+ "step": 26175
+ },
+ {
+ "epoch": 71.3242506811989,
+ "grad_norm": 4.405660152435303,
+ "learning_rate": 4.011543328054924e-06,
+ "loss": 0.1693,
+ "step": 26176
+ },
+ {
+ "epoch": 71.32697547683924,
+ "grad_norm": 3.629136562347412,
+ "learning_rate": 4.010836592793973e-06,
+ "loss": 0.1972,
+ "step": 26177
+ },
+ {
+ "epoch": 71.32970027247957,
+ "grad_norm": 2.7203550338745117,
+ "learning_rate": 4.010129904176434e-06,
+ "loss": 0.0352,
+ "step": 26178
+ },
+ {
+ "epoch": 71.33242506811989,
+ "grad_norm": 2.688110113143921,
+ "learning_rate": 4.009423262207807e-06,
+ "loss": 0.048,
+ "step": 26179
+ },
+ {
+ "epoch": 71.33514986376022,
+ "grad_norm": 4.946422576904297,
+ "learning_rate": 4.0087166668936015e-06,
+ "loss": 0.119,
+ "step": 26180
+ },
+ {
+ "epoch": 71.33787465940054,
+ "grad_norm": 2.342850923538208,
+ "learning_rate": 4.008010118239315e-06,
+ "loss": 0.0248,
+ "step": 26181
+ },
+ {
+ "epoch": 71.34059945504087,
+ "grad_norm": 3.7198307514190674,
+ "learning_rate": 4.007303616250457e-06,
+ "loss": 0.1265,
+ "step": 26182
+ },
+ {
+ "epoch": 71.34332425068119,
+ "grad_norm": 2.975597381591797,
+ "learning_rate": 4.006597160932524e-06,
+ "loss": 0.2323,
+ "step": 26183
+ },
+ {
+ "epoch": 71.34604904632153,
+ "grad_norm": 4.063631534576416,
+ "learning_rate": 4.005890752291021e-06,
+ "loss": 0.1785,
+ "step": 26184
+ },
+ {
+ "epoch": 71.34877384196186,
+ "grad_norm": 2.9268012046813965,
+ "learning_rate": 4.005184390331443e-06,
+ "loss": 0.0501,
+ "step": 26185
+ },
+ {
+ "epoch": 71.35149863760218,
+ "grad_norm": 4.783208847045898,
+ "learning_rate": 4.0044780750593005e-06,
+ "loss": 0.0939,
+ "step": 26186
+ },
+ {
+ "epoch": 71.35422343324251,
+ "grad_norm": 2.9689512252807617,
+ "learning_rate": 4.003771806480089e-06,
+ "loss": 0.0388,
+ "step": 26187
+ },
+ {
+ "epoch": 71.35694822888283,
+ "grad_norm": 3.088300943374634,
+ "learning_rate": 4.003065584599306e-06,
+ "loss": 0.0851,
+ "step": 26188
+ },
+ {
+ "epoch": 71.35967302452316,
+ "grad_norm": 3.1855874061584473,
+ "learning_rate": 4.002359409422459e-06,
+ "loss": 0.0867,
+ "step": 26189
+ },
+ {
+ "epoch": 71.3623978201635,
+ "grad_norm": 2.78861665725708,
+ "learning_rate": 4.001653280955045e-06,
+ "loss": 0.0306,
+ "step": 26190
+ },
+ {
+ "epoch": 71.36512261580381,
+ "grad_norm": 1.984560489654541,
+ "learning_rate": 4.000947199202562e-06,
+ "loss": 0.0306,
+ "step": 26191
+ },
+ {
+ "epoch": 71.36784741144415,
+ "grad_norm": 3.627943515777588,
+ "learning_rate": 4.000241164170504e-06,
+ "loss": 0.0842,
+ "step": 26192
+ },
+ {
+ "epoch": 71.37057220708446,
+ "grad_norm": 4.622325897216797,
+ "learning_rate": 3.99953517586438e-06,
+ "loss": 0.1576,
+ "step": 26193
+ },
+ {
+ "epoch": 71.3732970027248,
+ "grad_norm": 3.2991983890533447,
+ "learning_rate": 3.9988292342896816e-06,
+ "loss": 0.0565,
+ "step": 26194
+ },
+ {
+ "epoch": 71.37602179836512,
+ "grad_norm": 2.1634292602539062,
+ "learning_rate": 3.998123339451908e-06,
+ "loss": 0.1563,
+ "step": 26195
+ },
+ {
+ "epoch": 71.37874659400545,
+ "grad_norm": 2.7750957012176514,
+ "learning_rate": 3.997417491356554e-06,
+ "loss": 0.123,
+ "step": 26196
+ },
+ {
+ "epoch": 71.38147138964578,
+ "grad_norm": 2.795283794403076,
+ "learning_rate": 3.996711690009119e-06,
+ "loss": 0.0364,
+ "step": 26197
+ },
+ {
+ "epoch": 71.3841961852861,
+ "grad_norm": 4.920372486114502,
+ "learning_rate": 3.996005935415104e-06,
+ "loss": 0.0764,
+ "step": 26198
+ },
+ {
+ "epoch": 71.38692098092643,
+ "grad_norm": 2.1958577632904053,
+ "learning_rate": 3.995300227580001e-06,
+ "loss": 0.0689,
+ "step": 26199
+ },
+ {
+ "epoch": 71.38964577656675,
+ "grad_norm": 3.190755844116211,
+ "learning_rate": 3.994594566509306e-06,
+ "loss": 0.2097,
+ "step": 26200
+ },
+ {
+ "epoch": 71.39237057220708,
+ "grad_norm": 3.133312463760376,
+ "learning_rate": 3.993888952208513e-06,
+ "loss": 0.0411,
+ "step": 26201
+ },
+ {
+ "epoch": 71.39509536784742,
+ "grad_norm": 2.8266334533691406,
+ "learning_rate": 3.993183384683124e-06,
+ "loss": 0.0562,
+ "step": 26202
+ },
+ {
+ "epoch": 71.39782016348774,
+ "grad_norm": 2.8147099018096924,
+ "learning_rate": 3.992477863938628e-06,
+ "loss": 0.1085,
+ "step": 26203
+ },
+ {
+ "epoch": 71.40054495912807,
+ "grad_norm": 3.9899539947509766,
+ "learning_rate": 3.99177238998052e-06,
+ "loss": 0.176,
+ "step": 26204
+ },
+ {
+ "epoch": 71.40326975476839,
+ "grad_norm": 3.109407424926758,
+ "learning_rate": 3.991066962814293e-06,
+ "loss": 0.2846,
+ "step": 26205
+ },
+ {
+ "epoch": 71.40599455040872,
+ "grad_norm": 2.2918648719787598,
+ "learning_rate": 3.990361582445447e-06,
+ "loss": 0.0436,
+ "step": 26206
+ },
+ {
+ "epoch": 71.40871934604904,
+ "grad_norm": 2.409806966781616,
+ "learning_rate": 3.989656248879471e-06,
+ "loss": 0.0365,
+ "step": 26207
+ },
+ {
+ "epoch": 71.41144414168937,
+ "grad_norm": 2.9081597328186035,
+ "learning_rate": 3.988950962121855e-06,
+ "loss": 0.0596,
+ "step": 26208
+ },
+ {
+ "epoch": 71.4141689373297,
+ "grad_norm": 4.1911725997924805,
+ "learning_rate": 3.988245722178099e-06,
+ "loss": 0.0565,
+ "step": 26209
+ },
+ {
+ "epoch": 71.41689373297002,
+ "grad_norm": 3.6818454265594482,
+ "learning_rate": 3.987540529053692e-06,
+ "loss": 0.1558,
+ "step": 26210
+ },
+ {
+ "epoch": 71.41961852861036,
+ "grad_norm": 2.782841920852661,
+ "learning_rate": 3.9868353827541265e-06,
+ "loss": 0.0653,
+ "step": 26211
+ },
+ {
+ "epoch": 71.42234332425068,
+ "grad_norm": 2.2606873512268066,
+ "learning_rate": 3.986130283284889e-06,
+ "loss": 0.0553,
+ "step": 26212
+ },
+ {
+ "epoch": 71.42506811989101,
+ "grad_norm": 3.6367404460906982,
+ "learning_rate": 3.985425230651479e-06,
+ "loss": 0.068,
+ "step": 26213
+ },
+ {
+ "epoch": 71.42779291553134,
+ "grad_norm": 1.963287353515625,
+ "learning_rate": 3.98472022485938e-06,
+ "loss": 0.0345,
+ "step": 26214
+ },
+ {
+ "epoch": 71.43051771117166,
+ "grad_norm": 3.1251213550567627,
+ "learning_rate": 3.984015265914091e-06,
+ "loss": 0.0858,
+ "step": 26215
+ },
+ {
+ "epoch": 71.433242506812,
+ "grad_norm": 3.200543165206909,
+ "learning_rate": 3.983310353821096e-06,
+ "loss": 0.0414,
+ "step": 26216
+ },
+ {
+ "epoch": 71.43596730245231,
+ "grad_norm": 3.0238993167877197,
+ "learning_rate": 3.982605488585884e-06,
+ "loss": 0.0729,
+ "step": 26217
+ },
+ {
+ "epoch": 71.43869209809264,
+ "grad_norm": 2.651211738586426,
+ "learning_rate": 3.9819006702139496e-06,
+ "loss": 0.1423,
+ "step": 26218
+ },
+ {
+ "epoch": 71.44141689373296,
+ "grad_norm": 2.6668174266815186,
+ "learning_rate": 3.981195898710779e-06,
+ "loss": 0.0756,
+ "step": 26219
+ },
+ {
+ "epoch": 71.4441416893733,
+ "grad_norm": 2.347923755645752,
+ "learning_rate": 3.9804911740818604e-06,
+ "loss": 0.1214,
+ "step": 26220
+ },
+ {
+ "epoch": 71.44686648501363,
+ "grad_norm": 3.0171802043914795,
+ "learning_rate": 3.97978649633268e-06,
+ "loss": 0.0752,
+ "step": 26221
+ },
+ {
+ "epoch": 71.44959128065395,
+ "grad_norm": 4.0918402671813965,
+ "learning_rate": 3.979081865468733e-06,
+ "loss": 0.1401,
+ "step": 26222
+ },
+ {
+ "epoch": 71.45231607629428,
+ "grad_norm": 2.6300928592681885,
+ "learning_rate": 3.978377281495502e-06,
+ "loss": 0.0601,
+ "step": 26223
+ },
+ {
+ "epoch": 71.4550408719346,
+ "grad_norm": 7.589695453643799,
+ "learning_rate": 3.977672744418475e-06,
+ "loss": 0.0908,
+ "step": 26224
+ },
+ {
+ "epoch": 71.45776566757493,
+ "grad_norm": 3.170612096786499,
+ "learning_rate": 3.976968254243135e-06,
+ "loss": 0.0498,
+ "step": 26225
+ },
+ {
+ "epoch": 71.46049046321527,
+ "grad_norm": 3.535686731338501,
+ "learning_rate": 3.976263810974977e-06,
+ "loss": 0.0463,
+ "step": 26226
+ },
+ {
+ "epoch": 71.46321525885558,
+ "grad_norm": 2.5216078758239746,
+ "learning_rate": 3.975559414619481e-06,
+ "loss": 0.0892,
+ "step": 26227
+ },
+ {
+ "epoch": 71.46594005449592,
+ "grad_norm": 3.490795612335205,
+ "learning_rate": 3.974855065182135e-06,
+ "loss": 0.0565,
+ "step": 26228
+ },
+ {
+ "epoch": 71.46866485013624,
+ "grad_norm": 3.58577823638916,
+ "learning_rate": 3.974150762668421e-06,
+ "loss": 0.0384,
+ "step": 26229
+ },
+ {
+ "epoch": 71.47138964577657,
+ "grad_norm": 3.07975435256958,
+ "learning_rate": 3.973446507083829e-06,
+ "loss": 0.0493,
+ "step": 26230
+ },
+ {
+ "epoch": 71.47411444141689,
+ "grad_norm": 4.166622638702393,
+ "learning_rate": 3.9727422984338384e-06,
+ "loss": 0.0915,
+ "step": 26231
+ },
+ {
+ "epoch": 71.47683923705722,
+ "grad_norm": 2.069585084915161,
+ "learning_rate": 3.972038136723941e-06,
+ "loss": 0.0372,
+ "step": 26232
+ },
+ {
+ "epoch": 71.47956403269755,
+ "grad_norm": 2.160964250564575,
+ "learning_rate": 3.971334021959613e-06,
+ "loss": 0.0457,
+ "step": 26233
+ },
+ {
+ "epoch": 71.48228882833787,
+ "grad_norm": 2.3658523559570312,
+ "learning_rate": 3.970629954146346e-06,
+ "loss": 0.0383,
+ "step": 26234
+ },
+ {
+ "epoch": 71.4850136239782,
+ "grad_norm": 3.285229444503784,
+ "learning_rate": 3.9699259332896165e-06,
+ "loss": 0.0618,
+ "step": 26235
+ },
+ {
+ "epoch": 71.48773841961852,
+ "grad_norm": 3.133434772491455,
+ "learning_rate": 3.969221959394911e-06,
+ "loss": 0.1925,
+ "step": 26236
+ },
+ {
+ "epoch": 71.49046321525886,
+ "grad_norm": 3.400329828262329,
+ "learning_rate": 3.9685180324677074e-06,
+ "loss": 0.1674,
+ "step": 26237
+ },
+ {
+ "epoch": 71.49318801089919,
+ "grad_norm": 2.832056760787964,
+ "learning_rate": 3.967814152513495e-06,
+ "loss": 0.0374,
+ "step": 26238
+ },
+ {
+ "epoch": 71.49591280653951,
+ "grad_norm": 3.7763254642486572,
+ "learning_rate": 3.967110319537751e-06,
+ "loss": 0.0504,
+ "step": 26239
+ },
+ {
+ "epoch": 71.49863760217984,
+ "grad_norm": 4.347590446472168,
+ "learning_rate": 3.966406533545959e-06,
+ "loss": 0.1006,
+ "step": 26240
+ },
+ {
+ "epoch": 71.50136239782016,
+ "grad_norm": 4.205351829528809,
+ "learning_rate": 3.965702794543594e-06,
+ "loss": 0.1328,
+ "step": 26241
+ },
+ {
+ "epoch": 71.50408719346049,
+ "grad_norm": 2.371041774749756,
+ "learning_rate": 3.964999102536145e-06,
+ "loss": 0.0659,
+ "step": 26242
+ },
+ {
+ "epoch": 71.50681198910081,
+ "grad_norm": 3.883790969848633,
+ "learning_rate": 3.96429545752909e-06,
+ "loss": 0.0662,
+ "step": 26243
+ },
+ {
+ "epoch": 71.50953678474114,
+ "grad_norm": 3.13887882232666,
+ "learning_rate": 3.963591859527906e-06,
+ "loss": 0.0958,
+ "step": 26244
+ },
+ {
+ "epoch": 71.51226158038148,
+ "grad_norm": 6.1765336990356445,
+ "learning_rate": 3.962888308538072e-06,
+ "loss": 0.1708,
+ "step": 26245
+ },
+ {
+ "epoch": 71.5149863760218,
+ "grad_norm": 2.49947190284729,
+ "learning_rate": 3.962184804565074e-06,
+ "loss": 0.0383,
+ "step": 26246
+ },
+ {
+ "epoch": 71.51771117166213,
+ "grad_norm": 2.4722323417663574,
+ "learning_rate": 3.961481347614385e-06,
+ "loss": 0.0578,
+ "step": 26247
+ },
+ {
+ "epoch": 71.52043596730245,
+ "grad_norm": 3.1850924491882324,
+ "learning_rate": 3.9607779376914814e-06,
+ "loss": 0.1161,
+ "step": 26248
+ },
+ {
+ "epoch": 71.52316076294278,
+ "grad_norm": 2.3899035453796387,
+ "learning_rate": 3.9600745748018445e-06,
+ "loss": 0.0372,
+ "step": 26249
+ },
+ {
+ "epoch": 71.52588555858311,
+ "grad_norm": 3.3634681701660156,
+ "learning_rate": 3.959371258950956e-06,
+ "loss": 0.1709,
+ "step": 26250
+ },
+ {
+ "epoch": 71.52861035422343,
+ "grad_norm": 3.508753538131714,
+ "learning_rate": 3.95866799014429e-06,
+ "loss": 0.0387,
+ "step": 26251
+ },
+ {
+ "epoch": 71.53133514986376,
+ "grad_norm": 3.0704305171966553,
+ "learning_rate": 3.957964768387324e-06,
+ "loss": 0.0405,
+ "step": 26252
+ },
+ {
+ "epoch": 71.53405994550408,
+ "grad_norm": 4.232667446136475,
+ "learning_rate": 3.957261593685529e-06,
+ "loss": 0.0623,
+ "step": 26253
+ },
+ {
+ "epoch": 71.53678474114442,
+ "grad_norm": 2.996190309524536,
+ "learning_rate": 3.9565584660443916e-06,
+ "loss": 0.0457,
+ "step": 26254
+ },
+ {
+ "epoch": 71.53950953678473,
+ "grad_norm": 3.1058871746063232,
+ "learning_rate": 3.955855385469381e-06,
+ "loss": 0.0413,
+ "step": 26255
+ },
+ {
+ "epoch": 71.54223433242507,
+ "grad_norm": 3.577069044113159,
+ "learning_rate": 3.955152351965974e-06,
+ "loss": 0.1313,
+ "step": 26256
+ },
+ {
+ "epoch": 71.5449591280654,
+ "grad_norm": 2.307096242904663,
+ "learning_rate": 3.954449365539643e-06,
+ "loss": 0.0737,
+ "step": 26257
+ },
+ {
+ "epoch": 71.54768392370572,
+ "grad_norm": 5.829807281494141,
+ "learning_rate": 3.953746426195869e-06,
+ "loss": 0.1635,
+ "step": 26258
+ },
+ {
+ "epoch": 71.55040871934605,
+ "grad_norm": 2.726738691329956,
+ "learning_rate": 3.953043533940124e-06,
+ "loss": 0.084,
+ "step": 26259
+ },
+ {
+ "epoch": 71.55313351498637,
+ "grad_norm": 2.659027099609375,
+ "learning_rate": 3.95234068877788e-06,
+ "loss": 0.0737,
+ "step": 26260
+ },
+ {
+ "epoch": 71.5558583106267,
+ "grad_norm": 3.3079888820648193,
+ "learning_rate": 3.951637890714609e-06,
+ "loss": 0.1624,
+ "step": 26261
+ },
+ {
+ "epoch": 71.55858310626704,
+ "grad_norm": 3.218881607055664,
+ "learning_rate": 3.950935139755792e-06,
+ "loss": 0.0938,
+ "step": 26262
+ },
+ {
+ "epoch": 71.56130790190736,
+ "grad_norm": 5.3799333572387695,
+ "learning_rate": 3.950232435906897e-06,
+ "loss": 0.0394,
+ "step": 26263
+ },
+ {
+ "epoch": 71.56403269754769,
+ "grad_norm": 3.419832944869995,
+ "learning_rate": 3.949529779173397e-06,
+ "loss": 0.0458,
+ "step": 26264
+ },
+ {
+ "epoch": 71.566757493188,
+ "grad_norm": 2.9798130989074707,
+ "learning_rate": 3.9488271695607595e-06,
+ "loss": 0.0911,
+ "step": 26265
+ },
+ {
+ "epoch": 71.56948228882834,
+ "grad_norm": 2.677361249923706,
+ "learning_rate": 3.948124607074463e-06,
+ "loss": 0.0869,
+ "step": 26266
+ },
+ {
+ "epoch": 71.57220708446866,
+ "grad_norm": 3.440507650375366,
+ "learning_rate": 3.94742209171998e-06,
+ "loss": 0.0583,
+ "step": 26267
+ },
+ {
+ "epoch": 71.57493188010899,
+ "grad_norm": 2.4000511169433594,
+ "learning_rate": 3.946719623502778e-06,
+ "loss": 0.0308,
+ "step": 26268
+ },
+ {
+ "epoch": 71.57765667574932,
+ "grad_norm": 3.487424850463867,
+ "learning_rate": 3.9460172024283305e-06,
+ "loss": 0.0305,
+ "step": 26269
+ },
+ {
+ "epoch": 71.58038147138964,
+ "grad_norm": 3.9430429935455322,
+ "learning_rate": 3.945314828502102e-06,
+ "loss": 0.0402,
+ "step": 26270
+ },
+ {
+ "epoch": 71.58310626702998,
+ "grad_norm": 2.019660234451294,
+ "learning_rate": 3.94461250172957e-06,
+ "loss": 0.0251,
+ "step": 26271
+ },
+ {
+ "epoch": 71.5858310626703,
+ "grad_norm": 2.686077117919922,
+ "learning_rate": 3.9439102221162016e-06,
+ "loss": 0.0975,
+ "step": 26272
+ },
+ {
+ "epoch": 71.58855585831063,
+ "grad_norm": 3.871405601501465,
+ "learning_rate": 3.943207989667461e-06,
+ "loss": 0.0735,
+ "step": 26273
+ },
+ {
+ "epoch": 71.59128065395096,
+ "grad_norm": 3.2200605869293213,
+ "learning_rate": 3.9425058043888265e-06,
+ "loss": 0.1172,
+ "step": 26274
+ },
+ {
+ "epoch": 71.59400544959128,
+ "grad_norm": 3.149120807647705,
+ "learning_rate": 3.941803666285761e-06,
+ "loss": 0.0427,
+ "step": 26275
+ },
+ {
+ "epoch": 71.59673024523161,
+ "grad_norm": 4.132558822631836,
+ "learning_rate": 3.941101575363733e-06,
+ "loss": 0.1327,
+ "step": 26276
+ },
+ {
+ "epoch": 71.59945504087193,
+ "grad_norm": 3.762106418609619,
+ "learning_rate": 3.9403995316282084e-06,
+ "loss": 0.0541,
+ "step": 26277
+ },
+ {
+ "epoch": 71.60217983651226,
+ "grad_norm": 4.901472568511963,
+ "learning_rate": 3.93969753508466e-06,
+ "loss": 0.0663,
+ "step": 26278
+ },
+ {
+ "epoch": 71.60490463215258,
+ "grad_norm": 6.244317531585693,
+ "learning_rate": 3.938995585738552e-06,
+ "loss": 0.1002,
+ "step": 26279
+ },
+ {
+ "epoch": 71.60762942779292,
+ "grad_norm": 3.195518732070923,
+ "learning_rate": 3.9382936835953525e-06,
+ "loss": 0.0531,
+ "step": 26280
+ },
+ {
+ "epoch": 71.61035422343325,
+ "grad_norm": 2.8734614849090576,
+ "learning_rate": 3.937591828660522e-06,
+ "loss": 0.0616,
+ "step": 26281
+ },
+ {
+ "epoch": 71.61307901907357,
+ "grad_norm": 2.5066661834716797,
+ "learning_rate": 3.9368900209395325e-06,
+ "loss": 0.097,
+ "step": 26282
+ },
+ {
+ "epoch": 71.6158038147139,
+ "grad_norm": 3.8755085468292236,
+ "learning_rate": 3.936188260437851e-06,
+ "loss": 0.0554,
+ "step": 26283
+ },
+ {
+ "epoch": 71.61852861035422,
+ "grad_norm": 30.757774353027344,
+ "learning_rate": 3.935486547160939e-06,
+ "loss": 0.1705,
+ "step": 26284
+ },
+ {
+ "epoch": 71.62125340599455,
+ "grad_norm": 2.776183843612671,
+ "learning_rate": 3.9347848811142644e-06,
+ "loss": 0.1033,
+ "step": 26285
+ },
+ {
+ "epoch": 71.62397820163488,
+ "grad_norm": 3.173003911972046,
+ "learning_rate": 3.934083262303287e-06,
+ "loss": 0.0992,
+ "step": 26286
+ },
+ {
+ "epoch": 71.6267029972752,
+ "grad_norm": 5.0574822425842285,
+ "learning_rate": 3.933381690733475e-06,
+ "loss": 0.0563,
+ "step": 26287
+ },
+ {
+ "epoch": 71.62942779291554,
+ "grad_norm": 2.7327327728271484,
+ "learning_rate": 3.932680166410293e-06,
+ "loss": 0.1241,
+ "step": 26288
+ },
+ {
+ "epoch": 71.63215258855585,
+ "grad_norm": 3.556267023086548,
+ "learning_rate": 3.931978689339202e-06,
+ "loss": 0.0832,
+ "step": 26289
+ },
+ {
+ "epoch": 71.63487738419619,
+ "grad_norm": 4.194163799285889,
+ "learning_rate": 3.9312772595256624e-06,
+ "loss": 0.0529,
+ "step": 26290
+ },
+ {
+ "epoch": 71.6376021798365,
+ "grad_norm": 2.6678009033203125,
+ "learning_rate": 3.9305758769751436e-06,
+ "loss": 0.0417,
+ "step": 26291
+ },
+ {
+ "epoch": 71.64032697547684,
+ "grad_norm": 3.616098403930664,
+ "learning_rate": 3.9298745416931035e-06,
+ "loss": 0.1153,
+ "step": 26292
+ },
+ {
+ "epoch": 71.64305177111717,
+ "grad_norm": 3.521211862564087,
+ "learning_rate": 3.9291732536850056e-06,
+ "loss": 0.0982,
+ "step": 26293
+ },
+ {
+ "epoch": 71.64577656675749,
+ "grad_norm": 3.013974905014038,
+ "learning_rate": 3.928472012956308e-06,
+ "loss": 0.0566,
+ "step": 26294
+ },
+ {
+ "epoch": 71.64850136239782,
+ "grad_norm": 3.37339448928833,
+ "learning_rate": 3.927770819512479e-06,
+ "loss": 0.1105,
+ "step": 26295
+ },
+ {
+ "epoch": 71.65122615803814,
+ "grad_norm": 3.3436920642852783,
+ "learning_rate": 3.927069673358976e-06,
+ "loss": 0.0822,
+ "step": 26296
+ },
+ {
+ "epoch": 71.65395095367847,
+ "grad_norm": 2.712724447250366,
+ "learning_rate": 3.926368574501253e-06,
+ "loss": 0.1009,
+ "step": 26297
+ },
+ {
+ "epoch": 71.65667574931881,
+ "grad_norm": 3.7425286769866943,
+ "learning_rate": 3.925667522944781e-06,
+ "loss": 0.0403,
+ "step": 26298
+ },
+ {
+ "epoch": 71.65940054495913,
+ "grad_norm": 2.209707498550415,
+ "learning_rate": 3.924966518695015e-06,
+ "loss": 0.0651,
+ "step": 26299
+ },
+ {
+ "epoch": 71.66212534059946,
+ "grad_norm": 2.2464306354522705,
+ "learning_rate": 3.92426556175741e-06,
+ "loss": 0.0383,
+ "step": 26300
+ },
+ {
+ "epoch": 71.66485013623978,
+ "grad_norm": 4.439968585968018,
+ "learning_rate": 3.923564652137433e-06,
+ "loss": 0.0688,
+ "step": 26301
+ },
+ {
+ "epoch": 71.66757493188011,
+ "grad_norm": 3.5255579948425293,
+ "learning_rate": 3.922863789840535e-06,
+ "loss": 0.1391,
+ "step": 26302
+ },
+ {
+ "epoch": 71.67029972752043,
+ "grad_norm": 3.0047080516815186,
+ "learning_rate": 3.922162974872182e-06,
+ "loss": 0.1164,
+ "step": 26303
+ },
+ {
+ "epoch": 71.67302452316076,
+ "grad_norm": 2.442917585372925,
+ "learning_rate": 3.9214622072378285e-06,
+ "loss": 0.0364,
+ "step": 26304
+ },
+ {
+ "epoch": 71.6757493188011,
+ "grad_norm": 3.430983543395996,
+ "learning_rate": 3.920761486942932e-06,
+ "loss": 0.1244,
+ "step": 26305
+ },
+ {
+ "epoch": 71.67847411444141,
+ "grad_norm": 2.698504686355591,
+ "learning_rate": 3.920060813992945e-06,
+ "loss": 0.055,
+ "step": 26306
+ },
+ {
+ "epoch": 71.68119891008175,
+ "grad_norm": 3.5199246406555176,
+ "learning_rate": 3.9193601883933326e-06,
+ "loss": 0.0574,
+ "step": 26307
+ },
+ {
+ "epoch": 71.68392370572207,
+ "grad_norm": 3.5285394191741943,
+ "learning_rate": 3.918659610149548e-06,
+ "loss": 0.0875,
+ "step": 26308
+ },
+ {
+ "epoch": 71.6866485013624,
+ "grad_norm": 3.1933979988098145,
+ "learning_rate": 3.917959079267045e-06,
+ "loss": 0.041,
+ "step": 26309
+ },
+ {
+ "epoch": 71.68937329700273,
+ "grad_norm": 2.9126813411712646,
+ "learning_rate": 3.917258595751279e-06,
+ "loss": 0.0882,
+ "step": 26310
+ },
+ {
+ "epoch": 71.69209809264305,
+ "grad_norm": 2.869687080383301,
+ "learning_rate": 3.916558159607711e-06,
+ "loss": 0.1528,
+ "step": 26311
+ },
+ {
+ "epoch": 71.69482288828338,
+ "grad_norm": 2.973262071609497,
+ "learning_rate": 3.9158577708417915e-06,
+ "loss": 0.1139,
+ "step": 26312
+ },
+ {
+ "epoch": 71.6975476839237,
+ "grad_norm": 3.114274740219116,
+ "learning_rate": 3.915157429458976e-06,
+ "loss": 0.1605,
+ "step": 26313
+ },
+ {
+ "epoch": 71.70027247956403,
+ "grad_norm": 2.112484931945801,
+ "learning_rate": 3.914457135464714e-06,
+ "loss": 0.0661,
+ "step": 26314
+ },
+ {
+ "epoch": 71.70299727520435,
+ "grad_norm": 2.825071334838867,
+ "learning_rate": 3.913756888864468e-06,
+ "loss": 0.1418,
+ "step": 26315
+ },
+ {
+ "epoch": 71.70572207084469,
+ "grad_norm": 3.551366090774536,
+ "learning_rate": 3.913056689663689e-06,
+ "loss": 0.0697,
+ "step": 26316
+ },
+ {
+ "epoch": 71.70844686648502,
+ "grad_norm": 3.1092236042022705,
+ "learning_rate": 3.912356537867823e-06,
+ "loss": 0.0747,
+ "step": 26317
+ },
+ {
+ "epoch": 71.71117166212534,
+ "grad_norm": 3.4141645431518555,
+ "learning_rate": 3.91165643348233e-06,
+ "loss": 0.046,
+ "step": 26318
+ },
+ {
+ "epoch": 71.71389645776567,
+ "grad_norm": 2.809612512588501,
+ "learning_rate": 3.910956376512664e-06,
+ "loss": 0.0571,
+ "step": 26319
+ },
+ {
+ "epoch": 71.71662125340599,
+ "grad_norm": 3.1274161338806152,
+ "learning_rate": 3.9102563669642724e-06,
+ "loss": 0.0474,
+ "step": 26320
+ },
+ {
+ "epoch": 71.71934604904632,
+ "grad_norm": 4.481291770935059,
+ "learning_rate": 3.909556404842609e-06,
+ "loss": 0.0911,
+ "step": 26321
+ },
+ {
+ "epoch": 71.72207084468666,
+ "grad_norm": 2.82544207572937,
+ "learning_rate": 3.908856490153121e-06,
+ "loss": 0.188,
+ "step": 26322
+ },
+ {
+ "epoch": 71.72479564032697,
+ "grad_norm": 2.664330005645752,
+ "learning_rate": 3.9081566229012665e-06,
+ "loss": 0.1044,
+ "step": 26323
+ },
+ {
+ "epoch": 71.7275204359673,
+ "grad_norm": 5.151984691619873,
+ "learning_rate": 3.907456803092492e-06,
+ "loss": 0.1964,
+ "step": 26324
+ },
+ {
+ "epoch": 71.73024523160763,
+ "grad_norm": 3.0860400199890137,
+ "learning_rate": 3.906757030732248e-06,
+ "loss": 0.0324,
+ "step": 26325
+ },
+ {
+ "epoch": 71.73297002724796,
+ "grad_norm": 2.922128677368164,
+ "learning_rate": 3.90605730582598e-06,
+ "loss": 0.0481,
+ "step": 26326
+ },
+ {
+ "epoch": 71.73569482288828,
+ "grad_norm": 2.772878885269165,
+ "learning_rate": 3.905357628379145e-06,
+ "loss": 0.0254,
+ "step": 26327
+ },
+ {
+ "epoch": 71.73841961852861,
+ "grad_norm": 2.7073915004730225,
+ "learning_rate": 3.9046579983971885e-06,
+ "loss": 0.0363,
+ "step": 26328
+ },
+ {
+ "epoch": 71.74114441416894,
+ "grad_norm": 2.901749849319458,
+ "learning_rate": 3.90395841588556e-06,
+ "loss": 0.0688,
+ "step": 26329
+ },
+ {
+ "epoch": 71.74386920980926,
+ "grad_norm": 2.3532776832580566,
+ "learning_rate": 3.903258880849703e-06,
+ "loss": 0.1116,
+ "step": 26330
+ },
+ {
+ "epoch": 71.7465940054496,
+ "grad_norm": 3.113292932510376,
+ "learning_rate": 3.902559393295073e-06,
+ "loss": 0.1108,
+ "step": 26331
+ },
+ {
+ "epoch": 71.74931880108991,
+ "grad_norm": 2.981163740158081,
+ "learning_rate": 3.901859953227115e-06,
+ "loss": 0.1457,
+ "step": 26332
+ },
+ {
+ "epoch": 71.75204359673025,
+ "grad_norm": 2.9588096141815186,
+ "learning_rate": 3.901160560651276e-06,
+ "loss": 0.0501,
+ "step": 26333
+ },
+ {
+ "epoch": 71.75476839237058,
+ "grad_norm": 3.4545843601226807,
+ "learning_rate": 3.900461215572997e-06,
+ "loss": 0.2941,
+ "step": 26334
+ },
+ {
+ "epoch": 71.7574931880109,
+ "grad_norm": 2.8437490463256836,
+ "learning_rate": 3.899761917997731e-06,
+ "loss": 0.0642,
+ "step": 26335
+ },
+ {
+ "epoch": 71.76021798365123,
+ "grad_norm": 2.816551685333252,
+ "learning_rate": 3.899062667930926e-06,
+ "loss": 0.1101,
+ "step": 26336
+ },
+ {
+ "epoch": 71.76294277929155,
+ "grad_norm": 3.1201517581939697,
+ "learning_rate": 3.898363465378025e-06,
+ "loss": 0.1431,
+ "step": 26337
+ },
+ {
+ "epoch": 71.76566757493188,
+ "grad_norm": 2.708270788192749,
+ "learning_rate": 3.897664310344469e-06,
+ "loss": 0.0624,
+ "step": 26338
+ },
+ {
+ "epoch": 71.7683923705722,
+ "grad_norm": 2.9582321643829346,
+ "learning_rate": 3.89696520283571e-06,
+ "loss": 0.0549,
+ "step": 26339
+ },
+ {
+ "epoch": 71.77111716621253,
+ "grad_norm": 2.193305492401123,
+ "learning_rate": 3.89626614285719e-06,
+ "loss": 0.0343,
+ "step": 26340
+ },
+ {
+ "epoch": 71.77384196185287,
+ "grad_norm": 2.9289002418518066,
+ "learning_rate": 3.895567130414353e-06,
+ "loss": 0.0742,
+ "step": 26341
+ },
+ {
+ "epoch": 71.77656675749319,
+ "grad_norm": 3.2769899368286133,
+ "learning_rate": 3.894868165512639e-06,
+ "loss": 0.053,
+ "step": 26342
+ },
+ {
+ "epoch": 71.77929155313352,
+ "grad_norm": 2.773853302001953,
+ "learning_rate": 3.894169248157499e-06,
+ "loss": 0.1123,
+ "step": 26343
+ },
+ {
+ "epoch": 71.78201634877384,
+ "grad_norm": 2.5914247035980225,
+ "learning_rate": 3.8934703783543715e-06,
+ "loss": 0.035,
+ "step": 26344
+ },
+ {
+ "epoch": 71.78474114441417,
+ "grad_norm": 2.399165391921997,
+ "learning_rate": 3.8927715561087006e-06,
+ "loss": 0.076,
+ "step": 26345
+ },
+ {
+ "epoch": 71.7874659400545,
+ "grad_norm": 2.775571823120117,
+ "learning_rate": 3.892072781425926e-06,
+ "loss": 0.0432,
+ "step": 26346
+ },
+ {
+ "epoch": 71.79019073569482,
+ "grad_norm": 2.0114197731018066,
+ "learning_rate": 3.8913740543114945e-06,
+ "loss": 0.024,
+ "step": 26347
+ },
+ {
+ "epoch": 71.79291553133515,
+ "grad_norm": 2.244875192642212,
+ "learning_rate": 3.8906753747708446e-06,
+ "loss": 0.0509,
+ "step": 26348
+ },
+ {
+ "epoch": 71.79564032697547,
+ "grad_norm": 4.468997955322266,
+ "learning_rate": 3.889976742809419e-06,
+ "loss": 0.2228,
+ "step": 26349
+ },
+ {
+ "epoch": 71.7983651226158,
+ "grad_norm": 2.7303740978240967,
+ "learning_rate": 3.889278158432654e-06,
+ "loss": 0.0358,
+ "step": 26350
+ },
+ {
+ "epoch": 71.80108991825612,
+ "grad_norm": 2.245702028274536,
+ "learning_rate": 3.888579621645995e-06,
+ "loss": 0.0303,
+ "step": 26351
+ },
+ {
+ "epoch": 71.80381471389646,
+ "grad_norm": 3.6175475120544434,
+ "learning_rate": 3.887881132454884e-06,
+ "loss": 0.1734,
+ "step": 26352
+ },
+ {
+ "epoch": 71.80653950953679,
+ "grad_norm": 3.4484775066375732,
+ "learning_rate": 3.887182690864758e-06,
+ "loss": 0.1582,
+ "step": 26353
+ },
+ {
+ "epoch": 71.80926430517711,
+ "grad_norm": 2.438727855682373,
+ "learning_rate": 3.886484296881057e-06,
+ "loss": 0.0757,
+ "step": 26354
+ },
+ {
+ "epoch": 71.81198910081744,
+ "grad_norm": 3.8565361499786377,
+ "learning_rate": 3.885785950509215e-06,
+ "loss": 0.0535,
+ "step": 26355
+ },
+ {
+ "epoch": 71.81471389645776,
+ "grad_norm": 3.1182069778442383,
+ "learning_rate": 3.88508765175468e-06,
+ "loss": 0.1748,
+ "step": 26356
+ },
+ {
+ "epoch": 71.8174386920981,
+ "grad_norm": 2.419715642929077,
+ "learning_rate": 3.8843894006228844e-06,
+ "loss": 0.0406,
+ "step": 26357
+ },
+ {
+ "epoch": 71.82016348773843,
+ "grad_norm": 2.741055965423584,
+ "learning_rate": 3.883691197119267e-06,
+ "loss": 0.0665,
+ "step": 26358
+ },
+ {
+ "epoch": 71.82288828337875,
+ "grad_norm": 4.048133850097656,
+ "learning_rate": 3.8829930412492636e-06,
+ "loss": 0.0986,
+ "step": 26359
+ },
+ {
+ "epoch": 71.82561307901908,
+ "grad_norm": 3.7205846309661865,
+ "learning_rate": 3.882294933018316e-06,
+ "loss": 0.1283,
+ "step": 26360
+ },
+ {
+ "epoch": 71.8283378746594,
+ "grad_norm": 4.266384601593018,
+ "learning_rate": 3.881596872431859e-06,
+ "loss": 0.0458,
+ "step": 26361
+ },
+ {
+ "epoch": 71.83106267029973,
+ "grad_norm": 2.6132822036743164,
+ "learning_rate": 3.880898859495326e-06,
+ "loss": 0.0901,
+ "step": 26362
+ },
+ {
+ "epoch": 71.83378746594005,
+ "grad_norm": 3.58284592628479,
+ "learning_rate": 3.880200894214158e-06,
+ "loss": 0.1006,
+ "step": 26363
+ },
+ {
+ "epoch": 71.83651226158038,
+ "grad_norm": 3.521472692489624,
+ "learning_rate": 3.879502976593788e-06,
+ "loss": 0.1067,
+ "step": 26364
+ },
+ {
+ "epoch": 71.83923705722071,
+ "grad_norm": 3.137671709060669,
+ "learning_rate": 3.878805106639653e-06,
+ "loss": 0.0787,
+ "step": 26365
+ },
+ {
+ "epoch": 71.84196185286103,
+ "grad_norm": 2.116220474243164,
+ "learning_rate": 3.8781072843571836e-06,
+ "loss": 0.0921,
+ "step": 26366
+ },
+ {
+ "epoch": 71.84468664850137,
+ "grad_norm": 2.7314095497131348,
+ "learning_rate": 3.87740950975182e-06,
+ "loss": 0.1198,
+ "step": 26367
+ },
+ {
+ "epoch": 71.84741144414168,
+ "grad_norm": 5.4813714027404785,
+ "learning_rate": 3.876711782828991e-06,
+ "loss": 0.0661,
+ "step": 26368
+ },
+ {
+ "epoch": 71.85013623978202,
+ "grad_norm": 2.426462411880493,
+ "learning_rate": 3.876014103594137e-06,
+ "loss": 0.0348,
+ "step": 26369
+ },
+ {
+ "epoch": 71.85286103542235,
+ "grad_norm": 3.680140256881714,
+ "learning_rate": 3.8753164720526884e-06,
+ "loss": 0.0466,
+ "step": 26370
+ },
+ {
+ "epoch": 71.85558583106267,
+ "grad_norm": 2.6533203125,
+ "learning_rate": 3.874618888210074e-06,
+ "loss": 0.1256,
+ "step": 26371
+ },
+ {
+ "epoch": 71.858310626703,
+ "grad_norm": 2.9805591106414795,
+ "learning_rate": 3.873921352071734e-06,
+ "loss": 0.158,
+ "step": 26372
+ },
+ {
+ "epoch": 71.86103542234332,
+ "grad_norm": 4.2799835205078125,
+ "learning_rate": 3.873223863643098e-06,
+ "loss": 0.2181,
+ "step": 26373
+ },
+ {
+ "epoch": 71.86376021798365,
+ "grad_norm": 3.869594097137451,
+ "learning_rate": 3.872526422929597e-06,
+ "loss": 0.0439,
+ "step": 26374
+ },
+ {
+ "epoch": 71.86648501362397,
+ "grad_norm": 3.964195728302002,
+ "learning_rate": 3.87182902993666e-06,
+ "loss": 0.1073,
+ "step": 26375
+ },
+ {
+ "epoch": 71.8692098092643,
+ "grad_norm": 2.9525675773620605,
+ "learning_rate": 3.871131684669725e-06,
+ "loss": 0.1821,
+ "step": 26376
+ },
+ {
+ "epoch": 71.87193460490464,
+ "grad_norm": 1.5886871814727783,
+ "learning_rate": 3.870434387134217e-06,
+ "loss": 0.0285,
+ "step": 26377
+ },
+ {
+ "epoch": 71.87465940054496,
+ "grad_norm": 3.222775459289551,
+ "learning_rate": 3.869737137335571e-06,
+ "loss": 0.0326,
+ "step": 26378
+ },
+ {
+ "epoch": 71.87738419618529,
+ "grad_norm": 2.483813524246216,
+ "learning_rate": 3.869039935279211e-06,
+ "loss": 0.0505,
+ "step": 26379
+ },
+ {
+ "epoch": 71.88010899182561,
+ "grad_norm": 3.57271146774292,
+ "learning_rate": 3.868342780970573e-06,
+ "loss": 0.0895,
+ "step": 26380
+ },
+ {
+ "epoch": 71.88283378746594,
+ "grad_norm": 1.9605324268341064,
+ "learning_rate": 3.867645674415085e-06,
+ "loss": 0.0333,
+ "step": 26381
+ },
+ {
+ "epoch": 71.88555858310627,
+ "grad_norm": 2.846683979034424,
+ "learning_rate": 3.8669486156181715e-06,
+ "loss": 0.05,
+ "step": 26382
+ },
+ {
+ "epoch": 71.88828337874659,
+ "grad_norm": 3.698002338409424,
+ "learning_rate": 3.866251604585268e-06,
+ "loss": 0.1028,
+ "step": 26383
+ },
+ {
+ "epoch": 71.89100817438693,
+ "grad_norm": 3.3943450450897217,
+ "learning_rate": 3.8655546413218005e-06,
+ "loss": 0.0591,
+ "step": 26384
+ },
+ {
+ "epoch": 71.89373297002724,
+ "grad_norm": 3.743924140930176,
+ "learning_rate": 3.864857725833194e-06,
+ "loss": 0.0486,
+ "step": 26385
+ },
+ {
+ "epoch": 71.89645776566758,
+ "grad_norm": 2.5327439308166504,
+ "learning_rate": 3.864160858124877e-06,
+ "loss": 0.0634,
+ "step": 26386
+ },
+ {
+ "epoch": 71.8991825613079,
+ "grad_norm": 2.6696815490722656,
+ "learning_rate": 3.863464038202276e-06,
+ "loss": 0.1281,
+ "step": 26387
+ },
+ {
+ "epoch": 71.90190735694823,
+ "grad_norm": 3.199040412902832,
+ "learning_rate": 3.862767266070824e-06,
+ "loss": 0.1714,
+ "step": 26388
+ },
+ {
+ "epoch": 71.90463215258856,
+ "grad_norm": 4.53518009185791,
+ "learning_rate": 3.8620705417359425e-06,
+ "loss": 0.0669,
+ "step": 26389
+ },
+ {
+ "epoch": 71.90735694822888,
+ "grad_norm": 4.8748884201049805,
+ "learning_rate": 3.861373865203059e-06,
+ "loss": 0.2236,
+ "step": 26390
+ },
+ {
+ "epoch": 71.91008174386921,
+ "grad_norm": 1.7121739387512207,
+ "learning_rate": 3.860677236477594e-06,
+ "loss": 0.0233,
+ "step": 26391
+ },
+ {
+ "epoch": 71.91280653950953,
+ "grad_norm": 4.375126361846924,
+ "learning_rate": 3.859980655564981e-06,
+ "loss": 0.0794,
+ "step": 26392
+ },
+ {
+ "epoch": 71.91553133514986,
+ "grad_norm": 2.77117657661438,
+ "learning_rate": 3.85928412247064e-06,
+ "loss": 0.0369,
+ "step": 26393
+ },
+ {
+ "epoch": 71.9182561307902,
+ "grad_norm": 2.893740653991699,
+ "learning_rate": 3.858587637199998e-06,
+ "loss": 0.0628,
+ "step": 26394
+ },
+ {
+ "epoch": 71.92098092643052,
+ "grad_norm": 3.6848340034484863,
+ "learning_rate": 3.857891199758473e-06,
+ "loss": 0.0715,
+ "step": 26395
+ },
+ {
+ "epoch": 71.92370572207085,
+ "grad_norm": 6.501197814941406,
+ "learning_rate": 3.8571948101514975e-06,
+ "loss": 0.0872,
+ "step": 26396
+ },
+ {
+ "epoch": 71.92643051771117,
+ "grad_norm": 3.519993543624878,
+ "learning_rate": 3.856498468384492e-06,
+ "loss": 0.0452,
+ "step": 26397
+ },
+ {
+ "epoch": 71.9291553133515,
+ "grad_norm": 3.886000871658325,
+ "learning_rate": 3.855802174462878e-06,
+ "loss": 0.0637,
+ "step": 26398
+ },
+ {
+ "epoch": 71.93188010899182,
+ "grad_norm": 2.6100046634674072,
+ "learning_rate": 3.8551059283920755e-06,
+ "loss": 0.0962,
+ "step": 26399
+ },
+ {
+ "epoch": 71.93460490463215,
+ "grad_norm": 3.729602813720703,
+ "learning_rate": 3.854409730177514e-06,
+ "loss": 0.0734,
+ "step": 26400
+ },
+ {
+ "epoch": 71.93732970027249,
+ "grad_norm": 3.0738816261291504,
+ "learning_rate": 3.8537135798246114e-06,
+ "loss": 0.0362,
+ "step": 26401
+ },
+ {
+ "epoch": 71.9400544959128,
+ "grad_norm": 2.7986834049224854,
+ "learning_rate": 3.8530174773387894e-06,
+ "loss": 0.0629,
+ "step": 26402
+ },
+ {
+ "epoch": 71.94277929155314,
+ "grad_norm": 3.095090627670288,
+ "learning_rate": 3.852321422725464e-06,
+ "loss": 0.0345,
+ "step": 26403
+ },
+ {
+ "epoch": 71.94550408719346,
+ "grad_norm": 5.287209987640381,
+ "learning_rate": 3.851625415990066e-06,
+ "loss": 0.0429,
+ "step": 26404
+ },
+ {
+ "epoch": 71.94822888283379,
+ "grad_norm": 2.890679121017456,
+ "learning_rate": 3.850929457138013e-06,
+ "loss": 0.139,
+ "step": 26405
+ },
+ {
+ "epoch": 71.95095367847412,
+ "grad_norm": 1.8992841243743896,
+ "learning_rate": 3.850233546174723e-06,
+ "loss": 0.0239,
+ "step": 26406
+ },
+ {
+ "epoch": 71.95367847411444,
+ "grad_norm": 2.375065326690674,
+ "learning_rate": 3.849537683105613e-06,
+ "loss": 0.0324,
+ "step": 26407
+ },
+ {
+ "epoch": 71.95640326975477,
+ "grad_norm": 4.101001262664795,
+ "learning_rate": 3.848841867936109e-06,
+ "loss": 0.1392,
+ "step": 26408
+ },
+ {
+ "epoch": 71.95912806539509,
+ "grad_norm": 2.77616810798645,
+ "learning_rate": 3.848146100671627e-06,
+ "loss": 0.0633,
+ "step": 26409
+ },
+ {
+ "epoch": 71.96185286103542,
+ "grad_norm": 3.357628583908081,
+ "learning_rate": 3.847450381317584e-06,
+ "loss": 0.044,
+ "step": 26410
+ },
+ {
+ "epoch": 71.96457765667574,
+ "grad_norm": 3.925208330154419,
+ "learning_rate": 3.8467547098793965e-06,
+ "loss": 0.0698,
+ "step": 26411
+ },
+ {
+ "epoch": 71.96730245231608,
+ "grad_norm": 3.3535728454589844,
+ "learning_rate": 3.846059086362489e-06,
+ "loss": 0.1013,
+ "step": 26412
+ },
+ {
+ "epoch": 71.97002724795641,
+ "grad_norm": 3.7744178771972656,
+ "learning_rate": 3.845363510772275e-06,
+ "loss": 0.1563,
+ "step": 26413
+ },
+ {
+ "epoch": 71.97275204359673,
+ "grad_norm": 3.1011741161346436,
+ "learning_rate": 3.844667983114172e-06,
+ "loss": 0.0599,
+ "step": 26414
+ },
+ {
+ "epoch": 71.97547683923706,
+ "grad_norm": 3.228482484817505,
+ "learning_rate": 3.843972503393594e-06,
+ "loss": 0.0707,
+ "step": 26415
+ },
+ {
+ "epoch": 71.97820163487738,
+ "grad_norm": 3.153712034225464,
+ "learning_rate": 3.843277071615962e-06,
+ "loss": 0.05,
+ "step": 26416
+ },
+ {
+ "epoch": 71.98092643051771,
+ "grad_norm": 6.8295769691467285,
+ "learning_rate": 3.842581687786691e-06,
+ "loss": 0.0461,
+ "step": 26417
+ },
+ {
+ "epoch": 71.98365122615803,
+ "grad_norm": 2.7410759925842285,
+ "learning_rate": 3.841886351911195e-06,
+ "loss": 0.0578,
+ "step": 26418
+ },
+ {
+ "epoch": 71.98637602179836,
+ "grad_norm": 3.6840834617614746,
+ "learning_rate": 3.841191063994887e-06,
+ "loss": 0.0611,
+ "step": 26419
+ },
+ {
+ "epoch": 71.9891008174387,
+ "grad_norm": 3.9045000076293945,
+ "learning_rate": 3.840495824043184e-06,
+ "loss": 0.0844,
+ "step": 26420
+ },
+ {
+ "epoch": 71.99182561307902,
+ "grad_norm": 1.457475185394287,
+ "learning_rate": 3.839800632061505e-06,
+ "loss": 0.0176,
+ "step": 26421
+ },
+ {
+ "epoch": 71.99455040871935,
+ "grad_norm": 4.588175296783447,
+ "learning_rate": 3.839105488055261e-06,
+ "loss": 0.0848,
+ "step": 26422
+ },
+ {
+ "epoch": 71.99727520435967,
+ "grad_norm": 4.111020565032959,
+ "learning_rate": 3.838410392029861e-06,
+ "loss": 0.0451,
+ "step": 26423
+ },
+ {
+ "epoch": 72.0,
+ "grad_norm": 3.852811813354492,
+ "learning_rate": 3.837715343990727e-06,
+ "loss": 0.1726,
+ "step": 26424
+ },
+ {
+ "epoch": 72.00272479564033,
+ "grad_norm": 3.460327625274658,
+ "learning_rate": 3.837020343943267e-06,
+ "loss": 0.0799,
+ "step": 26425
+ },
+ {
+ "epoch": 72.00544959128065,
+ "grad_norm": 4.512401103973389,
+ "learning_rate": 3.836325391892894e-06,
+ "loss": 0.1293,
+ "step": 26426
+ },
+ {
+ "epoch": 72.00817438692098,
+ "grad_norm": 4.811865329742432,
+ "learning_rate": 3.8356304878450165e-06,
+ "loss": 0.0375,
+ "step": 26427
+ },
+ {
+ "epoch": 72.0108991825613,
+ "grad_norm": 3.8618597984313965,
+ "learning_rate": 3.834935631805055e-06,
+ "loss": 0.1019,
+ "step": 26428
+ },
+ {
+ "epoch": 72.01362397820164,
+ "grad_norm": 3.3924152851104736,
+ "learning_rate": 3.834240823778416e-06,
+ "loss": 0.0459,
+ "step": 26429
+ },
+ {
+ "epoch": 72.01634877384195,
+ "grad_norm": 2.285546064376831,
+ "learning_rate": 3.833546063770512e-06,
+ "loss": 0.0358,
+ "step": 26430
+ },
+ {
+ "epoch": 72.01907356948229,
+ "grad_norm": 3.3915133476257324,
+ "learning_rate": 3.8328513517867475e-06,
+ "loss": 0.0485,
+ "step": 26431
+ },
+ {
+ "epoch": 72.02179836512262,
+ "grad_norm": 2.707864761352539,
+ "learning_rate": 3.832156687832542e-06,
+ "loss": 0.1161,
+ "step": 26432
+ },
+ {
+ "epoch": 72.02452316076294,
+ "grad_norm": 3.833160638809204,
+ "learning_rate": 3.831462071913302e-06,
+ "loss": 0.1003,
+ "step": 26433
+ },
+ {
+ "epoch": 72.02724795640327,
+ "grad_norm": 3.3467867374420166,
+ "learning_rate": 3.8307675040344375e-06,
+ "loss": 0.0579,
+ "step": 26434
+ },
+ {
+ "epoch": 72.02997275204359,
+ "grad_norm": 1.303076148033142,
+ "learning_rate": 3.830072984201353e-06,
+ "loss": 0.0191,
+ "step": 26435
+ },
+ {
+ "epoch": 72.03269754768392,
+ "grad_norm": 4.522215366363525,
+ "learning_rate": 3.829378512419465e-06,
+ "loss": 0.1038,
+ "step": 26436
+ },
+ {
+ "epoch": 72.03542234332426,
+ "grad_norm": 3.8533568382263184,
+ "learning_rate": 3.828684088694174e-06,
+ "loss": 0.1413,
+ "step": 26437
+ },
+ {
+ "epoch": 72.03814713896458,
+ "grad_norm": 3.332747459411621,
+ "learning_rate": 3.827989713030899e-06,
+ "loss": 0.0996,
+ "step": 26438
+ },
+ {
+ "epoch": 72.04087193460491,
+ "grad_norm": 2.6036112308502197,
+ "learning_rate": 3.827295385435039e-06,
+ "loss": 0.1129,
+ "step": 26439
+ },
+ {
+ "epoch": 72.04359673024523,
+ "grad_norm": 2.8100404739379883,
+ "learning_rate": 3.826601105912001e-06,
+ "loss": 0.0762,
+ "step": 26440
+ },
+ {
+ "epoch": 72.04632152588556,
+ "grad_norm": 2.9402518272399902,
+ "learning_rate": 3.825906874467199e-06,
+ "loss": 0.0324,
+ "step": 26441
+ },
+ {
+ "epoch": 72.04904632152588,
+ "grad_norm": 3.8927853107452393,
+ "learning_rate": 3.825212691106035e-06,
+ "loss": 0.0726,
+ "step": 26442
+ },
+ {
+ "epoch": 72.05177111716621,
+ "grad_norm": 3.7210917472839355,
+ "learning_rate": 3.824518555833916e-06,
+ "loss": 0.1208,
+ "step": 26443
+ },
+ {
+ "epoch": 72.05449591280654,
+ "grad_norm": 2.8822295665740967,
+ "learning_rate": 3.823824468656245e-06,
+ "loss": 0.0375,
+ "step": 26444
+ },
+ {
+ "epoch": 72.05722070844686,
+ "grad_norm": 9.227213859558105,
+ "learning_rate": 3.823130429578432e-06,
+ "loss": 0.0432,
+ "step": 26445
+ },
+ {
+ "epoch": 72.0599455040872,
+ "grad_norm": 2.4599592685699463,
+ "learning_rate": 3.822436438605881e-06,
+ "loss": 0.0275,
+ "step": 26446
+ },
+ {
+ "epoch": 72.06267029972751,
+ "grad_norm": 4.226046085357666,
+ "learning_rate": 3.821742495743993e-06,
+ "loss": 0.067,
+ "step": 26447
+ },
+ {
+ "epoch": 72.06539509536785,
+ "grad_norm": 3.2443578243255615,
+ "learning_rate": 3.82104860099818e-06,
+ "loss": 0.0379,
+ "step": 26448
+ },
+ {
+ "epoch": 72.06811989100818,
+ "grad_norm": 3.0962071418762207,
+ "learning_rate": 3.8203547543738395e-06,
+ "loss": 0.047,
+ "step": 26449
+ },
+ {
+ "epoch": 72.0708446866485,
+ "grad_norm": 2.8933916091918945,
+ "learning_rate": 3.819660955876378e-06,
+ "loss": 0.032,
+ "step": 26450
+ },
+ {
+ "epoch": 72.07356948228883,
+ "grad_norm": 4.149245738983154,
+ "learning_rate": 3.818967205511196e-06,
+ "loss": 0.1032,
+ "step": 26451
+ },
+ {
+ "epoch": 72.07629427792915,
+ "grad_norm": 5.366902828216553,
+ "learning_rate": 3.8182735032837015e-06,
+ "loss": 0.1421,
+ "step": 26452
+ },
+ {
+ "epoch": 72.07901907356948,
+ "grad_norm": 2.3826136589050293,
+ "learning_rate": 3.817579849199293e-06,
+ "loss": 0.0374,
+ "step": 26453
+ },
+ {
+ "epoch": 72.0817438692098,
+ "grad_norm": 2.4784250259399414,
+ "learning_rate": 3.816886243263371e-06,
+ "loss": 0.0509,
+ "step": 26454
+ },
+ {
+ "epoch": 72.08446866485014,
+ "grad_norm": 3.469705581665039,
+ "learning_rate": 3.816192685481344e-06,
+ "loss": 0.0487,
+ "step": 26455
+ },
+ {
+ "epoch": 72.08719346049047,
+ "grad_norm": 2.6644678115844727,
+ "learning_rate": 3.8154991758586045e-06,
+ "loss": 0.0463,
+ "step": 26456
+ },
+ {
+ "epoch": 72.08991825613079,
+ "grad_norm": 2.715855836868286,
+ "learning_rate": 3.814805714400562e-06,
+ "loss": 0.0289,
+ "step": 26457
+ },
+ {
+ "epoch": 72.09264305177112,
+ "grad_norm": 2.837583065032959,
+ "learning_rate": 3.8141123011126135e-06,
+ "loss": 0.1801,
+ "step": 26458
+ },
+ {
+ "epoch": 72.09536784741144,
+ "grad_norm": 4.77943754196167,
+ "learning_rate": 3.8134189360001604e-06,
+ "loss": 0.1445,
+ "step": 26459
+ },
+ {
+ "epoch": 72.09809264305177,
+ "grad_norm": 2.1811513900756836,
+ "learning_rate": 3.8127256190685968e-06,
+ "loss": 0.2314,
+ "step": 26460
+ },
+ {
+ "epoch": 72.1008174386921,
+ "grad_norm": 3.9631247520446777,
+ "learning_rate": 3.8120323503233315e-06,
+ "loss": 0.0357,
+ "step": 26461
+ },
+ {
+ "epoch": 72.10354223433242,
+ "grad_norm": 2.710859537124634,
+ "learning_rate": 3.811339129769758e-06,
+ "loss": 0.0996,
+ "step": 26462
+ },
+ {
+ "epoch": 72.10626702997276,
+ "grad_norm": 3.615741014480591,
+ "learning_rate": 3.810645957413277e-06,
+ "loss": 0.0389,
+ "step": 26463
+ },
+ {
+ "epoch": 72.10899182561307,
+ "grad_norm": 3.7355191707611084,
+ "learning_rate": 3.8099528332592817e-06,
+ "loss": 0.0818,
+ "step": 26464
+ },
+ {
+ "epoch": 72.11171662125341,
+ "grad_norm": 2.5932669639587402,
+ "learning_rate": 3.8092597573131796e-06,
+ "loss": 0.0276,
+ "step": 26465
+ },
+ {
+ "epoch": 72.11444141689373,
+ "grad_norm": 4.68644380569458,
+ "learning_rate": 3.8085667295803617e-06,
+ "loss": 0.1885,
+ "step": 26466
+ },
+ {
+ "epoch": 72.11716621253406,
+ "grad_norm": 4.039291858673096,
+ "learning_rate": 3.8078737500662277e-06,
+ "loss": 0.1143,
+ "step": 26467
+ },
+ {
+ "epoch": 72.11989100817439,
+ "grad_norm": 2.1027610301971436,
+ "learning_rate": 3.8071808187761696e-06,
+ "loss": 0.0307,
+ "step": 26468
+ },
+ {
+ "epoch": 72.12261580381471,
+ "grad_norm": 2.5047619342803955,
+ "learning_rate": 3.8064879357155915e-06,
+ "loss": 0.1368,
+ "step": 26469
+ },
+ {
+ "epoch": 72.12534059945504,
+ "grad_norm": 3.0962514877319336,
+ "learning_rate": 3.8057951008898865e-06,
+ "loss": 0.1067,
+ "step": 26470
+ },
+ {
+ "epoch": 72.12806539509536,
+ "grad_norm": 2.2265589237213135,
+ "learning_rate": 3.8051023143044464e-06,
+ "loss": 0.0193,
+ "step": 26471
+ },
+ {
+ "epoch": 72.1307901907357,
+ "grad_norm": 2.836852788925171,
+ "learning_rate": 3.8044095759646694e-06,
+ "loss": 0.0558,
+ "step": 26472
+ },
+ {
+ "epoch": 72.13351498637603,
+ "grad_norm": 5.074002742767334,
+ "learning_rate": 3.8037168858759556e-06,
+ "loss": 0.2786,
+ "step": 26473
+ },
+ {
+ "epoch": 72.13623978201635,
+ "grad_norm": 2.991013765335083,
+ "learning_rate": 3.8030242440436947e-06,
+ "loss": 0.0744,
+ "step": 26474
+ },
+ {
+ "epoch": 72.13896457765668,
+ "grad_norm": 3.196929931640625,
+ "learning_rate": 3.802331650473281e-06,
+ "loss": 0.0702,
+ "step": 26475
+ },
+ {
+ "epoch": 72.141689373297,
+ "grad_norm": 5.008358478546143,
+ "learning_rate": 3.8016391051701063e-06,
+ "loss": 0.0489,
+ "step": 26476
+ },
+ {
+ "epoch": 72.14441416893733,
+ "grad_norm": 2.833855152130127,
+ "learning_rate": 3.8009466081395707e-06,
+ "loss": 0.0647,
+ "step": 26477
+ },
+ {
+ "epoch": 72.14713896457765,
+ "grad_norm": 2.50533390045166,
+ "learning_rate": 3.8002541593870624e-06,
+ "loss": 0.0335,
+ "step": 26478
+ },
+ {
+ "epoch": 72.14986376021798,
+ "grad_norm": 2.8171579837799072,
+ "learning_rate": 3.7995617589179758e-06,
+ "loss": 0.0969,
+ "step": 26479
+ },
+ {
+ "epoch": 72.15258855585832,
+ "grad_norm": 2.2267115116119385,
+ "learning_rate": 3.7988694067376987e-06,
+ "loss": 0.0515,
+ "step": 26480
+ },
+ {
+ "epoch": 72.15531335149863,
+ "grad_norm": 3.8708081245422363,
+ "learning_rate": 3.7981771028516303e-06,
+ "loss": 0.0396,
+ "step": 26481
+ },
+ {
+ "epoch": 72.15803814713897,
+ "grad_norm": 2.921945571899414,
+ "learning_rate": 3.7974848472651593e-06,
+ "loss": 0.1003,
+ "step": 26482
+ },
+ {
+ "epoch": 72.16076294277929,
+ "grad_norm": 2.610873222351074,
+ "learning_rate": 3.7967926399836775e-06,
+ "loss": 0.0532,
+ "step": 26483
+ },
+ {
+ "epoch": 72.16348773841962,
+ "grad_norm": 2.5172135829925537,
+ "learning_rate": 3.796100481012571e-06,
+ "loss": 0.0315,
+ "step": 26484
+ },
+ {
+ "epoch": 72.16621253405995,
+ "grad_norm": 2.580249071121216,
+ "learning_rate": 3.7954083703572376e-06,
+ "loss": 0.0455,
+ "step": 26485
+ },
+ {
+ "epoch": 72.16893732970027,
+ "grad_norm": 3.4453303813934326,
+ "learning_rate": 3.7947163080230644e-06,
+ "loss": 0.1394,
+ "step": 26486
+ },
+ {
+ "epoch": 72.1716621253406,
+ "grad_norm": 2.4160969257354736,
+ "learning_rate": 3.7940242940154404e-06,
+ "loss": 0.0503,
+ "step": 26487
+ },
+ {
+ "epoch": 72.17438692098092,
+ "grad_norm": 5.730032920837402,
+ "learning_rate": 3.793332328339752e-06,
+ "loss": 0.0362,
+ "step": 26488
+ },
+ {
+ "epoch": 72.17711171662125,
+ "grad_norm": 3.2699761390686035,
+ "learning_rate": 3.7926404110013913e-06,
+ "loss": 0.1083,
+ "step": 26489
+ },
+ {
+ "epoch": 72.17983651226157,
+ "grad_norm": 3.17868971824646,
+ "learning_rate": 3.791948542005751e-06,
+ "loss": 0.0805,
+ "step": 26490
+ },
+ {
+ "epoch": 72.1825613079019,
+ "grad_norm": 2.672743797302246,
+ "learning_rate": 3.791256721358216e-06,
+ "loss": 0.096,
+ "step": 26491
+ },
+ {
+ "epoch": 72.18528610354224,
+ "grad_norm": 9.494412422180176,
+ "learning_rate": 3.7905649490641704e-06,
+ "loss": 0.1418,
+ "step": 26492
+ },
+ {
+ "epoch": 72.18801089918256,
+ "grad_norm": 2.820760726928711,
+ "learning_rate": 3.789873225129009e-06,
+ "loss": 0.0324,
+ "step": 26493
+ },
+ {
+ "epoch": 72.19073569482289,
+ "grad_norm": 6.814089298248291,
+ "learning_rate": 3.789181549558114e-06,
+ "loss": 0.1112,
+ "step": 26494
+ },
+ {
+ "epoch": 72.19346049046321,
+ "grad_norm": 3.728151559829712,
+ "learning_rate": 3.788489922356874e-06,
+ "loss": 0.0513,
+ "step": 26495
+ },
+ {
+ "epoch": 72.19618528610354,
+ "grad_norm": 3.132028579711914,
+ "learning_rate": 3.787798343530671e-06,
+ "loss": 0.035,
+ "step": 26496
+ },
+ {
+ "epoch": 72.19891008174388,
+ "grad_norm": 3.118652820587158,
+ "learning_rate": 3.7871068130848974e-06,
+ "loss": 0.0731,
+ "step": 26497
+ },
+ {
+ "epoch": 72.2016348773842,
+ "grad_norm": 3.4296882152557373,
+ "learning_rate": 3.7864153310249376e-06,
+ "loss": 0.0977,
+ "step": 26498
+ },
+ {
+ "epoch": 72.20435967302453,
+ "grad_norm": 2.929823637008667,
+ "learning_rate": 3.7857238973561737e-06,
+ "loss": 0.048,
+ "step": 26499
+ },
+ {
+ "epoch": 72.20708446866485,
+ "grad_norm": 4.002386569976807,
+ "learning_rate": 3.785032512083989e-06,
+ "loss": 0.0714,
+ "step": 26500
+ },
+ {
+ "epoch": 72.20980926430518,
+ "grad_norm": 2.456514835357666,
+ "learning_rate": 3.784341175213775e-06,
+ "loss": 0.0449,
+ "step": 26501
+ },
+ {
+ "epoch": 72.2125340599455,
+ "grad_norm": 2.193502187728882,
+ "learning_rate": 3.7836498867509108e-06,
+ "loss": 0.098,
+ "step": 26502
+ },
+ {
+ "epoch": 72.21525885558583,
+ "grad_norm": 3.205998420715332,
+ "learning_rate": 3.782958646700782e-06,
+ "loss": 0.1279,
+ "step": 26503
+ },
+ {
+ "epoch": 72.21798365122616,
+ "grad_norm": 3.640317916870117,
+ "learning_rate": 3.7822674550687676e-06,
+ "loss": 0.1048,
+ "step": 26504
+ },
+ {
+ "epoch": 72.22070844686648,
+ "grad_norm": 2.3547284603118896,
+ "learning_rate": 3.7815763118602577e-06,
+ "loss": 0.0247,
+ "step": 26505
+ },
+ {
+ "epoch": 72.22343324250681,
+ "grad_norm": 2.100797176361084,
+ "learning_rate": 3.7808852170806275e-06,
+ "loss": 0.0365,
+ "step": 26506
+ },
+ {
+ "epoch": 72.22615803814713,
+ "grad_norm": 1.5812318325042725,
+ "learning_rate": 3.780194170735266e-06,
+ "loss": 0.0248,
+ "step": 26507
+ },
+ {
+ "epoch": 72.22888283378747,
+ "grad_norm": 4.499730110168457,
+ "learning_rate": 3.779503172829554e-06,
+ "loss": 0.0948,
+ "step": 26508
+ },
+ {
+ "epoch": 72.2316076294278,
+ "grad_norm": 2.98199725151062,
+ "learning_rate": 3.778812223368866e-06,
+ "loss": 0.124,
+ "step": 26509
+ },
+ {
+ "epoch": 72.23433242506812,
+ "grad_norm": 3.3595364093780518,
+ "learning_rate": 3.778121322358592e-06,
+ "loss": 0.0216,
+ "step": 26510
+ },
+ {
+ "epoch": 72.23705722070845,
+ "grad_norm": 2.3541762828826904,
+ "learning_rate": 3.77743046980411e-06,
+ "loss": 0.0295,
+ "step": 26511
+ },
+ {
+ "epoch": 72.23978201634877,
+ "grad_norm": 3.811251401901245,
+ "learning_rate": 3.7767396657107936e-06,
+ "loss": 0.0624,
+ "step": 26512
+ },
+ {
+ "epoch": 72.2425068119891,
+ "grad_norm": 2.8131866455078125,
+ "learning_rate": 3.776048910084034e-06,
+ "loss": 0.0616,
+ "step": 26513
+ },
+ {
+ "epoch": 72.24523160762942,
+ "grad_norm": 2.430534601211548,
+ "learning_rate": 3.7753582029292037e-06,
+ "loss": 0.1069,
+ "step": 26514
+ },
+ {
+ "epoch": 72.24795640326975,
+ "grad_norm": 2.720771074295044,
+ "learning_rate": 3.774667544251683e-06,
+ "loss": 0.0496,
+ "step": 26515
+ },
+ {
+ "epoch": 72.25068119891009,
+ "grad_norm": 3.8845908641815186,
+ "learning_rate": 3.773976934056849e-06,
+ "loss": 0.0476,
+ "step": 26516
+ },
+ {
+ "epoch": 72.2534059945504,
+ "grad_norm": 3.750916004180908,
+ "learning_rate": 3.7732863723500855e-06,
+ "loss": 0.0674,
+ "step": 26517
+ },
+ {
+ "epoch": 72.25613079019074,
+ "grad_norm": 2.2411701679229736,
+ "learning_rate": 3.7725958591367675e-06,
+ "loss": 0.0319,
+ "step": 26518
+ },
+ {
+ "epoch": 72.25885558583106,
+ "grad_norm": 3.2152843475341797,
+ "learning_rate": 3.7719053944222715e-06,
+ "loss": 0.1024,
+ "step": 26519
+ },
+ {
+ "epoch": 72.26158038147139,
+ "grad_norm": 2.3171660900115967,
+ "learning_rate": 3.7712149782119733e-06,
+ "loss": 0.0278,
+ "step": 26520
+ },
+ {
+ "epoch": 72.26430517711172,
+ "grad_norm": 3.022448778152466,
+ "learning_rate": 3.770524610511256e-06,
+ "loss": 0.0471,
+ "step": 26521
+ },
+ {
+ "epoch": 72.26702997275204,
+ "grad_norm": 2.9819817543029785,
+ "learning_rate": 3.7698342913254913e-06,
+ "loss": 0.1696,
+ "step": 26522
+ },
+ {
+ "epoch": 72.26975476839237,
+ "grad_norm": 3.3681530952453613,
+ "learning_rate": 3.769144020660054e-06,
+ "loss": 0.0702,
+ "step": 26523
+ },
+ {
+ "epoch": 72.2724795640327,
+ "grad_norm": 3.5201833248138428,
+ "learning_rate": 3.7684537985203263e-06,
+ "loss": 0.128,
+ "step": 26524
+ },
+ {
+ "epoch": 72.27520435967303,
+ "grad_norm": 3.9061806201934814,
+ "learning_rate": 3.7677636249116755e-06,
+ "loss": 0.0609,
+ "step": 26525
+ },
+ {
+ "epoch": 72.27792915531334,
+ "grad_norm": 2.433267831802368,
+ "learning_rate": 3.7670734998394855e-06,
+ "loss": 0.1045,
+ "step": 26526
+ },
+ {
+ "epoch": 72.28065395095368,
+ "grad_norm": 3.156240224838257,
+ "learning_rate": 3.7663834233091257e-06,
+ "loss": 0.0474,
+ "step": 26527
+ },
+ {
+ "epoch": 72.28337874659401,
+ "grad_norm": 2.4976119995117188,
+ "learning_rate": 3.765693395325971e-06,
+ "loss": 0.0323,
+ "step": 26528
+ },
+ {
+ "epoch": 72.28610354223433,
+ "grad_norm": 4.028443813323975,
+ "learning_rate": 3.765003415895393e-06,
+ "loss": 0.1099,
+ "step": 26529
+ },
+ {
+ "epoch": 72.28882833787466,
+ "grad_norm": 2.569737672805786,
+ "learning_rate": 3.76431348502277e-06,
+ "loss": 0.0506,
+ "step": 26530
+ },
+ {
+ "epoch": 72.29155313351498,
+ "grad_norm": 3.3727774620056152,
+ "learning_rate": 3.7636236027134733e-06,
+ "loss": 0.0491,
+ "step": 26531
+ },
+ {
+ "epoch": 72.29427792915531,
+ "grad_norm": 10.414998054504395,
+ "learning_rate": 3.7629337689728763e-06,
+ "loss": 0.051,
+ "step": 26532
+ },
+ {
+ "epoch": 72.29700272479565,
+ "grad_norm": 2.196016788482666,
+ "learning_rate": 3.762243983806345e-06,
+ "loss": 0.0331,
+ "step": 26533
+ },
+ {
+ "epoch": 72.29972752043597,
+ "grad_norm": 4.307570457458496,
+ "learning_rate": 3.7615542472192624e-06,
+ "loss": 0.0653,
+ "step": 26534
+ },
+ {
+ "epoch": 72.3024523160763,
+ "grad_norm": 3.4602112770080566,
+ "learning_rate": 3.7608645592169935e-06,
+ "loss": 0.0495,
+ "step": 26535
+ },
+ {
+ "epoch": 72.30517711171662,
+ "grad_norm": 2.949125289916992,
+ "learning_rate": 3.7601749198049064e-06,
+ "loss": 0.0538,
+ "step": 26536
+ },
+ {
+ "epoch": 72.30790190735695,
+ "grad_norm": 3.042327880859375,
+ "learning_rate": 3.75948532898838e-06,
+ "loss": 0.1376,
+ "step": 26537
+ },
+ {
+ "epoch": 72.31062670299727,
+ "grad_norm": 3.713318109512329,
+ "learning_rate": 3.758795786772782e-06,
+ "loss": 0.0448,
+ "step": 26538
+ },
+ {
+ "epoch": 72.3133514986376,
+ "grad_norm": 3.653341770172119,
+ "learning_rate": 3.7581062931634802e-06,
+ "loss": 0.088,
+ "step": 26539
+ },
+ {
+ "epoch": 72.31607629427793,
+ "grad_norm": 2.4039220809936523,
+ "learning_rate": 3.7574168481658435e-06,
+ "loss": 0.0694,
+ "step": 26540
+ },
+ {
+ "epoch": 72.31880108991825,
+ "grad_norm": 2.4391045570373535,
+ "learning_rate": 3.7567274517852424e-06,
+ "loss": 0.0649,
+ "step": 26541
+ },
+ {
+ "epoch": 72.32152588555859,
+ "grad_norm": 2.974087715148926,
+ "learning_rate": 3.756038104027051e-06,
+ "loss": 0.167,
+ "step": 26542
+ },
+ {
+ "epoch": 72.3242506811989,
+ "grad_norm": 2.3259406089782715,
+ "learning_rate": 3.7553488048966346e-06,
+ "loss": 0.04,
+ "step": 26543
+ },
+ {
+ "epoch": 72.32697547683924,
+ "grad_norm": 3.064772844314575,
+ "learning_rate": 3.75465955439936e-06,
+ "loss": 0.0509,
+ "step": 26544
+ },
+ {
+ "epoch": 72.32970027247957,
+ "grad_norm": 2.7310149669647217,
+ "learning_rate": 3.7539703525405925e-06,
+ "loss": 0.048,
+ "step": 26545
+ },
+ {
+ "epoch": 72.33242506811989,
+ "grad_norm": 2.478053569793701,
+ "learning_rate": 3.7532811993257056e-06,
+ "loss": 0.0353,
+ "step": 26546
+ },
+ {
+ "epoch": 72.33514986376022,
+ "grad_norm": 2.859170436859131,
+ "learning_rate": 3.752592094760065e-06,
+ "loss": 0.0429,
+ "step": 26547
+ },
+ {
+ "epoch": 72.33787465940054,
+ "grad_norm": 3.3203647136688232,
+ "learning_rate": 3.751903038849034e-06,
+ "loss": 0.0537,
+ "step": 26548
+ },
+ {
+ "epoch": 72.34059945504087,
+ "grad_norm": 3.221702814102173,
+ "learning_rate": 3.7512140315979794e-06,
+ "loss": 0.1904,
+ "step": 26549
+ },
+ {
+ "epoch": 72.34332425068119,
+ "grad_norm": 2.855668783187866,
+ "learning_rate": 3.750525073012271e-06,
+ "loss": 0.1714,
+ "step": 26550
+ },
+ {
+ "epoch": 72.34604904632153,
+ "grad_norm": 3.7057361602783203,
+ "learning_rate": 3.7498361630972733e-06,
+ "loss": 0.0936,
+ "step": 26551
+ },
+ {
+ "epoch": 72.34877384196186,
+ "grad_norm": 2.206052303314209,
+ "learning_rate": 3.7491473018583503e-06,
+ "loss": 0.0285,
+ "step": 26552
+ },
+ {
+ "epoch": 72.35149863760218,
+ "grad_norm": 2.6182804107666016,
+ "learning_rate": 3.7484584893008634e-06,
+ "loss": 0.0312,
+ "step": 26553
+ },
+ {
+ "epoch": 72.35422343324251,
+ "grad_norm": 2.748892307281494,
+ "learning_rate": 3.7477697254301836e-06,
+ "loss": 0.0283,
+ "step": 26554
+ },
+ {
+ "epoch": 72.35694822888283,
+ "grad_norm": 3.3066937923431396,
+ "learning_rate": 3.7470810102516717e-06,
+ "loss": 0.0997,
+ "step": 26555
+ },
+ {
+ "epoch": 72.35967302452316,
+ "grad_norm": 2.5142152309417725,
+ "learning_rate": 3.7463923437706896e-06,
+ "loss": 0.0376,
+ "step": 26556
+ },
+ {
+ "epoch": 72.3623978201635,
+ "grad_norm": 2.5725595951080322,
+ "learning_rate": 3.7457037259926043e-06,
+ "loss": 0.0853,
+ "step": 26557
+ },
+ {
+ "epoch": 72.36512261580381,
+ "grad_norm": 2.77140212059021,
+ "learning_rate": 3.7450151569227743e-06,
+ "loss": 0.0989,
+ "step": 26558
+ },
+ {
+ "epoch": 72.36784741144415,
+ "grad_norm": 2.4653334617614746,
+ "learning_rate": 3.744326636566569e-06,
+ "loss": 0.0472,
+ "step": 26559
+ },
+ {
+ "epoch": 72.37057220708446,
+ "grad_norm": 3.0174481868743896,
+ "learning_rate": 3.7436381649293463e-06,
+ "loss": 0.0407,
+ "step": 26560
+ },
+ {
+ "epoch": 72.3732970027248,
+ "grad_norm": 3.057506561279297,
+ "learning_rate": 3.7429497420164638e-06,
+ "loss": 0.1448,
+ "step": 26561
+ },
+ {
+ "epoch": 72.37602179836512,
+ "grad_norm": 2.8814988136291504,
+ "learning_rate": 3.742261367833292e-06,
+ "loss": 0.0594,
+ "step": 26562
+ },
+ {
+ "epoch": 72.37874659400545,
+ "grad_norm": 3.040027618408203,
+ "learning_rate": 3.741573042385187e-06,
+ "loss": 0.0563,
+ "step": 26563
+ },
+ {
+ "epoch": 72.38147138964578,
+ "grad_norm": 2.5569448471069336,
+ "learning_rate": 3.740884765677509e-06,
+ "loss": 0.0541,
+ "step": 26564
+ },
+ {
+ "epoch": 72.3841961852861,
+ "grad_norm": 3.7037227153778076,
+ "learning_rate": 3.740196537715617e-06,
+ "loss": 0.0613,
+ "step": 26565
+ },
+ {
+ "epoch": 72.38692098092643,
+ "grad_norm": 2.6009268760681152,
+ "learning_rate": 3.7395083585048752e-06,
+ "loss": 0.0523,
+ "step": 26566
+ },
+ {
+ "epoch": 72.38964577656675,
+ "grad_norm": 4.700798034667969,
+ "learning_rate": 3.7388202280506413e-06,
+ "loss": 0.0878,
+ "step": 26567
+ },
+ {
+ "epoch": 72.39237057220708,
+ "grad_norm": 2.977999210357666,
+ "learning_rate": 3.738132146358273e-06,
+ "loss": 0.1726,
+ "step": 26568
+ },
+ {
+ "epoch": 72.39509536784742,
+ "grad_norm": 2.9839766025543213,
+ "learning_rate": 3.7374441134331276e-06,
+ "loss": 0.2143,
+ "step": 26569
+ },
+ {
+ "epoch": 72.39782016348774,
+ "grad_norm": 3.3047571182250977,
+ "learning_rate": 3.7367561292805686e-06,
+ "loss": 0.1686,
+ "step": 26570
+ },
+ {
+ "epoch": 72.40054495912807,
+ "grad_norm": 3.0683958530426025,
+ "learning_rate": 3.736068193905952e-06,
+ "loss": 0.1967,
+ "step": 26571
+ },
+ {
+ "epoch": 72.40326975476839,
+ "grad_norm": 1.989783525466919,
+ "learning_rate": 3.7353803073146343e-06,
+ "loss": 0.0271,
+ "step": 26572
+ },
+ {
+ "epoch": 72.40599455040872,
+ "grad_norm": 3.054657220840454,
+ "learning_rate": 3.73469246951197e-06,
+ "loss": 0.0312,
+ "step": 26573
+ },
+ {
+ "epoch": 72.40871934604904,
+ "grad_norm": 2.4195311069488525,
+ "learning_rate": 3.7340046805033224e-06,
+ "loss": 0.1068,
+ "step": 26574
+ },
+ {
+ "epoch": 72.41144414168937,
+ "grad_norm": 2.761606454849243,
+ "learning_rate": 3.7333169402940407e-06,
+ "loss": 0.234,
+ "step": 26575
+ },
+ {
+ "epoch": 72.4141689373297,
+ "grad_norm": 3.4567863941192627,
+ "learning_rate": 3.732629248889489e-06,
+ "loss": 0.1427,
+ "step": 26576
+ },
+ {
+ "epoch": 72.41689373297002,
+ "grad_norm": 3.849689245223999,
+ "learning_rate": 3.7319416062950154e-06,
+ "loss": 0.1498,
+ "step": 26577
+ },
+ {
+ "epoch": 72.41961852861036,
+ "grad_norm": 2.1619315147399902,
+ "learning_rate": 3.731254012515982e-06,
+ "loss": 0.0286,
+ "step": 26578
+ },
+ {
+ "epoch": 72.42234332425068,
+ "grad_norm": 3.229844570159912,
+ "learning_rate": 3.7305664675577415e-06,
+ "loss": 0.0593,
+ "step": 26579
+ },
+ {
+ "epoch": 72.42506811989101,
+ "grad_norm": 3.447657585144043,
+ "learning_rate": 3.729878971425647e-06,
+ "loss": 0.0839,
+ "step": 26580
+ },
+ {
+ "epoch": 72.42779291553134,
+ "grad_norm": 2.009647846221924,
+ "learning_rate": 3.72919152412505e-06,
+ "loss": 0.0259,
+ "step": 26581
+ },
+ {
+ "epoch": 72.43051771117166,
+ "grad_norm": 4.244502067565918,
+ "learning_rate": 3.7285041256613095e-06,
+ "loss": 0.0511,
+ "step": 26582
+ },
+ {
+ "epoch": 72.433242506812,
+ "grad_norm": 3.3259167671203613,
+ "learning_rate": 3.7278167760397788e-06,
+ "loss": 0.1067,
+ "step": 26583
+ },
+ {
+ "epoch": 72.43596730245231,
+ "grad_norm": 3.9733872413635254,
+ "learning_rate": 3.7271294752658093e-06,
+ "loss": 0.0612,
+ "step": 26584
+ },
+ {
+ "epoch": 72.43869209809264,
+ "grad_norm": 2.89430832862854,
+ "learning_rate": 3.7264422233447496e-06,
+ "loss": 0.046,
+ "step": 26585
+ },
+ {
+ "epoch": 72.44141689373296,
+ "grad_norm": 3.904181957244873,
+ "learning_rate": 3.7257550202819593e-06,
+ "loss": 0.3219,
+ "step": 26586
+ },
+ {
+ "epoch": 72.4441416893733,
+ "grad_norm": 2.950934886932373,
+ "learning_rate": 3.7250678660827867e-06,
+ "loss": 0.0394,
+ "step": 26587
+ },
+ {
+ "epoch": 72.44686648501363,
+ "grad_norm": 3.6347861289978027,
+ "learning_rate": 3.724380760752584e-06,
+ "loss": 0.0587,
+ "step": 26588
+ },
+ {
+ "epoch": 72.44959128065395,
+ "grad_norm": 3.4159059524536133,
+ "learning_rate": 3.723693704296698e-06,
+ "loss": 0.0834,
+ "step": 26589
+ },
+ {
+ "epoch": 72.45231607629428,
+ "grad_norm": 3.026069164276123,
+ "learning_rate": 3.723006696720487e-06,
+ "loss": 0.1139,
+ "step": 26590
+ },
+ {
+ "epoch": 72.4550408719346,
+ "grad_norm": 4.08567476272583,
+ "learning_rate": 3.7223197380292986e-06,
+ "loss": 0.0452,
+ "step": 26591
+ },
+ {
+ "epoch": 72.45776566757493,
+ "grad_norm": 3.3417935371398926,
+ "learning_rate": 3.7216328282284776e-06,
+ "loss": 0.2245,
+ "step": 26592
+ },
+ {
+ "epoch": 72.46049046321527,
+ "grad_norm": 3.017200231552124,
+ "learning_rate": 3.7209459673233817e-06,
+ "loss": 0.0349,
+ "step": 26593
+ },
+ {
+ "epoch": 72.46321525885558,
+ "grad_norm": 3.1273984909057617,
+ "learning_rate": 3.7202591553193534e-06,
+ "loss": 0.0397,
+ "step": 26594
+ },
+ {
+ "epoch": 72.46594005449592,
+ "grad_norm": 3.3112401962280273,
+ "learning_rate": 3.7195723922217487e-06,
+ "loss": 0.0501,
+ "step": 26595
+ },
+ {
+ "epoch": 72.46866485013624,
+ "grad_norm": 5.199794292449951,
+ "learning_rate": 3.7188856780359117e-06,
+ "loss": 0.0353,
+ "step": 26596
+ },
+ {
+ "epoch": 72.47138964577657,
+ "grad_norm": 4.355407238006592,
+ "learning_rate": 3.718199012767186e-06,
+ "loss": 0.3405,
+ "step": 26597
+ },
+ {
+ "epoch": 72.47411444141689,
+ "grad_norm": 3.16474986076355,
+ "learning_rate": 3.7175123964209293e-06,
+ "loss": 0.0604,
+ "step": 26598
+ },
+ {
+ "epoch": 72.47683923705722,
+ "grad_norm": 3.2281923294067383,
+ "learning_rate": 3.716825829002484e-06,
+ "loss": 0.0713,
+ "step": 26599
+ },
+ {
+ "epoch": 72.47956403269755,
+ "grad_norm": 3.2811269760131836,
+ "learning_rate": 3.716139310517196e-06,
+ "loss": 0.1078,
+ "step": 26600
+ },
+ {
+ "epoch": 72.48228882833787,
+ "grad_norm": 2.6293327808380127,
+ "learning_rate": 3.7154528409704095e-06,
+ "loss": 0.1453,
+ "step": 26601
+ },
+ {
+ "epoch": 72.4850136239782,
+ "grad_norm": 4.739869594573975,
+ "learning_rate": 3.714766420367478e-06,
+ "loss": 0.0462,
+ "step": 26602
+ },
+ {
+ "epoch": 72.48773841961852,
+ "grad_norm": 2.9011590480804443,
+ "learning_rate": 3.7140800487137428e-06,
+ "loss": 0.0772,
+ "step": 26603
+ },
+ {
+ "epoch": 72.49046321525886,
+ "grad_norm": 3.0490882396698,
+ "learning_rate": 3.71339372601455e-06,
+ "loss": 0.0356,
+ "step": 26604
+ },
+ {
+ "epoch": 72.49318801089919,
+ "grad_norm": 2.6441643238067627,
+ "learning_rate": 3.7127074522752416e-06,
+ "loss": 0.0935,
+ "step": 26605
+ },
+ {
+ "epoch": 72.49591280653951,
+ "grad_norm": 3.0331103801727295,
+ "learning_rate": 3.712021227501168e-06,
+ "loss": 0.0676,
+ "step": 26606
+ },
+ {
+ "epoch": 72.49863760217984,
+ "grad_norm": 3.3428590297698975,
+ "learning_rate": 3.711335051697671e-06,
+ "loss": 0.1346,
+ "step": 26607
+ },
+ {
+ "epoch": 72.50136239782016,
+ "grad_norm": 2.761168956756592,
+ "learning_rate": 3.710648924870094e-06,
+ "loss": 0.0494,
+ "step": 26608
+ },
+ {
+ "epoch": 72.50408719346049,
+ "grad_norm": 2.2414186000823975,
+ "learning_rate": 3.709962847023777e-06,
+ "loss": 0.1006,
+ "step": 26609
+ },
+ {
+ "epoch": 72.50681198910081,
+ "grad_norm": 1.9201786518096924,
+ "learning_rate": 3.709276818164067e-06,
+ "loss": 0.1983,
+ "step": 26610
+ },
+ {
+ "epoch": 72.50953678474114,
+ "grad_norm": 2.128126621246338,
+ "learning_rate": 3.708590838296311e-06,
+ "loss": 0.0338,
+ "step": 26611
+ },
+ {
+ "epoch": 72.51226158038148,
+ "grad_norm": 5.717984199523926,
+ "learning_rate": 3.7079049074258465e-06,
+ "loss": 0.0615,
+ "step": 26612
+ },
+ {
+ "epoch": 72.5149863760218,
+ "grad_norm": 2.956634283065796,
+ "learning_rate": 3.7072190255580153e-06,
+ "loss": 0.0443,
+ "step": 26613
+ },
+ {
+ "epoch": 72.51771117166213,
+ "grad_norm": 3.8963871002197266,
+ "learning_rate": 3.7065331926981573e-06,
+ "loss": 0.0396,
+ "step": 26614
+ },
+ {
+ "epoch": 72.52043596730245,
+ "grad_norm": 2.367657423019409,
+ "learning_rate": 3.7058474088516194e-06,
+ "loss": 0.0296,
+ "step": 26615
+ },
+ {
+ "epoch": 72.52316076294278,
+ "grad_norm": 3.041741132736206,
+ "learning_rate": 3.7051616740237396e-06,
+ "loss": 0.0977,
+ "step": 26616
+ },
+ {
+ "epoch": 72.52588555858311,
+ "grad_norm": 2.3505899906158447,
+ "learning_rate": 3.7044759882198576e-06,
+ "loss": 0.0529,
+ "step": 26617
+ },
+ {
+ "epoch": 72.52861035422343,
+ "grad_norm": 2.8662209510803223,
+ "learning_rate": 3.703790351445311e-06,
+ "loss": 0.1394,
+ "step": 26618
+ },
+ {
+ "epoch": 72.53133514986376,
+ "grad_norm": 3.9677467346191406,
+ "learning_rate": 3.703104763705446e-06,
+ "loss": 0.0593,
+ "step": 26619
+ },
+ {
+ "epoch": 72.53405994550408,
+ "grad_norm": 3.4518957138061523,
+ "learning_rate": 3.702419225005598e-06,
+ "loss": 0.1954,
+ "step": 26620
+ },
+ {
+ "epoch": 72.53678474114442,
+ "grad_norm": 2.4246394634246826,
+ "learning_rate": 3.701733735351103e-06,
+ "loss": 0.055,
+ "step": 26621
+ },
+ {
+ "epoch": 72.53950953678473,
+ "grad_norm": 2.5853323936462402,
+ "learning_rate": 3.701048294747307e-06,
+ "loss": 0.0369,
+ "step": 26622
+ },
+ {
+ "epoch": 72.54223433242507,
+ "grad_norm": 3.6149227619171143,
+ "learning_rate": 3.7003629031995436e-06,
+ "loss": 0.1518,
+ "step": 26623
+ },
+ {
+ "epoch": 72.5449591280654,
+ "grad_norm": 3.3796393871307373,
+ "learning_rate": 3.6996775607131507e-06,
+ "loss": 0.0401,
+ "step": 26624
+ },
+ {
+ "epoch": 72.54768392370572,
+ "grad_norm": 3.288841724395752,
+ "learning_rate": 3.698992267293464e-06,
+ "loss": 0.0923,
+ "step": 26625
+ },
+ {
+ "epoch": 72.55040871934605,
+ "grad_norm": 3.312417984008789,
+ "learning_rate": 3.6983070229458216e-06,
+ "loss": 0.0473,
+ "step": 26626
+ },
+ {
+ "epoch": 72.55313351498637,
+ "grad_norm": 2.734294891357422,
+ "learning_rate": 3.6976218276755647e-06,
+ "loss": 0.0445,
+ "step": 26627
+ },
+ {
+ "epoch": 72.5558583106267,
+ "grad_norm": 2.6206490993499756,
+ "learning_rate": 3.696936681488027e-06,
+ "loss": 0.0338,
+ "step": 26628
+ },
+ {
+ "epoch": 72.55858310626704,
+ "grad_norm": 2.402534246444702,
+ "learning_rate": 3.696251584388544e-06,
+ "loss": 0.0339,
+ "step": 26629
+ },
+ {
+ "epoch": 72.56130790190736,
+ "grad_norm": 3.5467193126678467,
+ "learning_rate": 3.6955665363824455e-06,
+ "loss": 0.1125,
+ "step": 26630
+ },
+ {
+ "epoch": 72.56403269754769,
+ "grad_norm": 3.2578461170196533,
+ "learning_rate": 3.694881537475077e-06,
+ "loss": 0.048,
+ "step": 26631
+ },
+ {
+ "epoch": 72.566757493188,
+ "grad_norm": 3.4806723594665527,
+ "learning_rate": 3.6941965876717667e-06,
+ "loss": 0.065,
+ "step": 26632
+ },
+ {
+ "epoch": 72.56948228882834,
+ "grad_norm": 3.2064919471740723,
+ "learning_rate": 3.693511686977852e-06,
+ "loss": 0.0941,
+ "step": 26633
+ },
+ {
+ "epoch": 72.57220708446866,
+ "grad_norm": 2.320227861404419,
+ "learning_rate": 3.692826835398661e-06,
+ "loss": 0.0995,
+ "step": 26634
+ },
+ {
+ "epoch": 72.57493188010899,
+ "grad_norm": 3.9799299240112305,
+ "learning_rate": 3.692142032939535e-06,
+ "loss": 0.1618,
+ "step": 26635
+ },
+ {
+ "epoch": 72.57765667574932,
+ "grad_norm": 2.474313497543335,
+ "learning_rate": 3.6914572796058033e-06,
+ "loss": 0.0265,
+ "step": 26636
+ },
+ {
+ "epoch": 72.58038147138964,
+ "grad_norm": 3.85147762298584,
+ "learning_rate": 3.6907725754028e-06,
+ "loss": 0.0505,
+ "step": 26637
+ },
+ {
+ "epoch": 72.58310626702998,
+ "grad_norm": 2.8720130920410156,
+ "learning_rate": 3.6900879203358543e-06,
+ "loss": 0.0906,
+ "step": 26638
+ },
+ {
+ "epoch": 72.5858310626703,
+ "grad_norm": 4.143994331359863,
+ "learning_rate": 3.6894033144103025e-06,
+ "loss": 0.2785,
+ "step": 26639
+ },
+ {
+ "epoch": 72.58855585831063,
+ "grad_norm": 2.5250139236450195,
+ "learning_rate": 3.6887187576314755e-06,
+ "loss": 0.0484,
+ "step": 26640
+ },
+ {
+ "epoch": 72.59128065395096,
+ "grad_norm": 2.678302526473999,
+ "learning_rate": 3.688034250004704e-06,
+ "loss": 0.0388,
+ "step": 26641
+ },
+ {
+ "epoch": 72.59400544959128,
+ "grad_norm": 3.1381940841674805,
+ "learning_rate": 3.687349791535314e-06,
+ "loss": 0.0447,
+ "step": 26642
+ },
+ {
+ "epoch": 72.59673024523161,
+ "grad_norm": 2.558359146118164,
+ "learning_rate": 3.6866653822286457e-06,
+ "loss": 0.0561,
+ "step": 26643
+ },
+ {
+ "epoch": 72.59945504087193,
+ "grad_norm": 2.7017393112182617,
+ "learning_rate": 3.685981022090019e-06,
+ "loss": 0.0344,
+ "step": 26644
+ },
+ {
+ "epoch": 72.60217983651226,
+ "grad_norm": 3.1276755332946777,
+ "learning_rate": 3.685296711124774e-06,
+ "loss": 0.0422,
+ "step": 26645
+ },
+ {
+ "epoch": 72.60490463215258,
+ "grad_norm": 4.713883876800537,
+ "learning_rate": 3.684612449338231e-06,
+ "loss": 0.1321,
+ "step": 26646
+ },
+ {
+ "epoch": 72.60762942779292,
+ "grad_norm": 2.7960073947906494,
+ "learning_rate": 3.6839282367357256e-06,
+ "loss": 0.0768,
+ "step": 26647
+ },
+ {
+ "epoch": 72.61035422343325,
+ "grad_norm": 2.353724479675293,
+ "learning_rate": 3.683244073322584e-06,
+ "loss": 0.0423,
+ "step": 26648
+ },
+ {
+ "epoch": 72.61307901907357,
+ "grad_norm": 2.059302568435669,
+ "learning_rate": 3.682559959104135e-06,
+ "loss": 0.0322,
+ "step": 26649
+ },
+ {
+ "epoch": 72.6158038147139,
+ "grad_norm": 5.215627193450928,
+ "learning_rate": 3.6818758940857014e-06,
+ "loss": 0.0433,
+ "step": 26650
+ },
+ {
+ "epoch": 72.61852861035422,
+ "grad_norm": 2.479736089706421,
+ "learning_rate": 3.6811918782726197e-06,
+ "loss": 0.0568,
+ "step": 26651
+ },
+ {
+ "epoch": 72.62125340599455,
+ "grad_norm": 7.511143684387207,
+ "learning_rate": 3.680507911670211e-06,
+ "loss": 0.0508,
+ "step": 26652
+ },
+ {
+ "epoch": 72.62397820163488,
+ "grad_norm": 2.905149221420288,
+ "learning_rate": 3.6798239942838042e-06,
+ "loss": 0.0319,
+ "step": 26653
+ },
+ {
+ "epoch": 72.6267029972752,
+ "grad_norm": 3.5439958572387695,
+ "learning_rate": 3.679140126118721e-06,
+ "loss": 0.0714,
+ "step": 26654
+ },
+ {
+ "epoch": 72.62942779291554,
+ "grad_norm": 2.8212172985076904,
+ "learning_rate": 3.6784563071802935e-06,
+ "loss": 0.0584,
+ "step": 26655
+ },
+ {
+ "epoch": 72.63215258855585,
+ "grad_norm": 2.913501739501953,
+ "learning_rate": 3.677772537473846e-06,
+ "loss": 0.0654,
+ "step": 26656
+ },
+ {
+ "epoch": 72.63487738419619,
+ "grad_norm": 3.516343832015991,
+ "learning_rate": 3.6770888170047026e-06,
+ "loss": 0.0756,
+ "step": 26657
+ },
+ {
+ "epoch": 72.6376021798365,
+ "grad_norm": 2.9517154693603516,
+ "learning_rate": 3.6764051457781836e-06,
+ "loss": 0.0375,
+ "step": 26658
+ },
+ {
+ "epoch": 72.64032697547684,
+ "grad_norm": 2.010986804962158,
+ "learning_rate": 3.6757215237996225e-06,
+ "loss": 0.0317,
+ "step": 26659
+ },
+ {
+ "epoch": 72.64305177111717,
+ "grad_norm": 2.282716751098633,
+ "learning_rate": 3.6750379510743374e-06,
+ "loss": 0.0457,
+ "step": 26660
+ },
+ {
+ "epoch": 72.64577656675749,
+ "grad_norm": 2.6153957843780518,
+ "learning_rate": 3.6743544276076503e-06,
+ "loss": 0.0641,
+ "step": 26661
+ },
+ {
+ "epoch": 72.64850136239782,
+ "grad_norm": 2.0542514324188232,
+ "learning_rate": 3.6736709534048877e-06,
+ "loss": 0.0901,
+ "step": 26662
+ },
+ {
+ "epoch": 72.65122615803814,
+ "grad_norm": 2.8648242950439453,
+ "learning_rate": 3.6729875284713746e-06,
+ "loss": 0.1693,
+ "step": 26663
+ },
+ {
+ "epoch": 72.65395095367847,
+ "grad_norm": 3.498901605606079,
+ "learning_rate": 3.6723041528124314e-06,
+ "loss": 0.1068,
+ "step": 26664
+ },
+ {
+ "epoch": 72.65667574931881,
+ "grad_norm": 2.831108808517456,
+ "learning_rate": 3.67162082643338e-06,
+ "loss": 0.06,
+ "step": 26665
+ },
+ {
+ "epoch": 72.65940054495913,
+ "grad_norm": 1.8966275453567505,
+ "learning_rate": 3.6709375493395383e-06,
+ "loss": 0.098,
+ "step": 26666
+ },
+ {
+ "epoch": 72.66212534059946,
+ "grad_norm": 2.278327465057373,
+ "learning_rate": 3.670254321536235e-06,
+ "loss": 0.026,
+ "step": 26667
+ },
+ {
+ "epoch": 72.66485013623978,
+ "grad_norm": 2.6790900230407715,
+ "learning_rate": 3.6695711430287873e-06,
+ "loss": 0.0507,
+ "step": 26668
+ },
+ {
+ "epoch": 72.66757493188011,
+ "grad_norm": 3.771758794784546,
+ "learning_rate": 3.6688880138225158e-06,
+ "loss": 0.057,
+ "step": 26669
+ },
+ {
+ "epoch": 72.67029972752043,
+ "grad_norm": 4.955124855041504,
+ "learning_rate": 3.6682049339227364e-06,
+ "loss": 0.1053,
+ "step": 26670
+ },
+ {
+ "epoch": 72.67302452316076,
+ "grad_norm": 3.757066011428833,
+ "learning_rate": 3.6675219033347775e-06,
+ "loss": 0.1213,
+ "step": 26671
+ },
+ {
+ "epoch": 72.6757493188011,
+ "grad_norm": 3.1228342056274414,
+ "learning_rate": 3.6668389220639545e-06,
+ "loss": 0.075,
+ "step": 26672
+ },
+ {
+ "epoch": 72.67847411444141,
+ "grad_norm": 3.0710763931274414,
+ "learning_rate": 3.6661559901155852e-06,
+ "loss": 0.0684,
+ "step": 26673
+ },
+ {
+ "epoch": 72.68119891008175,
+ "grad_norm": 3.2185308933258057,
+ "learning_rate": 3.6654731074949856e-06,
+ "loss": 0.0791,
+ "step": 26674
+ },
+ {
+ "epoch": 72.68392370572207,
+ "grad_norm": 7.934180736541748,
+ "learning_rate": 3.6647902742074825e-06,
+ "loss": 0.1657,
+ "step": 26675
+ },
+ {
+ "epoch": 72.6866485013624,
+ "grad_norm": 4.300521373748779,
+ "learning_rate": 3.6641074902583875e-06,
+ "loss": 0.0225,
+ "step": 26676
+ },
+ {
+ "epoch": 72.68937329700273,
+ "grad_norm": 2.9716007709503174,
+ "learning_rate": 3.66342475565302e-06,
+ "loss": 0.064,
+ "step": 26677
+ },
+ {
+ "epoch": 72.69209809264305,
+ "grad_norm": 3.14971661567688,
+ "learning_rate": 3.662742070396693e-06,
+ "loss": 0.0609,
+ "step": 26678
+ },
+ {
+ "epoch": 72.69482288828338,
+ "grad_norm": 3.2120299339294434,
+ "learning_rate": 3.662059434494727e-06,
+ "loss": 0.0929,
+ "step": 26679
+ },
+ {
+ "epoch": 72.6975476839237,
+ "grad_norm": 3.51916766166687,
+ "learning_rate": 3.6613768479524413e-06,
+ "loss": 0.1384,
+ "step": 26680
+ },
+ {
+ "epoch": 72.70027247956403,
+ "grad_norm": 4.655309677124023,
+ "learning_rate": 3.660694310775148e-06,
+ "loss": 0.1508,
+ "step": 26681
+ },
+ {
+ "epoch": 72.70299727520435,
+ "grad_norm": 3.1374423503875732,
+ "learning_rate": 3.6600118229681646e-06,
+ "loss": 0.0478,
+ "step": 26682
+ },
+ {
+ "epoch": 72.70572207084469,
+ "grad_norm": 2.7924439907073975,
+ "learning_rate": 3.6593293845368018e-06,
+ "loss": 0.0433,
+ "step": 26683
+ },
+ {
+ "epoch": 72.70844686648502,
+ "grad_norm": 3.6497044563293457,
+ "learning_rate": 3.65864699548638e-06,
+ "loss": 0.1211,
+ "step": 26684
+ },
+ {
+ "epoch": 72.71117166212534,
+ "grad_norm": 3.0881779193878174,
+ "learning_rate": 3.6579646558222117e-06,
+ "loss": 0.1173,
+ "step": 26685
+ },
+ {
+ "epoch": 72.71389645776567,
+ "grad_norm": 3.23443603515625,
+ "learning_rate": 3.657282365549607e-06,
+ "loss": 0.164,
+ "step": 26686
+ },
+ {
+ "epoch": 72.71662125340599,
+ "grad_norm": 3.1497604846954346,
+ "learning_rate": 3.656600124673887e-06,
+ "loss": 0.0569,
+ "step": 26687
+ },
+ {
+ "epoch": 72.71934604904632,
+ "grad_norm": 2.4993958473205566,
+ "learning_rate": 3.6559179332003603e-06,
+ "loss": 0.0498,
+ "step": 26688
+ },
+ {
+ "epoch": 72.72207084468666,
+ "grad_norm": 2.9620442390441895,
+ "learning_rate": 3.6552357911343416e-06,
+ "loss": 0.1731,
+ "step": 26689
+ },
+ {
+ "epoch": 72.72479564032697,
+ "grad_norm": 3.671299695968628,
+ "learning_rate": 3.654553698481138e-06,
+ "loss": 0.0831,
+ "step": 26690
+ },
+ {
+ "epoch": 72.7275204359673,
+ "grad_norm": 3.332897901535034,
+ "learning_rate": 3.6538716552460708e-06,
+ "loss": 0.0389,
+ "step": 26691
+ },
+ {
+ "epoch": 72.73024523160763,
+ "grad_norm": 3.292475461959839,
+ "learning_rate": 3.6531896614344454e-06,
+ "loss": 0.1481,
+ "step": 26692
+ },
+ {
+ "epoch": 72.73297002724796,
+ "grad_norm": 2.9264400005340576,
+ "learning_rate": 3.6525077170515755e-06,
+ "loss": 0.0834,
+ "step": 26693
+ },
+ {
+ "epoch": 72.73569482288828,
+ "grad_norm": 4.83539342880249,
+ "learning_rate": 3.651825822102767e-06,
+ "loss": 0.0667,
+ "step": 26694
+ },
+ {
+ "epoch": 72.73841961852861,
+ "grad_norm": 3.4476091861724854,
+ "learning_rate": 3.6511439765933355e-06,
+ "loss": 0.0489,
+ "step": 26695
+ },
+ {
+ "epoch": 72.74114441416894,
+ "grad_norm": 2.714822292327881,
+ "learning_rate": 3.6504621805285935e-06,
+ "loss": 0.0454,
+ "step": 26696
+ },
+ {
+ "epoch": 72.74386920980926,
+ "grad_norm": 2.8618080615997314,
+ "learning_rate": 3.6497804339138463e-06,
+ "loss": 0.046,
+ "step": 26697
+ },
+ {
+ "epoch": 72.7465940054496,
+ "grad_norm": 2.8192522525787354,
+ "learning_rate": 3.649098736754406e-06,
+ "loss": 0.2039,
+ "step": 26698
+ },
+ {
+ "epoch": 72.74931880108991,
+ "grad_norm": 2.843562602996826,
+ "learning_rate": 3.648417089055577e-06,
+ "loss": 0.0672,
+ "step": 26699
+ },
+ {
+ "epoch": 72.75204359673025,
+ "grad_norm": 3.9819788932800293,
+ "learning_rate": 3.647735490822675e-06,
+ "loss": 0.1324,
+ "step": 26700
+ },
+ {
+ "epoch": 72.75476839237058,
+ "grad_norm": 11.397708892822266,
+ "learning_rate": 3.647053942061004e-06,
+ "loss": 0.1266,
+ "step": 26701
+ },
+ {
+ "epoch": 72.7574931880109,
+ "grad_norm": 3.057208299636841,
+ "learning_rate": 3.646372442775873e-06,
+ "loss": 0.0311,
+ "step": 26702
+ },
+ {
+ "epoch": 72.76021798365123,
+ "grad_norm": 2.358063220977783,
+ "learning_rate": 3.645690992972585e-06,
+ "loss": 0.0453,
+ "step": 26703
+ },
+ {
+ "epoch": 72.76294277929155,
+ "grad_norm": 1.9550522565841675,
+ "learning_rate": 3.6450095926564542e-06,
+ "loss": 0.1477,
+ "step": 26704
+ },
+ {
+ "epoch": 72.76566757493188,
+ "grad_norm": 3.588242769241333,
+ "learning_rate": 3.6443282418327853e-06,
+ "loss": 0.1253,
+ "step": 26705
+ },
+ {
+ "epoch": 72.7683923705722,
+ "grad_norm": 2.846660852432251,
+ "learning_rate": 3.6436469405068787e-06,
+ "loss": 0.066,
+ "step": 26706
+ },
+ {
+ "epoch": 72.77111716621253,
+ "grad_norm": 7.941333770751953,
+ "learning_rate": 3.642965688684049e-06,
+ "loss": 0.1424,
+ "step": 26707
+ },
+ {
+ "epoch": 72.77384196185287,
+ "grad_norm": 2.316028118133545,
+ "learning_rate": 3.6422844863695983e-06,
+ "loss": 0.0395,
+ "step": 26708
+ },
+ {
+ "epoch": 72.77656675749319,
+ "grad_norm": 3.421424150466919,
+ "learning_rate": 3.6416033335688306e-06,
+ "loss": 0.0837,
+ "step": 26709
+ },
+ {
+ "epoch": 72.77929155313352,
+ "grad_norm": 2.974992513656616,
+ "learning_rate": 3.6409222302870494e-06,
+ "loss": 0.1099,
+ "step": 26710
+ },
+ {
+ "epoch": 72.78201634877384,
+ "grad_norm": 2.0351364612579346,
+ "learning_rate": 3.640241176529563e-06,
+ "loss": 0.0329,
+ "step": 26711
+ },
+ {
+ "epoch": 72.78474114441417,
+ "grad_norm": 3.1755497455596924,
+ "learning_rate": 3.6395601723016714e-06,
+ "loss": 0.0704,
+ "step": 26712
+ },
+ {
+ "epoch": 72.7874659400545,
+ "grad_norm": 2.6936593055725098,
+ "learning_rate": 3.638879217608684e-06,
+ "loss": 0.0381,
+ "step": 26713
+ },
+ {
+ "epoch": 72.79019073569482,
+ "grad_norm": 2.541172504425049,
+ "learning_rate": 3.6381983124558994e-06,
+ "loss": 0.05,
+ "step": 26714
+ },
+ {
+ "epoch": 72.79291553133515,
+ "grad_norm": 2.3149075508117676,
+ "learning_rate": 3.637517456848619e-06,
+ "loss": 0.0375,
+ "step": 26715
+ },
+ {
+ "epoch": 72.79564032697547,
+ "grad_norm": 2.674375295639038,
+ "learning_rate": 3.6368366507921514e-06,
+ "loss": 0.0748,
+ "step": 26716
+ },
+ {
+ "epoch": 72.7983651226158,
+ "grad_norm": 3.304030656814575,
+ "learning_rate": 3.636155894291795e-06,
+ "loss": 0.0609,
+ "step": 26717
+ },
+ {
+ "epoch": 72.80108991825612,
+ "grad_norm": 2.0676522254943848,
+ "learning_rate": 3.6354751873528515e-06,
+ "loss": 0.0558,
+ "step": 26718
+ },
+ {
+ "epoch": 72.80381471389646,
+ "grad_norm": 1.728627324104309,
+ "learning_rate": 3.634794529980619e-06,
+ "loss": 0.027,
+ "step": 26719
+ },
+ {
+ "epoch": 72.80653950953679,
+ "grad_norm": 2.3659069538116455,
+ "learning_rate": 3.6341139221804057e-06,
+ "loss": 0.0548,
+ "step": 26720
+ },
+ {
+ "epoch": 72.80926430517711,
+ "grad_norm": 3.3464324474334717,
+ "learning_rate": 3.633433363957507e-06,
+ "loss": 0.0561,
+ "step": 26721
+ },
+ {
+ "epoch": 72.81198910081744,
+ "grad_norm": 4.956269264221191,
+ "learning_rate": 3.6327528553172252e-06,
+ "loss": 0.0505,
+ "step": 26722
+ },
+ {
+ "epoch": 72.81471389645776,
+ "grad_norm": 2.6530561447143555,
+ "learning_rate": 3.6320723962648564e-06,
+ "loss": 0.0955,
+ "step": 26723
+ },
+ {
+ "epoch": 72.8174386920981,
+ "grad_norm": 3.5711658000946045,
+ "learning_rate": 3.631391986805706e-06,
+ "loss": 0.1004,
+ "step": 26724
+ },
+ {
+ "epoch": 72.82016348773843,
+ "grad_norm": 3.119831085205078,
+ "learning_rate": 3.6307116269450692e-06,
+ "loss": 0.1096,
+ "step": 26725
+ },
+ {
+ "epoch": 72.82288828337875,
+ "grad_norm": 2.1545567512512207,
+ "learning_rate": 3.630031316688245e-06,
+ "loss": 0.0499,
+ "step": 26726
+ },
+ {
+ "epoch": 72.82561307901908,
+ "grad_norm": 5.135312080383301,
+ "learning_rate": 3.62935105604053e-06,
+ "loss": 0.0863,
+ "step": 26727
+ },
+ {
+ "epoch": 72.8283378746594,
+ "grad_norm": 3.198873996734619,
+ "learning_rate": 3.628670845007226e-06,
+ "loss": 0.172,
+ "step": 26728
+ },
+ {
+ "epoch": 72.83106267029973,
+ "grad_norm": 2.5908055305480957,
+ "learning_rate": 3.6279906835936287e-06,
+ "loss": 0.047,
+ "step": 26729
+ },
+ {
+ "epoch": 72.83378746594005,
+ "grad_norm": 10.214290618896484,
+ "learning_rate": 3.627310571805032e-06,
+ "loss": 0.0654,
+ "step": 26730
+ },
+ {
+ "epoch": 72.83651226158038,
+ "grad_norm": 2.863939046859741,
+ "learning_rate": 3.626630509646735e-06,
+ "loss": 0.1027,
+ "step": 26731
+ },
+ {
+ "epoch": 72.83923705722071,
+ "grad_norm": 2.706066370010376,
+ "learning_rate": 3.625950497124038e-06,
+ "loss": 0.0346,
+ "step": 26732
+ },
+ {
+ "epoch": 72.84196185286103,
+ "grad_norm": 3.4561679363250732,
+ "learning_rate": 3.6252705342422335e-06,
+ "loss": 0.071,
+ "step": 26733
+ },
+ {
+ "epoch": 72.84468664850137,
+ "grad_norm": 3.2190403938293457,
+ "learning_rate": 3.6245906210066163e-06,
+ "loss": 0.058,
+ "step": 26734
+ },
+ {
+ "epoch": 72.84741144414168,
+ "grad_norm": 2.655494213104248,
+ "learning_rate": 3.6239107574224785e-06,
+ "loss": 0.08,
+ "step": 26735
+ },
+ {
+ "epoch": 72.85013623978202,
+ "grad_norm": 3.1073572635650635,
+ "learning_rate": 3.623230943495123e-06,
+ "loss": 0.062,
+ "step": 26736
+ },
+ {
+ "epoch": 72.85286103542235,
+ "grad_norm": 2.9819273948669434,
+ "learning_rate": 3.6225511792298397e-06,
+ "loss": 0.0703,
+ "step": 26737
+ },
+ {
+ "epoch": 72.85558583106267,
+ "grad_norm": 3.415374517440796,
+ "learning_rate": 3.621871464631922e-06,
+ "loss": 0.0901,
+ "step": 26738
+ },
+ {
+ "epoch": 72.858310626703,
+ "grad_norm": 2.0922327041625977,
+ "learning_rate": 3.6211917997066603e-06,
+ "loss": 0.0298,
+ "step": 26739
+ },
+ {
+ "epoch": 72.86103542234332,
+ "grad_norm": 3.240495204925537,
+ "learning_rate": 3.620512184459356e-06,
+ "loss": 0.1008,
+ "step": 26740
+ },
+ {
+ "epoch": 72.86376021798365,
+ "grad_norm": 4.21572732925415,
+ "learning_rate": 3.619832618895297e-06,
+ "loss": 0.1594,
+ "step": 26741
+ },
+ {
+ "epoch": 72.86648501362397,
+ "grad_norm": 3.3194217681884766,
+ "learning_rate": 3.619153103019776e-06,
+ "loss": 0.244,
+ "step": 26742
+ },
+ {
+ "epoch": 72.8692098092643,
+ "grad_norm": 2.888566732406616,
+ "learning_rate": 3.6184736368380813e-06,
+ "loss": 0.2054,
+ "step": 26743
+ },
+ {
+ "epoch": 72.87193460490464,
+ "grad_norm": 2.522555351257324,
+ "learning_rate": 3.6177942203555125e-06,
+ "loss": 0.049,
+ "step": 26744
+ },
+ {
+ "epoch": 72.87465940054496,
+ "grad_norm": 2.3681910037994385,
+ "learning_rate": 3.617114853577357e-06,
+ "loss": 0.0834,
+ "step": 26745
+ },
+ {
+ "epoch": 72.87738419618529,
+ "grad_norm": 2.3938636779785156,
+ "learning_rate": 3.6164355365089067e-06,
+ "loss": 0.0289,
+ "step": 26746
+ },
+ {
+ "epoch": 72.88010899182561,
+ "grad_norm": 2.468428373336792,
+ "learning_rate": 3.615756269155446e-06,
+ "loss": 0.029,
+ "step": 26747
+ },
+ {
+ "epoch": 72.88283378746594,
+ "grad_norm": 2.586638927459717,
+ "learning_rate": 3.61507705152227e-06,
+ "loss": 0.1221,
+ "step": 26748
+ },
+ {
+ "epoch": 72.88555858310627,
+ "grad_norm": 2.7505125999450684,
+ "learning_rate": 3.6143978836146733e-06,
+ "loss": 0.0405,
+ "step": 26749
+ },
+ {
+ "epoch": 72.88828337874659,
+ "grad_norm": 3.3790388107299805,
+ "learning_rate": 3.613718765437939e-06,
+ "loss": 0.0671,
+ "step": 26750
+ },
+ {
+ "epoch": 72.89100817438693,
+ "grad_norm": 3.445241928100586,
+ "learning_rate": 3.6130396969973546e-06,
+ "loss": 0.0962,
+ "step": 26751
+ },
+ {
+ "epoch": 72.89373297002724,
+ "grad_norm": 2.545253038406372,
+ "learning_rate": 3.6123606782982147e-06,
+ "loss": 0.0629,
+ "step": 26752
+ },
+ {
+ "epoch": 72.89645776566758,
+ "grad_norm": 2.597722291946411,
+ "learning_rate": 3.6116817093458034e-06,
+ "loss": 0.0369,
+ "step": 26753
+ },
+ {
+ "epoch": 72.8991825613079,
+ "grad_norm": 4.2187581062316895,
+ "learning_rate": 3.61100279014541e-06,
+ "loss": 0.1163,
+ "step": 26754
+ },
+ {
+ "epoch": 72.90190735694823,
+ "grad_norm": 2.331432819366455,
+ "learning_rate": 3.610323920702319e-06,
+ "loss": 0.0714,
+ "step": 26755
+ },
+ {
+ "epoch": 72.90463215258856,
+ "grad_norm": 2.561901807785034,
+ "learning_rate": 3.6096451010218214e-06,
+ "loss": 0.2032,
+ "step": 26756
+ },
+ {
+ "epoch": 72.90735694822888,
+ "grad_norm": 4.418798923492432,
+ "learning_rate": 3.6089663311092025e-06,
+ "loss": 0.0755,
+ "step": 26757
+ },
+ {
+ "epoch": 72.91008174386921,
+ "grad_norm": 2.8942484855651855,
+ "learning_rate": 3.6082876109697485e-06,
+ "loss": 0.0472,
+ "step": 26758
+ },
+ {
+ "epoch": 72.91280653950953,
+ "grad_norm": 3.2254064083099365,
+ "learning_rate": 3.607608940608741e-06,
+ "loss": 0.0389,
+ "step": 26759
+ },
+ {
+ "epoch": 72.91553133514986,
+ "grad_norm": 2.458869457244873,
+ "learning_rate": 3.606930320031474e-06,
+ "loss": 0.0553,
+ "step": 26760
+ },
+ {
+ "epoch": 72.9182561307902,
+ "grad_norm": 2.1937780380249023,
+ "learning_rate": 3.606251749243227e-06,
+ "loss": 0.0553,
+ "step": 26761
+ },
+ {
+ "epoch": 72.92098092643052,
+ "grad_norm": 3.7588653564453125,
+ "learning_rate": 3.605573228249285e-06,
+ "loss": 0.034,
+ "step": 26762
+ },
+ {
+ "epoch": 72.92370572207085,
+ "grad_norm": 2.7398927211761475,
+ "learning_rate": 3.604894757054931e-06,
+ "loss": 0.0645,
+ "step": 26763
+ },
+ {
+ "epoch": 72.92643051771117,
+ "grad_norm": 3.0189967155456543,
+ "learning_rate": 3.604216335665449e-06,
+ "loss": 0.0494,
+ "step": 26764
+ },
+ {
+ "epoch": 72.9291553133515,
+ "grad_norm": 2.9006359577178955,
+ "learning_rate": 3.603537964086129e-06,
+ "loss": 0.0943,
+ "step": 26765
+ },
+ {
+ "epoch": 72.93188010899182,
+ "grad_norm": 2.7495157718658447,
+ "learning_rate": 3.6028596423222484e-06,
+ "loss": 0.0894,
+ "step": 26766
+ },
+ {
+ "epoch": 72.93460490463215,
+ "grad_norm": 3.0567915439605713,
+ "learning_rate": 3.602181370379092e-06,
+ "loss": 0.0565,
+ "step": 26767
+ },
+ {
+ "epoch": 72.93732970027249,
+ "grad_norm": 2.584810972213745,
+ "learning_rate": 3.601503148261938e-06,
+ "loss": 0.0321,
+ "step": 26768
+ },
+ {
+ "epoch": 72.9400544959128,
+ "grad_norm": 3.017181396484375,
+ "learning_rate": 3.6008249759760737e-06,
+ "loss": 0.0334,
+ "step": 26769
+ },
+ {
+ "epoch": 72.94277929155314,
+ "grad_norm": 2.5840861797332764,
+ "learning_rate": 3.600146853526779e-06,
+ "loss": 0.0415,
+ "step": 26770
+ },
+ {
+ "epoch": 72.94550408719346,
+ "grad_norm": 5.155364036560059,
+ "learning_rate": 3.5994687809193317e-06,
+ "loss": 0.1858,
+ "step": 26771
+ },
+ {
+ "epoch": 72.94822888283379,
+ "grad_norm": 4.191073417663574,
+ "learning_rate": 3.598790758159019e-06,
+ "loss": 0.0839,
+ "step": 26772
+ },
+ {
+ "epoch": 72.95095367847412,
+ "grad_norm": 2.381028890609741,
+ "learning_rate": 3.5981127852511178e-06,
+ "loss": 0.1546,
+ "step": 26773
+ },
+ {
+ "epoch": 72.95367847411444,
+ "grad_norm": 3.2304797172546387,
+ "learning_rate": 3.5974348622009083e-06,
+ "loss": 0.0593,
+ "step": 26774
+ },
+ {
+ "epoch": 72.95640326975477,
+ "grad_norm": 4.244482517242432,
+ "learning_rate": 3.5967569890136654e-06,
+ "loss": 0.0524,
+ "step": 26775
+ },
+ {
+ "epoch": 72.95912806539509,
+ "grad_norm": 4.18062162399292,
+ "learning_rate": 3.596079165694677e-06,
+ "loss": 0.0507,
+ "step": 26776
+ },
+ {
+ "epoch": 72.96185286103542,
+ "grad_norm": 2.614755153656006,
+ "learning_rate": 3.595401392249218e-06,
+ "loss": 0.0442,
+ "step": 26777
+ },
+ {
+ "epoch": 72.96457765667574,
+ "grad_norm": 3.563538074493408,
+ "learning_rate": 3.5947236686825683e-06,
+ "loss": 0.0445,
+ "step": 26778
+ },
+ {
+ "epoch": 72.96730245231608,
+ "grad_norm": 2.8035526275634766,
+ "learning_rate": 3.5940459949999995e-06,
+ "loss": 0.0846,
+ "step": 26779
+ },
+ {
+ "epoch": 72.97002724795641,
+ "grad_norm": 2.8743069171905518,
+ "learning_rate": 3.593368371206798e-06,
+ "loss": 0.1351,
+ "step": 26780
+ },
+ {
+ "epoch": 72.97275204359673,
+ "grad_norm": 3.3925259113311768,
+ "learning_rate": 3.5926907973082335e-06,
+ "loss": 0.0862,
+ "step": 26781
+ },
+ {
+ "epoch": 72.97547683923706,
+ "grad_norm": 23.501739501953125,
+ "learning_rate": 3.5920132733095912e-06,
+ "loss": 0.2362,
+ "step": 26782
+ },
+ {
+ "epoch": 72.97820163487738,
+ "grad_norm": 3.532512664794922,
+ "learning_rate": 3.5913357992161422e-06,
+ "loss": 0.1372,
+ "step": 26783
+ },
+ {
+ "epoch": 72.98092643051771,
+ "grad_norm": 2.8155605792999268,
+ "learning_rate": 3.5906583750331614e-06,
+ "loss": 0.1241,
+ "step": 26784
+ },
+ {
+ "epoch": 72.98365122615803,
+ "grad_norm": 2.777841091156006,
+ "learning_rate": 3.5899810007659296e-06,
+ "loss": 0.0543,
+ "step": 26785
+ },
+ {
+ "epoch": 72.98637602179836,
+ "grad_norm": 3.0467355251312256,
+ "learning_rate": 3.589303676419721e-06,
+ "loss": 0.1655,
+ "step": 26786
+ },
+ {
+ "epoch": 72.9891008174387,
+ "grad_norm": 3.370142698287964,
+ "learning_rate": 3.5886264019998074e-06,
+ "loss": 0.0341,
+ "step": 26787
+ },
+ {
+ "epoch": 72.99182561307902,
+ "grad_norm": 4.560024261474609,
+ "learning_rate": 3.5879491775114618e-06,
+ "loss": 0.0792,
+ "step": 26788
+ },
+ {
+ "epoch": 72.99455040871935,
+ "grad_norm": 2.4999136924743652,
+ "learning_rate": 3.587272002959965e-06,
+ "loss": 0.0627,
+ "step": 26789
+ },
+ {
+ "epoch": 72.99727520435967,
+ "grad_norm": 3.5428922176361084,
+ "learning_rate": 3.5865948783505877e-06,
+ "loss": 0.1156,
+ "step": 26790
+ },
+ {
+ "epoch": 73.0,
+ "grad_norm": 5.0766706466674805,
+ "learning_rate": 3.585917803688603e-06,
+ "loss": 0.0837,
+ "step": 26791
+ },
+ {
+ "epoch": 73.00272479564033,
+ "grad_norm": 3.724759101867676,
+ "learning_rate": 3.585240778979281e-06,
+ "loss": 0.2373,
+ "step": 26792
+ },
+ {
+ "epoch": 73.00544959128065,
+ "grad_norm": 3.019198417663574,
+ "learning_rate": 3.584563804227901e-06,
+ "loss": 0.1205,
+ "step": 26793
+ },
+ {
+ "epoch": 73.00817438692098,
+ "grad_norm": 9.265463829040527,
+ "learning_rate": 3.583886879439731e-06,
+ "loss": 0.0701,
+ "step": 26794
+ },
+ {
+ "epoch": 73.0108991825613,
+ "grad_norm": 3.006812334060669,
+ "learning_rate": 3.58321000462004e-06,
+ "loss": 0.2511,
+ "step": 26795
+ },
+ {
+ "epoch": 73.01362397820164,
+ "grad_norm": 2.4832189083099365,
+ "learning_rate": 3.582533179774107e-06,
+ "loss": 0.1251,
+ "step": 26796
+ },
+ {
+ "epoch": 73.01634877384195,
+ "grad_norm": 2.5576279163360596,
+ "learning_rate": 3.581856404907198e-06,
+ "loss": 0.0389,
+ "step": 26797
+ },
+ {
+ "epoch": 73.01907356948229,
+ "grad_norm": 2.908736228942871,
+ "learning_rate": 3.5811796800245857e-06,
+ "loss": 0.1208,
+ "step": 26798
+ },
+ {
+ "epoch": 73.02179836512262,
+ "grad_norm": 1.714284896850586,
+ "learning_rate": 3.580503005131536e-06,
+ "loss": 0.0199,
+ "step": 26799
+ },
+ {
+ "epoch": 73.02452316076294,
+ "grad_norm": 3.5295302867889404,
+ "learning_rate": 3.579826380233322e-06,
+ "loss": 0.1732,
+ "step": 26800
+ },
+ {
+ "epoch": 73.02724795640327,
+ "grad_norm": 1.9285814762115479,
+ "learning_rate": 3.579149805335217e-06,
+ "loss": 0.0325,
+ "step": 26801
+ },
+ {
+ "epoch": 73.02997275204359,
+ "grad_norm": 2.4395298957824707,
+ "learning_rate": 3.578473280442486e-06,
+ "loss": 0.0834,
+ "step": 26802
+ },
+ {
+ "epoch": 73.03269754768392,
+ "grad_norm": 3.9300200939178467,
+ "learning_rate": 3.5777968055603996e-06,
+ "loss": 0.0854,
+ "step": 26803
+ },
+ {
+ "epoch": 73.03542234332426,
+ "grad_norm": 2.8045382499694824,
+ "learning_rate": 3.57712038069422e-06,
+ "loss": 0.0413,
+ "step": 26804
+ },
+ {
+ "epoch": 73.03814713896458,
+ "grad_norm": 5.196256637573242,
+ "learning_rate": 3.5764440058492255e-06,
+ "loss": 0.0957,
+ "step": 26805
+ },
+ {
+ "epoch": 73.04087193460491,
+ "grad_norm": 5.014540672302246,
+ "learning_rate": 3.5757676810306775e-06,
+ "loss": 0.0618,
+ "step": 26806
+ },
+ {
+ "epoch": 73.04359673024523,
+ "grad_norm": 3.0821545124053955,
+ "learning_rate": 3.5750914062438437e-06,
+ "loss": 0.0332,
+ "step": 26807
+ },
+ {
+ "epoch": 73.04632152588556,
+ "grad_norm": 4.059762001037598,
+ "learning_rate": 3.5744151814939874e-06,
+ "loss": 0.0518,
+ "step": 26808
+ },
+ {
+ "epoch": 73.04904632152588,
+ "grad_norm": 5.413859844207764,
+ "learning_rate": 3.5737390067863833e-06,
+ "loss": 0.1173,
+ "step": 26809
+ },
+ {
+ "epoch": 73.05177111716621,
+ "grad_norm": 3.953683853149414,
+ "learning_rate": 3.5730628821262926e-06,
+ "loss": 0.0988,
+ "step": 26810
+ },
+ {
+ "epoch": 73.05449591280654,
+ "grad_norm": 2.2801594734191895,
+ "learning_rate": 3.5723868075189817e-06,
+ "loss": 0.1122,
+ "step": 26811
+ },
+ {
+ "epoch": 73.05722070844686,
+ "grad_norm": 2.5937554836273193,
+ "learning_rate": 3.5717107829697117e-06,
+ "loss": 0.0432,
+ "step": 26812
+ },
+ {
+ "epoch": 73.0599455040872,
+ "grad_norm": 2.5698869228363037,
+ "learning_rate": 3.5710348084837543e-06,
+ "loss": 0.0367,
+ "step": 26813
+ },
+ {
+ "epoch": 73.06267029972751,
+ "grad_norm": 2.673501968383789,
+ "learning_rate": 3.5703588840663706e-06,
+ "loss": 0.0431,
+ "step": 26814
+ },
+ {
+ "epoch": 73.06539509536785,
+ "grad_norm": 3.987767219543457,
+ "learning_rate": 3.569683009722826e-06,
+ "loss": 0.0652,
+ "step": 26815
+ },
+ {
+ "epoch": 73.06811989100818,
+ "grad_norm": 3.394280195236206,
+ "learning_rate": 3.5690071854583763e-06,
+ "loss": 0.0586,
+ "step": 26816
+ },
+ {
+ "epoch": 73.0708446866485,
+ "grad_norm": 1.5364474058151245,
+ "learning_rate": 3.5683314112782972e-06,
+ "loss": 0.0171,
+ "step": 26817
+ },
+ {
+ "epoch": 73.07356948228883,
+ "grad_norm": 3.1772634983062744,
+ "learning_rate": 3.567655687187848e-06,
+ "loss": 0.06,
+ "step": 26818
+ },
+ {
+ "epoch": 73.07629427792915,
+ "grad_norm": 2.79032039642334,
+ "learning_rate": 3.566980013192288e-06,
+ "loss": 0.0966,
+ "step": 26819
+ },
+ {
+ "epoch": 73.07901907356948,
+ "grad_norm": 1.816536545753479,
+ "learning_rate": 3.566304389296877e-06,
+ "loss": 0.0203,
+ "step": 26820
+ },
+ {
+ "epoch": 73.0817438692098,
+ "grad_norm": 2.7905635833740234,
+ "learning_rate": 3.5656288155068842e-06,
+ "loss": 0.048,
+ "step": 26821
+ },
+ {
+ "epoch": 73.08446866485014,
+ "grad_norm": 3.276249408721924,
+ "learning_rate": 3.5649532918275675e-06,
+ "loss": 0.063,
+ "step": 26822
+ },
+ {
+ "epoch": 73.08719346049047,
+ "grad_norm": 3.8438339233398438,
+ "learning_rate": 3.5642778182641867e-06,
+ "loss": 0.1294,
+ "step": 26823
+ },
+ {
+ "epoch": 73.08991825613079,
+ "grad_norm": 5.634337425231934,
+ "learning_rate": 3.563602394822e-06,
+ "loss": 0.0623,
+ "step": 26824
+ },
+ {
+ "epoch": 73.09264305177112,
+ "grad_norm": 1.9742017984390259,
+ "learning_rate": 3.562927021506275e-06,
+ "loss": 0.0255,
+ "step": 26825
+ },
+ {
+ "epoch": 73.09536784741144,
+ "grad_norm": 3.014936685562134,
+ "learning_rate": 3.5622516983222656e-06,
+ "loss": 0.0507,
+ "step": 26826
+ },
+ {
+ "epoch": 73.09809264305177,
+ "grad_norm": 3.8650033473968506,
+ "learning_rate": 3.561576425275234e-06,
+ "loss": 0.1377,
+ "step": 26827
+ },
+ {
+ "epoch": 73.1008174386921,
+ "grad_norm": 2.649522066116333,
+ "learning_rate": 3.5609012023704338e-06,
+ "loss": 0.0836,
+ "step": 26828
+ },
+ {
+ "epoch": 73.10354223433242,
+ "grad_norm": 1.812314510345459,
+ "learning_rate": 3.560226029613132e-06,
+ "loss": 0.0416,
+ "step": 26829
+ },
+ {
+ "epoch": 73.10626702997276,
+ "grad_norm": 3.097317934036255,
+ "learning_rate": 3.5595509070085822e-06,
+ "loss": 0.0644,
+ "step": 26830
+ },
+ {
+ "epoch": 73.10899182561307,
+ "grad_norm": 1.8639962673187256,
+ "learning_rate": 3.558875834562042e-06,
+ "loss": 0.0397,
+ "step": 26831
+ },
+ {
+ "epoch": 73.11171662125341,
+ "grad_norm": 3.5851614475250244,
+ "learning_rate": 3.558200812278767e-06,
+ "loss": 0.0797,
+ "step": 26832
+ },
+ {
+ "epoch": 73.11444141689373,
+ "grad_norm": 2.8216004371643066,
+ "learning_rate": 3.557525840164017e-06,
+ "loss": 0.0516,
+ "step": 26833
+ },
+ {
+ "epoch": 73.11716621253406,
+ "grad_norm": 3.30781888961792,
+ "learning_rate": 3.5568509182230503e-06,
+ "loss": 0.1132,
+ "step": 26834
+ },
+ {
+ "epoch": 73.11989100817439,
+ "grad_norm": 2.6572554111480713,
+ "learning_rate": 3.5561760464611227e-06,
+ "loss": 0.1412,
+ "step": 26835
+ },
+ {
+ "epoch": 73.12261580381471,
+ "grad_norm": 2.784372329711914,
+ "learning_rate": 3.555501224883484e-06,
+ "loss": 0.058,
+ "step": 26836
+ },
+ {
+ "epoch": 73.12534059945504,
+ "grad_norm": 3.348184823989868,
+ "learning_rate": 3.554826453495399e-06,
+ "loss": 0.1309,
+ "step": 26837
+ },
+ {
+ "epoch": 73.12806539509536,
+ "grad_norm": 2.4507763385772705,
+ "learning_rate": 3.554151732302118e-06,
+ "loss": 0.2144,
+ "step": 26838
+ },
+ {
+ "epoch": 73.1307901907357,
+ "grad_norm": 2.553067684173584,
+ "learning_rate": 3.553477061308895e-06,
+ "loss": 0.0471,
+ "step": 26839
+ },
+ {
+ "epoch": 73.13351498637603,
+ "grad_norm": 4.398159980773926,
+ "learning_rate": 3.5528024405209825e-06,
+ "loss": 0.1645,
+ "step": 26840
+ },
+ {
+ "epoch": 73.13623978201635,
+ "grad_norm": 2.97829008102417,
+ "learning_rate": 3.55212786994364e-06,
+ "loss": 0.1687,
+ "step": 26841
+ },
+ {
+ "epoch": 73.13896457765668,
+ "grad_norm": 2.869852066040039,
+ "learning_rate": 3.551453349582119e-06,
+ "loss": 0.0626,
+ "step": 26842
+ },
+ {
+ "epoch": 73.141689373297,
+ "grad_norm": 2.9041504859924316,
+ "learning_rate": 3.550778879441671e-06,
+ "loss": 0.0608,
+ "step": 26843
+ },
+ {
+ "epoch": 73.14441416893733,
+ "grad_norm": 8.342033386230469,
+ "learning_rate": 3.550104459527546e-06,
+ "loss": 0.0615,
+ "step": 26844
+ },
+ {
+ "epoch": 73.14713896457765,
+ "grad_norm": 3.2290289402008057,
+ "learning_rate": 3.549430089845004e-06,
+ "loss": 0.0406,
+ "step": 26845
+ },
+ {
+ "epoch": 73.14986376021798,
+ "grad_norm": 2.333523988723755,
+ "learning_rate": 3.5487557703992927e-06,
+ "loss": 0.045,
+ "step": 26846
+ },
+ {
+ "epoch": 73.15258855585832,
+ "grad_norm": 3.0763156414031982,
+ "learning_rate": 3.5480815011956626e-06,
+ "loss": 0.1394,
+ "step": 26847
+ },
+ {
+ "epoch": 73.15531335149863,
+ "grad_norm": 3.40331768989563,
+ "learning_rate": 3.5474072822393635e-06,
+ "loss": 0.0488,
+ "step": 26848
+ },
+ {
+ "epoch": 73.15803814713897,
+ "grad_norm": 2.91113018989563,
+ "learning_rate": 3.546733113535653e-06,
+ "loss": 0.0419,
+ "step": 26849
+ },
+ {
+ "epoch": 73.16076294277929,
+ "grad_norm": 3.1495656967163086,
+ "learning_rate": 3.5460589950897726e-06,
+ "loss": 0.0999,
+ "step": 26850
+ },
+ {
+ "epoch": 73.16348773841962,
+ "grad_norm": 2.792149305343628,
+ "learning_rate": 3.545384926906982e-06,
+ "loss": 0.0665,
+ "step": 26851
+ },
+ {
+ "epoch": 73.16621253405995,
+ "grad_norm": 3.9560298919677734,
+ "learning_rate": 3.5447109089925247e-06,
+ "loss": 0.0591,
+ "step": 26852
+ },
+ {
+ "epoch": 73.16893732970027,
+ "grad_norm": 2.1874496936798096,
+ "learning_rate": 3.5440369413516474e-06,
+ "loss": 0.0312,
+ "step": 26853
+ },
+ {
+ "epoch": 73.1716621253406,
+ "grad_norm": 2.985170841217041,
+ "learning_rate": 3.5433630239896064e-06,
+ "loss": 0.0884,
+ "step": 26854
+ },
+ {
+ "epoch": 73.17438692098092,
+ "grad_norm": 2.814131736755371,
+ "learning_rate": 3.542689156911647e-06,
+ "loss": 0.0693,
+ "step": 26855
+ },
+ {
+ "epoch": 73.17711171662125,
+ "grad_norm": 2.8599281311035156,
+ "learning_rate": 3.542015340123016e-06,
+ "loss": 0.0653,
+ "step": 26856
+ },
+ {
+ "epoch": 73.17983651226157,
+ "grad_norm": 2.7674167156219482,
+ "learning_rate": 3.541341573628958e-06,
+ "loss": 0.1506,
+ "step": 26857
+ },
+ {
+ "epoch": 73.1825613079019,
+ "grad_norm": 4.389822483062744,
+ "learning_rate": 3.5406678574347287e-06,
+ "loss": 0.0493,
+ "step": 26858
+ },
+ {
+ "epoch": 73.18528610354224,
+ "grad_norm": 2.5432190895080566,
+ "learning_rate": 3.5399941915455695e-06,
+ "loss": 0.0734,
+ "step": 26859
+ },
+ {
+ "epoch": 73.18801089918256,
+ "grad_norm": 3.0489144325256348,
+ "learning_rate": 3.5393205759667237e-06,
+ "loss": 0.2063,
+ "step": 26860
+ },
+ {
+ "epoch": 73.19073569482289,
+ "grad_norm": 3.039339303970337,
+ "learning_rate": 3.5386470107034443e-06,
+ "loss": 0.1709,
+ "step": 26861
+ },
+ {
+ "epoch": 73.19346049046321,
+ "grad_norm": 2.7697556018829346,
+ "learning_rate": 3.5379734957609748e-06,
+ "loss": 0.048,
+ "step": 26862
+ },
+ {
+ "epoch": 73.19618528610354,
+ "grad_norm": 2.4593348503112793,
+ "learning_rate": 3.5373000311445604e-06,
+ "loss": 0.0749,
+ "step": 26863
+ },
+ {
+ "epoch": 73.19891008174388,
+ "grad_norm": 2.915950059890747,
+ "learning_rate": 3.536626616859441e-06,
+ "loss": 0.0623,
+ "step": 26864
+ },
+ {
+ "epoch": 73.2016348773842,
+ "grad_norm": 3.1317269802093506,
+ "learning_rate": 3.5359532529108687e-06,
+ "loss": 0.1221,
+ "step": 26865
+ },
+ {
+ "epoch": 73.20435967302453,
+ "grad_norm": 3.3596508502960205,
+ "learning_rate": 3.535279939304085e-06,
+ "loss": 0.1033,
+ "step": 26866
+ },
+ {
+ "epoch": 73.20708446866485,
+ "grad_norm": 3.8590259552001953,
+ "learning_rate": 3.53460667604433e-06,
+ "loss": 0.1652,
+ "step": 26867
+ },
+ {
+ "epoch": 73.20980926430518,
+ "grad_norm": 2.1116504669189453,
+ "learning_rate": 3.5339334631368527e-06,
+ "loss": 0.037,
+ "step": 26868
+ },
+ {
+ "epoch": 73.2125340599455,
+ "grad_norm": 2.5465245246887207,
+ "learning_rate": 3.5332603005868906e-06,
+ "loss": 0.2003,
+ "step": 26869
+ },
+ {
+ "epoch": 73.21525885558583,
+ "grad_norm": 4.480618953704834,
+ "learning_rate": 3.532587188399692e-06,
+ "loss": 0.0864,
+ "step": 26870
+ },
+ {
+ "epoch": 73.21798365122616,
+ "grad_norm": 4.117570877075195,
+ "learning_rate": 3.531914126580497e-06,
+ "loss": 0.0868,
+ "step": 26871
+ },
+ {
+ "epoch": 73.22070844686648,
+ "grad_norm": 2.355170488357544,
+ "learning_rate": 3.531241115134546e-06,
+ "loss": 0.0279,
+ "step": 26872
+ },
+ {
+ "epoch": 73.22343324250681,
+ "grad_norm": 4.68784236907959,
+ "learning_rate": 3.530568154067078e-06,
+ "loss": 0.038,
+ "step": 26873
+ },
+ {
+ "epoch": 73.22615803814713,
+ "grad_norm": 1.8216328620910645,
+ "learning_rate": 3.52989524338334e-06,
+ "loss": 0.031,
+ "step": 26874
+ },
+ {
+ "epoch": 73.22888283378747,
+ "grad_norm": 3.390501022338867,
+ "learning_rate": 3.5292223830885696e-06,
+ "loss": 0.0874,
+ "step": 26875
+ },
+ {
+ "epoch": 73.2316076294278,
+ "grad_norm": 2.6133570671081543,
+ "learning_rate": 3.528549573188007e-06,
+ "loss": 0.0349,
+ "step": 26876
+ },
+ {
+ "epoch": 73.23433242506812,
+ "grad_norm": 2.759392499923706,
+ "learning_rate": 3.527876813686889e-06,
+ "loss": 0.074,
+ "step": 26877
+ },
+ {
+ "epoch": 73.23705722070845,
+ "grad_norm": 3.0409185886383057,
+ "learning_rate": 3.5272041045904615e-06,
+ "loss": 0.0486,
+ "step": 26878
+ },
+ {
+ "epoch": 73.23978201634877,
+ "grad_norm": 3.128284215927124,
+ "learning_rate": 3.52653144590396e-06,
+ "loss": 0.0843,
+ "step": 26879
+ },
+ {
+ "epoch": 73.2425068119891,
+ "grad_norm": 4.041402339935303,
+ "learning_rate": 3.5258588376326198e-06,
+ "loss": 0.098,
+ "step": 26880
+ },
+ {
+ "epoch": 73.24523160762942,
+ "grad_norm": 2.9336047172546387,
+ "learning_rate": 3.525186279781686e-06,
+ "loss": 0.0996,
+ "step": 26881
+ },
+ {
+ "epoch": 73.24795640326975,
+ "grad_norm": 2.2768266201019287,
+ "learning_rate": 3.524513772356393e-06,
+ "loss": 0.0269,
+ "step": 26882
+ },
+ {
+ "epoch": 73.25068119891009,
+ "grad_norm": 2.5622401237487793,
+ "learning_rate": 3.5238413153619788e-06,
+ "loss": 0.028,
+ "step": 26883
+ },
+ {
+ "epoch": 73.2534059945504,
+ "grad_norm": 2.184340715408325,
+ "learning_rate": 3.5231689088036757e-06,
+ "loss": 0.0284,
+ "step": 26884
+ },
+ {
+ "epoch": 73.25613079019074,
+ "grad_norm": 3.16709566116333,
+ "learning_rate": 3.522496552686725e-06,
+ "loss": 0.0851,
+ "step": 26885
+ },
+ {
+ "epoch": 73.25885558583106,
+ "grad_norm": 3.5944974422454834,
+ "learning_rate": 3.5218242470163667e-06,
+ "loss": 0.0303,
+ "step": 26886
+ },
+ {
+ "epoch": 73.26158038147139,
+ "grad_norm": 2.809340476989746,
+ "learning_rate": 3.521151991797832e-06,
+ "loss": 0.0643,
+ "step": 26887
+ },
+ {
+ "epoch": 73.26430517711172,
+ "grad_norm": 2.621263027191162,
+ "learning_rate": 3.5204797870363573e-06,
+ "loss": 0.0615,
+ "step": 26888
+ },
+ {
+ "epoch": 73.26702997275204,
+ "grad_norm": 2.7322444915771484,
+ "learning_rate": 3.5198076327371744e-06,
+ "loss": 0.0627,
+ "step": 26889
+ },
+ {
+ "epoch": 73.26975476839237,
+ "grad_norm": 3.0294265747070312,
+ "learning_rate": 3.519135528905524e-06,
+ "loss": 0.1357,
+ "step": 26890
+ },
+ {
+ "epoch": 73.2724795640327,
+ "grad_norm": 2.9210681915283203,
+ "learning_rate": 3.5184634755466374e-06,
+ "loss": 0.0312,
+ "step": 26891
+ },
+ {
+ "epoch": 73.27520435967303,
+ "grad_norm": 2.321434736251831,
+ "learning_rate": 3.5177914726657493e-06,
+ "loss": 0.0318,
+ "step": 26892
+ },
+ {
+ "epoch": 73.27792915531334,
+ "grad_norm": 2.2671425342559814,
+ "learning_rate": 3.5171195202680887e-06,
+ "loss": 0.0356,
+ "step": 26893
+ },
+ {
+ "epoch": 73.28065395095368,
+ "grad_norm": 2.8914756774902344,
+ "learning_rate": 3.516447618358896e-06,
+ "loss": 0.0507,
+ "step": 26894
+ },
+ {
+ "epoch": 73.28337874659401,
+ "grad_norm": 2.2265446186065674,
+ "learning_rate": 3.5157757669434e-06,
+ "loss": 0.1225,
+ "step": 26895
+ },
+ {
+ "epoch": 73.28610354223433,
+ "grad_norm": 2.8981120586395264,
+ "learning_rate": 3.515103966026835e-06,
+ "loss": 0.1077,
+ "step": 26896
+ },
+ {
+ "epoch": 73.28882833787466,
+ "grad_norm": 4.0132646560668945,
+ "learning_rate": 3.5144322156144274e-06,
+ "loss": 0.0407,
+ "step": 26897
+ },
+ {
+ "epoch": 73.29155313351498,
+ "grad_norm": 2.233222007751465,
+ "learning_rate": 3.5137605157114164e-06,
+ "loss": 0.0305,
+ "step": 26898
+ },
+ {
+ "epoch": 73.29427792915531,
+ "grad_norm": 1.9654173851013184,
+ "learning_rate": 3.51308886632303e-06,
+ "loss": 0.0269,
+ "step": 26899
+ },
+ {
+ "epoch": 73.29700272479565,
+ "grad_norm": 2.161252975463867,
+ "learning_rate": 3.512417267454499e-06,
+ "loss": 0.0472,
+ "step": 26900
+ },
+ {
+ "epoch": 73.29972752043597,
+ "grad_norm": 2.825688123703003,
+ "learning_rate": 3.5117457191110495e-06,
+ "loss": 0.0636,
+ "step": 26901
+ },
+ {
+ "epoch": 73.3024523160763,
+ "grad_norm": 3.0534720420837402,
+ "learning_rate": 3.5110742212979156e-06,
+ "loss": 0.052,
+ "step": 26902
+ },
+ {
+ "epoch": 73.30517711171662,
+ "grad_norm": 2.1501169204711914,
+ "learning_rate": 3.5104027740203305e-06,
+ "loss": 0.0364,
+ "step": 26903
+ },
+ {
+ "epoch": 73.30790190735695,
+ "grad_norm": 2.993039608001709,
+ "learning_rate": 3.5097313772835195e-06,
+ "loss": 0.0481,
+ "step": 26904
+ },
+ {
+ "epoch": 73.31062670299727,
+ "grad_norm": 3.8253333568573,
+ "learning_rate": 3.509060031092708e-06,
+ "loss": 0.0461,
+ "step": 26905
+ },
+ {
+ "epoch": 73.3133514986376,
+ "grad_norm": 1.8563841581344604,
+ "learning_rate": 3.508388735453132e-06,
+ "loss": 0.0314,
+ "step": 26906
+ },
+ {
+ "epoch": 73.31607629427793,
+ "grad_norm": 2.2914717197418213,
+ "learning_rate": 3.507717490370015e-06,
+ "loss": 0.0321,
+ "step": 26907
+ },
+ {
+ "epoch": 73.31880108991825,
+ "grad_norm": 3.319343328475952,
+ "learning_rate": 3.507046295848585e-06,
+ "loss": 0.0388,
+ "step": 26908
+ },
+ {
+ "epoch": 73.32152588555859,
+ "grad_norm": 2.9802682399749756,
+ "learning_rate": 3.506375151894067e-06,
+ "loss": 0.0704,
+ "step": 26909
+ },
+ {
+ "epoch": 73.3242506811989,
+ "grad_norm": 3.0829756259918213,
+ "learning_rate": 3.505704058511694e-06,
+ "loss": 0.0415,
+ "step": 26910
+ },
+ {
+ "epoch": 73.32697547683924,
+ "grad_norm": 3.8320634365081787,
+ "learning_rate": 3.505033015706688e-06,
+ "loss": 0.1334,
+ "step": 26911
+ },
+ {
+ "epoch": 73.32970027247957,
+ "grad_norm": 4.733470916748047,
+ "learning_rate": 3.5043620234842757e-06,
+ "loss": 0.072,
+ "step": 26912
+ },
+ {
+ "epoch": 73.33242506811989,
+ "grad_norm": 2.269888401031494,
+ "learning_rate": 3.5036910818496792e-06,
+ "loss": 0.0341,
+ "step": 26913
+ },
+ {
+ "epoch": 73.33514986376022,
+ "grad_norm": 2.475080966949463,
+ "learning_rate": 3.5030201908081316e-06,
+ "loss": 0.2342,
+ "step": 26914
+ },
+ {
+ "epoch": 73.33787465940054,
+ "grad_norm": 3.1076841354370117,
+ "learning_rate": 3.5023493503648543e-06,
+ "loss": 0.0559,
+ "step": 26915
+ },
+ {
+ "epoch": 73.34059945504087,
+ "grad_norm": 4.108279705047607,
+ "learning_rate": 3.5016785605250702e-06,
+ "loss": 0.0649,
+ "step": 26916
+ },
+ {
+ "epoch": 73.34332425068119,
+ "grad_norm": 3.272644519805908,
+ "learning_rate": 3.5010078212940012e-06,
+ "loss": 0.0421,
+ "step": 26917
+ },
+ {
+ "epoch": 73.34604904632153,
+ "grad_norm": 2.5600414276123047,
+ "learning_rate": 3.5003371326768778e-06,
+ "loss": 0.0698,
+ "step": 26918
+ },
+ {
+ "epoch": 73.34877384196186,
+ "grad_norm": 3.030984878540039,
+ "learning_rate": 3.499666494678915e-06,
+ "loss": 0.0685,
+ "step": 26919
+ },
+ {
+ "epoch": 73.35149863760218,
+ "grad_norm": 2.884631395339966,
+ "learning_rate": 3.4989959073053447e-06,
+ "loss": 0.0444,
+ "step": 26920
+ },
+ {
+ "epoch": 73.35422343324251,
+ "grad_norm": 5.614757537841797,
+ "learning_rate": 3.498325370561385e-06,
+ "loss": 0.0651,
+ "step": 26921
+ },
+ {
+ "epoch": 73.35694822888283,
+ "grad_norm": 3.0250747203826904,
+ "learning_rate": 3.497654884452254e-06,
+ "loss": 0.092,
+ "step": 26922
+ },
+ {
+ "epoch": 73.35967302452316,
+ "grad_norm": 2.085069179534912,
+ "learning_rate": 3.4969844489831817e-06,
+ "loss": 0.0547,
+ "step": 26923
+ },
+ {
+ "epoch": 73.3623978201635,
+ "grad_norm": 2.7650771141052246,
+ "learning_rate": 3.496314064159385e-06,
+ "loss": 0.0411,
+ "step": 26924
+ },
+ {
+ "epoch": 73.36512261580381,
+ "grad_norm": 4.291244029998779,
+ "learning_rate": 3.495643729986081e-06,
+ "loss": 0.1238,
+ "step": 26925
+ },
+ {
+ "epoch": 73.36784741144415,
+ "grad_norm": 3.3603227138519287,
+ "learning_rate": 3.494973446468499e-06,
+ "loss": 0.1567,
+ "step": 26926
+ },
+ {
+ "epoch": 73.37057220708446,
+ "grad_norm": 2.3697690963745117,
+ "learning_rate": 3.4943032136118537e-06,
+ "loss": 0.1454,
+ "step": 26927
+ },
+ {
+ "epoch": 73.3732970027248,
+ "grad_norm": 2.098708391189575,
+ "learning_rate": 3.493633031421365e-06,
+ "loss": 0.0315,
+ "step": 26928
+ },
+ {
+ "epoch": 73.37602179836512,
+ "grad_norm": 2.689488410949707,
+ "learning_rate": 3.4929628999022502e-06,
+ "loss": 0.0404,
+ "step": 26929
+ },
+ {
+ "epoch": 73.37874659400545,
+ "grad_norm": 2.8799092769622803,
+ "learning_rate": 3.492292819059734e-06,
+ "loss": 0.055,
+ "step": 26930
+ },
+ {
+ "epoch": 73.38147138964578,
+ "grad_norm": 5.110519886016846,
+ "learning_rate": 3.491622788899033e-06,
+ "loss": 0.0582,
+ "step": 26931
+ },
+ {
+ "epoch": 73.3841961852861,
+ "grad_norm": 2.9135501384735107,
+ "learning_rate": 3.490952809425363e-06,
+ "loss": 0.0838,
+ "step": 26932
+ },
+ {
+ "epoch": 73.38692098092643,
+ "grad_norm": 3.180020570755005,
+ "learning_rate": 3.4902828806439394e-06,
+ "loss": 0.1259,
+ "step": 26933
+ },
+ {
+ "epoch": 73.38964577656675,
+ "grad_norm": 2.6474556922912598,
+ "learning_rate": 3.4896130025599874e-06,
+ "loss": 0.0837,
+ "step": 26934
+ },
+ {
+ "epoch": 73.39237057220708,
+ "grad_norm": 2.575450897216797,
+ "learning_rate": 3.4889431751787195e-06,
+ "loss": 0.0458,
+ "step": 26935
+ },
+ {
+ "epoch": 73.39509536784742,
+ "grad_norm": 2.345289468765259,
+ "learning_rate": 3.4882733985053487e-06,
+ "loss": 0.0453,
+ "step": 26936
+ },
+ {
+ "epoch": 73.39782016348774,
+ "grad_norm": 2.388676881790161,
+ "learning_rate": 3.4876036725450992e-06,
+ "loss": 0.0397,
+ "step": 26937
+ },
+ {
+ "epoch": 73.40054495912807,
+ "grad_norm": 2.2997653484344482,
+ "learning_rate": 3.486933997303179e-06,
+ "loss": 0.0381,
+ "step": 26938
+ },
+ {
+ "epoch": 73.40326975476839,
+ "grad_norm": 3.0745630264282227,
+ "learning_rate": 3.486264372784811e-06,
+ "loss": 0.0784,
+ "step": 26939
+ },
+ {
+ "epoch": 73.40599455040872,
+ "grad_norm": 2.604595899581909,
+ "learning_rate": 3.4855947989952054e-06,
+ "loss": 0.0541,
+ "step": 26940
+ },
+ {
+ "epoch": 73.40871934604904,
+ "grad_norm": 2.5068633556365967,
+ "learning_rate": 3.484925275939579e-06,
+ "loss": 0.082,
+ "step": 26941
+ },
+ {
+ "epoch": 73.41144414168937,
+ "grad_norm": 3.6491236686706543,
+ "learning_rate": 3.484255803623141e-06,
+ "loss": 0.0739,
+ "step": 26942
+ },
+ {
+ "epoch": 73.4141689373297,
+ "grad_norm": 2.814690351486206,
+ "learning_rate": 3.483586382051113e-06,
+ "loss": 0.1959,
+ "step": 26943
+ },
+ {
+ "epoch": 73.41689373297002,
+ "grad_norm": 3.3637218475341797,
+ "learning_rate": 3.4829170112287037e-06,
+ "loss": 0.0246,
+ "step": 26944
+ },
+ {
+ "epoch": 73.41961852861036,
+ "grad_norm": 3.7373859882354736,
+ "learning_rate": 3.4822476911611236e-06,
+ "loss": 0.0738,
+ "step": 26945
+ },
+ {
+ "epoch": 73.42234332425068,
+ "grad_norm": 2.808173894882202,
+ "learning_rate": 3.481578421853593e-06,
+ "loss": 0.2099,
+ "step": 26946
+ },
+ {
+ "epoch": 73.42506811989101,
+ "grad_norm": 4.274862289428711,
+ "learning_rate": 3.480909203311319e-06,
+ "loss": 0.2475,
+ "step": 26947
+ },
+ {
+ "epoch": 73.42779291553134,
+ "grad_norm": 3.3537137508392334,
+ "learning_rate": 3.480240035539515e-06,
+ "loss": 0.1645,
+ "step": 26948
+ },
+ {
+ "epoch": 73.43051771117166,
+ "grad_norm": 8.587748527526855,
+ "learning_rate": 3.479570918543388e-06,
+ "loss": 0.0923,
+ "step": 26949
+ },
+ {
+ "epoch": 73.433242506812,
+ "grad_norm": 2.934614896774292,
+ "learning_rate": 3.478901852328156e-06,
+ "loss": 0.0681,
+ "step": 26950
+ },
+ {
+ "epoch": 73.43596730245231,
+ "grad_norm": 3.0182249546051025,
+ "learning_rate": 3.478232836899026e-06,
+ "loss": 0.2357,
+ "step": 26951
+ },
+ {
+ "epoch": 73.43869209809264,
+ "grad_norm": 2.791226387023926,
+ "learning_rate": 3.4775638722612095e-06,
+ "loss": 0.0634,
+ "step": 26952
+ },
+ {
+ "epoch": 73.44141689373296,
+ "grad_norm": 4.563493251800537,
+ "learning_rate": 3.4768949584199118e-06,
+ "loss": 0.0832,
+ "step": 26953
+ },
+ {
+ "epoch": 73.4441416893733,
+ "grad_norm": 2.327061891555786,
+ "learning_rate": 3.476226095380347e-06,
+ "loss": 0.0479,
+ "step": 26954
+ },
+ {
+ "epoch": 73.44686648501363,
+ "grad_norm": 4.2786149978637695,
+ "learning_rate": 3.4755572831477267e-06,
+ "loss": 0.0615,
+ "step": 26955
+ },
+ {
+ "epoch": 73.44959128065395,
+ "grad_norm": 3.3000879287719727,
+ "learning_rate": 3.4748885217272554e-06,
+ "loss": 0.0679,
+ "step": 26956
+ },
+ {
+ "epoch": 73.45231607629428,
+ "grad_norm": 3.506911039352417,
+ "learning_rate": 3.4742198111241434e-06,
+ "loss": 0.1641,
+ "step": 26957
+ },
+ {
+ "epoch": 73.4550408719346,
+ "grad_norm": 2.9512298107147217,
+ "learning_rate": 3.473551151343594e-06,
+ "loss": 0.0411,
+ "step": 26958
+ },
+ {
+ "epoch": 73.45776566757493,
+ "grad_norm": 1.7537989616394043,
+ "learning_rate": 3.472882542390821e-06,
+ "loss": 0.024,
+ "step": 26959
+ },
+ {
+ "epoch": 73.46049046321527,
+ "grad_norm": 3.0269646644592285,
+ "learning_rate": 3.472213984271028e-06,
+ "loss": 0.0323,
+ "step": 26960
+ },
+ {
+ "epoch": 73.46321525885558,
+ "grad_norm": 2.1651768684387207,
+ "learning_rate": 3.471545476989423e-06,
+ "loss": 0.0435,
+ "step": 26961
+ },
+ {
+ "epoch": 73.46594005449592,
+ "grad_norm": 9.547691345214844,
+ "learning_rate": 3.470877020551209e-06,
+ "loss": 0.0543,
+ "step": 26962
+ },
+ {
+ "epoch": 73.46866485013624,
+ "grad_norm": 3.3503215312957764,
+ "learning_rate": 3.4702086149615975e-06,
+ "loss": 0.0611,
+ "step": 26963
+ },
+ {
+ "epoch": 73.47138964577657,
+ "grad_norm": 2.7280259132385254,
+ "learning_rate": 3.469540260225791e-06,
+ "loss": 0.0358,
+ "step": 26964
+ },
+ {
+ "epoch": 73.47411444141689,
+ "grad_norm": 2.4752163887023926,
+ "learning_rate": 3.468871956348995e-06,
+ "loss": 0.0427,
+ "step": 26965
+ },
+ {
+ "epoch": 73.47683923705722,
+ "grad_norm": 3.0498499870300293,
+ "learning_rate": 3.4682037033364115e-06,
+ "loss": 0.0215,
+ "step": 26966
+ },
+ {
+ "epoch": 73.47956403269755,
+ "grad_norm": 2.865424394607544,
+ "learning_rate": 3.4675355011932486e-06,
+ "loss": 0.0552,
+ "step": 26967
+ },
+ {
+ "epoch": 73.48228882833787,
+ "grad_norm": 2.940736770629883,
+ "learning_rate": 3.4668673499247108e-06,
+ "loss": 0.0393,
+ "step": 26968
+ },
+ {
+ "epoch": 73.4850136239782,
+ "grad_norm": 3.774017095565796,
+ "learning_rate": 3.4661992495359953e-06,
+ "loss": 0.0905,
+ "step": 26969
+ },
+ {
+ "epoch": 73.48773841961852,
+ "grad_norm": 3.683938503265381,
+ "learning_rate": 3.4655312000323137e-06,
+ "loss": 0.0574,
+ "step": 26970
+ },
+ {
+ "epoch": 73.49046321525886,
+ "grad_norm": 2.332352876663208,
+ "learning_rate": 3.464863201418861e-06,
+ "loss": 0.0668,
+ "step": 26971
+ },
+ {
+ "epoch": 73.49318801089919,
+ "grad_norm": 6.582822799682617,
+ "learning_rate": 3.464195253700847e-06,
+ "loss": 0.0527,
+ "step": 26972
+ },
+ {
+ "epoch": 73.49591280653951,
+ "grad_norm": 2.8384523391723633,
+ "learning_rate": 3.4635273568834703e-06,
+ "loss": 0.1161,
+ "step": 26973
+ },
+ {
+ "epoch": 73.49863760217984,
+ "grad_norm": 2.0593514442443848,
+ "learning_rate": 3.4628595109719286e-06,
+ "loss": 0.0277,
+ "step": 26974
+ },
+ {
+ "epoch": 73.50136239782016,
+ "grad_norm": 2.9547767639160156,
+ "learning_rate": 3.46219171597143e-06,
+ "loss": 0.0347,
+ "step": 26975
+ },
+ {
+ "epoch": 73.50408719346049,
+ "grad_norm": 3.8641443252563477,
+ "learning_rate": 3.4615239718871718e-06,
+ "loss": 0.0797,
+ "step": 26976
+ },
+ {
+ "epoch": 73.50681198910081,
+ "grad_norm": 3.758315324783325,
+ "learning_rate": 3.460856278724355e-06,
+ "loss": 0.1119,
+ "step": 26977
+ },
+ {
+ "epoch": 73.50953678474114,
+ "grad_norm": 3.827413320541382,
+ "learning_rate": 3.4601886364881754e-06,
+ "loss": 0.0715,
+ "step": 26978
+ },
+ {
+ "epoch": 73.51226158038148,
+ "grad_norm": 3.5978944301605225,
+ "learning_rate": 3.459521045183839e-06,
+ "loss": 0.0527,
+ "step": 26979
+ },
+ {
+ "epoch": 73.5149863760218,
+ "grad_norm": 3.1433017253875732,
+ "learning_rate": 3.4588535048165427e-06,
+ "loss": 0.1333,
+ "step": 26980
+ },
+ {
+ "epoch": 73.51771117166213,
+ "grad_norm": 3.6058473587036133,
+ "learning_rate": 3.4581860153914846e-06,
+ "loss": 0.0464,
+ "step": 26981
+ },
+ {
+ "epoch": 73.52043596730245,
+ "grad_norm": 3.056950092315674,
+ "learning_rate": 3.4575185769138596e-06,
+ "loss": 0.0651,
+ "step": 26982
+ },
+ {
+ "epoch": 73.52316076294278,
+ "grad_norm": 2.929863691329956,
+ "learning_rate": 3.4568511893888734e-06,
+ "loss": 0.066,
+ "step": 26983
+ },
+ {
+ "epoch": 73.52588555858311,
+ "grad_norm": 2.9831643104553223,
+ "learning_rate": 3.4561838528217197e-06,
+ "loss": 0.1566,
+ "step": 26984
+ },
+ {
+ "epoch": 73.52861035422343,
+ "grad_norm": 3.8312771320343018,
+ "learning_rate": 3.455516567217595e-06,
+ "loss": 0.0826,
+ "step": 26985
+ },
+ {
+ "epoch": 73.53133514986376,
+ "grad_norm": 3.1933791637420654,
+ "learning_rate": 3.4548493325816933e-06,
+ "loss": 0.0866,
+ "step": 26986
+ },
+ {
+ "epoch": 73.53405994550408,
+ "grad_norm": 2.4331719875335693,
+ "learning_rate": 3.4541821489192175e-06,
+ "loss": 0.0262,
+ "step": 26987
+ },
+ {
+ "epoch": 73.53678474114442,
+ "grad_norm": 2.7866642475128174,
+ "learning_rate": 3.453515016235357e-06,
+ "loss": 0.0759,
+ "step": 26988
+ },
+ {
+ "epoch": 73.53950953678473,
+ "grad_norm": 3.1756632328033447,
+ "learning_rate": 3.452847934535315e-06,
+ "loss": 0.0363,
+ "step": 26989
+ },
+ {
+ "epoch": 73.54223433242507,
+ "grad_norm": 4.05295991897583,
+ "learning_rate": 3.452180903824279e-06,
+ "loss": 0.1147,
+ "step": 26990
+ },
+ {
+ "epoch": 73.5449591280654,
+ "grad_norm": 3.641073226928711,
+ "learning_rate": 3.4515139241074504e-06,
+ "loss": 0.0383,
+ "step": 26991
+ },
+ {
+ "epoch": 73.54768392370572,
+ "grad_norm": 2.5837535858154297,
+ "learning_rate": 3.4508469953900205e-06,
+ "loss": 0.0386,
+ "step": 26992
+ },
+ {
+ "epoch": 73.55040871934605,
+ "grad_norm": 3.5125057697296143,
+ "learning_rate": 3.4501801176771844e-06,
+ "loss": 0.0497,
+ "step": 26993
+ },
+ {
+ "epoch": 73.55313351498637,
+ "grad_norm": 4.435265064239502,
+ "learning_rate": 3.44951329097413e-06,
+ "loss": 0.1471,
+ "step": 26994
+ },
+ {
+ "epoch": 73.5558583106267,
+ "grad_norm": 2.2139368057250977,
+ "learning_rate": 3.4488465152860593e-06,
+ "loss": 0.0328,
+ "step": 26995
+ },
+ {
+ "epoch": 73.55858310626704,
+ "grad_norm": 2.945382833480835,
+ "learning_rate": 3.4481797906181613e-06,
+ "loss": 0.0815,
+ "step": 26996
+ },
+ {
+ "epoch": 73.56130790190736,
+ "grad_norm": 3.154387950897217,
+ "learning_rate": 3.4475131169756284e-06,
+ "loss": 0.1188,
+ "step": 26997
+ },
+ {
+ "epoch": 73.56403269754769,
+ "grad_norm": 2.3312432765960693,
+ "learning_rate": 3.4468464943636483e-06,
+ "loss": 0.083,
+ "step": 26998
+ },
+ {
+ "epoch": 73.566757493188,
+ "grad_norm": 3.159672260284424,
+ "learning_rate": 3.4461799227874204e-06,
+ "loss": 0.0406,
+ "step": 26999
+ },
+ {
+ "epoch": 73.56948228882834,
+ "grad_norm": 4.261843681335449,
+ "learning_rate": 3.445513402252132e-06,
+ "loss": 0.0729,
+ "step": 27000
+ },
+ {
+ "epoch": 73.57220708446866,
+ "grad_norm": 2.7450103759765625,
+ "learning_rate": 3.444846932762975e-06,
+ "loss": 0.0806,
+ "step": 27001
+ },
+ {
+ "epoch": 73.57493188010899,
+ "grad_norm": 2.718365430831909,
+ "learning_rate": 3.444180514325135e-06,
+ "loss": 0.0262,
+ "step": 27002
+ },
+ {
+ "epoch": 73.57765667574932,
+ "grad_norm": 3.1965343952178955,
+ "learning_rate": 3.4435141469438103e-06,
+ "loss": 0.0765,
+ "step": 27003
+ },
+ {
+ "epoch": 73.58038147138964,
+ "grad_norm": 2.8067641258239746,
+ "learning_rate": 3.442847830624186e-06,
+ "loss": 0.0713,
+ "step": 27004
+ },
+ {
+ "epoch": 73.58310626702998,
+ "grad_norm": 3.0505402088165283,
+ "learning_rate": 3.4421815653714487e-06,
+ "loss": 0.2842,
+ "step": 27005
+ },
+ {
+ "epoch": 73.5858310626703,
+ "grad_norm": 5.876389503479004,
+ "learning_rate": 3.4415153511907928e-06,
+ "loss": 0.1074,
+ "step": 27006
+ },
+ {
+ "epoch": 73.58855585831063,
+ "grad_norm": 2.9681506156921387,
+ "learning_rate": 3.440849188087402e-06,
+ "loss": 0.0418,
+ "step": 27007
+ },
+ {
+ "epoch": 73.59128065395096,
+ "grad_norm": 3.5146090984344482,
+ "learning_rate": 3.440183076066469e-06,
+ "loss": 0.0464,
+ "step": 27008
+ },
+ {
+ "epoch": 73.59400544959128,
+ "grad_norm": 2.744197368621826,
+ "learning_rate": 3.43951701513318e-06,
+ "loss": 0.046,
+ "step": 27009
+ },
+ {
+ "epoch": 73.59673024523161,
+ "grad_norm": 3.572244882583618,
+ "learning_rate": 3.438851005292717e-06,
+ "loss": 0.0952,
+ "step": 27010
+ },
+ {
+ "epoch": 73.59945504087193,
+ "grad_norm": 4.2489776611328125,
+ "learning_rate": 3.438185046550275e-06,
+ "loss": 0.1632,
+ "step": 27011
+ },
+ {
+ "epoch": 73.60217983651226,
+ "grad_norm": 3.1429290771484375,
+ "learning_rate": 3.4375191389110376e-06,
+ "loss": 0.0349,
+ "step": 27012
+ },
+ {
+ "epoch": 73.60490463215258,
+ "grad_norm": 1.8757532835006714,
+ "learning_rate": 3.4368532823801893e-06,
+ "loss": 0.0264,
+ "step": 27013
+ },
+ {
+ "epoch": 73.60762942779292,
+ "grad_norm": 2.5090415477752686,
+ "learning_rate": 3.4361874769629123e-06,
+ "loss": 0.1728,
+ "step": 27014
+ },
+ {
+ "epoch": 73.61035422343325,
+ "grad_norm": 3.9638609886169434,
+ "learning_rate": 3.4355217226644e-06,
+ "loss": 0.0622,
+ "step": 27015
+ },
+ {
+ "epoch": 73.61307901907357,
+ "grad_norm": 2.4548087120056152,
+ "learning_rate": 3.434856019489833e-06,
+ "loss": 0.0261,
+ "step": 27016
+ },
+ {
+ "epoch": 73.6158038147139,
+ "grad_norm": 1.9381762742996216,
+ "learning_rate": 3.4341903674443967e-06,
+ "loss": 0.0293,
+ "step": 27017
+ },
+ {
+ "epoch": 73.61852861035422,
+ "grad_norm": 3.3661253452301025,
+ "learning_rate": 3.4335247665332704e-06,
+ "loss": 0.1087,
+ "step": 27018
+ },
+ {
+ "epoch": 73.62125340599455,
+ "grad_norm": 2.90206241607666,
+ "learning_rate": 3.432859216761645e-06,
+ "loss": 0.1134,
+ "step": 27019
+ },
+ {
+ "epoch": 73.62397820163488,
+ "grad_norm": 3.3400230407714844,
+ "learning_rate": 3.432193718134701e-06,
+ "loss": 0.0483,
+ "step": 27020
+ },
+ {
+ "epoch": 73.6267029972752,
+ "grad_norm": 2.2868094444274902,
+ "learning_rate": 3.4315282706576215e-06,
+ "loss": 0.0374,
+ "step": 27021
+ },
+ {
+ "epoch": 73.62942779291554,
+ "grad_norm": 2.2642598152160645,
+ "learning_rate": 3.430862874335584e-06,
+ "loss": 0.0415,
+ "step": 27022
+ },
+ {
+ "epoch": 73.63215258855585,
+ "grad_norm": 2.777907609939575,
+ "learning_rate": 3.4301975291737756e-06,
+ "loss": 0.0542,
+ "step": 27023
+ },
+ {
+ "epoch": 73.63487738419619,
+ "grad_norm": 3.489509344100952,
+ "learning_rate": 3.4295322351773807e-06,
+ "loss": 0.0942,
+ "step": 27024
+ },
+ {
+ "epoch": 73.6376021798365,
+ "grad_norm": 2.6100316047668457,
+ "learning_rate": 3.4288669923515784e-06,
+ "loss": 0.1175,
+ "step": 27025
+ },
+ {
+ "epoch": 73.64032697547684,
+ "grad_norm": 2.0358309745788574,
+ "learning_rate": 3.4282018007015472e-06,
+ "loss": 0.0279,
+ "step": 27026
+ },
+ {
+ "epoch": 73.64305177111717,
+ "grad_norm": 2.29683518409729,
+ "learning_rate": 3.4275366602324654e-06,
+ "loss": 0.0857,
+ "step": 27027
+ },
+ {
+ "epoch": 73.64577656675749,
+ "grad_norm": 5.21312141418457,
+ "learning_rate": 3.4268715709495203e-06,
+ "loss": 0.0718,
+ "step": 27028
+ },
+ {
+ "epoch": 73.64850136239782,
+ "grad_norm": 2.5061144828796387,
+ "learning_rate": 3.4262065328578876e-06,
+ "loss": 0.1363,
+ "step": 27029
+ },
+ {
+ "epoch": 73.65122615803814,
+ "grad_norm": 4.060135841369629,
+ "learning_rate": 3.4255415459627473e-06,
+ "loss": 0.1865,
+ "step": 27030
+ },
+ {
+ "epoch": 73.65395095367847,
+ "grad_norm": 4.575860023498535,
+ "learning_rate": 3.4248766102692744e-06,
+ "loss": 0.0757,
+ "step": 27031
+ },
+ {
+ "epoch": 73.65667574931881,
+ "grad_norm": 3.948610305786133,
+ "learning_rate": 3.4242117257826536e-06,
+ "loss": 0.0531,
+ "step": 27032
+ },
+ {
+ "epoch": 73.65940054495913,
+ "grad_norm": 5.607536315917969,
+ "learning_rate": 3.4235468925080607e-06,
+ "loss": 0.0486,
+ "step": 27033
+ },
+ {
+ "epoch": 73.66212534059946,
+ "grad_norm": 2.4876418113708496,
+ "learning_rate": 3.4228821104506694e-06,
+ "loss": 0.142,
+ "step": 27034
+ },
+ {
+ "epoch": 73.66485013623978,
+ "grad_norm": 3.045175313949585,
+ "learning_rate": 3.4222173796156643e-06,
+ "loss": 0.3281,
+ "step": 27035
+ },
+ {
+ "epoch": 73.66757493188011,
+ "grad_norm": 1.4952892065048218,
+ "learning_rate": 3.4215527000082183e-06,
+ "loss": 0.0228,
+ "step": 27036
+ },
+ {
+ "epoch": 73.67029972752043,
+ "grad_norm": 2.856586456298828,
+ "learning_rate": 3.420888071633508e-06,
+ "loss": 0.1139,
+ "step": 27037
+ },
+ {
+ "epoch": 73.67302452316076,
+ "grad_norm": 2.9633374214172363,
+ "learning_rate": 3.4202234944967062e-06,
+ "loss": 0.1319,
+ "step": 27038
+ },
+ {
+ "epoch": 73.6757493188011,
+ "grad_norm": 2.963578701019287,
+ "learning_rate": 3.4195589686029927e-06,
+ "loss": 0.0939,
+ "step": 27039
+ },
+ {
+ "epoch": 73.67847411444141,
+ "grad_norm": 2.4921133518218994,
+ "learning_rate": 3.418894493957545e-06,
+ "loss": 0.0971,
+ "step": 27040
+ },
+ {
+ "epoch": 73.68119891008175,
+ "grad_norm": 3.038226842880249,
+ "learning_rate": 3.418230070565535e-06,
+ "loss": 0.0568,
+ "step": 27041
+ },
+ {
+ "epoch": 73.68392370572207,
+ "grad_norm": 2.7386224269866943,
+ "learning_rate": 3.417565698432138e-06,
+ "loss": 0.0379,
+ "step": 27042
+ },
+ {
+ "epoch": 73.6866485013624,
+ "grad_norm": 2.886458158493042,
+ "learning_rate": 3.4169013775625235e-06,
+ "loss": 0.0497,
+ "step": 27043
+ },
+ {
+ "epoch": 73.68937329700273,
+ "grad_norm": 6.311750411987305,
+ "learning_rate": 3.416237107961873e-06,
+ "loss": 0.1695,
+ "step": 27044
+ },
+ {
+ "epoch": 73.69209809264305,
+ "grad_norm": 2.677231788635254,
+ "learning_rate": 3.415572889635356e-06,
+ "loss": 0.0498,
+ "step": 27045
+ },
+ {
+ "epoch": 73.69482288828338,
+ "grad_norm": 2.985056161880493,
+ "learning_rate": 3.414908722588145e-06,
+ "loss": 0.0837,
+ "step": 27046
+ },
+ {
+ "epoch": 73.6975476839237,
+ "grad_norm": 2.018767833709717,
+ "learning_rate": 3.41424460682541e-06,
+ "loss": 0.0817,
+ "step": 27047
+ },
+ {
+ "epoch": 73.70027247956403,
+ "grad_norm": 4.268989086151123,
+ "learning_rate": 3.413580542352328e-06,
+ "loss": 0.0722,
+ "step": 27048
+ },
+ {
+ "epoch": 73.70299727520435,
+ "grad_norm": 2.608004570007324,
+ "learning_rate": 3.412916529174071e-06,
+ "loss": 0.0453,
+ "step": 27049
+ },
+ {
+ "epoch": 73.70572207084469,
+ "grad_norm": 3.135223150253296,
+ "learning_rate": 3.4122525672958063e-06,
+ "loss": 0.193,
+ "step": 27050
+ },
+ {
+ "epoch": 73.70844686648502,
+ "grad_norm": 3.511472702026367,
+ "learning_rate": 3.411588656722704e-06,
+ "loss": 0.1021,
+ "step": 27051
+ },
+ {
+ "epoch": 73.71117166212534,
+ "grad_norm": 2.338649034500122,
+ "learning_rate": 3.4109247974599413e-06,
+ "loss": 0.0454,
+ "step": 27052
+ },
+ {
+ "epoch": 73.71389645776567,
+ "grad_norm": 2.984248399734497,
+ "learning_rate": 3.4102609895126824e-06,
+ "loss": 0.1779,
+ "step": 27053
+ },
+ {
+ "epoch": 73.71662125340599,
+ "grad_norm": 3.1859493255615234,
+ "learning_rate": 3.4095972328860973e-06,
+ "loss": 0.0532,
+ "step": 27054
+ },
+ {
+ "epoch": 73.71934604904632,
+ "grad_norm": 3.8830037117004395,
+ "learning_rate": 3.4089335275853585e-06,
+ "loss": 0.0443,
+ "step": 27055
+ },
+ {
+ "epoch": 73.72207084468666,
+ "grad_norm": 5.8974504470825195,
+ "learning_rate": 3.408269873615635e-06,
+ "loss": 0.1181,
+ "step": 27056
+ },
+ {
+ "epoch": 73.72479564032697,
+ "grad_norm": 3.8796021938323975,
+ "learning_rate": 3.407606270982089e-06,
+ "loss": 0.0687,
+ "step": 27057
+ },
+ {
+ "epoch": 73.7275204359673,
+ "grad_norm": 2.5573911666870117,
+ "learning_rate": 3.4069427196898973e-06,
+ "loss": 0.0217,
+ "step": 27058
+ },
+ {
+ "epoch": 73.73024523160763,
+ "grad_norm": 3.0410897731781006,
+ "learning_rate": 3.4062792197442197e-06,
+ "loss": 0.1233,
+ "step": 27059
+ },
+ {
+ "epoch": 73.73297002724796,
+ "grad_norm": 2.8239598274230957,
+ "learning_rate": 3.4056157711502304e-06,
+ "loss": 0.0787,
+ "step": 27060
+ },
+ {
+ "epoch": 73.73569482288828,
+ "grad_norm": 2.4992105960845947,
+ "learning_rate": 3.404952373913093e-06,
+ "loss": 0.1163,
+ "step": 27061
+ },
+ {
+ "epoch": 73.73841961852861,
+ "grad_norm": 3.2608139514923096,
+ "learning_rate": 3.4042890280379748e-06,
+ "loss": 0.1182,
+ "step": 27062
+ },
+ {
+ "epoch": 73.74114441416894,
+ "grad_norm": 2.4933953285217285,
+ "learning_rate": 3.403625733530038e-06,
+ "loss": 0.0467,
+ "step": 27063
+ },
+ {
+ "epoch": 73.74386920980926,
+ "grad_norm": 3.406280517578125,
+ "learning_rate": 3.402962490394456e-06,
+ "loss": 0.0725,
+ "step": 27064
+ },
+ {
+ "epoch": 73.7465940054496,
+ "grad_norm": 3.1564791202545166,
+ "learning_rate": 3.402299298636388e-06,
+ "loss": 0.0855,
+ "step": 27065
+ },
+ {
+ "epoch": 73.74931880108991,
+ "grad_norm": 3.5999932289123535,
+ "learning_rate": 3.401636158261001e-06,
+ "loss": 0.0436,
+ "step": 27066
+ },
+ {
+ "epoch": 73.75204359673025,
+ "grad_norm": 4.174797534942627,
+ "learning_rate": 3.4009730692734576e-06,
+ "loss": 0.0261,
+ "step": 27067
+ },
+ {
+ "epoch": 73.75476839237058,
+ "grad_norm": 2.6065797805786133,
+ "learning_rate": 3.4003100316789252e-06,
+ "loss": 0.0829,
+ "step": 27068
+ },
+ {
+ "epoch": 73.7574931880109,
+ "grad_norm": 3.2122576236724854,
+ "learning_rate": 3.399647045482567e-06,
+ "loss": 0.0468,
+ "step": 27069
+ },
+ {
+ "epoch": 73.76021798365123,
+ "grad_norm": 3.098024845123291,
+ "learning_rate": 3.398984110689544e-06,
+ "loss": 0.0522,
+ "step": 27070
+ },
+ {
+ "epoch": 73.76294277929155,
+ "grad_norm": 2.635446548461914,
+ "learning_rate": 3.398321227305018e-06,
+ "loss": 0.0716,
+ "step": 27071
+ },
+ {
+ "epoch": 73.76566757493188,
+ "grad_norm": 4.597242832183838,
+ "learning_rate": 3.3976583953341567e-06,
+ "loss": 0.0338,
+ "step": 27072
+ },
+ {
+ "epoch": 73.7683923705722,
+ "grad_norm": 2.7145698070526123,
+ "learning_rate": 3.396995614782119e-06,
+ "loss": 0.0444,
+ "step": 27073
+ },
+ {
+ "epoch": 73.77111716621253,
+ "grad_norm": 2.6254477500915527,
+ "learning_rate": 3.3963328856540633e-06,
+ "loss": 0.1218,
+ "step": 27074
+ },
+ {
+ "epoch": 73.77384196185287,
+ "grad_norm": 3.306751012802124,
+ "learning_rate": 3.3956702079551563e-06,
+ "loss": 0.0382,
+ "step": 27075
+ },
+ {
+ "epoch": 73.77656675749319,
+ "grad_norm": 3.099379062652588,
+ "learning_rate": 3.3950075816905593e-06,
+ "loss": 0.0506,
+ "step": 27076
+ },
+ {
+ "epoch": 73.77929155313352,
+ "grad_norm": 2.3745014667510986,
+ "learning_rate": 3.3943450068654303e-06,
+ "loss": 0.0286,
+ "step": 27077
+ },
+ {
+ "epoch": 73.78201634877384,
+ "grad_norm": 1.9496448040008545,
+ "learning_rate": 3.39368248348493e-06,
+ "loss": 0.0256,
+ "step": 27078
+ },
+ {
+ "epoch": 73.78474114441417,
+ "grad_norm": 2.7493364810943604,
+ "learning_rate": 3.3930200115542143e-06,
+ "loss": 0.1075,
+ "step": 27079
+ },
+ {
+ "epoch": 73.7874659400545,
+ "grad_norm": 3.410435676574707,
+ "learning_rate": 3.39235759107845e-06,
+ "loss": 0.1226,
+ "step": 27080
+ },
+ {
+ "epoch": 73.79019073569482,
+ "grad_norm": 1.8335320949554443,
+ "learning_rate": 3.391695222062793e-06,
+ "loss": 0.0644,
+ "step": 27081
+ },
+ {
+ "epoch": 73.79291553133515,
+ "grad_norm": 3.351548194885254,
+ "learning_rate": 3.391032904512399e-06,
+ "loss": 0.1441,
+ "step": 27082
+ },
+ {
+ "epoch": 73.79564032697547,
+ "grad_norm": 2.729797601699829,
+ "learning_rate": 3.3903706384324266e-06,
+ "loss": 0.0472,
+ "step": 27083
+ },
+ {
+ "epoch": 73.7983651226158,
+ "grad_norm": 3.343799114227295,
+ "learning_rate": 3.3897084238280366e-06,
+ "loss": 0.0427,
+ "step": 27084
+ },
+ {
+ "epoch": 73.80108991825612,
+ "grad_norm": 2.955580949783325,
+ "learning_rate": 3.389046260704385e-06,
+ "loss": 0.0447,
+ "step": 27085
+ },
+ {
+ "epoch": 73.80381471389646,
+ "grad_norm": 3.754732370376587,
+ "learning_rate": 3.3883841490666293e-06,
+ "loss": 0.1153,
+ "step": 27086
+ },
+ {
+ "epoch": 73.80653950953679,
+ "grad_norm": 6.577873706817627,
+ "learning_rate": 3.3877220889199213e-06,
+ "loss": 0.1361,
+ "step": 27087
+ },
+ {
+ "epoch": 73.80926430517711,
+ "grad_norm": 4.125805377960205,
+ "learning_rate": 3.387060080269423e-06,
+ "loss": 0.0805,
+ "step": 27088
+ },
+ {
+ "epoch": 73.81198910081744,
+ "grad_norm": 2.5797054767608643,
+ "learning_rate": 3.3863981231202892e-06,
+ "loss": 0.0347,
+ "step": 27089
+ },
+ {
+ "epoch": 73.81471389645776,
+ "grad_norm": 5.194318771362305,
+ "learning_rate": 3.385736217477674e-06,
+ "loss": 0.0739,
+ "step": 27090
+ },
+ {
+ "epoch": 73.8174386920981,
+ "grad_norm": 2.0635688304901123,
+ "learning_rate": 3.3850743633467286e-06,
+ "loss": 0.0432,
+ "step": 27091
+ },
+ {
+ "epoch": 73.82016348773843,
+ "grad_norm": 3.3392269611358643,
+ "learning_rate": 3.384412560732612e-06,
+ "loss": 0.1498,
+ "step": 27092
+ },
+ {
+ "epoch": 73.82288828337875,
+ "grad_norm": 3.1805264949798584,
+ "learning_rate": 3.383750809640479e-06,
+ "loss": 0.1225,
+ "step": 27093
+ },
+ {
+ "epoch": 73.82561307901908,
+ "grad_norm": 2.010472297668457,
+ "learning_rate": 3.3830891100754837e-06,
+ "loss": 0.1257,
+ "step": 27094
+ },
+ {
+ "epoch": 73.8283378746594,
+ "grad_norm": 3.9813106060028076,
+ "learning_rate": 3.382427462042772e-06,
+ "loss": 0.0586,
+ "step": 27095
+ },
+ {
+ "epoch": 73.83106267029973,
+ "grad_norm": 2.3568520545959473,
+ "learning_rate": 3.3817658655475074e-06,
+ "loss": 0.0579,
+ "step": 27096
+ },
+ {
+ "epoch": 73.83378746594005,
+ "grad_norm": 2.9525599479675293,
+ "learning_rate": 3.3811043205948366e-06,
+ "loss": 0.0617,
+ "step": 27097
+ },
+ {
+ "epoch": 73.83651226158038,
+ "grad_norm": 3.1131997108459473,
+ "learning_rate": 3.3804428271899127e-06,
+ "loss": 0.108,
+ "step": 27098
+ },
+ {
+ "epoch": 73.83923705722071,
+ "grad_norm": 2.993835926055908,
+ "learning_rate": 3.3797813853378827e-06,
+ "loss": 0.037,
+ "step": 27099
+ },
+ {
+ "epoch": 73.84196185286103,
+ "grad_norm": 2.7033605575561523,
+ "learning_rate": 3.3791199950439057e-06,
+ "loss": 0.1039,
+ "step": 27100
+ },
+ {
+ "epoch": 73.84468664850137,
+ "grad_norm": 2.3294596672058105,
+ "learning_rate": 3.3784586563131293e-06,
+ "loss": 0.0421,
+ "step": 27101
+ },
+ {
+ "epoch": 73.84741144414168,
+ "grad_norm": 14.998466491699219,
+ "learning_rate": 3.3777973691507047e-06,
+ "loss": 0.168,
+ "step": 27102
+ },
+ {
+ "epoch": 73.85013623978202,
+ "grad_norm": 2.1214687824249268,
+ "learning_rate": 3.3771361335617767e-06,
+ "loss": 0.0691,
+ "step": 27103
+ },
+ {
+ "epoch": 73.85286103542235,
+ "grad_norm": 2.2651479244232178,
+ "learning_rate": 3.376474949551504e-06,
+ "loss": 0.0391,
+ "step": 27104
+ },
+ {
+ "epoch": 73.85558583106267,
+ "grad_norm": 2.9230926036834717,
+ "learning_rate": 3.375813817125029e-06,
+ "loss": 0.0271,
+ "step": 27105
+ },
+ {
+ "epoch": 73.858310626703,
+ "grad_norm": 2.500877618789673,
+ "learning_rate": 3.3751527362875045e-06,
+ "loss": 0.0363,
+ "step": 27106
+ },
+ {
+ "epoch": 73.86103542234332,
+ "grad_norm": 4.30499267578125,
+ "learning_rate": 3.374491707044073e-06,
+ "loss": 0.0638,
+ "step": 27107
+ },
+ {
+ "epoch": 73.86376021798365,
+ "grad_norm": 3.7821364402770996,
+ "learning_rate": 3.3738307293998874e-06,
+ "loss": 0.0236,
+ "step": 27108
+ },
+ {
+ "epoch": 73.86648501362397,
+ "grad_norm": 2.388015031814575,
+ "learning_rate": 3.373169803360098e-06,
+ "loss": 0.037,
+ "step": 27109
+ },
+ {
+ "epoch": 73.8692098092643,
+ "grad_norm": 2.4646902084350586,
+ "learning_rate": 3.3725089289298483e-06,
+ "loss": 0.1281,
+ "step": 27110
+ },
+ {
+ "epoch": 73.87193460490464,
+ "grad_norm": 6.184477806091309,
+ "learning_rate": 3.371848106114287e-06,
+ "loss": 0.0604,
+ "step": 27111
+ },
+ {
+ "epoch": 73.87465940054496,
+ "grad_norm": 2.7357826232910156,
+ "learning_rate": 3.371187334918555e-06,
+ "loss": 0.0882,
+ "step": 27112
+ },
+ {
+ "epoch": 73.87738419618529,
+ "grad_norm": 3.2358157634735107,
+ "learning_rate": 3.370526615347807e-06,
+ "loss": 0.0877,
+ "step": 27113
+ },
+ {
+ "epoch": 73.88010899182561,
+ "grad_norm": 2.986412525177002,
+ "learning_rate": 3.369865947407184e-06,
+ "loss": 0.0349,
+ "step": 27114
+ },
+ {
+ "epoch": 73.88283378746594,
+ "grad_norm": 3.93294358253479,
+ "learning_rate": 3.36920533110183e-06,
+ "loss": 0.0363,
+ "step": 27115
+ },
+ {
+ "epoch": 73.88555858310627,
+ "grad_norm": 3.0998787879943848,
+ "learning_rate": 3.36854476643689e-06,
+ "loss": 0.0582,
+ "step": 27116
+ },
+ {
+ "epoch": 73.88828337874659,
+ "grad_norm": 12.342453956604004,
+ "learning_rate": 3.3678842534175126e-06,
+ "loss": 0.0829,
+ "step": 27117
+ },
+ {
+ "epoch": 73.89100817438693,
+ "grad_norm": 2.846457004547119,
+ "learning_rate": 3.367223792048839e-06,
+ "loss": 0.0673,
+ "step": 27118
+ },
+ {
+ "epoch": 73.89373297002724,
+ "grad_norm": 4.059755325317383,
+ "learning_rate": 3.36656338233601e-06,
+ "loss": 0.0643,
+ "step": 27119
+ },
+ {
+ "epoch": 73.89645776566758,
+ "grad_norm": 4.853326320648193,
+ "learning_rate": 3.365903024284175e-06,
+ "loss": 0.0854,
+ "step": 27120
+ },
+ {
+ "epoch": 73.8991825613079,
+ "grad_norm": 3.6625607013702393,
+ "learning_rate": 3.3652427178984748e-06,
+ "loss": 0.0558,
+ "step": 27121
+ },
+ {
+ "epoch": 73.90190735694823,
+ "grad_norm": 2.529726982116699,
+ "learning_rate": 3.3645824631840496e-06,
+ "loss": 0.1225,
+ "step": 27122
+ },
+ {
+ "epoch": 73.90463215258856,
+ "grad_norm": 2.7696170806884766,
+ "learning_rate": 3.36392226014604e-06,
+ "loss": 0.0381,
+ "step": 27123
+ },
+ {
+ "epoch": 73.90735694822888,
+ "grad_norm": 3.455655097961426,
+ "learning_rate": 3.363262108789592e-06,
+ "loss": 0.0453,
+ "step": 27124
+ },
+ {
+ "epoch": 73.91008174386921,
+ "grad_norm": 3.9635257720947266,
+ "learning_rate": 3.3626020091198443e-06,
+ "loss": 0.0882,
+ "step": 27125
+ },
+ {
+ "epoch": 73.91280653950953,
+ "grad_norm": 2.7167911529541016,
+ "learning_rate": 3.3619419611419403e-06,
+ "loss": 0.0357,
+ "step": 27126
+ },
+ {
+ "epoch": 73.91553133514986,
+ "grad_norm": 2.969172477722168,
+ "learning_rate": 3.3612819648610184e-06,
+ "loss": 0.0334,
+ "step": 27127
+ },
+ {
+ "epoch": 73.9182561307902,
+ "grad_norm": 3.717292547225952,
+ "learning_rate": 3.360622020282216e-06,
+ "loss": 0.0478,
+ "step": 27128
+ },
+ {
+ "epoch": 73.92098092643052,
+ "grad_norm": 4.75085973739624,
+ "learning_rate": 3.359962127410679e-06,
+ "loss": 0.046,
+ "step": 27129
+ },
+ {
+ "epoch": 73.92370572207085,
+ "grad_norm": 2.781536817550659,
+ "learning_rate": 3.3593022862515436e-06,
+ "loss": 0.041,
+ "step": 27130
+ },
+ {
+ "epoch": 73.92643051771117,
+ "grad_norm": 2.7844009399414062,
+ "learning_rate": 3.358642496809947e-06,
+ "loss": 0.0322,
+ "step": 27131
+ },
+ {
+ "epoch": 73.9291553133515,
+ "grad_norm": 3.279512882232666,
+ "learning_rate": 3.3579827590910274e-06,
+ "loss": 0.0511,
+ "step": 27132
+ },
+ {
+ "epoch": 73.93188010899182,
+ "grad_norm": 2.986257553100586,
+ "learning_rate": 3.3573230730999264e-06,
+ "loss": 0.092,
+ "step": 27133
+ },
+ {
+ "epoch": 73.93460490463215,
+ "grad_norm": 2.8432276248931885,
+ "learning_rate": 3.3566634388417798e-06,
+ "loss": 0.0986,
+ "step": 27134
+ },
+ {
+ "epoch": 73.93732970027249,
+ "grad_norm": 2.8598997592926025,
+ "learning_rate": 3.3560038563217244e-06,
+ "loss": 0.0708,
+ "step": 27135
+ },
+ {
+ "epoch": 73.9400544959128,
+ "grad_norm": 4.491633892059326,
+ "learning_rate": 3.355344325544894e-06,
+ "loss": 0.117,
+ "step": 27136
+ },
+ {
+ "epoch": 73.94277929155314,
+ "grad_norm": 3.8423354625701904,
+ "learning_rate": 3.354684846516432e-06,
+ "loss": 0.0404,
+ "step": 27137
+ },
+ {
+ "epoch": 73.94550408719346,
+ "grad_norm": 2.9154446125030518,
+ "learning_rate": 3.354025419241469e-06,
+ "loss": 0.0848,
+ "step": 27138
+ },
+ {
+ "epoch": 73.94822888283379,
+ "grad_norm": 4.642427921295166,
+ "learning_rate": 3.3533660437251438e-06,
+ "loss": 0.2037,
+ "step": 27139
+ },
+ {
+ "epoch": 73.95095367847412,
+ "grad_norm": 2.829484462738037,
+ "learning_rate": 3.352706719972585e-06,
+ "loss": 0.0841,
+ "step": 27140
+ },
+ {
+ "epoch": 73.95367847411444,
+ "grad_norm": 3.3154149055480957,
+ "learning_rate": 3.3520474479889365e-06,
+ "loss": 0.0518,
+ "step": 27141
+ },
+ {
+ "epoch": 73.95640326975477,
+ "grad_norm": 3.962322235107422,
+ "learning_rate": 3.3513882277793287e-06,
+ "loss": 0.0691,
+ "step": 27142
+ },
+ {
+ "epoch": 73.95912806539509,
+ "grad_norm": 2.514549732208252,
+ "learning_rate": 3.3507290593488916e-06,
+ "loss": 0.0885,
+ "step": 27143
+ },
+ {
+ "epoch": 73.96185286103542,
+ "grad_norm": 2.186782121658325,
+ "learning_rate": 3.350069942702763e-06,
+ "loss": 0.1245,
+ "step": 27144
+ },
+ {
+ "epoch": 73.96457765667574,
+ "grad_norm": 2.092263698577881,
+ "learning_rate": 3.349410877846079e-06,
+ "loss": 0.0359,
+ "step": 27145
+ },
+ {
+ "epoch": 73.96730245231608,
+ "grad_norm": 3.4706501960754395,
+ "learning_rate": 3.348751864783969e-06,
+ "loss": 0.1299,
+ "step": 27146
+ },
+ {
+ "epoch": 73.97002724795641,
+ "grad_norm": 2.9542319774627686,
+ "learning_rate": 3.3480929035215647e-06,
+ "loss": 0.1941,
+ "step": 27147
+ },
+ {
+ "epoch": 73.97275204359673,
+ "grad_norm": 3.0135879516601562,
+ "learning_rate": 3.3474339940639965e-06,
+ "loss": 0.0414,
+ "step": 27148
+ },
+ {
+ "epoch": 73.97547683923706,
+ "grad_norm": 3.0829758644104004,
+ "learning_rate": 3.3467751364164013e-06,
+ "loss": 0.0813,
+ "step": 27149
+ },
+ {
+ "epoch": 73.97820163487738,
+ "grad_norm": 2.953204870223999,
+ "learning_rate": 3.3461163305839074e-06,
+ "loss": 0.0436,
+ "step": 27150
+ },
+ {
+ "epoch": 73.98092643051771,
+ "grad_norm": 2.9540188312530518,
+ "learning_rate": 3.3454575765716446e-06,
+ "loss": 0.0531,
+ "step": 27151
+ },
+ {
+ "epoch": 73.98365122615803,
+ "grad_norm": 4.306671619415283,
+ "learning_rate": 3.3447988743847402e-06,
+ "loss": 0.1042,
+ "step": 27152
+ },
+ {
+ "epoch": 73.98637602179836,
+ "grad_norm": 2.209057331085205,
+ "learning_rate": 3.3441402240283325e-06,
+ "loss": 0.1337,
+ "step": 27153
+ },
+ {
+ "epoch": 73.9891008174387,
+ "grad_norm": 2.6406970024108887,
+ "learning_rate": 3.3434816255075464e-06,
+ "loss": 0.0736,
+ "step": 27154
+ },
+ {
+ "epoch": 73.99182561307902,
+ "grad_norm": 2.883601665496826,
+ "learning_rate": 3.3428230788275106e-06,
+ "loss": 0.0501,
+ "step": 27155
+ },
+ {
+ "epoch": 73.99455040871935,
+ "grad_norm": 2.4726920127868652,
+ "learning_rate": 3.3421645839933514e-06,
+ "loss": 0.0774,
+ "step": 27156
+ },
+ {
+ "epoch": 73.99727520435967,
+ "grad_norm": 2.8331825733184814,
+ "learning_rate": 3.3415061410102036e-06,
+ "loss": 0.1124,
+ "step": 27157
+ },
+ {
+ "epoch": 74.0,
+ "grad_norm": 5.509169101715088,
+ "learning_rate": 3.3408477498831917e-06,
+ "loss": 0.2008,
+ "step": 27158
+ },
+ {
+ "epoch": 74.00272479564033,
+ "grad_norm": 2.4617745876312256,
+ "learning_rate": 3.3401894106174427e-06,
+ "loss": 0.0408,
+ "step": 27159
+ },
+ {
+ "epoch": 74.00544959128065,
+ "grad_norm": 2.893810987472534,
+ "learning_rate": 3.3395311232180783e-06,
+ "loss": 0.0524,
+ "step": 27160
+ },
+ {
+ "epoch": 74.00817438692098,
+ "grad_norm": 2.2738749980926514,
+ "learning_rate": 3.3388728876902378e-06,
+ "loss": 0.0448,
+ "step": 27161
+ },
+ {
+ "epoch": 74.0108991825613,
+ "grad_norm": 2.066929340362549,
+ "learning_rate": 3.3382147040390402e-06,
+ "loss": 0.0301,
+ "step": 27162
+ },
+ {
+ "epoch": 74.01362397820164,
+ "grad_norm": 3.5921077728271484,
+ "learning_rate": 3.3375565722696123e-06,
+ "loss": 0.0858,
+ "step": 27163
+ },
+ {
+ "epoch": 74.01634877384195,
+ "grad_norm": 3.013620138168335,
+ "learning_rate": 3.336898492387076e-06,
+ "loss": 0.153,
+ "step": 27164
+ },
+ {
+ "epoch": 74.01907356948229,
+ "grad_norm": 2.7107770442962646,
+ "learning_rate": 3.3362404643965628e-06,
+ "loss": 0.0401,
+ "step": 27165
+ },
+ {
+ "epoch": 74.02179836512262,
+ "grad_norm": 2.825683355331421,
+ "learning_rate": 3.335582488303195e-06,
+ "loss": 0.0418,
+ "step": 27166
+ },
+ {
+ "epoch": 74.02452316076294,
+ "grad_norm": 3.1012535095214844,
+ "learning_rate": 3.3349245641120965e-06,
+ "loss": 0.0438,
+ "step": 27167
+ },
+ {
+ "epoch": 74.02724795640327,
+ "grad_norm": 2.699633836746216,
+ "learning_rate": 3.334266691828387e-06,
+ "loss": 0.0291,
+ "step": 27168
+ },
+ {
+ "epoch": 74.02997275204359,
+ "grad_norm": 2.9676756858825684,
+ "learning_rate": 3.3336088714571977e-06,
+ "loss": 0.1213,
+ "step": 27169
+ },
+ {
+ "epoch": 74.03269754768392,
+ "grad_norm": 5.069844722747803,
+ "learning_rate": 3.3329511030036476e-06,
+ "loss": 0.0487,
+ "step": 27170
+ },
+ {
+ "epoch": 74.03542234332426,
+ "grad_norm": 2.047196626663208,
+ "learning_rate": 3.33229338647286e-06,
+ "loss": 0.137,
+ "step": 27171
+ },
+ {
+ "epoch": 74.03814713896458,
+ "grad_norm": 2.680666208267212,
+ "learning_rate": 3.3316357218699535e-06,
+ "loss": 0.1425,
+ "step": 27172
+ },
+ {
+ "epoch": 74.04087193460491,
+ "grad_norm": 3.8923232555389404,
+ "learning_rate": 3.330978109200057e-06,
+ "loss": 0.1451,
+ "step": 27173
+ },
+ {
+ "epoch": 74.04359673024523,
+ "grad_norm": 2.742316961288452,
+ "learning_rate": 3.3303205484682878e-06,
+ "loss": 0.0578,
+ "step": 27174
+ },
+ {
+ "epoch": 74.04632152588556,
+ "grad_norm": 2.411404848098755,
+ "learning_rate": 3.329663039679768e-06,
+ "loss": 0.1779,
+ "step": 27175
+ },
+ {
+ "epoch": 74.04904632152588,
+ "grad_norm": 3.542120933532715,
+ "learning_rate": 3.329005582839614e-06,
+ "loss": 0.0407,
+ "step": 27176
+ },
+ {
+ "epoch": 74.05177111716621,
+ "grad_norm": 2.5981528759002686,
+ "learning_rate": 3.3283481779529503e-06,
+ "loss": 0.0433,
+ "step": 27177
+ },
+ {
+ "epoch": 74.05449591280654,
+ "grad_norm": 3.1827433109283447,
+ "learning_rate": 3.3276908250249e-06,
+ "loss": 0.0744,
+ "step": 27178
+ },
+ {
+ "epoch": 74.05722070844686,
+ "grad_norm": 2.6564531326293945,
+ "learning_rate": 3.327033524060578e-06,
+ "loss": 0.0686,
+ "step": 27179
+ },
+ {
+ "epoch": 74.0599455040872,
+ "grad_norm": 2.9468657970428467,
+ "learning_rate": 3.3263762750651043e-06,
+ "loss": 0.0564,
+ "step": 27180
+ },
+ {
+ "epoch": 74.06267029972751,
+ "grad_norm": 3.285318613052368,
+ "learning_rate": 3.325719078043593e-06,
+ "loss": 0.0664,
+ "step": 27181
+ },
+ {
+ "epoch": 74.06539509536785,
+ "grad_norm": 1.8797310590744019,
+ "learning_rate": 3.3250619330011715e-06,
+ "loss": 0.0299,
+ "step": 27182
+ },
+ {
+ "epoch": 74.06811989100818,
+ "grad_norm": 2.1970951557159424,
+ "learning_rate": 3.324404839942953e-06,
+ "loss": 0.0534,
+ "step": 27183
+ },
+ {
+ "epoch": 74.0708446866485,
+ "grad_norm": 2.397085189819336,
+ "learning_rate": 3.3237477988740508e-06,
+ "loss": 0.0339,
+ "step": 27184
+ },
+ {
+ "epoch": 74.07356948228883,
+ "grad_norm": 3.1384451389312744,
+ "learning_rate": 3.3230908097995885e-06,
+ "loss": 0.0392,
+ "step": 27185
+ },
+ {
+ "epoch": 74.07629427792915,
+ "grad_norm": 2.7506701946258545,
+ "learning_rate": 3.322433872724681e-06,
+ "loss": 0.0712,
+ "step": 27186
+ },
+ {
+ "epoch": 74.07901907356948,
+ "grad_norm": 2.195390224456787,
+ "learning_rate": 3.3217769876544437e-06,
+ "loss": 0.0418,
+ "step": 27187
+ },
+ {
+ "epoch": 74.0817438692098,
+ "grad_norm": 2.8584413528442383,
+ "learning_rate": 3.3211201545939885e-06,
+ "loss": 0.0401,
+ "step": 27188
+ },
+ {
+ "epoch": 74.08446866485014,
+ "grad_norm": 2.165010690689087,
+ "learning_rate": 3.320463373548438e-06,
+ "loss": 0.0532,
+ "step": 27189
+ },
+ {
+ "epoch": 74.08719346049047,
+ "grad_norm": 2.679511070251465,
+ "learning_rate": 3.319806644522904e-06,
+ "loss": 0.04,
+ "step": 27190
+ },
+ {
+ "epoch": 74.08991825613079,
+ "grad_norm": 3.2109289169311523,
+ "learning_rate": 3.3191499675225e-06,
+ "loss": 0.0686,
+ "step": 27191
+ },
+ {
+ "epoch": 74.09264305177112,
+ "grad_norm": 3.273088216781616,
+ "learning_rate": 3.318493342552339e-06,
+ "loss": 0.0536,
+ "step": 27192
+ },
+ {
+ "epoch": 74.09536784741144,
+ "grad_norm": 2.2636821269989014,
+ "learning_rate": 3.3178367696175396e-06,
+ "loss": 0.08,
+ "step": 27193
+ },
+ {
+ "epoch": 74.09809264305177,
+ "grad_norm": 1.867721438407898,
+ "learning_rate": 3.3171802487232087e-06,
+ "loss": 0.1226,
+ "step": 27194
+ },
+ {
+ "epoch": 74.1008174386921,
+ "grad_norm": 2.4035680294036865,
+ "learning_rate": 3.3165237798744665e-06,
+ "loss": 0.0996,
+ "step": 27195
+ },
+ {
+ "epoch": 74.10354223433242,
+ "grad_norm": 2.8854174613952637,
+ "learning_rate": 3.3158673630764216e-06,
+ "loss": 0.0377,
+ "step": 27196
+ },
+ {
+ "epoch": 74.10626702997276,
+ "grad_norm": 2.278005838394165,
+ "learning_rate": 3.315210998334184e-06,
+ "loss": 0.0347,
+ "step": 27197
+ },
+ {
+ "epoch": 74.10899182561307,
+ "grad_norm": 3.0782861709594727,
+ "learning_rate": 3.314554685652871e-06,
+ "loss": 0.0407,
+ "step": 27198
+ },
+ {
+ "epoch": 74.11171662125341,
+ "grad_norm": 4.853907585144043,
+ "learning_rate": 3.3138984250375903e-06,
+ "loss": 0.0712,
+ "step": 27199
+ },
+ {
+ "epoch": 74.11444141689373,
+ "grad_norm": 3.5312323570251465,
+ "learning_rate": 3.313242216493454e-06,
+ "loss": 0.0998,
+ "step": 27200
+ },
+ {
+ "epoch": 74.11716621253406,
+ "grad_norm": 2.485520601272583,
+ "learning_rate": 3.3125860600255686e-06,
+ "loss": 0.0353,
+ "step": 27201
+ },
+ {
+ "epoch": 74.11989100817439,
+ "grad_norm": 4.5134172439575195,
+ "learning_rate": 3.3119299556390516e-06,
+ "loss": 0.0634,
+ "step": 27202
+ },
+ {
+ "epoch": 74.12261580381471,
+ "grad_norm": 1.728415608406067,
+ "learning_rate": 3.3112739033390083e-06,
+ "loss": 0.0255,
+ "step": 27203
+ },
+ {
+ "epoch": 74.12534059945504,
+ "grad_norm": 4.402983665466309,
+ "learning_rate": 3.3106179031305497e-06,
+ "loss": 0.0326,
+ "step": 27204
+ },
+ {
+ "epoch": 74.12806539509536,
+ "grad_norm": 2.5725178718566895,
+ "learning_rate": 3.309961955018779e-06,
+ "loss": 0.1255,
+ "step": 27205
+ },
+ {
+ "epoch": 74.1307901907357,
+ "grad_norm": 2.395601511001587,
+ "learning_rate": 3.3093060590088132e-06,
+ "loss": 0.1171,
+ "step": 27206
+ },
+ {
+ "epoch": 74.13351498637603,
+ "grad_norm": 3.410938024520874,
+ "learning_rate": 3.3086502151057564e-06,
+ "loss": 0.0776,
+ "step": 27207
+ },
+ {
+ "epoch": 74.13623978201635,
+ "grad_norm": 2.5566298961639404,
+ "learning_rate": 3.3079944233147123e-06,
+ "loss": 0.06,
+ "step": 27208
+ },
+ {
+ "epoch": 74.13896457765668,
+ "grad_norm": 3.42567777633667,
+ "learning_rate": 3.307338683640796e-06,
+ "loss": 0.1214,
+ "step": 27209
+ },
+ {
+ "epoch": 74.141689373297,
+ "grad_norm": 3.425590991973877,
+ "learning_rate": 3.306682996089111e-06,
+ "loss": 0.093,
+ "step": 27210
+ },
+ {
+ "epoch": 74.14441416893733,
+ "grad_norm": 3.416318416595459,
+ "learning_rate": 3.30602736066476e-06,
+ "loss": 0.1777,
+ "step": 27211
+ },
+ {
+ "epoch": 74.14713896457765,
+ "grad_norm": 3.309035062789917,
+ "learning_rate": 3.3053717773728556e-06,
+ "loss": 0.2189,
+ "step": 27212
+ },
+ {
+ "epoch": 74.14986376021798,
+ "grad_norm": 3.4633026123046875,
+ "learning_rate": 3.3047162462184965e-06,
+ "loss": 0.0384,
+ "step": 27213
+ },
+ {
+ "epoch": 74.15258855585832,
+ "grad_norm": 2.273061990737915,
+ "learning_rate": 3.304060767206796e-06,
+ "loss": 0.0318,
+ "step": 27214
+ },
+ {
+ "epoch": 74.15531335149863,
+ "grad_norm": 4.014997482299805,
+ "learning_rate": 3.3034053403428547e-06,
+ "loss": 0.0629,
+ "step": 27215
+ },
+ {
+ "epoch": 74.15803814713897,
+ "grad_norm": 9.901772499084473,
+ "learning_rate": 3.3027499656317773e-06,
+ "loss": 0.1588,
+ "step": 27216
+ },
+ {
+ "epoch": 74.16076294277929,
+ "grad_norm": 2.357943058013916,
+ "learning_rate": 3.302094643078664e-06,
+ "loss": 0.0382,
+ "step": 27217
+ },
+ {
+ "epoch": 74.16348773841962,
+ "grad_norm": 3.563890218734741,
+ "learning_rate": 3.301439372688624e-06,
+ "loss": 0.165,
+ "step": 27218
+ },
+ {
+ "epoch": 74.16621253405995,
+ "grad_norm": 1.481551170349121,
+ "learning_rate": 3.3007841544667606e-06,
+ "loss": 0.0162,
+ "step": 27219
+ },
+ {
+ "epoch": 74.16893732970027,
+ "grad_norm": 1.9927772283554077,
+ "learning_rate": 3.300128988418173e-06,
+ "loss": 0.0314,
+ "step": 27220
+ },
+ {
+ "epoch": 74.1716621253406,
+ "grad_norm": 2.6529672145843506,
+ "learning_rate": 3.2994738745479628e-06,
+ "loss": 0.0431,
+ "step": 27221
+ },
+ {
+ "epoch": 74.17438692098092,
+ "grad_norm": 3.6385836601257324,
+ "learning_rate": 3.2988188128612374e-06,
+ "loss": 0.0459,
+ "step": 27222
+ },
+ {
+ "epoch": 74.17711171662125,
+ "grad_norm": 2.179558753967285,
+ "learning_rate": 3.2981638033630956e-06,
+ "loss": 0.0325,
+ "step": 27223
+ },
+ {
+ "epoch": 74.17983651226157,
+ "grad_norm": 3.6399078369140625,
+ "learning_rate": 3.297508846058639e-06,
+ "loss": 0.0885,
+ "step": 27224
+ },
+ {
+ "epoch": 74.1825613079019,
+ "grad_norm": 3.046405076980591,
+ "learning_rate": 3.2968539409529632e-06,
+ "loss": 0.0281,
+ "step": 27225
+ },
+ {
+ "epoch": 74.18528610354224,
+ "grad_norm": 3.1456198692321777,
+ "learning_rate": 3.2961990880511773e-06,
+ "loss": 0.0977,
+ "step": 27226
+ },
+ {
+ "epoch": 74.18801089918256,
+ "grad_norm": 2.7781946659088135,
+ "learning_rate": 3.2955442873583765e-06,
+ "loss": 0.0759,
+ "step": 27227
+ },
+ {
+ "epoch": 74.19073569482289,
+ "grad_norm": 2.615128993988037,
+ "learning_rate": 3.2948895388796585e-06,
+ "loss": 0.0274,
+ "step": 27228
+ },
+ {
+ "epoch": 74.19346049046321,
+ "grad_norm": 4.8917083740234375,
+ "learning_rate": 3.2942348426201244e-06,
+ "loss": 0.0238,
+ "step": 27229
+ },
+ {
+ "epoch": 74.19618528610354,
+ "grad_norm": 2.16357421875,
+ "learning_rate": 3.293580198584877e-06,
+ "loss": 0.0294,
+ "step": 27230
+ },
+ {
+ "epoch": 74.19891008174388,
+ "grad_norm": 2.5870048999786377,
+ "learning_rate": 3.2929256067790117e-06,
+ "loss": 0.0522,
+ "step": 27231
+ },
+ {
+ "epoch": 74.2016348773842,
+ "grad_norm": 2.3557868003845215,
+ "learning_rate": 3.292271067207625e-06,
+ "loss": 0.2176,
+ "step": 27232
+ },
+ {
+ "epoch": 74.20435967302453,
+ "grad_norm": 3.6504061222076416,
+ "learning_rate": 3.2916165798758127e-06,
+ "loss": 0.1255,
+ "step": 27233
+ },
+ {
+ "epoch": 74.20708446866485,
+ "grad_norm": 2.0222890377044678,
+ "learning_rate": 3.2909621447886773e-06,
+ "loss": 0.0349,
+ "step": 27234
+ },
+ {
+ "epoch": 74.20980926430518,
+ "grad_norm": 3.4126057624816895,
+ "learning_rate": 3.2903077619513135e-06,
+ "loss": 0.0624,
+ "step": 27235
+ },
+ {
+ "epoch": 74.2125340599455,
+ "grad_norm": 3.1359829902648926,
+ "learning_rate": 3.2896534313688165e-06,
+ "loss": 0.0958,
+ "step": 27236
+ },
+ {
+ "epoch": 74.21525885558583,
+ "grad_norm": 3.701328754425049,
+ "learning_rate": 3.2889991530462793e-06,
+ "loss": 0.0965,
+ "step": 27237
+ },
+ {
+ "epoch": 74.21798365122616,
+ "grad_norm": 2.533704996109009,
+ "learning_rate": 3.2883449269888034e-06,
+ "loss": 0.0507,
+ "step": 27238
+ },
+ {
+ "epoch": 74.22070844686648,
+ "grad_norm": 2.3656082153320312,
+ "learning_rate": 3.287690753201482e-06,
+ "loss": 0.0458,
+ "step": 27239
+ },
+ {
+ "epoch": 74.22343324250681,
+ "grad_norm": 2.510498523712158,
+ "learning_rate": 3.2870366316894086e-06,
+ "loss": 0.0416,
+ "step": 27240
+ },
+ {
+ "epoch": 74.22615803814713,
+ "grad_norm": 2.279121160507202,
+ "learning_rate": 3.2863825624576752e-06,
+ "loss": 0.1041,
+ "step": 27241
+ },
+ {
+ "epoch": 74.22888283378747,
+ "grad_norm": 2.8952863216400146,
+ "learning_rate": 3.2857285455113807e-06,
+ "loss": 0.1,
+ "step": 27242
+ },
+ {
+ "epoch": 74.2316076294278,
+ "grad_norm": 2.5696914196014404,
+ "learning_rate": 3.2850745808556174e-06,
+ "loss": 0.0292,
+ "step": 27243
+ },
+ {
+ "epoch": 74.23433242506812,
+ "grad_norm": 2.5835812091827393,
+ "learning_rate": 3.284420668495476e-06,
+ "loss": 0.0625,
+ "step": 27244
+ },
+ {
+ "epoch": 74.23705722070845,
+ "grad_norm": 3.5429649353027344,
+ "learning_rate": 3.2837668084360476e-06,
+ "loss": 0.0728,
+ "step": 27245
+ },
+ {
+ "epoch": 74.23978201634877,
+ "grad_norm": 2.635214328765869,
+ "learning_rate": 3.2831130006824274e-06,
+ "loss": 0.0596,
+ "step": 27246
+ },
+ {
+ "epoch": 74.2425068119891,
+ "grad_norm": 3.1904172897338867,
+ "learning_rate": 3.2824592452397097e-06,
+ "loss": 0.0781,
+ "step": 27247
+ },
+ {
+ "epoch": 74.24523160762942,
+ "grad_norm": 2.6193346977233887,
+ "learning_rate": 3.2818055421129837e-06,
+ "loss": 0.0857,
+ "step": 27248
+ },
+ {
+ "epoch": 74.24795640326975,
+ "grad_norm": 2.1958374977111816,
+ "learning_rate": 3.281151891307336e-06,
+ "loss": 0.0554,
+ "step": 27249
+ },
+ {
+ "epoch": 74.25068119891009,
+ "grad_norm": 2.411705732345581,
+ "learning_rate": 3.280498292827864e-06,
+ "loss": 0.0324,
+ "step": 27250
+ },
+ {
+ "epoch": 74.2534059945504,
+ "grad_norm": 2.6255908012390137,
+ "learning_rate": 3.2798447466796557e-06,
+ "loss": 0.0736,
+ "step": 27251
+ },
+ {
+ "epoch": 74.25613079019074,
+ "grad_norm": 3.314282178878784,
+ "learning_rate": 3.2791912528678004e-06,
+ "loss": 0.1105,
+ "step": 27252
+ },
+ {
+ "epoch": 74.25885558583106,
+ "grad_norm": 2.7014825344085693,
+ "learning_rate": 3.2785378113973843e-06,
+ "loss": 0.0394,
+ "step": 27253
+ },
+ {
+ "epoch": 74.26158038147139,
+ "grad_norm": 2.0100409984588623,
+ "learning_rate": 3.277884422273502e-06,
+ "loss": 0.0471,
+ "step": 27254
+ },
+ {
+ "epoch": 74.26430517711172,
+ "grad_norm": 3.3638100624084473,
+ "learning_rate": 3.277231085501239e-06,
+ "loss": 0.0718,
+ "step": 27255
+ },
+ {
+ "epoch": 74.26702997275204,
+ "grad_norm": 2.4385015964508057,
+ "learning_rate": 3.2765778010856854e-06,
+ "loss": 0.0228,
+ "step": 27256
+ },
+ {
+ "epoch": 74.26975476839237,
+ "grad_norm": 2.5477700233459473,
+ "learning_rate": 3.275924569031923e-06,
+ "loss": 0.0393,
+ "step": 27257
+ },
+ {
+ "epoch": 74.2724795640327,
+ "grad_norm": 2.120997190475464,
+ "learning_rate": 3.275271389345047e-06,
+ "loss": 0.0376,
+ "step": 27258
+ },
+ {
+ "epoch": 74.27520435967303,
+ "grad_norm": 2.6655328273773193,
+ "learning_rate": 3.2746182620301416e-06,
+ "loss": 0.172,
+ "step": 27259
+ },
+ {
+ "epoch": 74.27792915531334,
+ "grad_norm": 2.456432580947876,
+ "learning_rate": 3.2739651870922926e-06,
+ "loss": 0.0377,
+ "step": 27260
+ },
+ {
+ "epoch": 74.28065395095368,
+ "grad_norm": 2.6079587936401367,
+ "learning_rate": 3.273312164536583e-06,
+ "loss": 0.0541,
+ "step": 27261
+ },
+ {
+ "epoch": 74.28337874659401,
+ "grad_norm": 3.5972044467926025,
+ "learning_rate": 3.272659194368104e-06,
+ "loss": 0.0997,
+ "step": 27262
+ },
+ {
+ "epoch": 74.28610354223433,
+ "grad_norm": 2.5031604766845703,
+ "learning_rate": 3.2720062765919368e-06,
+ "loss": 0.0635,
+ "step": 27263
+ },
+ {
+ "epoch": 74.28882833787466,
+ "grad_norm": 2.1376121044158936,
+ "learning_rate": 3.2713534112131705e-06,
+ "loss": 0.0237,
+ "step": 27264
+ },
+ {
+ "epoch": 74.29155313351498,
+ "grad_norm": 3.359450578689575,
+ "learning_rate": 3.2707005982368877e-06,
+ "loss": 0.1266,
+ "step": 27265
+ },
+ {
+ "epoch": 74.29427792915531,
+ "grad_norm": 2.4304559230804443,
+ "learning_rate": 3.2700478376681686e-06,
+ "loss": 0.0349,
+ "step": 27266
+ },
+ {
+ "epoch": 74.29700272479565,
+ "grad_norm": 2.10734224319458,
+ "learning_rate": 3.269395129512104e-06,
+ "loss": 0.0816,
+ "step": 27267
+ },
+ {
+ "epoch": 74.29972752043597,
+ "grad_norm": 2.9545388221740723,
+ "learning_rate": 3.268742473773774e-06,
+ "loss": 0.0568,
+ "step": 27268
+ },
+ {
+ "epoch": 74.3024523160763,
+ "grad_norm": 2.317762613296509,
+ "learning_rate": 3.2680898704582562e-06,
+ "loss": 0.0915,
+ "step": 27269
+ },
+ {
+ "epoch": 74.30517711171662,
+ "grad_norm": 2.382387638092041,
+ "learning_rate": 3.267437319570642e-06,
+ "loss": 0.1144,
+ "step": 27270
+ },
+ {
+ "epoch": 74.30790190735695,
+ "grad_norm": 3.6725282669067383,
+ "learning_rate": 3.2667848211160093e-06,
+ "loss": 0.0893,
+ "step": 27271
+ },
+ {
+ "epoch": 74.31062670299727,
+ "grad_norm": 4.105287551879883,
+ "learning_rate": 3.26613237509944e-06,
+ "loss": 0.0815,
+ "step": 27272
+ },
+ {
+ "epoch": 74.3133514986376,
+ "grad_norm": 12.403950691223145,
+ "learning_rate": 3.265479981526011e-06,
+ "loss": 0.11,
+ "step": 27273
+ },
+ {
+ "epoch": 74.31607629427793,
+ "grad_norm": 2.5986974239349365,
+ "learning_rate": 3.2648276404008104e-06,
+ "loss": 0.0958,
+ "step": 27274
+ },
+ {
+ "epoch": 74.31880108991825,
+ "grad_norm": 3.031984806060791,
+ "learning_rate": 3.2641753517289164e-06,
+ "loss": 0.0336,
+ "step": 27275
+ },
+ {
+ "epoch": 74.32152588555859,
+ "grad_norm": 2.4086272716522217,
+ "learning_rate": 3.2635231155154067e-06,
+ "loss": 0.0877,
+ "step": 27276
+ },
+ {
+ "epoch": 74.3242506811989,
+ "grad_norm": 4.058390140533447,
+ "learning_rate": 3.2628709317653593e-06,
+ "loss": 0.0777,
+ "step": 27277
+ },
+ {
+ "epoch": 74.32697547683924,
+ "grad_norm": 3.4180104732513428,
+ "learning_rate": 3.2622188004838594e-06,
+ "loss": 0.0354,
+ "step": 27278
+ },
+ {
+ "epoch": 74.32970027247957,
+ "grad_norm": 3.0404999256134033,
+ "learning_rate": 3.2615667216759837e-06,
+ "loss": 0.0519,
+ "step": 27279
+ },
+ {
+ "epoch": 74.33242506811989,
+ "grad_norm": 3.8097989559173584,
+ "learning_rate": 3.260914695346805e-06,
+ "loss": 0.0366,
+ "step": 27280
+ },
+ {
+ "epoch": 74.33514986376022,
+ "grad_norm": 2.1361637115478516,
+ "learning_rate": 3.2602627215014093e-06,
+ "loss": 0.0604,
+ "step": 27281
+ },
+ {
+ "epoch": 74.33787465940054,
+ "grad_norm": 3.0930285453796387,
+ "learning_rate": 3.259610800144868e-06,
+ "loss": 0.0418,
+ "step": 27282
+ },
+ {
+ "epoch": 74.34059945504087,
+ "grad_norm": 3.5604248046875,
+ "learning_rate": 3.2589589312822634e-06,
+ "loss": 0.2219,
+ "step": 27283
+ },
+ {
+ "epoch": 74.34332425068119,
+ "grad_norm": 3.0186381340026855,
+ "learning_rate": 3.2583071149186695e-06,
+ "loss": 0.1285,
+ "step": 27284
+ },
+ {
+ "epoch": 74.34604904632153,
+ "grad_norm": 4.4371466636657715,
+ "learning_rate": 3.2576553510591636e-06,
+ "loss": 0.1368,
+ "step": 27285
+ },
+ {
+ "epoch": 74.34877384196186,
+ "grad_norm": 2.5523457527160645,
+ "learning_rate": 3.257003639708818e-06,
+ "loss": 0.1301,
+ "step": 27286
+ },
+ {
+ "epoch": 74.35149863760218,
+ "grad_norm": 4.00749397277832,
+ "learning_rate": 3.256351980872713e-06,
+ "loss": 0.0779,
+ "step": 27287
+ },
+ {
+ "epoch": 74.35422343324251,
+ "grad_norm": 2.7158422470092773,
+ "learning_rate": 3.2557003745559224e-06,
+ "loss": 0.0338,
+ "step": 27288
+ },
+ {
+ "epoch": 74.35694822888283,
+ "grad_norm": 2.823284149169922,
+ "learning_rate": 3.25504882076352e-06,
+ "loss": 0.0979,
+ "step": 27289
+ },
+ {
+ "epoch": 74.35967302452316,
+ "grad_norm": 4.403693199157715,
+ "learning_rate": 3.2543973195005764e-06,
+ "loss": 0.0682,
+ "step": 27290
+ },
+ {
+ "epoch": 74.3623978201635,
+ "grad_norm": 2.1391823291778564,
+ "learning_rate": 3.2537458707721735e-06,
+ "loss": 0.0244,
+ "step": 27291
+ },
+ {
+ "epoch": 74.36512261580381,
+ "grad_norm": 4.027947902679443,
+ "learning_rate": 3.2530944745833803e-06,
+ "loss": 0.1552,
+ "step": 27292
+ },
+ {
+ "epoch": 74.36784741144415,
+ "grad_norm": 2.293487071990967,
+ "learning_rate": 3.2524431309392667e-06,
+ "loss": 0.0498,
+ "step": 27293
+ },
+ {
+ "epoch": 74.37057220708446,
+ "grad_norm": 2.6919054985046387,
+ "learning_rate": 3.2517918398449133e-06,
+ "loss": 0.0395,
+ "step": 27294
+ },
+ {
+ "epoch": 74.3732970027248,
+ "grad_norm": 1.9174407720565796,
+ "learning_rate": 3.251140601305387e-06,
+ "loss": 0.0276,
+ "step": 27295
+ },
+ {
+ "epoch": 74.37602179836512,
+ "grad_norm": 2.551849603652954,
+ "learning_rate": 3.2504894153257603e-06,
+ "loss": 0.1889,
+ "step": 27296
+ },
+ {
+ "epoch": 74.37874659400545,
+ "grad_norm": 3.521094799041748,
+ "learning_rate": 3.2498382819111017e-06,
+ "loss": 0.0504,
+ "step": 27297
+ },
+ {
+ "epoch": 74.38147138964578,
+ "grad_norm": 3.04475998878479,
+ "learning_rate": 3.2491872010664847e-06,
+ "loss": 0.2605,
+ "step": 27298
+ },
+ {
+ "epoch": 74.3841961852861,
+ "grad_norm": 2.8988218307495117,
+ "learning_rate": 3.2485361727969846e-06,
+ "loss": 0.0897,
+ "step": 27299
+ },
+ {
+ "epoch": 74.38692098092643,
+ "grad_norm": 3.369778871536255,
+ "learning_rate": 3.2478851971076675e-06,
+ "loss": 0.1045,
+ "step": 27300
+ },
+ {
+ "epoch": 74.38964577656675,
+ "grad_norm": 3.181368827819824,
+ "learning_rate": 3.2472342740036033e-06,
+ "loss": 0.0827,
+ "step": 27301
+ },
+ {
+ "epoch": 74.39237057220708,
+ "grad_norm": 1.9666175842285156,
+ "learning_rate": 3.246583403489857e-06,
+ "loss": 0.0548,
+ "step": 27302
+ },
+ {
+ "epoch": 74.39509536784742,
+ "grad_norm": 3.336275100708008,
+ "learning_rate": 3.2459325855715063e-06,
+ "loss": 0.0313,
+ "step": 27303
+ },
+ {
+ "epoch": 74.39782016348774,
+ "grad_norm": 2.77612566947937,
+ "learning_rate": 3.245281820253614e-06,
+ "loss": 0.0394,
+ "step": 27304
+ },
+ {
+ "epoch": 74.40054495912807,
+ "grad_norm": 2.6531143188476562,
+ "learning_rate": 3.2446311075412508e-06,
+ "loss": 0.068,
+ "step": 27305
+ },
+ {
+ "epoch": 74.40326975476839,
+ "grad_norm": 3.5499050617218018,
+ "learning_rate": 3.243980447439479e-06,
+ "loss": 0.068,
+ "step": 27306
+ },
+ {
+ "epoch": 74.40599455040872,
+ "grad_norm": 3.847198247909546,
+ "learning_rate": 3.243329839953373e-06,
+ "loss": 0.0618,
+ "step": 27307
+ },
+ {
+ "epoch": 74.40871934604904,
+ "grad_norm": 2.1634271144866943,
+ "learning_rate": 3.2426792850879974e-06,
+ "loss": 0.0325,
+ "step": 27308
+ },
+ {
+ "epoch": 74.41144414168937,
+ "grad_norm": 2.917853355407715,
+ "learning_rate": 3.2420287828484175e-06,
+ "loss": 0.055,
+ "step": 27309
+ },
+ {
+ "epoch": 74.4141689373297,
+ "grad_norm": 3.1917197704315186,
+ "learning_rate": 3.2413783332396977e-06,
+ "loss": 0.1354,
+ "step": 27310
+ },
+ {
+ "epoch": 74.41689373297002,
+ "grad_norm": 4.102021217346191,
+ "learning_rate": 3.240727936266909e-06,
+ "loss": 0.0614,
+ "step": 27311
+ },
+ {
+ "epoch": 74.41961852861036,
+ "grad_norm": 2.5872745513916016,
+ "learning_rate": 3.2400775919351123e-06,
+ "loss": 0.0473,
+ "step": 27312
+ },
+ {
+ "epoch": 74.42234332425068,
+ "grad_norm": 3.0297534465789795,
+ "learning_rate": 3.2394273002493747e-06,
+ "loss": 0.092,
+ "step": 27313
+ },
+ {
+ "epoch": 74.42506811989101,
+ "grad_norm": 2.410175323486328,
+ "learning_rate": 3.2387770612147562e-06,
+ "loss": 0.0258,
+ "step": 27314
+ },
+ {
+ "epoch": 74.42779291553134,
+ "grad_norm": 2.3826498985290527,
+ "learning_rate": 3.238126874836325e-06,
+ "loss": 0.0595,
+ "step": 27315
+ },
+ {
+ "epoch": 74.43051771117166,
+ "grad_norm": 2.6610512733459473,
+ "learning_rate": 3.2374767411191468e-06,
+ "loss": 0.0374,
+ "step": 27316
+ },
+ {
+ "epoch": 74.433242506812,
+ "grad_norm": 2.922426223754883,
+ "learning_rate": 3.2368266600682817e-06,
+ "loss": 0.0337,
+ "step": 27317
+ },
+ {
+ "epoch": 74.43596730245231,
+ "grad_norm": 2.367076873779297,
+ "learning_rate": 3.23617663168879e-06,
+ "loss": 0.0326,
+ "step": 27318
+ },
+ {
+ "epoch": 74.43869209809264,
+ "grad_norm": 3.080042600631714,
+ "learning_rate": 3.23552665598574e-06,
+ "loss": 0.0982,
+ "step": 27319
+ },
+ {
+ "epoch": 74.44141689373296,
+ "grad_norm": 2.814044952392578,
+ "learning_rate": 3.2348767329641908e-06,
+ "loss": 0.096,
+ "step": 27320
+ },
+ {
+ "epoch": 74.4441416893733,
+ "grad_norm": 3.0666403770446777,
+ "learning_rate": 3.2342268626292037e-06,
+ "loss": 0.1051,
+ "step": 27321
+ },
+ {
+ "epoch": 74.44686648501363,
+ "grad_norm": 2.8949360847473145,
+ "learning_rate": 3.233577044985837e-06,
+ "loss": 0.0424,
+ "step": 27322
+ },
+ {
+ "epoch": 74.44959128065395,
+ "grad_norm": 3.484898090362549,
+ "learning_rate": 3.2329272800391586e-06,
+ "loss": 0.0908,
+ "step": 27323
+ },
+ {
+ "epoch": 74.45231607629428,
+ "grad_norm": 3.0054502487182617,
+ "learning_rate": 3.232277567794223e-06,
+ "loss": 0.0566,
+ "step": 27324
+ },
+ {
+ "epoch": 74.4550408719346,
+ "grad_norm": 3.1153807640075684,
+ "learning_rate": 3.231627908256093e-06,
+ "loss": 0.0953,
+ "step": 27325
+ },
+ {
+ "epoch": 74.45776566757493,
+ "grad_norm": 2.3662543296813965,
+ "learning_rate": 3.2309783014298235e-06,
+ "loss": 0.0504,
+ "step": 27326
+ },
+ {
+ "epoch": 74.46049046321527,
+ "grad_norm": 2.445415496826172,
+ "learning_rate": 3.2303287473204813e-06,
+ "loss": 0.0424,
+ "step": 27327
+ },
+ {
+ "epoch": 74.46321525885558,
+ "grad_norm": 12.313671112060547,
+ "learning_rate": 3.2296792459331196e-06,
+ "loss": 0.0485,
+ "step": 27328
+ },
+ {
+ "epoch": 74.46594005449592,
+ "grad_norm": 3.2492637634277344,
+ "learning_rate": 3.229029797272799e-06,
+ "loss": 0.2021,
+ "step": 27329
+ },
+ {
+ "epoch": 74.46866485013624,
+ "grad_norm": 6.003134250640869,
+ "learning_rate": 3.228380401344573e-06,
+ "loss": 0.0459,
+ "step": 27330
+ },
+ {
+ "epoch": 74.47138964577657,
+ "grad_norm": 4.572073936462402,
+ "learning_rate": 3.2277310581535046e-06,
+ "loss": 0.0863,
+ "step": 27331
+ },
+ {
+ "epoch": 74.47411444141689,
+ "grad_norm": 2.737095832824707,
+ "learning_rate": 3.2270817677046463e-06,
+ "loss": 0.16,
+ "step": 27332
+ },
+ {
+ "epoch": 74.47683923705722,
+ "grad_norm": 1.6207386255264282,
+ "learning_rate": 3.226432530003061e-06,
+ "loss": 0.0238,
+ "step": 27333
+ },
+ {
+ "epoch": 74.47956403269755,
+ "grad_norm": 4.511898994445801,
+ "learning_rate": 3.225783345053797e-06,
+ "loss": 0.031,
+ "step": 27334
+ },
+ {
+ "epoch": 74.48228882833787,
+ "grad_norm": 2.6669580936431885,
+ "learning_rate": 3.2251342128619177e-06,
+ "loss": 0.0255,
+ "step": 27335
+ },
+ {
+ "epoch": 74.4850136239782,
+ "grad_norm": 2.2407360076904297,
+ "learning_rate": 3.2244851334324755e-06,
+ "loss": 0.0307,
+ "step": 27336
+ },
+ {
+ "epoch": 74.48773841961852,
+ "grad_norm": 1.9477989673614502,
+ "learning_rate": 3.223836106770525e-06,
+ "loss": 0.0255,
+ "step": 27337
+ },
+ {
+ "epoch": 74.49046321525886,
+ "grad_norm": 2.5379209518432617,
+ "learning_rate": 3.2231871328811182e-06,
+ "loss": 0.0577,
+ "step": 27338
+ },
+ {
+ "epoch": 74.49318801089919,
+ "grad_norm": 2.7109456062316895,
+ "learning_rate": 3.2225382117693137e-06,
+ "loss": 0.0258,
+ "step": 27339
+ },
+ {
+ "epoch": 74.49591280653951,
+ "grad_norm": 3.679842233657837,
+ "learning_rate": 3.2218893434401645e-06,
+ "loss": 0.0432,
+ "step": 27340
+ },
+ {
+ "epoch": 74.49863760217984,
+ "grad_norm": 4.106472015380859,
+ "learning_rate": 3.2212405278987226e-06,
+ "loss": 0.07,
+ "step": 27341
+ },
+ {
+ "epoch": 74.50136239782016,
+ "grad_norm": 2.846247911453247,
+ "learning_rate": 3.2205917651500373e-06,
+ "loss": 0.0514,
+ "step": 27342
+ },
+ {
+ "epoch": 74.50408719346049,
+ "grad_norm": 3.2952558994293213,
+ "learning_rate": 3.2199430551991695e-06,
+ "loss": 0.0911,
+ "step": 27343
+ },
+ {
+ "epoch": 74.50681198910081,
+ "grad_norm": 3.331434965133667,
+ "learning_rate": 3.219294398051167e-06,
+ "loss": 0.1626,
+ "step": 27344
+ },
+ {
+ "epoch": 74.50953678474114,
+ "grad_norm": 2.7207252979278564,
+ "learning_rate": 3.2186457937110803e-06,
+ "loss": 0.0487,
+ "step": 27345
+ },
+ {
+ "epoch": 74.51226158038148,
+ "grad_norm": 5.137471675872803,
+ "learning_rate": 3.21799724218396e-06,
+ "loss": 0.0723,
+ "step": 27346
+ },
+ {
+ "epoch": 74.5149863760218,
+ "grad_norm": 3.6339457035064697,
+ "learning_rate": 3.217348743474862e-06,
+ "loss": 0.1025,
+ "step": 27347
+ },
+ {
+ "epoch": 74.51771117166213,
+ "grad_norm": 2.727165937423706,
+ "learning_rate": 3.216700297588833e-06,
+ "loss": 0.109,
+ "step": 27348
+ },
+ {
+ "epoch": 74.52043596730245,
+ "grad_norm": 2.7108774185180664,
+ "learning_rate": 3.2160519045309203e-06,
+ "loss": 0.1641,
+ "step": 27349
+ },
+ {
+ "epoch": 74.52316076294278,
+ "grad_norm": 3.9313526153564453,
+ "learning_rate": 3.2154035643061808e-06,
+ "loss": 0.2677,
+ "step": 27350
+ },
+ {
+ "epoch": 74.52588555858311,
+ "grad_norm": 3.4737322330474854,
+ "learning_rate": 3.214755276919657e-06,
+ "loss": 0.0931,
+ "step": 27351
+ },
+ {
+ "epoch": 74.52861035422343,
+ "grad_norm": 3.3170359134674072,
+ "learning_rate": 3.2141070423764043e-06,
+ "loss": 0.0443,
+ "step": 27352
+ },
+ {
+ "epoch": 74.53133514986376,
+ "grad_norm": 2.8323776721954346,
+ "learning_rate": 3.2134588606814665e-06,
+ "loss": 0.0626,
+ "step": 27353
+ },
+ {
+ "epoch": 74.53405994550408,
+ "grad_norm": 2.4754843711853027,
+ "learning_rate": 3.2128107318398925e-06,
+ "loss": 0.0316,
+ "step": 27354
+ },
+ {
+ "epoch": 74.53678474114442,
+ "grad_norm": 4.48448371887207,
+ "learning_rate": 3.2121626558567277e-06,
+ "loss": 0.0392,
+ "step": 27355
+ },
+ {
+ "epoch": 74.53950953678473,
+ "grad_norm": 2.2643465995788574,
+ "learning_rate": 3.211514632737025e-06,
+ "loss": 0.0391,
+ "step": 27356
+ },
+ {
+ "epoch": 74.54223433242507,
+ "grad_norm": 1.680436134338379,
+ "learning_rate": 3.2108666624858276e-06,
+ "loss": 0.0253,
+ "step": 27357
+ },
+ {
+ "epoch": 74.5449591280654,
+ "grad_norm": 2.255134344100952,
+ "learning_rate": 3.210218745108179e-06,
+ "loss": 0.0316,
+ "step": 27358
+ },
+ {
+ "epoch": 74.54768392370572,
+ "grad_norm": 2.986950635910034,
+ "learning_rate": 3.2095708806091306e-06,
+ "loss": 0.0462,
+ "step": 27359
+ },
+ {
+ "epoch": 74.55040871934605,
+ "grad_norm": 2.898524522781372,
+ "learning_rate": 3.208923068993727e-06,
+ "loss": 0.0457,
+ "step": 27360
+ },
+ {
+ "epoch": 74.55313351498637,
+ "grad_norm": 4.367632865905762,
+ "learning_rate": 3.2082753102670105e-06,
+ "loss": 0.0928,
+ "step": 27361
+ },
+ {
+ "epoch": 74.5558583106267,
+ "grad_norm": 2.7649285793304443,
+ "learning_rate": 3.207627604434025e-06,
+ "loss": 0.075,
+ "step": 27362
+ },
+ {
+ "epoch": 74.55858310626704,
+ "grad_norm": 8.433934211730957,
+ "learning_rate": 3.20697995149982e-06,
+ "loss": 0.0453,
+ "step": 27363
+ },
+ {
+ "epoch": 74.56130790190736,
+ "grad_norm": 2.8349850177764893,
+ "learning_rate": 3.2063323514694365e-06,
+ "loss": 0.0472,
+ "step": 27364
+ },
+ {
+ "epoch": 74.56403269754769,
+ "grad_norm": 2.8618035316467285,
+ "learning_rate": 3.2056848043479184e-06,
+ "loss": 0.1002,
+ "step": 27365
+ },
+ {
+ "epoch": 74.566757493188,
+ "grad_norm": 3.4427757263183594,
+ "learning_rate": 3.2050373101403053e-06,
+ "loss": 0.1556,
+ "step": 27366
+ },
+ {
+ "epoch": 74.56948228882834,
+ "grad_norm": 5.154320240020752,
+ "learning_rate": 3.2043898688516428e-06,
+ "loss": 0.0816,
+ "step": 27367
+ },
+ {
+ "epoch": 74.57220708446866,
+ "grad_norm": 2.4975204467773438,
+ "learning_rate": 3.2037424804869765e-06,
+ "loss": 0.0421,
+ "step": 27368
+ },
+ {
+ "epoch": 74.57493188010899,
+ "grad_norm": 2.318462610244751,
+ "learning_rate": 3.203095145051345e-06,
+ "loss": 0.0351,
+ "step": 27369
+ },
+ {
+ "epoch": 74.57765667574932,
+ "grad_norm": 4.079827308654785,
+ "learning_rate": 3.202447862549789e-06,
+ "loss": 0.0742,
+ "step": 27370
+ },
+ {
+ "epoch": 74.58038147138964,
+ "grad_norm": 3.9023802280426025,
+ "learning_rate": 3.2018006329873475e-06,
+ "loss": 0.0985,
+ "step": 27371
+ },
+ {
+ "epoch": 74.58310626702998,
+ "grad_norm": 3.151120185852051,
+ "learning_rate": 3.201153456369067e-06,
+ "loss": 0.0608,
+ "step": 27372
+ },
+ {
+ "epoch": 74.5858310626703,
+ "grad_norm": 7.027402877807617,
+ "learning_rate": 3.2005063326999853e-06,
+ "loss": 0.1259,
+ "step": 27373
+ },
+ {
+ "epoch": 74.58855585831063,
+ "grad_norm": 1.838041067123413,
+ "learning_rate": 3.199859261985141e-06,
+ "loss": 0.0264,
+ "step": 27374
+ },
+ {
+ "epoch": 74.59128065395096,
+ "grad_norm": 1.8210034370422363,
+ "learning_rate": 3.1992122442295702e-06,
+ "loss": 0.0347,
+ "step": 27375
+ },
+ {
+ "epoch": 74.59400544959128,
+ "grad_norm": 3.0615527629852295,
+ "learning_rate": 3.1985652794383193e-06,
+ "loss": 0.0963,
+ "step": 27376
+ },
+ {
+ "epoch": 74.59673024523161,
+ "grad_norm": 4.979789733886719,
+ "learning_rate": 3.197918367616423e-06,
+ "loss": 0.0697,
+ "step": 27377
+ },
+ {
+ "epoch": 74.59945504087193,
+ "grad_norm": 2.7697553634643555,
+ "learning_rate": 3.197271508768919e-06,
+ "loss": 0.0279,
+ "step": 27378
+ },
+ {
+ "epoch": 74.60217983651226,
+ "grad_norm": 2.101897716522217,
+ "learning_rate": 3.1966247029008433e-06,
+ "loss": 0.0374,
+ "step": 27379
+ },
+ {
+ "epoch": 74.60490463215258,
+ "grad_norm": 2.0909366607666016,
+ "learning_rate": 3.1959779500172382e-06,
+ "loss": 0.039,
+ "step": 27380
+ },
+ {
+ "epoch": 74.60762942779292,
+ "grad_norm": 2.7853620052337646,
+ "learning_rate": 3.195331250123138e-06,
+ "loss": 0.1248,
+ "step": 27381
+ },
+ {
+ "epoch": 74.61035422343325,
+ "grad_norm": 2.994997262954712,
+ "learning_rate": 3.1946846032235754e-06,
+ "loss": 0.0518,
+ "step": 27382
+ },
+ {
+ "epoch": 74.61307901907357,
+ "grad_norm": 2.473146677017212,
+ "learning_rate": 3.1940380093235932e-06,
+ "loss": 0.0805,
+ "step": 27383
+ },
+ {
+ "epoch": 74.6158038147139,
+ "grad_norm": 4.3801093101501465,
+ "learning_rate": 3.1933914684282206e-06,
+ "loss": 0.0557,
+ "step": 27384
+ },
+ {
+ "epoch": 74.61852861035422,
+ "grad_norm": 2.473504066467285,
+ "learning_rate": 3.1927449805425005e-06,
+ "loss": 0.064,
+ "step": 27385
+ },
+ {
+ "epoch": 74.62125340599455,
+ "grad_norm": 3.362474203109741,
+ "learning_rate": 3.1920985456714625e-06,
+ "loss": 0.0344,
+ "step": 27386
+ },
+ {
+ "epoch": 74.62397820163488,
+ "grad_norm": 2.301248550415039,
+ "learning_rate": 3.191452163820139e-06,
+ "loss": 0.0992,
+ "step": 27387
+ },
+ {
+ "epoch": 74.6267029972752,
+ "grad_norm": 3.087402820587158,
+ "learning_rate": 3.19080583499357e-06,
+ "loss": 0.0502,
+ "step": 27388
+ },
+ {
+ "epoch": 74.62942779291554,
+ "grad_norm": 2.3167479038238525,
+ "learning_rate": 3.190159559196786e-06,
+ "loss": 0.0351,
+ "step": 27389
+ },
+ {
+ "epoch": 74.63215258855585,
+ "grad_norm": 2.209955930709839,
+ "learning_rate": 3.1895133364348208e-06,
+ "loss": 0.0273,
+ "step": 27390
+ },
+ {
+ "epoch": 74.63487738419619,
+ "grad_norm": 2.4292988777160645,
+ "learning_rate": 3.1888671667127026e-06,
+ "loss": 0.0896,
+ "step": 27391
+ },
+ {
+ "epoch": 74.6376021798365,
+ "grad_norm": 3.015127420425415,
+ "learning_rate": 3.1882210500354705e-06,
+ "loss": 0.1085,
+ "step": 27392
+ },
+ {
+ "epoch": 74.64032697547684,
+ "grad_norm": 2.6956639289855957,
+ "learning_rate": 3.187574986408155e-06,
+ "loss": 0.1141,
+ "step": 27393
+ },
+ {
+ "epoch": 74.64305177111717,
+ "grad_norm": 4.860119342803955,
+ "learning_rate": 3.1869289758357845e-06,
+ "loss": 0.1346,
+ "step": 27394
+ },
+ {
+ "epoch": 74.64577656675749,
+ "grad_norm": 4.685331344604492,
+ "learning_rate": 3.1862830183233907e-06,
+ "loss": 0.0365,
+ "step": 27395
+ },
+ {
+ "epoch": 74.64850136239782,
+ "grad_norm": 2.2085535526275635,
+ "learning_rate": 3.185637113876007e-06,
+ "loss": 0.038,
+ "step": 27396
+ },
+ {
+ "epoch": 74.65122615803814,
+ "grad_norm": 2.1946418285369873,
+ "learning_rate": 3.184991262498662e-06,
+ "loss": 0.0293,
+ "step": 27397
+ },
+ {
+ "epoch": 74.65395095367847,
+ "grad_norm": 4.102278709411621,
+ "learning_rate": 3.1843454641963866e-06,
+ "loss": 0.1202,
+ "step": 27398
+ },
+ {
+ "epoch": 74.65667574931881,
+ "grad_norm": 2.386718273162842,
+ "learning_rate": 3.183699718974207e-06,
+ "loss": 0.0411,
+ "step": 27399
+ },
+ {
+ "epoch": 74.65940054495913,
+ "grad_norm": 3.3451311588287354,
+ "learning_rate": 3.183054026837157e-06,
+ "loss": 0.0872,
+ "step": 27400
+ },
+ {
+ "epoch": 74.66212534059946,
+ "grad_norm": 4.495838165283203,
+ "learning_rate": 3.182408387790259e-06,
+ "loss": 0.049,
+ "step": 27401
+ },
+ {
+ "epoch": 74.66485013623978,
+ "grad_norm": 2.089571475982666,
+ "learning_rate": 3.181762801838548e-06,
+ "loss": 0.0252,
+ "step": 27402
+ },
+ {
+ "epoch": 74.66757493188011,
+ "grad_norm": 2.0634653568267822,
+ "learning_rate": 3.181117268987046e-06,
+ "loss": 0.0289,
+ "step": 27403
+ },
+ {
+ "epoch": 74.67029972752043,
+ "grad_norm": 3.0624613761901855,
+ "learning_rate": 3.1804717892407877e-06,
+ "loss": 0.1385,
+ "step": 27404
+ },
+ {
+ "epoch": 74.67302452316076,
+ "grad_norm": 3.4951775074005127,
+ "learning_rate": 3.1798263626047944e-06,
+ "loss": 0.1402,
+ "step": 27405
+ },
+ {
+ "epoch": 74.6757493188011,
+ "grad_norm": 5.737732410430908,
+ "learning_rate": 3.1791809890840942e-06,
+ "loss": 0.0913,
+ "step": 27406
+ },
+ {
+ "epoch": 74.67847411444141,
+ "grad_norm": 2.3680155277252197,
+ "learning_rate": 3.1785356686837097e-06,
+ "loss": 0.1333,
+ "step": 27407
+ },
+ {
+ "epoch": 74.68119891008175,
+ "grad_norm": 3.2178423404693604,
+ "learning_rate": 3.177890401408673e-06,
+ "loss": 0.0432,
+ "step": 27408
+ },
+ {
+ "epoch": 74.68392370572207,
+ "grad_norm": 3.593608856201172,
+ "learning_rate": 3.1772451872640066e-06,
+ "loss": 0.0455,
+ "step": 27409
+ },
+ {
+ "epoch": 74.6866485013624,
+ "grad_norm": 2.4788355827331543,
+ "learning_rate": 3.1766000262547347e-06,
+ "loss": 0.135,
+ "step": 27410
+ },
+ {
+ "epoch": 74.68937329700273,
+ "grad_norm": 3.574361562728882,
+ "learning_rate": 3.1759549183858797e-06,
+ "loss": 0.1343,
+ "step": 27411
+ },
+ {
+ "epoch": 74.69209809264305,
+ "grad_norm": 2.709545373916626,
+ "learning_rate": 3.17530986366247e-06,
+ "loss": 0.0407,
+ "step": 27412
+ },
+ {
+ "epoch": 74.69482288828338,
+ "grad_norm": 5.369472980499268,
+ "learning_rate": 3.174664862089528e-06,
+ "loss": 0.0397,
+ "step": 27413
+ },
+ {
+ "epoch": 74.6975476839237,
+ "grad_norm": 4.344054222106934,
+ "learning_rate": 3.174019913672077e-06,
+ "loss": 0.1633,
+ "step": 27414
+ },
+ {
+ "epoch": 74.70027247956403,
+ "grad_norm": 2.938528537750244,
+ "learning_rate": 3.1733750184151357e-06,
+ "loss": 0.0618,
+ "step": 27415
+ },
+ {
+ "epoch": 74.70299727520435,
+ "grad_norm": 2.4566922187805176,
+ "learning_rate": 3.172730176323733e-06,
+ "loss": 0.0391,
+ "step": 27416
+ },
+ {
+ "epoch": 74.70572207084469,
+ "grad_norm": 3.157243251800537,
+ "learning_rate": 3.172085387402888e-06,
+ "loss": 0.0467,
+ "step": 27417
+ },
+ {
+ "epoch": 74.70844686648502,
+ "grad_norm": 6.23567008972168,
+ "learning_rate": 3.171440651657619e-06,
+ "loss": 0.0554,
+ "step": 27418
+ },
+ {
+ "epoch": 74.71117166212534,
+ "grad_norm": 2.5095317363739014,
+ "learning_rate": 3.1707959690929545e-06,
+ "loss": 0.0399,
+ "step": 27419
+ },
+ {
+ "epoch": 74.71389645776567,
+ "grad_norm": 2.690309524536133,
+ "learning_rate": 3.1701513397139072e-06,
+ "loss": 0.0354,
+ "step": 27420
+ },
+ {
+ "epoch": 74.71662125340599,
+ "grad_norm": 2.5978381633758545,
+ "learning_rate": 3.169506763525505e-06,
+ "loss": 0.0376,
+ "step": 27421
+ },
+ {
+ "epoch": 74.71934604904632,
+ "grad_norm": 3.6311593055725098,
+ "learning_rate": 3.168862240532764e-06,
+ "loss": 0.0861,
+ "step": 27422
+ },
+ {
+ "epoch": 74.72207084468666,
+ "grad_norm": 3.008673906326294,
+ "learning_rate": 3.1682177707407e-06,
+ "loss": 0.1461,
+ "step": 27423
+ },
+ {
+ "epoch": 74.72479564032697,
+ "grad_norm": 3.299814462661743,
+ "learning_rate": 3.167573354154341e-06,
+ "loss": 0.0843,
+ "step": 27424
+ },
+ {
+ "epoch": 74.7275204359673,
+ "grad_norm": 3.0510849952697754,
+ "learning_rate": 3.1669289907786994e-06,
+ "loss": 0.0392,
+ "step": 27425
+ },
+ {
+ "epoch": 74.73024523160763,
+ "grad_norm": 3.5574769973754883,
+ "learning_rate": 3.1662846806187952e-06,
+ "loss": 0.1855,
+ "step": 27426
+ },
+ {
+ "epoch": 74.73297002724796,
+ "grad_norm": 2.4356772899627686,
+ "learning_rate": 3.1656404236796436e-06,
+ "loss": 0.0417,
+ "step": 27427
+ },
+ {
+ "epoch": 74.73569482288828,
+ "grad_norm": 3.1003222465515137,
+ "learning_rate": 3.1649962199662665e-06,
+ "loss": 0.1738,
+ "step": 27428
+ },
+ {
+ "epoch": 74.73841961852861,
+ "grad_norm": 3.6968743801116943,
+ "learning_rate": 3.1643520694836793e-06,
+ "loss": 0.1928,
+ "step": 27429
+ },
+ {
+ "epoch": 74.74114441416894,
+ "grad_norm": 2.2422289848327637,
+ "learning_rate": 3.163707972236899e-06,
+ "loss": 0.0593,
+ "step": 27430
+ },
+ {
+ "epoch": 74.74386920980926,
+ "grad_norm": 2.408618450164795,
+ "learning_rate": 3.163063928230937e-06,
+ "loss": 0.104,
+ "step": 27431
+ },
+ {
+ "epoch": 74.7465940054496,
+ "grad_norm": 3.220341444015503,
+ "learning_rate": 3.1624199374708163e-06,
+ "loss": 0.1713,
+ "step": 27432
+ },
+ {
+ "epoch": 74.74931880108991,
+ "grad_norm": 3.2058322429656982,
+ "learning_rate": 3.1617759999615495e-06,
+ "loss": 0.041,
+ "step": 27433
+ },
+ {
+ "epoch": 74.75204359673025,
+ "grad_norm": 2.603969097137451,
+ "learning_rate": 3.161132115708151e-06,
+ "loss": 0.0929,
+ "step": 27434
+ },
+ {
+ "epoch": 74.75476839237058,
+ "grad_norm": 3.143913507461548,
+ "learning_rate": 3.1604882847156314e-06,
+ "loss": 0.1677,
+ "step": 27435
+ },
+ {
+ "epoch": 74.7574931880109,
+ "grad_norm": 4.815069198608398,
+ "learning_rate": 3.1598445069890093e-06,
+ "loss": 0.0504,
+ "step": 27436
+ },
+ {
+ "epoch": 74.76021798365123,
+ "grad_norm": 2.8605568408966064,
+ "learning_rate": 3.1592007825333015e-06,
+ "loss": 0.0369,
+ "step": 27437
+ },
+ {
+ "epoch": 74.76294277929155,
+ "grad_norm": 2.512197732925415,
+ "learning_rate": 3.1585571113535186e-06,
+ "loss": 0.1017,
+ "step": 27438
+ },
+ {
+ "epoch": 74.76566757493188,
+ "grad_norm": 3.2640180587768555,
+ "learning_rate": 3.1579134934546716e-06,
+ "loss": 0.1161,
+ "step": 27439
+ },
+ {
+ "epoch": 74.7683923705722,
+ "grad_norm": 2.781555652618408,
+ "learning_rate": 3.1572699288417708e-06,
+ "loss": 0.1141,
+ "step": 27440
+ },
+ {
+ "epoch": 74.77111716621253,
+ "grad_norm": 3.1150054931640625,
+ "learning_rate": 3.156626417519836e-06,
+ "loss": 0.0651,
+ "step": 27441
+ },
+ {
+ "epoch": 74.77384196185287,
+ "grad_norm": 3.060635805130005,
+ "learning_rate": 3.1559829594938728e-06,
+ "loss": 0.2373,
+ "step": 27442
+ },
+ {
+ "epoch": 74.77656675749319,
+ "grad_norm": 5.093193531036377,
+ "learning_rate": 3.1553395547688914e-06,
+ "loss": 0.1321,
+ "step": 27443
+ },
+ {
+ "epoch": 74.77929155313352,
+ "grad_norm": 3.535568952560425,
+ "learning_rate": 3.1546962033499084e-06,
+ "loss": 0.0812,
+ "step": 27444
+ },
+ {
+ "epoch": 74.78201634877384,
+ "grad_norm": 2.840769052505493,
+ "learning_rate": 3.1540529052419323e-06,
+ "loss": 0.0421,
+ "step": 27445
+ },
+ {
+ "epoch": 74.78474114441417,
+ "grad_norm": 3.9191110134124756,
+ "learning_rate": 3.153409660449971e-06,
+ "loss": 0.2843,
+ "step": 27446
+ },
+ {
+ "epoch": 74.7874659400545,
+ "grad_norm": 3.4338719844818115,
+ "learning_rate": 3.1527664689790316e-06,
+ "loss": 0.0596,
+ "step": 27447
+ },
+ {
+ "epoch": 74.79019073569482,
+ "grad_norm": 2.8352816104888916,
+ "learning_rate": 3.1521233308341292e-06,
+ "loss": 0.041,
+ "step": 27448
+ },
+ {
+ "epoch": 74.79291553133515,
+ "grad_norm": 3.671628952026367,
+ "learning_rate": 3.1514802460202707e-06,
+ "loss": 0.0803,
+ "step": 27449
+ },
+ {
+ "epoch": 74.79564032697547,
+ "grad_norm": 6.532846450805664,
+ "learning_rate": 3.1508372145424637e-06,
+ "loss": 0.0462,
+ "step": 27450
+ },
+ {
+ "epoch": 74.7983651226158,
+ "grad_norm": 2.7748310565948486,
+ "learning_rate": 3.1501942364057116e-06,
+ "loss": 0.082,
+ "step": 27451
+ },
+ {
+ "epoch": 74.80108991825612,
+ "grad_norm": 3.0477004051208496,
+ "learning_rate": 3.1495513116150276e-06,
+ "loss": 0.0637,
+ "step": 27452
+ },
+ {
+ "epoch": 74.80381471389646,
+ "grad_norm": 3.5865554809570312,
+ "learning_rate": 3.14890844017542e-06,
+ "loss": 0.0871,
+ "step": 27453
+ },
+ {
+ "epoch": 74.80653950953679,
+ "grad_norm": 3.582667112350464,
+ "learning_rate": 3.1482656220918938e-06,
+ "loss": 0.0389,
+ "step": 27454
+ },
+ {
+ "epoch": 74.80926430517711,
+ "grad_norm": 2.5279176235198975,
+ "learning_rate": 3.1476228573694533e-06,
+ "loss": 0.0623,
+ "step": 27455
+ },
+ {
+ "epoch": 74.81198910081744,
+ "grad_norm": 3.823660373687744,
+ "learning_rate": 3.1469801460131035e-06,
+ "loss": 0.1617,
+ "step": 27456
+ },
+ {
+ "epoch": 74.81471389645776,
+ "grad_norm": 2.192878007888794,
+ "learning_rate": 3.146337488027854e-06,
+ "loss": 0.0431,
+ "step": 27457
+ },
+ {
+ "epoch": 74.8174386920981,
+ "grad_norm": 2.2675254344940186,
+ "learning_rate": 3.1456948834187083e-06,
+ "loss": 0.0314,
+ "step": 27458
+ },
+ {
+ "epoch": 74.82016348773843,
+ "grad_norm": 6.254118919372559,
+ "learning_rate": 3.14505233219067e-06,
+ "loss": 0.0462,
+ "step": 27459
+ },
+ {
+ "epoch": 74.82288828337875,
+ "grad_norm": 3.756660223007202,
+ "learning_rate": 3.1444098343487394e-06,
+ "loss": 0.1437,
+ "step": 27460
+ },
+ {
+ "epoch": 74.82561307901908,
+ "grad_norm": 3.801999092102051,
+ "learning_rate": 3.1437673898979282e-06,
+ "loss": 0.0514,
+ "step": 27461
+ },
+ {
+ "epoch": 74.8283378746594,
+ "grad_norm": 3.2751238346099854,
+ "learning_rate": 3.143124998843237e-06,
+ "loss": 0.0385,
+ "step": 27462
+ },
+ {
+ "epoch": 74.83106267029973,
+ "grad_norm": 3.086588144302368,
+ "learning_rate": 3.1424826611896664e-06,
+ "loss": 0.2446,
+ "step": 27463
+ },
+ {
+ "epoch": 74.83378746594005,
+ "grad_norm": 3.3873214721679688,
+ "learning_rate": 3.1418403769422166e-06,
+ "loss": 0.0282,
+ "step": 27464
+ },
+ {
+ "epoch": 74.83651226158038,
+ "grad_norm": 3.4134676456451416,
+ "learning_rate": 3.1411981461058973e-06,
+ "loss": 0.1302,
+ "step": 27465
+ },
+ {
+ "epoch": 74.83923705722071,
+ "grad_norm": 2.2357282638549805,
+ "learning_rate": 3.1405559686857058e-06,
+ "loss": 0.0338,
+ "step": 27466
+ },
+ {
+ "epoch": 74.84196185286103,
+ "grad_norm": 3.2296764850616455,
+ "learning_rate": 3.1399138446866405e-06,
+ "loss": 0.0518,
+ "step": 27467
+ },
+ {
+ "epoch": 74.84468664850137,
+ "grad_norm": 3.764432191848755,
+ "learning_rate": 3.139271774113708e-06,
+ "loss": 0.0755,
+ "step": 27468
+ },
+ {
+ "epoch": 74.84741144414168,
+ "grad_norm": 1.9802919626235962,
+ "learning_rate": 3.138629756971907e-06,
+ "loss": 0.0351,
+ "step": 27469
+ },
+ {
+ "epoch": 74.85013623978202,
+ "grad_norm": 2.98422908782959,
+ "learning_rate": 3.137987793266233e-06,
+ "loss": 0.0886,
+ "step": 27470
+ },
+ {
+ "epoch": 74.85286103542235,
+ "grad_norm": 3.518028736114502,
+ "learning_rate": 3.1373458830016925e-06,
+ "loss": 0.0994,
+ "step": 27471
+ },
+ {
+ "epoch": 74.85558583106267,
+ "grad_norm": 9.135181427001953,
+ "learning_rate": 3.136704026183278e-06,
+ "loss": 0.0541,
+ "step": 27472
+ },
+ {
+ "epoch": 74.858310626703,
+ "grad_norm": 5.177651405334473,
+ "learning_rate": 3.136062222815994e-06,
+ "loss": 0.0259,
+ "step": 27473
+ },
+ {
+ "epoch": 74.86103542234332,
+ "grad_norm": 3.1518969535827637,
+ "learning_rate": 3.135420472904839e-06,
+ "loss": 0.2288,
+ "step": 27474
+ },
+ {
+ "epoch": 74.86376021798365,
+ "grad_norm": 4.267491340637207,
+ "learning_rate": 3.1347787764548064e-06,
+ "loss": 0.0771,
+ "step": 27475
+ },
+ {
+ "epoch": 74.86648501362397,
+ "grad_norm": 2.849985122680664,
+ "learning_rate": 3.1341371334708924e-06,
+ "loss": 0.0856,
+ "step": 27476
+ },
+ {
+ "epoch": 74.8692098092643,
+ "grad_norm": 2.889461040496826,
+ "learning_rate": 3.1334955439581016e-06,
+ "loss": 0.0764,
+ "step": 27477
+ },
+ {
+ "epoch": 74.87193460490464,
+ "grad_norm": 3.2429332733154297,
+ "learning_rate": 3.1328540079214264e-06,
+ "loss": 0.0383,
+ "step": 27478
+ },
+ {
+ "epoch": 74.87465940054496,
+ "grad_norm": 4.318110942840576,
+ "learning_rate": 3.132212525365863e-06,
+ "loss": 0.1022,
+ "step": 27479
+ },
+ {
+ "epoch": 74.87738419618529,
+ "grad_norm": 3.088435173034668,
+ "learning_rate": 3.131571096296404e-06,
+ "loss": 0.1602,
+ "step": 27480
+ },
+ {
+ "epoch": 74.88010899182561,
+ "grad_norm": 3.6335043907165527,
+ "learning_rate": 3.130929720718051e-06,
+ "loss": 0.0867,
+ "step": 27481
+ },
+ {
+ "epoch": 74.88283378746594,
+ "grad_norm": 2.422663688659668,
+ "learning_rate": 3.130288398635797e-06,
+ "loss": 0.0382,
+ "step": 27482
+ },
+ {
+ "epoch": 74.88555858310627,
+ "grad_norm": 2.0690314769744873,
+ "learning_rate": 3.129647130054636e-06,
+ "loss": 0.0944,
+ "step": 27483
+ },
+ {
+ "epoch": 74.88828337874659,
+ "grad_norm": 2.035308599472046,
+ "learning_rate": 3.129005914979558e-06,
+ "loss": 0.0386,
+ "step": 27484
+ },
+ {
+ "epoch": 74.89100817438693,
+ "grad_norm": 4.204923629760742,
+ "learning_rate": 3.128364753415565e-06,
+ "loss": 0.1086,
+ "step": 27485
+ },
+ {
+ "epoch": 74.89373297002724,
+ "grad_norm": 2.8162553310394287,
+ "learning_rate": 3.127723645367645e-06,
+ "loss": 0.1143,
+ "step": 27486
+ },
+ {
+ "epoch": 74.89645776566758,
+ "grad_norm": 5.131668567657471,
+ "learning_rate": 3.1270825908407897e-06,
+ "loss": 0.0968,
+ "step": 27487
+ },
+ {
+ "epoch": 74.8991825613079,
+ "grad_norm": 2.573620319366455,
+ "learning_rate": 3.1264415898399935e-06,
+ "loss": 0.0359,
+ "step": 27488
+ },
+ {
+ "epoch": 74.90190735694823,
+ "grad_norm": 2.7319297790527344,
+ "learning_rate": 3.1258006423702536e-06,
+ "loss": 0.0433,
+ "step": 27489
+ },
+ {
+ "epoch": 74.90463215258856,
+ "grad_norm": 5.500871181488037,
+ "learning_rate": 3.125159748436556e-06,
+ "loss": 0.1917,
+ "step": 27490
+ },
+ {
+ "epoch": 74.90735694822888,
+ "grad_norm": 2.8717222213745117,
+ "learning_rate": 3.124518908043892e-06,
+ "loss": 0.0293,
+ "step": 27491
+ },
+ {
+ "epoch": 74.91008174386921,
+ "grad_norm": 2.114720582962036,
+ "learning_rate": 3.123878121197251e-06,
+ "loss": 0.0366,
+ "step": 27492
+ },
+ {
+ "epoch": 74.91280653950953,
+ "grad_norm": 2.324105978012085,
+ "learning_rate": 3.12323738790163e-06,
+ "loss": 0.0734,
+ "step": 27493
+ },
+ {
+ "epoch": 74.91553133514986,
+ "grad_norm": 5.976681232452393,
+ "learning_rate": 3.1225967081620136e-06,
+ "loss": 0.0399,
+ "step": 27494
+ },
+ {
+ "epoch": 74.9182561307902,
+ "grad_norm": 2.522785186767578,
+ "learning_rate": 3.121956081983394e-06,
+ "loss": 0.0262,
+ "step": 27495
+ },
+ {
+ "epoch": 74.92098092643052,
+ "grad_norm": 2.162013292312622,
+ "learning_rate": 3.1213155093707547e-06,
+ "loss": 0.0357,
+ "step": 27496
+ },
+ {
+ "epoch": 74.92370572207085,
+ "grad_norm": 2.9040699005126953,
+ "learning_rate": 3.1206749903290924e-06,
+ "loss": 0.2002,
+ "step": 27497
+ },
+ {
+ "epoch": 74.92643051771117,
+ "grad_norm": 2.6344516277313232,
+ "learning_rate": 3.120034524863392e-06,
+ "loss": 0.0361,
+ "step": 27498
+ },
+ {
+ "epoch": 74.9291553133515,
+ "grad_norm": 4.292081832885742,
+ "learning_rate": 3.119394112978641e-06,
+ "loss": 0.1328,
+ "step": 27499
+ },
+ {
+ "epoch": 74.93188010899182,
+ "grad_norm": 2.953303575515747,
+ "learning_rate": 3.1187537546798243e-06,
+ "loss": 0.0359,
+ "step": 27500
+ },
+ {
+ "epoch": 74.93460490463215,
+ "grad_norm": 2.4193108081817627,
+ "learning_rate": 3.1181134499719346e-06,
+ "loss": 0.0311,
+ "step": 27501
+ },
+ {
+ "epoch": 74.93732970027249,
+ "grad_norm": 3.2863755226135254,
+ "learning_rate": 3.117473198859957e-06,
+ "loss": 0.0691,
+ "step": 27502
+ },
+ {
+ "epoch": 74.9400544959128,
+ "grad_norm": 3.368201971054077,
+ "learning_rate": 3.1168330013488756e-06,
+ "loss": 0.1171,
+ "step": 27503
+ },
+ {
+ "epoch": 74.94277929155314,
+ "grad_norm": 2.8241043090820312,
+ "learning_rate": 3.116192857443674e-06,
+ "loss": 0.1456,
+ "step": 27504
+ },
+ {
+ "epoch": 74.94550408719346,
+ "grad_norm": 4.0922040939331055,
+ "learning_rate": 3.1155527671493414e-06,
+ "loss": 0.0755,
+ "step": 27505
+ },
+ {
+ "epoch": 74.94822888283379,
+ "grad_norm": 3.2033066749572754,
+ "learning_rate": 3.114912730470865e-06,
+ "loss": 0.0304,
+ "step": 27506
+ },
+ {
+ "epoch": 74.95095367847412,
+ "grad_norm": 4.60787296295166,
+ "learning_rate": 3.1142727474132275e-06,
+ "loss": 0.0421,
+ "step": 27507
+ },
+ {
+ "epoch": 74.95367847411444,
+ "grad_norm": 2.8809895515441895,
+ "learning_rate": 3.113632817981408e-06,
+ "loss": 0.0502,
+ "step": 27508
+ },
+ {
+ "epoch": 74.95640326975477,
+ "grad_norm": 3.216729164123535,
+ "learning_rate": 3.1129929421803982e-06,
+ "loss": 0.0675,
+ "step": 27509
+ },
+ {
+ "epoch": 74.95912806539509,
+ "grad_norm": 2.9025216102600098,
+ "learning_rate": 3.112353120015178e-06,
+ "loss": 0.0555,
+ "step": 27510
+ },
+ {
+ "epoch": 74.96185286103542,
+ "grad_norm": 3.4627859592437744,
+ "learning_rate": 3.1117133514907294e-06,
+ "loss": 0.0776,
+ "step": 27511
+ },
+ {
+ "epoch": 74.96457765667574,
+ "grad_norm": 2.72674298286438,
+ "learning_rate": 3.111073636612032e-06,
+ "loss": 0.0797,
+ "step": 27512
+ },
+ {
+ "epoch": 74.96730245231608,
+ "grad_norm": 2.8152270317077637,
+ "learning_rate": 3.1104339753840752e-06,
+ "loss": 0.0518,
+ "step": 27513
+ },
+ {
+ "epoch": 74.97002724795641,
+ "grad_norm": 3.045332670211792,
+ "learning_rate": 3.109794367811837e-06,
+ "loss": 0.1923,
+ "step": 27514
+ },
+ {
+ "epoch": 74.97275204359673,
+ "grad_norm": 4.088866233825684,
+ "learning_rate": 3.109154813900298e-06,
+ "loss": 0.0596,
+ "step": 27515
+ },
+ {
+ "epoch": 74.97547683923706,
+ "grad_norm": 3.0625717639923096,
+ "learning_rate": 3.108515313654438e-06,
+ "loss": 0.1124,
+ "step": 27516
+ },
+ {
+ "epoch": 74.97820163487738,
+ "grad_norm": 2.966005325317383,
+ "learning_rate": 3.1078758670792397e-06,
+ "loss": 0.1448,
+ "step": 27517
+ },
+ {
+ "epoch": 74.98092643051771,
+ "grad_norm": 2.499295234680176,
+ "learning_rate": 3.1072364741796833e-06,
+ "loss": 0.0385,
+ "step": 27518
+ },
+ {
+ "epoch": 74.98365122615803,
+ "grad_norm": 2.7400944232940674,
+ "learning_rate": 3.1065971349607484e-06,
+ "loss": 0.0467,
+ "step": 27519
+ },
+ {
+ "epoch": 74.98637602179836,
+ "grad_norm": 3.302360773086548,
+ "learning_rate": 3.105957849427409e-06,
+ "loss": 0.0998,
+ "step": 27520
+ },
+ {
+ "epoch": 74.9891008174387,
+ "grad_norm": 2.534291982650757,
+ "learning_rate": 3.1053186175846474e-06,
+ "loss": 0.0341,
+ "step": 27521
+ },
+ {
+ "epoch": 74.99182561307902,
+ "grad_norm": 3.326748847961426,
+ "learning_rate": 3.104679439437447e-06,
+ "loss": 0.1436,
+ "step": 27522
+ },
+ {
+ "epoch": 74.99455040871935,
+ "grad_norm": 2.6939988136291504,
+ "learning_rate": 3.1040403149907805e-06,
+ "loss": 0.1331,
+ "step": 27523
+ },
+ {
+ "epoch": 74.99727520435967,
+ "grad_norm": 3.131129264831543,
+ "learning_rate": 3.1034012442496253e-06,
+ "loss": 0.0787,
+ "step": 27524
+ },
+ {
+ "epoch": 75.0,
+ "grad_norm": 2.8523824214935303,
+ "learning_rate": 3.1027622272189572e-06,
+ "loss": 0.1013,
+ "step": 27525
+ },
+ {
+ "epoch": 75.00272479564033,
+ "grad_norm": 3.311145782470703,
+ "learning_rate": 3.102123263903758e-06,
+ "loss": 0.0655,
+ "step": 27526
+ },
+ {
+ "epoch": 75.00544959128065,
+ "grad_norm": 2.3888118267059326,
+ "learning_rate": 3.1014843543090002e-06,
+ "loss": 0.0348,
+ "step": 27527
+ },
+ {
+ "epoch": 75.00817438692098,
+ "grad_norm": 3.0262041091918945,
+ "learning_rate": 3.1008454984396606e-06,
+ "loss": 0.0293,
+ "step": 27528
+ },
+ {
+ "epoch": 75.0108991825613,
+ "grad_norm": 2.7091064453125,
+ "learning_rate": 3.1002066963007116e-06,
+ "loss": 0.05,
+ "step": 27529
+ },
+ {
+ "epoch": 75.01362397820164,
+ "grad_norm": 2.9500162601470947,
+ "learning_rate": 3.099567947897133e-06,
+ "loss": 0.0561,
+ "step": 27530
+ },
+ {
+ "epoch": 75.01634877384195,
+ "grad_norm": 2.945417642593384,
+ "learning_rate": 3.0989292532338978e-06,
+ "loss": 0.0326,
+ "step": 27531
+ },
+ {
+ "epoch": 75.01907356948229,
+ "grad_norm": 2.4412946701049805,
+ "learning_rate": 3.098290612315976e-06,
+ "loss": 0.051,
+ "step": 27532
+ },
+ {
+ "epoch": 75.02179836512262,
+ "grad_norm": 3.124022960662842,
+ "learning_rate": 3.0976520251483476e-06,
+ "loss": 0.1109,
+ "step": 27533
+ },
+ {
+ "epoch": 75.02452316076294,
+ "grad_norm": 2.738534927368164,
+ "learning_rate": 3.097013491735984e-06,
+ "loss": 0.0518,
+ "step": 27534
+ },
+ {
+ "epoch": 75.02724795640327,
+ "grad_norm": 5.542792797088623,
+ "learning_rate": 3.0963750120838564e-06,
+ "loss": 0.0744,
+ "step": 27535
+ },
+ {
+ "epoch": 75.02997275204359,
+ "grad_norm": 4.510857105255127,
+ "learning_rate": 3.0957365861969345e-06,
+ "loss": 0.2035,
+ "step": 27536
+ },
+ {
+ "epoch": 75.03269754768392,
+ "grad_norm": 4.250611782073975,
+ "learning_rate": 3.095098214080198e-06,
+ "loss": 0.0578,
+ "step": 27537
+ },
+ {
+ "epoch": 75.03542234332426,
+ "grad_norm": 1.8988556861877441,
+ "learning_rate": 3.0944598957386107e-06,
+ "loss": 0.1159,
+ "step": 27538
+ },
+ {
+ "epoch": 75.03814713896458,
+ "grad_norm": 3.1393895149230957,
+ "learning_rate": 3.0938216311771507e-06,
+ "loss": 0.0352,
+ "step": 27539
+ },
+ {
+ "epoch": 75.04087193460491,
+ "grad_norm": 1.4722155332565308,
+ "learning_rate": 3.0931834204007862e-06,
+ "loss": 0.0173,
+ "step": 27540
+ },
+ {
+ "epoch": 75.04359673024523,
+ "grad_norm": 2.404116630554199,
+ "learning_rate": 3.0925452634144825e-06,
+ "loss": 0.0752,
+ "step": 27541
+ },
+ {
+ "epoch": 75.04632152588556,
+ "grad_norm": 2.586320161819458,
+ "learning_rate": 3.0919071602232175e-06,
+ "loss": 0.0381,
+ "step": 27542
+ },
+ {
+ "epoch": 75.04904632152588,
+ "grad_norm": 9.841873168945312,
+ "learning_rate": 3.0912691108319582e-06,
+ "loss": 0.0425,
+ "step": 27543
+ },
+ {
+ "epoch": 75.05177111716621,
+ "grad_norm": 2.585761308670044,
+ "learning_rate": 3.0906311152456713e-06,
+ "loss": 0.0844,
+ "step": 27544
+ },
+ {
+ "epoch": 75.05449591280654,
+ "grad_norm": 2.6232521533966064,
+ "learning_rate": 3.0899931734693246e-06,
+ "loss": 0.1565,
+ "step": 27545
+ },
+ {
+ "epoch": 75.05722070844686,
+ "grad_norm": 2.5462450981140137,
+ "learning_rate": 3.089355285507891e-06,
+ "loss": 0.0682,
+ "step": 27546
+ },
+ {
+ "epoch": 75.0599455040872,
+ "grad_norm": 3.3379335403442383,
+ "learning_rate": 3.0887174513663376e-06,
+ "loss": 0.2347,
+ "step": 27547
+ },
+ {
+ "epoch": 75.06267029972751,
+ "grad_norm": 2.2917251586914062,
+ "learning_rate": 3.0880796710496287e-06,
+ "loss": 0.0336,
+ "step": 27548
+ },
+ {
+ "epoch": 75.06539509536785,
+ "grad_norm": 3.615720748901367,
+ "learning_rate": 3.08744194456273e-06,
+ "loss": 0.2591,
+ "step": 27549
+ },
+ {
+ "epoch": 75.06811989100818,
+ "grad_norm": 3.1300547122955322,
+ "learning_rate": 3.0868042719106152e-06,
+ "loss": 0.0327,
+ "step": 27550
+ },
+ {
+ "epoch": 75.0708446866485,
+ "grad_norm": 2.6372008323669434,
+ "learning_rate": 3.086166653098246e-06,
+ "loss": 0.1014,
+ "step": 27551
+ },
+ {
+ "epoch": 75.07356948228883,
+ "grad_norm": 5.758232593536377,
+ "learning_rate": 3.0855290881305845e-06,
+ "loss": 0.1821,
+ "step": 27552
+ },
+ {
+ "epoch": 75.07629427792915,
+ "grad_norm": 4.68319034576416,
+ "learning_rate": 3.084891577012603e-06,
+ "loss": 0.1471,
+ "step": 27553
+ },
+ {
+ "epoch": 75.07901907356948,
+ "grad_norm": 7.116035461425781,
+ "learning_rate": 3.0842541197492637e-06,
+ "loss": 0.1569,
+ "step": 27554
+ },
+ {
+ "epoch": 75.0817438692098,
+ "grad_norm": 3.22837495803833,
+ "learning_rate": 3.08361671634553e-06,
+ "loss": 0.0503,
+ "step": 27555
+ },
+ {
+ "epoch": 75.08446866485014,
+ "grad_norm": 3.4298107624053955,
+ "learning_rate": 3.0829793668063646e-06,
+ "loss": 0.059,
+ "step": 27556
+ },
+ {
+ "epoch": 75.08719346049047,
+ "grad_norm": 2.6836814880371094,
+ "learning_rate": 3.0823420711367322e-06,
+ "loss": 0.0687,
+ "step": 27557
+ },
+ {
+ "epoch": 75.08991825613079,
+ "grad_norm": 2.5157830715179443,
+ "learning_rate": 3.0817048293416017e-06,
+ "loss": 0.1594,
+ "step": 27558
+ },
+ {
+ "epoch": 75.09264305177112,
+ "grad_norm": 2.5752265453338623,
+ "learning_rate": 3.08106764142593e-06,
+ "loss": 0.0341,
+ "step": 27559
+ },
+ {
+ "epoch": 75.09536784741144,
+ "grad_norm": 3.477228879928589,
+ "learning_rate": 3.0804305073946818e-06,
+ "loss": 0.1307,
+ "step": 27560
+ },
+ {
+ "epoch": 75.09809264305177,
+ "grad_norm": 2.9757039546966553,
+ "learning_rate": 3.079793427252814e-06,
+ "loss": 0.1973,
+ "step": 27561
+ },
+ {
+ "epoch": 75.1008174386921,
+ "grad_norm": 2.4333109855651855,
+ "learning_rate": 3.0791564010052967e-06,
+ "loss": 0.0641,
+ "step": 27562
+ },
+ {
+ "epoch": 75.10354223433242,
+ "grad_norm": 6.196342468261719,
+ "learning_rate": 3.0785194286570854e-06,
+ "loss": 0.095,
+ "step": 27563
+ },
+ {
+ "epoch": 75.10626702997276,
+ "grad_norm": 2.131510019302368,
+ "learning_rate": 3.077882510213143e-06,
+ "loss": 0.0516,
+ "step": 27564
+ },
+ {
+ "epoch": 75.10899182561307,
+ "grad_norm": 3.1831939220428467,
+ "learning_rate": 3.077245645678425e-06,
+ "loss": 0.0906,
+ "step": 27565
+ },
+ {
+ "epoch": 75.11171662125341,
+ "grad_norm": 2.7010202407836914,
+ "learning_rate": 3.0766088350578984e-06,
+ "loss": 0.173,
+ "step": 27566
+ },
+ {
+ "epoch": 75.11444141689373,
+ "grad_norm": 4.274178504943848,
+ "learning_rate": 3.0759720783565196e-06,
+ "loss": 0.1548,
+ "step": 27567
+ },
+ {
+ "epoch": 75.11716621253406,
+ "grad_norm": 3.5782458782196045,
+ "learning_rate": 3.075335375579247e-06,
+ "loss": 0.0499,
+ "step": 27568
+ },
+ {
+ "epoch": 75.11989100817439,
+ "grad_norm": 2.65104079246521,
+ "learning_rate": 3.074698726731036e-06,
+ "loss": 0.2272,
+ "step": 27569
+ },
+ {
+ "epoch": 75.12261580381471,
+ "grad_norm": 3.3322086334228516,
+ "learning_rate": 3.074062131816853e-06,
+ "loss": 0.0595,
+ "step": 27570
+ },
+ {
+ "epoch": 75.12534059945504,
+ "grad_norm": 3.812431812286377,
+ "learning_rate": 3.07342559084165e-06,
+ "loss": 0.1319,
+ "step": 27571
+ },
+ {
+ "epoch": 75.12806539509536,
+ "grad_norm": 2.5226943492889404,
+ "learning_rate": 3.0727891038103865e-06,
+ "loss": 0.0484,
+ "step": 27572
+ },
+ {
+ "epoch": 75.1307901907357,
+ "grad_norm": 3.453836441040039,
+ "learning_rate": 3.0721526707280113e-06,
+ "loss": 0.0654,
+ "step": 27573
+ },
+ {
+ "epoch": 75.13351498637603,
+ "grad_norm": 2.5528485774993896,
+ "learning_rate": 3.0715162915994944e-06,
+ "loss": 0.0306,
+ "step": 27574
+ },
+ {
+ "epoch": 75.13623978201635,
+ "grad_norm": 2.835279703140259,
+ "learning_rate": 3.0708799664297863e-06,
+ "loss": 0.1264,
+ "step": 27575
+ },
+ {
+ "epoch": 75.13896457765668,
+ "grad_norm": 3.1006345748901367,
+ "learning_rate": 3.0702436952238412e-06,
+ "loss": 0.0411,
+ "step": 27576
+ },
+ {
+ "epoch": 75.141689373297,
+ "grad_norm": 4.25516414642334,
+ "learning_rate": 3.0696074779866127e-06,
+ "loss": 0.1298,
+ "step": 27577
+ },
+ {
+ "epoch": 75.14441416893733,
+ "grad_norm": 3.170030355453491,
+ "learning_rate": 3.0689713147230617e-06,
+ "loss": 0.0373,
+ "step": 27578
+ },
+ {
+ "epoch": 75.14713896457765,
+ "grad_norm": 2.772905111312866,
+ "learning_rate": 3.068335205438139e-06,
+ "loss": 0.0337,
+ "step": 27579
+ },
+ {
+ "epoch": 75.14986376021798,
+ "grad_norm": 2.9926319122314453,
+ "learning_rate": 3.067699150136797e-06,
+ "loss": 0.037,
+ "step": 27580
+ },
+ {
+ "epoch": 75.15258855585832,
+ "grad_norm": 5.851269245147705,
+ "learning_rate": 3.067063148823989e-06,
+ "loss": 0.0896,
+ "step": 27581
+ },
+ {
+ "epoch": 75.15531335149863,
+ "grad_norm": 3.1910886764526367,
+ "learning_rate": 3.0664272015046735e-06,
+ "loss": 0.0748,
+ "step": 27582
+ },
+ {
+ "epoch": 75.15803814713897,
+ "grad_norm": 2.5612995624542236,
+ "learning_rate": 3.0657913081837987e-06,
+ "loss": 0.0662,
+ "step": 27583
+ },
+ {
+ "epoch": 75.16076294277929,
+ "grad_norm": 2.8816475868225098,
+ "learning_rate": 3.0651554688663188e-06,
+ "loss": 0.0505,
+ "step": 27584
+ },
+ {
+ "epoch": 75.16348773841962,
+ "grad_norm": 3.678269624710083,
+ "learning_rate": 3.064519683557182e-06,
+ "loss": 0.0569,
+ "step": 27585
+ },
+ {
+ "epoch": 75.16621253405995,
+ "grad_norm": 3.733116626739502,
+ "learning_rate": 3.063883952261345e-06,
+ "loss": 0.1498,
+ "step": 27586
+ },
+ {
+ "epoch": 75.16893732970027,
+ "grad_norm": 2.7683281898498535,
+ "learning_rate": 3.0632482749837578e-06,
+ "loss": 0.1222,
+ "step": 27587
+ },
+ {
+ "epoch": 75.1716621253406,
+ "grad_norm": 3.418689012527466,
+ "learning_rate": 3.0626126517293686e-06,
+ "loss": 0.1271,
+ "step": 27588
+ },
+ {
+ "epoch": 75.17438692098092,
+ "grad_norm": 2.2630598545074463,
+ "learning_rate": 3.061977082503126e-06,
+ "loss": 0.0248,
+ "step": 27589
+ },
+ {
+ "epoch": 75.17711171662125,
+ "grad_norm": 3.1087136268615723,
+ "learning_rate": 3.0613415673099822e-06,
+ "loss": 0.0364,
+ "step": 27590
+ },
+ {
+ "epoch": 75.17983651226157,
+ "grad_norm": 2.079453945159912,
+ "learning_rate": 3.0607061061548902e-06,
+ "loss": 0.0803,
+ "step": 27591
+ },
+ {
+ "epoch": 75.1825613079019,
+ "grad_norm": 2.0259814262390137,
+ "learning_rate": 3.0600706990427966e-06,
+ "loss": 0.0543,
+ "step": 27592
+ },
+ {
+ "epoch": 75.18528610354224,
+ "grad_norm": 3.862144947052002,
+ "learning_rate": 3.0594353459786484e-06,
+ "loss": 0.1582,
+ "step": 27593
+ },
+ {
+ "epoch": 75.18801089918256,
+ "grad_norm": 3.890875816345215,
+ "learning_rate": 3.058800046967392e-06,
+ "loss": 0.0651,
+ "step": 27594
+ },
+ {
+ "epoch": 75.19073569482289,
+ "grad_norm": 3.464887857437134,
+ "learning_rate": 3.058164802013979e-06,
+ "loss": 0.0947,
+ "step": 27595
+ },
+ {
+ "epoch": 75.19346049046321,
+ "grad_norm": 4.630736827850342,
+ "learning_rate": 3.0575296111233567e-06,
+ "loss": 0.1276,
+ "step": 27596
+ },
+ {
+ "epoch": 75.19618528610354,
+ "grad_norm": 5.1742844581604,
+ "learning_rate": 3.056894474300466e-06,
+ "loss": 0.0518,
+ "step": 27597
+ },
+ {
+ "epoch": 75.19891008174388,
+ "grad_norm": 3.2487473487854004,
+ "learning_rate": 3.0562593915502614e-06,
+ "loss": 0.068,
+ "step": 27598
+ },
+ {
+ "epoch": 75.2016348773842,
+ "grad_norm": 2.2730767726898193,
+ "learning_rate": 3.055624362877685e-06,
+ "loss": 0.037,
+ "step": 27599
+ },
+ {
+ "epoch": 75.20435967302453,
+ "grad_norm": 2.942718982696533,
+ "learning_rate": 3.0549893882876825e-06,
+ "loss": 0.0358,
+ "step": 27600
+ },
+ {
+ "epoch": 75.20708446866485,
+ "grad_norm": 3.3944926261901855,
+ "learning_rate": 3.0543544677851953e-06,
+ "loss": 0.0327,
+ "step": 27601
+ },
+ {
+ "epoch": 75.20980926430518,
+ "grad_norm": 2.9558629989624023,
+ "learning_rate": 3.0537196013751767e-06,
+ "loss": 0.1034,
+ "step": 27602
+ },
+ {
+ "epoch": 75.2125340599455,
+ "grad_norm": 2.820882558822632,
+ "learning_rate": 3.0530847890625646e-06,
+ "loss": 0.0258,
+ "step": 27603
+ },
+ {
+ "epoch": 75.21525885558583,
+ "grad_norm": 2.4985244274139404,
+ "learning_rate": 3.0524500308523064e-06,
+ "loss": 0.0382,
+ "step": 27604
+ },
+ {
+ "epoch": 75.21798365122616,
+ "grad_norm": 2.783466339111328,
+ "learning_rate": 3.0518153267493388e-06,
+ "loss": 0.1242,
+ "step": 27605
+ },
+ {
+ "epoch": 75.22070844686648,
+ "grad_norm": 2.2642557621002197,
+ "learning_rate": 3.051180676758614e-06,
+ "loss": 0.0503,
+ "step": 27606
+ },
+ {
+ "epoch": 75.22343324250681,
+ "grad_norm": 3.5770883560180664,
+ "learning_rate": 3.0505460808850674e-06,
+ "loss": 0.046,
+ "step": 27607
+ },
+ {
+ "epoch": 75.22615803814713,
+ "grad_norm": 2.408412456512451,
+ "learning_rate": 3.0499115391336464e-06,
+ "loss": 0.0304,
+ "step": 27608
+ },
+ {
+ "epoch": 75.22888283378747,
+ "grad_norm": 3.0149154663085938,
+ "learning_rate": 3.0492770515092917e-06,
+ "loss": 0.083,
+ "step": 27609
+ },
+ {
+ "epoch": 75.2316076294278,
+ "grad_norm": 1.9410196542739868,
+ "learning_rate": 3.0486426180169404e-06,
+ "loss": 0.0279,
+ "step": 27610
+ },
+ {
+ "epoch": 75.23433242506812,
+ "grad_norm": 2.15051007270813,
+ "learning_rate": 3.0480082386615394e-06,
+ "loss": 0.0249,
+ "step": 27611
+ },
+ {
+ "epoch": 75.23705722070845,
+ "grad_norm": 2.653397560119629,
+ "learning_rate": 3.047373913448026e-06,
+ "loss": 0.0563,
+ "step": 27612
+ },
+ {
+ "epoch": 75.23978201634877,
+ "grad_norm": 2.4434974193573,
+ "learning_rate": 3.0467396423813423e-06,
+ "loss": 0.0385,
+ "step": 27613
+ },
+ {
+ "epoch": 75.2425068119891,
+ "grad_norm": 4.21658992767334,
+ "learning_rate": 3.0461054254664225e-06,
+ "loss": 0.0706,
+ "step": 27614
+ },
+ {
+ "epoch": 75.24523160762942,
+ "grad_norm": 2.064725875854492,
+ "learning_rate": 3.0454712627082128e-06,
+ "loss": 0.0735,
+ "step": 27615
+ },
+ {
+ "epoch": 75.24795640326975,
+ "grad_norm": 3.525247573852539,
+ "learning_rate": 3.044837154111648e-06,
+ "loss": 0.0584,
+ "step": 27616
+ },
+ {
+ "epoch": 75.25068119891009,
+ "grad_norm": 2.2720861434936523,
+ "learning_rate": 3.044203099681666e-06,
+ "loss": 0.0968,
+ "step": 27617
+ },
+ {
+ "epoch": 75.2534059945504,
+ "grad_norm": 3.067094326019287,
+ "learning_rate": 3.043569099423209e-06,
+ "loss": 0.0601,
+ "step": 27618
+ },
+ {
+ "epoch": 75.25613079019074,
+ "grad_norm": 5.3943772315979,
+ "learning_rate": 3.042935153341212e-06,
+ "loss": 0.0832,
+ "step": 27619
+ },
+ {
+ "epoch": 75.25885558583106,
+ "grad_norm": 4.334679126739502,
+ "learning_rate": 3.042301261440612e-06,
+ "loss": 0.1378,
+ "step": 27620
+ },
+ {
+ "epoch": 75.26158038147139,
+ "grad_norm": 2.4944615364074707,
+ "learning_rate": 3.041667423726343e-06,
+ "loss": 0.031,
+ "step": 27621
+ },
+ {
+ "epoch": 75.26430517711172,
+ "grad_norm": 5.525595188140869,
+ "learning_rate": 3.041033640203348e-06,
+ "loss": 0.0374,
+ "step": 27622
+ },
+ {
+ "epoch": 75.26702997275204,
+ "grad_norm": 3.597632646560669,
+ "learning_rate": 3.040399910876558e-06,
+ "loss": 0.0563,
+ "step": 27623
+ },
+ {
+ "epoch": 75.26975476839237,
+ "grad_norm": 2.9683830738067627,
+ "learning_rate": 3.039766235750907e-06,
+ "loss": 0.1118,
+ "step": 27624
+ },
+ {
+ "epoch": 75.2724795640327,
+ "grad_norm": 3.4934754371643066,
+ "learning_rate": 3.039132614831335e-06,
+ "loss": 0.0343,
+ "step": 27625
+ },
+ {
+ "epoch": 75.27520435967303,
+ "grad_norm": 2.8926949501037598,
+ "learning_rate": 3.0384990481227716e-06,
+ "loss": 0.0251,
+ "step": 27626
+ },
+ {
+ "epoch": 75.27792915531334,
+ "grad_norm": 2.601649045944214,
+ "learning_rate": 3.0378655356301554e-06,
+ "loss": 0.1234,
+ "step": 27627
+ },
+ {
+ "epoch": 75.28065395095368,
+ "grad_norm": 3.4047579765319824,
+ "learning_rate": 3.0372320773584196e-06,
+ "loss": 0.1368,
+ "step": 27628
+ },
+ {
+ "epoch": 75.28337874659401,
+ "grad_norm": 3.0398342609405518,
+ "learning_rate": 3.0365986733124963e-06,
+ "loss": 0.0831,
+ "step": 27629
+ },
+ {
+ "epoch": 75.28610354223433,
+ "grad_norm": 2.6498756408691406,
+ "learning_rate": 3.0359653234973154e-06,
+ "loss": 0.0872,
+ "step": 27630
+ },
+ {
+ "epoch": 75.28882833787466,
+ "grad_norm": 2.3392951488494873,
+ "learning_rate": 3.0353320279178146e-06,
+ "loss": 0.026,
+ "step": 27631
+ },
+ {
+ "epoch": 75.29155313351498,
+ "grad_norm": 3.178831100463867,
+ "learning_rate": 3.0346987865789245e-06,
+ "loss": 0.0377,
+ "step": 27632
+ },
+ {
+ "epoch": 75.29427792915531,
+ "grad_norm": 2.388498544692993,
+ "learning_rate": 3.034065599485576e-06,
+ "loss": 0.0193,
+ "step": 27633
+ },
+ {
+ "epoch": 75.29700272479565,
+ "grad_norm": 2.380526304244995,
+ "learning_rate": 3.033432466642697e-06,
+ "loss": 0.0348,
+ "step": 27634
+ },
+ {
+ "epoch": 75.29972752043597,
+ "grad_norm": 3.2772305011749268,
+ "learning_rate": 3.032799388055225e-06,
+ "loss": 0.0394,
+ "step": 27635
+ },
+ {
+ "epoch": 75.3024523160763,
+ "grad_norm": 2.7993104457855225,
+ "learning_rate": 3.0321663637280875e-06,
+ "loss": 0.1427,
+ "step": 27636
+ },
+ {
+ "epoch": 75.30517711171662,
+ "grad_norm": 1.7309693098068237,
+ "learning_rate": 3.031533393666214e-06,
+ "loss": 0.0159,
+ "step": 27637
+ },
+ {
+ "epoch": 75.30790190735695,
+ "grad_norm": 2.8570635318756104,
+ "learning_rate": 3.030900477874531e-06,
+ "loss": 0.0799,
+ "step": 27638
+ },
+ {
+ "epoch": 75.31062670299727,
+ "grad_norm": 4.14675235748291,
+ "learning_rate": 3.0302676163579738e-06,
+ "loss": 0.0627,
+ "step": 27639
+ },
+ {
+ "epoch": 75.3133514986376,
+ "grad_norm": 2.1780340671539307,
+ "learning_rate": 3.0296348091214676e-06,
+ "loss": 0.0623,
+ "step": 27640
+ },
+ {
+ "epoch": 75.31607629427793,
+ "grad_norm": 2.5636348724365234,
+ "learning_rate": 3.0290020561699385e-06,
+ "loss": 0.054,
+ "step": 27641
+ },
+ {
+ "epoch": 75.31880108991825,
+ "grad_norm": 2.5974178314208984,
+ "learning_rate": 3.0283693575083174e-06,
+ "loss": 0.0677,
+ "step": 27642
+ },
+ {
+ "epoch": 75.32152588555859,
+ "grad_norm": 1.8714269399642944,
+ "learning_rate": 3.0277367131415336e-06,
+ "loss": 0.0333,
+ "step": 27643
+ },
+ {
+ "epoch": 75.3242506811989,
+ "grad_norm": 3.2616562843322754,
+ "learning_rate": 3.0271041230745122e-06,
+ "loss": 0.0676,
+ "step": 27644
+ },
+ {
+ "epoch": 75.32697547683924,
+ "grad_norm": 2.9135024547576904,
+ "learning_rate": 3.0264715873121796e-06,
+ "loss": 0.1273,
+ "step": 27645
+ },
+ {
+ "epoch": 75.32970027247957,
+ "grad_norm": 2.4170942306518555,
+ "learning_rate": 3.0258391058594595e-06,
+ "loss": 0.031,
+ "step": 27646
+ },
+ {
+ "epoch": 75.33242506811989,
+ "grad_norm": 2.555218458175659,
+ "learning_rate": 3.0252066787212817e-06,
+ "loss": 0.0245,
+ "step": 27647
+ },
+ {
+ "epoch": 75.33514986376022,
+ "grad_norm": 3.3662526607513428,
+ "learning_rate": 3.0245743059025713e-06,
+ "loss": 0.0355,
+ "step": 27648
+ },
+ {
+ "epoch": 75.33787465940054,
+ "grad_norm": 3.288583517074585,
+ "learning_rate": 3.023941987408251e-06,
+ "loss": 0.0867,
+ "step": 27649
+ },
+ {
+ "epoch": 75.34059945504087,
+ "grad_norm": 2.092853307723999,
+ "learning_rate": 3.0233097232432417e-06,
+ "loss": 0.0334,
+ "step": 27650
+ },
+ {
+ "epoch": 75.34332425068119,
+ "grad_norm": 2.833671808242798,
+ "learning_rate": 3.022677513412476e-06,
+ "loss": 0.0348,
+ "step": 27651
+ },
+ {
+ "epoch": 75.34604904632153,
+ "grad_norm": 2.574719190597534,
+ "learning_rate": 3.022045357920873e-06,
+ "loss": 0.0339,
+ "step": 27652
+ },
+ {
+ "epoch": 75.34877384196186,
+ "grad_norm": 2.987471342086792,
+ "learning_rate": 3.0214132567733565e-06,
+ "loss": 0.0458,
+ "step": 27653
+ },
+ {
+ "epoch": 75.35149863760218,
+ "grad_norm": 2.910118341445923,
+ "learning_rate": 3.020781209974846e-06,
+ "loss": 0.0943,
+ "step": 27654
+ },
+ {
+ "epoch": 75.35422343324251,
+ "grad_norm": 2.1420702934265137,
+ "learning_rate": 3.0201492175302695e-06,
+ "loss": 0.0319,
+ "step": 27655
+ },
+ {
+ "epoch": 75.35694822888283,
+ "grad_norm": 2.2705018520355225,
+ "learning_rate": 3.019517279444546e-06,
+ "loss": 0.038,
+ "step": 27656
+ },
+ {
+ "epoch": 75.35967302452316,
+ "grad_norm": 3.6899421215057373,
+ "learning_rate": 3.0188853957225984e-06,
+ "loss": 0.1614,
+ "step": 27657
+ },
+ {
+ "epoch": 75.3623978201635,
+ "grad_norm": 3.608517646789551,
+ "learning_rate": 3.0182535663693422e-06,
+ "loss": 0.0713,
+ "step": 27658
+ },
+ {
+ "epoch": 75.36512261580381,
+ "grad_norm": 4.432520389556885,
+ "learning_rate": 3.0176217913897034e-06,
+ "loss": 0.0383,
+ "step": 27659
+ },
+ {
+ "epoch": 75.36784741144415,
+ "grad_norm": 3.134857416152954,
+ "learning_rate": 3.0169900707886036e-06,
+ "loss": 0.0288,
+ "step": 27660
+ },
+ {
+ "epoch": 75.37057220708446,
+ "grad_norm": 2.952052116394043,
+ "learning_rate": 3.0163584045709615e-06,
+ "loss": 0.0445,
+ "step": 27661
+ },
+ {
+ "epoch": 75.3732970027248,
+ "grad_norm": 3.3065953254699707,
+ "learning_rate": 3.0157267927416912e-06,
+ "loss": 0.0955,
+ "step": 27662
+ },
+ {
+ "epoch": 75.37602179836512,
+ "grad_norm": 17.400815963745117,
+ "learning_rate": 3.0150952353057195e-06,
+ "loss": 0.038,
+ "step": 27663
+ },
+ {
+ "epoch": 75.37874659400545,
+ "grad_norm": 2.445208787918091,
+ "learning_rate": 3.0144637322679617e-06,
+ "loss": 0.0956,
+ "step": 27664
+ },
+ {
+ "epoch": 75.38147138964578,
+ "grad_norm": 3.191053867340088,
+ "learning_rate": 3.0138322836333343e-06,
+ "loss": 0.09,
+ "step": 27665
+ },
+ {
+ "epoch": 75.3841961852861,
+ "grad_norm": 3.7337753772735596,
+ "learning_rate": 3.0132008894067545e-06,
+ "loss": 0.0848,
+ "step": 27666
+ },
+ {
+ "epoch": 75.38692098092643,
+ "grad_norm": 14.248208045959473,
+ "learning_rate": 3.012569549593143e-06,
+ "loss": 0.062,
+ "step": 27667
+ },
+ {
+ "epoch": 75.38964577656675,
+ "grad_norm": 3.1568360328674316,
+ "learning_rate": 3.011938264197416e-06,
+ "loss": 0.052,
+ "step": 27668
+ },
+ {
+ "epoch": 75.39237057220708,
+ "grad_norm": 4.756346702575684,
+ "learning_rate": 3.0113070332244886e-06,
+ "loss": 0.0316,
+ "step": 27669
+ },
+ {
+ "epoch": 75.39509536784742,
+ "grad_norm": 3.052743673324585,
+ "learning_rate": 3.0106758566792737e-06,
+ "loss": 0.2044,
+ "step": 27670
+ },
+ {
+ "epoch": 75.39782016348774,
+ "grad_norm": 3.078798770904541,
+ "learning_rate": 3.0100447345666937e-06,
+ "loss": 0.0694,
+ "step": 27671
+ },
+ {
+ "epoch": 75.40054495912807,
+ "grad_norm": 2.136767864227295,
+ "learning_rate": 3.0094136668916607e-06,
+ "loss": 0.067,
+ "step": 27672
+ },
+ {
+ "epoch": 75.40326975476839,
+ "grad_norm": 3.910614490509033,
+ "learning_rate": 3.008782653659089e-06,
+ "loss": 0.0602,
+ "step": 27673
+ },
+ {
+ "epoch": 75.40599455040872,
+ "grad_norm": 2.9418959617614746,
+ "learning_rate": 3.0081516948738887e-06,
+ "loss": 0.0776,
+ "step": 27674
+ },
+ {
+ "epoch": 75.40871934604904,
+ "grad_norm": 3.3807084560394287,
+ "learning_rate": 3.007520790540982e-06,
+ "loss": 0.0402,
+ "step": 27675
+ },
+ {
+ "epoch": 75.41144414168937,
+ "grad_norm": 3.7821102142333984,
+ "learning_rate": 3.0068899406652752e-06,
+ "loss": 0.0484,
+ "step": 27676
+ },
+ {
+ "epoch": 75.4141689373297,
+ "grad_norm": 2.784954309463501,
+ "learning_rate": 3.0062591452516876e-06,
+ "loss": 0.0745,
+ "step": 27677
+ },
+ {
+ "epoch": 75.41689373297002,
+ "grad_norm": 2.7617006301879883,
+ "learning_rate": 3.0056284043051286e-06,
+ "loss": 0.0839,
+ "step": 27678
+ },
+ {
+ "epoch": 75.41961852861036,
+ "grad_norm": 6.001311779022217,
+ "learning_rate": 3.004997717830508e-06,
+ "loss": 0.0457,
+ "step": 27679
+ },
+ {
+ "epoch": 75.42234332425068,
+ "grad_norm": 3.061800241470337,
+ "learning_rate": 3.004367085832742e-06,
+ "loss": 0.0797,
+ "step": 27680
+ },
+ {
+ "epoch": 75.42506811989101,
+ "grad_norm": 2.0810399055480957,
+ "learning_rate": 3.0037365083167404e-06,
+ "loss": 0.0618,
+ "step": 27681
+ },
+ {
+ "epoch": 75.42779291553134,
+ "grad_norm": 2.682482957839966,
+ "learning_rate": 3.003105985287411e-06,
+ "loss": 0.0948,
+ "step": 27682
+ },
+ {
+ "epoch": 75.43051771117166,
+ "grad_norm": 3.283461570739746,
+ "learning_rate": 3.00247551674967e-06,
+ "loss": 0.0921,
+ "step": 27683
+ },
+ {
+ "epoch": 75.433242506812,
+ "grad_norm": 3.275836229324341,
+ "learning_rate": 3.0018451027084238e-06,
+ "loss": 0.0941,
+ "step": 27684
+ },
+ {
+ "epoch": 75.43596730245231,
+ "grad_norm": 2.952338218688965,
+ "learning_rate": 3.0012147431685832e-06,
+ "loss": 0.0492,
+ "step": 27685
+ },
+ {
+ "epoch": 75.43869209809264,
+ "grad_norm": 2.4903459548950195,
+ "learning_rate": 3.0005844381350545e-06,
+ "loss": 0.0975,
+ "step": 27686
+ },
+ {
+ "epoch": 75.44141689373296,
+ "grad_norm": 2.38456130027771,
+ "learning_rate": 2.9999541876127513e-06,
+ "loss": 0.0465,
+ "step": 27687
+ },
+ {
+ "epoch": 75.4441416893733,
+ "grad_norm": 2.847486972808838,
+ "learning_rate": 2.99932399160658e-06,
+ "loss": 0.2217,
+ "step": 27688
+ },
+ {
+ "epoch": 75.44686648501363,
+ "grad_norm": 2.646130323410034,
+ "learning_rate": 2.998693850121447e-06,
+ "loss": 0.1184,
+ "step": 27689
+ },
+ {
+ "epoch": 75.44959128065395,
+ "grad_norm": 2.516571044921875,
+ "learning_rate": 2.998063763162259e-06,
+ "loss": 0.0384,
+ "step": 27690
+ },
+ {
+ "epoch": 75.45231607629428,
+ "grad_norm": 2.517336368560791,
+ "learning_rate": 2.9974337307339274e-06,
+ "loss": 0.0426,
+ "step": 27691
+ },
+ {
+ "epoch": 75.4550408719346,
+ "grad_norm": 3.6232411861419678,
+ "learning_rate": 2.9968037528413573e-06,
+ "loss": 0.0533,
+ "step": 27692
+ },
+ {
+ "epoch": 75.45776566757493,
+ "grad_norm": 3.2437920570373535,
+ "learning_rate": 2.9961738294894504e-06,
+ "loss": 0.0405,
+ "step": 27693
+ },
+ {
+ "epoch": 75.46049046321527,
+ "grad_norm": 3.5633132457733154,
+ "learning_rate": 2.9955439606831195e-06,
+ "loss": 0.1422,
+ "step": 27694
+ },
+ {
+ "epoch": 75.46321525885558,
+ "grad_norm": 3.4561767578125,
+ "learning_rate": 2.9949141464272635e-06,
+ "loss": 0.0347,
+ "step": 27695
+ },
+ {
+ "epoch": 75.46594005449592,
+ "grad_norm": 3.184873580932617,
+ "learning_rate": 2.9942843867267947e-06,
+ "loss": 0.0481,
+ "step": 27696
+ },
+ {
+ "epoch": 75.46866485013624,
+ "grad_norm": 2.4604759216308594,
+ "learning_rate": 2.993654681586613e-06,
+ "loss": 0.0634,
+ "step": 27697
+ },
+ {
+ "epoch": 75.47138964577657,
+ "grad_norm": 2.241732120513916,
+ "learning_rate": 2.993025031011623e-06,
+ "loss": 0.0384,
+ "step": 27698
+ },
+ {
+ "epoch": 75.47411444141689,
+ "grad_norm": 2.451686382293701,
+ "learning_rate": 2.9923954350067263e-06,
+ "loss": 0.149,
+ "step": 27699
+ },
+ {
+ "epoch": 75.47683923705722,
+ "grad_norm": 2.762377977371216,
+ "learning_rate": 2.99176589357683e-06,
+ "loss": 0.1074,
+ "step": 27700
+ },
+ {
+ "epoch": 75.47956403269755,
+ "grad_norm": 3.2475740909576416,
+ "learning_rate": 2.9911364067268366e-06,
+ "loss": 0.027,
+ "step": 27701
+ },
+ {
+ "epoch": 75.48228882833787,
+ "grad_norm": 4.86683988571167,
+ "learning_rate": 2.9905069744616466e-06,
+ "loss": 0.0376,
+ "step": 27702
+ },
+ {
+ "epoch": 75.4850136239782,
+ "grad_norm": 1.99662446975708,
+ "learning_rate": 2.9898775967861605e-06,
+ "loss": 0.0282,
+ "step": 27703
+ },
+ {
+ "epoch": 75.48773841961852,
+ "grad_norm": 3.2977609634399414,
+ "learning_rate": 2.9892482737052843e-06,
+ "loss": 0.0354,
+ "step": 27704
+ },
+ {
+ "epoch": 75.49046321525886,
+ "grad_norm": 1.8643726110458374,
+ "learning_rate": 2.9886190052239173e-06,
+ "loss": 0.029,
+ "step": 27705
+ },
+ {
+ "epoch": 75.49318801089919,
+ "grad_norm": 2.6245758533477783,
+ "learning_rate": 2.987989791346957e-06,
+ "loss": 0.1093,
+ "step": 27706
+ },
+ {
+ "epoch": 75.49591280653951,
+ "grad_norm": 1.6000523567199707,
+ "learning_rate": 2.987360632079308e-06,
+ "loss": 0.0178,
+ "step": 27707
+ },
+ {
+ "epoch": 75.49863760217984,
+ "grad_norm": 2.616818428039551,
+ "learning_rate": 2.98673152742587e-06,
+ "loss": 0.0347,
+ "step": 27708
+ },
+ {
+ "epoch": 75.50136239782016,
+ "grad_norm": 2.732534408569336,
+ "learning_rate": 2.9861024773915415e-06,
+ "loss": 0.0381,
+ "step": 27709
+ },
+ {
+ "epoch": 75.50408719346049,
+ "grad_norm": 2.3392136096954346,
+ "learning_rate": 2.985473481981218e-06,
+ "loss": 0.0285,
+ "step": 27710
+ },
+ {
+ "epoch": 75.50681198910081,
+ "grad_norm": 2.6736907958984375,
+ "learning_rate": 2.9848445411998006e-06,
+ "loss": 0.0343,
+ "step": 27711
+ },
+ {
+ "epoch": 75.50953678474114,
+ "grad_norm": 4.17382287979126,
+ "learning_rate": 2.9842156550521915e-06,
+ "loss": 0.2088,
+ "step": 27712
+ },
+ {
+ "epoch": 75.51226158038148,
+ "grad_norm": 3.360193967819214,
+ "learning_rate": 2.983586823543285e-06,
+ "loss": 0.0765,
+ "step": 27713
+ },
+ {
+ "epoch": 75.5149863760218,
+ "grad_norm": 5.581449031829834,
+ "learning_rate": 2.9829580466779784e-06,
+ "loss": 0.1318,
+ "step": 27714
+ },
+ {
+ "epoch": 75.51771117166213,
+ "grad_norm": 2.783514976501465,
+ "learning_rate": 2.982329324461166e-06,
+ "loss": 0.0382,
+ "step": 27715
+ },
+ {
+ "epoch": 75.52043596730245,
+ "grad_norm": 5.091421604156494,
+ "learning_rate": 2.981700656897749e-06,
+ "loss": 0.1542,
+ "step": 27716
+ },
+ {
+ "epoch": 75.52316076294278,
+ "grad_norm": 2.9237117767333984,
+ "learning_rate": 2.981072043992623e-06,
+ "loss": 0.1121,
+ "step": 27717
+ },
+ {
+ "epoch": 75.52588555858311,
+ "grad_norm": 2.1351101398468018,
+ "learning_rate": 2.9804434857506816e-06,
+ "loss": 0.0408,
+ "step": 27718
+ },
+ {
+ "epoch": 75.52861035422343,
+ "grad_norm": 2.7612287998199463,
+ "learning_rate": 2.979814982176816e-06,
+ "loss": 0.0926,
+ "step": 27719
+ },
+ {
+ "epoch": 75.53133514986376,
+ "grad_norm": 3.3539750576019287,
+ "learning_rate": 2.9791865332759294e-06,
+ "loss": 0.1746,
+ "step": 27720
+ },
+ {
+ "epoch": 75.53405994550408,
+ "grad_norm": 3.053982734680176,
+ "learning_rate": 2.978558139052913e-06,
+ "loss": 0.0992,
+ "step": 27721
+ },
+ {
+ "epoch": 75.53678474114442,
+ "grad_norm": 2.8916139602661133,
+ "learning_rate": 2.9779297995126587e-06,
+ "loss": 0.1357,
+ "step": 27722
+ },
+ {
+ "epoch": 75.53950953678473,
+ "grad_norm": 3.015062093734741,
+ "learning_rate": 2.977301514660058e-06,
+ "loss": 0.049,
+ "step": 27723
+ },
+ {
+ "epoch": 75.54223433242507,
+ "grad_norm": 2.5487701892852783,
+ "learning_rate": 2.97667328450001e-06,
+ "loss": 0.0358,
+ "step": 27724
+ },
+ {
+ "epoch": 75.5449591280654,
+ "grad_norm": 2.8236160278320312,
+ "learning_rate": 2.9760451090374054e-06,
+ "loss": 0.1336,
+ "step": 27725
+ },
+ {
+ "epoch": 75.54768392370572,
+ "grad_norm": 2.3216240406036377,
+ "learning_rate": 2.9754169882771324e-06,
+ "loss": 0.0232,
+ "step": 27726
+ },
+ {
+ "epoch": 75.55040871934605,
+ "grad_norm": 2.9198029041290283,
+ "learning_rate": 2.9747889222240878e-06,
+ "loss": 0.1321,
+ "step": 27727
+ },
+ {
+ "epoch": 75.55313351498637,
+ "grad_norm": 2.4257829189300537,
+ "learning_rate": 2.974160910883158e-06,
+ "loss": 0.0457,
+ "step": 27728
+ },
+ {
+ "epoch": 75.5558583106267,
+ "grad_norm": 2.857954740524292,
+ "learning_rate": 2.9735329542592407e-06,
+ "loss": 0.0479,
+ "step": 27729
+ },
+ {
+ "epoch": 75.55858310626704,
+ "grad_norm": 2.7027206420898438,
+ "learning_rate": 2.9729050523572222e-06,
+ "loss": 0.0682,
+ "step": 27730
+ },
+ {
+ "epoch": 75.56130790190736,
+ "grad_norm": 3.273747205734253,
+ "learning_rate": 2.9722772051819902e-06,
+ "loss": 0.0833,
+ "step": 27731
+ },
+ {
+ "epoch": 75.56403269754769,
+ "grad_norm": 3.459521770477295,
+ "learning_rate": 2.9716494127384397e-06,
+ "loss": 0.2134,
+ "step": 27732
+ },
+ {
+ "epoch": 75.566757493188,
+ "grad_norm": 2.729978084564209,
+ "learning_rate": 2.971021675031458e-06,
+ "loss": 0.038,
+ "step": 27733
+ },
+ {
+ "epoch": 75.56948228882834,
+ "grad_norm": 3.5037550926208496,
+ "learning_rate": 2.9703939920659332e-06,
+ "loss": 0.0571,
+ "step": 27734
+ },
+ {
+ "epoch": 75.57220708446866,
+ "grad_norm": 2.6768691539764404,
+ "learning_rate": 2.96976636384675e-06,
+ "loss": 0.1088,
+ "step": 27735
+ },
+ {
+ "epoch": 75.57493188010899,
+ "grad_norm": 2.6828341484069824,
+ "learning_rate": 2.9691387903788037e-06,
+ "loss": 0.0492,
+ "step": 27736
+ },
+ {
+ "epoch": 75.57765667574932,
+ "grad_norm": 3.8994791507720947,
+ "learning_rate": 2.9685112716669783e-06,
+ "loss": 0.0544,
+ "step": 27737
+ },
+ {
+ "epoch": 75.58038147138964,
+ "grad_norm": 2.9792799949645996,
+ "learning_rate": 2.967883807716161e-06,
+ "loss": 0.1784,
+ "step": 27738
+ },
+ {
+ "epoch": 75.58310626702998,
+ "grad_norm": 3.3979854583740234,
+ "learning_rate": 2.967256398531234e-06,
+ "loss": 0.1164,
+ "step": 27739
+ },
+ {
+ "epoch": 75.5858310626703,
+ "grad_norm": 3.6894583702087402,
+ "learning_rate": 2.966629044117092e-06,
+ "loss": 0.137,
+ "step": 27740
+ },
+ {
+ "epoch": 75.58855585831063,
+ "grad_norm": 3.2741520404815674,
+ "learning_rate": 2.966001744478616e-06,
+ "loss": 0.0805,
+ "step": 27741
+ },
+ {
+ "epoch": 75.59128065395096,
+ "grad_norm": 2.296541690826416,
+ "learning_rate": 2.9653744996206926e-06,
+ "loss": 0.0402,
+ "step": 27742
+ },
+ {
+ "epoch": 75.59400544959128,
+ "grad_norm": 4.692990779876709,
+ "learning_rate": 2.964747309548203e-06,
+ "loss": 0.0397,
+ "step": 27743
+ },
+ {
+ "epoch": 75.59673024523161,
+ "grad_norm": 3.9447741508483887,
+ "learning_rate": 2.9641201742660376e-06,
+ "loss": 0.1126,
+ "step": 27744
+ },
+ {
+ "epoch": 75.59945504087193,
+ "grad_norm": 2.402883529663086,
+ "learning_rate": 2.963493093779075e-06,
+ "loss": 0.105,
+ "step": 27745
+ },
+ {
+ "epoch": 75.60217983651226,
+ "grad_norm": 8.863261222839355,
+ "learning_rate": 2.962866068092205e-06,
+ "loss": 0.057,
+ "step": 27746
+ },
+ {
+ "epoch": 75.60490463215258,
+ "grad_norm": 2.721849203109741,
+ "learning_rate": 2.9622390972103043e-06,
+ "loss": 0.0706,
+ "step": 27747
+ },
+ {
+ "epoch": 75.60762942779292,
+ "grad_norm": 2.285156726837158,
+ "learning_rate": 2.9616121811382626e-06,
+ "loss": 0.0397,
+ "step": 27748
+ },
+ {
+ "epoch": 75.61035422343325,
+ "grad_norm": 2.971112012863159,
+ "learning_rate": 2.9609853198809578e-06,
+ "loss": 0.0477,
+ "step": 27749
+ },
+ {
+ "epoch": 75.61307901907357,
+ "grad_norm": 3.614335536956787,
+ "learning_rate": 2.9603585134432733e-06,
+ "loss": 0.1705,
+ "step": 27750
+ },
+ {
+ "epoch": 75.6158038147139,
+ "grad_norm": 3.1232776641845703,
+ "learning_rate": 2.959731761830087e-06,
+ "loss": 0.0841,
+ "step": 27751
+ },
+ {
+ "epoch": 75.61852861035422,
+ "grad_norm": 1.7605881690979004,
+ "learning_rate": 2.959105065046286e-06,
+ "loss": 0.0292,
+ "step": 27752
+ },
+ {
+ "epoch": 75.62125340599455,
+ "grad_norm": 2.2683191299438477,
+ "learning_rate": 2.958478423096748e-06,
+ "loss": 0.0318,
+ "step": 27753
+ },
+ {
+ "epoch": 75.62397820163488,
+ "grad_norm": 2.2947306632995605,
+ "learning_rate": 2.9578518359863537e-06,
+ "loss": 0.0449,
+ "step": 27754
+ },
+ {
+ "epoch": 75.6267029972752,
+ "grad_norm": 2.4742581844329834,
+ "learning_rate": 2.9572253037199795e-06,
+ "loss": 0.0302,
+ "step": 27755
+ },
+ {
+ "epoch": 75.62942779291554,
+ "grad_norm": 2.044041633605957,
+ "learning_rate": 2.9565988263025114e-06,
+ "loss": 0.1055,
+ "step": 27756
+ },
+ {
+ "epoch": 75.63215258855585,
+ "grad_norm": 2.1931862831115723,
+ "learning_rate": 2.955972403738825e-06,
+ "loss": 0.0292,
+ "step": 27757
+ },
+ {
+ "epoch": 75.63487738419619,
+ "grad_norm": 2.2893283367156982,
+ "learning_rate": 2.9553460360337983e-06,
+ "loss": 0.0285,
+ "step": 27758
+ },
+ {
+ "epoch": 75.6376021798365,
+ "grad_norm": 3.866868734359741,
+ "learning_rate": 2.9547197231923065e-06,
+ "loss": 0.0428,
+ "step": 27759
+ },
+ {
+ "epoch": 75.64032697547684,
+ "grad_norm": 2.8351898193359375,
+ "learning_rate": 2.9540934652192343e-06,
+ "loss": 0.03,
+ "step": 27760
+ },
+ {
+ "epoch": 75.64305177111717,
+ "grad_norm": 3.13128399848938,
+ "learning_rate": 2.953467262119456e-06,
+ "loss": 0.1227,
+ "step": 27761
+ },
+ {
+ "epoch": 75.64577656675749,
+ "grad_norm": 2.306823492050171,
+ "learning_rate": 2.952841113897844e-06,
+ "loss": 0.0343,
+ "step": 27762
+ },
+ {
+ "epoch": 75.64850136239782,
+ "grad_norm": 3.6572632789611816,
+ "learning_rate": 2.9522150205592825e-06,
+ "loss": 0.0845,
+ "step": 27763
+ },
+ {
+ "epoch": 75.65122615803814,
+ "grad_norm": 3.499213457107544,
+ "learning_rate": 2.9515889821086395e-06,
+ "loss": 0.0363,
+ "step": 27764
+ },
+ {
+ "epoch": 75.65395095367847,
+ "grad_norm": 2.911710262298584,
+ "learning_rate": 2.950962998550798e-06,
+ "loss": 0.0303,
+ "step": 27765
+ },
+ {
+ "epoch": 75.65667574931881,
+ "grad_norm": 2.25347638130188,
+ "learning_rate": 2.9503370698906298e-06,
+ "loss": 0.026,
+ "step": 27766
+ },
+ {
+ "epoch": 75.65940054495913,
+ "grad_norm": 2.3659725189208984,
+ "learning_rate": 2.9497111961330103e-06,
+ "loss": 0.0445,
+ "step": 27767
+ },
+ {
+ "epoch": 75.66212534059946,
+ "grad_norm": 3.2874715328216553,
+ "learning_rate": 2.94908537728281e-06,
+ "loss": 0.0517,
+ "step": 27768
+ },
+ {
+ "epoch": 75.66485013623978,
+ "grad_norm": 4.073539733886719,
+ "learning_rate": 2.9484596133449086e-06,
+ "loss": 0.2055,
+ "step": 27769
+ },
+ {
+ "epoch": 75.66757493188011,
+ "grad_norm": 2.573126792907715,
+ "learning_rate": 2.9478339043241753e-06,
+ "loss": 0.1221,
+ "step": 27770
+ },
+ {
+ "epoch": 75.67029972752043,
+ "grad_norm": 4.630699157714844,
+ "learning_rate": 2.947208250225484e-06,
+ "loss": 0.2313,
+ "step": 27771
+ },
+ {
+ "epoch": 75.67302452316076,
+ "grad_norm": 2.453627109527588,
+ "learning_rate": 2.946582651053709e-06,
+ "loss": 0.0513,
+ "step": 27772
+ },
+ {
+ "epoch": 75.6757493188011,
+ "grad_norm": 5.062366008758545,
+ "learning_rate": 2.945957106813723e-06,
+ "loss": 0.1424,
+ "step": 27773
+ },
+ {
+ "epoch": 75.67847411444141,
+ "grad_norm": 2.7563202381134033,
+ "learning_rate": 2.945331617510394e-06,
+ "loss": 0.1469,
+ "step": 27774
+ },
+ {
+ "epoch": 75.68119891008175,
+ "grad_norm": 8.14344596862793,
+ "learning_rate": 2.9447061831485933e-06,
+ "loss": 0.0764,
+ "step": 27775
+ },
+ {
+ "epoch": 75.68392370572207,
+ "grad_norm": 2.9626362323760986,
+ "learning_rate": 2.944080803733197e-06,
+ "loss": 0.0455,
+ "step": 27776
+ },
+ {
+ "epoch": 75.6866485013624,
+ "grad_norm": 2.519667148590088,
+ "learning_rate": 2.943455479269073e-06,
+ "loss": 0.1069,
+ "step": 27777
+ },
+ {
+ "epoch": 75.68937329700273,
+ "grad_norm": 2.71968674659729,
+ "learning_rate": 2.9428302097610894e-06,
+ "loss": 0.0428,
+ "step": 27778
+ },
+ {
+ "epoch": 75.69209809264305,
+ "grad_norm": 2.561763286590576,
+ "learning_rate": 2.9422049952141142e-06,
+ "loss": 0.1014,
+ "step": 27779
+ },
+ {
+ "epoch": 75.69482288828338,
+ "grad_norm": 2.0596539974212646,
+ "learning_rate": 2.941579835633019e-06,
+ "loss": 0.032,
+ "step": 27780
+ },
+ {
+ "epoch": 75.6975476839237,
+ "grad_norm": 1.8910735845565796,
+ "learning_rate": 2.9409547310226773e-06,
+ "loss": 0.1788,
+ "step": 27781
+ },
+ {
+ "epoch": 75.70027247956403,
+ "grad_norm": 5.750277519226074,
+ "learning_rate": 2.9403296813879513e-06,
+ "loss": 0.0515,
+ "step": 27782
+ },
+ {
+ "epoch": 75.70299727520435,
+ "grad_norm": 1.9856802225112915,
+ "learning_rate": 2.939704686733711e-06,
+ "loss": 0.0274,
+ "step": 27783
+ },
+ {
+ "epoch": 75.70572207084469,
+ "grad_norm": 2.824207067489624,
+ "learning_rate": 2.939079747064821e-06,
+ "loss": 0.0716,
+ "step": 27784
+ },
+ {
+ "epoch": 75.70844686648502,
+ "grad_norm": 3.398721933364868,
+ "learning_rate": 2.9384548623861533e-06,
+ "loss": 0.1962,
+ "step": 27785
+ },
+ {
+ "epoch": 75.71117166212534,
+ "grad_norm": 3.622636318206787,
+ "learning_rate": 2.937830032702572e-06,
+ "loss": 0.0571,
+ "step": 27786
+ },
+ {
+ "epoch": 75.71389645776567,
+ "grad_norm": 4.732388019561768,
+ "learning_rate": 2.9372052580189424e-06,
+ "loss": 0.0569,
+ "step": 27787
+ },
+ {
+ "epoch": 75.71662125340599,
+ "grad_norm": 2.658836841583252,
+ "learning_rate": 2.936580538340129e-06,
+ "loss": 0.0514,
+ "step": 27788
+ },
+ {
+ "epoch": 75.71934604904632,
+ "grad_norm": 2.121434211730957,
+ "learning_rate": 2.9359558736710016e-06,
+ "loss": 0.0357,
+ "step": 27789
+ },
+ {
+ "epoch": 75.72207084468666,
+ "grad_norm": 3.747109889984131,
+ "learning_rate": 2.9353312640164223e-06,
+ "loss": 0.1473,
+ "step": 27790
+ },
+ {
+ "epoch": 75.72479564032697,
+ "grad_norm": 3.1915030479431152,
+ "learning_rate": 2.934706709381253e-06,
+ "loss": 0.2152,
+ "step": 27791
+ },
+ {
+ "epoch": 75.7275204359673,
+ "grad_norm": 2.266594886779785,
+ "learning_rate": 2.9340822097703626e-06,
+ "loss": 0.039,
+ "step": 27792
+ },
+ {
+ "epoch": 75.73024523160763,
+ "grad_norm": 4.012491226196289,
+ "learning_rate": 2.933457765188613e-06,
+ "loss": 0.0697,
+ "step": 27793
+ },
+ {
+ "epoch": 75.73297002724796,
+ "grad_norm": 3.757294178009033,
+ "learning_rate": 2.932833375640868e-06,
+ "loss": 0.1701,
+ "step": 27794
+ },
+ {
+ "epoch": 75.73569482288828,
+ "grad_norm": 4.026195526123047,
+ "learning_rate": 2.932209041131985e-06,
+ "loss": 0.0751,
+ "step": 27795
+ },
+ {
+ "epoch": 75.73841961852861,
+ "grad_norm": 3.2037413120269775,
+ "learning_rate": 2.9315847616668315e-06,
+ "loss": 0.0926,
+ "step": 27796
+ },
+ {
+ "epoch": 75.74114441416894,
+ "grad_norm": 2.414330005645752,
+ "learning_rate": 2.93096053725027e-06,
+ "loss": 0.0307,
+ "step": 27797
+ },
+ {
+ "epoch": 75.74386920980926,
+ "grad_norm": 2.8596391677856445,
+ "learning_rate": 2.930336367887161e-06,
+ "loss": 0.0864,
+ "step": 27798
+ },
+ {
+ "epoch": 75.7465940054496,
+ "grad_norm": 3.3420329093933105,
+ "learning_rate": 2.929712253582365e-06,
+ "loss": 0.0613,
+ "step": 27799
+ },
+ {
+ "epoch": 75.74931880108991,
+ "grad_norm": 2.1052417755126953,
+ "learning_rate": 2.929088194340739e-06,
+ "loss": 0.0838,
+ "step": 27800
+ },
+ {
+ "epoch": 75.75204359673025,
+ "grad_norm": 3.157144784927368,
+ "learning_rate": 2.928464190167151e-06,
+ "loss": 0.1619,
+ "step": 27801
+ },
+ {
+ "epoch": 75.75476839237058,
+ "grad_norm": 2.7051918506622314,
+ "learning_rate": 2.9278402410664543e-06,
+ "loss": 0.0595,
+ "step": 27802
+ },
+ {
+ "epoch": 75.7574931880109,
+ "grad_norm": 2.1615326404571533,
+ "learning_rate": 2.927216347043511e-06,
+ "loss": 0.0281,
+ "step": 27803
+ },
+ {
+ "epoch": 75.76021798365123,
+ "grad_norm": 4.368989944458008,
+ "learning_rate": 2.9265925081031767e-06,
+ "loss": 0.0499,
+ "step": 27804
+ },
+ {
+ "epoch": 75.76294277929155,
+ "grad_norm": 2.4406278133392334,
+ "learning_rate": 2.9259687242503144e-06,
+ "loss": 0.0515,
+ "step": 27805
+ },
+ {
+ "epoch": 75.76566757493188,
+ "grad_norm": 1.9840441942214966,
+ "learning_rate": 2.9253449954897807e-06,
+ "loss": 0.0221,
+ "step": 27806
+ },
+ {
+ "epoch": 75.7683923705722,
+ "grad_norm": 5.387057781219482,
+ "learning_rate": 2.9247213218264326e-06,
+ "loss": 0.1185,
+ "step": 27807
+ },
+ {
+ "epoch": 75.77111716621253,
+ "grad_norm": 3.386645555496216,
+ "learning_rate": 2.924097703265123e-06,
+ "loss": 0.15,
+ "step": 27808
+ },
+ {
+ "epoch": 75.77384196185287,
+ "grad_norm": 3.5044636726379395,
+ "learning_rate": 2.9234741398107168e-06,
+ "loss": 0.1477,
+ "step": 27809
+ },
+ {
+ "epoch": 75.77656675749319,
+ "grad_norm": 2.8873465061187744,
+ "learning_rate": 2.922850631468066e-06,
+ "loss": 0.0611,
+ "step": 27810
+ },
+ {
+ "epoch": 75.77929155313352,
+ "grad_norm": 5.114377975463867,
+ "learning_rate": 2.9222271782420264e-06,
+ "loss": 0.0489,
+ "step": 27811
+ },
+ {
+ "epoch": 75.78201634877384,
+ "grad_norm": 2.4986019134521484,
+ "learning_rate": 2.921603780137451e-06,
+ "loss": 0.0862,
+ "step": 27812
+ },
+ {
+ "epoch": 75.78474114441417,
+ "grad_norm": 10.487380981445312,
+ "learning_rate": 2.9209804371592e-06,
+ "loss": 0.0415,
+ "step": 27813
+ },
+ {
+ "epoch": 75.7874659400545,
+ "grad_norm": 2.6905405521392822,
+ "learning_rate": 2.920357149312123e-06,
+ "loss": 0.0858,
+ "step": 27814
+ },
+ {
+ "epoch": 75.79019073569482,
+ "grad_norm": 2.6635348796844482,
+ "learning_rate": 2.9197339166010795e-06,
+ "loss": 0.041,
+ "step": 27815
+ },
+ {
+ "epoch": 75.79291553133515,
+ "grad_norm": 2.844661235809326,
+ "learning_rate": 2.919110739030918e-06,
+ "loss": 0.0576,
+ "step": 27816
+ },
+ {
+ "epoch": 75.79564032697547,
+ "grad_norm": 3.05802583694458,
+ "learning_rate": 2.918487616606497e-06,
+ "loss": 0.0695,
+ "step": 27817
+ },
+ {
+ "epoch": 75.7983651226158,
+ "grad_norm": 3.6677818298339844,
+ "learning_rate": 2.9178645493326664e-06,
+ "loss": 0.0724,
+ "step": 27818
+ },
+ {
+ "epoch": 75.80108991825612,
+ "grad_norm": 2.994086980819702,
+ "learning_rate": 2.917241537214278e-06,
+ "loss": 0.04,
+ "step": 27819
+ },
+ {
+ "epoch": 75.80381471389646,
+ "grad_norm": 2.594191551208496,
+ "learning_rate": 2.916618580256182e-06,
+ "loss": 0.0652,
+ "step": 27820
+ },
+ {
+ "epoch": 75.80653950953679,
+ "grad_norm": 3.1373801231384277,
+ "learning_rate": 2.915995678463236e-06,
+ "loss": 0.0761,
+ "step": 27821
+ },
+ {
+ "epoch": 75.80926430517711,
+ "grad_norm": 2.3345096111297607,
+ "learning_rate": 2.9153728318402875e-06,
+ "loss": 0.0311,
+ "step": 27822
+ },
+ {
+ "epoch": 75.81198910081744,
+ "grad_norm": 2.6505022048950195,
+ "learning_rate": 2.914750040392187e-06,
+ "loss": 0.0343,
+ "step": 27823
+ },
+ {
+ "epoch": 75.81471389645776,
+ "grad_norm": 2.4502649307250977,
+ "learning_rate": 2.9141273041237817e-06,
+ "loss": 0.0377,
+ "step": 27824
+ },
+ {
+ "epoch": 75.8174386920981,
+ "grad_norm": 2.3624539375305176,
+ "learning_rate": 2.9135046230399288e-06,
+ "loss": 0.0392,
+ "step": 27825
+ },
+ {
+ "epoch": 75.82016348773843,
+ "grad_norm": 5.040776252746582,
+ "learning_rate": 2.9128819971454736e-06,
+ "loss": 0.0507,
+ "step": 27826
+ },
+ {
+ "epoch": 75.82288828337875,
+ "grad_norm": 1.5148581266403198,
+ "learning_rate": 2.9122594264452654e-06,
+ "loss": 0.0234,
+ "step": 27827
+ },
+ {
+ "epoch": 75.82561307901908,
+ "grad_norm": 3.950441360473633,
+ "learning_rate": 2.9116369109441487e-06,
+ "loss": 0.1785,
+ "step": 27828
+ },
+ {
+ "epoch": 75.8283378746594,
+ "grad_norm": 16.9500675201416,
+ "learning_rate": 2.9110144506469806e-06,
+ "loss": 0.0715,
+ "step": 27829
+ },
+ {
+ "epoch": 75.83106267029973,
+ "grad_norm": 2.742633819580078,
+ "learning_rate": 2.910392045558602e-06,
+ "loss": 0.1761,
+ "step": 27830
+ },
+ {
+ "epoch": 75.83378746594005,
+ "grad_norm": 2.607189655303955,
+ "learning_rate": 2.9097696956838596e-06,
+ "loss": 0.0296,
+ "step": 27831
+ },
+ {
+ "epoch": 75.83651226158038,
+ "grad_norm": 2.5312812328338623,
+ "learning_rate": 2.9091474010276024e-06,
+ "loss": 0.0247,
+ "step": 27832
+ },
+ {
+ "epoch": 75.83923705722071,
+ "grad_norm": 4.3888630867004395,
+ "learning_rate": 2.908525161594681e-06,
+ "loss": 0.0471,
+ "step": 27833
+ },
+ {
+ "epoch": 75.84196185286103,
+ "grad_norm": 3.578895092010498,
+ "learning_rate": 2.9079029773899357e-06,
+ "loss": 0.0296,
+ "step": 27834
+ },
+ {
+ "epoch": 75.84468664850137,
+ "grad_norm": 1.764914870262146,
+ "learning_rate": 2.9072808484182146e-06,
+ "loss": 0.0236,
+ "step": 27835
+ },
+ {
+ "epoch": 75.84741144414168,
+ "grad_norm": 4.9986419677734375,
+ "learning_rate": 2.90665877468436e-06,
+ "loss": 0.0736,
+ "step": 27836
+ },
+ {
+ "epoch": 75.85013623978202,
+ "grad_norm": 3.350407361984253,
+ "learning_rate": 2.9060367561932202e-06,
+ "loss": 0.0569,
+ "step": 27837
+ },
+ {
+ "epoch": 75.85286103542235,
+ "grad_norm": 2.895502805709839,
+ "learning_rate": 2.905414792949638e-06,
+ "loss": 0.059,
+ "step": 27838
+ },
+ {
+ "epoch": 75.85558583106267,
+ "grad_norm": 2.3329083919525146,
+ "learning_rate": 2.9047928849584573e-06,
+ "loss": 0.0486,
+ "step": 27839
+ },
+ {
+ "epoch": 75.858310626703,
+ "grad_norm": 2.8299543857574463,
+ "learning_rate": 2.904171032224519e-06,
+ "loss": 0.1994,
+ "step": 27840
+ },
+ {
+ "epoch": 75.86103542234332,
+ "grad_norm": 2.45097017288208,
+ "learning_rate": 2.9035492347526704e-06,
+ "loss": 0.0972,
+ "step": 27841
+ },
+ {
+ "epoch": 75.86376021798365,
+ "grad_norm": 2.9409539699554443,
+ "learning_rate": 2.902927492547751e-06,
+ "loss": 0.1533,
+ "step": 27842
+ },
+ {
+ "epoch": 75.86648501362397,
+ "grad_norm": 2.9123213291168213,
+ "learning_rate": 2.9023058056146058e-06,
+ "loss": 0.0451,
+ "step": 27843
+ },
+ {
+ "epoch": 75.8692098092643,
+ "grad_norm": 3.152182102203369,
+ "learning_rate": 2.9016841739580703e-06,
+ "loss": 0.0314,
+ "step": 27844
+ },
+ {
+ "epoch": 75.87193460490464,
+ "grad_norm": 6.103669166564941,
+ "learning_rate": 2.9010625975829944e-06,
+ "loss": 0.092,
+ "step": 27845
+ },
+ {
+ "epoch": 75.87465940054496,
+ "grad_norm": 2.2012038230895996,
+ "learning_rate": 2.9004410764942125e-06,
+ "loss": 0.0655,
+ "step": 27846
+ },
+ {
+ "epoch": 75.87738419618529,
+ "grad_norm": 2.2651119232177734,
+ "learning_rate": 2.8998196106965693e-06,
+ "loss": 0.0396,
+ "step": 27847
+ },
+ {
+ "epoch": 75.88010899182561,
+ "grad_norm": 2.6364383697509766,
+ "learning_rate": 2.899198200194897e-06,
+ "loss": 0.036,
+ "step": 27848
+ },
+ {
+ "epoch": 75.88283378746594,
+ "grad_norm": 1.9506982564926147,
+ "learning_rate": 2.8985768449940422e-06,
+ "loss": 0.0258,
+ "step": 27849
+ },
+ {
+ "epoch": 75.88555858310627,
+ "grad_norm": 2.8842601776123047,
+ "learning_rate": 2.897955545098845e-06,
+ "loss": 0.0325,
+ "step": 27850
+ },
+ {
+ "epoch": 75.88828337874659,
+ "grad_norm": 2.7214174270629883,
+ "learning_rate": 2.897334300514142e-06,
+ "loss": 0.082,
+ "step": 27851
+ },
+ {
+ "epoch": 75.89100817438693,
+ "grad_norm": 3.42515230178833,
+ "learning_rate": 2.89671311124477e-06,
+ "loss": 0.0865,
+ "step": 27852
+ },
+ {
+ "epoch": 75.89373297002724,
+ "grad_norm": 2.3143978118896484,
+ "learning_rate": 2.8960919772955642e-06,
+ "loss": 0.0284,
+ "step": 27853
+ },
+ {
+ "epoch": 75.89645776566758,
+ "grad_norm": 3.6452369689941406,
+ "learning_rate": 2.89547089867137e-06,
+ "loss": 0.0711,
+ "step": 27854
+ },
+ {
+ "epoch": 75.8991825613079,
+ "grad_norm": 3.0343549251556396,
+ "learning_rate": 2.894849875377018e-06,
+ "loss": 0.1123,
+ "step": 27855
+ },
+ {
+ "epoch": 75.90190735694823,
+ "grad_norm": 2.7725486755371094,
+ "learning_rate": 2.8942289074173447e-06,
+ "loss": 0.0851,
+ "step": 27856
+ },
+ {
+ "epoch": 75.90463215258856,
+ "grad_norm": 3.272948980331421,
+ "learning_rate": 2.8936079947971907e-06,
+ "loss": 0.115,
+ "step": 27857
+ },
+ {
+ "epoch": 75.90735694822888,
+ "grad_norm": 2.96177077293396,
+ "learning_rate": 2.8929871375213893e-06,
+ "loss": 0.0474,
+ "step": 27858
+ },
+ {
+ "epoch": 75.91008174386921,
+ "grad_norm": 2.71899151802063,
+ "learning_rate": 2.892366335594775e-06,
+ "loss": 0.0421,
+ "step": 27859
+ },
+ {
+ "epoch": 75.91280653950953,
+ "grad_norm": 2.39719557762146,
+ "learning_rate": 2.8917455890221803e-06,
+ "loss": 0.0221,
+ "step": 27860
+ },
+ {
+ "epoch": 75.91553133514986,
+ "grad_norm": 3.4639968872070312,
+ "learning_rate": 2.891124897808445e-06,
+ "loss": 0.0678,
+ "step": 27861
+ },
+ {
+ "epoch": 75.9182561307902,
+ "grad_norm": 3.6853580474853516,
+ "learning_rate": 2.890504261958399e-06,
+ "loss": 0.0255,
+ "step": 27862
+ },
+ {
+ "epoch": 75.92098092643052,
+ "grad_norm": 3.5848002433776855,
+ "learning_rate": 2.8898836814768783e-06,
+ "loss": 0.0842,
+ "step": 27863
+ },
+ {
+ "epoch": 75.92370572207085,
+ "grad_norm": 3.7451703548431396,
+ "learning_rate": 2.889263156368711e-06,
+ "loss": 0.1634,
+ "step": 27864
+ },
+ {
+ "epoch": 75.92643051771117,
+ "grad_norm": 2.401470184326172,
+ "learning_rate": 2.8886426866387342e-06,
+ "loss": 0.0686,
+ "step": 27865
+ },
+ {
+ "epoch": 75.9291553133515,
+ "grad_norm": 5.314740180969238,
+ "learning_rate": 2.8880222722917817e-06,
+ "loss": 0.0775,
+ "step": 27866
+ },
+ {
+ "epoch": 75.93188010899182,
+ "grad_norm": 2.852182149887085,
+ "learning_rate": 2.8874019133326825e-06,
+ "loss": 0.0278,
+ "step": 27867
+ },
+ {
+ "epoch": 75.93460490463215,
+ "grad_norm": 3.7330596446990967,
+ "learning_rate": 2.8867816097662693e-06,
+ "loss": 0.0779,
+ "step": 27868
+ },
+ {
+ "epoch": 75.93732970027249,
+ "grad_norm": 3.6809818744659424,
+ "learning_rate": 2.886161361597368e-06,
+ "loss": 0.1212,
+ "step": 27869
+ },
+ {
+ "epoch": 75.9400544959128,
+ "grad_norm": 2.729417324066162,
+ "learning_rate": 2.8855411688308165e-06,
+ "loss": 0.0404,
+ "step": 27870
+ },
+ {
+ "epoch": 75.94277929155314,
+ "grad_norm": 4.025170803070068,
+ "learning_rate": 2.8849210314714414e-06,
+ "loss": 0.0796,
+ "step": 27871
+ },
+ {
+ "epoch": 75.94550408719346,
+ "grad_norm": 3.068633556365967,
+ "learning_rate": 2.8843009495240724e-06,
+ "loss": 0.0654,
+ "step": 27872
+ },
+ {
+ "epoch": 75.94822888283379,
+ "grad_norm": 2.7954258918762207,
+ "learning_rate": 2.883680922993536e-06,
+ "loss": 0.1775,
+ "step": 27873
+ },
+ {
+ "epoch": 75.95095367847412,
+ "grad_norm": 2.1981656551361084,
+ "learning_rate": 2.8830609518846652e-06,
+ "loss": 0.0327,
+ "step": 27874
+ },
+ {
+ "epoch": 75.95367847411444,
+ "grad_norm": 4.070340156555176,
+ "learning_rate": 2.882441036202288e-06,
+ "loss": 0.0748,
+ "step": 27875
+ },
+ {
+ "epoch": 75.95640326975477,
+ "grad_norm": 4.704790115356445,
+ "learning_rate": 2.8818211759512306e-06,
+ "loss": 0.0441,
+ "step": 27876
+ },
+ {
+ "epoch": 75.95912806539509,
+ "grad_norm": 2.5818374156951904,
+ "learning_rate": 2.8812013711363173e-06,
+ "loss": 0.0647,
+ "step": 27877
+ },
+ {
+ "epoch": 75.96185286103542,
+ "grad_norm": 2.595198154449463,
+ "learning_rate": 2.8805816217623815e-06,
+ "loss": 0.0374,
+ "step": 27878
+ },
+ {
+ "epoch": 75.96457765667574,
+ "grad_norm": 2.841723680496216,
+ "learning_rate": 2.8799619278342474e-06,
+ "loss": 0.2167,
+ "step": 27879
+ },
+ {
+ "epoch": 75.96730245231608,
+ "grad_norm": 3.9617176055908203,
+ "learning_rate": 2.879342289356737e-06,
+ "loss": 0.1075,
+ "step": 27880
+ },
+ {
+ "epoch": 75.97002724795641,
+ "grad_norm": 2.281709909439087,
+ "learning_rate": 2.8787227063346835e-06,
+ "loss": 0.1604,
+ "step": 27881
+ },
+ {
+ "epoch": 75.97275204359673,
+ "grad_norm": 2.5206027030944824,
+ "learning_rate": 2.878103178772905e-06,
+ "loss": 0.0326,
+ "step": 27882
+ },
+ {
+ "epoch": 75.97547683923706,
+ "grad_norm": 2.060612916946411,
+ "learning_rate": 2.877483706676233e-06,
+ "loss": 0.0428,
+ "step": 27883
+ },
+ {
+ "epoch": 75.97820163487738,
+ "grad_norm": 3.6709465980529785,
+ "learning_rate": 2.876864290049488e-06,
+ "loss": 0.0366,
+ "step": 27884
+ },
+ {
+ "epoch": 75.98092643051771,
+ "grad_norm": 3.077700138092041,
+ "learning_rate": 2.8762449288974924e-06,
+ "loss": 0.0332,
+ "step": 27885
+ },
+ {
+ "epoch": 75.98365122615803,
+ "grad_norm": 3.304319381713867,
+ "learning_rate": 2.8756256232250744e-06,
+ "loss": 0.0729,
+ "step": 27886
+ },
+ {
+ "epoch": 75.98637602179836,
+ "grad_norm": 2.5324795246124268,
+ "learning_rate": 2.875006373037055e-06,
+ "loss": 0.0511,
+ "step": 27887
+ },
+ {
+ "epoch": 75.9891008174387,
+ "grad_norm": 3.1744704246520996,
+ "learning_rate": 2.874387178338257e-06,
+ "loss": 0.0573,
+ "step": 27888
+ },
+ {
+ "epoch": 75.99182561307902,
+ "grad_norm": 3.301844835281372,
+ "learning_rate": 2.873768039133499e-06,
+ "loss": 0.0862,
+ "step": 27889
+ },
+ {
+ "epoch": 75.99455040871935,
+ "grad_norm": 2.8942222595214844,
+ "learning_rate": 2.8731489554276092e-06,
+ "loss": 0.0601,
+ "step": 27890
+ },
+ {
+ "epoch": 75.99727520435967,
+ "grad_norm": 4.084033966064453,
+ "learning_rate": 2.872529927225406e-06,
+ "loss": 0.0986,
+ "step": 27891
+ },
+ {
+ "epoch": 76.0,
+ "grad_norm": 3.195117950439453,
+ "learning_rate": 2.8719109545317102e-06,
+ "loss": 0.0686,
+ "step": 27892
+ },
+ {
+ "epoch": 76.00272479564033,
+ "grad_norm": 2.6047229766845703,
+ "learning_rate": 2.871292037351339e-06,
+ "loss": 0.0732,
+ "step": 27893
+ },
+ {
+ "epoch": 76.00544959128065,
+ "grad_norm": 3.359541416168213,
+ "learning_rate": 2.8706731756891194e-06,
+ "loss": 0.0746,
+ "step": 27894
+ },
+ {
+ "epoch": 76.00817438692098,
+ "grad_norm": 2.1447629928588867,
+ "learning_rate": 2.870054369549868e-06,
+ "loss": 0.0314,
+ "step": 27895
+ },
+ {
+ "epoch": 76.0108991825613,
+ "grad_norm": 3.1212072372436523,
+ "learning_rate": 2.869435618938403e-06,
+ "loss": 0.0592,
+ "step": 27896
+ },
+ {
+ "epoch": 76.01362397820164,
+ "grad_norm": 4.256537437438965,
+ "learning_rate": 2.868816923859542e-06,
+ "loss": 0.1006,
+ "step": 27897
+ },
+ {
+ "epoch": 76.01634877384195,
+ "grad_norm": 4.424111366271973,
+ "learning_rate": 2.868198284318108e-06,
+ "loss": 0.0366,
+ "step": 27898
+ },
+ {
+ "epoch": 76.01907356948229,
+ "grad_norm": 2.855241298675537,
+ "learning_rate": 2.8675797003189155e-06,
+ "loss": 0.071,
+ "step": 27899
+ },
+ {
+ "epoch": 76.02179836512262,
+ "grad_norm": 2.134061336517334,
+ "learning_rate": 2.86696117186678e-06,
+ "loss": 0.0453,
+ "step": 27900
+ },
+ {
+ "epoch": 76.02452316076294,
+ "grad_norm": 3.598741054534912,
+ "learning_rate": 2.866342698966521e-06,
+ "loss": 0.0938,
+ "step": 27901
+ },
+ {
+ "epoch": 76.02724795640327,
+ "grad_norm": 2.796027898788452,
+ "learning_rate": 2.865724281622959e-06,
+ "loss": 0.0489,
+ "step": 27902
+ },
+ {
+ "epoch": 76.02997275204359,
+ "grad_norm": 2.716315746307373,
+ "learning_rate": 2.865105919840906e-06,
+ "loss": 0.0393,
+ "step": 27903
+ },
+ {
+ "epoch": 76.03269754768392,
+ "grad_norm": 3.5865912437438965,
+ "learning_rate": 2.86448761362518e-06,
+ "loss": 0.1215,
+ "step": 27904
+ },
+ {
+ "epoch": 76.03542234332426,
+ "grad_norm": 2.713700771331787,
+ "learning_rate": 2.8638693629805904e-06,
+ "loss": 0.1316,
+ "step": 27905
+ },
+ {
+ "epoch": 76.03814713896458,
+ "grad_norm": 2.532438039779663,
+ "learning_rate": 2.8632511679119603e-06,
+ "loss": 0.0276,
+ "step": 27906
+ },
+ {
+ "epoch": 76.04087193460491,
+ "grad_norm": 1.9082499742507935,
+ "learning_rate": 2.8626330284241e-06,
+ "loss": 0.0623,
+ "step": 27907
+ },
+ {
+ "epoch": 76.04359673024523,
+ "grad_norm": 2.3191237449645996,
+ "learning_rate": 2.862014944521824e-06,
+ "loss": 0.1041,
+ "step": 27908
+ },
+ {
+ "epoch": 76.04632152588556,
+ "grad_norm": 3.031367301940918,
+ "learning_rate": 2.861396916209942e-06,
+ "loss": 0.1075,
+ "step": 27909
+ },
+ {
+ "epoch": 76.04904632152588,
+ "grad_norm": 2.3648593425750732,
+ "learning_rate": 2.8607789434932753e-06,
+ "loss": 0.0485,
+ "step": 27910
+ },
+ {
+ "epoch": 76.05177111716621,
+ "grad_norm": 2.374833583831787,
+ "learning_rate": 2.8601610263766324e-06,
+ "loss": 0.0395,
+ "step": 27911
+ },
+ {
+ "epoch": 76.05449591280654,
+ "grad_norm": 2.5501208305358887,
+ "learning_rate": 2.8595431648648255e-06,
+ "loss": 0.0316,
+ "step": 27912
+ },
+ {
+ "epoch": 76.05722070844686,
+ "grad_norm": 2.2800769805908203,
+ "learning_rate": 2.8589253589626633e-06,
+ "loss": 0.2246,
+ "step": 27913
+ },
+ {
+ "epoch": 76.0599455040872,
+ "grad_norm": 2.5565056800842285,
+ "learning_rate": 2.8583076086749627e-06,
+ "loss": 0.0528,
+ "step": 27914
+ },
+ {
+ "epoch": 76.06267029972751,
+ "grad_norm": 8.033062934875488,
+ "learning_rate": 2.857689914006534e-06,
+ "loss": 0.1059,
+ "step": 27915
+ },
+ {
+ "epoch": 76.06539509536785,
+ "grad_norm": 2.8080556392669678,
+ "learning_rate": 2.857072274962186e-06,
+ "loss": 0.0694,
+ "step": 27916
+ },
+ {
+ "epoch": 76.06811989100818,
+ "grad_norm": 2.6445555686950684,
+ "learning_rate": 2.856454691546726e-06,
+ "loss": 0.042,
+ "step": 27917
+ },
+ {
+ "epoch": 76.0708446866485,
+ "grad_norm": 3.4859976768493652,
+ "learning_rate": 2.8558371637649674e-06,
+ "loss": 0.0708,
+ "step": 27918
+ },
+ {
+ "epoch": 76.07356948228883,
+ "grad_norm": 3.230778217315674,
+ "learning_rate": 2.855219691621721e-06,
+ "loss": 0.0956,
+ "step": 27919
+ },
+ {
+ "epoch": 76.07629427792915,
+ "grad_norm": 2.596186399459839,
+ "learning_rate": 2.854602275121795e-06,
+ "loss": 0.0324,
+ "step": 27920
+ },
+ {
+ "epoch": 76.07901907356948,
+ "grad_norm": 2.370415210723877,
+ "learning_rate": 2.853984914269993e-06,
+ "loss": 0.2181,
+ "step": 27921
+ },
+ {
+ "epoch": 76.0817438692098,
+ "grad_norm": 2.104543447494507,
+ "learning_rate": 2.8533676090711294e-06,
+ "loss": 0.0369,
+ "step": 27922
+ },
+ {
+ "epoch": 76.08446866485014,
+ "grad_norm": 2.1844191551208496,
+ "learning_rate": 2.852750359530009e-06,
+ "loss": 0.0964,
+ "step": 27923
+ },
+ {
+ "epoch": 76.08719346049047,
+ "grad_norm": 2.8125557899475098,
+ "learning_rate": 2.8521331656514383e-06,
+ "loss": 0.2011,
+ "step": 27924
+ },
+ {
+ "epoch": 76.08991825613079,
+ "grad_norm": 2.3025074005126953,
+ "learning_rate": 2.851516027440222e-06,
+ "loss": 0.028,
+ "step": 27925
+ },
+ {
+ "epoch": 76.09264305177112,
+ "grad_norm": 3.783123731613159,
+ "learning_rate": 2.8508989449011716e-06,
+ "loss": 0.1999,
+ "step": 27926
+ },
+ {
+ "epoch": 76.09536784741144,
+ "grad_norm": 9.983528137207031,
+ "learning_rate": 2.8502819180390905e-06,
+ "loss": 0.0537,
+ "step": 27927
+ },
+ {
+ "epoch": 76.09809264305177,
+ "grad_norm": 3.5010738372802734,
+ "learning_rate": 2.8496649468587835e-06,
+ "loss": 0.0777,
+ "step": 27928
+ },
+ {
+ "epoch": 76.1008174386921,
+ "grad_norm": 1.9456828832626343,
+ "learning_rate": 2.8490480313650526e-06,
+ "loss": 0.0508,
+ "step": 27929
+ },
+ {
+ "epoch": 76.10354223433242,
+ "grad_norm": 1.8603999614715576,
+ "learning_rate": 2.848431171562708e-06,
+ "loss": 0.0305,
+ "step": 27930
+ },
+ {
+ "epoch": 76.10626702997276,
+ "grad_norm": 1.9711729288101196,
+ "learning_rate": 2.847814367456552e-06,
+ "loss": 0.0224,
+ "step": 27931
+ },
+ {
+ "epoch": 76.10899182561307,
+ "grad_norm": 2.993370771408081,
+ "learning_rate": 2.8471976190513873e-06,
+ "loss": 0.1023,
+ "step": 27932
+ },
+ {
+ "epoch": 76.11171662125341,
+ "grad_norm": 1.6494911909103394,
+ "learning_rate": 2.846580926352014e-06,
+ "loss": 0.0245,
+ "step": 27933
+ },
+ {
+ "epoch": 76.11444141689373,
+ "grad_norm": 2.5368120670318604,
+ "learning_rate": 2.845964289363239e-06,
+ "loss": 0.0825,
+ "step": 27934
+ },
+ {
+ "epoch": 76.11716621253406,
+ "grad_norm": 2.156525135040283,
+ "learning_rate": 2.8453477080898663e-06,
+ "loss": 0.0362,
+ "step": 27935
+ },
+ {
+ "epoch": 76.11989100817439,
+ "grad_norm": 3.1506590843200684,
+ "learning_rate": 2.844731182536695e-06,
+ "loss": 0.0372,
+ "step": 27936
+ },
+ {
+ "epoch": 76.12261580381471,
+ "grad_norm": 2.9435369968414307,
+ "learning_rate": 2.844114712708528e-06,
+ "loss": 0.0659,
+ "step": 27937
+ },
+ {
+ "epoch": 76.12534059945504,
+ "grad_norm": 2.2656257152557373,
+ "learning_rate": 2.843498298610161e-06,
+ "loss": 0.0573,
+ "step": 27938
+ },
+ {
+ "epoch": 76.12806539509536,
+ "grad_norm": 2.793180465698242,
+ "learning_rate": 2.8428819402464024e-06,
+ "loss": 0.0764,
+ "step": 27939
+ },
+ {
+ "epoch": 76.1307901907357,
+ "grad_norm": 2.548090934753418,
+ "learning_rate": 2.842265637622049e-06,
+ "loss": 0.0552,
+ "step": 27940
+ },
+ {
+ "epoch": 76.13351498637603,
+ "grad_norm": 1.7717152833938599,
+ "learning_rate": 2.8416493907418986e-06,
+ "loss": 0.06,
+ "step": 27941
+ },
+ {
+ "epoch": 76.13623978201635,
+ "grad_norm": 2.3561151027679443,
+ "learning_rate": 2.841033199610754e-06,
+ "loss": 0.1106,
+ "step": 27942
+ },
+ {
+ "epoch": 76.13896457765668,
+ "grad_norm": 1.8871134519577026,
+ "learning_rate": 2.8404170642334126e-06,
+ "loss": 0.1241,
+ "step": 27943
+ },
+ {
+ "epoch": 76.141689373297,
+ "grad_norm": 2.2275400161743164,
+ "learning_rate": 2.8398009846146733e-06,
+ "loss": 0.0392,
+ "step": 27944
+ },
+ {
+ "epoch": 76.14441416893733,
+ "grad_norm": 2.4605019092559814,
+ "learning_rate": 2.839184960759329e-06,
+ "loss": 0.0312,
+ "step": 27945
+ },
+ {
+ "epoch": 76.14713896457765,
+ "grad_norm": 2.262267589569092,
+ "learning_rate": 2.838568992672186e-06,
+ "loss": 0.0595,
+ "step": 27946
+ },
+ {
+ "epoch": 76.14986376021798,
+ "grad_norm": 1.9158697128295898,
+ "learning_rate": 2.837953080358038e-06,
+ "loss": 0.0305,
+ "step": 27947
+ },
+ {
+ "epoch": 76.15258855585832,
+ "grad_norm": 3.2195372581481934,
+ "learning_rate": 2.837337223821679e-06,
+ "loss": 0.0617,
+ "step": 27948
+ },
+ {
+ "epoch": 76.15531335149863,
+ "grad_norm": 3.519857406616211,
+ "learning_rate": 2.836721423067905e-06,
+ "loss": 0.0342,
+ "step": 27949
+ },
+ {
+ "epoch": 76.15803814713897,
+ "grad_norm": 2.3365373611450195,
+ "learning_rate": 2.836105678101517e-06,
+ "loss": 0.0415,
+ "step": 27950
+ },
+ {
+ "epoch": 76.16076294277929,
+ "grad_norm": 2.3643312454223633,
+ "learning_rate": 2.8354899889273045e-06,
+ "loss": 0.0693,
+ "step": 27951
+ },
+ {
+ "epoch": 76.16348773841962,
+ "grad_norm": 2.281914234161377,
+ "learning_rate": 2.834874355550069e-06,
+ "loss": 0.0739,
+ "step": 27952
+ },
+ {
+ "epoch": 76.16621253405995,
+ "grad_norm": 2.2375946044921875,
+ "learning_rate": 2.8342587779746e-06,
+ "loss": 0.045,
+ "step": 27953
+ },
+ {
+ "epoch": 76.16893732970027,
+ "grad_norm": 3.7037556171417236,
+ "learning_rate": 2.8336432562056914e-06,
+ "loss": 0.1268,
+ "step": 27954
+ },
+ {
+ "epoch": 76.1716621253406,
+ "grad_norm": 3.3654592037200928,
+ "learning_rate": 2.833027790248141e-06,
+ "loss": 0.0493,
+ "step": 27955
+ },
+ {
+ "epoch": 76.17438692098092,
+ "grad_norm": 2.998358964920044,
+ "learning_rate": 2.8324123801067395e-06,
+ "loss": 0.1388,
+ "step": 27956
+ },
+ {
+ "epoch": 76.17711171662125,
+ "grad_norm": 2.6205263137817383,
+ "learning_rate": 2.8317970257862793e-06,
+ "loss": 0.1454,
+ "step": 27957
+ },
+ {
+ "epoch": 76.17983651226157,
+ "grad_norm": 2.7314774990081787,
+ "learning_rate": 2.83118172729155e-06,
+ "loss": 0.0678,
+ "step": 27958
+ },
+ {
+ "epoch": 76.1825613079019,
+ "grad_norm": 3.8011600971221924,
+ "learning_rate": 2.8305664846273507e-06,
+ "loss": 0.1158,
+ "step": 27959
+ },
+ {
+ "epoch": 76.18528610354224,
+ "grad_norm": 2.4972071647644043,
+ "learning_rate": 2.8299512977984677e-06,
+ "loss": 0.0309,
+ "step": 27960
+ },
+ {
+ "epoch": 76.18801089918256,
+ "grad_norm": 3.224722385406494,
+ "learning_rate": 2.8293361668096943e-06,
+ "loss": 0.144,
+ "step": 27961
+ },
+ {
+ "epoch": 76.19073569482289,
+ "grad_norm": 2.707001209259033,
+ "learning_rate": 2.828721091665816e-06,
+ "loss": 0.0603,
+ "step": 27962
+ },
+ {
+ "epoch": 76.19346049046321,
+ "grad_norm": 2.6368777751922607,
+ "learning_rate": 2.8281060723716303e-06,
+ "loss": 0.1009,
+ "step": 27963
+ },
+ {
+ "epoch": 76.19618528610354,
+ "grad_norm": 3.2318313121795654,
+ "learning_rate": 2.8274911089319247e-06,
+ "loss": 0.1747,
+ "step": 27964
+ },
+ {
+ "epoch": 76.19891008174388,
+ "grad_norm": 1.9589316844940186,
+ "learning_rate": 2.8268762013514826e-06,
+ "loss": 0.1039,
+ "step": 27965
+ },
+ {
+ "epoch": 76.2016348773842,
+ "grad_norm": 3.561958074569702,
+ "learning_rate": 2.826261349635102e-06,
+ "loss": 0.1214,
+ "step": 27966
+ },
+ {
+ "epoch": 76.20435967302453,
+ "grad_norm": 2.2904269695281982,
+ "learning_rate": 2.8256465537875677e-06,
+ "loss": 0.0497,
+ "step": 27967
+ },
+ {
+ "epoch": 76.20708446866485,
+ "grad_norm": 6.865897178649902,
+ "learning_rate": 2.8250318138136655e-06,
+ "loss": 0.0824,
+ "step": 27968
+ },
+ {
+ "epoch": 76.20980926430518,
+ "grad_norm": 2.350994348526001,
+ "learning_rate": 2.8244171297181834e-06,
+ "loss": 0.0295,
+ "step": 27969
+ },
+ {
+ "epoch": 76.2125340599455,
+ "grad_norm": 2.612551689147949,
+ "learning_rate": 2.823802501505909e-06,
+ "loss": 0.0493,
+ "step": 27970
+ },
+ {
+ "epoch": 76.21525885558583,
+ "grad_norm": 2.6668803691864014,
+ "learning_rate": 2.8231879291816323e-06,
+ "loss": 0.1468,
+ "step": 27971
+ },
+ {
+ "epoch": 76.21798365122616,
+ "grad_norm": 1.4058564901351929,
+ "learning_rate": 2.822573412750137e-06,
+ "loss": 0.0191,
+ "step": 27972
+ },
+ {
+ "epoch": 76.22070844686648,
+ "grad_norm": 4.3451409339904785,
+ "learning_rate": 2.8219589522162094e-06,
+ "loss": 0.0678,
+ "step": 27973
+ },
+ {
+ "epoch": 76.22343324250681,
+ "grad_norm": 3.9595370292663574,
+ "learning_rate": 2.8213445475846314e-06,
+ "loss": 0.061,
+ "step": 27974
+ },
+ {
+ "epoch": 76.22615803814713,
+ "grad_norm": 2.8853468894958496,
+ "learning_rate": 2.820730198860194e-06,
+ "loss": 0.0319,
+ "step": 27975
+ },
+ {
+ "epoch": 76.22888283378747,
+ "grad_norm": 2.830885648727417,
+ "learning_rate": 2.820115906047679e-06,
+ "loss": 0.056,
+ "step": 27976
+ },
+ {
+ "epoch": 76.2316076294278,
+ "grad_norm": 3.3954076766967773,
+ "learning_rate": 2.8195016691518708e-06,
+ "loss": 0.0363,
+ "step": 27977
+ },
+ {
+ "epoch": 76.23433242506812,
+ "grad_norm": 2.9091482162475586,
+ "learning_rate": 2.8188874881775484e-06,
+ "loss": 0.1156,
+ "step": 27978
+ },
+ {
+ "epoch": 76.23705722070845,
+ "grad_norm": 2.5474894046783447,
+ "learning_rate": 2.8182733631295023e-06,
+ "loss": 0.0461,
+ "step": 27979
+ },
+ {
+ "epoch": 76.23978201634877,
+ "grad_norm": 3.0233871936798096,
+ "learning_rate": 2.8176592940125124e-06,
+ "loss": 0.0463,
+ "step": 27980
+ },
+ {
+ "epoch": 76.2425068119891,
+ "grad_norm": 2.699345350265503,
+ "learning_rate": 2.8170452808313597e-06,
+ "loss": 0.0485,
+ "step": 27981
+ },
+ {
+ "epoch": 76.24523160762942,
+ "grad_norm": 2.619124174118042,
+ "learning_rate": 2.816431323590826e-06,
+ "loss": 0.0411,
+ "step": 27982
+ },
+ {
+ "epoch": 76.24795640326975,
+ "grad_norm": 2.5384392738342285,
+ "learning_rate": 2.815817422295696e-06,
+ "loss": 0.0391,
+ "step": 27983
+ },
+ {
+ "epoch": 76.25068119891009,
+ "grad_norm": 3.0800857543945312,
+ "learning_rate": 2.815203576950748e-06,
+ "loss": 0.1152,
+ "step": 27984
+ },
+ {
+ "epoch": 76.2534059945504,
+ "grad_norm": 3.9242215156555176,
+ "learning_rate": 2.8145897875607642e-06,
+ "loss": 0.0888,
+ "step": 27985
+ },
+ {
+ "epoch": 76.25613079019074,
+ "grad_norm": 2.9212911128997803,
+ "learning_rate": 2.813976054130517e-06,
+ "loss": 0.0359,
+ "step": 27986
+ },
+ {
+ "epoch": 76.25885558583106,
+ "grad_norm": 2.257206678390503,
+ "learning_rate": 2.8133623766648e-06,
+ "loss": 0.0341,
+ "step": 27987
+ },
+ {
+ "epoch": 76.26158038147139,
+ "grad_norm": 2.452134370803833,
+ "learning_rate": 2.812748755168385e-06,
+ "loss": 0.0352,
+ "step": 27988
+ },
+ {
+ "epoch": 76.26430517711172,
+ "grad_norm": 4.033824920654297,
+ "learning_rate": 2.8121351896460526e-06,
+ "loss": 0.0509,
+ "step": 27989
+ },
+ {
+ "epoch": 76.26702997275204,
+ "grad_norm": 3.3400137424468994,
+ "learning_rate": 2.8115216801025757e-06,
+ "loss": 0.0494,
+ "step": 27990
+ },
+ {
+ "epoch": 76.26975476839237,
+ "grad_norm": 2.57417631149292,
+ "learning_rate": 2.81090822654274e-06,
+ "loss": 0.0645,
+ "step": 27991
+ },
+ {
+ "epoch": 76.2724795640327,
+ "grad_norm": 3.750145435333252,
+ "learning_rate": 2.8102948289713192e-06,
+ "loss": 0.0961,
+ "step": 27992
+ },
+ {
+ "epoch": 76.27520435967303,
+ "grad_norm": 2.211428165435791,
+ "learning_rate": 2.8096814873930913e-06,
+ "loss": 0.0286,
+ "step": 27993
+ },
+ {
+ "epoch": 76.27792915531334,
+ "grad_norm": 5.707901954650879,
+ "learning_rate": 2.809068201812829e-06,
+ "loss": 0.0414,
+ "step": 27994
+ },
+ {
+ "epoch": 76.28065395095368,
+ "grad_norm": 2.3994359970092773,
+ "learning_rate": 2.808454972235316e-06,
+ "loss": 0.0437,
+ "step": 27995
+ },
+ {
+ "epoch": 76.28337874659401,
+ "grad_norm": 2.9409661293029785,
+ "learning_rate": 2.807841798665324e-06,
+ "loss": 0.0636,
+ "step": 27996
+ },
+ {
+ "epoch": 76.28610354223433,
+ "grad_norm": 3.0790517330169678,
+ "learning_rate": 2.8072286811076276e-06,
+ "loss": 0.0868,
+ "step": 27997
+ },
+ {
+ "epoch": 76.28882833787466,
+ "grad_norm": 3.28312349319458,
+ "learning_rate": 2.8066156195670013e-06,
+ "loss": 0.0531,
+ "step": 27998
+ },
+ {
+ "epoch": 76.29155313351498,
+ "grad_norm": 4.68637228012085,
+ "learning_rate": 2.806002614048223e-06,
+ "loss": 0.181,
+ "step": 27999
+ },
+ {
+ "epoch": 76.29427792915531,
+ "grad_norm": 2.338714361190796,
+ "learning_rate": 2.8053896645560653e-06,
+ "loss": 0.0722,
+ "step": 28000
+ },
+ {
+ "epoch": 76.29700272479565,
+ "grad_norm": 2.7918925285339355,
+ "learning_rate": 2.8047767710953013e-06,
+ "loss": 0.0634,
+ "step": 28001
+ },
+ {
+ "epoch": 76.29972752043597,
+ "grad_norm": 2.9978299140930176,
+ "learning_rate": 2.8041639336707007e-06,
+ "loss": 0.0465,
+ "step": 28002
+ },
+ {
+ "epoch": 76.3024523160763,
+ "grad_norm": 2.5506551265716553,
+ "learning_rate": 2.8035511522870395e-06,
+ "loss": 0.1142,
+ "step": 28003
+ },
+ {
+ "epoch": 76.30517711171662,
+ "grad_norm": 2.7005417346954346,
+ "learning_rate": 2.8029384269490946e-06,
+ "loss": 0.0645,
+ "step": 28004
+ },
+ {
+ "epoch": 76.30790190735695,
+ "grad_norm": 2.3669233322143555,
+ "learning_rate": 2.8023257576616327e-06,
+ "loss": 0.0862,
+ "step": 28005
+ },
+ {
+ "epoch": 76.31062670299727,
+ "grad_norm": 2.5922515392303467,
+ "learning_rate": 2.8017131444294233e-06,
+ "loss": 0.1133,
+ "step": 28006
+ },
+ {
+ "epoch": 76.3133514986376,
+ "grad_norm": 2.9336061477661133,
+ "learning_rate": 2.801100587257243e-06,
+ "loss": 0.0842,
+ "step": 28007
+ },
+ {
+ "epoch": 76.31607629427793,
+ "grad_norm": 2.012657642364502,
+ "learning_rate": 2.8004880861498595e-06,
+ "loss": 0.0312,
+ "step": 28008
+ },
+ {
+ "epoch": 76.31880108991825,
+ "grad_norm": 2.521577835083008,
+ "learning_rate": 2.7998756411120444e-06,
+ "loss": 0.0452,
+ "step": 28009
+ },
+ {
+ "epoch": 76.32152588555859,
+ "grad_norm": 1.3363769054412842,
+ "learning_rate": 2.7992632521485617e-06,
+ "loss": 0.0178,
+ "step": 28010
+ },
+ {
+ "epoch": 76.3242506811989,
+ "grad_norm": 3.8090527057647705,
+ "learning_rate": 2.7986509192641887e-06,
+ "loss": 0.2722,
+ "step": 28011
+ },
+ {
+ "epoch": 76.32697547683924,
+ "grad_norm": 2.51955246925354,
+ "learning_rate": 2.7980386424636895e-06,
+ "loss": 0.0662,
+ "step": 28012
+ },
+ {
+ "epoch": 76.32970027247957,
+ "grad_norm": 2.5476555824279785,
+ "learning_rate": 2.7974264217518355e-06,
+ "loss": 0.0414,
+ "step": 28013
+ },
+ {
+ "epoch": 76.33242506811989,
+ "grad_norm": 2.8338663578033447,
+ "learning_rate": 2.7968142571333878e-06,
+ "loss": 0.0899,
+ "step": 28014
+ },
+ {
+ "epoch": 76.33514986376022,
+ "grad_norm": 2.1845476627349854,
+ "learning_rate": 2.796202148613123e-06,
+ "loss": 0.0297,
+ "step": 28015
+ },
+ {
+ "epoch": 76.33787465940054,
+ "grad_norm": 4.120614051818848,
+ "learning_rate": 2.795590096195804e-06,
+ "loss": 0.062,
+ "step": 28016
+ },
+ {
+ "epoch": 76.34059945504087,
+ "grad_norm": 2.4877171516418457,
+ "learning_rate": 2.7949780998861966e-06,
+ "loss": 0.0369,
+ "step": 28017
+ },
+ {
+ "epoch": 76.34332425068119,
+ "grad_norm": 2.8294050693511963,
+ "learning_rate": 2.794366159689066e-06,
+ "loss": 0.0565,
+ "step": 28018
+ },
+ {
+ "epoch": 76.34604904632153,
+ "grad_norm": 2.469412088394165,
+ "learning_rate": 2.793754275609182e-06,
+ "loss": 0.0534,
+ "step": 28019
+ },
+ {
+ "epoch": 76.34877384196186,
+ "grad_norm": 3.135049819946289,
+ "learning_rate": 2.7931424476513047e-06,
+ "loss": 0.026,
+ "step": 28020
+ },
+ {
+ "epoch": 76.35149863760218,
+ "grad_norm": 2.621840476989746,
+ "learning_rate": 2.7925306758202052e-06,
+ "loss": 0.032,
+ "step": 28021
+ },
+ {
+ "epoch": 76.35422343324251,
+ "grad_norm": 2.8926784992218018,
+ "learning_rate": 2.7919189601206455e-06,
+ "loss": 0.0618,
+ "step": 28022
+ },
+ {
+ "epoch": 76.35694822888283,
+ "grad_norm": 2.510206460952759,
+ "learning_rate": 2.7913073005573854e-06,
+ "loss": 0.073,
+ "step": 28023
+ },
+ {
+ "epoch": 76.35967302452316,
+ "grad_norm": 3.0854604244232178,
+ "learning_rate": 2.790695697135195e-06,
+ "loss": 0.0657,
+ "step": 28024
+ },
+ {
+ "epoch": 76.3623978201635,
+ "grad_norm": 4.972815036773682,
+ "learning_rate": 2.790084149858835e-06,
+ "loss": 0.0562,
+ "step": 28025
+ },
+ {
+ "epoch": 76.36512261580381,
+ "grad_norm": 2.648543357849121,
+ "learning_rate": 2.7894726587330666e-06,
+ "loss": 0.0404,
+ "step": 28026
+ },
+ {
+ "epoch": 76.36784741144415,
+ "grad_norm": 2.186492681503296,
+ "learning_rate": 2.7888612237626512e-06,
+ "loss": 0.1184,
+ "step": 28027
+ },
+ {
+ "epoch": 76.37057220708446,
+ "grad_norm": 3.8680977821350098,
+ "learning_rate": 2.788249844952354e-06,
+ "loss": 0.1279,
+ "step": 28028
+ },
+ {
+ "epoch": 76.3732970027248,
+ "grad_norm": 2.42016339302063,
+ "learning_rate": 2.787638522306936e-06,
+ "loss": 0.0575,
+ "step": 28029
+ },
+ {
+ "epoch": 76.37602179836512,
+ "grad_norm": 2.315438747406006,
+ "learning_rate": 2.787027255831154e-06,
+ "loss": 0.1398,
+ "step": 28030
+ },
+ {
+ "epoch": 76.37874659400545,
+ "grad_norm": 3.082136392593384,
+ "learning_rate": 2.7864160455297753e-06,
+ "loss": 0.0778,
+ "step": 28031
+ },
+ {
+ "epoch": 76.38147138964578,
+ "grad_norm": 2.4704718589782715,
+ "learning_rate": 2.7858048914075543e-06,
+ "loss": 0.0338,
+ "step": 28032
+ },
+ {
+ "epoch": 76.3841961852861,
+ "grad_norm": 3.232985258102417,
+ "learning_rate": 2.785193793469254e-06,
+ "loss": 0.0452,
+ "step": 28033
+ },
+ {
+ "epoch": 76.38692098092643,
+ "grad_norm": 2.485524892807007,
+ "learning_rate": 2.784582751719629e-06,
+ "loss": 0.0645,
+ "step": 28034
+ },
+ {
+ "epoch": 76.38964577656675,
+ "grad_norm": 3.575551986694336,
+ "learning_rate": 2.7839717661634446e-06,
+ "loss": 0.033,
+ "step": 28035
+ },
+ {
+ "epoch": 76.39237057220708,
+ "grad_norm": 4.037444114685059,
+ "learning_rate": 2.7833608368054556e-06,
+ "loss": 0.0912,
+ "step": 28036
+ },
+ {
+ "epoch": 76.39509536784742,
+ "grad_norm": 2.73028564453125,
+ "learning_rate": 2.7827499636504164e-06,
+ "loss": 0.0389,
+ "step": 28037
+ },
+ {
+ "epoch": 76.39782016348774,
+ "grad_norm": 2.976391077041626,
+ "learning_rate": 2.7821391467030923e-06,
+ "loss": 0.073,
+ "step": 28038
+ },
+ {
+ "epoch": 76.40054495912807,
+ "grad_norm": 2.569194793701172,
+ "learning_rate": 2.781528385968233e-06,
+ "loss": 0.0475,
+ "step": 28039
+ },
+ {
+ "epoch": 76.40326975476839,
+ "grad_norm": 2.133589267730713,
+ "learning_rate": 2.780917681450601e-06,
+ "loss": 0.0782,
+ "step": 28040
+ },
+ {
+ "epoch": 76.40599455040872,
+ "grad_norm": 2.573448419570923,
+ "learning_rate": 2.7803070331549497e-06,
+ "loss": 0.041,
+ "step": 28041
+ },
+ {
+ "epoch": 76.40871934604904,
+ "grad_norm": 8.486881256103516,
+ "learning_rate": 2.7796964410860348e-06,
+ "loss": 0.0852,
+ "step": 28042
+ },
+ {
+ "epoch": 76.41144414168937,
+ "grad_norm": 2.282289981842041,
+ "learning_rate": 2.7790859052486086e-06,
+ "loss": 0.0532,
+ "step": 28043
+ },
+ {
+ "epoch": 76.4141689373297,
+ "grad_norm": 2.2929494380950928,
+ "learning_rate": 2.778475425647432e-06,
+ "loss": 0.0283,
+ "step": 28044
+ },
+ {
+ "epoch": 76.41689373297002,
+ "grad_norm": 2.257180690765381,
+ "learning_rate": 2.777865002287257e-06,
+ "loss": 0.028,
+ "step": 28045
+ },
+ {
+ "epoch": 76.41961852861036,
+ "grad_norm": 3.966956377029419,
+ "learning_rate": 2.777254635172837e-06,
+ "loss": 0.1017,
+ "step": 28046
+ },
+ {
+ "epoch": 76.42234332425068,
+ "grad_norm": 3.150528907775879,
+ "learning_rate": 2.7766443243089215e-06,
+ "loss": 0.0626,
+ "step": 28047
+ },
+ {
+ "epoch": 76.42506811989101,
+ "grad_norm": 2.919949531555176,
+ "learning_rate": 2.776034069700271e-06,
+ "loss": 0.0627,
+ "step": 28048
+ },
+ {
+ "epoch": 76.42779291553134,
+ "grad_norm": 4.475660800933838,
+ "learning_rate": 2.7754238713516347e-06,
+ "loss": 0.0263,
+ "step": 28049
+ },
+ {
+ "epoch": 76.43051771117166,
+ "grad_norm": 4.334867000579834,
+ "learning_rate": 2.7748137292677647e-06,
+ "loss": 0.0891,
+ "step": 28050
+ },
+ {
+ "epoch": 76.433242506812,
+ "grad_norm": 2.3135111331939697,
+ "learning_rate": 2.7742036434534094e-06,
+ "loss": 0.0327,
+ "step": 28051
+ },
+ {
+ "epoch": 76.43596730245231,
+ "grad_norm": 2.878211736679077,
+ "learning_rate": 2.773593613913327e-06,
+ "loss": 0.0934,
+ "step": 28052
+ },
+ {
+ "epoch": 76.43869209809264,
+ "grad_norm": 3.610713243484497,
+ "learning_rate": 2.772983640652265e-06,
+ "loss": 0.0512,
+ "step": 28053
+ },
+ {
+ "epoch": 76.44141689373296,
+ "grad_norm": 2.4285902976989746,
+ "learning_rate": 2.7723737236749705e-06,
+ "loss": 0.0773,
+ "step": 28054
+ },
+ {
+ "epoch": 76.4441416893733,
+ "grad_norm": 8.0861177444458,
+ "learning_rate": 2.7717638629861965e-06,
+ "loss": 0.1366,
+ "step": 28055
+ },
+ {
+ "epoch": 76.44686648501363,
+ "grad_norm": 2.8861968517303467,
+ "learning_rate": 2.771154058590697e-06,
+ "loss": 0.0925,
+ "step": 28056
+ },
+ {
+ "epoch": 76.44959128065395,
+ "grad_norm": 1.7526333332061768,
+ "learning_rate": 2.7705443104932163e-06,
+ "loss": 0.0517,
+ "step": 28057
+ },
+ {
+ "epoch": 76.45231607629428,
+ "grad_norm": 3.7791574001312256,
+ "learning_rate": 2.7699346186985044e-06,
+ "loss": 0.0516,
+ "step": 28058
+ },
+ {
+ "epoch": 76.4550408719346,
+ "grad_norm": 3.859914541244507,
+ "learning_rate": 2.7693249832113055e-06,
+ "loss": 0.0406,
+ "step": 28059
+ },
+ {
+ "epoch": 76.45776566757493,
+ "grad_norm": 2.121925115585327,
+ "learning_rate": 2.768715404036374e-06,
+ "loss": 0.0477,
+ "step": 28060
+ },
+ {
+ "epoch": 76.46049046321527,
+ "grad_norm": 2.7566285133361816,
+ "learning_rate": 2.7681058811784545e-06,
+ "loss": 0.0475,
+ "step": 28061
+ },
+ {
+ "epoch": 76.46321525885558,
+ "grad_norm": 6.3780837059021,
+ "learning_rate": 2.7674964146422933e-06,
+ "loss": 0.0175,
+ "step": 28062
+ },
+ {
+ "epoch": 76.46594005449592,
+ "grad_norm": 2.3032732009887695,
+ "learning_rate": 2.7668870044326335e-06,
+ "loss": 0.033,
+ "step": 28063
+ },
+ {
+ "epoch": 76.46866485013624,
+ "grad_norm": 3.9634287357330322,
+ "learning_rate": 2.7662776505542286e-06,
+ "loss": 0.0636,
+ "step": 28064
+ },
+ {
+ "epoch": 76.47138964577657,
+ "grad_norm": 2.698305368423462,
+ "learning_rate": 2.765668353011821e-06,
+ "loss": 0.1124,
+ "step": 28065
+ },
+ {
+ "epoch": 76.47411444141689,
+ "grad_norm": 1.495788812637329,
+ "learning_rate": 2.7650591118101557e-06,
+ "loss": 0.0204,
+ "step": 28066
+ },
+ {
+ "epoch": 76.47683923705722,
+ "grad_norm": 3.5963215827941895,
+ "learning_rate": 2.7644499269539728e-06,
+ "loss": 0.033,
+ "step": 28067
+ },
+ {
+ "epoch": 76.47956403269755,
+ "grad_norm": 2.6007676124572754,
+ "learning_rate": 2.7638407984480255e-06,
+ "loss": 0.04,
+ "step": 28068
+ },
+ {
+ "epoch": 76.48228882833787,
+ "grad_norm": 2.2179477214813232,
+ "learning_rate": 2.763231726297052e-06,
+ "loss": 0.1683,
+ "step": 28069
+ },
+ {
+ "epoch": 76.4850136239782,
+ "grad_norm": 3.5508370399475098,
+ "learning_rate": 2.762622710505797e-06,
+ "loss": 0.0412,
+ "step": 28070
+ },
+ {
+ "epoch": 76.48773841961852,
+ "grad_norm": 3.038764476776123,
+ "learning_rate": 2.762013751079001e-06,
+ "loss": 0.1343,
+ "step": 28071
+ },
+ {
+ "epoch": 76.49046321525886,
+ "grad_norm": 3.583001136779785,
+ "learning_rate": 2.7614048480214085e-06,
+ "loss": 0.1194,
+ "step": 28072
+ },
+ {
+ "epoch": 76.49318801089919,
+ "grad_norm": 2.5639359951019287,
+ "learning_rate": 2.7607960013377655e-06,
+ "loss": 0.0358,
+ "step": 28073
+ },
+ {
+ "epoch": 76.49591280653951,
+ "grad_norm": 2.9354007244110107,
+ "learning_rate": 2.76018721103281e-06,
+ "loss": 0.1409,
+ "step": 28074
+ },
+ {
+ "epoch": 76.49863760217984,
+ "grad_norm": 4.090127468109131,
+ "learning_rate": 2.7595784771112798e-06,
+ "loss": 0.053,
+ "step": 28075
+ },
+ {
+ "epoch": 76.50136239782016,
+ "grad_norm": 2.726362466812134,
+ "learning_rate": 2.758969799577923e-06,
+ "loss": 0.0317,
+ "step": 28076
+ },
+ {
+ "epoch": 76.50408719346049,
+ "grad_norm": 2.5246667861938477,
+ "learning_rate": 2.7583611784374766e-06,
+ "loss": 0.0327,
+ "step": 28077
+ },
+ {
+ "epoch": 76.50681198910081,
+ "grad_norm": 4.658145427703857,
+ "learning_rate": 2.7577526136946797e-06,
+ "loss": 0.027,
+ "step": 28078
+ },
+ {
+ "epoch": 76.50953678474114,
+ "grad_norm": 3.1911253929138184,
+ "learning_rate": 2.7571441053542703e-06,
+ "loss": 0.0586,
+ "step": 28079
+ },
+ {
+ "epoch": 76.51226158038148,
+ "grad_norm": 1.6940730810165405,
+ "learning_rate": 2.756535653420992e-06,
+ "loss": 0.0263,
+ "step": 28080
+ },
+ {
+ "epoch": 76.5149863760218,
+ "grad_norm": 2.7947118282318115,
+ "learning_rate": 2.755927257899581e-06,
+ "loss": 0.1399,
+ "step": 28081
+ },
+ {
+ "epoch": 76.51771117166213,
+ "grad_norm": 2.8880624771118164,
+ "learning_rate": 2.7553189187947747e-06,
+ "loss": 0.0391,
+ "step": 28082
+ },
+ {
+ "epoch": 76.52043596730245,
+ "grad_norm": 2.8466579914093018,
+ "learning_rate": 2.7547106361113087e-06,
+ "loss": 0.034,
+ "step": 28083
+ },
+ {
+ "epoch": 76.52316076294278,
+ "grad_norm": 2.4123668670654297,
+ "learning_rate": 2.754102409853927e-06,
+ "loss": 0.0248,
+ "step": 28084
+ },
+ {
+ "epoch": 76.52588555858311,
+ "grad_norm": 2.8858022689819336,
+ "learning_rate": 2.753494240027361e-06,
+ "loss": 0.049,
+ "step": 28085
+ },
+ {
+ "epoch": 76.52861035422343,
+ "grad_norm": 3.041144609451294,
+ "learning_rate": 2.7528861266363507e-06,
+ "loss": 0.0863,
+ "step": 28086
+ },
+ {
+ "epoch": 76.53133514986376,
+ "grad_norm": 3.7189900875091553,
+ "learning_rate": 2.7522780696856256e-06,
+ "loss": 0.0559,
+ "step": 28087
+ },
+ {
+ "epoch": 76.53405994550408,
+ "grad_norm": 2.4244542121887207,
+ "learning_rate": 2.751670069179928e-06,
+ "loss": 0.0654,
+ "step": 28088
+ },
+ {
+ "epoch": 76.53678474114442,
+ "grad_norm": 2.1451120376586914,
+ "learning_rate": 2.751062125123989e-06,
+ "loss": 0.0377,
+ "step": 28089
+ },
+ {
+ "epoch": 76.53950953678473,
+ "grad_norm": 3.701094627380371,
+ "learning_rate": 2.7504542375225474e-06,
+ "loss": 0.0522,
+ "step": 28090
+ },
+ {
+ "epoch": 76.54223433242507,
+ "grad_norm": 2.5902910232543945,
+ "learning_rate": 2.7498464063803342e-06,
+ "loss": 0.0261,
+ "step": 28091
+ },
+ {
+ "epoch": 76.5449591280654,
+ "grad_norm": 3.0719902515411377,
+ "learning_rate": 2.7492386317020814e-06,
+ "loss": 0.0694,
+ "step": 28092
+ },
+ {
+ "epoch": 76.54768392370572,
+ "grad_norm": 3.1734306812286377,
+ "learning_rate": 2.748630913492528e-06,
+ "loss": 0.0366,
+ "step": 28093
+ },
+ {
+ "epoch": 76.55040871934605,
+ "grad_norm": 2.8310868740081787,
+ "learning_rate": 2.7480232517564033e-06,
+ "loss": 0.1542,
+ "step": 28094
+ },
+ {
+ "epoch": 76.55313351498637,
+ "grad_norm": 2.7298359870910645,
+ "learning_rate": 2.747415646498438e-06,
+ "loss": 0.049,
+ "step": 28095
+ },
+ {
+ "epoch": 76.5558583106267,
+ "grad_norm": 2.6002743244171143,
+ "learning_rate": 2.746808097723368e-06,
+ "loss": 0.137,
+ "step": 28096
+ },
+ {
+ "epoch": 76.55858310626704,
+ "grad_norm": 2.7242491245269775,
+ "learning_rate": 2.7462006054359234e-06,
+ "loss": 0.087,
+ "step": 28097
+ },
+ {
+ "epoch": 76.56130790190736,
+ "grad_norm": 2.934518575668335,
+ "learning_rate": 2.7455931696408356e-06,
+ "loss": 0.0244,
+ "step": 28098
+ },
+ {
+ "epoch": 76.56403269754769,
+ "grad_norm": 3.0216727256774902,
+ "learning_rate": 2.7449857903428314e-06,
+ "loss": 0.1071,
+ "step": 28099
+ },
+ {
+ "epoch": 76.566757493188,
+ "grad_norm": 2.2561445236206055,
+ "learning_rate": 2.7443784675466465e-06,
+ "loss": 0.0375,
+ "step": 28100
+ },
+ {
+ "epoch": 76.56948228882834,
+ "grad_norm": 6.173305511474609,
+ "learning_rate": 2.7437712012570105e-06,
+ "loss": 0.0829,
+ "step": 28101
+ },
+ {
+ "epoch": 76.57220708446866,
+ "grad_norm": 2.828070640563965,
+ "learning_rate": 2.7431639914786488e-06,
+ "loss": 0.1561,
+ "step": 28102
+ },
+ {
+ "epoch": 76.57493188010899,
+ "grad_norm": 4.874003887176514,
+ "learning_rate": 2.7425568382162904e-06,
+ "loss": 0.0374,
+ "step": 28103
+ },
+ {
+ "epoch": 76.57765667574932,
+ "grad_norm": 3.1307716369628906,
+ "learning_rate": 2.7419497414746687e-06,
+ "loss": 0.0495,
+ "step": 28104
+ },
+ {
+ "epoch": 76.58038147138964,
+ "grad_norm": 2.9444665908813477,
+ "learning_rate": 2.741342701258509e-06,
+ "loss": 0.0503,
+ "step": 28105
+ },
+ {
+ "epoch": 76.58310626702998,
+ "grad_norm": 3.124049186706543,
+ "learning_rate": 2.7407357175725356e-06,
+ "loss": 0.0382,
+ "step": 28106
+ },
+ {
+ "epoch": 76.5858310626703,
+ "grad_norm": 3.487481117248535,
+ "learning_rate": 2.7401287904214813e-06,
+ "loss": 0.1275,
+ "step": 28107
+ },
+ {
+ "epoch": 76.58855585831063,
+ "grad_norm": 2.9745378494262695,
+ "learning_rate": 2.7395219198100674e-06,
+ "loss": 0.1387,
+ "step": 28108
+ },
+ {
+ "epoch": 76.59128065395096,
+ "grad_norm": 3.164611577987671,
+ "learning_rate": 2.7389151057430272e-06,
+ "loss": 0.0644,
+ "step": 28109
+ },
+ {
+ "epoch": 76.59400544959128,
+ "grad_norm": 2.4915006160736084,
+ "learning_rate": 2.7383083482250815e-06,
+ "loss": 0.0702,
+ "step": 28110
+ },
+ {
+ "epoch": 76.59673024523161,
+ "grad_norm": 3.8384878635406494,
+ "learning_rate": 2.7377016472609562e-06,
+ "loss": 0.0516,
+ "step": 28111
+ },
+ {
+ "epoch": 76.59945504087193,
+ "grad_norm": 3.1336984634399414,
+ "learning_rate": 2.7370950028553744e-06,
+ "loss": 0.0435,
+ "step": 28112
+ },
+ {
+ "epoch": 76.60217983651226,
+ "grad_norm": 3.026506185531616,
+ "learning_rate": 2.7364884150130667e-06,
+ "loss": 0.0527,
+ "step": 28113
+ },
+ {
+ "epoch": 76.60490463215258,
+ "grad_norm": 2.474282741546631,
+ "learning_rate": 2.7358818837387525e-06,
+ "loss": 0.06,
+ "step": 28114
+ },
+ {
+ "epoch": 76.60762942779292,
+ "grad_norm": 2.46525502204895,
+ "learning_rate": 2.7352754090371538e-06,
+ "loss": 0.0275,
+ "step": 28115
+ },
+ {
+ "epoch": 76.61035422343325,
+ "grad_norm": 3.462277412414551,
+ "learning_rate": 2.734668990912999e-06,
+ "loss": 0.0523,
+ "step": 28116
+ },
+ {
+ "epoch": 76.61307901907357,
+ "grad_norm": 4.526456356048584,
+ "learning_rate": 2.734062629371008e-06,
+ "loss": 0.1228,
+ "step": 28117
+ },
+ {
+ "epoch": 76.6158038147139,
+ "grad_norm": 2.8008873462677,
+ "learning_rate": 2.733456324415904e-06,
+ "loss": 0.0318,
+ "step": 28118
+ },
+ {
+ "epoch": 76.61852861035422,
+ "grad_norm": 3.2150888442993164,
+ "learning_rate": 2.732850076052406e-06,
+ "loss": 0.0477,
+ "step": 28119
+ },
+ {
+ "epoch": 76.62125340599455,
+ "grad_norm": 3.417959213256836,
+ "learning_rate": 2.7322438842852394e-06,
+ "loss": 0.0276,
+ "step": 28120
+ },
+ {
+ "epoch": 76.62397820163488,
+ "grad_norm": 3.4848334789276123,
+ "learning_rate": 2.7316377491191236e-06,
+ "loss": 0.0489,
+ "step": 28121
+ },
+ {
+ "epoch": 76.6267029972752,
+ "grad_norm": 2.5796701908111572,
+ "learning_rate": 2.7310316705587793e-06,
+ "loss": 0.1577,
+ "step": 28122
+ },
+ {
+ "epoch": 76.62942779291554,
+ "grad_norm": 2.8394663333892822,
+ "learning_rate": 2.730425648608923e-06,
+ "loss": 0.065,
+ "step": 28123
+ },
+ {
+ "epoch": 76.63215258855585,
+ "grad_norm": 4.187651634216309,
+ "learning_rate": 2.7298196832742786e-06,
+ "loss": 0.2452,
+ "step": 28124
+ },
+ {
+ "epoch": 76.63487738419619,
+ "grad_norm": 2.425128936767578,
+ "learning_rate": 2.729213774559567e-06,
+ "loss": 0.0353,
+ "step": 28125
+ },
+ {
+ "epoch": 76.6376021798365,
+ "grad_norm": 1.9688972234725952,
+ "learning_rate": 2.728607922469505e-06,
+ "loss": 0.0743,
+ "step": 28126
+ },
+ {
+ "epoch": 76.64032697547684,
+ "grad_norm": 3.256420135498047,
+ "learning_rate": 2.728002127008811e-06,
+ "loss": 0.0281,
+ "step": 28127
+ },
+ {
+ "epoch": 76.64305177111717,
+ "grad_norm": 2.346224784851074,
+ "learning_rate": 2.7273963881821984e-06,
+ "loss": 0.1408,
+ "step": 28128
+ },
+ {
+ "epoch": 76.64577656675749,
+ "grad_norm": 2.3820855617523193,
+ "learning_rate": 2.726790705994391e-06,
+ "loss": 0.0971,
+ "step": 28129
+ },
+ {
+ "epoch": 76.64850136239782,
+ "grad_norm": 2.2366647720336914,
+ "learning_rate": 2.7261850804501043e-06,
+ "loss": 0.045,
+ "step": 28130
+ },
+ {
+ "epoch": 76.65122615803814,
+ "grad_norm": 2.996664524078369,
+ "learning_rate": 2.725579511554055e-06,
+ "loss": 0.1373,
+ "step": 28131
+ },
+ {
+ "epoch": 76.65395095367847,
+ "grad_norm": 2.155332565307617,
+ "learning_rate": 2.724973999310954e-06,
+ "loss": 0.0671,
+ "step": 28132
+ },
+ {
+ "epoch": 76.65667574931881,
+ "grad_norm": 3.2764053344726562,
+ "learning_rate": 2.7243685437255253e-06,
+ "loss": 0.1598,
+ "step": 28133
+ },
+ {
+ "epoch": 76.65940054495913,
+ "grad_norm": 1.984950065612793,
+ "learning_rate": 2.7237631448024792e-06,
+ "loss": 0.1516,
+ "step": 28134
+ },
+ {
+ "epoch": 76.66212534059946,
+ "grad_norm": 2.99607253074646,
+ "learning_rate": 2.723157802546532e-06,
+ "loss": 0.0355,
+ "step": 28135
+ },
+ {
+ "epoch": 76.66485013623978,
+ "grad_norm": 2.9442052841186523,
+ "learning_rate": 2.7225525169623947e-06,
+ "loss": 0.1218,
+ "step": 28136
+ },
+ {
+ "epoch": 76.66757493188011,
+ "grad_norm": 3.8162875175476074,
+ "learning_rate": 2.721947288054787e-06,
+ "loss": 0.0678,
+ "step": 28137
+ },
+ {
+ "epoch": 76.67029972752043,
+ "grad_norm": 1.9887125492095947,
+ "learning_rate": 2.7213421158284203e-06,
+ "loss": 0.091,
+ "step": 28138
+ },
+ {
+ "epoch": 76.67302452316076,
+ "grad_norm": 2.8055906295776367,
+ "learning_rate": 2.720737000288003e-06,
+ "loss": 0.1335,
+ "step": 28139
+ },
+ {
+ "epoch": 76.6757493188011,
+ "grad_norm": 2.4547324180603027,
+ "learning_rate": 2.7201319414382554e-06,
+ "loss": 0.0993,
+ "step": 28140
+ },
+ {
+ "epoch": 76.67847411444141,
+ "grad_norm": 2.761908769607544,
+ "learning_rate": 2.7195269392838818e-06,
+ "loss": 0.041,
+ "step": 28141
+ },
+ {
+ "epoch": 76.68119891008175,
+ "grad_norm": 3.926360607147217,
+ "learning_rate": 2.718921993829603e-06,
+ "loss": 0.0517,
+ "step": 28142
+ },
+ {
+ "epoch": 76.68392370572207,
+ "grad_norm": 2.480558395385742,
+ "learning_rate": 2.718317105080124e-06,
+ "loss": 0.1028,
+ "step": 28143
+ },
+ {
+ "epoch": 76.6866485013624,
+ "grad_norm": 2.091433525085449,
+ "learning_rate": 2.717712273040154e-06,
+ "loss": 0.0251,
+ "step": 28144
+ },
+ {
+ "epoch": 76.68937329700273,
+ "grad_norm": 2.3875463008880615,
+ "learning_rate": 2.71710749771441e-06,
+ "loss": 0.0562,
+ "step": 28145
+ },
+ {
+ "epoch": 76.69209809264305,
+ "grad_norm": 2.630124568939209,
+ "learning_rate": 2.7165027791075984e-06,
+ "loss": 0.1114,
+ "step": 28146
+ },
+ {
+ "epoch": 76.69482288828338,
+ "grad_norm": 2.8091511726379395,
+ "learning_rate": 2.715898117224428e-06,
+ "loss": 0.0477,
+ "step": 28147
+ },
+ {
+ "epoch": 76.6975476839237,
+ "grad_norm": 2.7866899967193604,
+ "learning_rate": 2.7152935120696056e-06,
+ "loss": 0.0769,
+ "step": 28148
+ },
+ {
+ "epoch": 76.70027247956403,
+ "grad_norm": 2.8136236667633057,
+ "learning_rate": 2.7146889636478467e-06,
+ "loss": 0.0573,
+ "step": 28149
+ },
+ {
+ "epoch": 76.70299727520435,
+ "grad_norm": 2.7409310340881348,
+ "learning_rate": 2.714084471963855e-06,
+ "loss": 0.1757,
+ "step": 28150
+ },
+ {
+ "epoch": 76.70572207084469,
+ "grad_norm": 2.173962354660034,
+ "learning_rate": 2.713480037022339e-06,
+ "loss": 0.0296,
+ "step": 28151
+ },
+ {
+ "epoch": 76.70844686648502,
+ "grad_norm": 2.338724374771118,
+ "learning_rate": 2.712875658828004e-06,
+ "loss": 0.0399,
+ "step": 28152
+ },
+ {
+ "epoch": 76.71117166212534,
+ "grad_norm": 2.862715244293213,
+ "learning_rate": 2.7122713373855605e-06,
+ "loss": 0.0353,
+ "step": 28153
+ },
+ {
+ "epoch": 76.71389645776567,
+ "grad_norm": 2.498589515686035,
+ "learning_rate": 2.7116670726997142e-06,
+ "loss": 0.0765,
+ "step": 28154
+ },
+ {
+ "epoch": 76.71662125340599,
+ "grad_norm": 2.568979024887085,
+ "learning_rate": 2.7110628647751704e-06,
+ "loss": 0.1366,
+ "step": 28155
+ },
+ {
+ "epoch": 76.71934604904632,
+ "grad_norm": 2.9421985149383545,
+ "learning_rate": 2.7104587136166304e-06,
+ "loss": 0.0272,
+ "step": 28156
+ },
+ {
+ "epoch": 76.72207084468666,
+ "grad_norm": 2.875525951385498,
+ "learning_rate": 2.709854619228807e-06,
+ "loss": 0.0487,
+ "step": 28157
+ },
+ {
+ "epoch": 76.72479564032697,
+ "grad_norm": 2.8808341026306152,
+ "learning_rate": 2.709250581616397e-06,
+ "loss": 0.0318,
+ "step": 28158
+ },
+ {
+ "epoch": 76.7275204359673,
+ "grad_norm": 2.8514723777770996,
+ "learning_rate": 2.7086466007841126e-06,
+ "loss": 0.1324,
+ "step": 28159
+ },
+ {
+ "epoch": 76.73024523160763,
+ "grad_norm": 3.5004167556762695,
+ "learning_rate": 2.708042676736651e-06,
+ "loss": 0.041,
+ "step": 28160
+ },
+ {
+ "epoch": 76.73297002724796,
+ "grad_norm": 1.74006986618042,
+ "learning_rate": 2.707438809478722e-06,
+ "loss": 0.0284,
+ "step": 28161
+ },
+ {
+ "epoch": 76.73569482288828,
+ "grad_norm": 2.246943950653076,
+ "learning_rate": 2.7068349990150235e-06,
+ "loss": 0.0215,
+ "step": 28162
+ },
+ {
+ "epoch": 76.73841961852861,
+ "grad_norm": 3.3550186157226562,
+ "learning_rate": 2.7062312453502606e-06,
+ "loss": 0.126,
+ "step": 28163
+ },
+ {
+ "epoch": 76.74114441416894,
+ "grad_norm": 3.6439809799194336,
+ "learning_rate": 2.70562754848913e-06,
+ "loss": 0.0873,
+ "step": 28164
+ },
+ {
+ "epoch": 76.74386920980926,
+ "grad_norm": 3.409364938735962,
+ "learning_rate": 2.7050239084363404e-06,
+ "loss": 0.2361,
+ "step": 28165
+ },
+ {
+ "epoch": 76.7465940054496,
+ "grad_norm": 3.3585925102233887,
+ "learning_rate": 2.7044203251965907e-06,
+ "loss": 0.0896,
+ "step": 28166
+ },
+ {
+ "epoch": 76.74931880108991,
+ "grad_norm": 2.680992841720581,
+ "learning_rate": 2.703816798774579e-06,
+ "loss": 0.0342,
+ "step": 28167
+ },
+ {
+ "epoch": 76.75204359673025,
+ "grad_norm": 3.4959325790405273,
+ "learning_rate": 2.703213329175006e-06,
+ "loss": 0.1762,
+ "step": 28168
+ },
+ {
+ "epoch": 76.75476839237058,
+ "grad_norm": 3.6395339965820312,
+ "learning_rate": 2.702609916402574e-06,
+ "loss": 0.1915,
+ "step": 28169
+ },
+ {
+ "epoch": 76.7574931880109,
+ "grad_norm": 3.4512598514556885,
+ "learning_rate": 2.7020065604619826e-06,
+ "loss": 0.1554,
+ "step": 28170
+ },
+ {
+ "epoch": 76.76021798365123,
+ "grad_norm": 3.1817307472229004,
+ "learning_rate": 2.701403261357929e-06,
+ "loss": 0.1507,
+ "step": 28171
+ },
+ {
+ "epoch": 76.76294277929155,
+ "grad_norm": 2.7833666801452637,
+ "learning_rate": 2.700800019095109e-06,
+ "loss": 0.0706,
+ "step": 28172
+ },
+ {
+ "epoch": 76.76566757493188,
+ "grad_norm": 2.8812572956085205,
+ "learning_rate": 2.700196833678226e-06,
+ "loss": 0.0998,
+ "step": 28173
+ },
+ {
+ "epoch": 76.7683923705722,
+ "grad_norm": 2.6217448711395264,
+ "learning_rate": 2.6995937051119747e-06,
+ "loss": 0.0408,
+ "step": 28174
+ },
+ {
+ "epoch": 76.77111716621253,
+ "grad_norm": 2.885335683822632,
+ "learning_rate": 2.6989906334010507e-06,
+ "loss": 0.0736,
+ "step": 28175
+ },
+ {
+ "epoch": 76.77384196185287,
+ "grad_norm": 2.695162057876587,
+ "learning_rate": 2.6983876185501556e-06,
+ "loss": 0.1038,
+ "step": 28176
+ },
+ {
+ "epoch": 76.77656675749319,
+ "grad_norm": 2.176483392715454,
+ "learning_rate": 2.697784660563979e-06,
+ "loss": 0.0552,
+ "step": 28177
+ },
+ {
+ "epoch": 76.77929155313352,
+ "grad_norm": 3.070734977722168,
+ "learning_rate": 2.697181759447224e-06,
+ "loss": 0.0683,
+ "step": 28178
+ },
+ {
+ "epoch": 76.78201634877384,
+ "grad_norm": 3.0700390338897705,
+ "learning_rate": 2.6965789152045818e-06,
+ "loss": 0.0523,
+ "step": 28179
+ },
+ {
+ "epoch": 76.78474114441417,
+ "grad_norm": 3.2693450450897217,
+ "learning_rate": 2.695976127840745e-06,
+ "loss": 0.0439,
+ "step": 28180
+ },
+ {
+ "epoch": 76.7874659400545,
+ "grad_norm": 3.124469041824341,
+ "learning_rate": 2.6953733973604147e-06,
+ "loss": 0.0341,
+ "step": 28181
+ },
+ {
+ "epoch": 76.79019073569482,
+ "grad_norm": 2.651022434234619,
+ "learning_rate": 2.6947707237682807e-06,
+ "loss": 0.0321,
+ "step": 28182
+ },
+ {
+ "epoch": 76.79291553133515,
+ "grad_norm": 2.7244935035705566,
+ "learning_rate": 2.6941681070690374e-06,
+ "loss": 0.1518,
+ "step": 28183
+ },
+ {
+ "epoch": 76.79564032697547,
+ "grad_norm": 2.6263954639434814,
+ "learning_rate": 2.693565547267375e-06,
+ "loss": 0.0666,
+ "step": 28184
+ },
+ {
+ "epoch": 76.7983651226158,
+ "grad_norm": 2.7580041885375977,
+ "learning_rate": 2.6929630443679923e-06,
+ "loss": 0.0497,
+ "step": 28185
+ },
+ {
+ "epoch": 76.80108991825612,
+ "grad_norm": 3.8143322467803955,
+ "learning_rate": 2.6923605983755772e-06,
+ "loss": 0.0467,
+ "step": 28186
+ },
+ {
+ "epoch": 76.80381471389646,
+ "grad_norm": 2.6981263160705566,
+ "learning_rate": 2.6917582092948235e-06,
+ "loss": 0.0385,
+ "step": 28187
+ },
+ {
+ "epoch": 76.80653950953679,
+ "grad_norm": 2.2770352363586426,
+ "learning_rate": 2.691155877130418e-06,
+ "loss": 0.097,
+ "step": 28188
+ },
+ {
+ "epoch": 76.80926430517711,
+ "grad_norm": 3.7626657485961914,
+ "learning_rate": 2.690553601887058e-06,
+ "loss": 0.0444,
+ "step": 28189
+ },
+ {
+ "epoch": 76.81198910081744,
+ "grad_norm": 3.5276734828948975,
+ "learning_rate": 2.6899513835694323e-06,
+ "loss": 0.0593,
+ "step": 28190
+ },
+ {
+ "epoch": 76.81471389645776,
+ "grad_norm": 3.3592352867126465,
+ "learning_rate": 2.6893492221822293e-06,
+ "loss": 0.062,
+ "step": 28191
+ },
+ {
+ "epoch": 76.8174386920981,
+ "grad_norm": 3.7183713912963867,
+ "learning_rate": 2.688747117730136e-06,
+ "loss": 0.1264,
+ "step": 28192
+ },
+ {
+ "epoch": 76.82016348773843,
+ "grad_norm": 2.527022123336792,
+ "learning_rate": 2.688145070217846e-06,
+ "loss": 0.0335,
+ "step": 28193
+ },
+ {
+ "epoch": 76.82288828337875,
+ "grad_norm": 1.935794711112976,
+ "learning_rate": 2.687543079650049e-06,
+ "loss": 0.0331,
+ "step": 28194
+ },
+ {
+ "epoch": 76.82561307901908,
+ "grad_norm": 3.119727611541748,
+ "learning_rate": 2.686941146031431e-06,
+ "loss": 0.0788,
+ "step": 28195
+ },
+ {
+ "epoch": 76.8283378746594,
+ "grad_norm": 1.7302227020263672,
+ "learning_rate": 2.68633926936668e-06,
+ "loss": 0.035,
+ "step": 28196
+ },
+ {
+ "epoch": 76.83106267029973,
+ "grad_norm": 1.9190800189971924,
+ "learning_rate": 2.6857374496604805e-06,
+ "loss": 0.0282,
+ "step": 28197
+ },
+ {
+ "epoch": 76.83378746594005,
+ "grad_norm": 3.658738136291504,
+ "learning_rate": 2.685135686917526e-06,
+ "loss": 0.1258,
+ "step": 28198
+ },
+ {
+ "epoch": 76.83651226158038,
+ "grad_norm": 4.712545394897461,
+ "learning_rate": 2.6845339811424987e-06,
+ "loss": 0.1422,
+ "step": 28199
+ },
+ {
+ "epoch": 76.83923705722071,
+ "grad_norm": 3.1784772872924805,
+ "learning_rate": 2.6839323323400856e-06,
+ "loss": 0.1382,
+ "step": 28200
+ },
+ {
+ "epoch": 76.84196185286103,
+ "grad_norm": 2.335515022277832,
+ "learning_rate": 2.683330740514969e-06,
+ "loss": 0.1429,
+ "step": 28201
+ },
+ {
+ "epoch": 76.84468664850137,
+ "grad_norm": 3.69903826713562,
+ "learning_rate": 2.682729205671839e-06,
+ "loss": 0.0551,
+ "step": 28202
+ },
+ {
+ "epoch": 76.84741144414168,
+ "grad_norm": 3.7585651874542236,
+ "learning_rate": 2.68212772781538e-06,
+ "loss": 0.0995,
+ "step": 28203
+ },
+ {
+ "epoch": 76.85013623978202,
+ "grad_norm": 2.2671399116516113,
+ "learning_rate": 2.6815263069502706e-06,
+ "loss": 0.142,
+ "step": 28204
+ },
+ {
+ "epoch": 76.85286103542235,
+ "grad_norm": 2.960724353790283,
+ "learning_rate": 2.6809249430812025e-06,
+ "loss": 0.1053,
+ "step": 28205
+ },
+ {
+ "epoch": 76.85558583106267,
+ "grad_norm": 2.2976996898651123,
+ "learning_rate": 2.680323636212856e-06,
+ "loss": 0.0359,
+ "step": 28206
+ },
+ {
+ "epoch": 76.858310626703,
+ "grad_norm": 2.176069974899292,
+ "learning_rate": 2.6797223863499123e-06,
+ "loss": 0.0302,
+ "step": 28207
+ },
+ {
+ "epoch": 76.86103542234332,
+ "grad_norm": 2.679279088973999,
+ "learning_rate": 2.6791211934970516e-06,
+ "loss": 0.0996,
+ "step": 28208
+ },
+ {
+ "epoch": 76.86376021798365,
+ "grad_norm": 2.479323625564575,
+ "learning_rate": 2.678520057658961e-06,
+ "loss": 0.1651,
+ "step": 28209
+ },
+ {
+ "epoch": 76.86648501362397,
+ "grad_norm": 3.211015224456787,
+ "learning_rate": 2.6779189788403226e-06,
+ "loss": 0.1225,
+ "step": 28210
+ },
+ {
+ "epoch": 76.8692098092643,
+ "grad_norm": 2.575972557067871,
+ "learning_rate": 2.677317957045815e-06,
+ "loss": 0.0479,
+ "step": 28211
+ },
+ {
+ "epoch": 76.87193460490464,
+ "grad_norm": 2.300093650817871,
+ "learning_rate": 2.6767169922801205e-06,
+ "loss": 0.0372,
+ "step": 28212
+ },
+ {
+ "epoch": 76.87465940054496,
+ "grad_norm": 3.722437858581543,
+ "learning_rate": 2.676116084547915e-06,
+ "loss": 0.0959,
+ "step": 28213
+ },
+ {
+ "epoch": 76.87738419618529,
+ "grad_norm": 2.495455741882324,
+ "learning_rate": 2.6755152338538847e-06,
+ "loss": 0.0296,
+ "step": 28214
+ },
+ {
+ "epoch": 76.88010899182561,
+ "grad_norm": 1.7627158164978027,
+ "learning_rate": 2.674914440202706e-06,
+ "loss": 0.0229,
+ "step": 28215
+ },
+ {
+ "epoch": 76.88283378746594,
+ "grad_norm": 1.7345685958862305,
+ "learning_rate": 2.6743137035990583e-06,
+ "loss": 0.0279,
+ "step": 28216
+ },
+ {
+ "epoch": 76.88555858310627,
+ "grad_norm": 3.9004459381103516,
+ "learning_rate": 2.673713024047616e-06,
+ "loss": 0.0658,
+ "step": 28217
+ },
+ {
+ "epoch": 76.88828337874659,
+ "grad_norm": 2.0879580974578857,
+ "learning_rate": 2.673112401553064e-06,
+ "loss": 0.0262,
+ "step": 28218
+ },
+ {
+ "epoch": 76.89100817438693,
+ "grad_norm": 2.071228504180908,
+ "learning_rate": 2.6725118361200775e-06,
+ "loss": 0.0816,
+ "step": 28219
+ },
+ {
+ "epoch": 76.89373297002724,
+ "grad_norm": 2.176243543624878,
+ "learning_rate": 2.6719113277533328e-06,
+ "loss": 0.0212,
+ "step": 28220
+ },
+ {
+ "epoch": 76.89645776566758,
+ "grad_norm": 3.3080270290374756,
+ "learning_rate": 2.6713108764575035e-06,
+ "loss": 0.2384,
+ "step": 28221
+ },
+ {
+ "epoch": 76.8991825613079,
+ "grad_norm": 1.9479093551635742,
+ "learning_rate": 2.670710482237272e-06,
+ "loss": 0.0732,
+ "step": 28222
+ },
+ {
+ "epoch": 76.90190735694823,
+ "grad_norm": 2.9821300506591797,
+ "learning_rate": 2.670110145097311e-06,
+ "loss": 0.0446,
+ "step": 28223
+ },
+ {
+ "epoch": 76.90463215258856,
+ "grad_norm": 2.207801580429077,
+ "learning_rate": 2.6695098650422967e-06,
+ "loss": 0.0363,
+ "step": 28224
+ },
+ {
+ "epoch": 76.90735694822888,
+ "grad_norm": 2.4613595008850098,
+ "learning_rate": 2.6689096420769013e-06,
+ "loss": 0.0281,
+ "step": 28225
+ },
+ {
+ "epoch": 76.91008174386921,
+ "grad_norm": 3.8711798191070557,
+ "learning_rate": 2.668309476205805e-06,
+ "loss": 0.0889,
+ "step": 28226
+ },
+ {
+ "epoch": 76.91280653950953,
+ "grad_norm": 2.2596654891967773,
+ "learning_rate": 2.667709367433674e-06,
+ "loss": 0.1087,
+ "step": 28227
+ },
+ {
+ "epoch": 76.91553133514986,
+ "grad_norm": 8.316119194030762,
+ "learning_rate": 2.6671093157651908e-06,
+ "loss": 0.0371,
+ "step": 28228
+ },
+ {
+ "epoch": 76.9182561307902,
+ "grad_norm": 2.0880208015441895,
+ "learning_rate": 2.6665093212050197e-06,
+ "loss": 0.1088,
+ "step": 28229
+ },
+ {
+ "epoch": 76.92098092643052,
+ "grad_norm": 3.546389102935791,
+ "learning_rate": 2.665909383757842e-06,
+ "loss": 0.0752,
+ "step": 28230
+ },
+ {
+ "epoch": 76.92370572207085,
+ "grad_norm": 2.2764501571655273,
+ "learning_rate": 2.665309503428326e-06,
+ "loss": 0.0328,
+ "step": 28231
+ },
+ {
+ "epoch": 76.92643051771117,
+ "grad_norm": 2.9497528076171875,
+ "learning_rate": 2.664709680221144e-06,
+ "loss": 0.0358,
+ "step": 28232
+ },
+ {
+ "epoch": 76.9291553133515,
+ "grad_norm": 2.4686737060546875,
+ "learning_rate": 2.664109914140963e-06,
+ "loss": 0.0261,
+ "step": 28233
+ },
+ {
+ "epoch": 76.93188010899182,
+ "grad_norm": 2.6861212253570557,
+ "learning_rate": 2.663510205192461e-06,
+ "loss": 0.1651,
+ "step": 28234
+ },
+ {
+ "epoch": 76.93460490463215,
+ "grad_norm": 2.74786376953125,
+ "learning_rate": 2.6629105533803055e-06,
+ "loss": 0.0352,
+ "step": 28235
+ },
+ {
+ "epoch": 76.93732970027249,
+ "grad_norm": 3.4205210208892822,
+ "learning_rate": 2.6623109587091665e-06,
+ "loss": 0.0706,
+ "step": 28236
+ },
+ {
+ "epoch": 76.9400544959128,
+ "grad_norm": 2.435868740081787,
+ "learning_rate": 2.66171142118371e-06,
+ "loss": 0.028,
+ "step": 28237
+ },
+ {
+ "epoch": 76.94277929155314,
+ "grad_norm": 2.9123997688293457,
+ "learning_rate": 2.6611119408086127e-06,
+ "loss": 0.1593,
+ "step": 28238
+ },
+ {
+ "epoch": 76.94550408719346,
+ "grad_norm": 2.951160192489624,
+ "learning_rate": 2.6605125175885394e-06,
+ "loss": 0.0507,
+ "step": 28239
+ },
+ {
+ "epoch": 76.94822888283379,
+ "grad_norm": 2.1408684253692627,
+ "learning_rate": 2.6599131515281586e-06,
+ "loss": 0.0346,
+ "step": 28240
+ },
+ {
+ "epoch": 76.95095367847412,
+ "grad_norm": 3.152165412902832,
+ "learning_rate": 2.659313842632134e-06,
+ "loss": 0.1153,
+ "step": 28241
+ },
+ {
+ "epoch": 76.95367847411444,
+ "grad_norm": 2.740638017654419,
+ "learning_rate": 2.6587145909051405e-06,
+ "loss": 0.0339,
+ "step": 28242
+ },
+ {
+ "epoch": 76.95640326975477,
+ "grad_norm": 2.587643623352051,
+ "learning_rate": 2.6581153963518413e-06,
+ "loss": 0.0314,
+ "step": 28243
+ },
+ {
+ "epoch": 76.95912806539509,
+ "grad_norm": 2.3162875175476074,
+ "learning_rate": 2.6575162589769e-06,
+ "loss": 0.0368,
+ "step": 28244
+ },
+ {
+ "epoch": 76.96185286103542,
+ "grad_norm": 2.167597770690918,
+ "learning_rate": 2.6569171787849867e-06,
+ "loss": 0.0902,
+ "step": 28245
+ },
+ {
+ "epoch": 76.96457765667574,
+ "grad_norm": 2.763551712036133,
+ "learning_rate": 2.656318155780768e-06,
+ "loss": 0.0383,
+ "step": 28246
+ },
+ {
+ "epoch": 76.96730245231608,
+ "grad_norm": 2.515599489212036,
+ "learning_rate": 2.6557191899689073e-06,
+ "loss": 0.0407,
+ "step": 28247
+ },
+ {
+ "epoch": 76.97002724795641,
+ "grad_norm": 3.3870689868927,
+ "learning_rate": 2.6551202813540686e-06,
+ "loss": 0.0601,
+ "step": 28248
+ },
+ {
+ "epoch": 76.97275204359673,
+ "grad_norm": 3.033858060836792,
+ "learning_rate": 2.654521429940915e-06,
+ "loss": 0.0531,
+ "step": 28249
+ },
+ {
+ "epoch": 76.97547683923706,
+ "grad_norm": 2.1676909923553467,
+ "learning_rate": 2.653922635734115e-06,
+ "loss": 0.0474,
+ "step": 28250
+ },
+ {
+ "epoch": 76.97820163487738,
+ "grad_norm": 2.9437270164489746,
+ "learning_rate": 2.6533238987383283e-06,
+ "loss": 0.0601,
+ "step": 28251
+ },
+ {
+ "epoch": 76.98092643051771,
+ "grad_norm": 2.319300413131714,
+ "learning_rate": 2.6527252189582185e-06,
+ "loss": 0.1809,
+ "step": 28252
+ },
+ {
+ "epoch": 76.98365122615803,
+ "grad_norm": 2.7304632663726807,
+ "learning_rate": 2.6521265963984467e-06,
+ "loss": 0.1882,
+ "step": 28253
+ },
+ {
+ "epoch": 76.98637602179836,
+ "grad_norm": 2.2285587787628174,
+ "learning_rate": 2.6515280310636783e-06,
+ "loss": 0.1317,
+ "step": 28254
+ },
+ {
+ "epoch": 76.9891008174387,
+ "grad_norm": 3.706568717956543,
+ "learning_rate": 2.650929522958573e-06,
+ "loss": 0.0984,
+ "step": 28255
+ },
+ {
+ "epoch": 76.99182561307902,
+ "grad_norm": 2.6711254119873047,
+ "learning_rate": 2.6503310720877928e-06,
+ "loss": 0.0777,
+ "step": 28256
+ },
+ {
+ "epoch": 76.99455040871935,
+ "grad_norm": 2.2969894409179688,
+ "learning_rate": 2.6497326784559942e-06,
+ "loss": 0.1066,
+ "step": 28257
+ },
+ {
+ "epoch": 76.99727520435967,
+ "grad_norm": 3.119093894958496,
+ "learning_rate": 2.649134342067844e-06,
+ "loss": 0.0731,
+ "step": 28258
+ },
+ {
+ "epoch": 77.0,
+ "grad_norm": 3.4760067462921143,
+ "learning_rate": 2.648536062927999e-06,
+ "loss": 0.0501,
+ "step": 28259
+ },
+ {
+ "epoch": 77.00272479564033,
+ "grad_norm": 2.6079323291778564,
+ "learning_rate": 2.6479378410411184e-06,
+ "loss": 0.0379,
+ "step": 28260
+ },
+ {
+ "epoch": 77.00544959128065,
+ "grad_norm": 2.5225589275360107,
+ "learning_rate": 2.6473396764118575e-06,
+ "loss": 0.0651,
+ "step": 28261
+ },
+ {
+ "epoch": 77.00817438692098,
+ "grad_norm": 2.607790231704712,
+ "learning_rate": 2.6467415690448795e-06,
+ "loss": 0.1128,
+ "step": 28262
+ },
+ {
+ "epoch": 77.0108991825613,
+ "grad_norm": 3.149742841720581,
+ "learning_rate": 2.646143518944845e-06,
+ "loss": 0.0402,
+ "step": 28263
+ },
+ {
+ "epoch": 77.01362397820164,
+ "grad_norm": 3.2176196575164795,
+ "learning_rate": 2.6455455261164066e-06,
+ "loss": 0.2326,
+ "step": 28264
+ },
+ {
+ "epoch": 77.01634877384195,
+ "grad_norm": 2.213528871536255,
+ "learning_rate": 2.6449475905642242e-06,
+ "loss": 0.0215,
+ "step": 28265
+ },
+ {
+ "epoch": 77.01907356948229,
+ "grad_norm": 2.8598074913024902,
+ "learning_rate": 2.6443497122929495e-06,
+ "loss": 0.0456,
+ "step": 28266
+ },
+ {
+ "epoch": 77.02179836512262,
+ "grad_norm": 2.2847464084625244,
+ "learning_rate": 2.6437518913072456e-06,
+ "loss": 0.0284,
+ "step": 28267
+ },
+ {
+ "epoch": 77.02452316076294,
+ "grad_norm": 3.0514705181121826,
+ "learning_rate": 2.6431541276117654e-06,
+ "loss": 0.0791,
+ "step": 28268
+ },
+ {
+ "epoch": 77.02724795640327,
+ "grad_norm": 2.536168098449707,
+ "learning_rate": 2.6425564212111608e-06,
+ "loss": 0.038,
+ "step": 28269
+ },
+ {
+ "epoch": 77.02997275204359,
+ "grad_norm": 2.7003395557403564,
+ "learning_rate": 2.6419587721100938e-06,
+ "loss": 0.0629,
+ "step": 28270
+ },
+ {
+ "epoch": 77.03269754768392,
+ "grad_norm": 2.958134412765503,
+ "learning_rate": 2.6413611803132146e-06,
+ "loss": 0.0738,
+ "step": 28271
+ },
+ {
+ "epoch": 77.03542234332426,
+ "grad_norm": 1.7861578464508057,
+ "learning_rate": 2.6407636458251773e-06,
+ "loss": 0.0308,
+ "step": 28272
+ },
+ {
+ "epoch": 77.03814713896458,
+ "grad_norm": 1.8519829511642456,
+ "learning_rate": 2.640166168650633e-06,
+ "loss": 0.1506,
+ "step": 28273
+ },
+ {
+ "epoch": 77.04087193460491,
+ "grad_norm": 2.518130302429199,
+ "learning_rate": 2.639568748794241e-06,
+ "loss": 0.043,
+ "step": 28274
+ },
+ {
+ "epoch": 77.04359673024523,
+ "grad_norm": 1.6704596281051636,
+ "learning_rate": 2.6389713862606513e-06,
+ "loss": 0.0183,
+ "step": 28275
+ },
+ {
+ "epoch": 77.04632152588556,
+ "grad_norm": 2.4765989780426025,
+ "learning_rate": 2.6383740810545145e-06,
+ "loss": 0.0365,
+ "step": 28276
+ },
+ {
+ "epoch": 77.04904632152588,
+ "grad_norm": 2.888434886932373,
+ "learning_rate": 2.637776833180481e-06,
+ "loss": 0.1115,
+ "step": 28277
+ },
+ {
+ "epoch": 77.05177111716621,
+ "grad_norm": 3.075648069381714,
+ "learning_rate": 2.6371796426432038e-06,
+ "loss": 0.0443,
+ "step": 28278
+ },
+ {
+ "epoch": 77.05449591280654,
+ "grad_norm": 2.9790425300598145,
+ "learning_rate": 2.6365825094473387e-06,
+ "loss": 0.1049,
+ "step": 28279
+ },
+ {
+ "epoch": 77.05722070844686,
+ "grad_norm": 1.9135756492614746,
+ "learning_rate": 2.635985433597531e-06,
+ "loss": 0.0471,
+ "step": 28280
+ },
+ {
+ "epoch": 77.0599455040872,
+ "grad_norm": 1.6832255125045776,
+ "learning_rate": 2.6353884150984322e-06,
+ "loss": 0.0177,
+ "step": 28281
+ },
+ {
+ "epoch": 77.06267029972751,
+ "grad_norm": 2.3960390090942383,
+ "learning_rate": 2.6347914539546883e-06,
+ "loss": 0.0945,
+ "step": 28282
+ },
+ {
+ "epoch": 77.06539509536785,
+ "grad_norm": 2.7573649883270264,
+ "learning_rate": 2.634194550170954e-06,
+ "loss": 0.0348,
+ "step": 28283
+ },
+ {
+ "epoch": 77.06811989100818,
+ "grad_norm": 2.5236833095550537,
+ "learning_rate": 2.6335977037518767e-06,
+ "loss": 0.0521,
+ "step": 28284
+ },
+ {
+ "epoch": 77.0708446866485,
+ "grad_norm": 2.3994863033294678,
+ "learning_rate": 2.633000914702103e-06,
+ "loss": 0.0568,
+ "step": 28285
+ },
+ {
+ "epoch": 77.07356948228883,
+ "grad_norm": 3.348933696746826,
+ "learning_rate": 2.632404183026277e-06,
+ "loss": 0.0605,
+ "step": 28286
+ },
+ {
+ "epoch": 77.07629427792915,
+ "grad_norm": 2.594438314437866,
+ "learning_rate": 2.631807508729054e-06,
+ "loss": 0.0686,
+ "step": 28287
+ },
+ {
+ "epoch": 77.07901907356948,
+ "grad_norm": 2.689310073852539,
+ "learning_rate": 2.631210891815077e-06,
+ "loss": 0.1564,
+ "step": 28288
+ },
+ {
+ "epoch": 77.0817438692098,
+ "grad_norm": 2.0371029376983643,
+ "learning_rate": 2.63061433228899e-06,
+ "loss": 0.029,
+ "step": 28289
+ },
+ {
+ "epoch": 77.08446866485014,
+ "grad_norm": 2.612265110015869,
+ "learning_rate": 2.6300178301554436e-06,
+ "loss": 0.029,
+ "step": 28290
+ },
+ {
+ "epoch": 77.08719346049047,
+ "grad_norm": 2.674476385116577,
+ "learning_rate": 2.6294213854190807e-06,
+ "loss": 0.0578,
+ "step": 28291
+ },
+ {
+ "epoch": 77.08991825613079,
+ "grad_norm": 2.713242292404175,
+ "learning_rate": 2.628824998084547e-06,
+ "loss": 0.057,
+ "step": 28292
+ },
+ {
+ "epoch": 77.09264305177112,
+ "grad_norm": 2.3643999099731445,
+ "learning_rate": 2.628228668156485e-06,
+ "loss": 0.0653,
+ "step": 28293
+ },
+ {
+ "epoch": 77.09536784741144,
+ "grad_norm": 2.3944807052612305,
+ "learning_rate": 2.6276323956395433e-06,
+ "loss": 0.0291,
+ "step": 28294
+ },
+ {
+ "epoch": 77.09809264305177,
+ "grad_norm": 1.9519646167755127,
+ "learning_rate": 2.6270361805383593e-06,
+ "loss": 0.0367,
+ "step": 28295
+ },
+ {
+ "epoch": 77.1008174386921,
+ "grad_norm": 2.5369083881378174,
+ "learning_rate": 2.626440022857585e-06,
+ "loss": 0.1256,
+ "step": 28296
+ },
+ {
+ "epoch": 77.10354223433242,
+ "grad_norm": 2.037079095840454,
+ "learning_rate": 2.6258439226018574e-06,
+ "loss": 0.0463,
+ "step": 28297
+ },
+ {
+ "epoch": 77.10626702997276,
+ "grad_norm": 3.5799801349639893,
+ "learning_rate": 2.625247879775816e-06,
+ "loss": 0.0837,
+ "step": 28298
+ },
+ {
+ "epoch": 77.10899182561307,
+ "grad_norm": 2.167036533355713,
+ "learning_rate": 2.6246518943841115e-06,
+ "loss": 0.0272,
+ "step": 28299
+ },
+ {
+ "epoch": 77.11171662125341,
+ "grad_norm": 1.9913524389266968,
+ "learning_rate": 2.6240559664313805e-06,
+ "loss": 0.1283,
+ "step": 28300
+ },
+ {
+ "epoch": 77.11444141689373,
+ "grad_norm": 3.5613033771514893,
+ "learning_rate": 2.623460095922263e-06,
+ "loss": 0.0795,
+ "step": 28301
+ },
+ {
+ "epoch": 77.11716621253406,
+ "grad_norm": 2.2153353691101074,
+ "learning_rate": 2.622864282861399e-06,
+ "loss": 0.0369,
+ "step": 28302
+ },
+ {
+ "epoch": 77.11989100817439,
+ "grad_norm": 6.166149616241455,
+ "learning_rate": 2.6222685272534333e-06,
+ "loss": 0.0724,
+ "step": 28303
+ },
+ {
+ "epoch": 77.12261580381471,
+ "grad_norm": 2.6389477252960205,
+ "learning_rate": 2.6216728291030024e-06,
+ "loss": 0.2047,
+ "step": 28304
+ },
+ {
+ "epoch": 77.12534059945504,
+ "grad_norm": 1.5879967212677002,
+ "learning_rate": 2.6210771884147468e-06,
+ "loss": 0.0274,
+ "step": 28305
+ },
+ {
+ "epoch": 77.12806539509536,
+ "grad_norm": 2.509934902191162,
+ "learning_rate": 2.620481605193301e-06,
+ "loss": 0.0383,
+ "step": 28306
+ },
+ {
+ "epoch": 77.1307901907357,
+ "grad_norm": 3.834446907043457,
+ "learning_rate": 2.61988607944331e-06,
+ "loss": 0.1499,
+ "step": 28307
+ },
+ {
+ "epoch": 77.13351498637603,
+ "grad_norm": 1.7610657215118408,
+ "learning_rate": 2.6192906111694095e-06,
+ "loss": 0.0284,
+ "step": 28308
+ },
+ {
+ "epoch": 77.13623978201635,
+ "grad_norm": 2.327150583267212,
+ "learning_rate": 2.6186952003762355e-06,
+ "loss": 0.0209,
+ "step": 28309
+ },
+ {
+ "epoch": 77.13896457765668,
+ "grad_norm": 3.574877977371216,
+ "learning_rate": 2.618099847068423e-06,
+ "loss": 0.0795,
+ "step": 28310
+ },
+ {
+ "epoch": 77.141689373297,
+ "grad_norm": 2.3875651359558105,
+ "learning_rate": 2.6175045512506138e-06,
+ "loss": 0.0315,
+ "step": 28311
+ },
+ {
+ "epoch": 77.14441416893733,
+ "grad_norm": 2.992039203643799,
+ "learning_rate": 2.6169093129274416e-06,
+ "loss": 0.0344,
+ "step": 28312
+ },
+ {
+ "epoch": 77.14713896457765,
+ "grad_norm": 3.4359548091888428,
+ "learning_rate": 2.616314132103539e-06,
+ "loss": 0.0569,
+ "step": 28313
+ },
+ {
+ "epoch": 77.14986376021798,
+ "grad_norm": 2.833533763885498,
+ "learning_rate": 2.6157190087835437e-06,
+ "loss": 0.0392,
+ "step": 28314
+ },
+ {
+ "epoch": 77.15258855585832,
+ "grad_norm": 2.8054587841033936,
+ "learning_rate": 2.6151239429720952e-06,
+ "loss": 0.0392,
+ "step": 28315
+ },
+ {
+ "epoch": 77.15531335149863,
+ "grad_norm": 2.4326376914978027,
+ "learning_rate": 2.6145289346738234e-06,
+ "loss": 0.057,
+ "step": 28316
+ },
+ {
+ "epoch": 77.15803814713897,
+ "grad_norm": 3.105372667312622,
+ "learning_rate": 2.613933983893363e-06,
+ "loss": 0.0458,
+ "step": 28317
+ },
+ {
+ "epoch": 77.16076294277929,
+ "grad_norm": 3.383669853210449,
+ "learning_rate": 2.613339090635343e-06,
+ "loss": 0.0524,
+ "step": 28318
+ },
+ {
+ "epoch": 77.16348773841962,
+ "grad_norm": 3.113739252090454,
+ "learning_rate": 2.612744254904405e-06,
+ "loss": 0.1057,
+ "step": 28319
+ },
+ {
+ "epoch": 77.16621253405995,
+ "grad_norm": 2.453718423843384,
+ "learning_rate": 2.612149476705176e-06,
+ "loss": 0.0477,
+ "step": 28320
+ },
+ {
+ "epoch": 77.16893732970027,
+ "grad_norm": 2.184514284133911,
+ "learning_rate": 2.6115547560422884e-06,
+ "loss": 0.0405,
+ "step": 28321
+ },
+ {
+ "epoch": 77.1716621253406,
+ "grad_norm": 3.3941001892089844,
+ "learning_rate": 2.6109600929203726e-06,
+ "loss": 0.0401,
+ "step": 28322
+ },
+ {
+ "epoch": 77.17438692098092,
+ "grad_norm": 2.4680778980255127,
+ "learning_rate": 2.6103654873440642e-06,
+ "loss": 0.124,
+ "step": 28323
+ },
+ {
+ "epoch": 77.17711171662125,
+ "grad_norm": 3.5254034996032715,
+ "learning_rate": 2.6097709393179915e-06,
+ "loss": 0.1141,
+ "step": 28324
+ },
+ {
+ "epoch": 77.17983651226157,
+ "grad_norm": 1.8669538497924805,
+ "learning_rate": 2.6091764488467852e-06,
+ "loss": 0.0264,
+ "step": 28325
+ },
+ {
+ "epoch": 77.1825613079019,
+ "grad_norm": 2.805007219314575,
+ "learning_rate": 2.608582015935072e-06,
+ "loss": 0.0604,
+ "step": 28326
+ },
+ {
+ "epoch": 77.18528610354224,
+ "grad_norm": 2.943263053894043,
+ "learning_rate": 2.607987640587487e-06,
+ "loss": 0.0502,
+ "step": 28327
+ },
+ {
+ "epoch": 77.18801089918256,
+ "grad_norm": 1.7465529441833496,
+ "learning_rate": 2.6073933228086568e-06,
+ "loss": 0.0792,
+ "step": 28328
+ },
+ {
+ "epoch": 77.19073569482289,
+ "grad_norm": 2.9444684982299805,
+ "learning_rate": 2.606799062603208e-06,
+ "loss": 0.0529,
+ "step": 28329
+ },
+ {
+ "epoch": 77.19346049046321,
+ "grad_norm": 3.38279128074646,
+ "learning_rate": 2.6062048599757685e-06,
+ "loss": 0.0979,
+ "step": 28330
+ },
+ {
+ "epoch": 77.19618528610354,
+ "grad_norm": 2.9587132930755615,
+ "learning_rate": 2.6056107149309673e-06,
+ "loss": 0.0893,
+ "step": 28331
+ },
+ {
+ "epoch": 77.19891008174388,
+ "grad_norm": 2.821481466293335,
+ "learning_rate": 2.6050166274734346e-06,
+ "loss": 0.1403,
+ "step": 28332
+ },
+ {
+ "epoch": 77.2016348773842,
+ "grad_norm": 2.5020580291748047,
+ "learning_rate": 2.6044225976077954e-06,
+ "loss": 0.0394,
+ "step": 28333
+ },
+ {
+ "epoch": 77.20435967302453,
+ "grad_norm": 2.6696362495422363,
+ "learning_rate": 2.6038286253386704e-06,
+ "loss": 0.0489,
+ "step": 28334
+ },
+ {
+ "epoch": 77.20708446866485,
+ "grad_norm": 3.003931760787964,
+ "learning_rate": 2.6032347106706945e-06,
+ "loss": 0.0685,
+ "step": 28335
+ },
+ {
+ "epoch": 77.20980926430518,
+ "grad_norm": 2.7271816730499268,
+ "learning_rate": 2.602640853608488e-06,
+ "loss": 0.0413,
+ "step": 28336
+ },
+ {
+ "epoch": 77.2125340599455,
+ "grad_norm": 2.33297061920166,
+ "learning_rate": 2.6020470541566757e-06,
+ "loss": 0.127,
+ "step": 28337
+ },
+ {
+ "epoch": 77.21525885558583,
+ "grad_norm": 2.468869924545288,
+ "learning_rate": 2.6014533123198803e-06,
+ "loss": 0.0863,
+ "step": 28338
+ },
+ {
+ "epoch": 77.21798365122616,
+ "grad_norm": 2.542198896408081,
+ "learning_rate": 2.600859628102732e-06,
+ "loss": 0.0531,
+ "step": 28339
+ },
+ {
+ "epoch": 77.22070844686648,
+ "grad_norm": 4.324550628662109,
+ "learning_rate": 2.60026600150985e-06,
+ "loss": 0.0866,
+ "step": 28340
+ },
+ {
+ "epoch": 77.22343324250681,
+ "grad_norm": 2.388823986053467,
+ "learning_rate": 2.5996724325458588e-06,
+ "loss": 0.0703,
+ "step": 28341
+ },
+ {
+ "epoch": 77.22615803814713,
+ "grad_norm": 2.9211771488189697,
+ "learning_rate": 2.599078921215378e-06,
+ "loss": 0.0849,
+ "step": 28342
+ },
+ {
+ "epoch": 77.22888283378747,
+ "grad_norm": 3.4782581329345703,
+ "learning_rate": 2.598485467523034e-06,
+ "loss": 0.1114,
+ "step": 28343
+ },
+ {
+ "epoch": 77.2316076294278,
+ "grad_norm": 2.142575263977051,
+ "learning_rate": 2.597892071473448e-06,
+ "loss": 0.0821,
+ "step": 28344
+ },
+ {
+ "epoch": 77.23433242506812,
+ "grad_norm": 2.9981675148010254,
+ "learning_rate": 2.5972987330712398e-06,
+ "loss": 0.0402,
+ "step": 28345
+ },
+ {
+ "epoch": 77.23705722070845,
+ "grad_norm": 2.780332565307617,
+ "learning_rate": 2.596705452321028e-06,
+ "loss": 0.0741,
+ "step": 28346
+ },
+ {
+ "epoch": 77.23978201634877,
+ "grad_norm": 2.5900814533233643,
+ "learning_rate": 2.5961122292274353e-06,
+ "loss": 0.0463,
+ "step": 28347
+ },
+ {
+ "epoch": 77.2425068119891,
+ "grad_norm": 3.1700220108032227,
+ "learning_rate": 2.5955190637950855e-06,
+ "loss": 0.0936,
+ "step": 28348
+ },
+ {
+ "epoch": 77.24523160762942,
+ "grad_norm": 3.501685619354248,
+ "learning_rate": 2.5949259560285955e-06,
+ "loss": 0.1122,
+ "step": 28349
+ },
+ {
+ "epoch": 77.24795640326975,
+ "grad_norm": 2.62182354927063,
+ "learning_rate": 2.594332905932584e-06,
+ "loss": 0.1405,
+ "step": 28350
+ },
+ {
+ "epoch": 77.25068119891009,
+ "grad_norm": 3.6526505947113037,
+ "learning_rate": 2.593739913511666e-06,
+ "loss": 0.0448,
+ "step": 28351
+ },
+ {
+ "epoch": 77.2534059945504,
+ "grad_norm": 1.768544316291809,
+ "learning_rate": 2.5931469787704656e-06,
+ "loss": 0.0274,
+ "step": 28352
+ },
+ {
+ "epoch": 77.25613079019074,
+ "grad_norm": 2.2839407920837402,
+ "learning_rate": 2.5925541017135992e-06,
+ "loss": 0.0411,
+ "step": 28353
+ },
+ {
+ "epoch": 77.25885558583106,
+ "grad_norm": 2.1834545135498047,
+ "learning_rate": 2.5919612823456795e-06,
+ "loss": 0.0223,
+ "step": 28354
+ },
+ {
+ "epoch": 77.26158038147139,
+ "grad_norm": 2.4900600910186768,
+ "learning_rate": 2.59136852067133e-06,
+ "loss": 0.1543,
+ "step": 28355
+ },
+ {
+ "epoch": 77.26430517711172,
+ "grad_norm": 1.9542450904846191,
+ "learning_rate": 2.5907758166951635e-06,
+ "loss": 0.026,
+ "step": 28356
+ },
+ {
+ "epoch": 77.26702997275204,
+ "grad_norm": 2.0919249057769775,
+ "learning_rate": 2.5901831704217973e-06,
+ "loss": 0.0234,
+ "step": 28357
+ },
+ {
+ "epoch": 77.26975476839237,
+ "grad_norm": 3.337462902069092,
+ "learning_rate": 2.589590581855843e-06,
+ "loss": 0.1082,
+ "step": 28358
+ },
+ {
+ "epoch": 77.2724795640327,
+ "grad_norm": 2.0865652561187744,
+ "learning_rate": 2.588998051001921e-06,
+ "loss": 0.0257,
+ "step": 28359
+ },
+ {
+ "epoch": 77.27520435967303,
+ "grad_norm": 2.4404172897338867,
+ "learning_rate": 2.5884055778646443e-06,
+ "loss": 0.1117,
+ "step": 28360
+ },
+ {
+ "epoch": 77.27792915531334,
+ "grad_norm": 2.837879180908203,
+ "learning_rate": 2.5878131624486256e-06,
+ "loss": 0.0444,
+ "step": 28361
+ },
+ {
+ "epoch": 77.28065395095368,
+ "grad_norm": 2.6554408073425293,
+ "learning_rate": 2.587220804758478e-06,
+ "loss": 0.0308,
+ "step": 28362
+ },
+ {
+ "epoch": 77.28337874659401,
+ "grad_norm": 2.34537935256958,
+ "learning_rate": 2.586628504798818e-06,
+ "loss": 0.0512,
+ "step": 28363
+ },
+ {
+ "epoch": 77.28610354223433,
+ "grad_norm": 3.424349546432495,
+ "learning_rate": 2.586036262574254e-06,
+ "loss": 0.0612,
+ "step": 28364
+ },
+ {
+ "epoch": 77.28882833787466,
+ "grad_norm": 3.2750487327575684,
+ "learning_rate": 2.585444078089404e-06,
+ "loss": 0.1182,
+ "step": 28365
+ },
+ {
+ "epoch": 77.29155313351498,
+ "grad_norm": 4.671356678009033,
+ "learning_rate": 2.5848519513488767e-06,
+ "loss": 0.1176,
+ "step": 28366
+ },
+ {
+ "epoch": 77.29427792915531,
+ "grad_norm": 1.9492790699005127,
+ "learning_rate": 2.5842598823572805e-06,
+ "loss": 0.1477,
+ "step": 28367
+ },
+ {
+ "epoch": 77.29700272479565,
+ "grad_norm": 2.4482572078704834,
+ "learning_rate": 2.583667871119233e-06,
+ "loss": 0.0818,
+ "step": 28368
+ },
+ {
+ "epoch": 77.29972752043597,
+ "grad_norm": 2.9148521423339844,
+ "learning_rate": 2.583075917639342e-06,
+ "loss": 0.091,
+ "step": 28369
+ },
+ {
+ "epoch": 77.3024523160763,
+ "grad_norm": 2.2485458850860596,
+ "learning_rate": 2.582484021922216e-06,
+ "loss": 0.0435,
+ "step": 28370
+ },
+ {
+ "epoch": 77.30517711171662,
+ "grad_norm": 2.246720790863037,
+ "learning_rate": 2.581892183972463e-06,
+ "loss": 0.0347,
+ "step": 28371
+ },
+ {
+ "epoch": 77.30790190735695,
+ "grad_norm": 2.415050506591797,
+ "learning_rate": 2.5813004037946986e-06,
+ "loss": 0.0427,
+ "step": 28372
+ },
+ {
+ "epoch": 77.31062670299727,
+ "grad_norm": 2.1264264583587646,
+ "learning_rate": 2.5807086813935266e-06,
+ "loss": 0.0243,
+ "step": 28373
+ },
+ {
+ "epoch": 77.3133514986376,
+ "grad_norm": 2.6624844074249268,
+ "learning_rate": 2.580117016773558e-06,
+ "loss": 0.0432,
+ "step": 28374
+ },
+ {
+ "epoch": 77.31607629427793,
+ "grad_norm": 3.3343701362609863,
+ "learning_rate": 2.5795254099393953e-06,
+ "loss": 0.2262,
+ "step": 28375
+ },
+ {
+ "epoch": 77.31880108991825,
+ "grad_norm": 3.9192686080932617,
+ "learning_rate": 2.5789338608956526e-06,
+ "loss": 0.0735,
+ "step": 28376
+ },
+ {
+ "epoch": 77.32152588555859,
+ "grad_norm": 2.675515651702881,
+ "learning_rate": 2.5783423696469356e-06,
+ "loss": 0.0828,
+ "step": 28377
+ },
+ {
+ "epoch": 77.3242506811989,
+ "grad_norm": 2.6446645259857178,
+ "learning_rate": 2.577750936197845e-06,
+ "loss": 0.0365,
+ "step": 28378
+ },
+ {
+ "epoch": 77.32697547683924,
+ "grad_norm": 2.8183844089508057,
+ "learning_rate": 2.577159560552995e-06,
+ "loss": 0.1491,
+ "step": 28379
+ },
+ {
+ "epoch": 77.32970027247957,
+ "grad_norm": 2.186535596847534,
+ "learning_rate": 2.576568242716987e-06,
+ "loss": 0.1011,
+ "step": 28380
+ },
+ {
+ "epoch": 77.33242506811989,
+ "grad_norm": 1.7282354831695557,
+ "learning_rate": 2.5759769826944236e-06,
+ "loss": 0.0212,
+ "step": 28381
+ },
+ {
+ "epoch": 77.33514986376022,
+ "grad_norm": 2.604694128036499,
+ "learning_rate": 2.5753857804899163e-06,
+ "loss": 0.0619,
+ "step": 28382
+ },
+ {
+ "epoch": 77.33787465940054,
+ "grad_norm": 2.528526544570923,
+ "learning_rate": 2.574794636108061e-06,
+ "loss": 0.0391,
+ "step": 28383
+ },
+ {
+ "epoch": 77.34059945504087,
+ "grad_norm": 2.8281095027923584,
+ "learning_rate": 2.574203549553471e-06,
+ "loss": 0.1655,
+ "step": 28384
+ },
+ {
+ "epoch": 77.34332425068119,
+ "grad_norm": 2.5194592475891113,
+ "learning_rate": 2.573612520830744e-06,
+ "loss": 0.0715,
+ "step": 28385
+ },
+ {
+ "epoch": 77.34604904632153,
+ "grad_norm": 2.8153131008148193,
+ "learning_rate": 2.573021549944483e-06,
+ "loss": 0.0998,
+ "step": 28386
+ },
+ {
+ "epoch": 77.34877384196186,
+ "grad_norm": 2.246671438217163,
+ "learning_rate": 2.5724306368992893e-06,
+ "loss": 0.0366,
+ "step": 28387
+ },
+ {
+ "epoch": 77.35149863760218,
+ "grad_norm": 2.389148473739624,
+ "learning_rate": 2.5718397816997685e-06,
+ "loss": 0.0414,
+ "step": 28388
+ },
+ {
+ "epoch": 77.35422343324251,
+ "grad_norm": 3.353811740875244,
+ "learning_rate": 2.5712489843505207e-06,
+ "loss": 0.0623,
+ "step": 28389
+ },
+ {
+ "epoch": 77.35694822888283,
+ "grad_norm": 1.9880976676940918,
+ "learning_rate": 2.570658244856147e-06,
+ "loss": 0.0815,
+ "step": 28390
+ },
+ {
+ "epoch": 77.35967302452316,
+ "grad_norm": 2.823745012283325,
+ "learning_rate": 2.5700675632212445e-06,
+ "loss": 0.044,
+ "step": 28391
+ },
+ {
+ "epoch": 77.3623978201635,
+ "grad_norm": 2.4052863121032715,
+ "learning_rate": 2.5694769394504204e-06,
+ "loss": 0.0336,
+ "step": 28392
+ },
+ {
+ "epoch": 77.36512261580381,
+ "grad_norm": 1.7629444599151611,
+ "learning_rate": 2.5688863735482706e-06,
+ "loss": 0.0214,
+ "step": 28393
+ },
+ {
+ "epoch": 77.36784741144415,
+ "grad_norm": 2.4777607917785645,
+ "learning_rate": 2.5682958655193936e-06,
+ "loss": 0.0639,
+ "step": 28394
+ },
+ {
+ "epoch": 77.37057220708446,
+ "grad_norm": 2.55159854888916,
+ "learning_rate": 2.5677054153683868e-06,
+ "loss": 0.0357,
+ "step": 28395
+ },
+ {
+ "epoch": 77.3732970027248,
+ "grad_norm": 1.5858360528945923,
+ "learning_rate": 2.567115023099854e-06,
+ "loss": 0.0222,
+ "step": 28396
+ },
+ {
+ "epoch": 77.37602179836512,
+ "grad_norm": 2.7543575763702393,
+ "learning_rate": 2.5665246887183903e-06,
+ "loss": 0.0491,
+ "step": 28397
+ },
+ {
+ "epoch": 77.37874659400545,
+ "grad_norm": 2.8959872722625732,
+ "learning_rate": 2.5659344122285902e-06,
+ "loss": 0.0356,
+ "step": 28398
+ },
+ {
+ "epoch": 77.38147138964578,
+ "grad_norm": 3.3684165477752686,
+ "learning_rate": 2.565344193635053e-06,
+ "loss": 0.0575,
+ "step": 28399
+ },
+ {
+ "epoch": 77.3841961852861,
+ "grad_norm": 2.763245105743408,
+ "learning_rate": 2.56475403294238e-06,
+ "loss": 0.0911,
+ "step": 28400
+ },
+ {
+ "epoch": 77.38692098092643,
+ "grad_norm": 3.3602499961853027,
+ "learning_rate": 2.5641639301551622e-06,
+ "loss": 0.0258,
+ "step": 28401
+ },
+ {
+ "epoch": 77.38964577656675,
+ "grad_norm": 2.2327897548675537,
+ "learning_rate": 2.563573885277998e-06,
+ "loss": 0.0354,
+ "step": 28402
+ },
+ {
+ "epoch": 77.39237057220708,
+ "grad_norm": 3.208909034729004,
+ "learning_rate": 2.5629838983154763e-06,
+ "loss": 0.0729,
+ "step": 28403
+ },
+ {
+ "epoch": 77.39509536784742,
+ "grad_norm": 3.959651231765747,
+ "learning_rate": 2.5623939692722e-06,
+ "loss": 0.0508,
+ "step": 28404
+ },
+ {
+ "epoch": 77.39782016348774,
+ "grad_norm": 3.821998357772827,
+ "learning_rate": 2.5618040981527603e-06,
+ "loss": 0.055,
+ "step": 28405
+ },
+ {
+ "epoch": 77.40054495912807,
+ "grad_norm": 3.2189230918884277,
+ "learning_rate": 2.5612142849617516e-06,
+ "loss": 0.2097,
+ "step": 28406
+ },
+ {
+ "epoch": 77.40326975476839,
+ "grad_norm": 2.05731201171875,
+ "learning_rate": 2.5606245297037624e-06,
+ "loss": 0.0259,
+ "step": 28407
+ },
+ {
+ "epoch": 77.40599455040872,
+ "grad_norm": 3.0733771324157715,
+ "learning_rate": 2.5600348323833936e-06,
+ "loss": 0.1019,
+ "step": 28408
+ },
+ {
+ "epoch": 77.40871934604904,
+ "grad_norm": 1.7058881521224976,
+ "learning_rate": 2.5594451930052346e-06,
+ "loss": 0.1188,
+ "step": 28409
+ },
+ {
+ "epoch": 77.41144414168937,
+ "grad_norm": 3.7195069789886475,
+ "learning_rate": 2.558855611573876e-06,
+ "loss": 0.0881,
+ "step": 28410
+ },
+ {
+ "epoch": 77.4141689373297,
+ "grad_norm": 2.2621467113494873,
+ "learning_rate": 2.558266088093907e-06,
+ "loss": 0.0548,
+ "step": 28411
+ },
+ {
+ "epoch": 77.41689373297002,
+ "grad_norm": 2.409527540206909,
+ "learning_rate": 2.5576766225699267e-06,
+ "loss": 0.0314,
+ "step": 28412
+ },
+ {
+ "epoch": 77.41961852861036,
+ "grad_norm": 2.0626375675201416,
+ "learning_rate": 2.557087215006521e-06,
+ "loss": 0.035,
+ "step": 28413
+ },
+ {
+ "epoch": 77.42234332425068,
+ "grad_norm": 3.906682252883911,
+ "learning_rate": 2.5564978654082794e-06,
+ "loss": 0.0733,
+ "step": 28414
+ },
+ {
+ "epoch": 77.42506811989101,
+ "grad_norm": 2.634202718734741,
+ "learning_rate": 2.5559085737797904e-06,
+ "loss": 0.0646,
+ "step": 28415
+ },
+ {
+ "epoch": 77.42779291553134,
+ "grad_norm": 2.1719534397125244,
+ "learning_rate": 2.555319340125646e-06,
+ "loss": 0.0753,
+ "step": 28416
+ },
+ {
+ "epoch": 77.43051771117166,
+ "grad_norm": 2.6878604888916016,
+ "learning_rate": 2.5547301644504386e-06,
+ "loss": 0.082,
+ "step": 28417
+ },
+ {
+ "epoch": 77.433242506812,
+ "grad_norm": 4.437887668609619,
+ "learning_rate": 2.5541410467587512e-06,
+ "loss": 0.0317,
+ "step": 28418
+ },
+ {
+ "epoch": 77.43596730245231,
+ "grad_norm": 2.2146847248077393,
+ "learning_rate": 2.5535519870551728e-06,
+ "loss": 0.0438,
+ "step": 28419
+ },
+ {
+ "epoch": 77.43869209809264,
+ "grad_norm": 5.827820301055908,
+ "learning_rate": 2.5529629853442937e-06,
+ "loss": 0.1261,
+ "step": 28420
+ },
+ {
+ "epoch": 77.44141689373296,
+ "grad_norm": 3.3244845867156982,
+ "learning_rate": 2.5523740416306995e-06,
+ "loss": 0.0577,
+ "step": 28421
+ },
+ {
+ "epoch": 77.4441416893733,
+ "grad_norm": 3.4202892780303955,
+ "learning_rate": 2.5517851559189764e-06,
+ "loss": 0.0662,
+ "step": 28422
+ },
+ {
+ "epoch": 77.44686648501363,
+ "grad_norm": 3.468672275543213,
+ "learning_rate": 2.5511963282137077e-06,
+ "loss": 0.0556,
+ "step": 28423
+ },
+ {
+ "epoch": 77.44959128065395,
+ "grad_norm": 2.372209072113037,
+ "learning_rate": 2.5506075585194856e-06,
+ "loss": 0.0378,
+ "step": 28424
+ },
+ {
+ "epoch": 77.45231607629428,
+ "grad_norm": 3.1423909664154053,
+ "learning_rate": 2.5500188468408917e-06,
+ "loss": 0.0616,
+ "step": 28425
+ },
+ {
+ "epoch": 77.4550408719346,
+ "grad_norm": 2.312046766281128,
+ "learning_rate": 2.5494301931825117e-06,
+ "loss": 0.0883,
+ "step": 28426
+ },
+ {
+ "epoch": 77.45776566757493,
+ "grad_norm": 2.011847496032715,
+ "learning_rate": 2.5488415975489266e-06,
+ "loss": 0.0862,
+ "step": 28427
+ },
+ {
+ "epoch": 77.46049046321527,
+ "grad_norm": 2.175135850906372,
+ "learning_rate": 2.5482530599447254e-06,
+ "loss": 0.0264,
+ "step": 28428
+ },
+ {
+ "epoch": 77.46321525885558,
+ "grad_norm": 3.052598714828491,
+ "learning_rate": 2.5476645803744902e-06,
+ "loss": 0.0904,
+ "step": 28429
+ },
+ {
+ "epoch": 77.46594005449592,
+ "grad_norm": 2.514087677001953,
+ "learning_rate": 2.547076158842804e-06,
+ "loss": 0.037,
+ "step": 28430
+ },
+ {
+ "epoch": 77.46866485013624,
+ "grad_norm": 3.4340426921844482,
+ "learning_rate": 2.5464877953542457e-06,
+ "loss": 0.0733,
+ "step": 28431
+ },
+ {
+ "epoch": 77.47138964577657,
+ "grad_norm": 2.293118476867676,
+ "learning_rate": 2.5458994899134024e-06,
+ "loss": 0.0403,
+ "step": 28432
+ },
+ {
+ "epoch": 77.47411444141689,
+ "grad_norm": 2.7532589435577393,
+ "learning_rate": 2.5453112425248516e-06,
+ "loss": 0.0716,
+ "step": 28433
+ },
+ {
+ "epoch": 77.47683923705722,
+ "grad_norm": 4.328482627868652,
+ "learning_rate": 2.54472305319318e-06,
+ "loss": 0.0523,
+ "step": 28434
+ },
+ {
+ "epoch": 77.47956403269755,
+ "grad_norm": 3.9203343391418457,
+ "learning_rate": 2.544134921922965e-06,
+ "loss": 0.0409,
+ "step": 28435
+ },
+ {
+ "epoch": 77.48228882833787,
+ "grad_norm": 2.15958571434021,
+ "learning_rate": 2.543546848718784e-06,
+ "loss": 0.0343,
+ "step": 28436
+ },
+ {
+ "epoch": 77.4850136239782,
+ "grad_norm": 2.3497140407562256,
+ "learning_rate": 2.542958833585224e-06,
+ "loss": 0.0417,
+ "step": 28437
+ },
+ {
+ "epoch": 77.48773841961852,
+ "grad_norm": 2.4433770179748535,
+ "learning_rate": 2.5423708765268607e-06,
+ "loss": 0.1215,
+ "step": 28438
+ },
+ {
+ "epoch": 77.49046321525886,
+ "grad_norm": 4.357604503631592,
+ "learning_rate": 2.541782977548273e-06,
+ "loss": 0.2337,
+ "step": 28439
+ },
+ {
+ "epoch": 77.49318801089919,
+ "grad_norm": 2.417895555496216,
+ "learning_rate": 2.5411951366540357e-06,
+ "loss": 0.0518,
+ "step": 28440
+ },
+ {
+ "epoch": 77.49591280653951,
+ "grad_norm": 2.396540403366089,
+ "learning_rate": 2.540607353848733e-06,
+ "loss": 0.0302,
+ "step": 28441
+ },
+ {
+ "epoch": 77.49863760217984,
+ "grad_norm": 5.14478874206543,
+ "learning_rate": 2.5400196291369417e-06,
+ "loss": 0.1045,
+ "step": 28442
+ },
+ {
+ "epoch": 77.50136239782016,
+ "grad_norm": 3.3471691608428955,
+ "learning_rate": 2.5394319625232333e-06,
+ "loss": 0.0754,
+ "step": 28443
+ },
+ {
+ "epoch": 77.50408719346049,
+ "grad_norm": 2.0748744010925293,
+ "learning_rate": 2.538844354012192e-06,
+ "loss": 0.056,
+ "step": 28444
+ },
+ {
+ "epoch": 77.50681198910081,
+ "grad_norm": 2.3002915382385254,
+ "learning_rate": 2.538256803608391e-06,
+ "loss": 0.1092,
+ "step": 28445
+ },
+ {
+ "epoch": 77.50953678474114,
+ "grad_norm": 2.032125234603882,
+ "learning_rate": 2.5376693113164062e-06,
+ "loss": 0.0223,
+ "step": 28446
+ },
+ {
+ "epoch": 77.51226158038148,
+ "grad_norm": 2.5156798362731934,
+ "learning_rate": 2.537081877140809e-06,
+ "loss": 0.0757,
+ "step": 28447
+ },
+ {
+ "epoch": 77.5149863760218,
+ "grad_norm": 2.4647250175476074,
+ "learning_rate": 2.536494501086181e-06,
+ "loss": 0.0571,
+ "step": 28448
+ },
+ {
+ "epoch": 77.51771117166213,
+ "grad_norm": 3.689142942428589,
+ "learning_rate": 2.5359071831570937e-06,
+ "loss": 0.1352,
+ "step": 28449
+ },
+ {
+ "epoch": 77.52043596730245,
+ "grad_norm": 2.561048984527588,
+ "learning_rate": 2.5353199233581184e-06,
+ "loss": 0.0277,
+ "step": 28450
+ },
+ {
+ "epoch": 77.52316076294278,
+ "grad_norm": 2.206209897994995,
+ "learning_rate": 2.534732721693833e-06,
+ "loss": 0.0263,
+ "step": 28451
+ },
+ {
+ "epoch": 77.52588555858311,
+ "grad_norm": 2.5610644817352295,
+ "learning_rate": 2.5341455781688073e-06,
+ "loss": 0.0652,
+ "step": 28452
+ },
+ {
+ "epoch": 77.52861035422343,
+ "grad_norm": 2.32920241355896,
+ "learning_rate": 2.5335584927876178e-06,
+ "loss": 0.101,
+ "step": 28453
+ },
+ {
+ "epoch": 77.53133514986376,
+ "grad_norm": 2.0175223350524902,
+ "learning_rate": 2.5329714655548352e-06,
+ "loss": 0.0839,
+ "step": 28454
+ },
+ {
+ "epoch": 77.53405994550408,
+ "grad_norm": 4.562267303466797,
+ "learning_rate": 2.53238449647503e-06,
+ "loss": 0.1799,
+ "step": 28455
+ },
+ {
+ "epoch": 77.53678474114442,
+ "grad_norm": 2.625113010406494,
+ "learning_rate": 2.531797585552771e-06,
+ "loss": 0.1283,
+ "step": 28456
+ },
+ {
+ "epoch": 77.53950953678473,
+ "grad_norm": 2.9678537845611572,
+ "learning_rate": 2.5312107327926348e-06,
+ "loss": 0.0218,
+ "step": 28457
+ },
+ {
+ "epoch": 77.54223433242507,
+ "grad_norm": 1.9777448177337646,
+ "learning_rate": 2.5306239381991893e-06,
+ "loss": 0.0483,
+ "step": 28458
+ },
+ {
+ "epoch": 77.5449591280654,
+ "grad_norm": 2.6387410163879395,
+ "learning_rate": 2.5300372017770046e-06,
+ "loss": 0.0432,
+ "step": 28459
+ },
+ {
+ "epoch": 77.54768392370572,
+ "grad_norm": 2.3963844776153564,
+ "learning_rate": 2.5294505235306465e-06,
+ "loss": 0.1325,
+ "step": 28460
+ },
+ {
+ "epoch": 77.55040871934605,
+ "grad_norm": 3.0688164234161377,
+ "learning_rate": 2.52886390346469e-06,
+ "loss": 0.085,
+ "step": 28461
+ },
+ {
+ "epoch": 77.55313351498637,
+ "grad_norm": 1.909074306488037,
+ "learning_rate": 2.5282773415837013e-06,
+ "loss": 0.0277,
+ "step": 28462
+ },
+ {
+ "epoch": 77.5558583106267,
+ "grad_norm": 2.116577625274658,
+ "learning_rate": 2.527690837892245e-06,
+ "loss": 0.0285,
+ "step": 28463
+ },
+ {
+ "epoch": 77.55858310626704,
+ "grad_norm": 3.282200336456299,
+ "learning_rate": 2.5271043923948946e-06,
+ "loss": 0.0984,
+ "step": 28464
+ },
+ {
+ "epoch": 77.56130790190736,
+ "grad_norm": 4.2497711181640625,
+ "learning_rate": 2.5265180050962147e-06,
+ "loss": 0.0449,
+ "step": 28465
+ },
+ {
+ "epoch": 77.56403269754769,
+ "grad_norm": 3.986081838607788,
+ "learning_rate": 2.5259316760007724e-06,
+ "loss": 0.0499,
+ "step": 28466
+ },
+ {
+ "epoch": 77.566757493188,
+ "grad_norm": 2.5657618045806885,
+ "learning_rate": 2.525345405113131e-06,
+ "loss": 0.0757,
+ "step": 28467
+ },
+ {
+ "epoch": 77.56948228882834,
+ "grad_norm": 6.001152038574219,
+ "learning_rate": 2.5247591924378577e-06,
+ "loss": 0.0677,
+ "step": 28468
+ },
+ {
+ "epoch": 77.57220708446866,
+ "grad_norm": 2.1566176414489746,
+ "learning_rate": 2.5241730379795235e-06,
+ "loss": 0.0281,
+ "step": 28469
+ },
+ {
+ "epoch": 77.57493188010899,
+ "grad_norm": 3.7497494220733643,
+ "learning_rate": 2.5235869417426885e-06,
+ "loss": 0.1297,
+ "step": 28470
+ },
+ {
+ "epoch": 77.57765667574932,
+ "grad_norm": 4.071877956390381,
+ "learning_rate": 2.523000903731918e-06,
+ "loss": 0.0648,
+ "step": 28471
+ },
+ {
+ "epoch": 77.58038147138964,
+ "grad_norm": 2.499847888946533,
+ "learning_rate": 2.522414923951774e-06,
+ "loss": 0.1004,
+ "step": 28472
+ },
+ {
+ "epoch": 77.58310626702998,
+ "grad_norm": 4.971376419067383,
+ "learning_rate": 2.5218290024068224e-06,
+ "loss": 0.0852,
+ "step": 28473
+ },
+ {
+ "epoch": 77.5858310626703,
+ "grad_norm": 3.4536664485931396,
+ "learning_rate": 2.521243139101628e-06,
+ "loss": 0.0426,
+ "step": 28474
+ },
+ {
+ "epoch": 77.58855585831063,
+ "grad_norm": 2.9197516441345215,
+ "learning_rate": 2.52065733404075e-06,
+ "loss": 0.0365,
+ "step": 28475
+ },
+ {
+ "epoch": 77.59128065395096,
+ "grad_norm": 2.83383846282959,
+ "learning_rate": 2.5200715872287495e-06,
+ "loss": 0.0608,
+ "step": 28476
+ },
+ {
+ "epoch": 77.59400544959128,
+ "grad_norm": 2.68898606300354,
+ "learning_rate": 2.5194858986701933e-06,
+ "loss": 0.0448,
+ "step": 28477
+ },
+ {
+ "epoch": 77.59673024523161,
+ "grad_norm": 2.6219491958618164,
+ "learning_rate": 2.5189002683696408e-06,
+ "loss": 0.0353,
+ "step": 28478
+ },
+ {
+ "epoch": 77.59945504087193,
+ "grad_norm": 2.5507733821868896,
+ "learning_rate": 2.518314696331652e-06,
+ "loss": 0.0954,
+ "step": 28479
+ },
+ {
+ "epoch": 77.60217983651226,
+ "grad_norm": 2.0204384326934814,
+ "learning_rate": 2.5177291825607843e-06,
+ "loss": 0.0526,
+ "step": 28480
+ },
+ {
+ "epoch": 77.60490463215258,
+ "grad_norm": 2.4395458698272705,
+ "learning_rate": 2.5171437270616038e-06,
+ "loss": 0.0817,
+ "step": 28481
+ },
+ {
+ "epoch": 77.60762942779292,
+ "grad_norm": 2.6209070682525635,
+ "learning_rate": 2.5165583298386673e-06,
+ "loss": 0.1323,
+ "step": 28482
+ },
+ {
+ "epoch": 77.61035422343325,
+ "grad_norm": 2.391087055206299,
+ "learning_rate": 2.5159729908965346e-06,
+ "loss": 0.222,
+ "step": 28483
+ },
+ {
+ "epoch": 77.61307901907357,
+ "grad_norm": 3.7429230213165283,
+ "learning_rate": 2.5153877102397596e-06,
+ "loss": 0.1582,
+ "step": 28484
+ },
+ {
+ "epoch": 77.6158038147139,
+ "grad_norm": 2.515198230743408,
+ "learning_rate": 2.5148024878729037e-06,
+ "loss": 0.124,
+ "step": 28485
+ },
+ {
+ "epoch": 77.61852861035422,
+ "grad_norm": 2.550065279006958,
+ "learning_rate": 2.5142173238005286e-06,
+ "loss": 0.1448,
+ "step": 28486
+ },
+ {
+ "epoch": 77.62125340599455,
+ "grad_norm": 2.8454697132110596,
+ "learning_rate": 2.5136322180271886e-06,
+ "loss": 0.0258,
+ "step": 28487
+ },
+ {
+ "epoch": 77.62397820163488,
+ "grad_norm": 3.082376003265381,
+ "learning_rate": 2.5130471705574367e-06,
+ "loss": 0.0619,
+ "step": 28488
+ },
+ {
+ "epoch": 77.6267029972752,
+ "grad_norm": 2.665174961090088,
+ "learning_rate": 2.512462181395835e-06,
+ "loss": 0.0304,
+ "step": 28489
+ },
+ {
+ "epoch": 77.62942779291554,
+ "grad_norm": 2.899925947189331,
+ "learning_rate": 2.5118772505469367e-06,
+ "loss": 0.0466,
+ "step": 28490
+ },
+ {
+ "epoch": 77.63215258855585,
+ "grad_norm": 2.897447347640991,
+ "learning_rate": 2.5112923780152975e-06,
+ "loss": 0.0399,
+ "step": 28491
+ },
+ {
+ "epoch": 77.63487738419619,
+ "grad_norm": 1.9452128410339355,
+ "learning_rate": 2.5107075638054703e-06,
+ "loss": 0.0993,
+ "step": 28492
+ },
+ {
+ "epoch": 77.6376021798365,
+ "grad_norm": 2.642165422439575,
+ "learning_rate": 2.510122807922013e-06,
+ "loss": 0.1071,
+ "step": 28493
+ },
+ {
+ "epoch": 77.64032697547684,
+ "grad_norm": 2.3399901390075684,
+ "learning_rate": 2.5095381103694794e-06,
+ "loss": 0.1992,
+ "step": 28494
+ },
+ {
+ "epoch": 77.64305177111717,
+ "grad_norm": 1.9544345140457153,
+ "learning_rate": 2.508953471152421e-06,
+ "loss": 0.0491,
+ "step": 28495
+ },
+ {
+ "epoch": 77.64577656675749,
+ "grad_norm": 2.452011823654175,
+ "learning_rate": 2.508368890275389e-06,
+ "loss": 0.0988,
+ "step": 28496
+ },
+ {
+ "epoch": 77.64850136239782,
+ "grad_norm": 2.419713258743286,
+ "learning_rate": 2.5077843677429424e-06,
+ "loss": 0.0252,
+ "step": 28497
+ },
+ {
+ "epoch": 77.65122615803814,
+ "grad_norm": 1.995934009552002,
+ "learning_rate": 2.5071999035596297e-06,
+ "loss": 0.031,
+ "step": 28498
+ },
+ {
+ "epoch": 77.65395095367847,
+ "grad_norm": 2.7805862426757812,
+ "learning_rate": 2.5066154977300027e-06,
+ "loss": 0.0597,
+ "step": 28499
+ },
+ {
+ "epoch": 77.65667574931881,
+ "grad_norm": 2.0950520038604736,
+ "learning_rate": 2.506031150258611e-06,
+ "loss": 0.0681,
+ "step": 28500
+ },
+ {
+ "epoch": 77.65940054495913,
+ "grad_norm": 2.8751299381256104,
+ "learning_rate": 2.5054468611500106e-06,
+ "loss": 0.1098,
+ "step": 28501
+ },
+ {
+ "epoch": 77.66212534059946,
+ "grad_norm": 1.9896756410598755,
+ "learning_rate": 2.5048626304087443e-06,
+ "loss": 0.051,
+ "step": 28502
+ },
+ {
+ "epoch": 77.66485013623978,
+ "grad_norm": 2.270315647125244,
+ "learning_rate": 2.504278458039371e-06,
+ "loss": 0.0659,
+ "step": 28503
+ },
+ {
+ "epoch": 77.66757493188011,
+ "grad_norm": 2.663672924041748,
+ "learning_rate": 2.5036943440464323e-06,
+ "loss": 0.0409,
+ "step": 28504
+ },
+ {
+ "epoch": 77.67029972752043,
+ "grad_norm": 2.6846094131469727,
+ "learning_rate": 2.5031102884344837e-06,
+ "loss": 0.1217,
+ "step": 28505
+ },
+ {
+ "epoch": 77.67302452316076,
+ "grad_norm": 2.4924800395965576,
+ "learning_rate": 2.5025262912080715e-06,
+ "loss": 0.0799,
+ "step": 28506
+ },
+ {
+ "epoch": 77.6757493188011,
+ "grad_norm": 3.586364507675171,
+ "learning_rate": 2.5019423523717425e-06,
+ "loss": 0.1618,
+ "step": 28507
+ },
+ {
+ "epoch": 77.67847411444141,
+ "grad_norm": 3.409531354904175,
+ "learning_rate": 2.5013584719300423e-06,
+ "loss": 0.1027,
+ "step": 28508
+ },
+ {
+ "epoch": 77.68119891008175,
+ "grad_norm": 2.3508975505828857,
+ "learning_rate": 2.500774649887524e-06,
+ "loss": 0.0678,
+ "step": 28509
+ },
+ {
+ "epoch": 77.68392370572207,
+ "grad_norm": 2.8088393211364746,
+ "learning_rate": 2.500190886248731e-06,
+ "loss": 0.0328,
+ "step": 28510
+ },
+ {
+ "epoch": 77.6866485013624,
+ "grad_norm": 2.0199978351593018,
+ "learning_rate": 2.499607181018211e-06,
+ "loss": 0.0927,
+ "step": 28511
+ },
+ {
+ "epoch": 77.68937329700273,
+ "grad_norm": 2.5782463550567627,
+ "learning_rate": 2.4990235342005056e-06,
+ "loss": 0.0284,
+ "step": 28512
+ },
+ {
+ "epoch": 77.69209809264305,
+ "grad_norm": 4.917638301849365,
+ "learning_rate": 2.4984399458001662e-06,
+ "loss": 0.14,
+ "step": 28513
+ },
+ {
+ "epoch": 77.69482288828338,
+ "grad_norm": 3.7573370933532715,
+ "learning_rate": 2.4978564158217344e-06,
+ "loss": 0.1011,
+ "step": 28514
+ },
+ {
+ "epoch": 77.6975476839237,
+ "grad_norm": 2.4647064208984375,
+ "learning_rate": 2.497272944269756e-06,
+ "loss": 0.0746,
+ "step": 28515
+ },
+ {
+ "epoch": 77.70027247956403,
+ "grad_norm": 2.724976062774658,
+ "learning_rate": 2.4966895311487716e-06,
+ "loss": 0.0434,
+ "step": 28516
+ },
+ {
+ "epoch": 77.70299727520435,
+ "grad_norm": 1.962424635887146,
+ "learning_rate": 2.496106176463331e-06,
+ "loss": 0.1256,
+ "step": 28517
+ },
+ {
+ "epoch": 77.70572207084469,
+ "grad_norm": 2.76932430267334,
+ "learning_rate": 2.495522880217973e-06,
+ "loss": 0.1447,
+ "step": 28518
+ },
+ {
+ "epoch": 77.70844686648502,
+ "grad_norm": 3.503516674041748,
+ "learning_rate": 2.494939642417239e-06,
+ "loss": 0.0959,
+ "step": 28519
+ },
+ {
+ "epoch": 77.71117166212534,
+ "grad_norm": 3.4417996406555176,
+ "learning_rate": 2.494356463065676e-06,
+ "loss": 0.1635,
+ "step": 28520
+ },
+ {
+ "epoch": 77.71389645776567,
+ "grad_norm": 2.597670316696167,
+ "learning_rate": 2.493773342167821e-06,
+ "loss": 0.0391,
+ "step": 28521
+ },
+ {
+ "epoch": 77.71662125340599,
+ "grad_norm": 2.055619955062866,
+ "learning_rate": 2.49319027972822e-06,
+ "loss": 0.03,
+ "step": 28522
+ },
+ {
+ "epoch": 77.71934604904632,
+ "grad_norm": 2.1465537548065186,
+ "learning_rate": 2.492607275751412e-06,
+ "loss": 0.059,
+ "step": 28523
+ },
+ {
+ "epoch": 77.72207084468666,
+ "grad_norm": 2.7853634357452393,
+ "learning_rate": 2.4920243302419367e-06,
+ "loss": 0.1247,
+ "step": 28524
+ },
+ {
+ "epoch": 77.72479564032697,
+ "grad_norm": 3.553372859954834,
+ "learning_rate": 2.491441443204331e-06,
+ "loss": 0.0993,
+ "step": 28525
+ },
+ {
+ "epoch": 77.7275204359673,
+ "grad_norm": 3.1164045333862305,
+ "learning_rate": 2.4908586146431413e-06,
+ "loss": 0.0721,
+ "step": 28526
+ },
+ {
+ "epoch": 77.73024523160763,
+ "grad_norm": 2.7990827560424805,
+ "learning_rate": 2.4902758445629027e-06,
+ "loss": 0.0696,
+ "step": 28527
+ },
+ {
+ "epoch": 77.73297002724796,
+ "grad_norm": 3.442732810974121,
+ "learning_rate": 2.4896931329681508e-06,
+ "loss": 0.079,
+ "step": 28528
+ },
+ {
+ "epoch": 77.73569482288828,
+ "grad_norm": 2.3545656204223633,
+ "learning_rate": 2.4891104798634303e-06,
+ "loss": 0.0855,
+ "step": 28529
+ },
+ {
+ "epoch": 77.73841961852861,
+ "grad_norm": 2.6045665740966797,
+ "learning_rate": 2.4885278852532758e-06,
+ "loss": 0.0456,
+ "step": 28530
+ },
+ {
+ "epoch": 77.74114441416894,
+ "grad_norm": 2.317164659500122,
+ "learning_rate": 2.4879453491422236e-06,
+ "loss": 0.0657,
+ "step": 28531
+ },
+ {
+ "epoch": 77.74386920980926,
+ "grad_norm": 3.0449130535125732,
+ "learning_rate": 2.4873628715348088e-06,
+ "loss": 0.106,
+ "step": 28532
+ },
+ {
+ "epoch": 77.7465940054496,
+ "grad_norm": 2.2596282958984375,
+ "learning_rate": 2.486780452435573e-06,
+ "loss": 0.0338,
+ "step": 28533
+ },
+ {
+ "epoch": 77.74931880108991,
+ "grad_norm": 2.0528342723846436,
+ "learning_rate": 2.48619809184905e-06,
+ "loss": 0.0239,
+ "step": 28534
+ },
+ {
+ "epoch": 77.75204359673025,
+ "grad_norm": 2.289703845977783,
+ "learning_rate": 2.485615789779774e-06,
+ "loss": 0.0353,
+ "step": 28535
+ },
+ {
+ "epoch": 77.75476839237058,
+ "grad_norm": 2.7122628688812256,
+ "learning_rate": 2.485033546232277e-06,
+ "loss": 0.0579,
+ "step": 28536
+ },
+ {
+ "epoch": 77.7574931880109,
+ "grad_norm": 3.519174575805664,
+ "learning_rate": 2.4844513612110977e-06,
+ "loss": 0.0473,
+ "step": 28537
+ },
+ {
+ "epoch": 77.76021798365123,
+ "grad_norm": 3.06754207611084,
+ "learning_rate": 2.4838692347207717e-06,
+ "loss": 0.0389,
+ "step": 28538
+ },
+ {
+ "epoch": 77.76294277929155,
+ "grad_norm": 2.3011691570281982,
+ "learning_rate": 2.48328716676583e-06,
+ "loss": 0.0808,
+ "step": 28539
+ },
+ {
+ "epoch": 77.76566757493188,
+ "grad_norm": 4.819763660430908,
+ "learning_rate": 2.4827051573508067e-06,
+ "loss": 0.1052,
+ "step": 28540
+ },
+ {
+ "epoch": 77.7683923705722,
+ "grad_norm": 2.2383973598480225,
+ "learning_rate": 2.482123206480229e-06,
+ "loss": 0.096,
+ "step": 28541
+ },
+ {
+ "epoch": 77.77111716621253,
+ "grad_norm": 3.0312654972076416,
+ "learning_rate": 2.4815413141586387e-06,
+ "loss": 0.2563,
+ "step": 28542
+ },
+ {
+ "epoch": 77.77384196185287,
+ "grad_norm": 4.265959739685059,
+ "learning_rate": 2.4809594803905614e-06,
+ "loss": 0.0585,
+ "step": 28543
+ },
+ {
+ "epoch": 77.77656675749319,
+ "grad_norm": 3.2749221324920654,
+ "learning_rate": 2.48037770518053e-06,
+ "loss": 0.1504,
+ "step": 28544
+ },
+ {
+ "epoch": 77.77929155313352,
+ "grad_norm": 2.5465848445892334,
+ "learning_rate": 2.4797959885330724e-06,
+ "loss": 0.0627,
+ "step": 28545
+ },
+ {
+ "epoch": 77.78201634877384,
+ "grad_norm": 3.44708514213562,
+ "learning_rate": 2.479214330452725e-06,
+ "loss": 0.255,
+ "step": 28546
+ },
+ {
+ "epoch": 77.78474114441417,
+ "grad_norm": 3.05719256401062,
+ "learning_rate": 2.4786327309440138e-06,
+ "loss": 0.1095,
+ "step": 28547
+ },
+ {
+ "epoch": 77.7874659400545,
+ "grad_norm": 3.280073642730713,
+ "learning_rate": 2.4780511900114678e-06,
+ "loss": 0.039,
+ "step": 28548
+ },
+ {
+ "epoch": 77.79019073569482,
+ "grad_norm": 3.0980327129364014,
+ "learning_rate": 2.4774697076596154e-06,
+ "loss": 0.0374,
+ "step": 28549
+ },
+ {
+ "epoch": 77.79291553133515,
+ "grad_norm": 2.5396461486816406,
+ "learning_rate": 2.47688828389299e-06,
+ "loss": 0.0234,
+ "step": 28550
+ },
+ {
+ "epoch": 77.79564032697547,
+ "grad_norm": 2.5326597690582275,
+ "learning_rate": 2.4763069187161158e-06,
+ "loss": 0.0935,
+ "step": 28551
+ },
+ {
+ "epoch": 77.7983651226158,
+ "grad_norm": 3.904620409011841,
+ "learning_rate": 2.4757256121335182e-06,
+ "loss": 0.0399,
+ "step": 28552
+ },
+ {
+ "epoch": 77.80108991825612,
+ "grad_norm": 2.865692615509033,
+ "learning_rate": 2.4751443641497307e-06,
+ "loss": 0.0881,
+ "step": 28553
+ },
+ {
+ "epoch": 77.80381471389646,
+ "grad_norm": 2.2848098278045654,
+ "learning_rate": 2.4745631747692732e-06,
+ "loss": 0.1282,
+ "step": 28554
+ },
+ {
+ "epoch": 77.80653950953679,
+ "grad_norm": 2.0827324390411377,
+ "learning_rate": 2.473982043996679e-06,
+ "loss": 0.0274,
+ "step": 28555
+ },
+ {
+ "epoch": 77.80926430517711,
+ "grad_norm": 4.4037652015686035,
+ "learning_rate": 2.4734009718364693e-06,
+ "loss": 0.0599,
+ "step": 28556
+ },
+ {
+ "epoch": 77.81198910081744,
+ "grad_norm": 3.0163779258728027,
+ "learning_rate": 2.4728199582931687e-06,
+ "loss": 0.0578,
+ "step": 28557
+ },
+ {
+ "epoch": 77.81471389645776,
+ "grad_norm": 2.8764543533325195,
+ "learning_rate": 2.4722390033713074e-06,
+ "loss": 0.1005,
+ "step": 28558
+ },
+ {
+ "epoch": 77.8174386920981,
+ "grad_norm": 3.6553354263305664,
+ "learning_rate": 2.471658107075405e-06,
+ "loss": 0.1354,
+ "step": 28559
+ },
+ {
+ "epoch": 77.82016348773843,
+ "grad_norm": 4.242199420928955,
+ "learning_rate": 2.4710772694099885e-06,
+ "loss": 0.0526,
+ "step": 28560
+ },
+ {
+ "epoch": 77.82288828337875,
+ "grad_norm": 2.175461769104004,
+ "learning_rate": 2.470496490379576e-06,
+ "loss": 0.2264,
+ "step": 28561
+ },
+ {
+ "epoch": 77.82561307901908,
+ "grad_norm": 2.97206974029541,
+ "learning_rate": 2.4699157699886977e-06,
+ "loss": 0.0428,
+ "step": 28562
+ },
+ {
+ "epoch": 77.8283378746594,
+ "grad_norm": 4.373528957366943,
+ "learning_rate": 2.4693351082418725e-06,
+ "loss": 0.1485,
+ "step": 28563
+ },
+ {
+ "epoch": 77.83106267029973,
+ "grad_norm": 2.3471200466156006,
+ "learning_rate": 2.4687545051436233e-06,
+ "loss": 0.0856,
+ "step": 28564
+ },
+ {
+ "epoch": 77.83378746594005,
+ "grad_norm": 4.146914958953857,
+ "learning_rate": 2.46817396069847e-06,
+ "loss": 0.2022,
+ "step": 28565
+ },
+ {
+ "epoch": 77.83651226158038,
+ "grad_norm": 2.7037479877471924,
+ "learning_rate": 2.4675934749109375e-06,
+ "loss": 0.0649,
+ "step": 28566
+ },
+ {
+ "epoch": 77.83923705722071,
+ "grad_norm": 2.6036858558654785,
+ "learning_rate": 2.4670130477855437e-06,
+ "loss": 0.0867,
+ "step": 28567
+ },
+ {
+ "epoch": 77.84196185286103,
+ "grad_norm": 3.4696624279022217,
+ "learning_rate": 2.466432679326811e-06,
+ "loss": 0.0988,
+ "step": 28568
+ },
+ {
+ "epoch": 77.84468664850137,
+ "grad_norm": 3.490933418273926,
+ "learning_rate": 2.4658523695392545e-06,
+ "loss": 0.1309,
+ "step": 28569
+ },
+ {
+ "epoch": 77.84741144414168,
+ "grad_norm": 4.492375373840332,
+ "learning_rate": 2.4652721184274008e-06,
+ "loss": 0.133,
+ "step": 28570
+ },
+ {
+ "epoch": 77.85013623978202,
+ "grad_norm": 3.200601577758789,
+ "learning_rate": 2.4646919259957623e-06,
+ "loss": 0.043,
+ "step": 28571
+ },
+ {
+ "epoch": 77.85286103542235,
+ "grad_norm": 2.435253143310547,
+ "learning_rate": 2.464111792248863e-06,
+ "loss": 0.0278,
+ "step": 28572
+ },
+ {
+ "epoch": 77.85558583106267,
+ "grad_norm": 3.9881691932678223,
+ "learning_rate": 2.4635317171912164e-06,
+ "loss": 0.0846,
+ "step": 28573
+ },
+ {
+ "epoch": 77.858310626703,
+ "grad_norm": 2.9328901767730713,
+ "learning_rate": 2.462951700827344e-06,
+ "loss": 0.051,
+ "step": 28574
+ },
+ {
+ "epoch": 77.86103542234332,
+ "grad_norm": 2.805507183074951,
+ "learning_rate": 2.462371743161762e-06,
+ "loss": 0.1161,
+ "step": 28575
+ },
+ {
+ "epoch": 77.86376021798365,
+ "grad_norm": 2.6177818775177,
+ "learning_rate": 2.461791844198986e-06,
+ "loss": 0.0343,
+ "step": 28576
+ },
+ {
+ "epoch": 77.86648501362397,
+ "grad_norm": 3.3624141216278076,
+ "learning_rate": 2.4612120039435306e-06,
+ "loss": 0.0402,
+ "step": 28577
+ },
+ {
+ "epoch": 77.8692098092643,
+ "grad_norm": 2.7366902828216553,
+ "learning_rate": 2.4606322223999147e-06,
+ "loss": 0.0373,
+ "step": 28578
+ },
+ {
+ "epoch": 77.87193460490464,
+ "grad_norm": 3.220646619796753,
+ "learning_rate": 2.4600524995726537e-06,
+ "loss": 0.063,
+ "step": 28579
+ },
+ {
+ "epoch": 77.87465940054496,
+ "grad_norm": 2.4427764415740967,
+ "learning_rate": 2.45947283546626e-06,
+ "loss": 0.0569,
+ "step": 28580
+ },
+ {
+ "epoch": 77.87738419618529,
+ "grad_norm": 2.1700329780578613,
+ "learning_rate": 2.4588932300852476e-06,
+ "loss": 0.0531,
+ "step": 28581
+ },
+ {
+ "epoch": 77.88010899182561,
+ "grad_norm": 3.691664457321167,
+ "learning_rate": 2.4583136834341336e-06,
+ "loss": 0.0465,
+ "step": 28582
+ },
+ {
+ "epoch": 77.88283378746594,
+ "grad_norm": 3.2681214809417725,
+ "learning_rate": 2.4577341955174307e-06,
+ "loss": 0.0373,
+ "step": 28583
+ },
+ {
+ "epoch": 77.88555858310627,
+ "grad_norm": 3.141700029373169,
+ "learning_rate": 2.4571547663396513e-06,
+ "loss": 0.0994,
+ "step": 28584
+ },
+ {
+ "epoch": 77.88828337874659,
+ "grad_norm": 2.2609872817993164,
+ "learning_rate": 2.456575395905304e-06,
+ "loss": 0.0366,
+ "step": 28585
+ },
+ {
+ "epoch": 77.89100817438693,
+ "grad_norm": 2.097759962081909,
+ "learning_rate": 2.455996084218909e-06,
+ "loss": 0.0322,
+ "step": 28586
+ },
+ {
+ "epoch": 77.89373297002724,
+ "grad_norm": 2.123995780944824,
+ "learning_rate": 2.4554168312849724e-06,
+ "loss": 0.0785,
+ "step": 28587
+ },
+ {
+ "epoch": 77.89645776566758,
+ "grad_norm": 2.2426674365997314,
+ "learning_rate": 2.454837637108004e-06,
+ "loss": 0.0409,
+ "step": 28588
+ },
+ {
+ "epoch": 77.8991825613079,
+ "grad_norm": 3.0533556938171387,
+ "learning_rate": 2.4542585016925215e-06,
+ "loss": 0.0635,
+ "step": 28589
+ },
+ {
+ "epoch": 77.90190735694823,
+ "grad_norm": 4.239056587219238,
+ "learning_rate": 2.4536794250430264e-06,
+ "loss": 0.0288,
+ "step": 28590
+ },
+ {
+ "epoch": 77.90463215258856,
+ "grad_norm": 2.0648422241210938,
+ "learning_rate": 2.453100407164036e-06,
+ "loss": 0.1212,
+ "step": 28591
+ },
+ {
+ "epoch": 77.90735694822888,
+ "grad_norm": 3.995161771774292,
+ "learning_rate": 2.4525214480600577e-06,
+ "loss": 0.0303,
+ "step": 28592
+ },
+ {
+ "epoch": 77.91008174386921,
+ "grad_norm": 2.431945323944092,
+ "learning_rate": 2.451942547735596e-06,
+ "loss": 0.0356,
+ "step": 28593
+ },
+ {
+ "epoch": 77.91280653950953,
+ "grad_norm": 2.9772019386291504,
+ "learning_rate": 2.4513637061951655e-06,
+ "loss": 0.0361,
+ "step": 28594
+ },
+ {
+ "epoch": 77.91553133514986,
+ "grad_norm": 2.962559461593628,
+ "learning_rate": 2.450784923443272e-06,
+ "loss": 0.0815,
+ "step": 28595
+ },
+ {
+ "epoch": 77.9182561307902,
+ "grad_norm": 2.871248960494995,
+ "learning_rate": 2.450206199484423e-06,
+ "loss": 0.0609,
+ "step": 28596
+ },
+ {
+ "epoch": 77.92098092643052,
+ "grad_norm": 2.7894411087036133,
+ "learning_rate": 2.4496275343231214e-06,
+ "loss": 0.0312,
+ "step": 28597
+ },
+ {
+ "epoch": 77.92370572207085,
+ "grad_norm": 2.7226953506469727,
+ "learning_rate": 2.4490489279638806e-06,
+ "loss": 0.0375,
+ "step": 28598
+ },
+ {
+ "epoch": 77.92643051771117,
+ "grad_norm": 4.2436699867248535,
+ "learning_rate": 2.448470380411204e-06,
+ "loss": 0.0745,
+ "step": 28599
+ },
+ {
+ "epoch": 77.9291553133515,
+ "grad_norm": 3.8377609252929688,
+ "learning_rate": 2.447891891669596e-06,
+ "loss": 0.0422,
+ "step": 28600
+ },
+ {
+ "epoch": 77.93188010899182,
+ "grad_norm": 4.173841953277588,
+ "learning_rate": 2.4473134617435614e-06,
+ "loss": 0.0461,
+ "step": 28601
+ },
+ {
+ "epoch": 77.93460490463215,
+ "grad_norm": 3.207427501678467,
+ "learning_rate": 2.4467350906376085e-06,
+ "loss": 0.0936,
+ "step": 28602
+ },
+ {
+ "epoch": 77.93732970027249,
+ "grad_norm": 3.2238423824310303,
+ "learning_rate": 2.44615677835624e-06,
+ "loss": 0.1035,
+ "step": 28603
+ },
+ {
+ "epoch": 77.9400544959128,
+ "grad_norm": 3.26841402053833,
+ "learning_rate": 2.44557852490396e-06,
+ "loss": 0.0754,
+ "step": 28604
+ },
+ {
+ "epoch": 77.94277929155314,
+ "grad_norm": 3.017800807952881,
+ "learning_rate": 2.4450003302852663e-06,
+ "loss": 0.1067,
+ "step": 28605
+ },
+ {
+ "epoch": 77.94550408719346,
+ "grad_norm": 2.6638243198394775,
+ "learning_rate": 2.4444221945046687e-06,
+ "loss": 0.0359,
+ "step": 28606
+ },
+ {
+ "epoch": 77.94822888283379,
+ "grad_norm": 3.491483449935913,
+ "learning_rate": 2.4438441175666706e-06,
+ "loss": 0.0686,
+ "step": 28607
+ },
+ {
+ "epoch": 77.95095367847412,
+ "grad_norm": 2.04025936126709,
+ "learning_rate": 2.4432660994757707e-06,
+ "loss": 0.0423,
+ "step": 28608
+ },
+ {
+ "epoch": 77.95367847411444,
+ "grad_norm": 2.4790706634521484,
+ "learning_rate": 2.4426881402364722e-06,
+ "loss": 0.0403,
+ "step": 28609
+ },
+ {
+ "epoch": 77.95640326975477,
+ "grad_norm": 1.964853286743164,
+ "learning_rate": 2.4421102398532716e-06,
+ "loss": 0.0282,
+ "step": 28610
+ },
+ {
+ "epoch": 77.95912806539509,
+ "grad_norm": 2.6440622806549072,
+ "learning_rate": 2.441532398330676e-06,
+ "loss": 0.1535,
+ "step": 28611
+ },
+ {
+ "epoch": 77.96185286103542,
+ "grad_norm": 2.9482619762420654,
+ "learning_rate": 2.4409546156731835e-06,
+ "loss": 0.0292,
+ "step": 28612
+ },
+ {
+ "epoch": 77.96457765667574,
+ "grad_norm": 1.9689563512802124,
+ "learning_rate": 2.4403768918852923e-06,
+ "loss": 0.0505,
+ "step": 28613
+ },
+ {
+ "epoch": 77.96730245231608,
+ "grad_norm": 3.476179361343384,
+ "learning_rate": 2.4397992269714996e-06,
+ "loss": 0.0635,
+ "step": 28614
+ },
+ {
+ "epoch": 77.97002724795641,
+ "grad_norm": 1.731796145439148,
+ "learning_rate": 2.4392216209363106e-06,
+ "loss": 0.0228,
+ "step": 28615
+ },
+ {
+ "epoch": 77.97275204359673,
+ "grad_norm": 1.4027667045593262,
+ "learning_rate": 2.438644073784221e-06,
+ "loss": 0.0183,
+ "step": 28616
+ },
+ {
+ "epoch": 77.97547683923706,
+ "grad_norm": 2.9973654747009277,
+ "learning_rate": 2.438066585519724e-06,
+ "loss": 0.0488,
+ "step": 28617
+ },
+ {
+ "epoch": 77.97820163487738,
+ "grad_norm": 2.85360050201416,
+ "learning_rate": 2.4374891561473236e-06,
+ "loss": 0.0324,
+ "step": 28618
+ },
+ {
+ "epoch": 77.98092643051771,
+ "grad_norm": 1.7630435228347778,
+ "learning_rate": 2.4369117856715152e-06,
+ "loss": 0.1123,
+ "step": 28619
+ },
+ {
+ "epoch": 77.98365122615803,
+ "grad_norm": 2.655789852142334,
+ "learning_rate": 2.436334474096794e-06,
+ "loss": 0.2556,
+ "step": 28620
+ },
+ {
+ "epoch": 77.98637602179836,
+ "grad_norm": 2.6451289653778076,
+ "learning_rate": 2.4357572214276536e-06,
+ "loss": 0.1174,
+ "step": 28621
+ },
+ {
+ "epoch": 77.9891008174387,
+ "grad_norm": 3.7719886302948,
+ "learning_rate": 2.4351800276685932e-06,
+ "loss": 0.0858,
+ "step": 28622
+ },
+ {
+ "epoch": 77.99182561307902,
+ "grad_norm": 4.808012962341309,
+ "learning_rate": 2.4346028928241095e-06,
+ "loss": 0.0458,
+ "step": 28623
+ },
+ {
+ "epoch": 77.99455040871935,
+ "grad_norm": 3.1198360919952393,
+ "learning_rate": 2.434025816898695e-06,
+ "loss": 0.0456,
+ "step": 28624
+ },
+ {
+ "epoch": 77.99727520435967,
+ "grad_norm": 2.0654773712158203,
+ "learning_rate": 2.4334487998968435e-06,
+ "loss": 0.0265,
+ "step": 28625
+ },
+ {
+ "epoch": 78.0,
+ "grad_norm": 3.193361520767212,
+ "learning_rate": 2.432871841823047e-06,
+ "loss": 0.056,
+ "step": 28626
+ },
+ {
+ "epoch": 78.00272479564033,
+ "grad_norm": 4.100928783416748,
+ "learning_rate": 2.432294942681803e-06,
+ "loss": 0.0728,
+ "step": 28627
+ },
+ {
+ "epoch": 78.00544959128065,
+ "grad_norm": 2.658005475997925,
+ "learning_rate": 2.431718102477604e-06,
+ "loss": 0.0624,
+ "step": 28628
+ },
+ {
+ "epoch": 78.00817438692098,
+ "grad_norm": 4.394220352172852,
+ "learning_rate": 2.4311413212149395e-06,
+ "loss": 0.0923,
+ "step": 28629
+ },
+ {
+ "epoch": 78.0108991825613,
+ "grad_norm": 4.086851596832275,
+ "learning_rate": 2.4305645988983007e-06,
+ "loss": 0.0847,
+ "step": 28630
+ },
+ {
+ "epoch": 78.01362397820164,
+ "grad_norm": 2.9714341163635254,
+ "learning_rate": 2.4299879355321844e-06,
+ "loss": 0.0385,
+ "step": 28631
+ },
+ {
+ "epoch": 78.01634877384195,
+ "grad_norm": 4.148153305053711,
+ "learning_rate": 2.4294113311210775e-06,
+ "loss": 0.0505,
+ "step": 28632
+ },
+ {
+ "epoch": 78.01907356948229,
+ "grad_norm": 3.036773920059204,
+ "learning_rate": 2.4288347856694718e-06,
+ "loss": 0.0606,
+ "step": 28633
+ },
+ {
+ "epoch": 78.02179836512262,
+ "grad_norm": 3.061009168624878,
+ "learning_rate": 2.428258299181854e-06,
+ "loss": 0.0309,
+ "step": 28634
+ },
+ {
+ "epoch": 78.02452316076294,
+ "grad_norm": 2.729743242263794,
+ "learning_rate": 2.4276818716627195e-06,
+ "loss": 0.0668,
+ "step": 28635
+ },
+ {
+ "epoch": 78.02724795640327,
+ "grad_norm": 2.4344239234924316,
+ "learning_rate": 2.4271055031165557e-06,
+ "loss": 0.0886,
+ "step": 28636
+ },
+ {
+ "epoch": 78.02997275204359,
+ "grad_norm": 4.145779132843018,
+ "learning_rate": 2.4265291935478472e-06,
+ "loss": 0.1251,
+ "step": 28637
+ },
+ {
+ "epoch": 78.03269754768392,
+ "grad_norm": 3.1622867584228516,
+ "learning_rate": 2.4259529429610884e-06,
+ "loss": 0.0432,
+ "step": 28638
+ },
+ {
+ "epoch": 78.03542234332426,
+ "grad_norm": 2.4364748001098633,
+ "learning_rate": 2.425376751360764e-06,
+ "loss": 0.0872,
+ "step": 28639
+ },
+ {
+ "epoch": 78.03814713896458,
+ "grad_norm": 2.948251724243164,
+ "learning_rate": 2.4248006187513597e-06,
+ "loss": 0.0499,
+ "step": 28640
+ },
+ {
+ "epoch": 78.04087193460491,
+ "grad_norm": 1.996466875076294,
+ "learning_rate": 2.4242245451373667e-06,
+ "loss": 0.0398,
+ "step": 28641
+ },
+ {
+ "epoch": 78.04359673024523,
+ "grad_norm": 3.166872262954712,
+ "learning_rate": 2.423648530523266e-06,
+ "loss": 0.1205,
+ "step": 28642
+ },
+ {
+ "epoch": 78.04632152588556,
+ "grad_norm": 2.3039448261260986,
+ "learning_rate": 2.4230725749135496e-06,
+ "loss": 0.0712,
+ "step": 28643
+ },
+ {
+ "epoch": 78.04904632152588,
+ "grad_norm": 1.8140027523040771,
+ "learning_rate": 2.4224966783127014e-06,
+ "loss": 0.0257,
+ "step": 28644
+ },
+ {
+ "epoch": 78.05177111716621,
+ "grad_norm": 3.5995044708251953,
+ "learning_rate": 2.4219208407252036e-06,
+ "loss": 0.1424,
+ "step": 28645
+ },
+ {
+ "epoch": 78.05449591280654,
+ "grad_norm": 2.4110090732574463,
+ "learning_rate": 2.42134506215554e-06,
+ "loss": 0.0586,
+ "step": 28646
+ },
+ {
+ "epoch": 78.05722070844686,
+ "grad_norm": 2.7712249755859375,
+ "learning_rate": 2.4207693426082003e-06,
+ "loss": 0.0375,
+ "step": 28647
+ },
+ {
+ "epoch": 78.0599455040872,
+ "grad_norm": 2.5217080116271973,
+ "learning_rate": 2.420193682087665e-06,
+ "loss": 0.0937,
+ "step": 28648
+ },
+ {
+ "epoch": 78.06267029972751,
+ "grad_norm": 2.138751268386841,
+ "learning_rate": 2.419618080598417e-06,
+ "loss": 0.0216,
+ "step": 28649
+ },
+ {
+ "epoch": 78.06539509536785,
+ "grad_norm": 2.249903917312622,
+ "learning_rate": 2.4190425381449366e-06,
+ "loss": 0.0235,
+ "step": 28650
+ },
+ {
+ "epoch": 78.06811989100818,
+ "grad_norm": 2.7832961082458496,
+ "learning_rate": 2.4184670547317123e-06,
+ "loss": 0.1426,
+ "step": 28651
+ },
+ {
+ "epoch": 78.0708446866485,
+ "grad_norm": 3.140596866607666,
+ "learning_rate": 2.417891630363222e-06,
+ "loss": 0.045,
+ "step": 28652
+ },
+ {
+ "epoch": 78.07356948228883,
+ "grad_norm": 3.63569712638855,
+ "learning_rate": 2.4173162650439485e-06,
+ "loss": 0.0302,
+ "step": 28653
+ },
+ {
+ "epoch": 78.07629427792915,
+ "grad_norm": 2.5194928646087646,
+ "learning_rate": 2.4167409587783676e-06,
+ "loss": 0.1044,
+ "step": 28654
+ },
+ {
+ "epoch": 78.07901907356948,
+ "grad_norm": 3.443791151046753,
+ "learning_rate": 2.416165711570968e-06,
+ "loss": 0.1248,
+ "step": 28655
+ },
+ {
+ "epoch": 78.0817438692098,
+ "grad_norm": 2.9317615032196045,
+ "learning_rate": 2.4155905234262255e-06,
+ "loss": 0.1934,
+ "step": 28656
+ },
+ {
+ "epoch": 78.08446866485014,
+ "grad_norm": 3.092083692550659,
+ "learning_rate": 2.4150153943486166e-06,
+ "loss": 0.0334,
+ "step": 28657
+ },
+ {
+ "epoch": 78.08719346049047,
+ "grad_norm": 1.6678235530853271,
+ "learning_rate": 2.414440324342624e-06,
+ "loss": 0.0247,
+ "step": 28658
+ },
+ {
+ "epoch": 78.08991825613079,
+ "grad_norm": 4.245721340179443,
+ "learning_rate": 2.413865313412729e-06,
+ "loss": 0.035,
+ "step": 28659
+ },
+ {
+ "epoch": 78.09264305177112,
+ "grad_norm": 2.952965021133423,
+ "learning_rate": 2.4132903615634073e-06,
+ "loss": 0.0525,
+ "step": 28660
+ },
+ {
+ "epoch": 78.09536784741144,
+ "grad_norm": 3.37847900390625,
+ "learning_rate": 2.412715468799135e-06,
+ "loss": 0.0291,
+ "step": 28661
+ },
+ {
+ "epoch": 78.09809264305177,
+ "grad_norm": 2.557279348373413,
+ "learning_rate": 2.412140635124388e-06,
+ "loss": 0.0285,
+ "step": 28662
+ },
+ {
+ "epoch": 78.1008174386921,
+ "grad_norm": 2.3011956214904785,
+ "learning_rate": 2.4115658605436488e-06,
+ "loss": 0.0356,
+ "step": 28663
+ },
+ {
+ "epoch": 78.10354223433242,
+ "grad_norm": 3.312464714050293,
+ "learning_rate": 2.41099114506139e-06,
+ "loss": 0.19,
+ "step": 28664
+ },
+ {
+ "epoch": 78.10626702997276,
+ "grad_norm": 3.0109522342681885,
+ "learning_rate": 2.410416488682088e-06,
+ "loss": 0.0625,
+ "step": 28665
+ },
+ {
+ "epoch": 78.10899182561307,
+ "grad_norm": 3.418283224105835,
+ "learning_rate": 2.409841891410215e-06,
+ "loss": 0.0352,
+ "step": 28666
+ },
+ {
+ "epoch": 78.11171662125341,
+ "grad_norm": 2.0435028076171875,
+ "learning_rate": 2.409267353250252e-06,
+ "loss": 0.0279,
+ "step": 28667
+ },
+ {
+ "epoch": 78.11444141689373,
+ "grad_norm": 3.5080766677856445,
+ "learning_rate": 2.408692874206672e-06,
+ "loss": 0.0999,
+ "step": 28668
+ },
+ {
+ "epoch": 78.11716621253406,
+ "grad_norm": 2.4358937740325928,
+ "learning_rate": 2.4081184542839455e-06,
+ "loss": 0.046,
+ "step": 28669
+ },
+ {
+ "epoch": 78.11989100817439,
+ "grad_norm": 2.2511494159698486,
+ "learning_rate": 2.407544093486546e-06,
+ "loss": 0.0417,
+ "step": 28670
+ },
+ {
+ "epoch": 78.12261580381471,
+ "grad_norm": 4.012392997741699,
+ "learning_rate": 2.4069697918189515e-06,
+ "loss": 0.0346,
+ "step": 28671
+ },
+ {
+ "epoch": 78.12534059945504,
+ "grad_norm": 2.87082839012146,
+ "learning_rate": 2.406395549285633e-06,
+ "loss": 0.1297,
+ "step": 28672
+ },
+ {
+ "epoch": 78.12806539509536,
+ "grad_norm": 2.527850866317749,
+ "learning_rate": 2.4058213658910602e-06,
+ "loss": 0.0732,
+ "step": 28673
+ },
+ {
+ "epoch": 78.1307901907357,
+ "grad_norm": 2.9530582427978516,
+ "learning_rate": 2.4052472416397034e-06,
+ "loss": 0.0562,
+ "step": 28674
+ },
+ {
+ "epoch": 78.13351498637603,
+ "grad_norm": 2.147108793258667,
+ "learning_rate": 2.4046731765360377e-06,
+ "loss": 0.0231,
+ "step": 28675
+ },
+ {
+ "epoch": 78.13623978201635,
+ "grad_norm": 3.0856306552886963,
+ "learning_rate": 2.404099170584534e-06,
+ "loss": 0.1795,
+ "step": 28676
+ },
+ {
+ "epoch": 78.13896457765668,
+ "grad_norm": 1.4786776304244995,
+ "learning_rate": 2.4035252237896635e-06,
+ "loss": 0.0247,
+ "step": 28677
+ },
+ {
+ "epoch": 78.141689373297,
+ "grad_norm": 2.742638111114502,
+ "learning_rate": 2.40295133615589e-06,
+ "loss": 0.0406,
+ "step": 28678
+ },
+ {
+ "epoch": 78.14441416893733,
+ "grad_norm": 1.8566851615905762,
+ "learning_rate": 2.40237750768769e-06,
+ "loss": 0.0573,
+ "step": 28679
+ },
+ {
+ "epoch": 78.14713896457765,
+ "grad_norm": 3.6054091453552246,
+ "learning_rate": 2.4018037383895287e-06,
+ "loss": 0.0728,
+ "step": 28680
+ },
+ {
+ "epoch": 78.14986376021798,
+ "grad_norm": 1.8873311281204224,
+ "learning_rate": 2.401230028265876e-06,
+ "loss": 0.0246,
+ "step": 28681
+ },
+ {
+ "epoch": 78.15258855585832,
+ "grad_norm": 2.6724722385406494,
+ "learning_rate": 2.400656377321197e-06,
+ "loss": 0.0229,
+ "step": 28682
+ },
+ {
+ "epoch": 78.15531335149863,
+ "grad_norm": 2.5824334621429443,
+ "learning_rate": 2.400082785559964e-06,
+ "loss": 0.1163,
+ "step": 28683
+ },
+ {
+ "epoch": 78.15803814713897,
+ "grad_norm": 2.8021554946899414,
+ "learning_rate": 2.3995092529866415e-06,
+ "loss": 0.0304,
+ "step": 28684
+ },
+ {
+ "epoch": 78.16076294277929,
+ "grad_norm": 2.497877359390259,
+ "learning_rate": 2.3989357796056966e-06,
+ "loss": 0.0562,
+ "step": 28685
+ },
+ {
+ "epoch": 78.16348773841962,
+ "grad_norm": 2.606130361557007,
+ "learning_rate": 2.398362365421593e-06,
+ "loss": 0.1258,
+ "step": 28686
+ },
+ {
+ "epoch": 78.16621253405995,
+ "grad_norm": 2.5798847675323486,
+ "learning_rate": 2.3977890104388002e-06,
+ "loss": 0.1724,
+ "step": 28687
+ },
+ {
+ "epoch": 78.16893732970027,
+ "grad_norm": 3.3414177894592285,
+ "learning_rate": 2.3972157146617823e-06,
+ "loss": 0.067,
+ "step": 28688
+ },
+ {
+ "epoch": 78.1716621253406,
+ "grad_norm": 2.186988592147827,
+ "learning_rate": 2.396642478095004e-06,
+ "loss": 0.0766,
+ "step": 28689
+ },
+ {
+ "epoch": 78.17438692098092,
+ "grad_norm": 3.304708480834961,
+ "learning_rate": 2.396069300742926e-06,
+ "loss": 0.0408,
+ "step": 28690
+ },
+ {
+ "epoch": 78.17711171662125,
+ "grad_norm": 2.2575109004974365,
+ "learning_rate": 2.3954961826100154e-06,
+ "loss": 0.0367,
+ "step": 28691
+ },
+ {
+ "epoch": 78.17983651226157,
+ "grad_norm": 3.3511736392974854,
+ "learning_rate": 2.3949231237007396e-06,
+ "loss": 0.0939,
+ "step": 28692
+ },
+ {
+ "epoch": 78.1825613079019,
+ "grad_norm": 2.3919754028320312,
+ "learning_rate": 2.3943501240195565e-06,
+ "loss": 0.0427,
+ "step": 28693
+ },
+ {
+ "epoch": 78.18528610354224,
+ "grad_norm": 2.78475022315979,
+ "learning_rate": 2.3937771835709313e-06,
+ "loss": 0.0657,
+ "step": 28694
+ },
+ {
+ "epoch": 78.18801089918256,
+ "grad_norm": 2.3260419368743896,
+ "learning_rate": 2.393204302359321e-06,
+ "loss": 0.0314,
+ "step": 28695
+ },
+ {
+ "epoch": 78.19073569482289,
+ "grad_norm": 3.031043767929077,
+ "learning_rate": 2.392631480389194e-06,
+ "loss": 0.1068,
+ "step": 28696
+ },
+ {
+ "epoch": 78.19346049046321,
+ "grad_norm": 2.7713918685913086,
+ "learning_rate": 2.3920587176650077e-06,
+ "loss": 0.0604,
+ "step": 28697
+ },
+ {
+ "epoch": 78.19618528610354,
+ "grad_norm": 2.4141011238098145,
+ "learning_rate": 2.3914860141912234e-06,
+ "loss": 0.0314,
+ "step": 28698
+ },
+ {
+ "epoch": 78.19891008174388,
+ "grad_norm": 2.8410580158233643,
+ "learning_rate": 2.3909133699722976e-06,
+ "loss": 0.1591,
+ "step": 28699
+ },
+ {
+ "epoch": 78.2016348773842,
+ "grad_norm": 2.6988158226013184,
+ "learning_rate": 2.390340785012697e-06,
+ "loss": 0.0617,
+ "step": 28700
+ },
+ {
+ "epoch": 78.20435967302453,
+ "grad_norm": 2.9085278511047363,
+ "learning_rate": 2.389768259316878e-06,
+ "loss": 0.1084,
+ "step": 28701
+ },
+ {
+ "epoch": 78.20708446866485,
+ "grad_norm": 2.911033868789673,
+ "learning_rate": 2.389195792889295e-06,
+ "loss": 0.0561,
+ "step": 28702
+ },
+ {
+ "epoch": 78.20980926430518,
+ "grad_norm": 3.393951892852783,
+ "learning_rate": 2.3886233857344143e-06,
+ "loss": 0.0407,
+ "step": 28703
+ },
+ {
+ "epoch": 78.2125340599455,
+ "grad_norm": 2.7640810012817383,
+ "learning_rate": 2.388051037856689e-06,
+ "loss": 0.0319,
+ "step": 28704
+ },
+ {
+ "epoch": 78.21525885558583,
+ "grad_norm": 3.228947401046753,
+ "learning_rate": 2.3874787492605765e-06,
+ "loss": 0.0586,
+ "step": 28705
+ },
+ {
+ "epoch": 78.21798365122616,
+ "grad_norm": 2.958425760269165,
+ "learning_rate": 2.3869065199505328e-06,
+ "loss": 0.1149,
+ "step": 28706
+ },
+ {
+ "epoch": 78.22070844686648,
+ "grad_norm": 2.5740206241607666,
+ "learning_rate": 2.3863343499310187e-06,
+ "loss": 0.072,
+ "step": 28707
+ },
+ {
+ "epoch": 78.22343324250681,
+ "grad_norm": 2.93585467338562,
+ "learning_rate": 2.385762239206485e-06,
+ "loss": 0.0311,
+ "step": 28708
+ },
+ {
+ "epoch": 78.22615803814713,
+ "grad_norm": 2.986391305923462,
+ "learning_rate": 2.3851901877813923e-06,
+ "loss": 0.0425,
+ "step": 28709
+ },
+ {
+ "epoch": 78.22888283378747,
+ "grad_norm": 3.4620413780212402,
+ "learning_rate": 2.384618195660193e-06,
+ "loss": 0.1551,
+ "step": 28710
+ },
+ {
+ "epoch": 78.2316076294278,
+ "grad_norm": 2.392394781112671,
+ "learning_rate": 2.3840462628473403e-06,
+ "loss": 0.1175,
+ "step": 28711
+ },
+ {
+ "epoch": 78.23433242506812,
+ "grad_norm": 2.5387089252471924,
+ "learning_rate": 2.3834743893472923e-06,
+ "loss": 0.1602,
+ "step": 28712
+ },
+ {
+ "epoch": 78.23705722070845,
+ "grad_norm": 2.3510639667510986,
+ "learning_rate": 2.382902575164501e-06,
+ "loss": 0.061,
+ "step": 28713
+ },
+ {
+ "epoch": 78.23978201634877,
+ "grad_norm": 2.9034781455993652,
+ "learning_rate": 2.382330820303419e-06,
+ "loss": 0.0475,
+ "step": 28714
+ },
+ {
+ "epoch": 78.2425068119891,
+ "grad_norm": 2.7706029415130615,
+ "learning_rate": 2.381759124768496e-06,
+ "loss": 0.0645,
+ "step": 28715
+ },
+ {
+ "epoch": 78.24523160762942,
+ "grad_norm": 2.5357940196990967,
+ "learning_rate": 2.381187488564192e-06,
+ "loss": 0.1157,
+ "step": 28716
+ },
+ {
+ "epoch": 78.24795640326975,
+ "grad_norm": 2.7941699028015137,
+ "learning_rate": 2.3806159116949536e-06,
+ "loss": 0.12,
+ "step": 28717
+ },
+ {
+ "epoch": 78.25068119891009,
+ "grad_norm": 2.7098867893218994,
+ "learning_rate": 2.380044394165233e-06,
+ "loss": 0.0565,
+ "step": 28718
+ },
+ {
+ "epoch": 78.2534059945504,
+ "grad_norm": 2.5567994117736816,
+ "learning_rate": 2.379472935979479e-06,
+ "loss": 0.0454,
+ "step": 28719
+ },
+ {
+ "epoch": 78.25613079019074,
+ "grad_norm": 2.509187698364258,
+ "learning_rate": 2.3789015371421476e-06,
+ "loss": 0.0357,
+ "step": 28720
+ },
+ {
+ "epoch": 78.25885558583106,
+ "grad_norm": 2.3222243785858154,
+ "learning_rate": 2.3783301976576854e-06,
+ "loss": 0.1334,
+ "step": 28721
+ },
+ {
+ "epoch": 78.26158038147139,
+ "grad_norm": 3.3466756343841553,
+ "learning_rate": 2.3777589175305428e-06,
+ "loss": 0.0579,
+ "step": 28722
+ },
+ {
+ "epoch": 78.26430517711172,
+ "grad_norm": 2.327862501144409,
+ "learning_rate": 2.3771876967651652e-06,
+ "loss": 0.02,
+ "step": 28723
+ },
+ {
+ "epoch": 78.26702997275204,
+ "grad_norm": 2.378955841064453,
+ "learning_rate": 2.3766165353660065e-06,
+ "loss": 0.0176,
+ "step": 28724
+ },
+ {
+ "epoch": 78.26975476839237,
+ "grad_norm": 3.090916156768799,
+ "learning_rate": 2.376045433337514e-06,
+ "loss": 0.084,
+ "step": 28725
+ },
+ {
+ "epoch": 78.2724795640327,
+ "grad_norm": 2.2813174724578857,
+ "learning_rate": 2.3754743906841316e-06,
+ "loss": 0.0248,
+ "step": 28726
+ },
+ {
+ "epoch": 78.27520435967303,
+ "grad_norm": 3.227043628692627,
+ "learning_rate": 2.3749034074103084e-06,
+ "loss": 0.0445,
+ "step": 28727
+ },
+ {
+ "epoch": 78.27792915531334,
+ "grad_norm": 3.2909417152404785,
+ "learning_rate": 2.374332483520495e-06,
+ "loss": 0.0624,
+ "step": 28728
+ },
+ {
+ "epoch": 78.28065395095368,
+ "grad_norm": 2.8302438259124756,
+ "learning_rate": 2.373761619019136e-06,
+ "loss": 0.0344,
+ "step": 28729
+ },
+ {
+ "epoch": 78.28337874659401,
+ "grad_norm": 2.969295024871826,
+ "learning_rate": 2.373190813910674e-06,
+ "loss": 0.1248,
+ "step": 28730
+ },
+ {
+ "epoch": 78.28610354223433,
+ "grad_norm": 4.589273452758789,
+ "learning_rate": 2.372620068199555e-06,
+ "loss": 0.042,
+ "step": 28731
+ },
+ {
+ "epoch": 78.28882833787466,
+ "grad_norm": 2.352987051010132,
+ "learning_rate": 2.372049381890228e-06,
+ "loss": 0.0339,
+ "step": 28732
+ },
+ {
+ "epoch": 78.29155313351498,
+ "grad_norm": 2.2704436779022217,
+ "learning_rate": 2.3714787549871355e-06,
+ "loss": 0.1835,
+ "step": 28733
+ },
+ {
+ "epoch": 78.29427792915531,
+ "grad_norm": 3.4268100261688232,
+ "learning_rate": 2.3709081874947204e-06,
+ "loss": 0.1952,
+ "step": 28734
+ },
+ {
+ "epoch": 78.29700272479565,
+ "grad_norm": 3.415231227874756,
+ "learning_rate": 2.3703376794174237e-06,
+ "loss": 0.0875,
+ "step": 28735
+ },
+ {
+ "epoch": 78.29972752043597,
+ "grad_norm": 2.6673519611358643,
+ "learning_rate": 2.3697672307596955e-06,
+ "loss": 0.1024,
+ "step": 28736
+ },
+ {
+ "epoch": 78.3024523160763,
+ "grad_norm": 2.4854893684387207,
+ "learning_rate": 2.3691968415259727e-06,
+ "loss": 0.0857,
+ "step": 28737
+ },
+ {
+ "epoch": 78.30517711171662,
+ "grad_norm": 2.290933609008789,
+ "learning_rate": 2.3686265117207007e-06,
+ "loss": 0.0839,
+ "step": 28738
+ },
+ {
+ "epoch": 78.30790190735695,
+ "grad_norm": 2.550001621246338,
+ "learning_rate": 2.3680562413483167e-06,
+ "loss": 0.0688,
+ "step": 28739
+ },
+ {
+ "epoch": 78.31062670299727,
+ "grad_norm": 2.604231119155884,
+ "learning_rate": 2.3674860304132675e-06,
+ "loss": 0.0317,
+ "step": 28740
+ },
+ {
+ "epoch": 78.3133514986376,
+ "grad_norm": 1.6347862482070923,
+ "learning_rate": 2.366915878919992e-06,
+ "loss": 0.0231,
+ "step": 28741
+ },
+ {
+ "epoch": 78.31607629427793,
+ "grad_norm": 3.765108585357666,
+ "learning_rate": 2.366345786872929e-06,
+ "loss": 0.0516,
+ "step": 28742
+ },
+ {
+ "epoch": 78.31880108991825,
+ "grad_norm": 3.561452627182007,
+ "learning_rate": 2.3657757542765145e-06,
+ "loss": 0.0322,
+ "step": 28743
+ },
+ {
+ "epoch": 78.32152588555859,
+ "grad_norm": 4.27000093460083,
+ "learning_rate": 2.3652057811351982e-06,
+ "loss": 0.0577,
+ "step": 28744
+ },
+ {
+ "epoch": 78.3242506811989,
+ "grad_norm": 2.3249168395996094,
+ "learning_rate": 2.364635867453414e-06,
+ "loss": 0.0946,
+ "step": 28745
+ },
+ {
+ "epoch": 78.32697547683924,
+ "grad_norm": 2.7798616886138916,
+ "learning_rate": 2.3640660132356e-06,
+ "loss": 0.035,
+ "step": 28746
+ },
+ {
+ "epoch": 78.32970027247957,
+ "grad_norm": 2.1884665489196777,
+ "learning_rate": 2.3634962184861897e-06,
+ "loss": 0.0337,
+ "step": 28747
+ },
+ {
+ "epoch": 78.33242506811989,
+ "grad_norm": 2.7179813385009766,
+ "learning_rate": 2.36292648320963e-06,
+ "loss": 0.0405,
+ "step": 28748
+ },
+ {
+ "epoch": 78.33514986376022,
+ "grad_norm": 2.6988346576690674,
+ "learning_rate": 2.362356807410352e-06,
+ "loss": 0.0359,
+ "step": 28749
+ },
+ {
+ "epoch": 78.33787465940054,
+ "grad_norm": 5.135148525238037,
+ "learning_rate": 2.3617871910927927e-06,
+ "loss": 0.0783,
+ "step": 28750
+ },
+ {
+ "epoch": 78.34059945504087,
+ "grad_norm": 2.046766519546509,
+ "learning_rate": 2.361217634261387e-06,
+ "loss": 0.0861,
+ "step": 28751
+ },
+ {
+ "epoch": 78.34332425068119,
+ "grad_norm": 3.113476514816284,
+ "learning_rate": 2.360648136920575e-06,
+ "loss": 0.0417,
+ "step": 28752
+ },
+ {
+ "epoch": 78.34604904632153,
+ "grad_norm": 3.2326583862304688,
+ "learning_rate": 2.360078699074789e-06,
+ "loss": 0.0532,
+ "step": 28753
+ },
+ {
+ "epoch": 78.34877384196186,
+ "grad_norm": 3.191349983215332,
+ "learning_rate": 2.3595093207284657e-06,
+ "loss": 0.2164,
+ "step": 28754
+ },
+ {
+ "epoch": 78.35149863760218,
+ "grad_norm": 2.1410105228424072,
+ "learning_rate": 2.3589400018860343e-06,
+ "loss": 0.0667,
+ "step": 28755
+ },
+ {
+ "epoch": 78.35422343324251,
+ "grad_norm": 2.7011985778808594,
+ "learning_rate": 2.3583707425519344e-06,
+ "loss": 0.0472,
+ "step": 28756
+ },
+ {
+ "epoch": 78.35694822888283,
+ "grad_norm": 2.3861894607543945,
+ "learning_rate": 2.3578015427305977e-06,
+ "loss": 0.0372,
+ "step": 28757
+ },
+ {
+ "epoch": 78.35967302452316,
+ "grad_norm": 2.214292049407959,
+ "learning_rate": 2.357232402426457e-06,
+ "loss": 0.0371,
+ "step": 28758
+ },
+ {
+ "epoch": 78.3623978201635,
+ "grad_norm": 2.59604811668396,
+ "learning_rate": 2.3566633216439416e-06,
+ "loss": 0.1263,
+ "step": 28759
+ },
+ {
+ "epoch": 78.36512261580381,
+ "grad_norm": 2.2566699981689453,
+ "learning_rate": 2.356094300387486e-06,
+ "loss": 0.0396,
+ "step": 28760
+ },
+ {
+ "epoch": 78.36784741144415,
+ "grad_norm": 3.471081256866455,
+ "learning_rate": 2.355525338661524e-06,
+ "loss": 0.0435,
+ "step": 28761
+ },
+ {
+ "epoch": 78.37057220708446,
+ "grad_norm": 2.0240402221679688,
+ "learning_rate": 2.3549564364704856e-06,
+ "loss": 0.0403,
+ "step": 28762
+ },
+ {
+ "epoch": 78.3732970027248,
+ "grad_norm": 3.4439470767974854,
+ "learning_rate": 2.3543875938187997e-06,
+ "loss": 0.1056,
+ "step": 28763
+ },
+ {
+ "epoch": 78.37602179836512,
+ "grad_norm": 10.956733703613281,
+ "learning_rate": 2.353818810710895e-06,
+ "loss": 0.1349,
+ "step": 28764
+ },
+ {
+ "epoch": 78.37874659400545,
+ "grad_norm": 2.729780435562134,
+ "learning_rate": 2.3532500871512054e-06,
+ "loss": 0.0398,
+ "step": 28765
+ },
+ {
+ "epoch": 78.38147138964578,
+ "grad_norm": 2.260324478149414,
+ "learning_rate": 2.3526814231441586e-06,
+ "loss": 0.032,
+ "step": 28766
+ },
+ {
+ "epoch": 78.3841961852861,
+ "grad_norm": 2.290607213973999,
+ "learning_rate": 2.35211281869418e-06,
+ "loss": 0.0474,
+ "step": 28767
+ },
+ {
+ "epoch": 78.38692098092643,
+ "grad_norm": 2.24245548248291,
+ "learning_rate": 2.3515442738057027e-06,
+ "loss": 0.0325,
+ "step": 28768
+ },
+ {
+ "epoch": 78.38964577656675,
+ "grad_norm": 2.8790132999420166,
+ "learning_rate": 2.350975788483153e-06,
+ "loss": 0.083,
+ "step": 28769
+ },
+ {
+ "epoch": 78.39237057220708,
+ "grad_norm": 3.1960229873657227,
+ "learning_rate": 2.3504073627309575e-06,
+ "loss": 0.0376,
+ "step": 28770
+ },
+ {
+ "epoch": 78.39509536784742,
+ "grad_norm": 2.145268440246582,
+ "learning_rate": 2.3498389965535406e-06,
+ "loss": 0.1345,
+ "step": 28771
+ },
+ {
+ "epoch": 78.39782016348774,
+ "grad_norm": 2.2832589149475098,
+ "learning_rate": 2.3492706899553354e-06,
+ "loss": 0.0894,
+ "step": 28772
+ },
+ {
+ "epoch": 78.40054495912807,
+ "grad_norm": 2.4074416160583496,
+ "learning_rate": 2.3487024429407625e-06,
+ "loss": 0.1127,
+ "step": 28773
+ },
+ {
+ "epoch": 78.40326975476839,
+ "grad_norm": 3.619366407394409,
+ "learning_rate": 2.3481342555142484e-06,
+ "loss": 0.1049,
+ "step": 28774
+ },
+ {
+ "epoch": 78.40599455040872,
+ "grad_norm": 2.3534491062164307,
+ "learning_rate": 2.3475661276802164e-06,
+ "loss": 0.0329,
+ "step": 28775
+ },
+ {
+ "epoch": 78.40871934604904,
+ "grad_norm": 3.1109061241149902,
+ "learning_rate": 2.346998059443095e-06,
+ "loss": 0.0492,
+ "step": 28776
+ },
+ {
+ "epoch": 78.41144414168937,
+ "grad_norm": 2.226891279220581,
+ "learning_rate": 2.3464300508073046e-06,
+ "loss": 0.1112,
+ "step": 28777
+ },
+ {
+ "epoch": 78.4141689373297,
+ "grad_norm": 3.561785936355591,
+ "learning_rate": 2.3458621017772733e-06,
+ "loss": 0.111,
+ "step": 28778
+ },
+ {
+ "epoch": 78.41689373297002,
+ "grad_norm": 1.934870719909668,
+ "learning_rate": 2.3452942123574208e-06,
+ "loss": 0.1072,
+ "step": 28779
+ },
+ {
+ "epoch": 78.41961852861036,
+ "grad_norm": 3.1643896102905273,
+ "learning_rate": 2.344726382552168e-06,
+ "loss": 0.0567,
+ "step": 28780
+ },
+ {
+ "epoch": 78.42234332425068,
+ "grad_norm": 2.6465632915496826,
+ "learning_rate": 2.3441586123659434e-06,
+ "loss": 0.3397,
+ "step": 28781
+ },
+ {
+ "epoch": 78.42506811989101,
+ "grad_norm": 2.2327096462249756,
+ "learning_rate": 2.3435909018031645e-06,
+ "loss": 0.0273,
+ "step": 28782
+ },
+ {
+ "epoch": 78.42779291553134,
+ "grad_norm": 2.1167855262756348,
+ "learning_rate": 2.3430232508682525e-06,
+ "loss": 0.0499,
+ "step": 28783
+ },
+ {
+ "epoch": 78.43051771117166,
+ "grad_norm": 2.2226626873016357,
+ "learning_rate": 2.3424556595656276e-06,
+ "loss": 0.0219,
+ "step": 28784
+ },
+ {
+ "epoch": 78.433242506812,
+ "grad_norm": 1.781945824623108,
+ "learning_rate": 2.341888127899714e-06,
+ "loss": 0.0151,
+ "step": 28785
+ },
+ {
+ "epoch": 78.43596730245231,
+ "grad_norm": 2.4531352519989014,
+ "learning_rate": 2.341320655874929e-06,
+ "loss": 0.0362,
+ "step": 28786
+ },
+ {
+ "epoch": 78.43869209809264,
+ "grad_norm": 5.346907138824463,
+ "learning_rate": 2.3407532434956913e-06,
+ "loss": 0.0654,
+ "step": 28787
+ },
+ {
+ "epoch": 78.44141689373296,
+ "grad_norm": 2.3232154846191406,
+ "learning_rate": 2.34018589076642e-06,
+ "loss": 0.1128,
+ "step": 28788
+ },
+ {
+ "epoch": 78.4441416893733,
+ "grad_norm": 2.272002696990967,
+ "learning_rate": 2.3396185976915355e-06,
+ "loss": 0.0318,
+ "step": 28789
+ },
+ {
+ "epoch": 78.44686648501363,
+ "grad_norm": 2.511538028717041,
+ "learning_rate": 2.3390513642754555e-06,
+ "loss": 0.0739,
+ "step": 28790
+ },
+ {
+ "epoch": 78.44959128065395,
+ "grad_norm": 5.701254367828369,
+ "learning_rate": 2.338484190522594e-06,
+ "loss": 0.0444,
+ "step": 28791
+ },
+ {
+ "epoch": 78.45231607629428,
+ "grad_norm": 3.599649429321289,
+ "learning_rate": 2.3379170764373737e-06,
+ "loss": 0.0984,
+ "step": 28792
+ },
+ {
+ "epoch": 78.4550408719346,
+ "grad_norm": 3.17618989944458,
+ "learning_rate": 2.3373500220242095e-06,
+ "loss": 0.0459,
+ "step": 28793
+ },
+ {
+ "epoch": 78.45776566757493,
+ "grad_norm": 2.0977768898010254,
+ "learning_rate": 2.3367830272875136e-06,
+ "loss": 0.1065,
+ "step": 28794
+ },
+ {
+ "epoch": 78.46049046321527,
+ "grad_norm": 2.5540215969085693,
+ "learning_rate": 2.336216092231707e-06,
+ "loss": 0.0894,
+ "step": 28795
+ },
+ {
+ "epoch": 78.46321525885558,
+ "grad_norm": 2.071661949157715,
+ "learning_rate": 2.3356492168612e-06,
+ "loss": 0.1047,
+ "step": 28796
+ },
+ {
+ "epoch": 78.46594005449592,
+ "grad_norm": 6.077733516693115,
+ "learning_rate": 2.335082401180413e-06,
+ "loss": 0.0467,
+ "step": 28797
+ },
+ {
+ "epoch": 78.46866485013624,
+ "grad_norm": 3.6167330741882324,
+ "learning_rate": 2.3345156451937577e-06,
+ "loss": 0.0438,
+ "step": 28798
+ },
+ {
+ "epoch": 78.47138964577657,
+ "grad_norm": 2.4257559776306152,
+ "learning_rate": 2.333948948905649e-06,
+ "loss": 0.0466,
+ "step": 28799
+ },
+ {
+ "epoch": 78.47411444141689,
+ "grad_norm": 2.514841318130493,
+ "learning_rate": 2.3333823123204946e-06,
+ "loss": 0.0828,
+ "step": 28800
+ },
+ {
+ "epoch": 78.47683923705722,
+ "grad_norm": 2.6107676029205322,
+ "learning_rate": 2.332815735442716e-06,
+ "loss": 0.1185,
+ "step": 28801
+ },
+ {
+ "epoch": 78.47956403269755,
+ "grad_norm": 4.774962425231934,
+ "learning_rate": 2.332249218276721e-06,
+ "loss": 0.1953,
+ "step": 28802
+ },
+ {
+ "epoch": 78.48228882833787,
+ "grad_norm": 2.341609477996826,
+ "learning_rate": 2.3316827608269233e-06,
+ "loss": 0.0344,
+ "step": 28803
+ },
+ {
+ "epoch": 78.4850136239782,
+ "grad_norm": 2.3848965167999268,
+ "learning_rate": 2.3311163630977296e-06,
+ "loss": 0.0329,
+ "step": 28804
+ },
+ {
+ "epoch": 78.48773841961852,
+ "grad_norm": 2.820605993270874,
+ "learning_rate": 2.3305500250935574e-06,
+ "loss": 0.1103,
+ "step": 28805
+ },
+ {
+ "epoch": 78.49046321525886,
+ "grad_norm": 3.5609471797943115,
+ "learning_rate": 2.3299837468188156e-06,
+ "loss": 0.0772,
+ "step": 28806
+ },
+ {
+ "epoch": 78.49318801089919,
+ "grad_norm": 2.606863498687744,
+ "learning_rate": 2.329417528277914e-06,
+ "loss": 0.0339,
+ "step": 28807
+ },
+ {
+ "epoch": 78.49591280653951,
+ "grad_norm": 2.2633886337280273,
+ "learning_rate": 2.328851369475258e-06,
+ "loss": 0.0802,
+ "step": 28808
+ },
+ {
+ "epoch": 78.49863760217984,
+ "grad_norm": 2.9578235149383545,
+ "learning_rate": 2.3282852704152638e-06,
+ "loss": 0.0504,
+ "step": 28809
+ },
+ {
+ "epoch": 78.50136239782016,
+ "grad_norm": 4.267442226409912,
+ "learning_rate": 2.3277192311023366e-06,
+ "loss": 0.0799,
+ "step": 28810
+ },
+ {
+ "epoch": 78.50408719346049,
+ "grad_norm": 2.333279848098755,
+ "learning_rate": 2.3271532515408825e-06,
+ "loss": 0.062,
+ "step": 28811
+ },
+ {
+ "epoch": 78.50681198910081,
+ "grad_norm": 2.689195394515991,
+ "learning_rate": 2.326587331735313e-06,
+ "loss": 0.2114,
+ "step": 28812
+ },
+ {
+ "epoch": 78.50953678474114,
+ "grad_norm": 2.947387218475342,
+ "learning_rate": 2.3260214716900353e-06,
+ "loss": 0.1225,
+ "step": 28813
+ },
+ {
+ "epoch": 78.51226158038148,
+ "grad_norm": 2.5247998237609863,
+ "learning_rate": 2.325455671409457e-06,
+ "loss": 0.1136,
+ "step": 28814
+ },
+ {
+ "epoch": 78.5149863760218,
+ "grad_norm": 3.2816948890686035,
+ "learning_rate": 2.324889930897982e-06,
+ "loss": 0.1286,
+ "step": 28815
+ },
+ {
+ "epoch": 78.51771117166213,
+ "grad_norm": 3.0933926105499268,
+ "learning_rate": 2.324324250160015e-06,
+ "loss": 0.2823,
+ "step": 28816
+ },
+ {
+ "epoch": 78.52043596730245,
+ "grad_norm": 3.2287774085998535,
+ "learning_rate": 2.3237586291999657e-06,
+ "loss": 0.0517,
+ "step": 28817
+ },
+ {
+ "epoch": 78.52316076294278,
+ "grad_norm": 2.898211717605591,
+ "learning_rate": 2.323193068022238e-06,
+ "loss": 0.0798,
+ "step": 28818
+ },
+ {
+ "epoch": 78.52588555858311,
+ "grad_norm": 3.3788342475891113,
+ "learning_rate": 2.3226275666312346e-06,
+ "loss": 0.0695,
+ "step": 28819
+ },
+ {
+ "epoch": 78.52861035422343,
+ "grad_norm": 2.0427491664886475,
+ "learning_rate": 2.322062125031359e-06,
+ "loss": 0.0794,
+ "step": 28820
+ },
+ {
+ "epoch": 78.53133514986376,
+ "grad_norm": 4.412542343139648,
+ "learning_rate": 2.3214967432270187e-06,
+ "loss": 0.0426,
+ "step": 28821
+ },
+ {
+ "epoch": 78.53405994550408,
+ "grad_norm": 3.6098456382751465,
+ "learning_rate": 2.3209314212226143e-06,
+ "loss": 0.0804,
+ "step": 28822
+ },
+ {
+ "epoch": 78.53678474114442,
+ "grad_norm": 3.7335867881774902,
+ "learning_rate": 2.320366159022549e-06,
+ "loss": 0.0569,
+ "step": 28823
+ },
+ {
+ "epoch": 78.53950953678473,
+ "grad_norm": 2.3873815536499023,
+ "learning_rate": 2.319800956631222e-06,
+ "loss": 0.1644,
+ "step": 28824
+ },
+ {
+ "epoch": 78.54223433242507,
+ "grad_norm": 2.321789503097534,
+ "learning_rate": 2.3192358140530415e-06,
+ "loss": 0.0952,
+ "step": 28825
+ },
+ {
+ "epoch": 78.5449591280654,
+ "grad_norm": 3.5240705013275146,
+ "learning_rate": 2.3186707312924053e-06,
+ "loss": 0.0321,
+ "step": 28826
+ },
+ {
+ "epoch": 78.54768392370572,
+ "grad_norm": 2.644545078277588,
+ "learning_rate": 2.3181057083537127e-06,
+ "loss": 0.1152,
+ "step": 28827
+ },
+ {
+ "epoch": 78.55040871934605,
+ "grad_norm": 3.6151700019836426,
+ "learning_rate": 2.3175407452413647e-06,
+ "loss": 0.1202,
+ "step": 28828
+ },
+ {
+ "epoch": 78.55313351498637,
+ "grad_norm": 10.351760864257812,
+ "learning_rate": 2.316975841959761e-06,
+ "loss": 0.0574,
+ "step": 28829
+ },
+ {
+ "epoch": 78.5558583106267,
+ "grad_norm": 3.1691505908966064,
+ "learning_rate": 2.3164109985133043e-06,
+ "loss": 0.0472,
+ "step": 28830
+ },
+ {
+ "epoch": 78.55858310626704,
+ "grad_norm": 1.7434918880462646,
+ "learning_rate": 2.315846214906393e-06,
+ "loss": 0.0239,
+ "step": 28831
+ },
+ {
+ "epoch": 78.56130790190736,
+ "grad_norm": 2.751307487487793,
+ "learning_rate": 2.315281491143421e-06,
+ "loss": 0.1578,
+ "step": 28832
+ },
+ {
+ "epoch": 78.56403269754769,
+ "grad_norm": 2.538161039352417,
+ "learning_rate": 2.314716827228791e-06,
+ "loss": 0.1006,
+ "step": 28833
+ },
+ {
+ "epoch": 78.566757493188,
+ "grad_norm": 2.3712387084960938,
+ "learning_rate": 2.3141522231669e-06,
+ "loss": 0.0345,
+ "step": 28834
+ },
+ {
+ "epoch": 78.56948228882834,
+ "grad_norm": 4.287030220031738,
+ "learning_rate": 2.3135876789621436e-06,
+ "loss": 0.1119,
+ "step": 28835
+ },
+ {
+ "epoch": 78.57220708446866,
+ "grad_norm": 2.3746984004974365,
+ "learning_rate": 2.313023194618916e-06,
+ "loss": 0.1901,
+ "step": 28836
+ },
+ {
+ "epoch": 78.57493188010899,
+ "grad_norm": 2.118539810180664,
+ "learning_rate": 2.31245877014162e-06,
+ "loss": 0.0384,
+ "step": 28837
+ },
+ {
+ "epoch": 78.57765667574932,
+ "grad_norm": 2.6033174991607666,
+ "learning_rate": 2.3118944055346482e-06,
+ "loss": 0.0305,
+ "step": 28838
+ },
+ {
+ "epoch": 78.58038147138964,
+ "grad_norm": 1.9644960165023804,
+ "learning_rate": 2.3113301008023936e-06,
+ "loss": 0.0574,
+ "step": 28839
+ },
+ {
+ "epoch": 78.58310626702998,
+ "grad_norm": 3.0274219512939453,
+ "learning_rate": 2.3107658559492506e-06,
+ "loss": 0.0731,
+ "step": 28840
+ },
+ {
+ "epoch": 78.5858310626703,
+ "grad_norm": 3.726154088973999,
+ "learning_rate": 2.3102016709796193e-06,
+ "loss": 0.0348,
+ "step": 28841
+ },
+ {
+ "epoch": 78.58855585831063,
+ "grad_norm": 3.710953712463379,
+ "learning_rate": 2.3096375458978892e-06,
+ "loss": 0.0619,
+ "step": 28842
+ },
+ {
+ "epoch": 78.59128065395096,
+ "grad_norm": 3.5191240310668945,
+ "learning_rate": 2.3090734807084545e-06,
+ "loss": 0.0454,
+ "step": 28843
+ },
+ {
+ "epoch": 78.59400544959128,
+ "grad_norm": 2.173923969268799,
+ "learning_rate": 2.3085094754157045e-06,
+ "loss": 0.0251,
+ "step": 28844
+ },
+ {
+ "epoch": 78.59673024523161,
+ "grad_norm": 2.0286457538604736,
+ "learning_rate": 2.3079455300240394e-06,
+ "loss": 0.0334,
+ "step": 28845
+ },
+ {
+ "epoch": 78.59945504087193,
+ "grad_norm": 3.141050338745117,
+ "learning_rate": 2.3073816445378427e-06,
+ "loss": 0.0636,
+ "step": 28846
+ },
+ {
+ "epoch": 78.60217983651226,
+ "grad_norm": 3.3132381439208984,
+ "learning_rate": 2.3068178189615142e-06,
+ "loss": 0.035,
+ "step": 28847
+ },
+ {
+ "epoch": 78.60490463215258,
+ "grad_norm": 2.5420422554016113,
+ "learning_rate": 2.306254053299439e-06,
+ "loss": 0.0612,
+ "step": 28848
+ },
+ {
+ "epoch": 78.60762942779292,
+ "grad_norm": 2.8048555850982666,
+ "learning_rate": 2.305690347556009e-06,
+ "loss": 0.054,
+ "step": 28849
+ },
+ {
+ "epoch": 78.61035422343325,
+ "grad_norm": 2.628035545349121,
+ "learning_rate": 2.305126701735617e-06,
+ "loss": 0.0912,
+ "step": 28850
+ },
+ {
+ "epoch": 78.61307901907357,
+ "grad_norm": 2.939763307571411,
+ "learning_rate": 2.304563115842651e-06,
+ "loss": 0.0539,
+ "step": 28851
+ },
+ {
+ "epoch": 78.6158038147139,
+ "grad_norm": 3.509037733078003,
+ "learning_rate": 2.303999589881496e-06,
+ "loss": 0.1482,
+ "step": 28852
+ },
+ {
+ "epoch": 78.61852861035422,
+ "grad_norm": 2.390042543411255,
+ "learning_rate": 2.3034361238565474e-06,
+ "loss": 0.026,
+ "step": 28853
+ },
+ {
+ "epoch": 78.62125340599455,
+ "grad_norm": 2.847133159637451,
+ "learning_rate": 2.302872717772191e-06,
+ "loss": 0.0264,
+ "step": 28854
+ },
+ {
+ "epoch": 78.62397820163488,
+ "grad_norm": 2.7450544834136963,
+ "learning_rate": 2.302309371632814e-06,
+ "loss": 0.0334,
+ "step": 28855
+ },
+ {
+ "epoch": 78.6267029972752,
+ "grad_norm": 2.1127185821533203,
+ "learning_rate": 2.301746085442801e-06,
+ "loss": 0.0891,
+ "step": 28856
+ },
+ {
+ "epoch": 78.62942779291554,
+ "grad_norm": 3.734999895095825,
+ "learning_rate": 2.301182859206544e-06,
+ "loss": 0.0828,
+ "step": 28857
+ },
+ {
+ "epoch": 78.63215258855585,
+ "grad_norm": 1.8150416612625122,
+ "learning_rate": 2.3006196929284276e-06,
+ "loss": 0.0191,
+ "step": 28858
+ },
+ {
+ "epoch": 78.63487738419619,
+ "grad_norm": 4.945652008056641,
+ "learning_rate": 2.3000565866128377e-06,
+ "loss": 0.1195,
+ "step": 28859
+ },
+ {
+ "epoch": 78.6376021798365,
+ "grad_norm": 2.6597771644592285,
+ "learning_rate": 2.299493540264156e-06,
+ "loss": 0.1091,
+ "step": 28860
+ },
+ {
+ "epoch": 78.64032697547684,
+ "grad_norm": 2.7733194828033447,
+ "learning_rate": 2.2989305538867735e-06,
+ "loss": 0.1298,
+ "step": 28861
+ },
+ {
+ "epoch": 78.64305177111717,
+ "grad_norm": 10.696962356567383,
+ "learning_rate": 2.298367627485072e-06,
+ "loss": 0.0415,
+ "step": 28862
+ },
+ {
+ "epoch": 78.64577656675749,
+ "grad_norm": 2.93894100189209,
+ "learning_rate": 2.2978047610634335e-06,
+ "loss": 0.051,
+ "step": 28863
+ },
+ {
+ "epoch": 78.64850136239782,
+ "grad_norm": 3.761629343032837,
+ "learning_rate": 2.297241954626246e-06,
+ "loss": 0.1012,
+ "step": 28864
+ },
+ {
+ "epoch": 78.65122615803814,
+ "grad_norm": 3.8135571479797363,
+ "learning_rate": 2.2966792081778866e-06,
+ "loss": 0.0323,
+ "step": 28865
+ },
+ {
+ "epoch": 78.65395095367847,
+ "grad_norm": 2.2769131660461426,
+ "learning_rate": 2.2961165217227453e-06,
+ "loss": 0.0677,
+ "step": 28866
+ },
+ {
+ "epoch": 78.65667574931881,
+ "grad_norm": 3.278449058532715,
+ "learning_rate": 2.2955538952652e-06,
+ "loss": 0.1002,
+ "step": 28867
+ },
+ {
+ "epoch": 78.65940054495913,
+ "grad_norm": 2.091280221939087,
+ "learning_rate": 2.294991328809634e-06,
+ "loss": 0.0965,
+ "step": 28868
+ },
+ {
+ "epoch": 78.66212534059946,
+ "grad_norm": 3.919696092605591,
+ "learning_rate": 2.2944288223604237e-06,
+ "loss": 0.1999,
+ "step": 28869
+ },
+ {
+ "epoch": 78.66485013623978,
+ "grad_norm": 3.111398935317993,
+ "learning_rate": 2.293866375921957e-06,
+ "loss": 0.0377,
+ "step": 28870
+ },
+ {
+ "epoch": 78.66757493188011,
+ "grad_norm": 2.956389904022217,
+ "learning_rate": 2.2933039894986107e-06,
+ "loss": 0.0689,
+ "step": 28871
+ },
+ {
+ "epoch": 78.67029972752043,
+ "grad_norm": 1.9143258333206177,
+ "learning_rate": 2.2927416630947653e-06,
+ "loss": 0.029,
+ "step": 28872
+ },
+ {
+ "epoch": 78.67302452316076,
+ "grad_norm": 1.934957504272461,
+ "learning_rate": 2.2921793967147963e-06,
+ "loss": 0.0273,
+ "step": 28873
+ },
+ {
+ "epoch": 78.6757493188011,
+ "grad_norm": 3.2638096809387207,
+ "learning_rate": 2.2916171903630892e-06,
+ "loss": 0.1178,
+ "step": 28874
+ },
+ {
+ "epoch": 78.67847411444141,
+ "grad_norm": 2.8287012577056885,
+ "learning_rate": 2.2910550440440194e-06,
+ "loss": 0.0563,
+ "step": 28875
+ },
+ {
+ "epoch": 78.68119891008175,
+ "grad_norm": 4.911534786224365,
+ "learning_rate": 2.290492957761963e-06,
+ "loss": 0.0741,
+ "step": 28876
+ },
+ {
+ "epoch": 78.68392370572207,
+ "grad_norm": 3.7542495727539062,
+ "learning_rate": 2.2899309315213005e-06,
+ "loss": 0.0554,
+ "step": 28877
+ },
+ {
+ "epoch": 78.6866485013624,
+ "grad_norm": 1.7778617143630981,
+ "learning_rate": 2.2893689653264084e-06,
+ "loss": 0.0217,
+ "step": 28878
+ },
+ {
+ "epoch": 78.68937329700273,
+ "grad_norm": 2.246203660964966,
+ "learning_rate": 2.2888070591816626e-06,
+ "loss": 0.0799,
+ "step": 28879
+ },
+ {
+ "epoch": 78.69209809264305,
+ "grad_norm": 2.1796176433563232,
+ "learning_rate": 2.2882452130914367e-06,
+ "loss": 0.0411,
+ "step": 28880
+ },
+ {
+ "epoch": 78.69482288828338,
+ "grad_norm": 2.6442768573760986,
+ "learning_rate": 2.287683427060109e-06,
+ "loss": 0.0713,
+ "step": 28881
+ },
+ {
+ "epoch": 78.6975476839237,
+ "grad_norm": 2.0072710514068604,
+ "learning_rate": 2.2871217010920567e-06,
+ "loss": 0.0303,
+ "step": 28882
+ },
+ {
+ "epoch": 78.70027247956403,
+ "grad_norm": 2.3387610912323,
+ "learning_rate": 2.286560035191653e-06,
+ "loss": 0.0906,
+ "step": 28883
+ },
+ {
+ "epoch": 78.70299727520435,
+ "grad_norm": 3.0095784664154053,
+ "learning_rate": 2.2859984293632708e-06,
+ "loss": 0.0347,
+ "step": 28884
+ },
+ {
+ "epoch": 78.70572207084469,
+ "grad_norm": 3.653873920440674,
+ "learning_rate": 2.285436883611282e-06,
+ "loss": 0.0792,
+ "step": 28885
+ },
+ {
+ "epoch": 78.70844686648502,
+ "grad_norm": 2.7108097076416016,
+ "learning_rate": 2.284875397940065e-06,
+ "loss": 0.088,
+ "step": 28886
+ },
+ {
+ "epoch": 78.71117166212534,
+ "grad_norm": 16.79184341430664,
+ "learning_rate": 2.284313972353991e-06,
+ "loss": 0.0313,
+ "step": 28887
+ },
+ {
+ "epoch": 78.71389645776567,
+ "grad_norm": 2.76053786277771,
+ "learning_rate": 2.28375260685743e-06,
+ "loss": 0.0315,
+ "step": 28888
+ },
+ {
+ "epoch": 78.71662125340599,
+ "grad_norm": 2.97222900390625,
+ "learning_rate": 2.2831913014547535e-06,
+ "loss": 0.0624,
+ "step": 28889
+ },
+ {
+ "epoch": 78.71934604904632,
+ "grad_norm": 1.5932461023330688,
+ "learning_rate": 2.282630056150338e-06,
+ "loss": 0.0219,
+ "step": 28890
+ },
+ {
+ "epoch": 78.72207084468666,
+ "grad_norm": 2.40366530418396,
+ "learning_rate": 2.2820688709485504e-06,
+ "loss": 0.1016,
+ "step": 28891
+ },
+ {
+ "epoch": 78.72479564032697,
+ "grad_norm": 3.8289735317230225,
+ "learning_rate": 2.2815077458537628e-06,
+ "loss": 0.0452,
+ "step": 28892
+ },
+ {
+ "epoch": 78.7275204359673,
+ "grad_norm": 4.441797256469727,
+ "learning_rate": 2.2809466808703416e-06,
+ "loss": 0.0864,
+ "step": 28893
+ },
+ {
+ "epoch": 78.73024523160763,
+ "grad_norm": 4.0520782470703125,
+ "learning_rate": 2.280385676002661e-06,
+ "loss": 0.0794,
+ "step": 28894
+ },
+ {
+ "epoch": 78.73297002724796,
+ "grad_norm": 3.905402421951294,
+ "learning_rate": 2.2798247312550893e-06,
+ "loss": 0.0434,
+ "step": 28895
+ },
+ {
+ "epoch": 78.73569482288828,
+ "grad_norm": 3.881347894668579,
+ "learning_rate": 2.279263846631994e-06,
+ "loss": 0.0519,
+ "step": 28896
+ },
+ {
+ "epoch": 78.73841961852861,
+ "grad_norm": 2.0655436515808105,
+ "learning_rate": 2.2787030221377403e-06,
+ "loss": 0.0297,
+ "step": 28897
+ },
+ {
+ "epoch": 78.74114441416894,
+ "grad_norm": 2.325296401977539,
+ "learning_rate": 2.278142257776699e-06,
+ "loss": 0.0238,
+ "step": 28898
+ },
+ {
+ "epoch": 78.74386920980926,
+ "grad_norm": 2.9133946895599365,
+ "learning_rate": 2.27758155355324e-06,
+ "loss": 0.0555,
+ "step": 28899
+ },
+ {
+ "epoch": 78.7465940054496,
+ "grad_norm": 2.1299450397491455,
+ "learning_rate": 2.277020909471728e-06,
+ "loss": 0.0423,
+ "step": 28900
+ },
+ {
+ "epoch": 78.74931880108991,
+ "grad_norm": 1.8782014846801758,
+ "learning_rate": 2.2764603255365248e-06,
+ "loss": 0.0676,
+ "step": 28901
+ },
+ {
+ "epoch": 78.75204359673025,
+ "grad_norm": 3.7080154418945312,
+ "learning_rate": 2.2758998017520027e-06,
+ "loss": 0.1151,
+ "step": 28902
+ },
+ {
+ "epoch": 78.75476839237058,
+ "grad_norm": 2.812624931335449,
+ "learning_rate": 2.2753393381225252e-06,
+ "loss": 0.1553,
+ "step": 28903
+ },
+ {
+ "epoch": 78.7574931880109,
+ "grad_norm": 2.258704900741577,
+ "learning_rate": 2.274778934652456e-06,
+ "loss": 0.0679,
+ "step": 28904
+ },
+ {
+ "epoch": 78.76021798365123,
+ "grad_norm": 2.920022964477539,
+ "learning_rate": 2.274218591346157e-06,
+ "loss": 0.0438,
+ "step": 28905
+ },
+ {
+ "epoch": 78.76294277929155,
+ "grad_norm": 2.488492727279663,
+ "learning_rate": 2.2736583082079977e-06,
+ "loss": 0.0528,
+ "step": 28906
+ },
+ {
+ "epoch": 78.76566757493188,
+ "grad_norm": 3.3354389667510986,
+ "learning_rate": 2.273098085242339e-06,
+ "loss": 0.1207,
+ "step": 28907
+ },
+ {
+ "epoch": 78.7683923705722,
+ "grad_norm": 1.8576667308807373,
+ "learning_rate": 2.2725379224535438e-06,
+ "loss": 0.0341,
+ "step": 28908
+ },
+ {
+ "epoch": 78.77111716621253,
+ "grad_norm": 3.292917490005493,
+ "learning_rate": 2.271977819845971e-06,
+ "loss": 0.086,
+ "step": 28909
+ },
+ {
+ "epoch": 78.77384196185287,
+ "grad_norm": 3.809830665588379,
+ "learning_rate": 2.27141777742399e-06,
+ "loss": 0.1056,
+ "step": 28910
+ },
+ {
+ "epoch": 78.77656675749319,
+ "grad_norm": 3.4294378757476807,
+ "learning_rate": 2.2708577951919585e-06,
+ "loss": 0.1242,
+ "step": 28911
+ },
+ {
+ "epoch": 78.77929155313352,
+ "grad_norm": 2.9975271224975586,
+ "learning_rate": 2.270297873154237e-06,
+ "loss": 0.0297,
+ "step": 28912
+ },
+ {
+ "epoch": 78.78201634877384,
+ "grad_norm": 1.738965630531311,
+ "learning_rate": 2.2697380113151848e-06,
+ "loss": 0.0307,
+ "step": 28913
+ },
+ {
+ "epoch": 78.78474114441417,
+ "grad_norm": 1.7738715410232544,
+ "learning_rate": 2.269178209679166e-06,
+ "loss": 0.0169,
+ "step": 28914
+ },
+ {
+ "epoch": 78.7874659400545,
+ "grad_norm": 2.0331978797912598,
+ "learning_rate": 2.2686184682505365e-06,
+ "loss": 0.0319,
+ "step": 28915
+ },
+ {
+ "epoch": 78.79019073569482,
+ "grad_norm": 1.8429347276687622,
+ "learning_rate": 2.2680587870336603e-06,
+ "loss": 0.1209,
+ "step": 28916
+ },
+ {
+ "epoch": 78.79291553133515,
+ "grad_norm": 4.196180820465088,
+ "learning_rate": 2.2674991660328903e-06,
+ "loss": 0.0637,
+ "step": 28917
+ },
+ {
+ "epoch": 78.79564032697547,
+ "grad_norm": 2.5511345863342285,
+ "learning_rate": 2.2669396052525914e-06,
+ "loss": 0.0232,
+ "step": 28918
+ },
+ {
+ "epoch": 78.7983651226158,
+ "grad_norm": 3.883326530456543,
+ "learning_rate": 2.266380104697117e-06,
+ "loss": 0.3365,
+ "step": 28919
+ },
+ {
+ "epoch": 78.80108991825612,
+ "grad_norm": 2.1199047565460205,
+ "learning_rate": 2.265820664370826e-06,
+ "loss": 0.1337,
+ "step": 28920
+ },
+ {
+ "epoch": 78.80381471389646,
+ "grad_norm": 1.7725870609283447,
+ "learning_rate": 2.265261284278072e-06,
+ "loss": 0.0318,
+ "step": 28921
+ },
+ {
+ "epoch": 78.80653950953679,
+ "grad_norm": 2.95277738571167,
+ "learning_rate": 2.264701964423217e-06,
+ "loss": 0.0561,
+ "step": 28922
+ },
+ {
+ "epoch": 78.80926430517711,
+ "grad_norm": 3.0791056156158447,
+ "learning_rate": 2.2641427048106135e-06,
+ "loss": 0.0705,
+ "step": 28923
+ },
+ {
+ "epoch": 78.81198910081744,
+ "grad_norm": 3.029740333557129,
+ "learning_rate": 2.2635835054446186e-06,
+ "loss": 0.0813,
+ "step": 28924
+ },
+ {
+ "epoch": 78.81471389645776,
+ "grad_norm": 6.212014198303223,
+ "learning_rate": 2.2630243663295825e-06,
+ "loss": 0.0645,
+ "step": 28925
+ },
+ {
+ "epoch": 78.8174386920981,
+ "grad_norm": 3.0743587017059326,
+ "learning_rate": 2.2624652874698673e-06,
+ "loss": 0.0417,
+ "step": 28926
+ },
+ {
+ "epoch": 78.82016348773843,
+ "grad_norm": 3.5916972160339355,
+ "learning_rate": 2.2619062688698234e-06,
+ "loss": 0.1351,
+ "step": 28927
+ },
+ {
+ "epoch": 78.82288828337875,
+ "grad_norm": 1.8293107748031616,
+ "learning_rate": 2.2613473105338046e-06,
+ "loss": 0.0368,
+ "step": 28928
+ },
+ {
+ "epoch": 78.82561307901908,
+ "grad_norm": 2.0689969062805176,
+ "learning_rate": 2.2607884124661607e-06,
+ "loss": 0.0322,
+ "step": 28929
+ },
+ {
+ "epoch": 78.8283378746594,
+ "grad_norm": 3.2180821895599365,
+ "learning_rate": 2.2602295746712498e-06,
+ "loss": 0.1061,
+ "step": 28930
+ },
+ {
+ "epoch": 78.83106267029973,
+ "grad_norm": 3.7344260215759277,
+ "learning_rate": 2.2596707971534226e-06,
+ "loss": 0.0838,
+ "step": 28931
+ },
+ {
+ "epoch": 78.83378746594005,
+ "grad_norm": 3.4283828735351562,
+ "learning_rate": 2.2591120799170262e-06,
+ "loss": 0.1491,
+ "step": 28932
+ },
+ {
+ "epoch": 78.83651226158038,
+ "grad_norm": 2.585704803466797,
+ "learning_rate": 2.25855342296642e-06,
+ "loss": 0.0347,
+ "step": 28933
+ },
+ {
+ "epoch": 78.83923705722071,
+ "grad_norm": 1.3932832479476929,
+ "learning_rate": 2.257994826305947e-06,
+ "loss": 0.0202,
+ "step": 28934
+ },
+ {
+ "epoch": 78.84196185286103,
+ "grad_norm": 2.4599039554595947,
+ "learning_rate": 2.2574362899399648e-06,
+ "loss": 0.0593,
+ "step": 28935
+ },
+ {
+ "epoch": 78.84468664850137,
+ "grad_norm": 3.06209659576416,
+ "learning_rate": 2.2568778138728186e-06,
+ "loss": 0.0655,
+ "step": 28936
+ },
+ {
+ "epoch": 78.84741144414168,
+ "grad_norm": 3.4642419815063477,
+ "learning_rate": 2.256319398108859e-06,
+ "loss": 0.0354,
+ "step": 28937
+ },
+ {
+ "epoch": 78.85013623978202,
+ "grad_norm": 2.160891532897949,
+ "learning_rate": 2.255761042652432e-06,
+ "loss": 0.0268,
+ "step": 28938
+ },
+ {
+ "epoch": 78.85286103542235,
+ "grad_norm": 2.034299612045288,
+ "learning_rate": 2.255202747507892e-06,
+ "loss": 0.0544,
+ "step": 28939
+ },
+ {
+ "epoch": 78.85558583106267,
+ "grad_norm": 1.9354496002197266,
+ "learning_rate": 2.2546445126795822e-06,
+ "loss": 0.1085,
+ "step": 28940
+ },
+ {
+ "epoch": 78.858310626703,
+ "grad_norm": 2.530433177947998,
+ "learning_rate": 2.2540863381718502e-06,
+ "loss": 0.0381,
+ "step": 28941
+ },
+ {
+ "epoch": 78.86103542234332,
+ "grad_norm": 3.1374988555908203,
+ "learning_rate": 2.253528223989048e-06,
+ "loss": 0.095,
+ "step": 28942
+ },
+ {
+ "epoch": 78.86376021798365,
+ "grad_norm": 2.735203504562378,
+ "learning_rate": 2.2529701701355167e-06,
+ "loss": 0.0299,
+ "step": 28943
+ },
+ {
+ "epoch": 78.86648501362397,
+ "grad_norm": 2.352241039276123,
+ "learning_rate": 2.252412176615606e-06,
+ "loss": 0.0291,
+ "step": 28944
+ },
+ {
+ "epoch": 78.8692098092643,
+ "grad_norm": 2.0535550117492676,
+ "learning_rate": 2.2518542434336564e-06,
+ "loss": 0.0235,
+ "step": 28945
+ },
+ {
+ "epoch": 78.87193460490464,
+ "grad_norm": 2.4184505939483643,
+ "learning_rate": 2.2512963705940192e-06,
+ "loss": 0.0378,
+ "step": 28946
+ },
+ {
+ "epoch": 78.87465940054496,
+ "grad_norm": 2.285931348800659,
+ "learning_rate": 2.2507385581010364e-06,
+ "loss": 0.0204,
+ "step": 28947
+ },
+ {
+ "epoch": 78.87738419618529,
+ "grad_norm": 2.4018497467041016,
+ "learning_rate": 2.2501808059590537e-06,
+ "loss": 0.0522,
+ "step": 28948
+ },
+ {
+ "epoch": 78.88010899182561,
+ "grad_norm": 3.8832502365112305,
+ "learning_rate": 2.249623114172409e-06,
+ "loss": 0.0292,
+ "step": 28949
+ },
+ {
+ "epoch": 78.88283378746594,
+ "grad_norm": 3.2039356231689453,
+ "learning_rate": 2.2490654827454505e-06,
+ "loss": 0.1085,
+ "step": 28950
+ },
+ {
+ "epoch": 78.88555858310627,
+ "grad_norm": 4.351308822631836,
+ "learning_rate": 2.2485079116825236e-06,
+ "loss": 0.0428,
+ "step": 28951
+ },
+ {
+ "epoch": 78.88828337874659,
+ "grad_norm": 2.8200180530548096,
+ "learning_rate": 2.247950400987968e-06,
+ "loss": 0.0406,
+ "step": 28952
+ },
+ {
+ "epoch": 78.89100817438693,
+ "grad_norm": 8.28785228729248,
+ "learning_rate": 2.247392950666124e-06,
+ "loss": 0.13,
+ "step": 28953
+ },
+ {
+ "epoch": 78.89373297002724,
+ "grad_norm": 2.1097002029418945,
+ "learning_rate": 2.246835560721332e-06,
+ "loss": 0.0656,
+ "step": 28954
+ },
+ {
+ "epoch": 78.89645776566758,
+ "grad_norm": 2.7372913360595703,
+ "learning_rate": 2.246278231157939e-06,
+ "loss": 0.0768,
+ "step": 28955
+ },
+ {
+ "epoch": 78.8991825613079,
+ "grad_norm": 2.5888876914978027,
+ "learning_rate": 2.24572096198028e-06,
+ "loss": 0.0391,
+ "step": 28956
+ },
+ {
+ "epoch": 78.90190735694823,
+ "grad_norm": 3.376915216445923,
+ "learning_rate": 2.2451637531926973e-06,
+ "loss": 0.0305,
+ "step": 28957
+ },
+ {
+ "epoch": 78.90463215258856,
+ "grad_norm": 3.2022457122802734,
+ "learning_rate": 2.244606604799526e-06,
+ "loss": 0.1114,
+ "step": 28958
+ },
+ {
+ "epoch": 78.90735694822888,
+ "grad_norm": 2.461902379989624,
+ "learning_rate": 2.2440495168051134e-06,
+ "loss": 0.0431,
+ "step": 28959
+ },
+ {
+ "epoch": 78.91008174386921,
+ "grad_norm": 2.7596118450164795,
+ "learning_rate": 2.2434924892137923e-06,
+ "loss": 0.0619,
+ "step": 28960
+ },
+ {
+ "epoch": 78.91280653950953,
+ "grad_norm": 2.351466178894043,
+ "learning_rate": 2.2429355220299e-06,
+ "loss": 0.0379,
+ "step": 28961
+ },
+ {
+ "epoch": 78.91553133514986,
+ "grad_norm": 1.9727129936218262,
+ "learning_rate": 2.2423786152577788e-06,
+ "loss": 0.0273,
+ "step": 28962
+ },
+ {
+ "epoch": 78.9182561307902,
+ "grad_norm": 3.642521619796753,
+ "learning_rate": 2.241821768901762e-06,
+ "loss": 0.111,
+ "step": 28963
+ },
+ {
+ "epoch": 78.92098092643052,
+ "grad_norm": 2.45471453666687,
+ "learning_rate": 2.241264982966189e-06,
+ "loss": 0.0566,
+ "step": 28964
+ },
+ {
+ "epoch": 78.92370572207085,
+ "grad_norm": 3.0651931762695312,
+ "learning_rate": 2.2407082574553905e-06,
+ "loss": 0.0501,
+ "step": 28965
+ },
+ {
+ "epoch": 78.92643051771117,
+ "grad_norm": 3.414696455001831,
+ "learning_rate": 2.2401515923737083e-06,
+ "loss": 0.0405,
+ "step": 28966
+ },
+ {
+ "epoch": 78.9291553133515,
+ "grad_norm": 4.019133567810059,
+ "learning_rate": 2.2395949877254776e-06,
+ "loss": 0.1029,
+ "step": 28967
+ },
+ {
+ "epoch": 78.93188010899182,
+ "grad_norm": 3.0019774436950684,
+ "learning_rate": 2.23903844351503e-06,
+ "loss": 0.083,
+ "step": 28968
+ },
+ {
+ "epoch": 78.93460490463215,
+ "grad_norm": 2.116072416305542,
+ "learning_rate": 2.2384819597467033e-06,
+ "loss": 0.0295,
+ "step": 28969
+ },
+ {
+ "epoch": 78.93732970027249,
+ "grad_norm": 3.3626227378845215,
+ "learning_rate": 2.2379255364248252e-06,
+ "loss": 0.0462,
+ "step": 28970
+ },
+ {
+ "epoch": 78.9400544959128,
+ "grad_norm": 2.790712356567383,
+ "learning_rate": 2.237369173553736e-06,
+ "loss": 0.1157,
+ "step": 28971
+ },
+ {
+ "epoch": 78.94277929155314,
+ "grad_norm": 2.7577567100524902,
+ "learning_rate": 2.2368128711377666e-06,
+ "loss": 0.0585,
+ "step": 28972
+ },
+ {
+ "epoch": 78.94550408719346,
+ "grad_norm": 2.1706457138061523,
+ "learning_rate": 2.2362566291812483e-06,
+ "loss": 0.0237,
+ "step": 28973
+ },
+ {
+ "epoch": 78.94822888283379,
+ "grad_norm": 2.6240735054016113,
+ "learning_rate": 2.2357004476885112e-06,
+ "loss": 0.0548,
+ "step": 28974
+ },
+ {
+ "epoch": 78.95095367847412,
+ "grad_norm": 4.908451080322266,
+ "learning_rate": 2.2351443266638918e-06,
+ "loss": 0.1023,
+ "step": 28975
+ },
+ {
+ "epoch": 78.95367847411444,
+ "grad_norm": 2.3655176162719727,
+ "learning_rate": 2.234588266111718e-06,
+ "loss": 0.065,
+ "step": 28976
+ },
+ {
+ "epoch": 78.95640326975477,
+ "grad_norm": 2.5295188426971436,
+ "learning_rate": 2.2340322660363213e-06,
+ "loss": 0.081,
+ "step": 28977
+ },
+ {
+ "epoch": 78.95912806539509,
+ "grad_norm": 3.583195686340332,
+ "learning_rate": 2.2334763264420277e-06,
+ "loss": 0.0237,
+ "step": 28978
+ },
+ {
+ "epoch": 78.96185286103542,
+ "grad_norm": 2.523772716522217,
+ "learning_rate": 2.2329204473331745e-06,
+ "loss": 0.043,
+ "step": 28979
+ },
+ {
+ "epoch": 78.96457765667574,
+ "grad_norm": 3.4741899967193604,
+ "learning_rate": 2.2323646287140856e-06,
+ "loss": 0.1255,
+ "step": 28980
+ },
+ {
+ "epoch": 78.96730245231608,
+ "grad_norm": 3.007777214050293,
+ "learning_rate": 2.2318088705890917e-06,
+ "loss": 0.0346,
+ "step": 28981
+ },
+ {
+ "epoch": 78.97002724795641,
+ "grad_norm": 2.4841318130493164,
+ "learning_rate": 2.2312531729625175e-06,
+ "loss": 0.0412,
+ "step": 28982
+ },
+ {
+ "epoch": 78.97275204359673,
+ "grad_norm": 3.2065043449401855,
+ "learning_rate": 2.230697535838696e-06,
+ "loss": 0.0738,
+ "step": 28983
+ },
+ {
+ "epoch": 78.97547683923706,
+ "grad_norm": 2.92630672454834,
+ "learning_rate": 2.2301419592219496e-06,
+ "loss": 0.0562,
+ "step": 28984
+ },
+ {
+ "epoch": 78.97820163487738,
+ "grad_norm": 3.4912874698638916,
+ "learning_rate": 2.2295864431166105e-06,
+ "loss": 0.0916,
+ "step": 28985
+ },
+ {
+ "epoch": 78.98092643051771,
+ "grad_norm": 2.434004783630371,
+ "learning_rate": 2.229030987526999e-06,
+ "loss": 0.0305,
+ "step": 28986
+ },
+ {
+ "epoch": 78.98365122615803,
+ "grad_norm": 2.8450632095336914,
+ "learning_rate": 2.2284755924574477e-06,
+ "loss": 0.0804,
+ "step": 28987
+ },
+ {
+ "epoch": 78.98637602179836,
+ "grad_norm": 3.7656378746032715,
+ "learning_rate": 2.2279202579122773e-06,
+ "loss": 0.0881,
+ "step": 28988
+ },
+ {
+ "epoch": 78.9891008174387,
+ "grad_norm": 4.203093528747559,
+ "learning_rate": 2.2273649838958133e-06,
+ "loss": 0.1142,
+ "step": 28989
+ },
+ {
+ "epoch": 78.99182561307902,
+ "grad_norm": 2.87361478805542,
+ "learning_rate": 2.2268097704123793e-06,
+ "loss": 0.0602,
+ "step": 28990
+ },
+ {
+ "epoch": 78.99455040871935,
+ "grad_norm": 2.962855815887451,
+ "learning_rate": 2.2262546174663024e-06,
+ "loss": 0.0651,
+ "step": 28991
+ },
+ {
+ "epoch": 78.99727520435967,
+ "grad_norm": 2.7653558254241943,
+ "learning_rate": 2.225699525061905e-06,
+ "loss": 0.0336,
+ "step": 28992
+ },
+ {
+ "epoch": 79.0,
+ "grad_norm": 3.1838862895965576,
+ "learning_rate": 2.2251444932035094e-06,
+ "loss": 0.0642,
+ "step": 28993
+ },
+ {
+ "epoch": 79.00272479564033,
+ "grad_norm": 2.9148108959198,
+ "learning_rate": 2.224589521895435e-06,
+ "loss": 0.1426,
+ "step": 28994
+ },
+ {
+ "epoch": 79.00544959128065,
+ "grad_norm": 3.782153844833374,
+ "learning_rate": 2.22403461114201e-06,
+ "loss": 0.1301,
+ "step": 28995
+ },
+ {
+ "epoch": 79.00817438692098,
+ "grad_norm": 4.163833141326904,
+ "learning_rate": 2.2234797609475536e-06,
+ "loss": 0.0725,
+ "step": 28996
+ },
+ {
+ "epoch": 79.0108991825613,
+ "grad_norm": 3.2145962715148926,
+ "learning_rate": 2.222924971316386e-06,
+ "loss": 0.0449,
+ "step": 28997
+ },
+ {
+ "epoch": 79.01362397820164,
+ "grad_norm": 6.8873467445373535,
+ "learning_rate": 2.222370242252826e-06,
+ "loss": 0.067,
+ "step": 28998
+ },
+ {
+ "epoch": 79.01634877384195,
+ "grad_norm": 3.1379776000976562,
+ "learning_rate": 2.221815573761199e-06,
+ "loss": 0.0405,
+ "step": 28999
+ },
+ {
+ "epoch": 79.01907356948229,
+ "grad_norm": 2.1184167861938477,
+ "learning_rate": 2.2212609658458217e-06,
+ "loss": 0.0313,
+ "step": 29000
+ },
+ {
+ "epoch": 79.02179836512262,
+ "grad_norm": 2.5771548748016357,
+ "learning_rate": 2.2207064185110107e-06,
+ "loss": 0.0705,
+ "step": 29001
+ },
+ {
+ "epoch": 79.02452316076294,
+ "grad_norm": 2.5136120319366455,
+ "learning_rate": 2.220151931761091e-06,
+ "loss": 0.1279,
+ "step": 29002
+ },
+ {
+ "epoch": 79.02724795640327,
+ "grad_norm": 1.5938818454742432,
+ "learning_rate": 2.219597505600375e-06,
+ "loss": 0.03,
+ "step": 29003
+ },
+ {
+ "epoch": 79.02997275204359,
+ "grad_norm": 2.7952795028686523,
+ "learning_rate": 2.219043140033186e-06,
+ "loss": 0.0843,
+ "step": 29004
+ },
+ {
+ "epoch": 79.03269754768392,
+ "grad_norm": 2.659262180328369,
+ "learning_rate": 2.2184888350638378e-06,
+ "loss": 0.1777,
+ "step": 29005
+ },
+ {
+ "epoch": 79.03542234332426,
+ "grad_norm": 2.468482494354248,
+ "learning_rate": 2.2179345906966464e-06,
+ "loss": 0.0318,
+ "step": 29006
+ },
+ {
+ "epoch": 79.03814713896458,
+ "grad_norm": 2.700657844543457,
+ "learning_rate": 2.2173804069359316e-06,
+ "loss": 0.0941,
+ "step": 29007
+ },
+ {
+ "epoch": 79.04087193460491,
+ "grad_norm": 1.6931849718093872,
+ "learning_rate": 2.2168262837860087e-06,
+ "loss": 0.0305,
+ "step": 29008
+ },
+ {
+ "epoch": 79.04359673024523,
+ "grad_norm": 2.511362314224243,
+ "learning_rate": 2.216272221251192e-06,
+ "loss": 0.0315,
+ "step": 29009
+ },
+ {
+ "epoch": 79.04632152588556,
+ "grad_norm": 2.1316440105438232,
+ "learning_rate": 2.215718219335794e-06,
+ "loss": 0.0325,
+ "step": 29010
+ },
+ {
+ "epoch": 79.04904632152588,
+ "grad_norm": 2.4834442138671875,
+ "learning_rate": 2.215164278044134e-06,
+ "loss": 0.0383,
+ "step": 29011
+ },
+ {
+ "epoch": 79.05177111716621,
+ "grad_norm": 3.0480587482452393,
+ "learning_rate": 2.2146103973805243e-06,
+ "loss": 0.0398,
+ "step": 29012
+ },
+ {
+ "epoch": 79.05449591280654,
+ "grad_norm": 2.2068545818328857,
+ "learning_rate": 2.2140565773492783e-06,
+ "loss": 0.0871,
+ "step": 29013
+ },
+ {
+ "epoch": 79.05722070844686,
+ "grad_norm": 4.302914142608643,
+ "learning_rate": 2.213502817954707e-06,
+ "loss": 0.0996,
+ "step": 29014
+ },
+ {
+ "epoch": 79.0599455040872,
+ "grad_norm": 2.7306058406829834,
+ "learning_rate": 2.2129491192011276e-06,
+ "loss": 0.0247,
+ "step": 29015
+ },
+ {
+ "epoch": 79.06267029972751,
+ "grad_norm": 4.0557074546813965,
+ "learning_rate": 2.2123954810928494e-06,
+ "loss": 0.0666,
+ "step": 29016
+ },
+ {
+ "epoch": 79.06539509536785,
+ "grad_norm": 2.2466578483581543,
+ "learning_rate": 2.2118419036341852e-06,
+ "loss": 0.0856,
+ "step": 29017
+ },
+ {
+ "epoch": 79.06811989100818,
+ "grad_norm": 3.5039384365081787,
+ "learning_rate": 2.211288386829442e-06,
+ "loss": 0.0369,
+ "step": 29018
+ },
+ {
+ "epoch": 79.0708446866485,
+ "grad_norm": 2.205421209335327,
+ "learning_rate": 2.2107349306829353e-06,
+ "loss": 0.0284,
+ "step": 29019
+ },
+ {
+ "epoch": 79.07356948228883,
+ "grad_norm": 4.472661972045898,
+ "learning_rate": 2.2101815351989766e-06,
+ "loss": 0.0522,
+ "step": 29020
+ },
+ {
+ "epoch": 79.07629427792915,
+ "grad_norm": 3.3279480934143066,
+ "learning_rate": 2.2096282003818727e-06,
+ "loss": 0.1035,
+ "step": 29021
+ },
+ {
+ "epoch": 79.07901907356948,
+ "grad_norm": 3.8901562690734863,
+ "learning_rate": 2.2090749262359335e-06,
+ "loss": 0.0403,
+ "step": 29022
+ },
+ {
+ "epoch": 79.0817438692098,
+ "grad_norm": 1.69046950340271,
+ "learning_rate": 2.2085217127654667e-06,
+ "loss": 0.0228,
+ "step": 29023
+ },
+ {
+ "epoch": 79.08446866485014,
+ "grad_norm": 2.8504533767700195,
+ "learning_rate": 2.2079685599747836e-06,
+ "loss": 0.0438,
+ "step": 29024
+ },
+ {
+ "epoch": 79.08719346049047,
+ "grad_norm": 2.222036838531494,
+ "learning_rate": 2.2074154678681915e-06,
+ "loss": 0.0285,
+ "step": 29025
+ },
+ {
+ "epoch": 79.08991825613079,
+ "grad_norm": 2.6852304935455322,
+ "learning_rate": 2.2068624364499923e-06,
+ "loss": 0.0382,
+ "step": 29026
+ },
+ {
+ "epoch": 79.09264305177112,
+ "grad_norm": 4.05474328994751,
+ "learning_rate": 2.2063094657245023e-06,
+ "loss": 0.1143,
+ "step": 29027
+ },
+ {
+ "epoch": 79.09536784741144,
+ "grad_norm": 1.4751938581466675,
+ "learning_rate": 2.2057565556960224e-06,
+ "loss": 0.0177,
+ "step": 29028
+ },
+ {
+ "epoch": 79.09809264305177,
+ "grad_norm": 2.09287428855896,
+ "learning_rate": 2.20520370636886e-06,
+ "loss": 0.0433,
+ "step": 29029
+ },
+ {
+ "epoch": 79.1008174386921,
+ "grad_norm": 2.2168161869049072,
+ "learning_rate": 2.2046509177473172e-06,
+ "loss": 0.0314,
+ "step": 29030
+ },
+ {
+ "epoch": 79.10354223433242,
+ "grad_norm": 3.78035831451416,
+ "learning_rate": 2.204098189835705e-06,
+ "loss": 0.0625,
+ "step": 29031
+ },
+ {
+ "epoch": 79.10626702997276,
+ "grad_norm": 3.029510498046875,
+ "learning_rate": 2.203545522638326e-06,
+ "loss": 0.0353,
+ "step": 29032
+ },
+ {
+ "epoch": 79.10899182561307,
+ "grad_norm": 2.7755277156829834,
+ "learning_rate": 2.2029929161594832e-06,
+ "loss": 0.0292,
+ "step": 29033
+ },
+ {
+ "epoch": 79.11171662125341,
+ "grad_norm": 3.479027271270752,
+ "learning_rate": 2.202440370403477e-06,
+ "loss": 0.0337,
+ "step": 29034
+ },
+ {
+ "epoch": 79.11444141689373,
+ "grad_norm": 2.9710240364074707,
+ "learning_rate": 2.201887885374615e-06,
+ "loss": 0.0308,
+ "step": 29035
+ },
+ {
+ "epoch": 79.11716621253406,
+ "grad_norm": 2.7454752922058105,
+ "learning_rate": 2.201335461077201e-06,
+ "loss": 0.0461,
+ "step": 29036
+ },
+ {
+ "epoch": 79.11989100817439,
+ "grad_norm": 2.8812928199768066,
+ "learning_rate": 2.2007830975155366e-06,
+ "loss": 0.0292,
+ "step": 29037
+ },
+ {
+ "epoch": 79.12261580381471,
+ "grad_norm": 2.9671459197998047,
+ "learning_rate": 2.200230794693922e-06,
+ "loss": 0.0419,
+ "step": 29038
+ },
+ {
+ "epoch": 79.12534059945504,
+ "grad_norm": 2.3303415775299072,
+ "learning_rate": 2.1996785526166565e-06,
+ "loss": 0.0708,
+ "step": 29039
+ },
+ {
+ "epoch": 79.12806539509536,
+ "grad_norm": 3.224896192550659,
+ "learning_rate": 2.199126371288045e-06,
+ "loss": 0.0468,
+ "step": 29040
+ },
+ {
+ "epoch": 79.1307901907357,
+ "grad_norm": 2.227735996246338,
+ "learning_rate": 2.1985742507123873e-06,
+ "loss": 0.0241,
+ "step": 29041
+ },
+ {
+ "epoch": 79.13351498637603,
+ "grad_norm": 2.878380060195923,
+ "learning_rate": 2.1980221908939812e-06,
+ "loss": 0.0379,
+ "step": 29042
+ },
+ {
+ "epoch": 79.13623978201635,
+ "grad_norm": 2.451493501663208,
+ "learning_rate": 2.1974701918371253e-06,
+ "loss": 0.0975,
+ "step": 29043
+ },
+ {
+ "epoch": 79.13896457765668,
+ "grad_norm": 3.162177085876465,
+ "learning_rate": 2.196918253546123e-06,
+ "loss": 0.0339,
+ "step": 29044
+ },
+ {
+ "epoch": 79.141689373297,
+ "grad_norm": 2.534670829772949,
+ "learning_rate": 2.1963663760252706e-06,
+ "loss": 0.0399,
+ "step": 29045
+ },
+ {
+ "epoch": 79.14441416893733,
+ "grad_norm": 2.1600096225738525,
+ "learning_rate": 2.195814559278866e-06,
+ "loss": 0.063,
+ "step": 29046
+ },
+ {
+ "epoch": 79.14713896457765,
+ "grad_norm": 2.6848669052124023,
+ "learning_rate": 2.1952628033112023e-06,
+ "loss": 0.0931,
+ "step": 29047
+ },
+ {
+ "epoch": 79.14986376021798,
+ "grad_norm": 3.757939100265503,
+ "learning_rate": 2.194711108126585e-06,
+ "loss": 0.0976,
+ "step": 29048
+ },
+ {
+ "epoch": 79.15258855585832,
+ "grad_norm": 2.2765674591064453,
+ "learning_rate": 2.1941594737293046e-06,
+ "loss": 0.0368,
+ "step": 29049
+ },
+ {
+ "epoch": 79.15531335149863,
+ "grad_norm": 2.605943202972412,
+ "learning_rate": 2.193607900123658e-06,
+ "loss": 0.0335,
+ "step": 29050
+ },
+ {
+ "epoch": 79.15803814713897,
+ "grad_norm": 4.46356725692749,
+ "learning_rate": 2.193056387313943e-06,
+ "loss": 0.0785,
+ "step": 29051
+ },
+ {
+ "epoch": 79.16076294277929,
+ "grad_norm": 2.3422508239746094,
+ "learning_rate": 2.1925049353044516e-06,
+ "loss": 0.0585,
+ "step": 29052
+ },
+ {
+ "epoch": 79.16348773841962,
+ "grad_norm": 3.4779980182647705,
+ "learning_rate": 2.191953544099483e-06,
+ "loss": 0.1004,
+ "step": 29053
+ },
+ {
+ "epoch": 79.16621253405995,
+ "grad_norm": 3.1119022369384766,
+ "learning_rate": 2.1914022137033298e-06,
+ "loss": 0.1381,
+ "step": 29054
+ },
+ {
+ "epoch": 79.16893732970027,
+ "grad_norm": 3.0909368991851807,
+ "learning_rate": 2.1908509441202808e-06,
+ "loss": 0.0669,
+ "step": 29055
+ },
+ {
+ "epoch": 79.1716621253406,
+ "grad_norm": 2.227065324783325,
+ "learning_rate": 2.1902997353546375e-06,
+ "loss": 0.2358,
+ "step": 29056
+ },
+ {
+ "epoch": 79.17438692098092,
+ "grad_norm": 2.804032325744629,
+ "learning_rate": 2.189748587410687e-06,
+ "loss": 0.0848,
+ "step": 29057
+ },
+ {
+ "epoch": 79.17711171662125,
+ "grad_norm": 3.4174256324768066,
+ "learning_rate": 2.1891975002927235e-06,
+ "loss": 0.0597,
+ "step": 29058
+ },
+ {
+ "epoch": 79.17983651226157,
+ "grad_norm": 2.1053144931793213,
+ "learning_rate": 2.188646474005036e-06,
+ "loss": 0.0192,
+ "step": 29059
+ },
+ {
+ "epoch": 79.1825613079019,
+ "grad_norm": 2.635653018951416,
+ "learning_rate": 2.1880955085519217e-06,
+ "loss": 0.0849,
+ "step": 29060
+ },
+ {
+ "epoch": 79.18528610354224,
+ "grad_norm": 2.9646215438842773,
+ "learning_rate": 2.187544603937668e-06,
+ "loss": 0.0521,
+ "step": 29061
+ },
+ {
+ "epoch": 79.18801089918256,
+ "grad_norm": 2.1120166778564453,
+ "learning_rate": 2.1869937601665646e-06,
+ "loss": 0.0343,
+ "step": 29062
+ },
+ {
+ "epoch": 79.19073569482289,
+ "grad_norm": 4.583893299102783,
+ "learning_rate": 2.1864429772428997e-06,
+ "loss": 0.0392,
+ "step": 29063
+ },
+ {
+ "epoch": 79.19346049046321,
+ "grad_norm": 3.6696221828460693,
+ "learning_rate": 2.1858922551709694e-06,
+ "loss": 0.0763,
+ "step": 29064
+ },
+ {
+ "epoch": 79.19618528610354,
+ "grad_norm": 4.0118794441223145,
+ "learning_rate": 2.1853415939550572e-06,
+ "loss": 0.0663,
+ "step": 29065
+ },
+ {
+ "epoch": 79.19891008174388,
+ "grad_norm": 3.1027932167053223,
+ "learning_rate": 2.1847909935994538e-06,
+ "loss": 0.2138,
+ "step": 29066
+ },
+ {
+ "epoch": 79.2016348773842,
+ "grad_norm": 2.924137592315674,
+ "learning_rate": 2.1842404541084437e-06,
+ "loss": 0.1047,
+ "step": 29067
+ },
+ {
+ "epoch": 79.20435967302453,
+ "grad_norm": 2.2442281246185303,
+ "learning_rate": 2.1836899754863207e-06,
+ "loss": 0.0331,
+ "step": 29068
+ },
+ {
+ "epoch": 79.20708446866485,
+ "grad_norm": 2.7856338024139404,
+ "learning_rate": 2.183139557737368e-06,
+ "loss": 0.1887,
+ "step": 29069
+ },
+ {
+ "epoch": 79.20980926430518,
+ "grad_norm": 3.261448860168457,
+ "learning_rate": 2.18258920086587e-06,
+ "loss": 0.0935,
+ "step": 29070
+ },
+ {
+ "epoch": 79.2125340599455,
+ "grad_norm": 3.122056007385254,
+ "learning_rate": 2.1820389048761172e-06,
+ "loss": 0.0446,
+ "step": 29071
+ },
+ {
+ "epoch": 79.21525885558583,
+ "grad_norm": 3.940288782119751,
+ "learning_rate": 2.1814886697723946e-06,
+ "loss": 0.0401,
+ "step": 29072
+ },
+ {
+ "epoch": 79.21798365122616,
+ "grad_norm": 1.80351722240448,
+ "learning_rate": 2.1809384955589873e-06,
+ "loss": 0.0308,
+ "step": 29073
+ },
+ {
+ "epoch": 79.22070844686648,
+ "grad_norm": 3.1186141967773438,
+ "learning_rate": 2.1803883822401795e-06,
+ "loss": 0.0462,
+ "step": 29074
+ },
+ {
+ "epoch": 79.22343324250681,
+ "grad_norm": 2.8939812183380127,
+ "learning_rate": 2.1798383298202518e-06,
+ "loss": 0.0986,
+ "step": 29075
+ },
+ {
+ "epoch": 79.22615803814713,
+ "grad_norm": 2.034874677658081,
+ "learning_rate": 2.1792883383034956e-06,
+ "loss": 0.0211,
+ "step": 29076
+ },
+ {
+ "epoch": 79.22888283378747,
+ "grad_norm": 2.3820343017578125,
+ "learning_rate": 2.1787384076941897e-06,
+ "loss": 0.1199,
+ "step": 29077
+ },
+ {
+ "epoch": 79.2316076294278,
+ "grad_norm": 3.194413185119629,
+ "learning_rate": 2.1781885379966173e-06,
+ "loss": 0.0778,
+ "step": 29078
+ },
+ {
+ "epoch": 79.23433242506812,
+ "grad_norm": 2.6934423446655273,
+ "learning_rate": 2.177638729215057e-06,
+ "loss": 0.0881,
+ "step": 29079
+ },
+ {
+ "epoch": 79.23705722070845,
+ "grad_norm": 2.2399747371673584,
+ "learning_rate": 2.177088981353799e-06,
+ "loss": 0.0457,
+ "step": 29080
+ },
+ {
+ "epoch": 79.23978201634877,
+ "grad_norm": 2.8372128009796143,
+ "learning_rate": 2.1765392944171183e-06,
+ "loss": 0.0607,
+ "step": 29081
+ },
+ {
+ "epoch": 79.2425068119891,
+ "grad_norm": 2.8705480098724365,
+ "learning_rate": 2.1759896684092997e-06,
+ "loss": 0.0499,
+ "step": 29082
+ },
+ {
+ "epoch": 79.24523160762942,
+ "grad_norm": 2.626051187515259,
+ "learning_rate": 2.1754401033346172e-06,
+ "loss": 0.1157,
+ "step": 29083
+ },
+ {
+ "epoch": 79.24795640326975,
+ "grad_norm": 2.2016239166259766,
+ "learning_rate": 2.174890599197359e-06,
+ "loss": 0.0901,
+ "step": 29084
+ },
+ {
+ "epoch": 79.25068119891009,
+ "grad_norm": 2.451127290725708,
+ "learning_rate": 2.174341156001801e-06,
+ "loss": 0.0398,
+ "step": 29085
+ },
+ {
+ "epoch": 79.2534059945504,
+ "grad_norm": 2.5305445194244385,
+ "learning_rate": 2.173791773752223e-06,
+ "loss": 0.0375,
+ "step": 29086
+ },
+ {
+ "epoch": 79.25613079019074,
+ "grad_norm": 3.7565362453460693,
+ "learning_rate": 2.1732424524528984e-06,
+ "loss": 0.088,
+ "step": 29087
+ },
+ {
+ "epoch": 79.25885558583106,
+ "grad_norm": 4.2690534591674805,
+ "learning_rate": 2.172693192108111e-06,
+ "loss": 0.0655,
+ "step": 29088
+ },
+ {
+ "epoch": 79.26158038147139,
+ "grad_norm": 3.4888193607330322,
+ "learning_rate": 2.1721439927221386e-06,
+ "loss": 0.0292,
+ "step": 29089
+ },
+ {
+ "epoch": 79.26430517711172,
+ "grad_norm": 2.0520920753479004,
+ "learning_rate": 2.1715948542992583e-06,
+ "loss": 0.0201,
+ "step": 29090
+ },
+ {
+ "epoch": 79.26702997275204,
+ "grad_norm": 2.751879930496216,
+ "learning_rate": 2.171045776843742e-06,
+ "loss": 0.0403,
+ "step": 29091
+ },
+ {
+ "epoch": 79.26975476839237,
+ "grad_norm": 2.667137861251831,
+ "learning_rate": 2.1704967603598716e-06,
+ "loss": 0.1036,
+ "step": 29092
+ },
+ {
+ "epoch": 79.2724795640327,
+ "grad_norm": 2.8200252056121826,
+ "learning_rate": 2.1699478048519207e-06,
+ "loss": 0.033,
+ "step": 29093
+ },
+ {
+ "epoch": 79.27520435967303,
+ "grad_norm": 2.055072069168091,
+ "learning_rate": 2.169398910324164e-06,
+ "loss": 0.0403,
+ "step": 29094
+ },
+ {
+ "epoch": 79.27792915531334,
+ "grad_norm": 2.743004560470581,
+ "learning_rate": 2.168850076780874e-06,
+ "loss": 0.0383,
+ "step": 29095
+ },
+ {
+ "epoch": 79.28065395095368,
+ "grad_norm": 3.5729358196258545,
+ "learning_rate": 2.1683013042263303e-06,
+ "loss": 0.0657,
+ "step": 29096
+ },
+ {
+ "epoch": 79.28337874659401,
+ "grad_norm": 2.585911273956299,
+ "learning_rate": 2.1677525926648046e-06,
+ "loss": 0.0852,
+ "step": 29097
+ },
+ {
+ "epoch": 79.28610354223433,
+ "grad_norm": 2.3793601989746094,
+ "learning_rate": 2.1672039421005685e-06,
+ "loss": 0.0654,
+ "step": 29098
+ },
+ {
+ "epoch": 79.28882833787466,
+ "grad_norm": 4.038046836853027,
+ "learning_rate": 2.166655352537894e-06,
+ "loss": 0.0373,
+ "step": 29099
+ },
+ {
+ "epoch": 79.29155313351498,
+ "grad_norm": 2.678459644317627,
+ "learning_rate": 2.166106823981058e-06,
+ "loss": 0.109,
+ "step": 29100
+ },
+ {
+ "epoch": 79.29427792915531,
+ "grad_norm": 1.7455143928527832,
+ "learning_rate": 2.1655583564343295e-06,
+ "loss": 0.0164,
+ "step": 29101
+ },
+ {
+ "epoch": 79.29700272479565,
+ "grad_norm": 3.4639203548431396,
+ "learning_rate": 2.1650099499019817e-06,
+ "loss": 0.1119,
+ "step": 29102
+ },
+ {
+ "epoch": 79.29972752043597,
+ "grad_norm": 2.804391384124756,
+ "learning_rate": 2.1644616043882806e-06,
+ "loss": 0.0621,
+ "step": 29103
+ },
+ {
+ "epoch": 79.3024523160763,
+ "grad_norm": 2.591519594192505,
+ "learning_rate": 2.1639133198975003e-06,
+ "loss": 0.146,
+ "step": 29104
+ },
+ {
+ "epoch": 79.30517711171662,
+ "grad_norm": 3.3030831813812256,
+ "learning_rate": 2.1633650964339137e-06,
+ "loss": 0.032,
+ "step": 29105
+ },
+ {
+ "epoch": 79.30790190735695,
+ "grad_norm": 2.8341338634490967,
+ "learning_rate": 2.162816934001787e-06,
+ "loss": 0.0371,
+ "step": 29106
+ },
+ {
+ "epoch": 79.31062670299727,
+ "grad_norm": 2.3924429416656494,
+ "learning_rate": 2.162268832605391e-06,
+ "loss": 0.1243,
+ "step": 29107
+ },
+ {
+ "epoch": 79.3133514986376,
+ "grad_norm": 1.8220769166946411,
+ "learning_rate": 2.161720792248989e-06,
+ "loss": 0.0221,
+ "step": 29108
+ },
+ {
+ "epoch": 79.31607629427793,
+ "grad_norm": 2.4537875652313232,
+ "learning_rate": 2.161172812936857e-06,
+ "loss": 0.0321,
+ "step": 29109
+ },
+ {
+ "epoch": 79.31880108991825,
+ "grad_norm": 2.5680668354034424,
+ "learning_rate": 2.1606248946732578e-06,
+ "loss": 0.1026,
+ "step": 29110
+ },
+ {
+ "epoch": 79.32152588555859,
+ "grad_norm": 2.7012076377868652,
+ "learning_rate": 2.1600770374624604e-06,
+ "loss": 0.1166,
+ "step": 29111
+ },
+ {
+ "epoch": 79.3242506811989,
+ "grad_norm": 2.6602818965911865,
+ "learning_rate": 2.1595292413087277e-06,
+ "loss": 0.1375,
+ "step": 29112
+ },
+ {
+ "epoch": 79.32697547683924,
+ "grad_norm": 2.554255247116089,
+ "learning_rate": 2.1589815062163323e-06,
+ "loss": 0.0615,
+ "step": 29113
+ },
+ {
+ "epoch": 79.32970027247957,
+ "grad_norm": 2.9622340202331543,
+ "learning_rate": 2.1584338321895358e-06,
+ "loss": 0.0338,
+ "step": 29114
+ },
+ {
+ "epoch": 79.33242506811989,
+ "grad_norm": 2.0364558696746826,
+ "learning_rate": 2.157886219232601e-06,
+ "loss": 0.1146,
+ "step": 29115
+ },
+ {
+ "epoch": 79.33514986376022,
+ "grad_norm": 2.6309211254119873,
+ "learning_rate": 2.1573386673498e-06,
+ "loss": 0.039,
+ "step": 29116
+ },
+ {
+ "epoch": 79.33787465940054,
+ "grad_norm": 2.2014896869659424,
+ "learning_rate": 2.156791176545392e-06,
+ "loss": 0.027,
+ "step": 29117
+ },
+ {
+ "epoch": 79.34059945504087,
+ "grad_norm": 2.404651165008545,
+ "learning_rate": 2.156243746823643e-06,
+ "loss": 0.1221,
+ "step": 29118
+ },
+ {
+ "epoch": 79.34332425068119,
+ "grad_norm": 3.56484055519104,
+ "learning_rate": 2.155696378188812e-06,
+ "loss": 0.0547,
+ "step": 29119
+ },
+ {
+ "epoch": 79.34604904632153,
+ "grad_norm": 3.12198543548584,
+ "learning_rate": 2.155149070645167e-06,
+ "loss": 0.0602,
+ "step": 29120
+ },
+ {
+ "epoch": 79.34877384196186,
+ "grad_norm": 3.3931684494018555,
+ "learning_rate": 2.154601824196967e-06,
+ "loss": 0.1492,
+ "step": 29121
+ },
+ {
+ "epoch": 79.35149863760218,
+ "grad_norm": 2.0469658374786377,
+ "learning_rate": 2.1540546388484774e-06,
+ "loss": 0.0331,
+ "step": 29122
+ },
+ {
+ "epoch": 79.35422343324251,
+ "grad_norm": 2.0167696475982666,
+ "learning_rate": 2.1535075146039575e-06,
+ "loss": 0.1011,
+ "step": 29123
+ },
+ {
+ "epoch": 79.35694822888283,
+ "grad_norm": 2.6373302936553955,
+ "learning_rate": 2.152960451467667e-06,
+ "loss": 0.0665,
+ "step": 29124
+ },
+ {
+ "epoch": 79.35967302452316,
+ "grad_norm": 3.410719394683838,
+ "learning_rate": 2.1524134494438697e-06,
+ "loss": 0.0636,
+ "step": 29125
+ },
+ {
+ "epoch": 79.3623978201635,
+ "grad_norm": 3.731895923614502,
+ "learning_rate": 2.151866508536824e-06,
+ "loss": 0.0741,
+ "step": 29126
+ },
+ {
+ "epoch": 79.36512261580381,
+ "grad_norm": 4.988549709320068,
+ "learning_rate": 2.1513196287507898e-06,
+ "loss": 0.1301,
+ "step": 29127
+ },
+ {
+ "epoch": 79.36784741144415,
+ "grad_norm": 2.221756935119629,
+ "learning_rate": 2.1507728100900227e-06,
+ "loss": 0.0324,
+ "step": 29128
+ },
+ {
+ "epoch": 79.37057220708446,
+ "grad_norm": 2.468036413192749,
+ "learning_rate": 2.150226052558787e-06,
+ "loss": 0.0732,
+ "step": 29129
+ },
+ {
+ "epoch": 79.3732970027248,
+ "grad_norm": 2.1339199542999268,
+ "learning_rate": 2.149679356161338e-06,
+ "loss": 0.0281,
+ "step": 29130
+ },
+ {
+ "epoch": 79.37602179836512,
+ "grad_norm": 3.1965534687042236,
+ "learning_rate": 2.1491327209019342e-06,
+ "loss": 0.0666,
+ "step": 29131
+ },
+ {
+ "epoch": 79.37874659400545,
+ "grad_norm": 2.404315710067749,
+ "learning_rate": 2.148586146784829e-06,
+ "loss": 0.03,
+ "step": 29132
+ },
+ {
+ "epoch": 79.38147138964578,
+ "grad_norm": 2.7038164138793945,
+ "learning_rate": 2.148039633814285e-06,
+ "loss": 0.055,
+ "step": 29133
+ },
+ {
+ "epoch": 79.3841961852861,
+ "grad_norm": 4.145355701446533,
+ "learning_rate": 2.1474931819945555e-06,
+ "loss": 0.1405,
+ "step": 29134
+ },
+ {
+ "epoch": 79.38692098092643,
+ "grad_norm": 3.433864116668701,
+ "learning_rate": 2.1469467913298937e-06,
+ "loss": 0.0691,
+ "step": 29135
+ },
+ {
+ "epoch": 79.38964577656675,
+ "grad_norm": 3.0650908946990967,
+ "learning_rate": 2.1464004618245605e-06,
+ "loss": 0.0622,
+ "step": 29136
+ },
+ {
+ "epoch": 79.39237057220708,
+ "grad_norm": 4.756199359893799,
+ "learning_rate": 2.145854193482807e-06,
+ "loss": 0.1613,
+ "step": 29137
+ },
+ {
+ "epoch": 79.39509536784742,
+ "grad_norm": 3.309528350830078,
+ "learning_rate": 2.1453079863088888e-06,
+ "loss": 0.0246,
+ "step": 29138
+ },
+ {
+ "epoch": 79.39782016348774,
+ "grad_norm": 2.56789231300354,
+ "learning_rate": 2.144761840307057e-06,
+ "loss": 0.0788,
+ "step": 29139
+ },
+ {
+ "epoch": 79.40054495912807,
+ "grad_norm": 2.227259397506714,
+ "learning_rate": 2.1442157554815656e-06,
+ "loss": 0.0305,
+ "step": 29140
+ },
+ {
+ "epoch": 79.40326975476839,
+ "grad_norm": 3.5943763256073,
+ "learning_rate": 2.143669731836673e-06,
+ "loss": 0.0455,
+ "step": 29141
+ },
+ {
+ "epoch": 79.40599455040872,
+ "grad_norm": 2.7709333896636963,
+ "learning_rate": 2.1431237693766273e-06,
+ "loss": 0.0406,
+ "step": 29142
+ },
+ {
+ "epoch": 79.40871934604904,
+ "grad_norm": 3.2980639934539795,
+ "learning_rate": 2.1425778681056807e-06,
+ "loss": 0.0305,
+ "step": 29143
+ },
+ {
+ "epoch": 79.41144414168937,
+ "grad_norm": 2.189328908920288,
+ "learning_rate": 2.1420320280280827e-06,
+ "loss": 0.0328,
+ "step": 29144
+ },
+ {
+ "epoch": 79.4141689373297,
+ "grad_norm": 2.6904215812683105,
+ "learning_rate": 2.141486249148089e-06,
+ "loss": 0.1377,
+ "step": 29145
+ },
+ {
+ "epoch": 79.41689373297002,
+ "grad_norm": 2.8595118522644043,
+ "learning_rate": 2.1409405314699473e-06,
+ "loss": 0.0589,
+ "step": 29146
+ },
+ {
+ "epoch": 79.41961852861036,
+ "grad_norm": 4.642414569854736,
+ "learning_rate": 2.1403948749979074e-06,
+ "loss": 0.1823,
+ "step": 29147
+ },
+ {
+ "epoch": 79.42234332425068,
+ "grad_norm": 2.5312201976776123,
+ "learning_rate": 2.139849279736217e-06,
+ "loss": 0.0408,
+ "step": 29148
+ },
+ {
+ "epoch": 79.42506811989101,
+ "grad_norm": 5.1673054695129395,
+ "learning_rate": 2.13930374568913e-06,
+ "loss": 0.0455,
+ "step": 29149
+ },
+ {
+ "epoch": 79.42779291553134,
+ "grad_norm": 3.4629383087158203,
+ "learning_rate": 2.1387582728608913e-06,
+ "loss": 0.1931,
+ "step": 29150
+ },
+ {
+ "epoch": 79.43051771117166,
+ "grad_norm": 4.233945369720459,
+ "learning_rate": 2.138212861255752e-06,
+ "loss": 0.0495,
+ "step": 29151
+ },
+ {
+ "epoch": 79.433242506812,
+ "grad_norm": 2.226323366165161,
+ "learning_rate": 2.1376675108779543e-06,
+ "loss": 0.0334,
+ "step": 29152
+ },
+ {
+ "epoch": 79.43596730245231,
+ "grad_norm": 2.4665186405181885,
+ "learning_rate": 2.137122221731751e-06,
+ "loss": 0.0258,
+ "step": 29153
+ },
+ {
+ "epoch": 79.43869209809264,
+ "grad_norm": 3.466925859451294,
+ "learning_rate": 2.1365769938213876e-06,
+ "loss": 0.082,
+ "step": 29154
+ },
+ {
+ "epoch": 79.44141689373296,
+ "grad_norm": 3.4934182167053223,
+ "learning_rate": 2.1360318271511093e-06,
+ "loss": 0.0447,
+ "step": 29155
+ },
+ {
+ "epoch": 79.4441416893733,
+ "grad_norm": 2.2688581943511963,
+ "learning_rate": 2.1354867217251573e-06,
+ "loss": 0.0279,
+ "step": 29156
+ },
+ {
+ "epoch": 79.44686648501363,
+ "grad_norm": 3.084193468093872,
+ "learning_rate": 2.134941677547786e-06,
+ "loss": 0.2089,
+ "step": 29157
+ },
+ {
+ "epoch": 79.44959128065395,
+ "grad_norm": 3.214845895767212,
+ "learning_rate": 2.1343966946232366e-06,
+ "loss": 0.1284,
+ "step": 29158
+ },
+ {
+ "epoch": 79.45231607629428,
+ "grad_norm": 3.1596949100494385,
+ "learning_rate": 2.1338517729557517e-06,
+ "loss": 0.0695,
+ "step": 29159
+ },
+ {
+ "epoch": 79.4550408719346,
+ "grad_norm": 3.507193088531494,
+ "learning_rate": 2.133306912549574e-06,
+ "loss": 0.0547,
+ "step": 29160
+ },
+ {
+ "epoch": 79.45776566757493,
+ "grad_norm": 2.546586275100708,
+ "learning_rate": 2.1327621134089516e-06,
+ "loss": 0.0667,
+ "step": 29161
+ },
+ {
+ "epoch": 79.46049046321527,
+ "grad_norm": 2.6235101222991943,
+ "learning_rate": 2.132217375538125e-06,
+ "loss": 0.0511,
+ "step": 29162
+ },
+ {
+ "epoch": 79.46321525885558,
+ "grad_norm": 2.8926868438720703,
+ "learning_rate": 2.131672698941335e-06,
+ "loss": 0.0505,
+ "step": 29163
+ },
+ {
+ "epoch": 79.46594005449592,
+ "grad_norm": 2.8754851818084717,
+ "learning_rate": 2.131128083622823e-06,
+ "loss": 0.1188,
+ "step": 29164
+ },
+ {
+ "epoch": 79.46866485013624,
+ "grad_norm": 3.165276288986206,
+ "learning_rate": 2.130583529586835e-06,
+ "loss": 0.0711,
+ "step": 29165
+ },
+ {
+ "epoch": 79.47138964577657,
+ "grad_norm": 2.14923095703125,
+ "learning_rate": 2.130039036837609e-06,
+ "loss": 0.0497,
+ "step": 29166
+ },
+ {
+ "epoch": 79.47411444141689,
+ "grad_norm": 3.854116916656494,
+ "learning_rate": 2.129494605379385e-06,
+ "loss": 0.0619,
+ "step": 29167
+ },
+ {
+ "epoch": 79.47683923705722,
+ "grad_norm": 3.4426791667938232,
+ "learning_rate": 2.1289502352164015e-06,
+ "loss": 0.0559,
+ "step": 29168
+ },
+ {
+ "epoch": 79.47956403269755,
+ "grad_norm": 2.8873674869537354,
+ "learning_rate": 2.1284059263529035e-06,
+ "loss": 0.1437,
+ "step": 29169
+ },
+ {
+ "epoch": 79.48228882833787,
+ "grad_norm": 5.089114665985107,
+ "learning_rate": 2.127861678793126e-06,
+ "loss": 0.0796,
+ "step": 29170
+ },
+ {
+ "epoch": 79.4850136239782,
+ "grad_norm": 3.037562847137451,
+ "learning_rate": 2.1273174925413086e-06,
+ "loss": 0.0414,
+ "step": 29171
+ },
+ {
+ "epoch": 79.48773841961852,
+ "grad_norm": 1.9644275903701782,
+ "learning_rate": 2.126773367601688e-06,
+ "loss": 0.0197,
+ "step": 29172
+ },
+ {
+ "epoch": 79.49046321525886,
+ "grad_norm": 4.938040733337402,
+ "learning_rate": 2.126229303978501e-06,
+ "loss": 0.0354,
+ "step": 29173
+ },
+ {
+ "epoch": 79.49318801089919,
+ "grad_norm": 3.319546699523926,
+ "learning_rate": 2.1256853016759905e-06,
+ "loss": 0.0453,
+ "step": 29174
+ },
+ {
+ "epoch": 79.49591280653951,
+ "grad_norm": 1.9399495124816895,
+ "learning_rate": 2.1251413606983883e-06,
+ "loss": 0.0294,
+ "step": 29175
+ },
+ {
+ "epoch": 79.49863760217984,
+ "grad_norm": 3.333191394805908,
+ "learning_rate": 2.1245974810499326e-06,
+ "loss": 0.0894,
+ "step": 29176
+ },
+ {
+ "epoch": 79.50136239782016,
+ "grad_norm": 3.9922356605529785,
+ "learning_rate": 2.1240536627348553e-06,
+ "loss": 0.0325,
+ "step": 29177
+ },
+ {
+ "epoch": 79.50408719346049,
+ "grad_norm": 5.769985675811768,
+ "learning_rate": 2.1235099057573973e-06,
+ "loss": 0.0434,
+ "step": 29178
+ },
+ {
+ "epoch": 79.50681198910081,
+ "grad_norm": 2.921860933303833,
+ "learning_rate": 2.122966210121791e-06,
+ "loss": 0.0347,
+ "step": 29179
+ },
+ {
+ "epoch": 79.50953678474114,
+ "grad_norm": 2.8392391204833984,
+ "learning_rate": 2.122422575832267e-06,
+ "loss": 0.1007,
+ "step": 29180
+ },
+ {
+ "epoch": 79.51226158038148,
+ "grad_norm": 1.9620262384414673,
+ "learning_rate": 2.1218790028930656e-06,
+ "loss": 0.0259,
+ "step": 29181
+ },
+ {
+ "epoch": 79.5149863760218,
+ "grad_norm": 3.7188425064086914,
+ "learning_rate": 2.121335491308417e-06,
+ "loss": 0.2629,
+ "step": 29182
+ },
+ {
+ "epoch": 79.51771117166213,
+ "grad_norm": 2.0695464611053467,
+ "learning_rate": 2.1207920410825543e-06,
+ "loss": 0.2256,
+ "step": 29183
+ },
+ {
+ "epoch": 79.52043596730245,
+ "grad_norm": 1.73047935962677,
+ "learning_rate": 2.1202486522197063e-06,
+ "loss": 0.0408,
+ "step": 29184
+ },
+ {
+ "epoch": 79.52316076294278,
+ "grad_norm": 3.2469305992126465,
+ "learning_rate": 2.1197053247241116e-06,
+ "loss": 0.0928,
+ "step": 29185
+ },
+ {
+ "epoch": 79.52588555858311,
+ "grad_norm": 2.568074941635132,
+ "learning_rate": 2.1191620585999973e-06,
+ "loss": 0.0375,
+ "step": 29186
+ },
+ {
+ "epoch": 79.52861035422343,
+ "grad_norm": 3.095752000808716,
+ "learning_rate": 2.1186188538515964e-06,
+ "loss": 0.055,
+ "step": 29187
+ },
+ {
+ "epoch": 79.53133514986376,
+ "grad_norm": 1.5512783527374268,
+ "learning_rate": 2.118075710483134e-06,
+ "loss": 0.0317,
+ "step": 29188
+ },
+ {
+ "epoch": 79.53405994550408,
+ "grad_norm": 5.7658491134643555,
+ "learning_rate": 2.117532628498847e-06,
+ "loss": 0.0593,
+ "step": 29189
+ },
+ {
+ "epoch": 79.53678474114442,
+ "grad_norm": 4.0881028175354,
+ "learning_rate": 2.1169896079029607e-06,
+ "loss": 0.1097,
+ "step": 29190
+ },
+ {
+ "epoch": 79.53950953678473,
+ "grad_norm": 2.010342597961426,
+ "learning_rate": 2.116446648699708e-06,
+ "loss": 0.0211,
+ "step": 29191
+ },
+ {
+ "epoch": 79.54223433242507,
+ "grad_norm": 3.401838779449463,
+ "learning_rate": 2.1159037508933154e-06,
+ "loss": 0.1001,
+ "step": 29192
+ },
+ {
+ "epoch": 79.5449591280654,
+ "grad_norm": 4.027714252471924,
+ "learning_rate": 2.115360914488007e-06,
+ "loss": 0.3034,
+ "step": 29193
+ },
+ {
+ "epoch": 79.54768392370572,
+ "grad_norm": 3.6595537662506104,
+ "learning_rate": 2.1148181394880175e-06,
+ "loss": 0.106,
+ "step": 29194
+ },
+ {
+ "epoch": 79.55040871934605,
+ "grad_norm": 2.499828577041626,
+ "learning_rate": 2.1142754258975707e-06,
+ "loss": 0.0348,
+ "step": 29195
+ },
+ {
+ "epoch": 79.55313351498637,
+ "grad_norm": 1.8060368299484253,
+ "learning_rate": 2.1137327737208923e-06,
+ "loss": 0.034,
+ "step": 29196
+ },
+ {
+ "epoch": 79.5558583106267,
+ "grad_norm": 3.0636634826660156,
+ "learning_rate": 2.113190182962207e-06,
+ "loss": 0.0957,
+ "step": 29197
+ },
+ {
+ "epoch": 79.55858310626704,
+ "grad_norm": 2.7108492851257324,
+ "learning_rate": 2.1126476536257446e-06,
+ "loss": 0.0936,
+ "step": 29198
+ },
+ {
+ "epoch": 79.56130790190736,
+ "grad_norm": 2.1519253253936768,
+ "learning_rate": 2.1121051857157294e-06,
+ "loss": 0.0663,
+ "step": 29199
+ },
+ {
+ "epoch": 79.56403269754769,
+ "grad_norm": 5.154918193817139,
+ "learning_rate": 2.1115627792363823e-06,
+ "loss": 0.0338,
+ "step": 29200
+ },
+ {
+ "epoch": 79.566757493188,
+ "grad_norm": 2.4038360118865967,
+ "learning_rate": 2.1110204341919326e-06,
+ "loss": 0.0319,
+ "step": 29201
+ },
+ {
+ "epoch": 79.56948228882834,
+ "grad_norm": 2.6924593448638916,
+ "learning_rate": 2.110478150586602e-06,
+ "loss": 0.0351,
+ "step": 29202
+ },
+ {
+ "epoch": 79.57220708446866,
+ "grad_norm": 3.1435282230377197,
+ "learning_rate": 2.1099359284246144e-06,
+ "loss": 0.1325,
+ "step": 29203
+ },
+ {
+ "epoch": 79.57493188010899,
+ "grad_norm": 2.6756949424743652,
+ "learning_rate": 2.1093937677101884e-06,
+ "loss": 0.0564,
+ "step": 29204
+ },
+ {
+ "epoch": 79.57765667574932,
+ "grad_norm": 2.745969295501709,
+ "learning_rate": 2.1088516684475526e-06,
+ "loss": 0.0586,
+ "step": 29205
+ },
+ {
+ "epoch": 79.58038147138964,
+ "grad_norm": 1.9606775045394897,
+ "learning_rate": 2.1083096306409255e-06,
+ "loss": 0.0497,
+ "step": 29206
+ },
+ {
+ "epoch": 79.58310626702998,
+ "grad_norm": 4.065126895904541,
+ "learning_rate": 2.107767654294528e-06,
+ "loss": 0.1034,
+ "step": 29207
+ },
+ {
+ "epoch": 79.5858310626703,
+ "grad_norm": 3.9425268173217773,
+ "learning_rate": 2.1072257394125828e-06,
+ "loss": 0.0369,
+ "step": 29208
+ },
+ {
+ "epoch": 79.58855585831063,
+ "grad_norm": 2.6867868900299072,
+ "learning_rate": 2.106683885999308e-06,
+ "loss": 0.0343,
+ "step": 29209
+ },
+ {
+ "epoch": 79.59128065395096,
+ "grad_norm": 2.64862322807312,
+ "learning_rate": 2.1061420940589273e-06,
+ "loss": 0.1393,
+ "step": 29210
+ },
+ {
+ "epoch": 79.59400544959128,
+ "grad_norm": 4.8482985496521,
+ "learning_rate": 2.105600363595658e-06,
+ "loss": 0.1981,
+ "step": 29211
+ },
+ {
+ "epoch": 79.59673024523161,
+ "grad_norm": 3.8815159797668457,
+ "learning_rate": 2.1050586946137184e-06,
+ "loss": 0.0601,
+ "step": 29212
+ },
+ {
+ "epoch": 79.59945504087193,
+ "grad_norm": 2.8104629516601562,
+ "learning_rate": 2.104517087117326e-06,
+ "loss": 0.0347,
+ "step": 29213
+ },
+ {
+ "epoch": 79.60217983651226,
+ "grad_norm": 7.704208850860596,
+ "learning_rate": 2.1039755411107023e-06,
+ "loss": 0.0697,
+ "step": 29214
+ },
+ {
+ "epoch": 79.60490463215258,
+ "grad_norm": 2.3880417346954346,
+ "learning_rate": 2.1034340565980636e-06,
+ "loss": 0.0347,
+ "step": 29215
+ },
+ {
+ "epoch": 79.60762942779292,
+ "grad_norm": 3.6737351417541504,
+ "learning_rate": 2.1028926335836253e-06,
+ "loss": 0.0532,
+ "step": 29216
+ },
+ {
+ "epoch": 79.61035422343325,
+ "grad_norm": 2.6531341075897217,
+ "learning_rate": 2.1023512720716033e-06,
+ "loss": 0.046,
+ "step": 29217
+ },
+ {
+ "epoch": 79.61307901907357,
+ "grad_norm": 4.844764232635498,
+ "learning_rate": 2.1018099720662178e-06,
+ "loss": 0.0858,
+ "step": 29218
+ },
+ {
+ "epoch": 79.6158038147139,
+ "grad_norm": 2.7919328212738037,
+ "learning_rate": 2.101268733571682e-06,
+ "loss": 0.1226,
+ "step": 29219
+ },
+ {
+ "epoch": 79.61852861035422,
+ "grad_norm": 3.199812173843384,
+ "learning_rate": 2.100727556592211e-06,
+ "loss": 0.0742,
+ "step": 29220
+ },
+ {
+ "epoch": 79.62125340599455,
+ "grad_norm": 2.56154465675354,
+ "learning_rate": 2.1001864411320174e-06,
+ "loss": 0.0378,
+ "step": 29221
+ },
+ {
+ "epoch": 79.62397820163488,
+ "grad_norm": 2.337373733520508,
+ "learning_rate": 2.0996453871953192e-06,
+ "loss": 0.1088,
+ "step": 29222
+ },
+ {
+ "epoch": 79.6267029972752,
+ "grad_norm": 3.0385773181915283,
+ "learning_rate": 2.0991043947863286e-06,
+ "loss": 0.1082,
+ "step": 29223
+ },
+ {
+ "epoch": 79.62942779291554,
+ "grad_norm": 2.6796576976776123,
+ "learning_rate": 2.0985634639092567e-06,
+ "loss": 0.0307,
+ "step": 29224
+ },
+ {
+ "epoch": 79.63215258855585,
+ "grad_norm": 1.8098124265670776,
+ "learning_rate": 2.0980225945683185e-06,
+ "loss": 0.0279,
+ "step": 29225
+ },
+ {
+ "epoch": 79.63487738419619,
+ "grad_norm": 3.3715479373931885,
+ "learning_rate": 2.097481786767728e-06,
+ "loss": 0.1815,
+ "step": 29226
+ },
+ {
+ "epoch": 79.6376021798365,
+ "grad_norm": 2.9014835357666016,
+ "learning_rate": 2.096941040511695e-06,
+ "loss": 0.0264,
+ "step": 29227
+ },
+ {
+ "epoch": 79.64032697547684,
+ "grad_norm": 3.4781887531280518,
+ "learning_rate": 2.096400355804431e-06,
+ "loss": 0.0574,
+ "step": 29228
+ },
+ {
+ "epoch": 79.64305177111717,
+ "grad_norm": 2.586890459060669,
+ "learning_rate": 2.095859732650144e-06,
+ "loss": 0.1218,
+ "step": 29229
+ },
+ {
+ "epoch": 79.64577656675749,
+ "grad_norm": 2.3006093502044678,
+ "learning_rate": 2.0953191710530495e-06,
+ "loss": 0.1917,
+ "step": 29230
+ },
+ {
+ "epoch": 79.64850136239782,
+ "grad_norm": 2.843937873840332,
+ "learning_rate": 2.0947786710173545e-06,
+ "loss": 0.074,
+ "step": 29231
+ },
+ {
+ "epoch": 79.65122615803814,
+ "grad_norm": 3.1083977222442627,
+ "learning_rate": 2.09423823254727e-06,
+ "loss": 0.0379,
+ "step": 29232
+ },
+ {
+ "epoch": 79.65395095367847,
+ "grad_norm": 2.344449043273926,
+ "learning_rate": 2.093697855647e-06,
+ "loss": 0.0771,
+ "step": 29233
+ },
+ {
+ "epoch": 79.65667574931881,
+ "grad_norm": 2.2525219917297363,
+ "learning_rate": 2.0931575403207594e-06,
+ "loss": 0.0841,
+ "step": 29234
+ },
+ {
+ "epoch": 79.65940054495913,
+ "grad_norm": 3.596081256866455,
+ "learning_rate": 2.0926172865727534e-06,
+ "loss": 0.0388,
+ "step": 29235
+ },
+ {
+ "epoch": 79.66212534059946,
+ "grad_norm": 2.5542967319488525,
+ "learning_rate": 2.09207709440719e-06,
+ "loss": 0.1207,
+ "step": 29236
+ },
+ {
+ "epoch": 79.66485013623978,
+ "grad_norm": 3.693990468978882,
+ "learning_rate": 2.091536963828272e-06,
+ "loss": 0.0352,
+ "step": 29237
+ },
+ {
+ "epoch": 79.66757493188011,
+ "grad_norm": 2.903559923171997,
+ "learning_rate": 2.090996894840214e-06,
+ "loss": 0.0234,
+ "step": 29238
+ },
+ {
+ "epoch": 79.67029972752043,
+ "grad_norm": 4.205155849456787,
+ "learning_rate": 2.0904568874472166e-06,
+ "loss": 0.0396,
+ "step": 29239
+ },
+ {
+ "epoch": 79.67302452316076,
+ "grad_norm": 3.108189344406128,
+ "learning_rate": 2.089916941653486e-06,
+ "loss": 0.0636,
+ "step": 29240
+ },
+ {
+ "epoch": 79.6757493188011,
+ "grad_norm": 3.3302626609802246,
+ "learning_rate": 2.0893770574632253e-06,
+ "loss": 0.0412,
+ "step": 29241
+ },
+ {
+ "epoch": 79.67847411444141,
+ "grad_norm": 4.701046466827393,
+ "learning_rate": 2.088837234880642e-06,
+ "loss": 0.052,
+ "step": 29242
+ },
+ {
+ "epoch": 79.68119891008175,
+ "grad_norm": 3.134046792984009,
+ "learning_rate": 2.0882974739099417e-06,
+ "loss": 0.0562,
+ "step": 29243
+ },
+ {
+ "epoch": 79.68392370572207,
+ "grad_norm": 3.2510342597961426,
+ "learning_rate": 2.087757774555326e-06,
+ "loss": 0.0754,
+ "step": 29244
+ },
+ {
+ "epoch": 79.6866485013624,
+ "grad_norm": 3.2784006595611572,
+ "learning_rate": 2.0872181368209954e-06,
+ "loss": 0.0261,
+ "step": 29245
+ },
+ {
+ "epoch": 79.68937329700273,
+ "grad_norm": 3.756096124649048,
+ "learning_rate": 2.0866785607111583e-06,
+ "loss": 0.0578,
+ "step": 29246
+ },
+ {
+ "epoch": 79.69209809264305,
+ "grad_norm": 2.896062135696411,
+ "learning_rate": 2.0861390462300137e-06,
+ "loss": 0.0862,
+ "step": 29247
+ },
+ {
+ "epoch": 79.69482288828338,
+ "grad_norm": 4.018967628479004,
+ "learning_rate": 2.085599593381764e-06,
+ "loss": 0.0763,
+ "step": 29248
+ },
+ {
+ "epoch": 79.6975476839237,
+ "grad_norm": 2.785836696624756,
+ "learning_rate": 2.085060202170607e-06,
+ "loss": 0.0802,
+ "step": 29249
+ },
+ {
+ "epoch": 79.70027247956403,
+ "grad_norm": 3.413893461227417,
+ "learning_rate": 2.0845208726007484e-06,
+ "loss": 0.0738,
+ "step": 29250
+ },
+ {
+ "epoch": 79.70299727520435,
+ "grad_norm": 2.3878374099731445,
+ "learning_rate": 2.083981604676387e-06,
+ "loss": 0.0389,
+ "step": 29251
+ },
+ {
+ "epoch": 79.70572207084469,
+ "grad_norm": 5.857513427734375,
+ "learning_rate": 2.083442398401723e-06,
+ "loss": 0.058,
+ "step": 29252
+ },
+ {
+ "epoch": 79.70844686648502,
+ "grad_norm": 2.4599688053131104,
+ "learning_rate": 2.082903253780951e-06,
+ "loss": 0.0212,
+ "step": 29253
+ },
+ {
+ "epoch": 79.71117166212534,
+ "grad_norm": 2.517099380493164,
+ "learning_rate": 2.082364170818276e-06,
+ "loss": 0.0488,
+ "step": 29254
+ },
+ {
+ "epoch": 79.71389645776567,
+ "grad_norm": 2.4274439811706543,
+ "learning_rate": 2.081825149517895e-06,
+ "loss": 0.0428,
+ "step": 29255
+ },
+ {
+ "epoch": 79.71662125340599,
+ "grad_norm": 2.7039241790771484,
+ "learning_rate": 2.0812861898840043e-06,
+ "loss": 0.0368,
+ "step": 29256
+ },
+ {
+ "epoch": 79.71934604904632,
+ "grad_norm": 3.2438275814056396,
+ "learning_rate": 2.0807472919207993e-06,
+ "loss": 0.1247,
+ "step": 29257
+ },
+ {
+ "epoch": 79.72207084468666,
+ "grad_norm": 3.6895644664764404,
+ "learning_rate": 2.080208455632482e-06,
+ "loss": 0.1358,
+ "step": 29258
+ },
+ {
+ "epoch": 79.72479564032697,
+ "grad_norm": 2.9256253242492676,
+ "learning_rate": 2.079669681023244e-06,
+ "loss": 0.0249,
+ "step": 29259
+ },
+ {
+ "epoch": 79.7275204359673,
+ "grad_norm": 2.9980931282043457,
+ "learning_rate": 2.079130968097287e-06,
+ "loss": 0.0327,
+ "step": 29260
+ },
+ {
+ "epoch": 79.73024523160763,
+ "grad_norm": 2.4223766326904297,
+ "learning_rate": 2.078592316858802e-06,
+ "loss": 0.034,
+ "step": 29261
+ },
+ {
+ "epoch": 79.73297002724796,
+ "grad_norm": 2.9649951457977295,
+ "learning_rate": 2.0780537273119826e-06,
+ "loss": 0.0315,
+ "step": 29262
+ },
+ {
+ "epoch": 79.73569482288828,
+ "grad_norm": 2.3366172313690186,
+ "learning_rate": 2.077515199461029e-06,
+ "loss": 0.0314,
+ "step": 29263
+ },
+ {
+ "epoch": 79.73841961852861,
+ "grad_norm": 5.506527900695801,
+ "learning_rate": 2.076976733310131e-06,
+ "loss": 0.1247,
+ "step": 29264
+ },
+ {
+ "epoch": 79.74114441416894,
+ "grad_norm": 3.715538263320923,
+ "learning_rate": 2.0764383288634813e-06,
+ "loss": 0.0854,
+ "step": 29265
+ },
+ {
+ "epoch": 79.74386920980926,
+ "grad_norm": 3.026465892791748,
+ "learning_rate": 2.0758999861252783e-06,
+ "loss": 0.0353,
+ "step": 29266
+ },
+ {
+ "epoch": 79.7465940054496,
+ "grad_norm": 2.029677391052246,
+ "learning_rate": 2.0753617050997097e-06,
+ "loss": 0.0363,
+ "step": 29267
+ },
+ {
+ "epoch": 79.74931880108991,
+ "grad_norm": 2.721902370452881,
+ "learning_rate": 2.07482348579097e-06,
+ "loss": 0.0254,
+ "step": 29268
+ },
+ {
+ "epoch": 79.75204359673025,
+ "grad_norm": 2.84169340133667,
+ "learning_rate": 2.074285328203247e-06,
+ "loss": 0.0557,
+ "step": 29269
+ },
+ {
+ "epoch": 79.75476839237058,
+ "grad_norm": 2.6797447204589844,
+ "learning_rate": 2.073747232340737e-06,
+ "loss": 0.0977,
+ "step": 29270
+ },
+ {
+ "epoch": 79.7574931880109,
+ "grad_norm": 3.6222918033599854,
+ "learning_rate": 2.0732091982076286e-06,
+ "loss": 0.0863,
+ "step": 29271
+ },
+ {
+ "epoch": 79.76021798365123,
+ "grad_norm": 2.777568817138672,
+ "learning_rate": 2.072671225808113e-06,
+ "loss": 0.0815,
+ "step": 29272
+ },
+ {
+ "epoch": 79.76294277929155,
+ "grad_norm": 2.5429670810699463,
+ "learning_rate": 2.072133315146375e-06,
+ "loss": 0.094,
+ "step": 29273
+ },
+ {
+ "epoch": 79.76566757493188,
+ "grad_norm": 3.273588180541992,
+ "learning_rate": 2.07159546622661e-06,
+ "loss": 0.1388,
+ "step": 29274
+ },
+ {
+ "epoch": 79.7683923705722,
+ "grad_norm": 2.2256669998168945,
+ "learning_rate": 2.0710576790530046e-06,
+ "loss": 0.1327,
+ "step": 29275
+ },
+ {
+ "epoch": 79.77111716621253,
+ "grad_norm": 2.7126142978668213,
+ "learning_rate": 2.070519953629745e-06,
+ "loss": 0.0632,
+ "step": 29276
+ },
+ {
+ "epoch": 79.77384196185287,
+ "grad_norm": 3.8536276817321777,
+ "learning_rate": 2.069982289961022e-06,
+ "loss": 0.0495,
+ "step": 29277
+ },
+ {
+ "epoch": 79.77656675749319,
+ "grad_norm": 2.4987895488739014,
+ "learning_rate": 2.06944468805102e-06,
+ "loss": 0.1387,
+ "step": 29278
+ },
+ {
+ "epoch": 79.77929155313352,
+ "grad_norm": 3.027650833129883,
+ "learning_rate": 2.0689071479039303e-06,
+ "loss": 0.1404,
+ "step": 29279
+ },
+ {
+ "epoch": 79.78201634877384,
+ "grad_norm": 2.678555488586426,
+ "learning_rate": 2.0683696695239364e-06,
+ "loss": 0.0637,
+ "step": 29280
+ },
+ {
+ "epoch": 79.78474114441417,
+ "grad_norm": 3.3591952323913574,
+ "learning_rate": 2.0678322529152238e-06,
+ "loss": 0.0582,
+ "step": 29281
+ },
+ {
+ "epoch": 79.7874659400545,
+ "grad_norm": 1.6419581174850464,
+ "learning_rate": 2.067294898081975e-06,
+ "loss": 0.0224,
+ "step": 29282
+ },
+ {
+ "epoch": 79.79019073569482,
+ "grad_norm": 2.1855525970458984,
+ "learning_rate": 2.066757605028382e-06,
+ "loss": 0.0407,
+ "step": 29283
+ },
+ {
+ "epoch": 79.79291553133515,
+ "grad_norm": 4.04316520690918,
+ "learning_rate": 2.066220373758625e-06,
+ "loss": 0.0691,
+ "step": 29284
+ },
+ {
+ "epoch": 79.79564032697547,
+ "grad_norm": 3.079613208770752,
+ "learning_rate": 2.065683204276889e-06,
+ "loss": 0.079,
+ "step": 29285
+ },
+ {
+ "epoch": 79.7983651226158,
+ "grad_norm": 2.6407501697540283,
+ "learning_rate": 2.0651460965873537e-06,
+ "loss": 0.0751,
+ "step": 29286
+ },
+ {
+ "epoch": 79.80108991825612,
+ "grad_norm": 6.0405964851379395,
+ "learning_rate": 2.0646090506942084e-06,
+ "loss": 0.1496,
+ "step": 29287
+ },
+ {
+ "epoch": 79.80381471389646,
+ "grad_norm": 2.920759439468384,
+ "learning_rate": 2.0640720666016314e-06,
+ "loss": 0.0316,
+ "step": 29288
+ },
+ {
+ "epoch": 79.80653950953679,
+ "grad_norm": 2.829606056213379,
+ "learning_rate": 2.063535144313804e-06,
+ "loss": 0.0553,
+ "step": 29289
+ },
+ {
+ "epoch": 79.80926430517711,
+ "grad_norm": 2.013718605041504,
+ "learning_rate": 2.0629982838349117e-06,
+ "loss": 0.0366,
+ "step": 29290
+ },
+ {
+ "epoch": 79.81198910081744,
+ "grad_norm": 2.5959970951080322,
+ "learning_rate": 2.0624614851691327e-06,
+ "loss": 0.0788,
+ "step": 29291
+ },
+ {
+ "epoch": 79.81471389645776,
+ "grad_norm": 2.969374895095825,
+ "learning_rate": 2.0619247483206495e-06,
+ "loss": 0.0889,
+ "step": 29292
+ },
+ {
+ "epoch": 79.8174386920981,
+ "grad_norm": 2.5356993675231934,
+ "learning_rate": 2.0613880732936376e-06,
+ "loss": 0.0347,
+ "step": 29293
+ },
+ {
+ "epoch": 79.82016348773843,
+ "grad_norm": 4.257425308227539,
+ "learning_rate": 2.0608514600922793e-06,
+ "loss": 0.0497,
+ "step": 29294
+ },
+ {
+ "epoch": 79.82288828337875,
+ "grad_norm": 2.892382860183716,
+ "learning_rate": 2.0603149087207576e-06,
+ "loss": 0.0562,
+ "step": 29295
+ },
+ {
+ "epoch": 79.82561307901908,
+ "grad_norm": 2.452202558517456,
+ "learning_rate": 2.0597784191832483e-06,
+ "loss": 0.1419,
+ "step": 29296
+ },
+ {
+ "epoch": 79.8283378746594,
+ "grad_norm": 2.9188475608825684,
+ "learning_rate": 2.059241991483928e-06,
+ "loss": 0.197,
+ "step": 29297
+ },
+ {
+ "epoch": 79.83106267029973,
+ "grad_norm": 2.675443649291992,
+ "learning_rate": 2.058705625626973e-06,
+ "loss": 0.0813,
+ "step": 29298
+ },
+ {
+ "epoch": 79.83378746594005,
+ "grad_norm": 2.5195724964141846,
+ "learning_rate": 2.0581693216165668e-06,
+ "loss": 0.0344,
+ "step": 29299
+ },
+ {
+ "epoch": 79.83651226158038,
+ "grad_norm": 2.4789111614227295,
+ "learning_rate": 2.057633079456881e-06,
+ "loss": 0.0412,
+ "step": 29300
+ },
+ {
+ "epoch": 79.83923705722071,
+ "grad_norm": 3.065528631210327,
+ "learning_rate": 2.0570968991520933e-06,
+ "loss": 0.0346,
+ "step": 29301
+ },
+ {
+ "epoch": 79.84196185286103,
+ "grad_norm": 3.8140010833740234,
+ "learning_rate": 2.056560780706377e-06,
+ "loss": 0.0971,
+ "step": 29302
+ },
+ {
+ "epoch": 79.84468664850137,
+ "grad_norm": 2.497077465057373,
+ "learning_rate": 2.0560247241239127e-06,
+ "loss": 0.0477,
+ "step": 29303
+ },
+ {
+ "epoch": 79.84741144414168,
+ "grad_norm": 3.2433173656463623,
+ "learning_rate": 2.0554887294088723e-06,
+ "loss": 0.078,
+ "step": 29304
+ },
+ {
+ "epoch": 79.85013623978202,
+ "grad_norm": 2.877556800842285,
+ "learning_rate": 2.0549527965654293e-06,
+ "loss": 0.1024,
+ "step": 29305
+ },
+ {
+ "epoch": 79.85286103542235,
+ "grad_norm": 2.370661973953247,
+ "learning_rate": 2.0544169255977563e-06,
+ "loss": 0.0335,
+ "step": 29306
+ },
+ {
+ "epoch": 79.85558583106267,
+ "grad_norm": 4.0430378913879395,
+ "learning_rate": 2.0538811165100303e-06,
+ "loss": 0.0735,
+ "step": 29307
+ },
+ {
+ "epoch": 79.858310626703,
+ "grad_norm": 3.651853322982788,
+ "learning_rate": 2.053345369306423e-06,
+ "loss": 0.1569,
+ "step": 29308
+ },
+ {
+ "epoch": 79.86103542234332,
+ "grad_norm": 1.9985288381576538,
+ "learning_rate": 2.052809683991103e-06,
+ "loss": 0.1131,
+ "step": 29309
+ },
+ {
+ "epoch": 79.86376021798365,
+ "grad_norm": 2.669971466064453,
+ "learning_rate": 2.052274060568249e-06,
+ "loss": 0.0338,
+ "step": 29310
+ },
+ {
+ "epoch": 79.86648501362397,
+ "grad_norm": 1.5900779962539673,
+ "learning_rate": 2.0517384990420253e-06,
+ "loss": 0.0246,
+ "step": 29311
+ },
+ {
+ "epoch": 79.8692098092643,
+ "grad_norm": 2.7960777282714844,
+ "learning_rate": 2.0512029994166093e-06,
+ "loss": 0.045,
+ "step": 29312
+ },
+ {
+ "epoch": 79.87193460490464,
+ "grad_norm": 3.1913352012634277,
+ "learning_rate": 2.050667561696168e-06,
+ "loss": 0.089,
+ "step": 29313
+ },
+ {
+ "epoch": 79.87465940054496,
+ "grad_norm": 3.306302070617676,
+ "learning_rate": 2.05013218588487e-06,
+ "loss": 0.0621,
+ "step": 29314
+ },
+ {
+ "epoch": 79.87738419618529,
+ "grad_norm": 2.8709847927093506,
+ "learning_rate": 2.0495968719868895e-06,
+ "loss": 0.0439,
+ "step": 29315
+ },
+ {
+ "epoch": 79.88010899182561,
+ "grad_norm": 2.6839709281921387,
+ "learning_rate": 2.049061620006392e-06,
+ "loss": 0.1548,
+ "step": 29316
+ },
+ {
+ "epoch": 79.88283378746594,
+ "grad_norm": 2.072481155395508,
+ "learning_rate": 2.048526429947547e-06,
+ "loss": 0.0543,
+ "step": 29317
+ },
+ {
+ "epoch": 79.88555858310627,
+ "grad_norm": 2.4812171459198,
+ "learning_rate": 2.0479913018145194e-06,
+ "loss": 0.027,
+ "step": 29318
+ },
+ {
+ "epoch": 79.88828337874659,
+ "grad_norm": 3.2204062938690186,
+ "learning_rate": 2.0474562356114824e-06,
+ "loss": 0.0632,
+ "step": 29319
+ },
+ {
+ "epoch": 79.89100817438693,
+ "grad_norm": 4.5732879638671875,
+ "learning_rate": 2.0469212313426e-06,
+ "loss": 0.0529,
+ "step": 29320
+ },
+ {
+ "epoch": 79.89373297002724,
+ "grad_norm": 1.547419548034668,
+ "learning_rate": 2.04638628901204e-06,
+ "loss": 0.0858,
+ "step": 29321
+ },
+ {
+ "epoch": 79.89645776566758,
+ "grad_norm": 2.4170684814453125,
+ "learning_rate": 2.0458514086239644e-06,
+ "loss": 0.0456,
+ "step": 29322
+ },
+ {
+ "epoch": 79.8991825613079,
+ "grad_norm": 3.026855707168579,
+ "learning_rate": 2.0453165901825445e-06,
+ "loss": 0.1024,
+ "step": 29323
+ },
+ {
+ "epoch": 79.90190735694823,
+ "grad_norm": 2.3698346614837646,
+ "learning_rate": 2.0447818336919433e-06,
+ "loss": 0.0729,
+ "step": 29324
+ },
+ {
+ "epoch": 79.90463215258856,
+ "grad_norm": 2.5736029148101807,
+ "learning_rate": 2.0442471391563244e-06,
+ "loss": 0.031,
+ "step": 29325
+ },
+ {
+ "epoch": 79.90735694822888,
+ "grad_norm": 2.27970290184021,
+ "learning_rate": 2.0437125065798515e-06,
+ "loss": 0.0251,
+ "step": 29326
+ },
+ {
+ "epoch": 79.91008174386921,
+ "grad_norm": 1.7866114377975464,
+ "learning_rate": 2.04317793596669e-06,
+ "loss": 0.0338,
+ "step": 29327
+ },
+ {
+ "epoch": 79.91280653950953,
+ "grad_norm": 2.945972442626953,
+ "learning_rate": 2.0426434273210016e-06,
+ "loss": 0.0314,
+ "step": 29328
+ },
+ {
+ "epoch": 79.91553133514986,
+ "grad_norm": 2.1935908794403076,
+ "learning_rate": 2.042108980646953e-06,
+ "loss": 0.2351,
+ "step": 29329
+ },
+ {
+ "epoch": 79.9182561307902,
+ "grad_norm": 2.1854188442230225,
+ "learning_rate": 2.0415745959486997e-06,
+ "loss": 0.0354,
+ "step": 29330
+ },
+ {
+ "epoch": 79.92098092643052,
+ "grad_norm": 2.4516072273254395,
+ "learning_rate": 2.0410402732304115e-06,
+ "loss": 0.0598,
+ "step": 29331
+ },
+ {
+ "epoch": 79.92370572207085,
+ "grad_norm": 2.6645407676696777,
+ "learning_rate": 2.040506012496244e-06,
+ "loss": 0.1124,
+ "step": 29332
+ },
+ {
+ "epoch": 79.92643051771117,
+ "grad_norm": 3.365372896194458,
+ "learning_rate": 2.03997181375036e-06,
+ "loss": 0.0555,
+ "step": 29333
+ },
+ {
+ "epoch": 79.9291553133515,
+ "grad_norm": 2.762101173400879,
+ "learning_rate": 2.039437676996917e-06,
+ "loss": 0.0393,
+ "step": 29334
+ },
+ {
+ "epoch": 79.93188010899182,
+ "grad_norm": 2.4632163047790527,
+ "learning_rate": 2.0389036022400786e-06,
+ "loss": 0.1255,
+ "step": 29335
+ },
+ {
+ "epoch": 79.93460490463215,
+ "grad_norm": 3.0442001819610596,
+ "learning_rate": 2.038369589484004e-06,
+ "loss": 0.0764,
+ "step": 29336
+ },
+ {
+ "epoch": 79.93732970027249,
+ "grad_norm": 1.5549694299697876,
+ "learning_rate": 2.03783563873285e-06,
+ "loss": 0.0329,
+ "step": 29337
+ },
+ {
+ "epoch": 79.9400544959128,
+ "grad_norm": 2.3120741844177246,
+ "learning_rate": 2.0373017499907743e-06,
+ "loss": 0.1115,
+ "step": 29338
+ },
+ {
+ "epoch": 79.94277929155314,
+ "grad_norm": 2.2634379863739014,
+ "learning_rate": 2.0367679232619385e-06,
+ "loss": 0.0767,
+ "step": 29339
+ },
+ {
+ "epoch": 79.94550408719346,
+ "grad_norm": 2.465524435043335,
+ "learning_rate": 2.0362341585504974e-06,
+ "loss": 0.1215,
+ "step": 29340
+ },
+ {
+ "epoch": 79.94822888283379,
+ "grad_norm": 2.9260036945343018,
+ "learning_rate": 2.0357004558606087e-06,
+ "loss": 0.028,
+ "step": 29341
+ },
+ {
+ "epoch": 79.95095367847412,
+ "grad_norm": 2.66758394241333,
+ "learning_rate": 2.0351668151964253e-06,
+ "loss": 0.0246,
+ "step": 29342
+ },
+ {
+ "epoch": 79.95367847411444,
+ "grad_norm": 2.967787027359009,
+ "learning_rate": 2.034633236562109e-06,
+ "loss": 0.0928,
+ "step": 29343
+ },
+ {
+ "epoch": 79.95640326975477,
+ "grad_norm": 1.8456788063049316,
+ "learning_rate": 2.0340997199618128e-06,
+ "loss": 0.0205,
+ "step": 29344
+ },
+ {
+ "epoch": 79.95912806539509,
+ "grad_norm": 2.21388840675354,
+ "learning_rate": 2.03356626539969e-06,
+ "loss": 0.0667,
+ "step": 29345
+ },
+ {
+ "epoch": 79.96185286103542,
+ "grad_norm": 2.046415090560913,
+ "learning_rate": 2.0330328728798988e-06,
+ "loss": 0.0266,
+ "step": 29346
+ },
+ {
+ "epoch": 79.96457765667574,
+ "grad_norm": 4.012266635894775,
+ "learning_rate": 2.0324995424065884e-06,
+ "loss": 0.0406,
+ "step": 29347
+ },
+ {
+ "epoch": 79.96730245231608,
+ "grad_norm": 3.13988995552063,
+ "learning_rate": 2.0319662739839174e-06,
+ "loss": 0.0963,
+ "step": 29348
+ },
+ {
+ "epoch": 79.97002724795641,
+ "grad_norm": 3.302042245864868,
+ "learning_rate": 2.0314330676160364e-06,
+ "loss": 0.0347,
+ "step": 29349
+ },
+ {
+ "epoch": 79.97275204359673,
+ "grad_norm": 2.4337568283081055,
+ "learning_rate": 2.030899923307097e-06,
+ "loss": 0.0348,
+ "step": 29350
+ },
+ {
+ "epoch": 79.97547683923706,
+ "grad_norm": 3.118250608444214,
+ "learning_rate": 2.0303668410612544e-06,
+ "loss": 0.1335,
+ "step": 29351
+ },
+ {
+ "epoch": 79.97820163487738,
+ "grad_norm": 2.537001132965088,
+ "learning_rate": 2.0298338208826574e-06,
+ "loss": 0.1521,
+ "step": 29352
+ },
+ {
+ "epoch": 79.98092643051771,
+ "grad_norm": 3.249803066253662,
+ "learning_rate": 2.0293008627754597e-06,
+ "loss": 0.1485,
+ "step": 29353
+ },
+ {
+ "epoch": 79.98365122615803,
+ "grad_norm": 2.459155321121216,
+ "learning_rate": 2.0287679667438063e-06,
+ "loss": 0.0662,
+ "step": 29354
+ },
+ {
+ "epoch": 79.98637602179836,
+ "grad_norm": 3.170015573501587,
+ "learning_rate": 2.028235132791855e-06,
+ "loss": 0.056,
+ "step": 29355
+ },
+ {
+ "epoch": 79.9891008174387,
+ "grad_norm": 3.1561808586120605,
+ "learning_rate": 2.027702360923751e-06,
+ "loss": 0.0354,
+ "step": 29356
+ },
+ {
+ "epoch": 79.99182561307902,
+ "grad_norm": 3.056755542755127,
+ "learning_rate": 2.0271696511436457e-06,
+ "loss": 0.065,
+ "step": 29357
+ },
+ {
+ "epoch": 79.99455040871935,
+ "grad_norm": 2.7098047733306885,
+ "learning_rate": 2.0266370034556824e-06,
+ "loss": 0.1533,
+ "step": 29358
+ },
+ {
+ "epoch": 79.99727520435967,
+ "grad_norm": 3.2575576305389404,
+ "learning_rate": 2.0261044178640166e-06,
+ "loss": 0.1153,
+ "step": 29359
+ },
+ {
+ "epoch": 80.0,
+ "grad_norm": 3.2451682090759277,
+ "learning_rate": 2.025571894372794e-06,
+ "loss": 0.2123,
+ "step": 29360
+ },
+ {
+ "epoch": 80.00272479564033,
+ "grad_norm": 5.603143215179443,
+ "learning_rate": 2.02503943298616e-06,
+ "loss": 0.1196,
+ "step": 29361
+ },
+ {
+ "epoch": 80.00544959128065,
+ "grad_norm": 2.9784491062164307,
+ "learning_rate": 2.0245070337082596e-06,
+ "loss": 0.0473,
+ "step": 29362
+ },
+ {
+ "epoch": 80.00817438692098,
+ "grad_norm": 12.486374855041504,
+ "learning_rate": 2.0239746965432417e-06,
+ "loss": 0.0385,
+ "step": 29363
+ },
+ {
+ "epoch": 80.0108991825613,
+ "grad_norm": 2.0977165699005127,
+ "learning_rate": 2.023442421495255e-06,
+ "loss": 0.099,
+ "step": 29364
+ },
+ {
+ "epoch": 80.01362397820164,
+ "grad_norm": 1.9674521684646606,
+ "learning_rate": 2.0229102085684416e-06,
+ "loss": 0.1507,
+ "step": 29365
+ },
+ {
+ "epoch": 80.01634877384195,
+ "grad_norm": 2.7131857872009277,
+ "learning_rate": 2.022378057766947e-06,
+ "loss": 0.0457,
+ "step": 29366
+ },
+ {
+ "epoch": 80.01907356948229,
+ "grad_norm": 3.055431604385376,
+ "learning_rate": 2.021845969094913e-06,
+ "loss": 0.0425,
+ "step": 29367
+ },
+ {
+ "epoch": 80.02179836512262,
+ "grad_norm": 3.1296238899230957,
+ "learning_rate": 2.0213139425564888e-06,
+ "loss": 0.0586,
+ "step": 29368
+ },
+ {
+ "epoch": 80.02452316076294,
+ "grad_norm": 2.3376431465148926,
+ "learning_rate": 2.0207819781558137e-06,
+ "loss": 0.1063,
+ "step": 29369
+ },
+ {
+ "epoch": 80.02724795640327,
+ "grad_norm": 1.8747031688690186,
+ "learning_rate": 2.0202500758970323e-06,
+ "loss": 0.0199,
+ "step": 29370
+ },
+ {
+ "epoch": 80.02997275204359,
+ "grad_norm": 2.9020087718963623,
+ "learning_rate": 2.0197182357842836e-06,
+ "loss": 0.0577,
+ "step": 29371
+ },
+ {
+ "epoch": 80.03269754768392,
+ "grad_norm": 2.2700018882751465,
+ "learning_rate": 2.0191864578217155e-06,
+ "loss": 0.0366,
+ "step": 29372
+ },
+ {
+ "epoch": 80.03542234332426,
+ "grad_norm": 2.2061479091644287,
+ "learning_rate": 2.0186547420134663e-06,
+ "loss": 0.0298,
+ "step": 29373
+ },
+ {
+ "epoch": 80.03814713896458,
+ "grad_norm": 2.363985061645508,
+ "learning_rate": 2.018123088363675e-06,
+ "loss": 0.0339,
+ "step": 29374
+ },
+ {
+ "epoch": 80.04087193460491,
+ "grad_norm": 2.4737119674682617,
+ "learning_rate": 2.017591496876485e-06,
+ "loss": 0.0684,
+ "step": 29375
+ },
+ {
+ "epoch": 80.04359673024523,
+ "grad_norm": 2.2740232944488525,
+ "learning_rate": 2.0170599675560376e-06,
+ "loss": 0.0408,
+ "step": 29376
+ },
+ {
+ "epoch": 80.04632152588556,
+ "grad_norm": 2.1201000213623047,
+ "learning_rate": 2.0165285004064692e-06,
+ "loss": 0.033,
+ "step": 29377
+ },
+ {
+ "epoch": 80.04904632152588,
+ "grad_norm": 1.6579976081848145,
+ "learning_rate": 2.0159970954319173e-06,
+ "loss": 0.0203,
+ "step": 29378
+ },
+ {
+ "epoch": 80.05177111716621,
+ "grad_norm": 1.8335825204849243,
+ "learning_rate": 2.0154657526365227e-06,
+ "loss": 0.0234,
+ "step": 29379
+ },
+ {
+ "epoch": 80.05449591280654,
+ "grad_norm": 3.6377949714660645,
+ "learning_rate": 2.014934472024427e-06,
+ "loss": 0.038,
+ "step": 29380
+ },
+ {
+ "epoch": 80.05722070844686,
+ "grad_norm": 4.581460475921631,
+ "learning_rate": 2.014403253599765e-06,
+ "loss": 0.197,
+ "step": 29381
+ },
+ {
+ "epoch": 80.0599455040872,
+ "grad_norm": 1.6591564416885376,
+ "learning_rate": 2.0138720973666727e-06,
+ "loss": 0.0246,
+ "step": 29382
+ },
+ {
+ "epoch": 80.06267029972751,
+ "grad_norm": 3.421288251876831,
+ "learning_rate": 2.0133410033292854e-06,
+ "loss": 0.0461,
+ "step": 29383
+ },
+ {
+ "epoch": 80.06539509536785,
+ "grad_norm": 1.9600965976715088,
+ "learning_rate": 2.0128099714917436e-06,
+ "loss": 0.1076,
+ "step": 29384
+ },
+ {
+ "epoch": 80.06811989100818,
+ "grad_norm": 2.0340168476104736,
+ "learning_rate": 2.0122790018581805e-06,
+ "loss": 0.1289,
+ "step": 29385
+ },
+ {
+ "epoch": 80.0708446866485,
+ "grad_norm": 2.848813056945801,
+ "learning_rate": 2.0117480944327317e-06,
+ "loss": 0.059,
+ "step": 29386
+ },
+ {
+ "epoch": 80.07356948228883,
+ "grad_norm": 1.989477276802063,
+ "learning_rate": 2.011217249219529e-06,
+ "loss": 0.0154,
+ "step": 29387
+ },
+ {
+ "epoch": 80.07629427792915,
+ "grad_norm": 2.7358896732330322,
+ "learning_rate": 2.010686466222712e-06,
+ "loss": 0.0796,
+ "step": 29388
+ },
+ {
+ "epoch": 80.07901907356948,
+ "grad_norm": 2.944010019302368,
+ "learning_rate": 2.0101557454464115e-06,
+ "loss": 0.108,
+ "step": 29389
+ },
+ {
+ "epoch": 80.0817438692098,
+ "grad_norm": 2.212073802947998,
+ "learning_rate": 2.009625086894761e-06,
+ "loss": 0.0466,
+ "step": 29390
+ },
+ {
+ "epoch": 80.08446866485014,
+ "grad_norm": 2.7997961044311523,
+ "learning_rate": 2.0090944905718913e-06,
+ "loss": 0.1205,
+ "step": 29391
+ },
+ {
+ "epoch": 80.08719346049047,
+ "grad_norm": 3.7996926307678223,
+ "learning_rate": 2.0085639564819383e-06,
+ "loss": 0.1322,
+ "step": 29392
+ },
+ {
+ "epoch": 80.08991825613079,
+ "grad_norm": 3.034207582473755,
+ "learning_rate": 2.0080334846290317e-06,
+ "loss": 0.0531,
+ "step": 29393
+ },
+ {
+ "epoch": 80.09264305177112,
+ "grad_norm": 2.514934539794922,
+ "learning_rate": 2.007503075017303e-06,
+ "loss": 0.0628,
+ "step": 29394
+ },
+ {
+ "epoch": 80.09536784741144,
+ "grad_norm": 2.12790584564209,
+ "learning_rate": 2.006972727650881e-06,
+ "loss": 0.0301,
+ "step": 29395
+ },
+ {
+ "epoch": 80.09809264305177,
+ "grad_norm": 5.728973865509033,
+ "learning_rate": 2.0064424425339014e-06,
+ "loss": 0.0709,
+ "step": 29396
+ },
+ {
+ "epoch": 80.1008174386921,
+ "grad_norm": 2.994800329208374,
+ "learning_rate": 2.0059122196704872e-06,
+ "loss": 0.0362,
+ "step": 29397
+ },
+ {
+ "epoch": 80.10354223433242,
+ "grad_norm": 2.195781946182251,
+ "learning_rate": 2.0053820590647744e-06,
+ "loss": 0.064,
+ "step": 29398
+ },
+ {
+ "epoch": 80.10626702997276,
+ "grad_norm": 2.763132333755493,
+ "learning_rate": 2.004851960720886e-06,
+ "loss": 0.0763,
+ "step": 29399
+ },
+ {
+ "epoch": 80.10899182561307,
+ "grad_norm": 2.22554612159729,
+ "learning_rate": 2.0043219246429555e-06,
+ "loss": 0.0471,
+ "step": 29400
+ },
+ {
+ "epoch": 80.11171662125341,
+ "grad_norm": 2.436314821243286,
+ "learning_rate": 2.003791950835109e-06,
+ "loss": 0.0404,
+ "step": 29401
+ },
+ {
+ "epoch": 80.11444141689373,
+ "grad_norm": 2.6080710887908936,
+ "learning_rate": 2.0032620393014734e-06,
+ "loss": 0.0383,
+ "step": 29402
+ },
+ {
+ "epoch": 80.11716621253406,
+ "grad_norm": 3.8651154041290283,
+ "learning_rate": 2.0027321900461726e-06,
+ "loss": 0.0282,
+ "step": 29403
+ },
+ {
+ "epoch": 80.11989100817439,
+ "grad_norm": 3.0691099166870117,
+ "learning_rate": 2.002202403073339e-06,
+ "loss": 0.0568,
+ "step": 29404
+ },
+ {
+ "epoch": 80.12261580381471,
+ "grad_norm": 2.3447935581207275,
+ "learning_rate": 2.0016726783870966e-06,
+ "loss": 0.0899,
+ "step": 29405
+ },
+ {
+ "epoch": 80.12534059945504,
+ "grad_norm": 3.291969060897827,
+ "learning_rate": 2.001143015991569e-06,
+ "loss": 0.1161,
+ "step": 29406
+ },
+ {
+ "epoch": 80.12806539509536,
+ "grad_norm": 3.1843996047973633,
+ "learning_rate": 2.0006134158908796e-06,
+ "loss": 0.1323,
+ "step": 29407
+ },
+ {
+ "epoch": 80.1307901907357,
+ "grad_norm": 3.0894100666046143,
+ "learning_rate": 2.0000838780891573e-06,
+ "loss": 0.0523,
+ "step": 29408
+ },
+ {
+ "epoch": 80.13351498637603,
+ "grad_norm": 2.975862503051758,
+ "learning_rate": 1.9995544025905254e-06,
+ "loss": 0.0464,
+ "step": 29409
+ },
+ {
+ "epoch": 80.13623978201635,
+ "grad_norm": 2.842663288116455,
+ "learning_rate": 1.9990249893991064e-06,
+ "loss": 0.0436,
+ "step": 29410
+ },
+ {
+ "epoch": 80.13896457765668,
+ "grad_norm": 2.7382287979125977,
+ "learning_rate": 1.9984956385190204e-06,
+ "loss": 0.1006,
+ "step": 29411
+ },
+ {
+ "epoch": 80.141689373297,
+ "grad_norm": 2.1449384689331055,
+ "learning_rate": 1.9979663499543956e-06,
+ "loss": 0.0441,
+ "step": 29412
+ },
+ {
+ "epoch": 80.14441416893733,
+ "grad_norm": 1.671662449836731,
+ "learning_rate": 1.9974371237093505e-06,
+ "loss": 0.021,
+ "step": 29413
+ },
+ {
+ "epoch": 80.14713896457765,
+ "grad_norm": 3.9940028190612793,
+ "learning_rate": 1.996907959788006e-06,
+ "loss": 0.13,
+ "step": 29414
+ },
+ {
+ "epoch": 80.14986376021798,
+ "grad_norm": 2.6534218788146973,
+ "learning_rate": 1.9963788581944832e-06,
+ "loss": 0.0688,
+ "step": 29415
+ },
+ {
+ "epoch": 80.15258855585832,
+ "grad_norm": 2.4782872200012207,
+ "learning_rate": 1.995849818932908e-06,
+ "loss": 0.0342,
+ "step": 29416
+ },
+ {
+ "epoch": 80.15531335149863,
+ "grad_norm": 2.70391845703125,
+ "learning_rate": 1.9953208420073965e-06,
+ "loss": 0.0345,
+ "step": 29417
+ },
+ {
+ "epoch": 80.15803814713897,
+ "grad_norm": 1.8681391477584839,
+ "learning_rate": 1.9947919274220693e-06,
+ "loss": 0.0328,
+ "step": 29418
+ },
+ {
+ "epoch": 80.16076294277929,
+ "grad_norm": 2.7991154193878174,
+ "learning_rate": 1.994263075181042e-06,
+ "loss": 0.0431,
+ "step": 29419
+ },
+ {
+ "epoch": 80.16348773841962,
+ "grad_norm": 3.968597173690796,
+ "learning_rate": 1.993734285288439e-06,
+ "loss": 0.1206,
+ "step": 29420
+ },
+ {
+ "epoch": 80.16621253405995,
+ "grad_norm": 3.151745080947876,
+ "learning_rate": 1.9932055577483743e-06,
+ "loss": 0.0595,
+ "step": 29421
+ },
+ {
+ "epoch": 80.16893732970027,
+ "grad_norm": 3.6714539527893066,
+ "learning_rate": 1.9926768925649685e-06,
+ "loss": 0.1386,
+ "step": 29422
+ },
+ {
+ "epoch": 80.1716621253406,
+ "grad_norm": 2.5412685871124268,
+ "learning_rate": 1.992148289742334e-06,
+ "loss": 0.1026,
+ "step": 29423
+ },
+ {
+ "epoch": 80.17438692098092,
+ "grad_norm": 2.7091026306152344,
+ "learning_rate": 1.9916197492845947e-06,
+ "loss": 0.0359,
+ "step": 29424
+ },
+ {
+ "epoch": 80.17711171662125,
+ "grad_norm": 2.3547556400299072,
+ "learning_rate": 1.991091271195862e-06,
+ "loss": 0.0682,
+ "step": 29425
+ },
+ {
+ "epoch": 80.17983651226157,
+ "grad_norm": 3.9136271476745605,
+ "learning_rate": 1.9905628554802525e-06,
+ "loss": 0.0985,
+ "step": 29426
+ },
+ {
+ "epoch": 80.1825613079019,
+ "grad_norm": 2.6397290229797363,
+ "learning_rate": 1.9900345021418797e-06,
+ "loss": 0.0194,
+ "step": 29427
+ },
+ {
+ "epoch": 80.18528610354224,
+ "grad_norm": 2.6623542308807373,
+ "learning_rate": 1.9895062111848628e-06,
+ "loss": 0.0303,
+ "step": 29428
+ },
+ {
+ "epoch": 80.18801089918256,
+ "grad_norm": 3.0329337120056152,
+ "learning_rate": 1.9889779826133136e-06,
+ "loss": 0.0453,
+ "step": 29429
+ },
+ {
+ "epoch": 80.19073569482289,
+ "grad_norm": 3.3232171535491943,
+ "learning_rate": 1.9884498164313458e-06,
+ "loss": 0.125,
+ "step": 29430
+ },
+ {
+ "epoch": 80.19346049046321,
+ "grad_norm": 2.496865749359131,
+ "learning_rate": 1.9879217126430704e-06,
+ "loss": 0.0364,
+ "step": 29431
+ },
+ {
+ "epoch": 80.19618528610354,
+ "grad_norm": 2.626728057861328,
+ "learning_rate": 1.9873936712526033e-06,
+ "loss": 0.0434,
+ "step": 29432
+ },
+ {
+ "epoch": 80.19891008174388,
+ "grad_norm": 2.1771438121795654,
+ "learning_rate": 1.9868656922640596e-06,
+ "loss": 0.0249,
+ "step": 29433
+ },
+ {
+ "epoch": 80.2016348773842,
+ "grad_norm": 2.1724393367767334,
+ "learning_rate": 1.986337775681546e-06,
+ "loss": 0.0338,
+ "step": 29434
+ },
+ {
+ "epoch": 80.20435967302453,
+ "grad_norm": 2.520867347717285,
+ "learning_rate": 1.9858099215091773e-06,
+ "loss": 0.1075,
+ "step": 29435
+ },
+ {
+ "epoch": 80.20708446866485,
+ "grad_norm": 2.6357574462890625,
+ "learning_rate": 1.9852821297510605e-06,
+ "loss": 0.0428,
+ "step": 29436
+ },
+ {
+ "epoch": 80.20980926430518,
+ "grad_norm": 2.61205792427063,
+ "learning_rate": 1.9847544004113105e-06,
+ "loss": 0.1401,
+ "step": 29437
+ },
+ {
+ "epoch": 80.2125340599455,
+ "grad_norm": 2.8970611095428467,
+ "learning_rate": 1.9842267334940357e-06,
+ "loss": 0.0986,
+ "step": 29438
+ },
+ {
+ "epoch": 80.21525885558583,
+ "grad_norm": 2.5879549980163574,
+ "learning_rate": 1.9836991290033427e-06,
+ "loss": 0.1085,
+ "step": 29439
+ },
+ {
+ "epoch": 80.21798365122616,
+ "grad_norm": 3.0536818504333496,
+ "learning_rate": 1.9831715869433456e-06,
+ "loss": 0.1055,
+ "step": 29440
+ },
+ {
+ "epoch": 80.22070844686648,
+ "grad_norm": 3.0303287506103516,
+ "learning_rate": 1.982644107318149e-06,
+ "loss": 0.0795,
+ "step": 29441
+ },
+ {
+ "epoch": 80.22343324250681,
+ "grad_norm": 3.1025660037994385,
+ "learning_rate": 1.9821166901318634e-06,
+ "loss": 0.1188,
+ "step": 29442
+ },
+ {
+ "epoch": 80.22615803814713,
+ "grad_norm": 2.673023223876953,
+ "learning_rate": 1.981589335388592e-06,
+ "loss": 0.0362,
+ "step": 29443
+ },
+ {
+ "epoch": 80.22888283378747,
+ "grad_norm": 3.098051071166992,
+ "learning_rate": 1.9810620430924465e-06,
+ "loss": 0.0554,
+ "step": 29444
+ },
+ {
+ "epoch": 80.2316076294278,
+ "grad_norm": 3.2103559970855713,
+ "learning_rate": 1.980534813247532e-06,
+ "loss": 0.0276,
+ "step": 29445
+ },
+ {
+ "epoch": 80.23433242506812,
+ "grad_norm": 2.42803955078125,
+ "learning_rate": 1.9800076458579552e-06,
+ "loss": 0.0573,
+ "step": 29446
+ },
+ {
+ "epoch": 80.23705722070845,
+ "grad_norm": 8.295357704162598,
+ "learning_rate": 1.9794805409278174e-06,
+ "loss": 0.0739,
+ "step": 29447
+ },
+ {
+ "epoch": 80.23978201634877,
+ "grad_norm": 2.6432881355285645,
+ "learning_rate": 1.978953498461227e-06,
+ "loss": 0.0654,
+ "step": 29448
+ },
+ {
+ "epoch": 80.2425068119891,
+ "grad_norm": 2.679471492767334,
+ "learning_rate": 1.978426518462291e-06,
+ "loss": 0.042,
+ "step": 29449
+ },
+ {
+ "epoch": 80.24523160762942,
+ "grad_norm": 2.8455731868743896,
+ "learning_rate": 1.9778996009351116e-06,
+ "loss": 0.0489,
+ "step": 29450
+ },
+ {
+ "epoch": 80.24795640326975,
+ "grad_norm": 1.6808359622955322,
+ "learning_rate": 1.977372745883792e-06,
+ "loss": 0.0202,
+ "step": 29451
+ },
+ {
+ "epoch": 80.25068119891009,
+ "grad_norm": 2.7449731826782227,
+ "learning_rate": 1.976845953312432e-06,
+ "loss": 0.0441,
+ "step": 29452
+ },
+ {
+ "epoch": 80.2534059945504,
+ "grad_norm": 3.0539281368255615,
+ "learning_rate": 1.9763192232251405e-06,
+ "loss": 0.0288,
+ "step": 29453
+ },
+ {
+ "epoch": 80.25613079019074,
+ "grad_norm": 2.833569288253784,
+ "learning_rate": 1.975792555626017e-06,
+ "loss": 0.082,
+ "step": 29454
+ },
+ {
+ "epoch": 80.25885558583106,
+ "grad_norm": 3.311829090118408,
+ "learning_rate": 1.975265950519163e-06,
+ "loss": 0.0599,
+ "step": 29455
+ },
+ {
+ "epoch": 80.26158038147139,
+ "grad_norm": 4.416215896606445,
+ "learning_rate": 1.9747394079086756e-06,
+ "loss": 0.1164,
+ "step": 29456
+ },
+ {
+ "epoch": 80.26430517711172,
+ "grad_norm": 2.7725939750671387,
+ "learning_rate": 1.974212927798663e-06,
+ "loss": 0.1197,
+ "step": 29457
+ },
+ {
+ "epoch": 80.26702997275204,
+ "grad_norm": 3.2645301818847656,
+ "learning_rate": 1.973686510193221e-06,
+ "loss": 0.1733,
+ "step": 29458
+ },
+ {
+ "epoch": 80.26975476839237,
+ "grad_norm": 1.6957669258117676,
+ "learning_rate": 1.973160155096452e-06,
+ "loss": 0.0206,
+ "step": 29459
+ },
+ {
+ "epoch": 80.2724795640327,
+ "grad_norm": 2.67549991607666,
+ "learning_rate": 1.9726338625124488e-06,
+ "loss": 0.0783,
+ "step": 29460
+ },
+ {
+ "epoch": 80.27520435967303,
+ "grad_norm": 2.7992019653320312,
+ "learning_rate": 1.972107632445318e-06,
+ "loss": 0.2081,
+ "step": 29461
+ },
+ {
+ "epoch": 80.27792915531334,
+ "grad_norm": 2.060793161392212,
+ "learning_rate": 1.971581464899155e-06,
+ "loss": 0.0415,
+ "step": 29462
+ },
+ {
+ "epoch": 80.28065395095368,
+ "grad_norm": 2.4207475185394287,
+ "learning_rate": 1.9710553598780534e-06,
+ "loss": 0.0286,
+ "step": 29463
+ },
+ {
+ "epoch": 80.28337874659401,
+ "grad_norm": 2.4379923343658447,
+ "learning_rate": 1.9705293173861182e-06,
+ "loss": 0.087,
+ "step": 29464
+ },
+ {
+ "epoch": 80.28610354223433,
+ "grad_norm": 2.448291301727295,
+ "learning_rate": 1.9700033374274386e-06,
+ "loss": 0.0326,
+ "step": 29465
+ },
+ {
+ "epoch": 80.28882833787466,
+ "grad_norm": 2.084537982940674,
+ "learning_rate": 1.9694774200061175e-06,
+ "loss": 0.0452,
+ "step": 29466
+ },
+ {
+ "epoch": 80.29155313351498,
+ "grad_norm": 3.169152021408081,
+ "learning_rate": 1.9689515651262482e-06,
+ "loss": 0.0483,
+ "step": 29467
+ },
+ {
+ "epoch": 80.29427792915531,
+ "grad_norm": 2.543179988861084,
+ "learning_rate": 1.9684257727919233e-06,
+ "loss": 0.0755,
+ "step": 29468
+ },
+ {
+ "epoch": 80.29700272479565,
+ "grad_norm": 2.1362757682800293,
+ "learning_rate": 1.9679000430072414e-06,
+ "loss": 0.0315,
+ "step": 29469
+ },
+ {
+ "epoch": 80.29972752043597,
+ "grad_norm": 1.747061014175415,
+ "learning_rate": 1.9673743757762963e-06,
+ "loss": 0.0251,
+ "step": 29470
+ },
+ {
+ "epoch": 80.3024523160763,
+ "grad_norm": 1.8823891878128052,
+ "learning_rate": 1.9668487711031804e-06,
+ "loss": 0.0182,
+ "step": 29471
+ },
+ {
+ "epoch": 80.30517711171662,
+ "grad_norm": 3.2333693504333496,
+ "learning_rate": 1.9663232289919854e-06,
+ "loss": 0.1943,
+ "step": 29472
+ },
+ {
+ "epoch": 80.30790190735695,
+ "grad_norm": 2.659660816192627,
+ "learning_rate": 1.9657977494468095e-06,
+ "loss": 0.0508,
+ "step": 29473
+ },
+ {
+ "epoch": 80.31062670299727,
+ "grad_norm": 2.9786505699157715,
+ "learning_rate": 1.9652723324717415e-06,
+ "loss": 0.0924,
+ "step": 29474
+ },
+ {
+ "epoch": 80.3133514986376,
+ "grad_norm": 2.215651273727417,
+ "learning_rate": 1.964746978070875e-06,
+ "loss": 0.0407,
+ "step": 29475
+ },
+ {
+ "epoch": 80.31607629427793,
+ "grad_norm": 2.2558863162994385,
+ "learning_rate": 1.964221686248298e-06,
+ "loss": 0.0474,
+ "step": 29476
+ },
+ {
+ "epoch": 80.31880108991825,
+ "grad_norm": 5.30399751663208,
+ "learning_rate": 1.9636964570081054e-06,
+ "loss": 0.0456,
+ "step": 29477
+ },
+ {
+ "epoch": 80.32152588555859,
+ "grad_norm": 2.3896677494049072,
+ "learning_rate": 1.9631712903543854e-06,
+ "loss": 0.0298,
+ "step": 29478
+ },
+ {
+ "epoch": 80.3242506811989,
+ "grad_norm": 2.5672144889831543,
+ "learning_rate": 1.9626461862912304e-06,
+ "loss": 0.0937,
+ "step": 29479
+ },
+ {
+ "epoch": 80.32697547683924,
+ "grad_norm": 2.6122467517852783,
+ "learning_rate": 1.962121144822725e-06,
+ "loss": 0.055,
+ "step": 29480
+ },
+ {
+ "epoch": 80.32970027247957,
+ "grad_norm": 1.9325565099716187,
+ "learning_rate": 1.9615961659529637e-06,
+ "loss": 0.067,
+ "step": 29481
+ },
+ {
+ "epoch": 80.33242506811989,
+ "grad_norm": 2.978832483291626,
+ "learning_rate": 1.961071249686033e-06,
+ "loss": 0.0476,
+ "step": 29482
+ },
+ {
+ "epoch": 80.33514986376022,
+ "grad_norm": 1.8789916038513184,
+ "learning_rate": 1.9605463960260186e-06,
+ "loss": 0.1755,
+ "step": 29483
+ },
+ {
+ "epoch": 80.33787465940054,
+ "grad_norm": 2.263629198074341,
+ "learning_rate": 1.960021604977009e-06,
+ "loss": 0.0376,
+ "step": 29484
+ },
+ {
+ "epoch": 80.34059945504087,
+ "grad_norm": 3.0086748600006104,
+ "learning_rate": 1.9594968765430956e-06,
+ "loss": 0.1481,
+ "step": 29485
+ },
+ {
+ "epoch": 80.34332425068119,
+ "grad_norm": 2.566378355026245,
+ "learning_rate": 1.9589722107283628e-06,
+ "loss": 0.0287,
+ "step": 29486
+ },
+ {
+ "epoch": 80.34604904632153,
+ "grad_norm": 2.287869930267334,
+ "learning_rate": 1.958447607536894e-06,
+ "loss": 0.0499,
+ "step": 29487
+ },
+ {
+ "epoch": 80.34877384196186,
+ "grad_norm": 2.3460464477539062,
+ "learning_rate": 1.9579230669727745e-06,
+ "loss": 0.0203,
+ "step": 29488
+ },
+ {
+ "epoch": 80.35149863760218,
+ "grad_norm": 4.031327724456787,
+ "learning_rate": 1.957398589040094e-06,
+ "loss": 0.0498,
+ "step": 29489
+ },
+ {
+ "epoch": 80.35422343324251,
+ "grad_norm": 3.1813266277313232,
+ "learning_rate": 1.9568741737429344e-06,
+ "loss": 0.0727,
+ "step": 29490
+ },
+ {
+ "epoch": 80.35694822888283,
+ "grad_norm": 9.18799114227295,
+ "learning_rate": 1.9563498210853792e-06,
+ "loss": 0.1077,
+ "step": 29491
+ },
+ {
+ "epoch": 80.35967302452316,
+ "grad_norm": 1.7899898290634155,
+ "learning_rate": 1.9558255310715103e-06,
+ "loss": 0.02,
+ "step": 29492
+ },
+ {
+ "epoch": 80.3623978201635,
+ "grad_norm": 2.570700168609619,
+ "learning_rate": 1.955301303705417e-06,
+ "loss": 0.0657,
+ "step": 29493
+ },
+ {
+ "epoch": 80.36512261580381,
+ "grad_norm": 2.8046064376831055,
+ "learning_rate": 1.9547771389911774e-06,
+ "loss": 0.0527,
+ "step": 29494
+ },
+ {
+ "epoch": 80.36784741144415,
+ "grad_norm": 2.3152570724487305,
+ "learning_rate": 1.9542530369328738e-06,
+ "loss": 0.0241,
+ "step": 29495
+ },
+ {
+ "epoch": 80.37057220708446,
+ "grad_norm": 2.5495524406433105,
+ "learning_rate": 1.9537289975345876e-06,
+ "loss": 0.0737,
+ "step": 29496
+ },
+ {
+ "epoch": 80.3732970027248,
+ "grad_norm": 2.499063014984131,
+ "learning_rate": 1.9532050208004014e-06,
+ "loss": 0.042,
+ "step": 29497
+ },
+ {
+ "epoch": 80.37602179836512,
+ "grad_norm": 2.108701467514038,
+ "learning_rate": 1.9526811067343977e-06,
+ "loss": 0.0295,
+ "step": 29498
+ },
+ {
+ "epoch": 80.37874659400545,
+ "grad_norm": 2.7002453804016113,
+ "learning_rate": 1.952157255340653e-06,
+ "loss": 0.0809,
+ "step": 29499
+ },
+ {
+ "epoch": 80.38147138964578,
+ "grad_norm": 4.181662082672119,
+ "learning_rate": 1.9516334666232474e-06,
+ "loss": 0.2036,
+ "step": 29500
+ },
+ {
+ "epoch": 80.3841961852861,
+ "grad_norm": 2.412010908126831,
+ "learning_rate": 1.95110974058626e-06,
+ "loss": 0.1952,
+ "step": 29501
+ },
+ {
+ "epoch": 80.38692098092643,
+ "grad_norm": 1.9975512027740479,
+ "learning_rate": 1.950586077233775e-06,
+ "loss": 0.0217,
+ "step": 29502
+ },
+ {
+ "epoch": 80.38964577656675,
+ "grad_norm": 3.2104544639587402,
+ "learning_rate": 1.950062476569865e-06,
+ "loss": 0.0391,
+ "step": 29503
+ },
+ {
+ "epoch": 80.39237057220708,
+ "grad_norm": 2.4745044708251953,
+ "learning_rate": 1.9495389385986076e-06,
+ "loss": 0.0281,
+ "step": 29504
+ },
+ {
+ "epoch": 80.39509536784742,
+ "grad_norm": 3.938070297241211,
+ "learning_rate": 1.9490154633240843e-06,
+ "loss": 0.0378,
+ "step": 29505
+ },
+ {
+ "epoch": 80.39782016348774,
+ "grad_norm": 3.3507866859436035,
+ "learning_rate": 1.948492050750369e-06,
+ "loss": 0.0598,
+ "step": 29506
+ },
+ {
+ "epoch": 80.40054495912807,
+ "grad_norm": 2.580538034439087,
+ "learning_rate": 1.9479687008815396e-06,
+ "loss": 0.058,
+ "step": 29507
+ },
+ {
+ "epoch": 80.40326975476839,
+ "grad_norm": 2.0212392807006836,
+ "learning_rate": 1.947445413721667e-06,
+ "loss": 0.0596,
+ "step": 29508
+ },
+ {
+ "epoch": 80.40599455040872,
+ "grad_norm": 2.680859327316284,
+ "learning_rate": 1.9469221892748337e-06,
+ "loss": 0.1228,
+ "step": 29509
+ },
+ {
+ "epoch": 80.40871934604904,
+ "grad_norm": 2.15167498588562,
+ "learning_rate": 1.9463990275451107e-06,
+ "loss": 0.0312,
+ "step": 29510
+ },
+ {
+ "epoch": 80.41144414168937,
+ "grad_norm": 3.37306809425354,
+ "learning_rate": 1.9458759285365723e-06,
+ "loss": 0.0562,
+ "step": 29511
+ },
+ {
+ "epoch": 80.4141689373297,
+ "grad_norm": 4.165459156036377,
+ "learning_rate": 1.9453528922532915e-06,
+ "loss": 0.1646,
+ "step": 29512
+ },
+ {
+ "epoch": 80.41689373297002,
+ "grad_norm": 10.101032257080078,
+ "learning_rate": 1.944829918699346e-06,
+ "loss": 0.0368,
+ "step": 29513
+ },
+ {
+ "epoch": 80.41961852861036,
+ "grad_norm": 3.278978109359741,
+ "learning_rate": 1.944307007878805e-06,
+ "loss": 0.0734,
+ "step": 29514
+ },
+ {
+ "epoch": 80.42234332425068,
+ "grad_norm": 1.8675167560577393,
+ "learning_rate": 1.943784159795742e-06,
+ "loss": 0.0249,
+ "step": 29515
+ },
+ {
+ "epoch": 80.42506811989101,
+ "grad_norm": 2.862319231033325,
+ "learning_rate": 1.943261374454226e-06,
+ "loss": 0.0537,
+ "step": 29516
+ },
+ {
+ "epoch": 80.42779291553134,
+ "grad_norm": 3.1203036308288574,
+ "learning_rate": 1.9427386518583313e-06,
+ "loss": 0.0373,
+ "step": 29517
+ },
+ {
+ "epoch": 80.43051771117166,
+ "grad_norm": 2.046741247177124,
+ "learning_rate": 1.942215992012131e-06,
+ "loss": 0.0633,
+ "step": 29518
+ },
+ {
+ "epoch": 80.433242506812,
+ "grad_norm": 2.4257113933563232,
+ "learning_rate": 1.9416933949196926e-06,
+ "loss": 0.0294,
+ "step": 29519
+ },
+ {
+ "epoch": 80.43596730245231,
+ "grad_norm": 2.9155521392822266,
+ "learning_rate": 1.9411708605850875e-06,
+ "loss": 0.0995,
+ "step": 29520
+ },
+ {
+ "epoch": 80.43869209809264,
+ "grad_norm": 3.372971534729004,
+ "learning_rate": 1.9406483890123817e-06,
+ "loss": 0.0745,
+ "step": 29521
+ },
+ {
+ "epoch": 80.44141689373296,
+ "grad_norm": 3.321413278579712,
+ "learning_rate": 1.9401259802056495e-06,
+ "loss": 0.0567,
+ "step": 29522
+ },
+ {
+ "epoch": 80.4441416893733,
+ "grad_norm": 2.972351551055908,
+ "learning_rate": 1.939603634168957e-06,
+ "loss": 0.0472,
+ "step": 29523
+ },
+ {
+ "epoch": 80.44686648501363,
+ "grad_norm": 2.0562520027160645,
+ "learning_rate": 1.939081350906369e-06,
+ "loss": 0.0208,
+ "step": 29524
+ },
+ {
+ "epoch": 80.44959128065395,
+ "grad_norm": 2.546272039413452,
+ "learning_rate": 1.9385591304219585e-06,
+ "loss": 0.0519,
+ "step": 29525
+ },
+ {
+ "epoch": 80.45231607629428,
+ "grad_norm": 2.502002239227295,
+ "learning_rate": 1.93803697271979e-06,
+ "loss": 0.0257,
+ "step": 29526
+ },
+ {
+ "epoch": 80.4550408719346,
+ "grad_norm": 1.9413026571273804,
+ "learning_rate": 1.937514877803931e-06,
+ "loss": 0.0201,
+ "step": 29527
+ },
+ {
+ "epoch": 80.45776566757493,
+ "grad_norm": 2.404670000076294,
+ "learning_rate": 1.9369928456784425e-06,
+ "loss": 0.0417,
+ "step": 29528
+ },
+ {
+ "epoch": 80.46049046321527,
+ "grad_norm": 1.6891522407531738,
+ "learning_rate": 1.936470876347398e-06,
+ "loss": 0.1206,
+ "step": 29529
+ },
+ {
+ "epoch": 80.46321525885558,
+ "grad_norm": 2.2138748168945312,
+ "learning_rate": 1.935948969814858e-06,
+ "loss": 0.0304,
+ "step": 29530
+ },
+ {
+ "epoch": 80.46594005449592,
+ "grad_norm": 3.2485358715057373,
+ "learning_rate": 1.935427126084889e-06,
+ "loss": 0.1371,
+ "step": 29531
+ },
+ {
+ "epoch": 80.46866485013624,
+ "grad_norm": 2.471385955810547,
+ "learning_rate": 1.934905345161551e-06,
+ "loss": 0.0367,
+ "step": 29532
+ },
+ {
+ "epoch": 80.47138964577657,
+ "grad_norm": 4.403931140899658,
+ "learning_rate": 1.9343836270489124e-06,
+ "loss": 0.0605,
+ "step": 29533
+ },
+ {
+ "epoch": 80.47411444141689,
+ "grad_norm": 3.497035026550293,
+ "learning_rate": 1.933861971751032e-06,
+ "loss": 0.106,
+ "step": 29534
+ },
+ {
+ "epoch": 80.47683923705722,
+ "grad_norm": 3.98860502243042,
+ "learning_rate": 1.9333403792719783e-06,
+ "loss": 0.0593,
+ "step": 29535
+ },
+ {
+ "epoch": 80.47956403269755,
+ "grad_norm": 1.806820273399353,
+ "learning_rate": 1.9328188496158095e-06,
+ "loss": 0.0182,
+ "step": 29536
+ },
+ {
+ "epoch": 80.48228882833787,
+ "grad_norm": 2.6612436771392822,
+ "learning_rate": 1.9322973827865854e-06,
+ "loss": 0.0582,
+ "step": 29537
+ },
+ {
+ "epoch": 80.4850136239782,
+ "grad_norm": 2.6918468475341797,
+ "learning_rate": 1.9317759787883727e-06,
+ "loss": 0.0577,
+ "step": 29538
+ },
+ {
+ "epoch": 80.48773841961852,
+ "grad_norm": 2.69391131401062,
+ "learning_rate": 1.931254637625228e-06,
+ "loss": 0.0372,
+ "step": 29539
+ },
+ {
+ "epoch": 80.49046321525886,
+ "grad_norm": 3.332688093185425,
+ "learning_rate": 1.9307333593012134e-06,
+ "loss": 0.0772,
+ "step": 29540
+ },
+ {
+ "epoch": 80.49318801089919,
+ "grad_norm": 4.455597400665283,
+ "learning_rate": 1.9302121438203847e-06,
+ "loss": 0.2296,
+ "step": 29541
+ },
+ {
+ "epoch": 80.49591280653951,
+ "grad_norm": 2.459177017211914,
+ "learning_rate": 1.929690991186808e-06,
+ "loss": 0.0352,
+ "step": 29542
+ },
+ {
+ "epoch": 80.49863760217984,
+ "grad_norm": 4.751394748687744,
+ "learning_rate": 1.9291699014045362e-06,
+ "loss": 0.1556,
+ "step": 29543
+ },
+ {
+ "epoch": 80.50136239782016,
+ "grad_norm": 2.685845136642456,
+ "learning_rate": 1.92864887447763e-06,
+ "loss": 0.0608,
+ "step": 29544
+ },
+ {
+ "epoch": 80.50408719346049,
+ "grad_norm": 2.879746675491333,
+ "learning_rate": 1.928127910410145e-06,
+ "loss": 0.1232,
+ "step": 29545
+ },
+ {
+ "epoch": 80.50681198910081,
+ "grad_norm": 2.6398751735687256,
+ "learning_rate": 1.9276070092061414e-06,
+ "loss": 0.0738,
+ "step": 29546
+ },
+ {
+ "epoch": 80.50953678474114,
+ "grad_norm": 2.0282692909240723,
+ "learning_rate": 1.927086170869675e-06,
+ "loss": 0.049,
+ "step": 29547
+ },
+ {
+ "epoch": 80.51226158038148,
+ "grad_norm": 3.3353421688079834,
+ "learning_rate": 1.926565395404799e-06,
+ "loss": 0.0535,
+ "step": 29548
+ },
+ {
+ "epoch": 80.5149863760218,
+ "grad_norm": 7.86765718460083,
+ "learning_rate": 1.9260446828155745e-06,
+ "loss": 0.2399,
+ "step": 29549
+ },
+ {
+ "epoch": 80.51771117166213,
+ "grad_norm": 2.7736849784851074,
+ "learning_rate": 1.9255240331060543e-06,
+ "loss": 0.0579,
+ "step": 29550
+ },
+ {
+ "epoch": 80.52043596730245,
+ "grad_norm": 3.1279215812683105,
+ "learning_rate": 1.92500344628029e-06,
+ "loss": 0.0769,
+ "step": 29551
+ },
+ {
+ "epoch": 80.52316076294278,
+ "grad_norm": 2.62282395362854,
+ "learning_rate": 1.9244829223423424e-06,
+ "loss": 0.0527,
+ "step": 29552
+ },
+ {
+ "epoch": 80.52588555858311,
+ "grad_norm": 2.7637453079223633,
+ "learning_rate": 1.9239624612962593e-06,
+ "loss": 0.3223,
+ "step": 29553
+ },
+ {
+ "epoch": 80.52861035422343,
+ "grad_norm": 2.9348785877227783,
+ "learning_rate": 1.9234420631460982e-06,
+ "loss": 0.0361,
+ "step": 29554
+ },
+ {
+ "epoch": 80.53133514986376,
+ "grad_norm": 2.3062024116516113,
+ "learning_rate": 1.922921727895911e-06,
+ "loss": 0.0804,
+ "step": 29555
+ },
+ {
+ "epoch": 80.53405994550408,
+ "grad_norm": 2.510293960571289,
+ "learning_rate": 1.9224014555497493e-06,
+ "loss": 0.035,
+ "step": 29556
+ },
+ {
+ "epoch": 80.53678474114442,
+ "grad_norm": 3.1365272998809814,
+ "learning_rate": 1.921881246111662e-06,
+ "loss": 0.071,
+ "step": 29557
+ },
+ {
+ "epoch": 80.53950953678473,
+ "grad_norm": 1.9490344524383545,
+ "learning_rate": 1.9213610995857067e-06,
+ "loss": 0.0237,
+ "step": 29558
+ },
+ {
+ "epoch": 80.54223433242507,
+ "grad_norm": 2.332551956176758,
+ "learning_rate": 1.9208410159759316e-06,
+ "loss": 0.0429,
+ "step": 29559
+ },
+ {
+ "epoch": 80.5449591280654,
+ "grad_norm": 2.3657114505767822,
+ "learning_rate": 1.9203209952863866e-06,
+ "loss": 0.0288,
+ "step": 29560
+ },
+ {
+ "epoch": 80.54768392370572,
+ "grad_norm": 2.3163259029388428,
+ "learning_rate": 1.9198010375211185e-06,
+ "loss": 0.0274,
+ "step": 29561
+ },
+ {
+ "epoch": 80.55040871934605,
+ "grad_norm": 2.813373327255249,
+ "learning_rate": 1.919281142684183e-06,
+ "loss": 0.0843,
+ "step": 29562
+ },
+ {
+ "epoch": 80.55313351498637,
+ "grad_norm": 2.549604654312134,
+ "learning_rate": 1.918761310779624e-06,
+ "loss": 0.0838,
+ "step": 29563
+ },
+ {
+ "epoch": 80.5558583106267,
+ "grad_norm": 1.7128933668136597,
+ "learning_rate": 1.9182415418114943e-06,
+ "loss": 0.1445,
+ "step": 29564
+ },
+ {
+ "epoch": 80.55858310626704,
+ "grad_norm": 2.762568473815918,
+ "learning_rate": 1.917721835783836e-06,
+ "loss": 0.1624,
+ "step": 29565
+ },
+ {
+ "epoch": 80.56130790190736,
+ "grad_norm": 2.697061777114868,
+ "learning_rate": 1.9172021927007024e-06,
+ "loss": 0.0706,
+ "step": 29566
+ },
+ {
+ "epoch": 80.56403269754769,
+ "grad_norm": 2.739628791809082,
+ "learning_rate": 1.9166826125661376e-06,
+ "loss": 0.1294,
+ "step": 29567
+ },
+ {
+ "epoch": 80.566757493188,
+ "grad_norm": 2.1490402221679688,
+ "learning_rate": 1.916163095384188e-06,
+ "loss": 0.0579,
+ "step": 29568
+ },
+ {
+ "epoch": 80.56948228882834,
+ "grad_norm": 2.475924015045166,
+ "learning_rate": 1.9156436411588963e-06,
+ "loss": 0.1306,
+ "step": 29569
+ },
+ {
+ "epoch": 80.57220708446866,
+ "grad_norm": 3.805649518966675,
+ "learning_rate": 1.9151242498943155e-06,
+ "loss": 0.127,
+ "step": 29570
+ },
+ {
+ "epoch": 80.57493188010899,
+ "grad_norm": 2.7910525798797607,
+ "learning_rate": 1.9146049215944886e-06,
+ "loss": 0.0492,
+ "step": 29571
+ },
+ {
+ "epoch": 80.57765667574932,
+ "grad_norm": 3.0342190265655518,
+ "learning_rate": 1.914085656263457e-06,
+ "loss": 0.0756,
+ "step": 29572
+ },
+ {
+ "epoch": 80.58038147138964,
+ "grad_norm": 3.363170623779297,
+ "learning_rate": 1.9135664539052634e-06,
+ "loss": 0.1101,
+ "step": 29573
+ },
+ {
+ "epoch": 80.58310626702998,
+ "grad_norm": 2.4629461765289307,
+ "learning_rate": 1.913047314523957e-06,
+ "loss": 0.0563,
+ "step": 29574
+ },
+ {
+ "epoch": 80.5858310626703,
+ "grad_norm": 1.9890810251235962,
+ "learning_rate": 1.9125282381235775e-06,
+ "loss": 0.0379,
+ "step": 29575
+ },
+ {
+ "epoch": 80.58855585831063,
+ "grad_norm": 1.9922795295715332,
+ "learning_rate": 1.912009224708168e-06,
+ "loss": 0.0497,
+ "step": 29576
+ },
+ {
+ "epoch": 80.59128065395096,
+ "grad_norm": 1.87977933883667,
+ "learning_rate": 1.9114902742817675e-06,
+ "loss": 0.0368,
+ "step": 29577
+ },
+ {
+ "epoch": 80.59400544959128,
+ "grad_norm": 3.2104647159576416,
+ "learning_rate": 1.9109713868484235e-06,
+ "loss": 0.0456,
+ "step": 29578
+ },
+ {
+ "epoch": 80.59673024523161,
+ "grad_norm": 1.9903428554534912,
+ "learning_rate": 1.910452562412174e-06,
+ "loss": 0.0478,
+ "step": 29579
+ },
+ {
+ "epoch": 80.59945504087193,
+ "grad_norm": 2.8873534202575684,
+ "learning_rate": 1.9099338009770596e-06,
+ "loss": 0.14,
+ "step": 29580
+ },
+ {
+ "epoch": 80.60217983651226,
+ "grad_norm": 2.1759111881256104,
+ "learning_rate": 1.9094151025471175e-06,
+ "loss": 0.04,
+ "step": 29581
+ },
+ {
+ "epoch": 80.60490463215258,
+ "grad_norm": 3.4681735038757324,
+ "learning_rate": 1.908896467126392e-06,
+ "loss": 0.0684,
+ "step": 29582
+ },
+ {
+ "epoch": 80.60762942779292,
+ "grad_norm": 2.570377826690674,
+ "learning_rate": 1.908377894718921e-06,
+ "loss": 0.0733,
+ "step": 29583
+ },
+ {
+ "epoch": 80.61035422343325,
+ "grad_norm": 3.0153040885925293,
+ "learning_rate": 1.907859385328743e-06,
+ "loss": 0.1376,
+ "step": 29584
+ },
+ {
+ "epoch": 80.61307901907357,
+ "grad_norm": 4.000795841217041,
+ "learning_rate": 1.9073409389598929e-06,
+ "loss": 0.0762,
+ "step": 29585
+ },
+ {
+ "epoch": 80.6158038147139,
+ "grad_norm": 2.1445767879486084,
+ "learning_rate": 1.9068225556164112e-06,
+ "loss": 0.0305,
+ "step": 29586
+ },
+ {
+ "epoch": 80.61852861035422,
+ "grad_norm": 1.8627997636795044,
+ "learning_rate": 1.9063042353023375e-06,
+ "loss": 0.116,
+ "step": 29587
+ },
+ {
+ "epoch": 80.62125340599455,
+ "grad_norm": 2.578044891357422,
+ "learning_rate": 1.9057859780217058e-06,
+ "loss": 0.0274,
+ "step": 29588
+ },
+ {
+ "epoch": 80.62397820163488,
+ "grad_norm": 1.7357089519500732,
+ "learning_rate": 1.9052677837785505e-06,
+ "loss": 0.068,
+ "step": 29589
+ },
+ {
+ "epoch": 80.6267029972752,
+ "grad_norm": 2.2578418254852295,
+ "learning_rate": 1.9047496525769104e-06,
+ "loss": 0.0427,
+ "step": 29590
+ },
+ {
+ "epoch": 80.62942779291554,
+ "grad_norm": 2.87907338142395,
+ "learning_rate": 1.9042315844208203e-06,
+ "loss": 0.0822,
+ "step": 29591
+ },
+ {
+ "epoch": 80.63215258855585,
+ "grad_norm": 3.326517105102539,
+ "learning_rate": 1.9037135793143135e-06,
+ "loss": 0.0258,
+ "step": 29592
+ },
+ {
+ "epoch": 80.63487738419619,
+ "grad_norm": 2.6102454662323,
+ "learning_rate": 1.9031956372614236e-06,
+ "loss": 0.0653,
+ "step": 29593
+ },
+ {
+ "epoch": 80.6376021798365,
+ "grad_norm": 2.579186201095581,
+ "learning_rate": 1.902677758266186e-06,
+ "loss": 0.1855,
+ "step": 29594
+ },
+ {
+ "epoch": 80.64032697547684,
+ "grad_norm": 1.9239168167114258,
+ "learning_rate": 1.9021599423326353e-06,
+ "loss": 0.0207,
+ "step": 29595
+ },
+ {
+ "epoch": 80.64305177111717,
+ "grad_norm": 2.068316698074341,
+ "learning_rate": 1.9016421894648006e-06,
+ "loss": 0.0191,
+ "step": 29596
+ },
+ {
+ "epoch": 80.64577656675749,
+ "grad_norm": 2.4410226345062256,
+ "learning_rate": 1.9011244996667144e-06,
+ "loss": 0.1417,
+ "step": 29597
+ },
+ {
+ "epoch": 80.64850136239782,
+ "grad_norm": 2.3196847438812256,
+ "learning_rate": 1.900606872942413e-06,
+ "loss": 0.0582,
+ "step": 29598
+ },
+ {
+ "epoch": 80.65122615803814,
+ "grad_norm": 2.043778896331787,
+ "learning_rate": 1.9000893092959238e-06,
+ "loss": 0.0334,
+ "step": 29599
+ },
+ {
+ "epoch": 80.65395095367847,
+ "grad_norm": 3.3655807971954346,
+ "learning_rate": 1.8995718087312787e-06,
+ "loss": 0.1447,
+ "step": 29600
+ },
+ {
+ "epoch": 80.65667574931881,
+ "grad_norm": 2.0184550285339355,
+ "learning_rate": 1.8990543712525045e-06,
+ "loss": 0.0302,
+ "step": 29601
+ },
+ {
+ "epoch": 80.65940054495913,
+ "grad_norm": 3.035971164703369,
+ "learning_rate": 1.898536996863637e-06,
+ "loss": 0.0293,
+ "step": 29602
+ },
+ {
+ "epoch": 80.66212534059946,
+ "grad_norm": 2.2015907764434814,
+ "learning_rate": 1.8980196855687005e-06,
+ "loss": 0.0292,
+ "step": 29603
+ },
+ {
+ "epoch": 80.66485013623978,
+ "grad_norm": 3.003671884536743,
+ "learning_rate": 1.8975024373717277e-06,
+ "loss": 0.165,
+ "step": 29604
+ },
+ {
+ "epoch": 80.66757493188011,
+ "grad_norm": 2.6577353477478027,
+ "learning_rate": 1.8969852522767452e-06,
+ "loss": 0.0577,
+ "step": 29605
+ },
+ {
+ "epoch": 80.67029972752043,
+ "grad_norm": 3.1609206199645996,
+ "learning_rate": 1.8964681302877786e-06,
+ "loss": 0.0766,
+ "step": 29606
+ },
+ {
+ "epoch": 80.67302452316076,
+ "grad_norm": 2.8355610370635986,
+ "learning_rate": 1.8959510714088603e-06,
+ "loss": 0.0501,
+ "step": 29607
+ },
+ {
+ "epoch": 80.6757493188011,
+ "grad_norm": 4.325540065765381,
+ "learning_rate": 1.8954340756440137e-06,
+ "loss": 0.0815,
+ "step": 29608
+ },
+ {
+ "epoch": 80.67847411444141,
+ "grad_norm": 3.164767026901245,
+ "learning_rate": 1.8949171429972657e-06,
+ "loss": 0.0952,
+ "step": 29609
+ },
+ {
+ "epoch": 80.68119891008175,
+ "grad_norm": 3.5869052410125732,
+ "learning_rate": 1.8944002734726396e-06,
+ "loss": 0.0416,
+ "step": 29610
+ },
+ {
+ "epoch": 80.68392370572207,
+ "grad_norm": 1.9556015729904175,
+ "learning_rate": 1.8938834670741656e-06,
+ "loss": 0.026,
+ "step": 29611
+ },
+ {
+ "epoch": 80.6866485013624,
+ "grad_norm": 3.7239344120025635,
+ "learning_rate": 1.8933667238058672e-06,
+ "loss": 0.0569,
+ "step": 29612
+ },
+ {
+ "epoch": 80.68937329700273,
+ "grad_norm": 2.3650319576263428,
+ "learning_rate": 1.8928500436717645e-06,
+ "loss": 0.036,
+ "step": 29613
+ },
+ {
+ "epoch": 80.69209809264305,
+ "grad_norm": 2.493445634841919,
+ "learning_rate": 1.8923334266758874e-06,
+ "loss": 0.0907,
+ "step": 29614
+ },
+ {
+ "epoch": 80.69482288828338,
+ "grad_norm": 2.0561065673828125,
+ "learning_rate": 1.8918168728222564e-06,
+ "loss": 0.0496,
+ "step": 29615
+ },
+ {
+ "epoch": 80.6975476839237,
+ "grad_norm": 2.926267385482788,
+ "learning_rate": 1.8913003821148957e-06,
+ "loss": 0.0413,
+ "step": 29616
+ },
+ {
+ "epoch": 80.70027247956403,
+ "grad_norm": 4.192161560058594,
+ "learning_rate": 1.8907839545578233e-06,
+ "loss": 0.0425,
+ "step": 29617
+ },
+ {
+ "epoch": 80.70299727520435,
+ "grad_norm": 2.738772392272949,
+ "learning_rate": 1.890267590155066e-06,
+ "loss": 0.0775,
+ "step": 29618
+ },
+ {
+ "epoch": 80.70572207084469,
+ "grad_norm": 4.501349925994873,
+ "learning_rate": 1.8897512889106451e-06,
+ "loss": 0.1273,
+ "step": 29619
+ },
+ {
+ "epoch": 80.70844686648502,
+ "grad_norm": 3.0270581245422363,
+ "learning_rate": 1.8892350508285773e-06,
+ "loss": 0.0584,
+ "step": 29620
+ },
+ {
+ "epoch": 80.71117166212534,
+ "grad_norm": 3.082486629486084,
+ "learning_rate": 1.8887188759128883e-06,
+ "loss": 0.0452,
+ "step": 29621
+ },
+ {
+ "epoch": 80.71389645776567,
+ "grad_norm": 1.7954591512680054,
+ "learning_rate": 1.8882027641675927e-06,
+ "loss": 0.0294,
+ "step": 29622
+ },
+ {
+ "epoch": 80.71662125340599,
+ "grad_norm": 3.0222692489624023,
+ "learning_rate": 1.887686715596716e-06,
+ "loss": 0.0832,
+ "step": 29623
+ },
+ {
+ "epoch": 80.71934604904632,
+ "grad_norm": 2.030682325363159,
+ "learning_rate": 1.887170730204274e-06,
+ "loss": 0.0511,
+ "step": 29624
+ },
+ {
+ "epoch": 80.72207084468666,
+ "grad_norm": 1.996232271194458,
+ "learning_rate": 1.886654807994286e-06,
+ "loss": 0.0907,
+ "step": 29625
+ },
+ {
+ "epoch": 80.72479564032697,
+ "grad_norm": 5.397789001464844,
+ "learning_rate": 1.8861389489707648e-06,
+ "loss": 0.1492,
+ "step": 29626
+ },
+ {
+ "epoch": 80.7275204359673,
+ "grad_norm": 4.474803447723389,
+ "learning_rate": 1.8856231531377367e-06,
+ "loss": 0.041,
+ "step": 29627
+ },
+ {
+ "epoch": 80.73024523160763,
+ "grad_norm": 2.154280185699463,
+ "learning_rate": 1.8851074204992137e-06,
+ "loss": 0.0496,
+ "step": 29628
+ },
+ {
+ "epoch": 80.73297002724796,
+ "grad_norm": 2.165541887283325,
+ "learning_rate": 1.8845917510592126e-06,
+ "loss": 0.0884,
+ "step": 29629
+ },
+ {
+ "epoch": 80.73569482288828,
+ "grad_norm": 1.7544691562652588,
+ "learning_rate": 1.884076144821747e-06,
+ "loss": 0.0949,
+ "step": 29630
+ },
+ {
+ "epoch": 80.73841961852861,
+ "grad_norm": 1.7653148174285889,
+ "learning_rate": 1.8835606017908382e-06,
+ "loss": 0.0242,
+ "step": 29631
+ },
+ {
+ "epoch": 80.74114441416894,
+ "grad_norm": 2.971686363220215,
+ "learning_rate": 1.883045121970498e-06,
+ "loss": 0.0607,
+ "step": 29632
+ },
+ {
+ "epoch": 80.74386920980926,
+ "grad_norm": 2.4125564098358154,
+ "learning_rate": 1.8825297053647418e-06,
+ "loss": 0.0361,
+ "step": 29633
+ },
+ {
+ "epoch": 80.7465940054496,
+ "grad_norm": 2.2299764156341553,
+ "learning_rate": 1.8820143519775792e-06,
+ "loss": 0.0652,
+ "step": 29634
+ },
+ {
+ "epoch": 80.74931880108991,
+ "grad_norm": 3.280430555343628,
+ "learning_rate": 1.8814990618130313e-06,
+ "loss": 0.1178,
+ "step": 29635
+ },
+ {
+ "epoch": 80.75204359673025,
+ "grad_norm": 2.1842055320739746,
+ "learning_rate": 1.8809838348751065e-06,
+ "loss": 0.0427,
+ "step": 29636
+ },
+ {
+ "epoch": 80.75476839237058,
+ "grad_norm": 2.3917200565338135,
+ "learning_rate": 1.8804686711678167e-06,
+ "loss": 0.0917,
+ "step": 29637
+ },
+ {
+ "epoch": 80.7574931880109,
+ "grad_norm": 2.8943660259246826,
+ "learning_rate": 1.8799535706951743e-06,
+ "loss": 0.0653,
+ "step": 29638
+ },
+ {
+ "epoch": 80.76021798365123,
+ "grad_norm": 4.0513081550598145,
+ "learning_rate": 1.8794385334611953e-06,
+ "loss": 0.0316,
+ "step": 29639
+ },
+ {
+ "epoch": 80.76294277929155,
+ "grad_norm": 5.677994251251221,
+ "learning_rate": 1.8789235594698885e-06,
+ "loss": 0.034,
+ "step": 29640
+ },
+ {
+ "epoch": 80.76566757493188,
+ "grad_norm": 2.3507676124572754,
+ "learning_rate": 1.8784086487252628e-06,
+ "loss": 0.1498,
+ "step": 29641
+ },
+ {
+ "epoch": 80.7683923705722,
+ "grad_norm": 2.821159839630127,
+ "learning_rate": 1.8778938012313263e-06,
+ "loss": 0.1113,
+ "step": 29642
+ },
+ {
+ "epoch": 80.77111716621253,
+ "grad_norm": 2.3692619800567627,
+ "learning_rate": 1.8773790169920947e-06,
+ "loss": 0.0594,
+ "step": 29643
+ },
+ {
+ "epoch": 80.77384196185287,
+ "grad_norm": 2.7331764698028564,
+ "learning_rate": 1.8768642960115735e-06,
+ "loss": 0.0585,
+ "step": 29644
+ },
+ {
+ "epoch": 80.77656675749319,
+ "grad_norm": 3.1903886795043945,
+ "learning_rate": 1.8763496382937718e-06,
+ "loss": 0.0552,
+ "step": 29645
+ },
+ {
+ "epoch": 80.77929155313352,
+ "grad_norm": 8.227446556091309,
+ "learning_rate": 1.8758350438426954e-06,
+ "loss": 0.0899,
+ "step": 29646
+ },
+ {
+ "epoch": 80.78201634877384,
+ "grad_norm": 2.9153196811676025,
+ "learning_rate": 1.8753205126623564e-06,
+ "loss": 0.1175,
+ "step": 29647
+ },
+ {
+ "epoch": 80.78474114441417,
+ "grad_norm": 3.3126773834228516,
+ "learning_rate": 1.8748060447567595e-06,
+ "loss": 0.1439,
+ "step": 29648
+ },
+ {
+ "epoch": 80.7874659400545,
+ "grad_norm": 1.6990525722503662,
+ "learning_rate": 1.8742916401299128e-06,
+ "loss": 0.0241,
+ "step": 29649
+ },
+ {
+ "epoch": 80.79019073569482,
+ "grad_norm": 3.0038223266601562,
+ "learning_rate": 1.8737772987858172e-06,
+ "loss": 0.0768,
+ "step": 29650
+ },
+ {
+ "epoch": 80.79291553133515,
+ "grad_norm": 3.690922498703003,
+ "learning_rate": 1.8732630207284863e-06,
+ "loss": 0.0282,
+ "step": 29651
+ },
+ {
+ "epoch": 80.79564032697547,
+ "grad_norm": 2.6866910457611084,
+ "learning_rate": 1.8727488059619203e-06,
+ "loss": 0.0992,
+ "step": 29652
+ },
+ {
+ "epoch": 80.7983651226158,
+ "grad_norm": 2.986560106277466,
+ "learning_rate": 1.872234654490126e-06,
+ "loss": 0.1254,
+ "step": 29653
+ },
+ {
+ "epoch": 80.80108991825612,
+ "grad_norm": 1.9595917463302612,
+ "learning_rate": 1.8717205663171034e-06,
+ "loss": 0.0236,
+ "step": 29654
+ },
+ {
+ "epoch": 80.80381471389646,
+ "grad_norm": 2.430351734161377,
+ "learning_rate": 1.8712065414468595e-06,
+ "loss": 0.0429,
+ "step": 29655
+ },
+ {
+ "epoch": 80.80653950953679,
+ "grad_norm": 2.9290590286254883,
+ "learning_rate": 1.8706925798833997e-06,
+ "loss": 0.0515,
+ "step": 29656
+ },
+ {
+ "epoch": 80.80926430517711,
+ "grad_norm": 3.7299163341522217,
+ "learning_rate": 1.8701786816307255e-06,
+ "loss": 0.0623,
+ "step": 29657
+ },
+ {
+ "epoch": 80.81198910081744,
+ "grad_norm": 2.51239275932312,
+ "learning_rate": 1.8696648466928347e-06,
+ "loss": 0.1859,
+ "step": 29658
+ },
+ {
+ "epoch": 80.81471389645776,
+ "grad_norm": 2.1915643215179443,
+ "learning_rate": 1.8691510750737352e-06,
+ "loss": 0.0233,
+ "step": 29659
+ },
+ {
+ "epoch": 80.8174386920981,
+ "grad_norm": 2.2097456455230713,
+ "learning_rate": 1.8686373667774248e-06,
+ "loss": 0.0321,
+ "step": 29660
+ },
+ {
+ "epoch": 80.82016348773843,
+ "grad_norm": 2.278515577316284,
+ "learning_rate": 1.8681237218079063e-06,
+ "loss": 0.0328,
+ "step": 29661
+ },
+ {
+ "epoch": 80.82288828337875,
+ "grad_norm": 4.386941432952881,
+ "learning_rate": 1.8676101401691748e-06,
+ "loss": 0.103,
+ "step": 29662
+ },
+ {
+ "epoch": 80.82561307901908,
+ "grad_norm": 3.178586483001709,
+ "learning_rate": 1.8670966218652365e-06,
+ "loss": 0.114,
+ "step": 29663
+ },
+ {
+ "epoch": 80.8283378746594,
+ "grad_norm": 2.8836803436279297,
+ "learning_rate": 1.866583166900089e-06,
+ "loss": 0.0487,
+ "step": 29664
+ },
+ {
+ "epoch": 80.83106267029973,
+ "grad_norm": 2.9946720600128174,
+ "learning_rate": 1.866069775277729e-06,
+ "loss": 0.0349,
+ "step": 29665
+ },
+ {
+ "epoch": 80.83378746594005,
+ "grad_norm": 2.5141279697418213,
+ "learning_rate": 1.8655564470021526e-06,
+ "loss": 0.0285,
+ "step": 29666
+ },
+ {
+ "epoch": 80.83651226158038,
+ "grad_norm": 2.748910427093506,
+ "learning_rate": 1.8650431820773651e-06,
+ "loss": 0.0798,
+ "step": 29667
+ },
+ {
+ "epoch": 80.83923705722071,
+ "grad_norm": 2.2487642765045166,
+ "learning_rate": 1.864529980507358e-06,
+ "loss": 0.0364,
+ "step": 29668
+ },
+ {
+ "epoch": 80.84196185286103,
+ "grad_norm": 1.5930827856063843,
+ "learning_rate": 1.8640168422961303e-06,
+ "loss": 0.0229,
+ "step": 29669
+ },
+ {
+ "epoch": 80.84468664850137,
+ "grad_norm": 4.5194292068481445,
+ "learning_rate": 1.8635037674476752e-06,
+ "loss": 0.1947,
+ "step": 29670
+ },
+ {
+ "epoch": 80.84741144414168,
+ "grad_norm": 3.067448139190674,
+ "learning_rate": 1.8629907559659922e-06,
+ "loss": 0.0555,
+ "step": 29671
+ },
+ {
+ "epoch": 80.85013623978202,
+ "grad_norm": 2.2344095706939697,
+ "learning_rate": 1.8624778078550743e-06,
+ "loss": 0.0264,
+ "step": 29672
+ },
+ {
+ "epoch": 80.85286103542235,
+ "grad_norm": 2.330422878265381,
+ "learning_rate": 1.8619649231189186e-06,
+ "loss": 0.0391,
+ "step": 29673
+ },
+ {
+ "epoch": 80.85558583106267,
+ "grad_norm": 2.7653892040252686,
+ "learning_rate": 1.8614521017615196e-06,
+ "loss": 0.0508,
+ "step": 29674
+ },
+ {
+ "epoch": 80.858310626703,
+ "grad_norm": 2.0616846084594727,
+ "learning_rate": 1.8609393437868662e-06,
+ "loss": 0.1164,
+ "step": 29675
+ },
+ {
+ "epoch": 80.86103542234332,
+ "grad_norm": 2.1021788120269775,
+ "learning_rate": 1.8604266491989575e-06,
+ "loss": 0.0286,
+ "step": 29676
+ },
+ {
+ "epoch": 80.86376021798365,
+ "grad_norm": 2.714175224304199,
+ "learning_rate": 1.859914018001785e-06,
+ "loss": 0.0982,
+ "step": 29677
+ },
+ {
+ "epoch": 80.86648501362397,
+ "grad_norm": 1.7867244482040405,
+ "learning_rate": 1.8594014501993362e-06,
+ "loss": 0.0801,
+ "step": 29678
+ },
+ {
+ "epoch": 80.8692098092643,
+ "grad_norm": 2.017289876937866,
+ "learning_rate": 1.8588889457956106e-06,
+ "loss": 0.0291,
+ "step": 29679
+ },
+ {
+ "epoch": 80.87193460490464,
+ "grad_norm": 1.6092020273208618,
+ "learning_rate": 1.8583765047945956e-06,
+ "loss": 0.0186,
+ "step": 29680
+ },
+ {
+ "epoch": 80.87465940054496,
+ "grad_norm": 3.8612475395202637,
+ "learning_rate": 1.8578641272002818e-06,
+ "loss": 0.1904,
+ "step": 29681
+ },
+ {
+ "epoch": 80.87738419618529,
+ "grad_norm": 3.600154399871826,
+ "learning_rate": 1.857351813016659e-06,
+ "loss": 0.0456,
+ "step": 29682
+ },
+ {
+ "epoch": 80.88010899182561,
+ "grad_norm": 2.4364824295043945,
+ "learning_rate": 1.8568395622477198e-06,
+ "loss": 0.025,
+ "step": 29683
+ },
+ {
+ "epoch": 80.88283378746594,
+ "grad_norm": 4.23787260055542,
+ "learning_rate": 1.856327374897452e-06,
+ "loss": 0.1376,
+ "step": 29684
+ },
+ {
+ "epoch": 80.88555858310627,
+ "grad_norm": 2.548859119415283,
+ "learning_rate": 1.8558152509698446e-06,
+ "loss": 0.038,
+ "step": 29685
+ },
+ {
+ "epoch": 80.88828337874659,
+ "grad_norm": 1.9448168277740479,
+ "learning_rate": 1.8553031904688833e-06,
+ "loss": 0.0614,
+ "step": 29686
+ },
+ {
+ "epoch": 80.89100817438693,
+ "grad_norm": 3.829408884048462,
+ "learning_rate": 1.8547911933985607e-06,
+ "loss": 0.2498,
+ "step": 29687
+ },
+ {
+ "epoch": 80.89373297002724,
+ "grad_norm": 2.3729562759399414,
+ "learning_rate": 1.8542792597628622e-06,
+ "loss": 0.0553,
+ "step": 29688
+ },
+ {
+ "epoch": 80.89645776566758,
+ "grad_norm": 2.532068967819214,
+ "learning_rate": 1.8537673895657726e-06,
+ "loss": 0.0325,
+ "step": 29689
+ },
+ {
+ "epoch": 80.8991825613079,
+ "grad_norm": 2.1381380558013916,
+ "learning_rate": 1.853255582811283e-06,
+ "loss": 0.0198,
+ "step": 29690
+ },
+ {
+ "epoch": 80.90190735694823,
+ "grad_norm": 2.2383947372436523,
+ "learning_rate": 1.8527438395033747e-06,
+ "loss": 0.0384,
+ "step": 29691
+ },
+ {
+ "epoch": 80.90463215258856,
+ "grad_norm": 3.122887372970581,
+ "learning_rate": 1.8522321596460368e-06,
+ "loss": 0.0869,
+ "step": 29692
+ },
+ {
+ "epoch": 80.90735694822888,
+ "grad_norm": 3.0096633434295654,
+ "learning_rate": 1.8517205432432527e-06,
+ "loss": 0.0855,
+ "step": 29693
+ },
+ {
+ "epoch": 80.91008174386921,
+ "grad_norm": 3.814385175704956,
+ "learning_rate": 1.851208990299007e-06,
+ "loss": 0.0641,
+ "step": 29694
+ },
+ {
+ "epoch": 80.91280653950953,
+ "grad_norm": 3.931626319885254,
+ "learning_rate": 1.850697500817281e-06,
+ "loss": 0.075,
+ "step": 29695
+ },
+ {
+ "epoch": 80.91553133514986,
+ "grad_norm": 2.4536795616149902,
+ "learning_rate": 1.8501860748020629e-06,
+ "loss": 0.0468,
+ "step": 29696
+ },
+ {
+ "epoch": 80.9182561307902,
+ "grad_norm": 10.569121360778809,
+ "learning_rate": 1.8496747122573333e-06,
+ "loss": 0.0817,
+ "step": 29697
+ },
+ {
+ "epoch": 80.92098092643052,
+ "grad_norm": 2.4495747089385986,
+ "learning_rate": 1.8491634131870716e-06,
+ "loss": 0.1734,
+ "step": 29698
+ },
+ {
+ "epoch": 80.92370572207085,
+ "grad_norm": 2.783935785293579,
+ "learning_rate": 1.848652177595267e-06,
+ "loss": 0.0599,
+ "step": 29699
+ },
+ {
+ "epoch": 80.92643051771117,
+ "grad_norm": 1.924935221672058,
+ "learning_rate": 1.848141005485895e-06,
+ "loss": 0.0269,
+ "step": 29700
+ },
+ {
+ "epoch": 80.9291553133515,
+ "grad_norm": 5.172467231750488,
+ "learning_rate": 1.8476298968629401e-06,
+ "loss": 0.0405,
+ "step": 29701
+ },
+ {
+ "epoch": 80.93188010899182,
+ "grad_norm": 2.371753215789795,
+ "learning_rate": 1.8471188517303774e-06,
+ "loss": 0.0359,
+ "step": 29702
+ },
+ {
+ "epoch": 80.93460490463215,
+ "grad_norm": 2.5195109844207764,
+ "learning_rate": 1.846607870092194e-06,
+ "loss": 0.0991,
+ "step": 29703
+ },
+ {
+ "epoch": 80.93732970027249,
+ "grad_norm": 2.765890598297119,
+ "learning_rate": 1.8460969519523664e-06,
+ "loss": 0.0414,
+ "step": 29704
+ },
+ {
+ "epoch": 80.9400544959128,
+ "grad_norm": 3.039405584335327,
+ "learning_rate": 1.845586097314872e-06,
+ "loss": 0.047,
+ "step": 29705
+ },
+ {
+ "epoch": 80.94277929155314,
+ "grad_norm": 3.6830575466156006,
+ "learning_rate": 1.845075306183689e-06,
+ "loss": 0.0483,
+ "step": 29706
+ },
+ {
+ "epoch": 80.94550408719346,
+ "grad_norm": 2.1750757694244385,
+ "learning_rate": 1.8445645785627974e-06,
+ "loss": 0.1033,
+ "step": 29707
+ },
+ {
+ "epoch": 80.94822888283379,
+ "grad_norm": 3.339379072189331,
+ "learning_rate": 1.8440539144561763e-06,
+ "loss": 0.0714,
+ "step": 29708
+ },
+ {
+ "epoch": 80.95095367847412,
+ "grad_norm": 2.8890480995178223,
+ "learning_rate": 1.8435433138678017e-06,
+ "loss": 0.1083,
+ "step": 29709
+ },
+ {
+ "epoch": 80.95367847411444,
+ "grad_norm": 2.765408992767334,
+ "learning_rate": 1.8430327768016475e-06,
+ "loss": 0.0389,
+ "step": 29710
+ },
+ {
+ "epoch": 80.95640326975477,
+ "grad_norm": 2.0470902919769287,
+ "learning_rate": 1.84252230326169e-06,
+ "loss": 0.0867,
+ "step": 29711
+ },
+ {
+ "epoch": 80.95912806539509,
+ "grad_norm": 2.717745780944824,
+ "learning_rate": 1.8420118932519092e-06,
+ "loss": 0.0569,
+ "step": 29712
+ },
+ {
+ "epoch": 80.96185286103542,
+ "grad_norm": 3.666560411453247,
+ "learning_rate": 1.8415015467762764e-06,
+ "loss": 0.0859,
+ "step": 29713
+ },
+ {
+ "epoch": 80.96457765667574,
+ "grad_norm": 3.9778239727020264,
+ "learning_rate": 1.8409912638387684e-06,
+ "loss": 0.0852,
+ "step": 29714
+ },
+ {
+ "epoch": 80.96730245231608,
+ "grad_norm": 3.1109132766723633,
+ "learning_rate": 1.840481044443354e-06,
+ "loss": 0.0373,
+ "step": 29715
+ },
+ {
+ "epoch": 80.97002724795641,
+ "grad_norm": 2.45131778717041,
+ "learning_rate": 1.8399708885940136e-06,
+ "loss": 0.0559,
+ "step": 29716
+ },
+ {
+ "epoch": 80.97275204359673,
+ "grad_norm": 3.836390495300293,
+ "learning_rate": 1.8394607962947164e-06,
+ "loss": 0.0799,
+ "step": 29717
+ },
+ {
+ "epoch": 80.97547683923706,
+ "grad_norm": 2.3351268768310547,
+ "learning_rate": 1.8389507675494367e-06,
+ "loss": 0.025,
+ "step": 29718
+ },
+ {
+ "epoch": 80.97820163487738,
+ "grad_norm": 2.296884775161743,
+ "learning_rate": 1.8384408023621437e-06,
+ "loss": 0.1174,
+ "step": 29719
+ },
+ {
+ "epoch": 80.98092643051771,
+ "grad_norm": 1.9378864765167236,
+ "learning_rate": 1.8379309007368129e-06,
+ "loss": 0.1176,
+ "step": 29720
+ },
+ {
+ "epoch": 80.98365122615803,
+ "grad_norm": 2.872282028198242,
+ "learning_rate": 1.8374210626774137e-06,
+ "loss": 0.0511,
+ "step": 29721
+ },
+ {
+ "epoch": 80.98637602179836,
+ "grad_norm": 1.8208796977996826,
+ "learning_rate": 1.8369112881879136e-06,
+ "loss": 0.0693,
+ "step": 29722
+ },
+ {
+ "epoch": 80.9891008174387,
+ "grad_norm": 2.248429298400879,
+ "learning_rate": 1.8364015772722887e-06,
+ "loss": 0.0229,
+ "step": 29723
+ },
+ {
+ "epoch": 80.99182561307902,
+ "grad_norm": 4.804901123046875,
+ "learning_rate": 1.8358919299345024e-06,
+ "loss": 0.0479,
+ "step": 29724
+ },
+ {
+ "epoch": 80.99455040871935,
+ "grad_norm": 2.6181886196136475,
+ "learning_rate": 1.8353823461785304e-06,
+ "loss": 0.0536,
+ "step": 29725
+ },
+ {
+ "epoch": 80.99727520435967,
+ "grad_norm": 2.9905195236206055,
+ "learning_rate": 1.834872826008338e-06,
+ "loss": 0.0317,
+ "step": 29726
+ },
+ {
+ "epoch": 81.0,
+ "grad_norm": 2.4764912128448486,
+ "learning_rate": 1.8343633694278895e-06,
+ "loss": 0.0516,
+ "step": 29727
+ },
+ {
+ "epoch": 81.00272479564033,
+ "grad_norm": 2.7293291091918945,
+ "learning_rate": 1.83385397644116e-06,
+ "loss": 0.0323,
+ "step": 29728
+ },
+ {
+ "epoch": 81.00544959128065,
+ "grad_norm": 2.3819448947906494,
+ "learning_rate": 1.8333446470521122e-06,
+ "loss": 0.064,
+ "step": 29729
+ },
+ {
+ "epoch": 81.00817438692098,
+ "grad_norm": 3.2576510906219482,
+ "learning_rate": 1.8328353812647136e-06,
+ "loss": 0.0536,
+ "step": 29730
+ },
+ {
+ "epoch": 81.0108991825613,
+ "grad_norm": 2.521439552307129,
+ "learning_rate": 1.8323261790829283e-06,
+ "loss": 0.1308,
+ "step": 29731
+ },
+ {
+ "epoch": 81.01362397820164,
+ "grad_norm": 2.4987714290618896,
+ "learning_rate": 1.831817040510726e-06,
+ "loss": 0.0503,
+ "step": 29732
+ },
+ {
+ "epoch": 81.01634877384195,
+ "grad_norm": 2.5798354148864746,
+ "learning_rate": 1.8313079655520693e-06,
+ "loss": 0.0357,
+ "step": 29733
+ },
+ {
+ "epoch": 81.01907356948229,
+ "grad_norm": 2.3716537952423096,
+ "learning_rate": 1.8307989542109238e-06,
+ "loss": 0.1051,
+ "step": 29734
+ },
+ {
+ "epoch": 81.02179836512262,
+ "grad_norm": 2.076399564743042,
+ "learning_rate": 1.83029000649125e-06,
+ "loss": 0.0361,
+ "step": 29735
+ },
+ {
+ "epoch": 81.02452316076294,
+ "grad_norm": 1.5192015171051025,
+ "learning_rate": 1.8297811223970174e-06,
+ "loss": 0.0232,
+ "step": 29736
+ },
+ {
+ "epoch": 81.02724795640327,
+ "grad_norm": 1.9292784929275513,
+ "learning_rate": 1.8292723019321867e-06,
+ "loss": 0.0476,
+ "step": 29737
+ },
+ {
+ "epoch": 81.02997275204359,
+ "grad_norm": 2.645071268081665,
+ "learning_rate": 1.8287635451007202e-06,
+ "loss": 0.0393,
+ "step": 29738
+ },
+ {
+ "epoch": 81.03269754768392,
+ "grad_norm": 4.546024799346924,
+ "learning_rate": 1.8282548519065778e-06,
+ "loss": 0.2184,
+ "step": 29739
+ },
+ {
+ "epoch": 81.03542234332426,
+ "grad_norm": 2.8581202030181885,
+ "learning_rate": 1.8277462223537257e-06,
+ "loss": 0.0244,
+ "step": 29740
+ },
+ {
+ "epoch": 81.03814713896458,
+ "grad_norm": 1.6781800985336304,
+ "learning_rate": 1.8272376564461203e-06,
+ "loss": 0.0252,
+ "step": 29741
+ },
+ {
+ "epoch": 81.04087193460491,
+ "grad_norm": 2.3823750019073486,
+ "learning_rate": 1.8267291541877287e-06,
+ "loss": 0.0301,
+ "step": 29742
+ },
+ {
+ "epoch": 81.04359673024523,
+ "grad_norm": 2.648144483566284,
+ "learning_rate": 1.826220715582504e-06,
+ "loss": 0.148,
+ "step": 29743
+ },
+ {
+ "epoch": 81.04632152588556,
+ "grad_norm": 2.7481918334960938,
+ "learning_rate": 1.8257123406344125e-06,
+ "loss": 0.0814,
+ "step": 29744
+ },
+ {
+ "epoch": 81.04904632152588,
+ "grad_norm": 2.714812994003296,
+ "learning_rate": 1.8252040293474093e-06,
+ "loss": 0.0236,
+ "step": 29745
+ },
+ {
+ "epoch": 81.05177111716621,
+ "grad_norm": 2.4104068279266357,
+ "learning_rate": 1.824695781725454e-06,
+ "loss": 0.0238,
+ "step": 29746
+ },
+ {
+ "epoch": 81.05449591280654,
+ "grad_norm": 2.3135838508605957,
+ "learning_rate": 1.8241875977725032e-06,
+ "loss": 0.0279,
+ "step": 29747
+ },
+ {
+ "epoch": 81.05722070844686,
+ "grad_norm": 2.8281619548797607,
+ "learning_rate": 1.823679477492518e-06,
+ "loss": 0.0625,
+ "step": 29748
+ },
+ {
+ "epoch": 81.0599455040872,
+ "grad_norm": 2.4785587787628174,
+ "learning_rate": 1.8231714208894547e-06,
+ "loss": 0.2692,
+ "step": 29749
+ },
+ {
+ "epoch": 81.06267029972751,
+ "grad_norm": 2.241762161254883,
+ "learning_rate": 1.8226634279672684e-06,
+ "loss": 0.0283,
+ "step": 29750
+ },
+ {
+ "epoch": 81.06539509536785,
+ "grad_norm": 1.611305832862854,
+ "learning_rate": 1.822155498729914e-06,
+ "loss": 0.0215,
+ "step": 29751
+ },
+ {
+ "epoch": 81.06811989100818,
+ "grad_norm": 4.047661781311035,
+ "learning_rate": 1.8216476331813516e-06,
+ "loss": 0.18,
+ "step": 29752
+ },
+ {
+ "epoch": 81.0708446866485,
+ "grad_norm": 2.6989967823028564,
+ "learning_rate": 1.8211398313255347e-06,
+ "loss": 0.0994,
+ "step": 29753
+ },
+ {
+ "epoch": 81.07356948228883,
+ "grad_norm": 2.2276933193206787,
+ "learning_rate": 1.8206320931664168e-06,
+ "loss": 0.058,
+ "step": 29754
+ },
+ {
+ "epoch": 81.07629427792915,
+ "grad_norm": 2.4780147075653076,
+ "learning_rate": 1.8201244187079514e-06,
+ "loss": 0.0956,
+ "step": 29755
+ },
+ {
+ "epoch": 81.07901907356948,
+ "grad_norm": 2.6041982173919678,
+ "learning_rate": 1.8196168079540954e-06,
+ "loss": 0.1367,
+ "step": 29756
+ },
+ {
+ "epoch": 81.0817438692098,
+ "grad_norm": 2.5354366302490234,
+ "learning_rate": 1.8191092609088e-06,
+ "loss": 0.0642,
+ "step": 29757
+ },
+ {
+ "epoch": 81.08446866485014,
+ "grad_norm": 3.1977767944335938,
+ "learning_rate": 1.8186017775760167e-06,
+ "loss": 0.063,
+ "step": 29758
+ },
+ {
+ "epoch": 81.08719346049047,
+ "grad_norm": 2.9032578468322754,
+ "learning_rate": 1.818094357959702e-06,
+ "loss": 0.0409,
+ "step": 29759
+ },
+ {
+ "epoch": 81.08991825613079,
+ "grad_norm": 3.4103946685791016,
+ "learning_rate": 1.8175870020638032e-06,
+ "loss": 0.0905,
+ "step": 29760
+ },
+ {
+ "epoch": 81.09264305177112,
+ "grad_norm": 2.9289729595184326,
+ "learning_rate": 1.8170797098922744e-06,
+ "loss": 0.0762,
+ "step": 29761
+ },
+ {
+ "epoch": 81.09536784741144,
+ "grad_norm": 4.693163871765137,
+ "learning_rate": 1.8165724814490671e-06,
+ "loss": 0.0816,
+ "step": 29762
+ },
+ {
+ "epoch": 81.09809264305177,
+ "grad_norm": 2.403782844543457,
+ "learning_rate": 1.816065316738126e-06,
+ "loss": 0.0336,
+ "step": 29763
+ },
+ {
+ "epoch": 81.1008174386921,
+ "grad_norm": 2.709383964538574,
+ "learning_rate": 1.8155582157634077e-06,
+ "loss": 0.0806,
+ "step": 29764
+ },
+ {
+ "epoch": 81.10354223433242,
+ "grad_norm": 2.2318778038024902,
+ "learning_rate": 1.8150511785288593e-06,
+ "loss": 0.0926,
+ "step": 29765
+ },
+ {
+ "epoch": 81.10626702997276,
+ "grad_norm": 2.6320977210998535,
+ "learning_rate": 1.8145442050384287e-06,
+ "loss": 0.0997,
+ "step": 29766
+ },
+ {
+ "epoch": 81.10899182561307,
+ "grad_norm": 2.7063615322113037,
+ "learning_rate": 1.8140372952960617e-06,
+ "loss": 0.0531,
+ "step": 29767
+ },
+ {
+ "epoch": 81.11171662125341,
+ "grad_norm": 2.643054485321045,
+ "learning_rate": 1.8135304493057104e-06,
+ "loss": 0.1194,
+ "step": 29768
+ },
+ {
+ "epoch": 81.11444141689373,
+ "grad_norm": 1.9962857961654663,
+ "learning_rate": 1.813023667071322e-06,
+ "loss": 0.0352,
+ "step": 29769
+ },
+ {
+ "epoch": 81.11716621253406,
+ "grad_norm": 2.9487380981445312,
+ "learning_rate": 1.8125169485968409e-06,
+ "loss": 0.0857,
+ "step": 29770
+ },
+ {
+ "epoch": 81.11989100817439,
+ "grad_norm": 3.3684611320495605,
+ "learning_rate": 1.8120102938862115e-06,
+ "loss": 0.0842,
+ "step": 29771
+ },
+ {
+ "epoch": 81.12261580381471,
+ "grad_norm": 2.9693615436553955,
+ "learning_rate": 1.8115037029433857e-06,
+ "loss": 0.0575,
+ "step": 29772
+ },
+ {
+ "epoch": 81.12534059945504,
+ "grad_norm": 2.80663800239563,
+ "learning_rate": 1.8109971757723055e-06,
+ "loss": 0.0278,
+ "step": 29773
+ },
+ {
+ "epoch": 81.12806539509536,
+ "grad_norm": 16.64714241027832,
+ "learning_rate": 1.8104907123769155e-06,
+ "loss": 0.0515,
+ "step": 29774
+ },
+ {
+ "epoch": 81.1307901907357,
+ "grad_norm": 2.446871042251587,
+ "learning_rate": 1.8099843127611572e-06,
+ "loss": 0.1008,
+ "step": 29775
+ },
+ {
+ "epoch": 81.13351498637603,
+ "grad_norm": 2.202486753463745,
+ "learning_rate": 1.8094779769289782e-06,
+ "loss": 0.0224,
+ "step": 29776
+ },
+ {
+ "epoch": 81.13623978201635,
+ "grad_norm": 2.504746913909912,
+ "learning_rate": 1.8089717048843236e-06,
+ "loss": 0.1461,
+ "step": 29777
+ },
+ {
+ "epoch": 81.13896457765668,
+ "grad_norm": 4.355173587799072,
+ "learning_rate": 1.8084654966311333e-06,
+ "loss": 0.0335,
+ "step": 29778
+ },
+ {
+ "epoch": 81.141689373297,
+ "grad_norm": 3.3645434379577637,
+ "learning_rate": 1.8079593521733496e-06,
+ "loss": 0.0375,
+ "step": 29779
+ },
+ {
+ "epoch": 81.14441416893733,
+ "grad_norm": 2.8605713844299316,
+ "learning_rate": 1.8074532715149129e-06,
+ "loss": 0.0259,
+ "step": 29780
+ },
+ {
+ "epoch": 81.14713896457765,
+ "grad_norm": 5.118342876434326,
+ "learning_rate": 1.806947254659769e-06,
+ "loss": 0.0438,
+ "step": 29781
+ },
+ {
+ "epoch": 81.14986376021798,
+ "grad_norm": 2.464529275894165,
+ "learning_rate": 1.8064413016118566e-06,
+ "loss": 0.0957,
+ "step": 29782
+ },
+ {
+ "epoch": 81.15258855585832,
+ "grad_norm": 3.3721847534179688,
+ "learning_rate": 1.805935412375115e-06,
+ "loss": 0.0667,
+ "step": 29783
+ },
+ {
+ "epoch": 81.15531335149863,
+ "grad_norm": 2.146632671356201,
+ "learning_rate": 1.8054295869534822e-06,
+ "loss": 0.0327,
+ "step": 29784
+ },
+ {
+ "epoch": 81.15803814713897,
+ "grad_norm": 2.9291207790374756,
+ "learning_rate": 1.8049238253509027e-06,
+ "loss": 0.0807,
+ "step": 29785
+ },
+ {
+ "epoch": 81.16076294277929,
+ "grad_norm": 3.279160976409912,
+ "learning_rate": 1.8044181275713136e-06,
+ "loss": 0.0594,
+ "step": 29786
+ },
+ {
+ "epoch": 81.16348773841962,
+ "grad_norm": 2.5780253410339355,
+ "learning_rate": 1.803912493618648e-06,
+ "loss": 0.197,
+ "step": 29787
+ },
+ {
+ "epoch": 81.16621253405995,
+ "grad_norm": 3.292588710784912,
+ "learning_rate": 1.8034069234968521e-06,
+ "loss": 0.0959,
+ "step": 29788
+ },
+ {
+ "epoch": 81.16893732970027,
+ "grad_norm": 2.65609073638916,
+ "learning_rate": 1.802901417209859e-06,
+ "loss": 0.0677,
+ "step": 29789
+ },
+ {
+ "epoch": 81.1716621253406,
+ "grad_norm": 3.3790442943573,
+ "learning_rate": 1.802395974761605e-06,
+ "loss": 0.0349,
+ "step": 29790
+ },
+ {
+ "epoch": 81.17438692098092,
+ "grad_norm": 3.52130126953125,
+ "learning_rate": 1.8018905961560252e-06,
+ "loss": 0.2011,
+ "step": 29791
+ },
+ {
+ "epoch": 81.17711171662125,
+ "grad_norm": 2.5949528217315674,
+ "learning_rate": 1.8013852813970578e-06,
+ "loss": 0.0688,
+ "step": 29792
+ },
+ {
+ "epoch": 81.17983651226157,
+ "grad_norm": 2.531221628189087,
+ "learning_rate": 1.800880030488641e-06,
+ "loss": 0.0314,
+ "step": 29793
+ },
+ {
+ "epoch": 81.1825613079019,
+ "grad_norm": 2.031641721725464,
+ "learning_rate": 1.8003748434347056e-06,
+ "loss": 0.0306,
+ "step": 29794
+ },
+ {
+ "epoch": 81.18528610354224,
+ "grad_norm": 2.294825553894043,
+ "learning_rate": 1.7998697202391879e-06,
+ "loss": 0.0275,
+ "step": 29795
+ },
+ {
+ "epoch": 81.18801089918256,
+ "grad_norm": 2.5791168212890625,
+ "learning_rate": 1.7993646609060178e-06,
+ "loss": 0.1291,
+ "step": 29796
+ },
+ {
+ "epoch": 81.19073569482289,
+ "grad_norm": 2.418940782546997,
+ "learning_rate": 1.7988596654391344e-06,
+ "loss": 0.0325,
+ "step": 29797
+ },
+ {
+ "epoch": 81.19346049046321,
+ "grad_norm": 2.2982542514801025,
+ "learning_rate": 1.7983547338424679e-06,
+ "loss": 0.0644,
+ "step": 29798
+ },
+ {
+ "epoch": 81.19618528610354,
+ "grad_norm": 2.1509060859680176,
+ "learning_rate": 1.7978498661199517e-06,
+ "loss": 0.0413,
+ "step": 29799
+ },
+ {
+ "epoch": 81.19891008174388,
+ "grad_norm": 2.949258327484131,
+ "learning_rate": 1.7973450622755128e-06,
+ "loss": 0.0663,
+ "step": 29800
+ },
+ {
+ "epoch": 81.2016348773842,
+ "grad_norm": 3.26342511177063,
+ "learning_rate": 1.7968403223130903e-06,
+ "loss": 0.0394,
+ "step": 29801
+ },
+ {
+ "epoch": 81.20435967302453,
+ "grad_norm": 1.684457778930664,
+ "learning_rate": 1.79633564623661e-06,
+ "loss": 0.0191,
+ "step": 29802
+ },
+ {
+ "epoch": 81.20708446866485,
+ "grad_norm": 2.2108731269836426,
+ "learning_rate": 1.7958310340500052e-06,
+ "loss": 0.0283,
+ "step": 29803
+ },
+ {
+ "epoch": 81.20980926430518,
+ "grad_norm": 1.8673276901245117,
+ "learning_rate": 1.7953264857572007e-06,
+ "loss": 0.03,
+ "step": 29804
+ },
+ {
+ "epoch": 81.2125340599455,
+ "grad_norm": 2.0287740230560303,
+ "learning_rate": 1.794822001362132e-06,
+ "loss": 0.0336,
+ "step": 29805
+ },
+ {
+ "epoch": 81.21525885558583,
+ "grad_norm": 3.3488810062408447,
+ "learning_rate": 1.7943175808687263e-06,
+ "loss": 0.0333,
+ "step": 29806
+ },
+ {
+ "epoch": 81.21798365122616,
+ "grad_norm": 4.035453796386719,
+ "learning_rate": 1.793813224280908e-06,
+ "loss": 0.1081,
+ "step": 29807
+ },
+ {
+ "epoch": 81.22070844686648,
+ "grad_norm": 1.9230246543884277,
+ "learning_rate": 1.793308931602611e-06,
+ "loss": 0.0775,
+ "step": 29808
+ },
+ {
+ "epoch": 81.22343324250681,
+ "grad_norm": 2.6343846321105957,
+ "learning_rate": 1.7928047028377593e-06,
+ "loss": 0.0838,
+ "step": 29809
+ },
+ {
+ "epoch": 81.22615803814713,
+ "grad_norm": 2.7012295722961426,
+ "learning_rate": 1.792300537990278e-06,
+ "loss": 0.0493,
+ "step": 29810
+ },
+ {
+ "epoch": 81.22888283378747,
+ "grad_norm": 7.361477851867676,
+ "learning_rate": 1.7917964370640995e-06,
+ "loss": 0.0706,
+ "step": 29811
+ },
+ {
+ "epoch": 81.2316076294278,
+ "grad_norm": 3.7112202644348145,
+ "learning_rate": 1.7912924000631426e-06,
+ "loss": 0.0466,
+ "step": 29812
+ },
+ {
+ "epoch": 81.23433242506812,
+ "grad_norm": 3.7624340057373047,
+ "learning_rate": 1.790788426991339e-06,
+ "loss": 0.0584,
+ "step": 29813
+ },
+ {
+ "epoch": 81.23705722070845,
+ "grad_norm": 2.4636874198913574,
+ "learning_rate": 1.7902845178526108e-06,
+ "loss": 0.0584,
+ "step": 29814
+ },
+ {
+ "epoch": 81.23978201634877,
+ "grad_norm": 2.357530117034912,
+ "learning_rate": 1.7897806726508825e-06,
+ "loss": 0.0387,
+ "step": 29815
+ },
+ {
+ "epoch": 81.2425068119891,
+ "grad_norm": 2.0760278701782227,
+ "learning_rate": 1.789276891390076e-06,
+ "loss": 0.0282,
+ "step": 29816
+ },
+ {
+ "epoch": 81.24523160762942,
+ "grad_norm": 2.263711452484131,
+ "learning_rate": 1.7887731740741199e-06,
+ "loss": 0.115,
+ "step": 29817
+ },
+ {
+ "epoch": 81.24795640326975,
+ "grad_norm": 3.8498334884643555,
+ "learning_rate": 1.7882695207069333e-06,
+ "loss": 0.0714,
+ "step": 29818
+ },
+ {
+ "epoch": 81.25068119891009,
+ "grad_norm": 2.1670942306518555,
+ "learning_rate": 1.787765931292439e-06,
+ "loss": 0.0296,
+ "step": 29819
+ },
+ {
+ "epoch": 81.2534059945504,
+ "grad_norm": 4.979239463806152,
+ "learning_rate": 1.7872624058345578e-06,
+ "loss": 0.2006,
+ "step": 29820
+ },
+ {
+ "epoch": 81.25613079019074,
+ "grad_norm": 2.578134775161743,
+ "learning_rate": 1.7867589443372145e-06,
+ "loss": 0.1225,
+ "step": 29821
+ },
+ {
+ "epoch": 81.25885558583106,
+ "grad_norm": 2.23673939704895,
+ "learning_rate": 1.7862555468043286e-06,
+ "loss": 0.1429,
+ "step": 29822
+ },
+ {
+ "epoch": 81.26158038147139,
+ "grad_norm": 2.3067750930786133,
+ "learning_rate": 1.7857522132398197e-06,
+ "loss": 0.0632,
+ "step": 29823
+ },
+ {
+ "epoch": 81.26430517711172,
+ "grad_norm": 3.627553939819336,
+ "learning_rate": 1.785248943647605e-06,
+ "loss": 0.065,
+ "step": 29824
+ },
+ {
+ "epoch": 81.26702997275204,
+ "grad_norm": 1.98140287399292,
+ "learning_rate": 1.7847457380316114e-06,
+ "loss": 0.023,
+ "step": 29825
+ },
+ {
+ "epoch": 81.26975476839237,
+ "grad_norm": 3.2189109325408936,
+ "learning_rate": 1.7842425963957522e-06,
+ "loss": 0.168,
+ "step": 29826
+ },
+ {
+ "epoch": 81.2724795640327,
+ "grad_norm": 2.831796169281006,
+ "learning_rate": 1.7837395187439454e-06,
+ "loss": 0.0354,
+ "step": 29827
+ },
+ {
+ "epoch": 81.27520435967303,
+ "grad_norm": 2.3508572578430176,
+ "learning_rate": 1.7832365050801104e-06,
+ "loss": 0.0255,
+ "step": 29828
+ },
+ {
+ "epoch": 81.27792915531334,
+ "grad_norm": 1.9571527242660522,
+ "learning_rate": 1.7827335554081671e-06,
+ "loss": 0.1761,
+ "step": 29829
+ },
+ {
+ "epoch": 81.28065395095368,
+ "grad_norm": 3.471651792526245,
+ "learning_rate": 1.7822306697320313e-06,
+ "loss": 0.0968,
+ "step": 29830
+ },
+ {
+ "epoch": 81.28337874659401,
+ "grad_norm": 2.7563226222991943,
+ "learning_rate": 1.7817278480556188e-06,
+ "loss": 0.0277,
+ "step": 29831
+ },
+ {
+ "epoch": 81.28610354223433,
+ "grad_norm": 6.3749680519104,
+ "learning_rate": 1.7812250903828421e-06,
+ "loss": 0.0312,
+ "step": 29832
+ },
+ {
+ "epoch": 81.28882833787466,
+ "grad_norm": 2.8318443298339844,
+ "learning_rate": 1.7807223967176223e-06,
+ "loss": 0.0378,
+ "step": 29833
+ },
+ {
+ "epoch": 81.29155313351498,
+ "grad_norm": 2.431612968444824,
+ "learning_rate": 1.7802197670638722e-06,
+ "loss": 0.0307,
+ "step": 29834
+ },
+ {
+ "epoch": 81.29427792915531,
+ "grad_norm": 5.3716349601745605,
+ "learning_rate": 1.779717201425506e-06,
+ "loss": 0.0495,
+ "step": 29835
+ },
+ {
+ "epoch": 81.29700272479565,
+ "grad_norm": 2.0733096599578857,
+ "learning_rate": 1.7792146998064352e-06,
+ "loss": 0.0274,
+ "step": 29836
+ },
+ {
+ "epoch": 81.29972752043597,
+ "grad_norm": 2.359156370162964,
+ "learning_rate": 1.778712262210578e-06,
+ "loss": 0.166,
+ "step": 29837
+ },
+ {
+ "epoch": 81.3024523160763,
+ "grad_norm": 3.301111936569214,
+ "learning_rate": 1.7782098886418452e-06,
+ "loss": 0.0467,
+ "step": 29838
+ },
+ {
+ "epoch": 81.30517711171662,
+ "grad_norm": 2.5791015625,
+ "learning_rate": 1.77770757910415e-06,
+ "loss": 0.0334,
+ "step": 29839
+ },
+ {
+ "epoch": 81.30790190735695,
+ "grad_norm": 2.3258755207061768,
+ "learning_rate": 1.7772053336013994e-06,
+ "loss": 0.1319,
+ "step": 29840
+ },
+ {
+ "epoch": 81.31062670299727,
+ "grad_norm": 2.801180601119995,
+ "learning_rate": 1.7767031521375133e-06,
+ "loss": 0.0821,
+ "step": 29841
+ },
+ {
+ "epoch": 81.3133514986376,
+ "grad_norm": 3.4304990768432617,
+ "learning_rate": 1.7762010347163971e-06,
+ "loss": 0.047,
+ "step": 29842
+ },
+ {
+ "epoch": 81.31607629427793,
+ "grad_norm": 2.7437901496887207,
+ "learning_rate": 1.7756989813419633e-06,
+ "loss": 0.0402,
+ "step": 29843
+ },
+ {
+ "epoch": 81.31880108991825,
+ "grad_norm": 3.671950578689575,
+ "learning_rate": 1.7751969920181179e-06,
+ "loss": 0.0481,
+ "step": 29844
+ },
+ {
+ "epoch": 81.32152588555859,
+ "grad_norm": 3.3324074745178223,
+ "learning_rate": 1.774695066748774e-06,
+ "loss": 0.0638,
+ "step": 29845
+ },
+ {
+ "epoch": 81.3242506811989,
+ "grad_norm": 3.460700511932373,
+ "learning_rate": 1.774193205537843e-06,
+ "loss": 0.0431,
+ "step": 29846
+ },
+ {
+ "epoch": 81.32697547683924,
+ "grad_norm": 4.062001705169678,
+ "learning_rate": 1.7736914083892299e-06,
+ "loss": 0.0891,
+ "step": 29847
+ },
+ {
+ "epoch": 81.32970027247957,
+ "grad_norm": 2.143021583557129,
+ "learning_rate": 1.7731896753068444e-06,
+ "loss": 0.0907,
+ "step": 29848
+ },
+ {
+ "epoch": 81.33242506811989,
+ "grad_norm": 2.740246295928955,
+ "learning_rate": 1.7726880062945895e-06,
+ "loss": 0.038,
+ "step": 29849
+ },
+ {
+ "epoch": 81.33514986376022,
+ "grad_norm": 2.9971389770507812,
+ "learning_rate": 1.7721864013563784e-06,
+ "loss": 0.1202,
+ "step": 29850
+ },
+ {
+ "epoch": 81.33787465940054,
+ "grad_norm": 2.616865634918213,
+ "learning_rate": 1.7716848604961144e-06,
+ "loss": 0.0839,
+ "step": 29851
+ },
+ {
+ "epoch": 81.34059945504087,
+ "grad_norm": 1.8004435300827026,
+ "learning_rate": 1.7711833837177017e-06,
+ "loss": 0.0193,
+ "step": 29852
+ },
+ {
+ "epoch": 81.34332425068119,
+ "grad_norm": 2.3700060844421387,
+ "learning_rate": 1.7706819710250512e-06,
+ "loss": 0.0437,
+ "step": 29853
+ },
+ {
+ "epoch": 81.34604904632153,
+ "grad_norm": 2.3682754039764404,
+ "learning_rate": 1.770180622422063e-06,
+ "loss": 0.0686,
+ "step": 29854
+ },
+ {
+ "epoch": 81.34877384196186,
+ "grad_norm": 3.4635727405548096,
+ "learning_rate": 1.7696793379126442e-06,
+ "loss": 0.1762,
+ "step": 29855
+ },
+ {
+ "epoch": 81.35149863760218,
+ "grad_norm": 3.5942399501800537,
+ "learning_rate": 1.769178117500696e-06,
+ "loss": 0.1508,
+ "step": 29856
+ },
+ {
+ "epoch": 81.35422343324251,
+ "grad_norm": 3.25348162651062,
+ "learning_rate": 1.7686769611901255e-06,
+ "loss": 0.0376,
+ "step": 29857
+ },
+ {
+ "epoch": 81.35694822888283,
+ "grad_norm": 3.1193687915802,
+ "learning_rate": 1.7681758689848338e-06,
+ "loss": 0.0826,
+ "step": 29858
+ },
+ {
+ "epoch": 81.35967302452316,
+ "grad_norm": 2.747248888015747,
+ "learning_rate": 1.7676748408887235e-06,
+ "loss": 0.0591,
+ "step": 29859
+ },
+ {
+ "epoch": 81.3623978201635,
+ "grad_norm": 2.7811264991760254,
+ "learning_rate": 1.7671738769056945e-06,
+ "loss": 0.133,
+ "step": 29860
+ },
+ {
+ "epoch": 81.36512261580381,
+ "grad_norm": 3.5850346088409424,
+ "learning_rate": 1.7666729770396495e-06,
+ "loss": 0.0386,
+ "step": 29861
+ },
+ {
+ "epoch": 81.36784741144415,
+ "grad_norm": 1.7230792045593262,
+ "learning_rate": 1.7661721412944943e-06,
+ "loss": 0.0554,
+ "step": 29862
+ },
+ {
+ "epoch": 81.37057220708446,
+ "grad_norm": 3.7165582180023193,
+ "learning_rate": 1.7656713696741246e-06,
+ "loss": 0.0675,
+ "step": 29863
+ },
+ {
+ "epoch": 81.3732970027248,
+ "grad_norm": 2.740318536758423,
+ "learning_rate": 1.7651706621824405e-06,
+ "loss": 0.0725,
+ "step": 29864
+ },
+ {
+ "epoch": 81.37602179836512,
+ "grad_norm": 2.3790948390960693,
+ "learning_rate": 1.7646700188233411e-06,
+ "loss": 0.0211,
+ "step": 29865
+ },
+ {
+ "epoch": 81.37874659400545,
+ "grad_norm": 1.86640202999115,
+ "learning_rate": 1.764169439600728e-06,
+ "loss": 0.1383,
+ "step": 29866
+ },
+ {
+ "epoch": 81.38147138964578,
+ "grad_norm": 3.29257869720459,
+ "learning_rate": 1.763668924518499e-06,
+ "loss": 0.047,
+ "step": 29867
+ },
+ {
+ "epoch": 81.3841961852861,
+ "grad_norm": 2.2106664180755615,
+ "learning_rate": 1.763168473580551e-06,
+ "loss": 0.0818,
+ "step": 29868
+ },
+ {
+ "epoch": 81.38692098092643,
+ "grad_norm": 2.619067668914795,
+ "learning_rate": 1.7626680867907787e-06,
+ "loss": 0.0582,
+ "step": 29869
+ },
+ {
+ "epoch": 81.38964577656675,
+ "grad_norm": 3.078220844268799,
+ "learning_rate": 1.7621677641530855e-06,
+ "loss": 0.257,
+ "step": 29870
+ },
+ {
+ "epoch": 81.39237057220708,
+ "grad_norm": 3.548492670059204,
+ "learning_rate": 1.761667505671365e-06,
+ "loss": 0.0604,
+ "step": 29871
+ },
+ {
+ "epoch": 81.39509536784742,
+ "grad_norm": 2.28106427192688,
+ "learning_rate": 1.7611673113495098e-06,
+ "loss": 0.0374,
+ "step": 29872
+ },
+ {
+ "epoch": 81.39782016348774,
+ "grad_norm": 2.0537807941436768,
+ "learning_rate": 1.7606671811914212e-06,
+ "loss": 0.0179,
+ "step": 29873
+ },
+ {
+ "epoch": 81.40054495912807,
+ "grad_norm": 2.14174747467041,
+ "learning_rate": 1.7601671152009903e-06,
+ "loss": 0.0263,
+ "step": 29874
+ },
+ {
+ "epoch": 81.40326975476839,
+ "grad_norm": 3.556363582611084,
+ "learning_rate": 1.7596671133821142e-06,
+ "loss": 0.0538,
+ "step": 29875
+ },
+ {
+ "epoch": 81.40599455040872,
+ "grad_norm": 2.0083611011505127,
+ "learning_rate": 1.7591671757386818e-06,
+ "loss": 0.0298,
+ "step": 29876
+ },
+ {
+ "epoch": 81.40871934604904,
+ "grad_norm": 2.6074280738830566,
+ "learning_rate": 1.7586673022745936e-06,
+ "loss": 0.1115,
+ "step": 29877
+ },
+ {
+ "epoch": 81.41144414168937,
+ "grad_norm": 3.154125213623047,
+ "learning_rate": 1.7581674929937354e-06,
+ "loss": 0.0352,
+ "step": 29878
+ },
+ {
+ "epoch": 81.4141689373297,
+ "grad_norm": 1.8756235837936401,
+ "learning_rate": 1.7576677479000072e-06,
+ "loss": 0.0249,
+ "step": 29879
+ },
+ {
+ "epoch": 81.41689373297002,
+ "grad_norm": 2.6808886528015137,
+ "learning_rate": 1.7571680669972969e-06,
+ "loss": 0.1049,
+ "step": 29880
+ },
+ {
+ "epoch": 81.41961852861036,
+ "grad_norm": 2.7920801639556885,
+ "learning_rate": 1.7566684502894938e-06,
+ "loss": 0.0524,
+ "step": 29881
+ },
+ {
+ "epoch": 81.42234332425068,
+ "grad_norm": 2.620394706726074,
+ "learning_rate": 1.7561688977804946e-06,
+ "loss": 0.0293,
+ "step": 29882
+ },
+ {
+ "epoch": 81.42506811989101,
+ "grad_norm": 2.0136470794677734,
+ "learning_rate": 1.7556694094741867e-06,
+ "loss": 0.0302,
+ "step": 29883
+ },
+ {
+ "epoch": 81.42779291553134,
+ "grad_norm": 2.3976151943206787,
+ "learning_rate": 1.7551699853744587e-06,
+ "loss": 0.0619,
+ "step": 29884
+ },
+ {
+ "epoch": 81.43051771117166,
+ "grad_norm": 10.679306983947754,
+ "learning_rate": 1.7546706254852008e-06,
+ "loss": 0.0429,
+ "step": 29885
+ },
+ {
+ "epoch": 81.433242506812,
+ "grad_norm": 2.1830060482025146,
+ "learning_rate": 1.7541713298103036e-06,
+ "loss": 0.0413,
+ "step": 29886
+ },
+ {
+ "epoch": 81.43596730245231,
+ "grad_norm": 2.6556344032287598,
+ "learning_rate": 1.753672098353656e-06,
+ "loss": 0.064,
+ "step": 29887
+ },
+ {
+ "epoch": 81.43869209809264,
+ "grad_norm": 2.9608054161071777,
+ "learning_rate": 1.7531729311191436e-06,
+ "loss": 0.0666,
+ "step": 29888
+ },
+ {
+ "epoch": 81.44141689373296,
+ "grad_norm": 3.7339558601379395,
+ "learning_rate": 1.7526738281106537e-06,
+ "loss": 0.0741,
+ "step": 29889
+ },
+ {
+ "epoch": 81.4441416893733,
+ "grad_norm": 5.09855318069458,
+ "learning_rate": 1.7521747893320762e-06,
+ "loss": 0.0683,
+ "step": 29890
+ },
+ {
+ "epoch": 81.44686648501363,
+ "grad_norm": 2.303555965423584,
+ "learning_rate": 1.7516758147872958e-06,
+ "loss": 0.0665,
+ "step": 29891
+ },
+ {
+ "epoch": 81.44959128065395,
+ "grad_norm": 2.3130557537078857,
+ "learning_rate": 1.7511769044801996e-06,
+ "loss": 0.0345,
+ "step": 29892
+ },
+ {
+ "epoch": 81.45231607629428,
+ "grad_norm": 2.083970069885254,
+ "learning_rate": 1.7506780584146688e-06,
+ "loss": 0.0852,
+ "step": 29893
+ },
+ {
+ "epoch": 81.4550408719346,
+ "grad_norm": 3.7353780269622803,
+ "learning_rate": 1.7501792765945947e-06,
+ "loss": 0.1158,
+ "step": 29894
+ },
+ {
+ "epoch": 81.45776566757493,
+ "grad_norm": 2.5525665283203125,
+ "learning_rate": 1.7496805590238586e-06,
+ "loss": 0.0521,
+ "step": 29895
+ },
+ {
+ "epoch": 81.46049046321527,
+ "grad_norm": 3.040743589401245,
+ "learning_rate": 1.7491819057063419e-06,
+ "loss": 0.0464,
+ "step": 29896
+ },
+ {
+ "epoch": 81.46321525885558,
+ "grad_norm": 3.0327980518341064,
+ "learning_rate": 1.7486833166459316e-06,
+ "loss": 0.0427,
+ "step": 29897
+ },
+ {
+ "epoch": 81.46594005449592,
+ "grad_norm": 1.9803370237350464,
+ "learning_rate": 1.7481847918465133e-06,
+ "loss": 0.0217,
+ "step": 29898
+ },
+ {
+ "epoch": 81.46866485013624,
+ "grad_norm": 2.665926456451416,
+ "learning_rate": 1.7476863313119653e-06,
+ "loss": 0.0726,
+ "step": 29899
+ },
+ {
+ "epoch": 81.47138964577657,
+ "grad_norm": 2.0836374759674072,
+ "learning_rate": 1.7471879350461706e-06,
+ "loss": 0.0342,
+ "step": 29900
+ },
+ {
+ "epoch": 81.47411444141689,
+ "grad_norm": 2.743572950363159,
+ "learning_rate": 1.7466896030530078e-06,
+ "loss": 0.0377,
+ "step": 29901
+ },
+ {
+ "epoch": 81.47683923705722,
+ "grad_norm": 2.8299994468688965,
+ "learning_rate": 1.7461913353363635e-06,
+ "loss": 0.0573,
+ "step": 29902
+ },
+ {
+ "epoch": 81.47956403269755,
+ "grad_norm": 3.7928919792175293,
+ "learning_rate": 1.745693131900116e-06,
+ "loss": 0.0939,
+ "step": 29903
+ },
+ {
+ "epoch": 81.48228882833787,
+ "grad_norm": 2.3251705169677734,
+ "learning_rate": 1.745194992748145e-06,
+ "loss": 0.0331,
+ "step": 29904
+ },
+ {
+ "epoch": 81.4850136239782,
+ "grad_norm": 1.957998275756836,
+ "learning_rate": 1.7446969178843265e-06,
+ "loss": 0.026,
+ "step": 29905
+ },
+ {
+ "epoch": 81.48773841961852,
+ "grad_norm": 2.587820529937744,
+ "learning_rate": 1.7441989073125453e-06,
+ "loss": 0.0477,
+ "step": 29906
+ },
+ {
+ "epoch": 81.49046321525886,
+ "grad_norm": 2.38033390045166,
+ "learning_rate": 1.7437009610366773e-06,
+ "loss": 0.0337,
+ "step": 29907
+ },
+ {
+ "epoch": 81.49318801089919,
+ "grad_norm": 2.0060131549835205,
+ "learning_rate": 1.7432030790606003e-06,
+ "loss": 0.0511,
+ "step": 29908
+ },
+ {
+ "epoch": 81.49591280653951,
+ "grad_norm": 2.593278646469116,
+ "learning_rate": 1.742705261388189e-06,
+ "loss": 0.0331,
+ "step": 29909
+ },
+ {
+ "epoch": 81.49863760217984,
+ "grad_norm": 2.8909037113189697,
+ "learning_rate": 1.742207508023327e-06,
+ "loss": 0.0859,
+ "step": 29910
+ },
+ {
+ "epoch": 81.50136239782016,
+ "grad_norm": 3.4047446250915527,
+ "learning_rate": 1.7417098189698866e-06,
+ "loss": 0.0426,
+ "step": 29911
+ },
+ {
+ "epoch": 81.50408719346049,
+ "grad_norm": 3.3756182193756104,
+ "learning_rate": 1.741212194231744e-06,
+ "loss": 0.1363,
+ "step": 29912
+ },
+ {
+ "epoch": 81.50681198910081,
+ "grad_norm": 2.3397152423858643,
+ "learning_rate": 1.7407146338127713e-06,
+ "loss": 0.0369,
+ "step": 29913
+ },
+ {
+ "epoch": 81.50953678474114,
+ "grad_norm": 2.27807879447937,
+ "learning_rate": 1.7402171377168509e-06,
+ "loss": 0.0342,
+ "step": 29914
+ },
+ {
+ "epoch": 81.51226158038148,
+ "grad_norm": 1.9141989946365356,
+ "learning_rate": 1.7397197059478543e-06,
+ "loss": 0.0731,
+ "step": 29915
+ },
+ {
+ "epoch": 81.5149863760218,
+ "grad_norm": 3.7800650596618652,
+ "learning_rate": 1.7392223385096542e-06,
+ "loss": 0.059,
+ "step": 29916
+ },
+ {
+ "epoch": 81.51771117166213,
+ "grad_norm": 2.881908416748047,
+ "learning_rate": 1.7387250354061225e-06,
+ "loss": 0.035,
+ "step": 29917
+ },
+ {
+ "epoch": 81.52043596730245,
+ "grad_norm": 3.036841869354248,
+ "learning_rate": 1.7382277966411366e-06,
+ "loss": 0.0469,
+ "step": 29918
+ },
+ {
+ "epoch": 81.52316076294278,
+ "grad_norm": 2.2260324954986572,
+ "learning_rate": 1.7377306222185663e-06,
+ "loss": 0.045,
+ "step": 29919
+ },
+ {
+ "epoch": 81.52588555858311,
+ "grad_norm": 2.8261077404022217,
+ "learning_rate": 1.7372335121422857e-06,
+ "loss": 0.043,
+ "step": 29920
+ },
+ {
+ "epoch": 81.52861035422343,
+ "grad_norm": 4.075632572174072,
+ "learning_rate": 1.7367364664161602e-06,
+ "loss": 0.0724,
+ "step": 29921
+ },
+ {
+ "epoch": 81.53133514986376,
+ "grad_norm": 3.843763828277588,
+ "learning_rate": 1.736239485044069e-06,
+ "loss": 0.0865,
+ "step": 29922
+ },
+ {
+ "epoch": 81.53405994550408,
+ "grad_norm": 5.14616584777832,
+ "learning_rate": 1.7357425680298778e-06,
+ "loss": 0.0412,
+ "step": 29923
+ },
+ {
+ "epoch": 81.53678474114442,
+ "grad_norm": 2.7485291957855225,
+ "learning_rate": 1.7352457153774583e-06,
+ "loss": 0.1001,
+ "step": 29924
+ },
+ {
+ "epoch": 81.53950953678473,
+ "grad_norm": 3.3290557861328125,
+ "learning_rate": 1.734748927090676e-06,
+ "loss": 0.0421,
+ "step": 29925
+ },
+ {
+ "epoch": 81.54223433242507,
+ "grad_norm": 3.092393636703491,
+ "learning_rate": 1.7342522031734054e-06,
+ "loss": 0.0351,
+ "step": 29926
+ },
+ {
+ "epoch": 81.5449591280654,
+ "grad_norm": 2.5042364597320557,
+ "learning_rate": 1.7337555436295128e-06,
+ "loss": 0.0471,
+ "step": 29927
+ },
+ {
+ "epoch": 81.54768392370572,
+ "grad_norm": 2.964219808578491,
+ "learning_rate": 1.733258948462866e-06,
+ "loss": 0.0653,
+ "step": 29928
+ },
+ {
+ "epoch": 81.55040871934605,
+ "grad_norm": 2.377936601638794,
+ "learning_rate": 1.7327624176773306e-06,
+ "loss": 0.0304,
+ "step": 29929
+ },
+ {
+ "epoch": 81.55313351498637,
+ "grad_norm": 6.652313232421875,
+ "learning_rate": 1.7322659512767748e-06,
+ "loss": 0.1374,
+ "step": 29930
+ },
+ {
+ "epoch": 81.5558583106267,
+ "grad_norm": 3.4335744380950928,
+ "learning_rate": 1.7317695492650676e-06,
+ "loss": 0.0881,
+ "step": 29931
+ },
+ {
+ "epoch": 81.55858310626704,
+ "grad_norm": 1.9838346242904663,
+ "learning_rate": 1.731273211646074e-06,
+ "loss": 0.0295,
+ "step": 29932
+ },
+ {
+ "epoch": 81.56130790190736,
+ "grad_norm": 1.8397482633590698,
+ "learning_rate": 1.7307769384236584e-06,
+ "loss": 0.0735,
+ "step": 29933
+ },
+ {
+ "epoch": 81.56403269754769,
+ "grad_norm": 3.7043726444244385,
+ "learning_rate": 1.7302807296016833e-06,
+ "loss": 0.0695,
+ "step": 29934
+ },
+ {
+ "epoch": 81.566757493188,
+ "grad_norm": 2.511993169784546,
+ "learning_rate": 1.7297845851840177e-06,
+ "loss": 0.0996,
+ "step": 29935
+ },
+ {
+ "epoch": 81.56948228882834,
+ "grad_norm": 3.044713020324707,
+ "learning_rate": 1.7292885051745246e-06,
+ "loss": 0.1011,
+ "step": 29936
+ },
+ {
+ "epoch": 81.57220708446866,
+ "grad_norm": 1.742403268814087,
+ "learning_rate": 1.7287924895770624e-06,
+ "loss": 0.0359,
+ "step": 29937
+ },
+ {
+ "epoch": 81.57493188010899,
+ "grad_norm": 2.31221079826355,
+ "learning_rate": 1.7282965383955019e-06,
+ "loss": 0.0305,
+ "step": 29938
+ },
+ {
+ "epoch": 81.57765667574932,
+ "grad_norm": 1.7335597276687622,
+ "learning_rate": 1.7278006516337008e-06,
+ "loss": 0.0253,
+ "step": 29939
+ },
+ {
+ "epoch": 81.58038147138964,
+ "grad_norm": 2.5325331687927246,
+ "learning_rate": 1.727304829295523e-06,
+ "loss": 0.132,
+ "step": 29940
+ },
+ {
+ "epoch": 81.58310626702998,
+ "grad_norm": 3.9940176010131836,
+ "learning_rate": 1.7268090713848262e-06,
+ "loss": 0.0905,
+ "step": 29941
+ },
+ {
+ "epoch": 81.5858310626703,
+ "grad_norm": 3.1452503204345703,
+ "learning_rate": 1.7263133779054763e-06,
+ "loss": 0.0342,
+ "step": 29942
+ },
+ {
+ "epoch": 81.58855585831063,
+ "grad_norm": 3.458385705947876,
+ "learning_rate": 1.7258177488613316e-06,
+ "loss": 0.0243,
+ "step": 29943
+ },
+ {
+ "epoch": 81.59128065395096,
+ "grad_norm": 2.0628957748413086,
+ "learning_rate": 1.7253221842562518e-06,
+ "loss": 0.0232,
+ "step": 29944
+ },
+ {
+ "epoch": 81.59400544959128,
+ "grad_norm": 2.961764097213745,
+ "learning_rate": 1.7248266840940941e-06,
+ "loss": 0.0457,
+ "step": 29945
+ },
+ {
+ "epoch": 81.59673024523161,
+ "grad_norm": 2.7390084266662598,
+ "learning_rate": 1.7243312483787222e-06,
+ "loss": 0.044,
+ "step": 29946
+ },
+ {
+ "epoch": 81.59945504087193,
+ "grad_norm": 1.9267858266830444,
+ "learning_rate": 1.7238358771139896e-06,
+ "loss": 0.0211,
+ "step": 29947
+ },
+ {
+ "epoch": 81.60217983651226,
+ "grad_norm": 1.6273704767227173,
+ "learning_rate": 1.7233405703037599e-06,
+ "loss": 0.0186,
+ "step": 29948
+ },
+ {
+ "epoch": 81.60490463215258,
+ "grad_norm": 2.7950947284698486,
+ "learning_rate": 1.7228453279518863e-06,
+ "loss": 0.085,
+ "step": 29949
+ },
+ {
+ "epoch": 81.60762942779292,
+ "grad_norm": 3.9736552238464355,
+ "learning_rate": 1.7223501500622252e-06,
+ "loss": 0.1084,
+ "step": 29950
+ },
+ {
+ "epoch": 81.61035422343325,
+ "grad_norm": 3.1905932426452637,
+ "learning_rate": 1.7218550366386378e-06,
+ "loss": 0.0843,
+ "step": 29951
+ },
+ {
+ "epoch": 81.61307901907357,
+ "grad_norm": 2.498032569885254,
+ "learning_rate": 1.7213599876849762e-06,
+ "loss": 0.045,
+ "step": 29952
+ },
+ {
+ "epoch": 81.6158038147139,
+ "grad_norm": 3.981534242630005,
+ "learning_rate": 1.7208650032050966e-06,
+ "loss": 0.0526,
+ "step": 29953
+ },
+ {
+ "epoch": 81.61852861035422,
+ "grad_norm": 2.571485996246338,
+ "learning_rate": 1.7203700832028513e-06,
+ "loss": 0.0667,
+ "step": 29954
+ },
+ {
+ "epoch": 81.62125340599455,
+ "grad_norm": 3.0207929611206055,
+ "learning_rate": 1.7198752276821007e-06,
+ "loss": 0.0285,
+ "step": 29955
+ },
+ {
+ "epoch": 81.62397820163488,
+ "grad_norm": 5.051114082336426,
+ "learning_rate": 1.7193804366466948e-06,
+ "loss": 0.1077,
+ "step": 29956
+ },
+ {
+ "epoch": 81.6267029972752,
+ "grad_norm": 2.274768352508545,
+ "learning_rate": 1.7188857101004873e-06,
+ "loss": 0.0813,
+ "step": 29957
+ },
+ {
+ "epoch": 81.62942779291554,
+ "grad_norm": 2.348160982131958,
+ "learning_rate": 1.7183910480473287e-06,
+ "loss": 0.1317,
+ "step": 29958
+ },
+ {
+ "epoch": 81.63215258855585,
+ "grad_norm": 1.8370074033737183,
+ "learning_rate": 1.7178964504910766e-06,
+ "loss": 0.0225,
+ "step": 29959
+ },
+ {
+ "epoch": 81.63487738419619,
+ "grad_norm": 2.805293560028076,
+ "learning_rate": 1.7174019174355805e-06,
+ "loss": 0.0744,
+ "step": 29960
+ },
+ {
+ "epoch": 81.6376021798365,
+ "grad_norm": 2.7617228031158447,
+ "learning_rate": 1.7169074488846905e-06,
+ "loss": 0.0433,
+ "step": 29961
+ },
+ {
+ "epoch": 81.64032697547684,
+ "grad_norm": 2.7769405841827393,
+ "learning_rate": 1.716413044842259e-06,
+ "loss": 0.0554,
+ "step": 29962
+ },
+ {
+ "epoch": 81.64305177111717,
+ "grad_norm": 3.071134328842163,
+ "learning_rate": 1.7159187053121373e-06,
+ "loss": 0.0972,
+ "step": 29963
+ },
+ {
+ "epoch": 81.64577656675749,
+ "grad_norm": 2.6598658561706543,
+ "learning_rate": 1.7154244302981715e-06,
+ "loss": 0.081,
+ "step": 29964
+ },
+ {
+ "epoch": 81.64850136239782,
+ "grad_norm": 3.348020315170288,
+ "learning_rate": 1.7149302198042162e-06,
+ "loss": 0.0742,
+ "step": 29965
+ },
+ {
+ "epoch": 81.65122615803814,
+ "grad_norm": 2.5943949222564697,
+ "learning_rate": 1.7144360738341148e-06,
+ "loss": 0.1429,
+ "step": 29966
+ },
+ {
+ "epoch": 81.65395095367847,
+ "grad_norm": 3.244645118713379,
+ "learning_rate": 1.713941992391721e-06,
+ "loss": 0.0366,
+ "step": 29967
+ },
+ {
+ "epoch": 81.65667574931881,
+ "grad_norm": 3.5837454795837402,
+ "learning_rate": 1.7134479754808808e-06,
+ "loss": 0.0822,
+ "step": 29968
+ },
+ {
+ "epoch": 81.65940054495913,
+ "grad_norm": 2.711371421813965,
+ "learning_rate": 1.712954023105441e-06,
+ "loss": 0.0778,
+ "step": 29969
+ },
+ {
+ "epoch": 81.66212534059946,
+ "grad_norm": 3.1979498863220215,
+ "learning_rate": 1.712460135269246e-06,
+ "loss": 0.0403,
+ "step": 29970
+ },
+ {
+ "epoch": 81.66485013623978,
+ "grad_norm": 2.8670384883880615,
+ "learning_rate": 1.7119663119761476e-06,
+ "loss": 0.0244,
+ "step": 29971
+ },
+ {
+ "epoch": 81.66757493188011,
+ "grad_norm": 2.829710006713867,
+ "learning_rate": 1.711472553229988e-06,
+ "loss": 0.0542,
+ "step": 29972
+ },
+ {
+ "epoch": 81.67029972752043,
+ "grad_norm": 2.1916730403900146,
+ "learning_rate": 1.7109788590346132e-06,
+ "loss": 0.0261,
+ "step": 29973
+ },
+ {
+ "epoch": 81.67302452316076,
+ "grad_norm": 3.1586687564849854,
+ "learning_rate": 1.7104852293938668e-06,
+ "loss": 0.0513,
+ "step": 29974
+ },
+ {
+ "epoch": 81.6757493188011,
+ "grad_norm": 2.4942362308502197,
+ "learning_rate": 1.7099916643115965e-06,
+ "loss": 0.1349,
+ "step": 29975
+ },
+ {
+ "epoch": 81.67847411444141,
+ "grad_norm": 2.431182622909546,
+ "learning_rate": 1.709498163791644e-06,
+ "loss": 0.0737,
+ "step": 29976
+ },
+ {
+ "epoch": 81.68119891008175,
+ "grad_norm": 2.157503843307495,
+ "learning_rate": 1.709004727837854e-06,
+ "loss": 0.0685,
+ "step": 29977
+ },
+ {
+ "epoch": 81.68392370572207,
+ "grad_norm": 3.029843330383301,
+ "learning_rate": 1.7085113564540657e-06,
+ "loss": 0.2559,
+ "step": 29978
+ },
+ {
+ "epoch": 81.6866485013624,
+ "grad_norm": 3.3971712589263916,
+ "learning_rate": 1.7080180496441257e-06,
+ "loss": 0.027,
+ "step": 29979
+ },
+ {
+ "epoch": 81.68937329700273,
+ "grad_norm": 3.483119487762451,
+ "learning_rate": 1.7075248074118745e-06,
+ "loss": 0.0348,
+ "step": 29980
+ },
+ {
+ "epoch": 81.69209809264305,
+ "grad_norm": 3.3105521202087402,
+ "learning_rate": 1.7070316297611512e-06,
+ "loss": 0.0393,
+ "step": 29981
+ },
+ {
+ "epoch": 81.69482288828338,
+ "grad_norm": 2.3459017276763916,
+ "learning_rate": 1.7065385166957982e-06,
+ "loss": 0.0441,
+ "step": 29982
+ },
+ {
+ "epoch": 81.6975476839237,
+ "grad_norm": 2.717716693878174,
+ "learning_rate": 1.7060454682196592e-06,
+ "loss": 0.0672,
+ "step": 29983
+ },
+ {
+ "epoch": 81.70027247956403,
+ "grad_norm": 3.3285694122314453,
+ "learning_rate": 1.7055524843365711e-06,
+ "loss": 0.0441,
+ "step": 29984
+ },
+ {
+ "epoch": 81.70299727520435,
+ "grad_norm": 2.250732183456421,
+ "learning_rate": 1.7050595650503732e-06,
+ "loss": 0.15,
+ "step": 29985
+ },
+ {
+ "epoch": 81.70572207084469,
+ "grad_norm": 4.812022686004639,
+ "learning_rate": 1.7045667103649021e-06,
+ "loss": 0.053,
+ "step": 29986
+ },
+ {
+ "epoch": 81.70844686648502,
+ "grad_norm": 3.1134819984436035,
+ "learning_rate": 1.7040739202840006e-06,
+ "loss": 0.2067,
+ "step": 29987
+ },
+ {
+ "epoch": 81.71117166212534,
+ "grad_norm": 2.6714956760406494,
+ "learning_rate": 1.7035811948115044e-06,
+ "loss": 0.0581,
+ "step": 29988
+ },
+ {
+ "epoch": 81.71389645776567,
+ "grad_norm": 2.735435962677002,
+ "learning_rate": 1.7030885339512505e-06,
+ "loss": 0.0703,
+ "step": 29989
+ },
+ {
+ "epoch": 81.71662125340599,
+ "grad_norm": 3.5400795936584473,
+ "learning_rate": 1.7025959377070745e-06,
+ "loss": 0.0434,
+ "step": 29990
+ },
+ {
+ "epoch": 81.71934604904632,
+ "grad_norm": 3.131110906600952,
+ "learning_rate": 1.7021034060828157e-06,
+ "loss": 0.0251,
+ "step": 29991
+ },
+ {
+ "epoch": 81.72207084468666,
+ "grad_norm": 2.1790151596069336,
+ "learning_rate": 1.70161093908231e-06,
+ "loss": 0.1077,
+ "step": 29992
+ },
+ {
+ "epoch": 81.72479564032697,
+ "grad_norm": 2.450204849243164,
+ "learning_rate": 1.7011185367093897e-06,
+ "loss": 0.087,
+ "step": 29993
+ },
+ {
+ "epoch": 81.7275204359673,
+ "grad_norm": 4.017487049102783,
+ "learning_rate": 1.7006261989678895e-06,
+ "loss": 0.062,
+ "step": 29994
+ },
+ {
+ "epoch": 81.73024523160763,
+ "grad_norm": 2.6964058876037598,
+ "learning_rate": 1.7001339258616478e-06,
+ "loss": 0.0718,
+ "step": 29995
+ },
+ {
+ "epoch": 81.73297002724796,
+ "grad_norm": 2.3090856075286865,
+ "learning_rate": 1.6996417173944957e-06,
+ "loss": 0.0529,
+ "step": 29996
+ },
+ {
+ "epoch": 81.73569482288828,
+ "grad_norm": 2.345402956008911,
+ "learning_rate": 1.6991495735702667e-06,
+ "loss": 0.1334,
+ "step": 29997
+ },
+ {
+ "epoch": 81.73841961852861,
+ "grad_norm": 2.830742835998535,
+ "learning_rate": 1.6986574943927913e-06,
+ "loss": 0.0771,
+ "step": 29998
+ },
+ {
+ "epoch": 81.74114441416894,
+ "grad_norm": 1.844018578529358,
+ "learning_rate": 1.6981654798659041e-06,
+ "loss": 0.0328,
+ "step": 29999
+ },
+ {
+ "epoch": 81.74386920980926,
+ "grad_norm": 4.724454402923584,
+ "learning_rate": 1.69767352999344e-06,
+ "loss": 0.0495,
+ "step": 30000
+ },
+ {
+ "epoch": 81.7465940054496,
+ "grad_norm": 3.6605615615844727,
+ "learning_rate": 1.6971816447792266e-06,
+ "loss": 0.1277,
+ "step": 30001
+ },
+ {
+ "epoch": 81.74931880108991,
+ "grad_norm": 2.996783494949341,
+ "learning_rate": 1.6966898242270935e-06,
+ "loss": 0.0268,
+ "step": 30002
+ },
+ {
+ "epoch": 81.75204359673025,
+ "grad_norm": 2.80468487739563,
+ "learning_rate": 1.6961980683408742e-06,
+ "loss": 0.0672,
+ "step": 30003
+ },
+ {
+ "epoch": 81.75476839237058,
+ "grad_norm": 2.24398136138916,
+ "learning_rate": 1.6957063771243977e-06,
+ "loss": 0.0511,
+ "step": 30004
+ },
+ {
+ "epoch": 81.7574931880109,
+ "grad_norm": 2.3950204849243164,
+ "learning_rate": 1.695214750581493e-06,
+ "loss": 0.032,
+ "step": 30005
+ },
+ {
+ "epoch": 81.76021798365123,
+ "grad_norm": 2.247523307800293,
+ "learning_rate": 1.6947231887159854e-06,
+ "loss": 0.0359,
+ "step": 30006
+ },
+ {
+ "epoch": 81.76294277929155,
+ "grad_norm": 2.835435628890991,
+ "learning_rate": 1.6942316915317091e-06,
+ "loss": 0.1541,
+ "step": 30007
+ },
+ {
+ "epoch": 81.76566757493188,
+ "grad_norm": 2.9872546195983887,
+ "learning_rate": 1.6937402590324892e-06,
+ "loss": 0.0295,
+ "step": 30008
+ },
+ {
+ "epoch": 81.7683923705722,
+ "grad_norm": 3.174426317214966,
+ "learning_rate": 1.6932488912221523e-06,
+ "loss": 0.0427,
+ "step": 30009
+ },
+ {
+ "epoch": 81.77111716621253,
+ "grad_norm": 3.640789747238159,
+ "learning_rate": 1.6927575881045243e-06,
+ "loss": 0.0435,
+ "step": 30010
+ },
+ {
+ "epoch": 81.77384196185287,
+ "grad_norm": 3.952859401702881,
+ "learning_rate": 1.6922663496834346e-06,
+ "loss": 0.1197,
+ "step": 30011
+ },
+ {
+ "epoch": 81.77656675749319,
+ "grad_norm": 2.8318142890930176,
+ "learning_rate": 1.6917751759627066e-06,
+ "loss": 0.1828,
+ "step": 30012
+ },
+ {
+ "epoch": 81.77929155313352,
+ "grad_norm": 2.7179439067840576,
+ "learning_rate": 1.6912840669461672e-06,
+ "loss": 0.0764,
+ "step": 30013
+ },
+ {
+ "epoch": 81.78201634877384,
+ "grad_norm": 3.1840264797210693,
+ "learning_rate": 1.6907930226376367e-06,
+ "loss": 0.1202,
+ "step": 30014
+ },
+ {
+ "epoch": 81.78474114441417,
+ "grad_norm": 2.3267662525177,
+ "learning_rate": 1.6903020430409456e-06,
+ "loss": 0.0383,
+ "step": 30015
+ },
+ {
+ "epoch": 81.7874659400545,
+ "grad_norm": 4.1154561042785645,
+ "learning_rate": 1.6898111281599129e-06,
+ "loss": 0.0715,
+ "step": 30016
+ },
+ {
+ "epoch": 81.79019073569482,
+ "grad_norm": 3.4539682865142822,
+ "learning_rate": 1.6893202779983654e-06,
+ "loss": 0.0504,
+ "step": 30017
+ },
+ {
+ "epoch": 81.79291553133515,
+ "grad_norm": 3.567556619644165,
+ "learning_rate": 1.6888294925601235e-06,
+ "loss": 0.0273,
+ "step": 30018
+ },
+ {
+ "epoch": 81.79564032697547,
+ "grad_norm": 3.3005082607269287,
+ "learning_rate": 1.6883387718490086e-06,
+ "loss": 0.2091,
+ "step": 30019
+ },
+ {
+ "epoch": 81.7983651226158,
+ "grad_norm": 2.836658000946045,
+ "learning_rate": 1.6878481158688454e-06,
+ "loss": 0.1856,
+ "step": 30020
+ },
+ {
+ "epoch": 81.80108991825612,
+ "grad_norm": 1.7724984884262085,
+ "learning_rate": 1.6873575246234542e-06,
+ "loss": 0.038,
+ "step": 30021
+ },
+ {
+ "epoch": 81.80381471389646,
+ "grad_norm": 2.244910717010498,
+ "learning_rate": 1.6868669981166553e-06,
+ "loss": 0.1502,
+ "step": 30022
+ },
+ {
+ "epoch": 81.80653950953679,
+ "grad_norm": 2.91497540473938,
+ "learning_rate": 1.6863765363522654e-06,
+ "loss": 0.0359,
+ "step": 30023
+ },
+ {
+ "epoch": 81.80926430517711,
+ "grad_norm": 2.6984496116638184,
+ "learning_rate": 1.685886139334111e-06,
+ "loss": 0.0374,
+ "step": 30024
+ },
+ {
+ "epoch": 81.81198910081744,
+ "grad_norm": 1.5971429347991943,
+ "learning_rate": 1.685395807066007e-06,
+ "loss": 0.0205,
+ "step": 30025
+ },
+ {
+ "epoch": 81.81471389645776,
+ "grad_norm": 2.5110671520233154,
+ "learning_rate": 1.68490553955177e-06,
+ "loss": 0.1074,
+ "step": 30026
+ },
+ {
+ "epoch": 81.8174386920981,
+ "grad_norm": 2.5040781497955322,
+ "learning_rate": 1.6844153367952242e-06,
+ "loss": 0.0366,
+ "step": 30027
+ },
+ {
+ "epoch": 81.82016348773843,
+ "grad_norm": 2.7937262058258057,
+ "learning_rate": 1.6839251988001838e-06,
+ "loss": 0.0691,
+ "step": 30028
+ },
+ {
+ "epoch": 81.82288828337875,
+ "grad_norm": 2.183349370956421,
+ "learning_rate": 1.6834351255704673e-06,
+ "loss": 0.0204,
+ "step": 30029
+ },
+ {
+ "epoch": 81.82561307901908,
+ "grad_norm": 5.8651299476623535,
+ "learning_rate": 1.6829451171098865e-06,
+ "loss": 0.1189,
+ "step": 30030
+ },
+ {
+ "epoch": 81.8283378746594,
+ "grad_norm": 2.891397476196289,
+ "learning_rate": 1.6824551734222649e-06,
+ "loss": 0.1082,
+ "step": 30031
+ },
+ {
+ "epoch": 81.83106267029973,
+ "grad_norm": 2.7424800395965576,
+ "learning_rate": 1.681965294511414e-06,
+ "loss": 0.0313,
+ "step": 30032
+ },
+ {
+ "epoch": 81.83378746594005,
+ "grad_norm": 2.4093427658081055,
+ "learning_rate": 1.6814754803811474e-06,
+ "loss": 0.1106,
+ "step": 30033
+ },
+ {
+ "epoch": 81.83651226158038,
+ "grad_norm": 2.4709415435791016,
+ "learning_rate": 1.6809857310352852e-06,
+ "loss": 0.025,
+ "step": 30034
+ },
+ {
+ "epoch": 81.83923705722071,
+ "grad_norm": 1.8941694498062134,
+ "learning_rate": 1.6804960464776344e-06,
+ "loss": 0.0174,
+ "step": 30035
+ },
+ {
+ "epoch": 81.84196185286103,
+ "grad_norm": 2.468430280685425,
+ "learning_rate": 1.6800064267120163e-06,
+ "loss": 0.091,
+ "step": 30036
+ },
+ {
+ "epoch": 81.84468664850137,
+ "grad_norm": 1.7741538286209106,
+ "learning_rate": 1.6795168717422404e-06,
+ "loss": 0.0239,
+ "step": 30037
+ },
+ {
+ "epoch": 81.84741144414168,
+ "grad_norm": 1.6462080478668213,
+ "learning_rate": 1.6790273815721191e-06,
+ "loss": 0.0177,
+ "step": 30038
+ },
+ {
+ "epoch": 81.85013623978202,
+ "grad_norm": 2.0248351097106934,
+ "learning_rate": 1.6785379562054615e-06,
+ "loss": 0.052,
+ "step": 30039
+ },
+ {
+ "epoch": 81.85286103542235,
+ "grad_norm": 4.469536781311035,
+ "learning_rate": 1.6780485956460857e-06,
+ "loss": 0.0991,
+ "step": 30040
+ },
+ {
+ "epoch": 81.85558583106267,
+ "grad_norm": 3.5721821784973145,
+ "learning_rate": 1.6775592998977995e-06,
+ "loss": 0.1362,
+ "step": 30041
+ },
+ {
+ "epoch": 81.858310626703,
+ "grad_norm": 2.6830410957336426,
+ "learning_rate": 1.6770700689644138e-06,
+ "loss": 0.1015,
+ "step": 30042
+ },
+ {
+ "epoch": 81.86103542234332,
+ "grad_norm": 2.327113389968872,
+ "learning_rate": 1.676580902849736e-06,
+ "loss": 0.0263,
+ "step": 30043
+ },
+ {
+ "epoch": 81.86376021798365,
+ "grad_norm": 2.0420827865600586,
+ "learning_rate": 1.67609180155758e-06,
+ "loss": 0.1379,
+ "step": 30044
+ },
+ {
+ "epoch": 81.86648501362397,
+ "grad_norm": 3.5153493881225586,
+ "learning_rate": 1.6756027650917539e-06,
+ "loss": 0.0818,
+ "step": 30045
+ },
+ {
+ "epoch": 81.8692098092643,
+ "grad_norm": 2.7035679817199707,
+ "learning_rate": 1.6751137934560635e-06,
+ "loss": 0.0357,
+ "step": 30046
+ },
+ {
+ "epoch": 81.87193460490464,
+ "grad_norm": 3.255575180053711,
+ "learning_rate": 1.6746248866543201e-06,
+ "loss": 0.0938,
+ "step": 30047
+ },
+ {
+ "epoch": 81.87465940054496,
+ "grad_norm": 2.4730582237243652,
+ "learning_rate": 1.6741360446903309e-06,
+ "loss": 0.1371,
+ "step": 30048
+ },
+ {
+ "epoch": 81.87738419618529,
+ "grad_norm": 2.590402841567993,
+ "learning_rate": 1.6736472675679028e-06,
+ "loss": 0.1255,
+ "step": 30049
+ },
+ {
+ "epoch": 81.88010899182561,
+ "grad_norm": 2.0248920917510986,
+ "learning_rate": 1.6731585552908381e-06,
+ "loss": 0.0314,
+ "step": 30050
+ },
+ {
+ "epoch": 81.88283378746594,
+ "grad_norm": 2.2059524059295654,
+ "learning_rate": 1.672669907862947e-06,
+ "loss": 0.039,
+ "step": 30051
+ },
+ {
+ "epoch": 81.88555858310627,
+ "grad_norm": 2.7759554386138916,
+ "learning_rate": 1.672181325288037e-06,
+ "loss": 0.0268,
+ "step": 30052
+ },
+ {
+ "epoch": 81.88828337874659,
+ "grad_norm": 2.258518934249878,
+ "learning_rate": 1.6716928075699112e-06,
+ "loss": 0.0287,
+ "step": 30053
+ },
+ {
+ "epoch": 81.89100817438693,
+ "grad_norm": 4.108890533447266,
+ "learning_rate": 1.6712043547123735e-06,
+ "loss": 0.1903,
+ "step": 30054
+ },
+ {
+ "epoch": 81.89373297002724,
+ "grad_norm": 2.274536609649658,
+ "learning_rate": 1.6707159667192263e-06,
+ "loss": 0.0939,
+ "step": 30055
+ },
+ {
+ "epoch": 81.89645776566758,
+ "grad_norm": 2.4938838481903076,
+ "learning_rate": 1.6702276435942776e-06,
+ "loss": 0.0664,
+ "step": 30056
+ },
+ {
+ "epoch": 81.8991825613079,
+ "grad_norm": 4.16168737411499,
+ "learning_rate": 1.6697393853413269e-06,
+ "loss": 0.0636,
+ "step": 30057
+ },
+ {
+ "epoch": 81.90190735694823,
+ "grad_norm": 2.1645264625549316,
+ "learning_rate": 1.6692511919641786e-06,
+ "loss": 0.0273,
+ "step": 30058
+ },
+ {
+ "epoch": 81.90463215258856,
+ "grad_norm": 2.435659885406494,
+ "learning_rate": 1.6687630634666308e-06,
+ "loss": 0.028,
+ "step": 30059
+ },
+ {
+ "epoch": 81.90735694822888,
+ "grad_norm": 2.16802978515625,
+ "learning_rate": 1.6682749998524917e-06,
+ "loss": 0.0704,
+ "step": 30060
+ },
+ {
+ "epoch": 81.91008174386921,
+ "grad_norm": 3.9329493045806885,
+ "learning_rate": 1.667787001125557e-06,
+ "loss": 0.0345,
+ "step": 30061
+ },
+ {
+ "epoch": 81.91280653950953,
+ "grad_norm": 2.289764642715454,
+ "learning_rate": 1.6672990672896304e-06,
+ "loss": 0.0725,
+ "step": 30062
+ },
+ {
+ "epoch": 81.91553133514986,
+ "grad_norm": 2.794121265411377,
+ "learning_rate": 1.666811198348508e-06,
+ "loss": 0.1162,
+ "step": 30063
+ },
+ {
+ "epoch": 81.9182561307902,
+ "grad_norm": 2.8760757446289062,
+ "learning_rate": 1.6663233943059932e-06,
+ "loss": 0.0466,
+ "step": 30064
+ },
+ {
+ "epoch": 81.92098092643052,
+ "grad_norm": 2.378352403640747,
+ "learning_rate": 1.6658356551658838e-06,
+ "loss": 0.0318,
+ "step": 30065
+ },
+ {
+ "epoch": 81.92370572207085,
+ "grad_norm": 1.9247372150421143,
+ "learning_rate": 1.6653479809319795e-06,
+ "loss": 0.0197,
+ "step": 30066
+ },
+ {
+ "epoch": 81.92643051771117,
+ "grad_norm": 2.9816741943359375,
+ "learning_rate": 1.6648603716080725e-06,
+ "loss": 0.0324,
+ "step": 30067
+ },
+ {
+ "epoch": 81.9291553133515,
+ "grad_norm": 3.170616626739502,
+ "learning_rate": 1.6643728271979665e-06,
+ "loss": 0.0464,
+ "step": 30068
+ },
+ {
+ "epoch": 81.93188010899182,
+ "grad_norm": 2.9416186809539795,
+ "learning_rate": 1.6638853477054573e-06,
+ "loss": 0.0441,
+ "step": 30069
+ },
+ {
+ "epoch": 81.93460490463215,
+ "grad_norm": 2.3222405910491943,
+ "learning_rate": 1.663397933134342e-06,
+ "loss": 0.1783,
+ "step": 30070
+ },
+ {
+ "epoch": 81.93732970027249,
+ "grad_norm": 2.681143283843994,
+ "learning_rate": 1.6629105834884119e-06,
+ "loss": 0.0392,
+ "step": 30071
+ },
+ {
+ "epoch": 81.9400544959128,
+ "grad_norm": 3.0393142700195312,
+ "learning_rate": 1.6624232987714695e-06,
+ "loss": 0.0428,
+ "step": 30072
+ },
+ {
+ "epoch": 81.94277929155314,
+ "grad_norm": 2.3829312324523926,
+ "learning_rate": 1.6619360789873051e-06,
+ "loss": 0.1214,
+ "step": 30073
+ },
+ {
+ "epoch": 81.94550408719346,
+ "grad_norm": 1.8362236022949219,
+ "learning_rate": 1.6614489241397148e-06,
+ "loss": 0.0311,
+ "step": 30074
+ },
+ {
+ "epoch": 81.94822888283379,
+ "grad_norm": 2.6642162799835205,
+ "learning_rate": 1.6609618342324884e-06,
+ "loss": 0.0326,
+ "step": 30075
+ },
+ {
+ "epoch": 81.95095367847412,
+ "grad_norm": 2.634880542755127,
+ "learning_rate": 1.6604748092694268e-06,
+ "loss": 0.1138,
+ "step": 30076
+ },
+ {
+ "epoch": 81.95367847411444,
+ "grad_norm": 2.1546363830566406,
+ "learning_rate": 1.6599878492543175e-06,
+ "loss": 0.0406,
+ "step": 30077
+ },
+ {
+ "epoch": 81.95640326975477,
+ "grad_norm": 1.9578328132629395,
+ "learning_rate": 1.6595009541909558e-06,
+ "loss": 0.0404,
+ "step": 30078
+ },
+ {
+ "epoch": 81.95912806539509,
+ "grad_norm": 1.6919559240341187,
+ "learning_rate": 1.6590141240831281e-06,
+ "loss": 0.0204,
+ "step": 30079
+ },
+ {
+ "epoch": 81.96185286103542,
+ "grad_norm": 3.3523151874542236,
+ "learning_rate": 1.658527358934634e-06,
+ "loss": 0.0442,
+ "step": 30080
+ },
+ {
+ "epoch": 81.96457765667574,
+ "grad_norm": 2.374912738800049,
+ "learning_rate": 1.6580406587492592e-06,
+ "loss": 0.0308,
+ "step": 30081
+ },
+ {
+ "epoch": 81.96730245231608,
+ "grad_norm": 2.683181047439575,
+ "learning_rate": 1.6575540235307964e-06,
+ "loss": 0.0939,
+ "step": 30082
+ },
+ {
+ "epoch": 81.97002724795641,
+ "grad_norm": 2.0993354320526123,
+ "learning_rate": 1.6570674532830312e-06,
+ "loss": 0.118,
+ "step": 30083
+ },
+ {
+ "epoch": 81.97275204359673,
+ "grad_norm": 2.8864526748657227,
+ "learning_rate": 1.6565809480097583e-06,
+ "loss": 0.2046,
+ "step": 30084
+ },
+ {
+ "epoch": 81.97547683923706,
+ "grad_norm": 3.024050712585449,
+ "learning_rate": 1.6560945077147628e-06,
+ "loss": 0.0806,
+ "step": 30085
+ },
+ {
+ "epoch": 81.97820163487738,
+ "grad_norm": 1.5702760219573975,
+ "learning_rate": 1.655608132401837e-06,
+ "loss": 0.028,
+ "step": 30086
+ },
+ {
+ "epoch": 81.98092643051771,
+ "grad_norm": 3.0154566764831543,
+ "learning_rate": 1.6551218220747634e-06,
+ "loss": 0.0572,
+ "step": 30087
+ },
+ {
+ "epoch": 81.98365122615803,
+ "grad_norm": 1.8100252151489258,
+ "learning_rate": 1.6546355767373357e-06,
+ "loss": 0.0587,
+ "step": 30088
+ },
+ {
+ "epoch": 81.98637602179836,
+ "grad_norm": 2.5257043838500977,
+ "learning_rate": 1.6541493963933375e-06,
+ "loss": 0.0676,
+ "step": 30089
+ },
+ {
+ "epoch": 81.9891008174387,
+ "grad_norm": 2.980360984802246,
+ "learning_rate": 1.6536632810465547e-06,
+ "loss": 0.0469,
+ "step": 30090
+ },
+ {
+ "epoch": 81.99182561307902,
+ "grad_norm": 2.4827728271484375,
+ "learning_rate": 1.653177230700771e-06,
+ "loss": 0.0408,
+ "step": 30091
+ },
+ {
+ "epoch": 81.99455040871935,
+ "grad_norm": 2.323294162750244,
+ "learning_rate": 1.6526912453597776e-06,
+ "loss": 0.1011,
+ "step": 30092
+ },
+ {
+ "epoch": 81.99727520435967,
+ "grad_norm": 2.739640951156616,
+ "learning_rate": 1.6522053250273551e-06,
+ "loss": 0.0432,
+ "step": 30093
+ },
+ {
+ "epoch": 82.0,
+ "grad_norm": 3.3195836544036865,
+ "learning_rate": 1.6517194697072903e-06,
+ "loss": 0.0561,
+ "step": 30094
+ },
+ {
+ "epoch": 82.00272479564033,
+ "grad_norm": 2.452608823776245,
+ "learning_rate": 1.6512336794033622e-06,
+ "loss": 0.0643,
+ "step": 30095
+ },
+ {
+ "epoch": 82.00544959128065,
+ "grad_norm": 4.400585651397705,
+ "learning_rate": 1.6507479541193595e-06,
+ "loss": 0.0629,
+ "step": 30096
+ },
+ {
+ "epoch": 82.00817438692098,
+ "grad_norm": 2.563040256500244,
+ "learning_rate": 1.650262293859064e-06,
+ "loss": 0.1783,
+ "step": 30097
+ },
+ {
+ "epoch": 82.0108991825613,
+ "grad_norm": 2.6949498653411865,
+ "learning_rate": 1.6497766986262564e-06,
+ "loss": 0.0358,
+ "step": 30098
+ },
+ {
+ "epoch": 82.01362397820164,
+ "grad_norm": 5.2082695960998535,
+ "learning_rate": 1.6492911684247171e-06,
+ "loss": 0.2074,
+ "step": 30099
+ },
+ {
+ "epoch": 82.01634877384195,
+ "grad_norm": 2.20147705078125,
+ "learning_rate": 1.6488057032582316e-06,
+ "loss": 0.0349,
+ "step": 30100
+ },
+ {
+ "epoch": 82.01907356948229,
+ "grad_norm": 2.8832318782806396,
+ "learning_rate": 1.6483203031305784e-06,
+ "loss": 0.0414,
+ "step": 30101
+ },
+ {
+ "epoch": 82.02179836512262,
+ "grad_norm": 2.864335060119629,
+ "learning_rate": 1.6478349680455351e-06,
+ "loss": 0.0621,
+ "step": 30102
+ },
+ {
+ "epoch": 82.02452316076294,
+ "grad_norm": 2.6042680740356445,
+ "learning_rate": 1.6473496980068882e-06,
+ "loss": 0.0221,
+ "step": 30103
+ },
+ {
+ "epoch": 82.02724795640327,
+ "grad_norm": 2.670797348022461,
+ "learning_rate": 1.6468644930184097e-06,
+ "loss": 0.0546,
+ "step": 30104
+ },
+ {
+ "epoch": 82.02997275204359,
+ "grad_norm": 2.3810532093048096,
+ "learning_rate": 1.6463793530838834e-06,
+ "loss": 0.0671,
+ "step": 30105
+ },
+ {
+ "epoch": 82.03269754768392,
+ "grad_norm": 2.194476842880249,
+ "learning_rate": 1.6458942782070864e-06,
+ "loss": 0.025,
+ "step": 30106
+ },
+ {
+ "epoch": 82.03542234332426,
+ "grad_norm": 2.59818434715271,
+ "learning_rate": 1.6454092683917954e-06,
+ "loss": 0.0617,
+ "step": 30107
+ },
+ {
+ "epoch": 82.03814713896458,
+ "grad_norm": 3.1329987049102783,
+ "learning_rate": 1.6449243236417866e-06,
+ "loss": 0.126,
+ "step": 30108
+ },
+ {
+ "epoch": 82.04087193460491,
+ "grad_norm": 2.04888653755188,
+ "learning_rate": 1.6444394439608402e-06,
+ "loss": 0.0331,
+ "step": 30109
+ },
+ {
+ "epoch": 82.04359673024523,
+ "grad_norm": 2.1385014057159424,
+ "learning_rate": 1.6439546293527309e-06,
+ "loss": 0.049,
+ "step": 30110
+ },
+ {
+ "epoch": 82.04632152588556,
+ "grad_norm": 2.791651487350464,
+ "learning_rate": 1.6434698798212312e-06,
+ "loss": 0.141,
+ "step": 30111
+ },
+ {
+ "epoch": 82.04904632152588,
+ "grad_norm": 3.0007333755493164,
+ "learning_rate": 1.6429851953701214e-06,
+ "loss": 0.0712,
+ "step": 30112
+ },
+ {
+ "epoch": 82.05177111716621,
+ "grad_norm": 2.4517953395843506,
+ "learning_rate": 1.6425005760031742e-06,
+ "loss": 0.0281,
+ "step": 30113
+ },
+ {
+ "epoch": 82.05449591280654,
+ "grad_norm": 2.233431577682495,
+ "learning_rate": 1.642016021724163e-06,
+ "loss": 0.046,
+ "step": 30114
+ },
+ {
+ "epoch": 82.05722070844686,
+ "grad_norm": 2.6009597778320312,
+ "learning_rate": 1.6415315325368608e-06,
+ "loss": 0.059,
+ "step": 30115
+ },
+ {
+ "epoch": 82.0599455040872,
+ "grad_norm": 3.337405204772949,
+ "learning_rate": 1.641047108445044e-06,
+ "loss": 0.1318,
+ "step": 30116
+ },
+ {
+ "epoch": 82.06267029972751,
+ "grad_norm": 4.06247091293335,
+ "learning_rate": 1.6405627494524823e-06,
+ "loss": 0.2333,
+ "step": 30117
+ },
+ {
+ "epoch": 82.06539509536785,
+ "grad_norm": 1.3780720233917236,
+ "learning_rate": 1.64007845556295e-06,
+ "loss": 0.0476,
+ "step": 30118
+ },
+ {
+ "epoch": 82.06811989100818,
+ "grad_norm": 2.218391180038452,
+ "learning_rate": 1.6395942267802145e-06,
+ "loss": 0.0264,
+ "step": 30119
+ },
+ {
+ "epoch": 82.0708446866485,
+ "grad_norm": 2.4761962890625,
+ "learning_rate": 1.6391100631080504e-06,
+ "loss": 0.0741,
+ "step": 30120
+ },
+ {
+ "epoch": 82.07356948228883,
+ "grad_norm": 2.4118857383728027,
+ "learning_rate": 1.63862596455023e-06,
+ "loss": 0.0349,
+ "step": 30121
+ },
+ {
+ "epoch": 82.07629427792915,
+ "grad_norm": 2.839411973953247,
+ "learning_rate": 1.6381419311105217e-06,
+ "loss": 0.0471,
+ "step": 30122
+ },
+ {
+ "epoch": 82.07901907356948,
+ "grad_norm": 2.217923879623413,
+ "learning_rate": 1.6376579627926958e-06,
+ "loss": 0.0646,
+ "step": 30123
+ },
+ {
+ "epoch": 82.0817438692098,
+ "grad_norm": 2.5746586322784424,
+ "learning_rate": 1.637174059600517e-06,
+ "loss": 0.0703,
+ "step": 30124
+ },
+ {
+ "epoch": 82.08446866485014,
+ "grad_norm": 3.2880475521087646,
+ "learning_rate": 1.6366902215377612e-06,
+ "loss": 0.0555,
+ "step": 30125
+ },
+ {
+ "epoch": 82.08719346049047,
+ "grad_norm": 2.633786916732788,
+ "learning_rate": 1.6362064486081908e-06,
+ "loss": 0.022,
+ "step": 30126
+ },
+ {
+ "epoch": 82.08991825613079,
+ "grad_norm": 2.3178820610046387,
+ "learning_rate": 1.6357227408155773e-06,
+ "loss": 0.0597,
+ "step": 30127
+ },
+ {
+ "epoch": 82.09264305177112,
+ "grad_norm": 2.050793170928955,
+ "learning_rate": 1.6352390981636823e-06,
+ "loss": 0.0733,
+ "step": 30128
+ },
+ {
+ "epoch": 82.09536784741144,
+ "grad_norm": 1.5514721870422363,
+ "learning_rate": 1.6347555206562792e-06,
+ "loss": 0.0161,
+ "step": 30129
+ },
+ {
+ "epoch": 82.09809264305177,
+ "grad_norm": 2.0822415351867676,
+ "learning_rate": 1.6342720082971297e-06,
+ "loss": 0.0417,
+ "step": 30130
+ },
+ {
+ "epoch": 82.1008174386921,
+ "grad_norm": 2.493922233581543,
+ "learning_rate": 1.6337885610900017e-06,
+ "loss": 0.115,
+ "step": 30131
+ },
+ {
+ "epoch": 82.10354223433242,
+ "grad_norm": 2.7690391540527344,
+ "learning_rate": 1.6333051790386556e-06,
+ "loss": 0.0793,
+ "step": 30132
+ },
+ {
+ "epoch": 82.10626702997276,
+ "grad_norm": 2.0981123447418213,
+ "learning_rate": 1.6328218621468628e-06,
+ "loss": 0.0507,
+ "step": 30133
+ },
+ {
+ "epoch": 82.10899182561307,
+ "grad_norm": 3.4307641983032227,
+ "learning_rate": 1.6323386104183836e-06,
+ "loss": 0.039,
+ "step": 30134
+ },
+ {
+ "epoch": 82.11171662125341,
+ "grad_norm": 2.3298115730285645,
+ "learning_rate": 1.6318554238569807e-06,
+ "loss": 0.0244,
+ "step": 30135
+ },
+ {
+ "epoch": 82.11444141689373,
+ "grad_norm": 2.2847211360931396,
+ "learning_rate": 1.6313723024664175e-06,
+ "loss": 0.034,
+ "step": 30136
+ },
+ {
+ "epoch": 82.11716621253406,
+ "grad_norm": 2.782477855682373,
+ "learning_rate": 1.6308892462504599e-06,
+ "loss": 0.0363,
+ "step": 30137
+ },
+ {
+ "epoch": 82.11989100817439,
+ "grad_norm": 2.7747435569763184,
+ "learning_rate": 1.6304062552128674e-06,
+ "loss": 0.0752,
+ "step": 30138
+ },
+ {
+ "epoch": 82.12261580381471,
+ "grad_norm": 2.447909116744995,
+ "learning_rate": 1.6299233293574012e-06,
+ "loss": 0.0733,
+ "step": 30139
+ },
+ {
+ "epoch": 82.12534059945504,
+ "grad_norm": 2.572230100631714,
+ "learning_rate": 1.6294404686878207e-06,
+ "loss": 0.0378,
+ "step": 30140
+ },
+ {
+ "epoch": 82.12806539509536,
+ "grad_norm": 2.5960028171539307,
+ "learning_rate": 1.6289576732078916e-06,
+ "loss": 0.0273,
+ "step": 30141
+ },
+ {
+ "epoch": 82.1307901907357,
+ "grad_norm": 1.7044440507888794,
+ "learning_rate": 1.6284749429213697e-06,
+ "loss": 0.0255,
+ "step": 30142
+ },
+ {
+ "epoch": 82.13351498637603,
+ "grad_norm": 3.533142328262329,
+ "learning_rate": 1.6279922778320156e-06,
+ "loss": 0.1516,
+ "step": 30143
+ },
+ {
+ "epoch": 82.13623978201635,
+ "grad_norm": 3.6024680137634277,
+ "learning_rate": 1.6275096779435862e-06,
+ "loss": 0.0331,
+ "step": 30144
+ },
+ {
+ "epoch": 82.13896457765668,
+ "grad_norm": 3.0792603492736816,
+ "learning_rate": 1.6270271432598438e-06,
+ "loss": 0.0983,
+ "step": 30145
+ },
+ {
+ "epoch": 82.141689373297,
+ "grad_norm": 1.7023431062698364,
+ "learning_rate": 1.6265446737845458e-06,
+ "loss": 0.024,
+ "step": 30146
+ },
+ {
+ "epoch": 82.14441416893733,
+ "grad_norm": 2.2191717624664307,
+ "learning_rate": 1.626062269521448e-06,
+ "loss": 0.0654,
+ "step": 30147
+ },
+ {
+ "epoch": 82.14713896457765,
+ "grad_norm": 3.3200104236602783,
+ "learning_rate": 1.6255799304743048e-06,
+ "loss": 0.0301,
+ "step": 30148
+ },
+ {
+ "epoch": 82.14986376021798,
+ "grad_norm": 2.1497583389282227,
+ "learning_rate": 1.6250976566468779e-06,
+ "loss": 0.0361,
+ "step": 30149
+ },
+ {
+ "epoch": 82.15258855585832,
+ "grad_norm": 2.7354648113250732,
+ "learning_rate": 1.624615448042921e-06,
+ "loss": 0.0253,
+ "step": 30150
+ },
+ {
+ "epoch": 82.15531335149863,
+ "grad_norm": 3.8269991874694824,
+ "learning_rate": 1.6241333046661888e-06,
+ "loss": 0.1245,
+ "step": 30151
+ },
+ {
+ "epoch": 82.15803814713897,
+ "grad_norm": 3.1344497203826904,
+ "learning_rate": 1.6236512265204352e-06,
+ "loss": 0.0348,
+ "step": 30152
+ },
+ {
+ "epoch": 82.16076294277929,
+ "grad_norm": 2.80470609664917,
+ "learning_rate": 1.623169213609419e-06,
+ "loss": 0.0376,
+ "step": 30153
+ },
+ {
+ "epoch": 82.16348773841962,
+ "grad_norm": 3.6900198459625244,
+ "learning_rate": 1.6226872659368885e-06,
+ "loss": 0.0383,
+ "step": 30154
+ },
+ {
+ "epoch": 82.16621253405995,
+ "grad_norm": 3.068413257598877,
+ "learning_rate": 1.622205383506602e-06,
+ "loss": 0.0623,
+ "step": 30155
+ },
+ {
+ "epoch": 82.16893732970027,
+ "grad_norm": 2.7594008445739746,
+ "learning_rate": 1.6217235663223085e-06,
+ "loss": 0.1019,
+ "step": 30156
+ },
+ {
+ "epoch": 82.1716621253406,
+ "grad_norm": 3.374462604522705,
+ "learning_rate": 1.621241814387764e-06,
+ "loss": 0.0805,
+ "step": 30157
+ },
+ {
+ "epoch": 82.17438692098092,
+ "grad_norm": 2.7398502826690674,
+ "learning_rate": 1.6207601277067197e-06,
+ "loss": 0.0295,
+ "step": 30158
+ },
+ {
+ "epoch": 82.17711171662125,
+ "grad_norm": 2.4901440143585205,
+ "learning_rate": 1.6202785062829252e-06,
+ "loss": 0.0471,
+ "step": 30159
+ },
+ {
+ "epoch": 82.17983651226157,
+ "grad_norm": 2.8590476512908936,
+ "learning_rate": 1.6197969501201295e-06,
+ "loss": 0.0231,
+ "step": 30160
+ },
+ {
+ "epoch": 82.1825613079019,
+ "grad_norm": 10.413185119628906,
+ "learning_rate": 1.6193154592220871e-06,
+ "loss": 0.115,
+ "step": 30161
+ },
+ {
+ "epoch": 82.18528610354224,
+ "grad_norm": 2.662334680557251,
+ "learning_rate": 1.6188340335925478e-06,
+ "loss": 0.0684,
+ "step": 30162
+ },
+ {
+ "epoch": 82.18801089918256,
+ "grad_norm": 2.848132848739624,
+ "learning_rate": 1.6183526732352583e-06,
+ "loss": 0.042,
+ "step": 30163
+ },
+ {
+ "epoch": 82.19073569482289,
+ "grad_norm": 2.152181386947632,
+ "learning_rate": 1.6178713781539658e-06,
+ "loss": 0.0454,
+ "step": 30164
+ },
+ {
+ "epoch": 82.19346049046321,
+ "grad_norm": 2.8709352016448975,
+ "learning_rate": 1.6173901483524246e-06,
+ "loss": 0.1143,
+ "step": 30165
+ },
+ {
+ "epoch": 82.19618528610354,
+ "grad_norm": 2.3323049545288086,
+ "learning_rate": 1.6169089838343776e-06,
+ "loss": 0.0748,
+ "step": 30166
+ },
+ {
+ "epoch": 82.19891008174388,
+ "grad_norm": 2.783975839614868,
+ "learning_rate": 1.6164278846035752e-06,
+ "loss": 0.0835,
+ "step": 30167
+ },
+ {
+ "epoch": 82.2016348773842,
+ "grad_norm": 3.9515433311462402,
+ "learning_rate": 1.61594685066376e-06,
+ "loss": 0.032,
+ "step": 30168
+ },
+ {
+ "epoch": 82.20435967302453,
+ "grad_norm": 2.7064707279205322,
+ "learning_rate": 1.6154658820186819e-06,
+ "loss": 0.1027,
+ "step": 30169
+ },
+ {
+ "epoch": 82.20708446866485,
+ "grad_norm": 2.2218239307403564,
+ "learning_rate": 1.6149849786720873e-06,
+ "loss": 0.1038,
+ "step": 30170
+ },
+ {
+ "epoch": 82.20980926430518,
+ "grad_norm": 2.2611162662506104,
+ "learning_rate": 1.6145041406277162e-06,
+ "loss": 0.0419,
+ "step": 30171
+ },
+ {
+ "epoch": 82.2125340599455,
+ "grad_norm": 2.452496290206909,
+ "learning_rate": 1.6140233678893203e-06,
+ "loss": 0.0332,
+ "step": 30172
+ },
+ {
+ "epoch": 82.21525885558583,
+ "grad_norm": 2.9502222537994385,
+ "learning_rate": 1.6135426604606375e-06,
+ "loss": 0.0842,
+ "step": 30173
+ },
+ {
+ "epoch": 82.21798365122616,
+ "grad_norm": 3.4729695320129395,
+ "learning_rate": 1.613062018345417e-06,
+ "loss": 0.1134,
+ "step": 30174
+ },
+ {
+ "epoch": 82.22070844686648,
+ "grad_norm": 2.6018288135528564,
+ "learning_rate": 1.6125814415473994e-06,
+ "loss": 0.0486,
+ "step": 30175
+ },
+ {
+ "epoch": 82.22343324250681,
+ "grad_norm": 3.1216282844543457,
+ "learning_rate": 1.6121009300703262e-06,
+ "loss": 0.0929,
+ "step": 30176
+ },
+ {
+ "epoch": 82.22615803814713,
+ "grad_norm": 4.083061218261719,
+ "learning_rate": 1.6116204839179428e-06,
+ "loss": 0.0389,
+ "step": 30177
+ },
+ {
+ "epoch": 82.22888283378747,
+ "grad_norm": 3.2521812915802,
+ "learning_rate": 1.611140103093989e-06,
+ "loss": 0.0638,
+ "step": 30178
+ },
+ {
+ "epoch": 82.2316076294278,
+ "grad_norm": 1.6322013139724731,
+ "learning_rate": 1.6106597876022057e-06,
+ "loss": 0.0196,
+ "step": 30179
+ },
+ {
+ "epoch": 82.23433242506812,
+ "grad_norm": 2.0123422145843506,
+ "learning_rate": 1.6101795374463314e-06,
+ "loss": 0.0249,
+ "step": 30180
+ },
+ {
+ "epoch": 82.23705722070845,
+ "grad_norm": 1.8605958223342896,
+ "learning_rate": 1.6096993526301118e-06,
+ "loss": 0.09,
+ "step": 30181
+ },
+ {
+ "epoch": 82.23978201634877,
+ "grad_norm": 2.4019317626953125,
+ "learning_rate": 1.6092192331572843e-06,
+ "loss": 0.0282,
+ "step": 30182
+ },
+ {
+ "epoch": 82.2425068119891,
+ "grad_norm": 2.736300468444824,
+ "learning_rate": 1.6087391790315866e-06,
+ "loss": 0.0564,
+ "step": 30183
+ },
+ {
+ "epoch": 82.24523160762942,
+ "grad_norm": 3.2253520488739014,
+ "learning_rate": 1.6082591902567557e-06,
+ "loss": 0.1209,
+ "step": 30184
+ },
+ {
+ "epoch": 82.24795640326975,
+ "grad_norm": 3.003744125366211,
+ "learning_rate": 1.6077792668365344e-06,
+ "loss": 0.1923,
+ "step": 30185
+ },
+ {
+ "epoch": 82.25068119891009,
+ "grad_norm": 1.6995396614074707,
+ "learning_rate": 1.6072994087746585e-06,
+ "loss": 0.0435,
+ "step": 30186
+ },
+ {
+ "epoch": 82.2534059945504,
+ "grad_norm": 2.5432207584381104,
+ "learning_rate": 1.606819616074864e-06,
+ "loss": 0.0893,
+ "step": 30187
+ },
+ {
+ "epoch": 82.25613079019074,
+ "grad_norm": 2.037693500518799,
+ "learning_rate": 1.6063398887408866e-06,
+ "loss": 0.0284,
+ "step": 30188
+ },
+ {
+ "epoch": 82.25885558583106,
+ "grad_norm": 1.7175441980361938,
+ "learning_rate": 1.6058602267764633e-06,
+ "loss": 0.0694,
+ "step": 30189
+ },
+ {
+ "epoch": 82.26158038147139,
+ "grad_norm": 2.559647798538208,
+ "learning_rate": 1.6053806301853337e-06,
+ "loss": 0.0397,
+ "step": 30190
+ },
+ {
+ "epoch": 82.26430517711172,
+ "grad_norm": 4.633242130279541,
+ "learning_rate": 1.6049010989712288e-06,
+ "loss": 0.2483,
+ "step": 30191
+ },
+ {
+ "epoch": 82.26702997275204,
+ "grad_norm": 1.9954807758331299,
+ "learning_rate": 1.6044216331378837e-06,
+ "loss": 0.1054,
+ "step": 30192
+ },
+ {
+ "epoch": 82.26975476839237,
+ "grad_norm": 2.322779893875122,
+ "learning_rate": 1.603942232689031e-06,
+ "loss": 0.038,
+ "step": 30193
+ },
+ {
+ "epoch": 82.2724795640327,
+ "grad_norm": 2.8108303546905518,
+ "learning_rate": 1.6034628976284084e-06,
+ "loss": 0.0412,
+ "step": 30194
+ },
+ {
+ "epoch": 82.27520435967303,
+ "grad_norm": 2.5841689109802246,
+ "learning_rate": 1.6029836279597455e-06,
+ "loss": 0.044,
+ "step": 30195
+ },
+ {
+ "epoch": 82.27792915531334,
+ "grad_norm": 3.463477611541748,
+ "learning_rate": 1.602504423686775e-06,
+ "loss": 0.0629,
+ "step": 30196
+ },
+ {
+ "epoch": 82.28065395095368,
+ "grad_norm": 2.757986545562744,
+ "learning_rate": 1.6020252848132311e-06,
+ "loss": 0.0304,
+ "step": 30197
+ },
+ {
+ "epoch": 82.28337874659401,
+ "grad_norm": 3.4663634300231934,
+ "learning_rate": 1.6015462113428436e-06,
+ "loss": 0.0537,
+ "step": 30198
+ },
+ {
+ "epoch": 82.28610354223433,
+ "grad_norm": 2.922712564468384,
+ "learning_rate": 1.601067203279345e-06,
+ "loss": 0.0741,
+ "step": 30199
+ },
+ {
+ "epoch": 82.28882833787466,
+ "grad_norm": 2.993884325027466,
+ "learning_rate": 1.6005882606264621e-06,
+ "loss": 0.0383,
+ "step": 30200
+ },
+ {
+ "epoch": 82.29155313351498,
+ "grad_norm": 3.265608072280884,
+ "learning_rate": 1.6001093833879288e-06,
+ "loss": 0.1017,
+ "step": 30201
+ },
+ {
+ "epoch": 82.29427792915531,
+ "grad_norm": 3.439603805541992,
+ "learning_rate": 1.5996305715674743e-06,
+ "loss": 0.0472,
+ "step": 30202
+ },
+ {
+ "epoch": 82.29700272479565,
+ "grad_norm": 1.7652721405029297,
+ "learning_rate": 1.5991518251688265e-06,
+ "loss": 0.0213,
+ "step": 30203
+ },
+ {
+ "epoch": 82.29972752043597,
+ "grad_norm": 2.2727067470550537,
+ "learning_rate": 1.5986731441957114e-06,
+ "loss": 0.0291,
+ "step": 30204
+ },
+ {
+ "epoch": 82.3024523160763,
+ "grad_norm": 2.3539865016937256,
+ "learning_rate": 1.5981945286518597e-06,
+ "loss": 0.076,
+ "step": 30205
+ },
+ {
+ "epoch": 82.30517711171662,
+ "grad_norm": 3.262967824935913,
+ "learning_rate": 1.597715978541e-06,
+ "loss": 0.083,
+ "step": 30206
+ },
+ {
+ "epoch": 82.30790190735695,
+ "grad_norm": 3.4969043731689453,
+ "learning_rate": 1.597237493866859e-06,
+ "loss": 0.0956,
+ "step": 30207
+ },
+ {
+ "epoch": 82.31062670299727,
+ "grad_norm": 2.654318332672119,
+ "learning_rate": 1.5967590746331619e-06,
+ "loss": 0.0367,
+ "step": 30208
+ },
+ {
+ "epoch": 82.3133514986376,
+ "grad_norm": 2.8982152938842773,
+ "learning_rate": 1.5962807208436315e-06,
+ "loss": 0.0437,
+ "step": 30209
+ },
+ {
+ "epoch": 82.31607629427793,
+ "grad_norm": 5.074118614196777,
+ "learning_rate": 1.5958024325019993e-06,
+ "loss": 0.0481,
+ "step": 30210
+ },
+ {
+ "epoch": 82.31880108991825,
+ "grad_norm": 1.6220102310180664,
+ "learning_rate": 1.595324209611987e-06,
+ "loss": 0.0343,
+ "step": 30211
+ },
+ {
+ "epoch": 82.32152588555859,
+ "grad_norm": 3.144766092300415,
+ "learning_rate": 1.594846052177319e-06,
+ "loss": 0.2532,
+ "step": 30212
+ },
+ {
+ "epoch": 82.3242506811989,
+ "grad_norm": 2.7922792434692383,
+ "learning_rate": 1.594367960201718e-06,
+ "loss": 0.0801,
+ "step": 30213
+ },
+ {
+ "epoch": 82.32697547683924,
+ "grad_norm": 3.7109549045562744,
+ "learning_rate": 1.5938899336889102e-06,
+ "loss": 0.1202,
+ "step": 30214
+ },
+ {
+ "epoch": 82.32970027247957,
+ "grad_norm": 3.6727981567382812,
+ "learning_rate": 1.5934119726426177e-06,
+ "loss": 0.0345,
+ "step": 30215
+ },
+ {
+ "epoch": 82.33242506811989,
+ "grad_norm": 5.282775402069092,
+ "learning_rate": 1.5929340770665614e-06,
+ "loss": 0.1466,
+ "step": 30216
+ },
+ {
+ "epoch": 82.33514986376022,
+ "grad_norm": 2.2777795791625977,
+ "learning_rate": 1.5924562469644623e-06,
+ "loss": 0.0508,
+ "step": 30217
+ },
+ {
+ "epoch": 82.33787465940054,
+ "grad_norm": 2.966745615005493,
+ "learning_rate": 1.5919784823400452e-06,
+ "loss": 0.1701,
+ "step": 30218
+ },
+ {
+ "epoch": 82.34059945504087,
+ "grad_norm": 1.6942039728164673,
+ "learning_rate": 1.5915007831970297e-06,
+ "loss": 0.026,
+ "step": 30219
+ },
+ {
+ "epoch": 82.34332425068119,
+ "grad_norm": 2.008901357650757,
+ "learning_rate": 1.5910231495391326e-06,
+ "loss": 0.1946,
+ "step": 30220
+ },
+ {
+ "epoch": 82.34604904632153,
+ "grad_norm": 3.4828262329101562,
+ "learning_rate": 1.5905455813700788e-06,
+ "loss": 0.062,
+ "step": 30221
+ },
+ {
+ "epoch": 82.34877384196186,
+ "grad_norm": 2.490074872970581,
+ "learning_rate": 1.590068078693584e-06,
+ "loss": 0.1156,
+ "step": 30222
+ },
+ {
+ "epoch": 82.35149863760218,
+ "grad_norm": 2.6140756607055664,
+ "learning_rate": 1.58959064151337e-06,
+ "loss": 0.0433,
+ "step": 30223
+ },
+ {
+ "epoch": 82.35422343324251,
+ "grad_norm": 2.654006242752075,
+ "learning_rate": 1.5891132698331536e-06,
+ "loss": 0.0487,
+ "step": 30224
+ },
+ {
+ "epoch": 82.35694822888283,
+ "grad_norm": 1.9457130432128906,
+ "learning_rate": 1.5886359636566494e-06,
+ "loss": 0.025,
+ "step": 30225
+ },
+ {
+ "epoch": 82.35967302452316,
+ "grad_norm": 3.361292600631714,
+ "learning_rate": 1.5881587229875806e-06,
+ "loss": 0.0654,
+ "step": 30226
+ },
+ {
+ "epoch": 82.3623978201635,
+ "grad_norm": 2.7696139812469482,
+ "learning_rate": 1.5876815478296602e-06,
+ "loss": 0.1032,
+ "step": 30227
+ },
+ {
+ "epoch": 82.36512261580381,
+ "grad_norm": 1.7006996870040894,
+ "learning_rate": 1.5872044381866058e-06,
+ "loss": 0.024,
+ "step": 30228
+ },
+ {
+ "epoch": 82.36784741144415,
+ "grad_norm": 2.56009840965271,
+ "learning_rate": 1.5867273940621297e-06,
+ "loss": 0.0395,
+ "step": 30229
+ },
+ {
+ "epoch": 82.37057220708446,
+ "grad_norm": 1.888870120048523,
+ "learning_rate": 1.5862504154599522e-06,
+ "loss": 0.0238,
+ "step": 30230
+ },
+ {
+ "epoch": 82.3732970027248,
+ "grad_norm": 2.4918346405029297,
+ "learning_rate": 1.5857735023837861e-06,
+ "loss": 0.0254,
+ "step": 30231
+ },
+ {
+ "epoch": 82.37602179836512,
+ "grad_norm": 2.846223831176758,
+ "learning_rate": 1.585296654837345e-06,
+ "loss": 0.0959,
+ "step": 30232
+ },
+ {
+ "epoch": 82.37874659400545,
+ "grad_norm": 2.0135998725891113,
+ "learning_rate": 1.5848198728243402e-06,
+ "loss": 0.0236,
+ "step": 30233
+ },
+ {
+ "epoch": 82.38147138964578,
+ "grad_norm": 2.7633562088012695,
+ "learning_rate": 1.5843431563484902e-06,
+ "loss": 0.0304,
+ "step": 30234
+ },
+ {
+ "epoch": 82.3841961852861,
+ "grad_norm": 1.961612582206726,
+ "learning_rate": 1.583866505413505e-06,
+ "loss": 0.0755,
+ "step": 30235
+ },
+ {
+ "epoch": 82.38692098092643,
+ "grad_norm": 2.5416512489318848,
+ "learning_rate": 1.5833899200230963e-06,
+ "loss": 0.0487,
+ "step": 30236
+ },
+ {
+ "epoch": 82.38964577656675,
+ "grad_norm": 2.978325128555298,
+ "learning_rate": 1.582913400180973e-06,
+ "loss": 0.1387,
+ "step": 30237
+ },
+ {
+ "epoch": 82.39237057220708,
+ "grad_norm": 2.6418581008911133,
+ "learning_rate": 1.5824369458908518e-06,
+ "loss": 0.1327,
+ "step": 30238
+ },
+ {
+ "epoch": 82.39509536784742,
+ "grad_norm": 2.6299800872802734,
+ "learning_rate": 1.581960557156441e-06,
+ "loss": 0.055,
+ "step": 30239
+ },
+ {
+ "epoch": 82.39782016348774,
+ "grad_norm": 4.451153755187988,
+ "learning_rate": 1.5814842339814485e-06,
+ "loss": 0.1029,
+ "step": 30240
+ },
+ {
+ "epoch": 82.40054495912807,
+ "grad_norm": 5.714231967926025,
+ "learning_rate": 1.5810079763695852e-06,
+ "loss": 0.0235,
+ "step": 30241
+ },
+ {
+ "epoch": 82.40326975476839,
+ "grad_norm": 1.663466215133667,
+ "learning_rate": 1.5805317843245638e-06,
+ "loss": 0.0168,
+ "step": 30242
+ },
+ {
+ "epoch": 82.40599455040872,
+ "grad_norm": 2.099660873413086,
+ "learning_rate": 1.5800556578500891e-06,
+ "loss": 0.0273,
+ "step": 30243
+ },
+ {
+ "epoch": 82.40871934604904,
+ "grad_norm": 3.4054901599884033,
+ "learning_rate": 1.5795795969498706e-06,
+ "loss": 0.08,
+ "step": 30244
+ },
+ {
+ "epoch": 82.41144414168937,
+ "grad_norm": 4.001406669616699,
+ "learning_rate": 1.579103601627613e-06,
+ "loss": 0.1298,
+ "step": 30245
+ },
+ {
+ "epoch": 82.4141689373297,
+ "grad_norm": 3.6959145069122314,
+ "learning_rate": 1.5786276718870274e-06,
+ "loss": 0.0782,
+ "step": 30246
+ },
+ {
+ "epoch": 82.41689373297002,
+ "grad_norm": 2.4311442375183105,
+ "learning_rate": 1.578151807731818e-06,
+ "loss": 0.0359,
+ "step": 30247
+ },
+ {
+ "epoch": 82.41961852861036,
+ "grad_norm": 2.4477179050445557,
+ "learning_rate": 1.5776760091656918e-06,
+ "loss": 0.0998,
+ "step": 30248
+ },
+ {
+ "epoch": 82.42234332425068,
+ "grad_norm": 2.8573293685913086,
+ "learning_rate": 1.577200276192351e-06,
+ "loss": 0.0335,
+ "step": 30249
+ },
+ {
+ "epoch": 82.42506811989101,
+ "grad_norm": 3.3418049812316895,
+ "learning_rate": 1.5767246088155064e-06,
+ "loss": 0.1005,
+ "step": 30250
+ },
+ {
+ "epoch": 82.42779291553134,
+ "grad_norm": 2.3806207180023193,
+ "learning_rate": 1.5762490070388592e-06,
+ "loss": 0.0373,
+ "step": 30251
+ },
+ {
+ "epoch": 82.43051771117166,
+ "grad_norm": 2.034852981567383,
+ "learning_rate": 1.5757734708661144e-06,
+ "loss": 0.0329,
+ "step": 30252
+ },
+ {
+ "epoch": 82.433242506812,
+ "grad_norm": 2.5034232139587402,
+ "learning_rate": 1.575298000300971e-06,
+ "loss": 0.0387,
+ "step": 30253
+ },
+ {
+ "epoch": 82.43596730245231,
+ "grad_norm": 2.270033359527588,
+ "learning_rate": 1.5748225953471385e-06,
+ "loss": 0.0799,
+ "step": 30254
+ },
+ {
+ "epoch": 82.43869209809264,
+ "grad_norm": 2.658634901046753,
+ "learning_rate": 1.5743472560083162e-06,
+ "loss": 0.1347,
+ "step": 30255
+ },
+ {
+ "epoch": 82.44141689373296,
+ "grad_norm": 5.519894123077393,
+ "learning_rate": 1.5738719822882064e-06,
+ "loss": 0.0948,
+ "step": 30256
+ },
+ {
+ "epoch": 82.4441416893733,
+ "grad_norm": 2.8614137172698975,
+ "learning_rate": 1.5733967741905087e-06,
+ "loss": 0.1078,
+ "step": 30257
+ },
+ {
+ "epoch": 82.44686648501363,
+ "grad_norm": 2.6079354286193848,
+ "learning_rate": 1.5729216317189245e-06,
+ "loss": 0.0734,
+ "step": 30258
+ },
+ {
+ "epoch": 82.44959128065395,
+ "grad_norm": 2.9450924396514893,
+ "learning_rate": 1.5724465548771584e-06,
+ "loss": 0.0694,
+ "step": 30259
+ },
+ {
+ "epoch": 82.45231607629428,
+ "grad_norm": 2.2583277225494385,
+ "learning_rate": 1.5719715436689076e-06,
+ "loss": 0.0238,
+ "step": 30260
+ },
+ {
+ "epoch": 82.4550408719346,
+ "grad_norm": 3.2999963760375977,
+ "learning_rate": 1.5714965980978692e-06,
+ "loss": 0.11,
+ "step": 30261
+ },
+ {
+ "epoch": 82.45776566757493,
+ "grad_norm": 1.9584386348724365,
+ "learning_rate": 1.5710217181677456e-06,
+ "loss": 0.0169,
+ "step": 30262
+ },
+ {
+ "epoch": 82.46049046321527,
+ "grad_norm": 2.5350840091705322,
+ "learning_rate": 1.570546903882233e-06,
+ "loss": 0.0436,
+ "step": 30263
+ },
+ {
+ "epoch": 82.46321525885558,
+ "grad_norm": 3.3207385540008545,
+ "learning_rate": 1.5700721552450315e-06,
+ "loss": 0.0593,
+ "step": 30264
+ },
+ {
+ "epoch": 82.46594005449592,
+ "grad_norm": 2.6607284545898438,
+ "learning_rate": 1.5695974722598328e-06,
+ "loss": 0.0351,
+ "step": 30265
+ },
+ {
+ "epoch": 82.46866485013624,
+ "grad_norm": 1.9403024911880493,
+ "learning_rate": 1.5691228549303406e-06,
+ "loss": 0.0352,
+ "step": 30266
+ },
+ {
+ "epoch": 82.47138964577657,
+ "grad_norm": 2.3460240364074707,
+ "learning_rate": 1.5686483032602484e-06,
+ "loss": 0.029,
+ "step": 30267
+ },
+ {
+ "epoch": 82.47411444141689,
+ "grad_norm": 2.857072591781616,
+ "learning_rate": 1.5681738172532513e-06,
+ "loss": 0.0429,
+ "step": 30268
+ },
+ {
+ "epoch": 82.47683923705722,
+ "grad_norm": 2.1656620502471924,
+ "learning_rate": 1.5676993969130439e-06,
+ "loss": 0.0262,
+ "step": 30269
+ },
+ {
+ "epoch": 82.47956403269755,
+ "grad_norm": 3.6469504833221436,
+ "learning_rate": 1.5672250422433233e-06,
+ "loss": 0.0514,
+ "step": 30270
+ },
+ {
+ "epoch": 82.48228882833787,
+ "grad_norm": 1.6631399393081665,
+ "learning_rate": 1.5667507532477833e-06,
+ "loss": 0.0191,
+ "step": 30271
+ },
+ {
+ "epoch": 82.4850136239782,
+ "grad_norm": 2.5740177631378174,
+ "learning_rate": 1.5662765299301174e-06,
+ "loss": 0.0697,
+ "step": 30272
+ },
+ {
+ "epoch": 82.48773841961852,
+ "grad_norm": 2.5435543060302734,
+ "learning_rate": 1.5658023722940151e-06,
+ "loss": 0.1915,
+ "step": 30273
+ },
+ {
+ "epoch": 82.49046321525886,
+ "grad_norm": 3.1907248497009277,
+ "learning_rate": 1.5653282803431734e-06,
+ "loss": 0.0545,
+ "step": 30274
+ },
+ {
+ "epoch": 82.49318801089919,
+ "grad_norm": 4.00557804107666,
+ "learning_rate": 1.564854254081285e-06,
+ "loss": 0.0563,
+ "step": 30275
+ },
+ {
+ "epoch": 82.49591280653951,
+ "grad_norm": 2.2429308891296387,
+ "learning_rate": 1.5643802935120411e-06,
+ "loss": 0.035,
+ "step": 30276
+ },
+ {
+ "epoch": 82.49863760217984,
+ "grad_norm": 3.5843381881713867,
+ "learning_rate": 1.5639063986391322e-06,
+ "loss": 0.1553,
+ "step": 30277
+ },
+ {
+ "epoch": 82.50136239782016,
+ "grad_norm": 1.9688689708709717,
+ "learning_rate": 1.5634325694662455e-06,
+ "loss": 0.0358,
+ "step": 30278
+ },
+ {
+ "epoch": 82.50408719346049,
+ "grad_norm": 2.6274609565734863,
+ "learning_rate": 1.5629588059970769e-06,
+ "loss": 0.031,
+ "step": 30279
+ },
+ {
+ "epoch": 82.50681198910081,
+ "grad_norm": 2.148953676223755,
+ "learning_rate": 1.5624851082353143e-06,
+ "loss": 0.1204,
+ "step": 30280
+ },
+ {
+ "epoch": 82.50953678474114,
+ "grad_norm": 2.4428417682647705,
+ "learning_rate": 1.562011476184645e-06,
+ "loss": 0.034,
+ "step": 30281
+ },
+ {
+ "epoch": 82.51226158038148,
+ "grad_norm": 2.7503209114074707,
+ "learning_rate": 1.561537909848757e-06,
+ "loss": 0.0346,
+ "step": 30282
+ },
+ {
+ "epoch": 82.5149863760218,
+ "grad_norm": 2.4017913341522217,
+ "learning_rate": 1.561064409231342e-06,
+ "loss": 0.0484,
+ "step": 30283
+ },
+ {
+ "epoch": 82.51771117166213,
+ "grad_norm": 2.8435680866241455,
+ "learning_rate": 1.560590974336087e-06,
+ "loss": 0.0574,
+ "step": 30284
+ },
+ {
+ "epoch": 82.52043596730245,
+ "grad_norm": 1.748368740081787,
+ "learning_rate": 1.5601176051666744e-06,
+ "loss": 0.035,
+ "step": 30285
+ },
+ {
+ "epoch": 82.52316076294278,
+ "grad_norm": 3.2250211238861084,
+ "learning_rate": 1.559644301726797e-06,
+ "loss": 0.0543,
+ "step": 30286
+ },
+ {
+ "epoch": 82.52588555858311,
+ "grad_norm": 1.9527214765548706,
+ "learning_rate": 1.5591710640201385e-06,
+ "loss": 0.0245,
+ "step": 30287
+ },
+ {
+ "epoch": 82.52861035422343,
+ "grad_norm": 2.7119812965393066,
+ "learning_rate": 1.5586978920503836e-06,
+ "loss": 0.0351,
+ "step": 30288
+ },
+ {
+ "epoch": 82.53133514986376,
+ "grad_norm": 1.9051939249038696,
+ "learning_rate": 1.5582247858212152e-06,
+ "loss": 0.033,
+ "step": 30289
+ },
+ {
+ "epoch": 82.53405994550408,
+ "grad_norm": 2.1461281776428223,
+ "learning_rate": 1.5577517453363234e-06,
+ "loss": 0.0296,
+ "step": 30290
+ },
+ {
+ "epoch": 82.53678474114442,
+ "grad_norm": 3.381720542907715,
+ "learning_rate": 1.5572787705993863e-06,
+ "loss": 0.0357,
+ "step": 30291
+ },
+ {
+ "epoch": 82.53950953678473,
+ "grad_norm": 2.9295082092285156,
+ "learning_rate": 1.5568058616140934e-06,
+ "loss": 0.0379,
+ "step": 30292
+ },
+ {
+ "epoch": 82.54223433242507,
+ "grad_norm": 3.9110260009765625,
+ "learning_rate": 1.5563330183841252e-06,
+ "loss": 0.0748,
+ "step": 30293
+ },
+ {
+ "epoch": 82.5449591280654,
+ "grad_norm": 2.8895926475524902,
+ "learning_rate": 1.5558602409131606e-06,
+ "loss": 0.054,
+ "step": 30294
+ },
+ {
+ "epoch": 82.54768392370572,
+ "grad_norm": 4.43402624130249,
+ "learning_rate": 1.555387529204887e-06,
+ "loss": 0.0612,
+ "step": 30295
+ },
+ {
+ "epoch": 82.55040871934605,
+ "grad_norm": 2.748997449874878,
+ "learning_rate": 1.5549148832629834e-06,
+ "loss": 0.1353,
+ "step": 30296
+ },
+ {
+ "epoch": 82.55313351498637,
+ "grad_norm": 2.1949260234832764,
+ "learning_rate": 1.5544423030911316e-06,
+ "loss": 0.0277,
+ "step": 30297
+ },
+ {
+ "epoch": 82.5558583106267,
+ "grad_norm": 2.609607696533203,
+ "learning_rate": 1.5539697886930082e-06,
+ "loss": 0.056,
+ "step": 30298
+ },
+ {
+ "epoch": 82.55858310626704,
+ "grad_norm": 2.2071664333343506,
+ "learning_rate": 1.5534973400722986e-06,
+ "loss": 0.0159,
+ "step": 30299
+ },
+ {
+ "epoch": 82.56130790190736,
+ "grad_norm": 2.790907621383667,
+ "learning_rate": 1.5530249572326806e-06,
+ "loss": 0.0301,
+ "step": 30300
+ },
+ {
+ "epoch": 82.56403269754769,
+ "grad_norm": 2.826721668243408,
+ "learning_rate": 1.5525526401778313e-06,
+ "loss": 0.0798,
+ "step": 30301
+ },
+ {
+ "epoch": 82.566757493188,
+ "grad_norm": 3.125518560409546,
+ "learning_rate": 1.5520803889114288e-06,
+ "loss": 0.2181,
+ "step": 30302
+ },
+ {
+ "epoch": 82.56948228882834,
+ "grad_norm": 2.3341801166534424,
+ "learning_rate": 1.5516082034371538e-06,
+ "loss": 0.1092,
+ "step": 30303
+ },
+ {
+ "epoch": 82.57220708446866,
+ "grad_norm": 3.8021793365478516,
+ "learning_rate": 1.5511360837586832e-06,
+ "loss": 0.2114,
+ "step": 30304
+ },
+ {
+ "epoch": 82.57493188010899,
+ "grad_norm": 3.2330422401428223,
+ "learning_rate": 1.5506640298796927e-06,
+ "loss": 0.0796,
+ "step": 30305
+ },
+ {
+ "epoch": 82.57765667574932,
+ "grad_norm": 2.2091379165649414,
+ "learning_rate": 1.5501920418038553e-06,
+ "loss": 0.0378,
+ "step": 30306
+ },
+ {
+ "epoch": 82.58038147138964,
+ "grad_norm": 2.6230266094207764,
+ "learning_rate": 1.5497201195348532e-06,
+ "loss": 0.0766,
+ "step": 30307
+ },
+ {
+ "epoch": 82.58310626702998,
+ "grad_norm": 3.9569058418273926,
+ "learning_rate": 1.5492482630763594e-06,
+ "loss": 0.0507,
+ "step": 30308
+ },
+ {
+ "epoch": 82.5858310626703,
+ "grad_norm": 2.079242706298828,
+ "learning_rate": 1.5487764724320453e-06,
+ "loss": 0.0662,
+ "step": 30309
+ },
+ {
+ "epoch": 82.58855585831063,
+ "grad_norm": 2.6884078979492188,
+ "learning_rate": 1.548304747605589e-06,
+ "loss": 0.0497,
+ "step": 30310
+ },
+ {
+ "epoch": 82.59128065395096,
+ "grad_norm": 1.6678122282028198,
+ "learning_rate": 1.5478330886006643e-06,
+ "loss": 0.0262,
+ "step": 30311
+ },
+ {
+ "epoch": 82.59400544959128,
+ "grad_norm": 2.8677210807800293,
+ "learning_rate": 1.5473614954209449e-06,
+ "loss": 0.0311,
+ "step": 30312
+ },
+ {
+ "epoch": 82.59673024523161,
+ "grad_norm": 3.624225378036499,
+ "learning_rate": 1.546889968070101e-06,
+ "loss": 0.128,
+ "step": 30313
+ },
+ {
+ "epoch": 82.59945504087193,
+ "grad_norm": 2.751782178878784,
+ "learning_rate": 1.5464185065518034e-06,
+ "loss": 0.0441,
+ "step": 30314
+ },
+ {
+ "epoch": 82.60217983651226,
+ "grad_norm": 3.056368112564087,
+ "learning_rate": 1.54594711086973e-06,
+ "loss": 0.0949,
+ "step": 30315
+ },
+ {
+ "epoch": 82.60490463215258,
+ "grad_norm": 1.8355586528778076,
+ "learning_rate": 1.5454757810275468e-06,
+ "loss": 0.0197,
+ "step": 30316
+ },
+ {
+ "epoch": 82.60762942779292,
+ "grad_norm": 2.217400074005127,
+ "learning_rate": 1.5450045170289275e-06,
+ "loss": 0.103,
+ "step": 30317
+ },
+ {
+ "epoch": 82.61035422343325,
+ "grad_norm": 2.9036612510681152,
+ "learning_rate": 1.544533318877538e-06,
+ "loss": 0.1514,
+ "step": 30318
+ },
+ {
+ "epoch": 82.61307901907357,
+ "grad_norm": 3.0461792945861816,
+ "learning_rate": 1.5440621865770533e-06,
+ "loss": 0.0303,
+ "step": 30319
+ },
+ {
+ "epoch": 82.6158038147139,
+ "grad_norm": 2.601266860961914,
+ "learning_rate": 1.5435911201311405e-06,
+ "loss": 0.051,
+ "step": 30320
+ },
+ {
+ "epoch": 82.61852861035422,
+ "grad_norm": 2.228388786315918,
+ "learning_rate": 1.5431201195434664e-06,
+ "loss": 0.0476,
+ "step": 30321
+ },
+ {
+ "epoch": 82.62125340599455,
+ "grad_norm": 2.456087350845337,
+ "learning_rate": 1.5426491848176995e-06,
+ "loss": 0.1547,
+ "step": 30322
+ },
+ {
+ "epoch": 82.62397820163488,
+ "grad_norm": 4.665582180023193,
+ "learning_rate": 1.542178315957511e-06,
+ "loss": 0.0913,
+ "step": 30323
+ },
+ {
+ "epoch": 82.6267029972752,
+ "grad_norm": 1.9684175252914429,
+ "learning_rate": 1.541707512966566e-06,
+ "loss": 0.0295,
+ "step": 30324
+ },
+ {
+ "epoch": 82.62942779291554,
+ "grad_norm": 3.1616861820220947,
+ "learning_rate": 1.541236775848529e-06,
+ "loss": 0.1428,
+ "step": 30325
+ },
+ {
+ "epoch": 82.63215258855585,
+ "grad_norm": 5.245412826538086,
+ "learning_rate": 1.5407661046070643e-06,
+ "loss": 0.0353,
+ "step": 30326
+ },
+ {
+ "epoch": 82.63487738419619,
+ "grad_norm": 2.222473382949829,
+ "learning_rate": 1.5402954992458451e-06,
+ "loss": 0.0297,
+ "step": 30327
+ },
+ {
+ "epoch": 82.6376021798365,
+ "grad_norm": 2.7224769592285156,
+ "learning_rate": 1.5398249597685334e-06,
+ "loss": 0.2564,
+ "step": 30328
+ },
+ {
+ "epoch": 82.64032697547684,
+ "grad_norm": 4.054591178894043,
+ "learning_rate": 1.5393544861787912e-06,
+ "loss": 0.0649,
+ "step": 30329
+ },
+ {
+ "epoch": 82.64305177111717,
+ "grad_norm": 2.383607864379883,
+ "learning_rate": 1.5388840784802817e-06,
+ "loss": 0.0678,
+ "step": 30330
+ },
+ {
+ "epoch": 82.64577656675749,
+ "grad_norm": 2.370311975479126,
+ "learning_rate": 1.5384137366766739e-06,
+ "loss": 0.0459,
+ "step": 30331
+ },
+ {
+ "epoch": 82.64850136239782,
+ "grad_norm": 2.658867835998535,
+ "learning_rate": 1.5379434607716271e-06,
+ "loss": 0.0666,
+ "step": 30332
+ },
+ {
+ "epoch": 82.65122615803814,
+ "grad_norm": 2.7283833026885986,
+ "learning_rate": 1.537473250768804e-06,
+ "loss": 0.0381,
+ "step": 30333
+ },
+ {
+ "epoch": 82.65395095367847,
+ "grad_norm": 1.801334261894226,
+ "learning_rate": 1.537003106671865e-06,
+ "loss": 0.0211,
+ "step": 30334
+ },
+ {
+ "epoch": 82.65667574931881,
+ "grad_norm": 2.466092586517334,
+ "learning_rate": 1.536533028484476e-06,
+ "loss": 0.0835,
+ "step": 30335
+ },
+ {
+ "epoch": 82.65940054495913,
+ "grad_norm": 2.314575672149658,
+ "learning_rate": 1.5360630162102953e-06,
+ "loss": 0.0376,
+ "step": 30336
+ },
+ {
+ "epoch": 82.66212534059946,
+ "grad_norm": 2.093158006668091,
+ "learning_rate": 1.535593069852983e-06,
+ "loss": 0.0272,
+ "step": 30337
+ },
+ {
+ "epoch": 82.66485013623978,
+ "grad_norm": 3.99423885345459,
+ "learning_rate": 1.5351231894161967e-06,
+ "loss": 0.0568,
+ "step": 30338
+ },
+ {
+ "epoch": 82.66757493188011,
+ "grad_norm": 3.385798692703247,
+ "learning_rate": 1.534653374903602e-06,
+ "loss": 0.1196,
+ "step": 30339
+ },
+ {
+ "epoch": 82.67029972752043,
+ "grad_norm": 3.752199411392212,
+ "learning_rate": 1.5341836263188537e-06,
+ "loss": 0.0334,
+ "step": 30340
+ },
+ {
+ "epoch": 82.67302452316076,
+ "grad_norm": 2.3044042587280273,
+ "learning_rate": 1.53371394366561e-06,
+ "loss": 0.0671,
+ "step": 30341
+ },
+ {
+ "epoch": 82.6757493188011,
+ "grad_norm": 2.897268772125244,
+ "learning_rate": 1.5332443269475284e-06,
+ "loss": 0.1777,
+ "step": 30342
+ },
+ {
+ "epoch": 82.67847411444141,
+ "grad_norm": 2.632194757461548,
+ "learning_rate": 1.5327747761682677e-06,
+ "loss": 0.1456,
+ "step": 30343
+ },
+ {
+ "epoch": 82.68119891008175,
+ "grad_norm": 2.468472719192505,
+ "learning_rate": 1.5323052913314863e-06,
+ "loss": 0.0263,
+ "step": 30344
+ },
+ {
+ "epoch": 82.68392370572207,
+ "grad_norm": 2.753012180328369,
+ "learning_rate": 1.531835872440839e-06,
+ "loss": 0.0849,
+ "step": 30345
+ },
+ {
+ "epoch": 82.6866485013624,
+ "grad_norm": 2.3302366733551025,
+ "learning_rate": 1.5313665194999816e-06,
+ "loss": 0.0476,
+ "step": 30346
+ },
+ {
+ "epoch": 82.68937329700273,
+ "grad_norm": 3.279644012451172,
+ "learning_rate": 1.530897232512566e-06,
+ "loss": 0.037,
+ "step": 30347
+ },
+ {
+ "epoch": 82.69209809264305,
+ "grad_norm": 3.16890549659729,
+ "learning_rate": 1.5304280114822534e-06,
+ "loss": 0.0423,
+ "step": 30348
+ },
+ {
+ "epoch": 82.69482288828338,
+ "grad_norm": 1.5937548875808716,
+ "learning_rate": 1.5299588564126944e-06,
+ "loss": 0.0194,
+ "step": 30349
+ },
+ {
+ "epoch": 82.6975476839237,
+ "grad_norm": 2.417611598968506,
+ "learning_rate": 1.5294897673075405e-06,
+ "loss": 0.0385,
+ "step": 30350
+ },
+ {
+ "epoch": 82.70027247956403,
+ "grad_norm": 2.9801692962646484,
+ "learning_rate": 1.5290207441704507e-06,
+ "loss": 0.0501,
+ "step": 30351
+ },
+ {
+ "epoch": 82.70299727520435,
+ "grad_norm": 2.648916482925415,
+ "learning_rate": 1.5285517870050748e-06,
+ "loss": 0.1549,
+ "step": 30352
+ },
+ {
+ "epoch": 82.70572207084469,
+ "grad_norm": 2.461791515350342,
+ "learning_rate": 1.528082895815065e-06,
+ "loss": 0.1026,
+ "step": 30353
+ },
+ {
+ "epoch": 82.70844686648502,
+ "grad_norm": 2.5765380859375,
+ "learning_rate": 1.5276140706040698e-06,
+ "loss": 0.0536,
+ "step": 30354
+ },
+ {
+ "epoch": 82.71117166212534,
+ "grad_norm": 2.104875326156616,
+ "learning_rate": 1.5271453113757462e-06,
+ "loss": 0.0284,
+ "step": 30355
+ },
+ {
+ "epoch": 82.71389645776567,
+ "grad_norm": 3.0429880619049072,
+ "learning_rate": 1.5266766181337423e-06,
+ "loss": 0.0596,
+ "step": 30356
+ },
+ {
+ "epoch": 82.71662125340599,
+ "grad_norm": 2.4085068702697754,
+ "learning_rate": 1.5262079908817084e-06,
+ "loss": 0.0319,
+ "step": 30357
+ },
+ {
+ "epoch": 82.71934604904632,
+ "grad_norm": 3.892064332962036,
+ "learning_rate": 1.5257394296232907e-06,
+ "loss": 0.096,
+ "step": 30358
+ },
+ {
+ "epoch": 82.72207084468666,
+ "grad_norm": 1.9599765539169312,
+ "learning_rate": 1.5252709343621452e-06,
+ "loss": 0.0277,
+ "step": 30359
+ },
+ {
+ "epoch": 82.72479564032697,
+ "grad_norm": 2.7941465377807617,
+ "learning_rate": 1.5248025051019145e-06,
+ "loss": 0.0881,
+ "step": 30360
+ },
+ {
+ "epoch": 82.7275204359673,
+ "grad_norm": 3.0377144813537598,
+ "learning_rate": 1.524334141846251e-06,
+ "loss": 0.0847,
+ "step": 30361
+ },
+ {
+ "epoch": 82.73024523160763,
+ "grad_norm": 2.1820876598358154,
+ "learning_rate": 1.5238658445987997e-06,
+ "loss": 0.0345,
+ "step": 30362
+ },
+ {
+ "epoch": 82.73297002724796,
+ "grad_norm": 4.174436569213867,
+ "learning_rate": 1.5233976133632067e-06,
+ "loss": 0.0917,
+ "step": 30363
+ },
+ {
+ "epoch": 82.73569482288828,
+ "grad_norm": 3.4797418117523193,
+ "learning_rate": 1.5229294481431233e-06,
+ "loss": 0.1001,
+ "step": 30364
+ },
+ {
+ "epoch": 82.73841961852861,
+ "grad_norm": 2.293530225753784,
+ "learning_rate": 1.5224613489421914e-06,
+ "loss": 0.0307,
+ "step": 30365
+ },
+ {
+ "epoch": 82.74114441416894,
+ "grad_norm": 2.3010637760162354,
+ "learning_rate": 1.5219933157640576e-06,
+ "loss": 0.0726,
+ "step": 30366
+ },
+ {
+ "epoch": 82.74386920980926,
+ "grad_norm": 2.6362626552581787,
+ "learning_rate": 1.521525348612366e-06,
+ "loss": 0.1183,
+ "step": 30367
+ },
+ {
+ "epoch": 82.7465940054496,
+ "grad_norm": 3.284475564956665,
+ "learning_rate": 1.5210574474907635e-06,
+ "loss": 0.0678,
+ "step": 30368
+ },
+ {
+ "epoch": 82.74931880108991,
+ "grad_norm": 1.8884029388427734,
+ "learning_rate": 1.520589612402893e-06,
+ "loss": 0.0197,
+ "step": 30369
+ },
+ {
+ "epoch": 82.75204359673025,
+ "grad_norm": 2.4459478855133057,
+ "learning_rate": 1.5201218433523945e-06,
+ "loss": 0.0264,
+ "step": 30370
+ },
+ {
+ "epoch": 82.75476839237058,
+ "grad_norm": 1.9934412240982056,
+ "learning_rate": 1.5196541403429176e-06,
+ "loss": 0.0404,
+ "step": 30371
+ },
+ {
+ "epoch": 82.7574931880109,
+ "grad_norm": 4.480851650238037,
+ "learning_rate": 1.5191865033781005e-06,
+ "loss": 0.0641,
+ "step": 30372
+ },
+ {
+ "epoch": 82.76021798365123,
+ "grad_norm": 3.1816046237945557,
+ "learning_rate": 1.518718932461587e-06,
+ "loss": 0.0825,
+ "step": 30373
+ },
+ {
+ "epoch": 82.76294277929155,
+ "grad_norm": 3.600402593612671,
+ "learning_rate": 1.518251427597014e-06,
+ "loss": 0.1267,
+ "step": 30374
+ },
+ {
+ "epoch": 82.76566757493188,
+ "grad_norm": 2.135265827178955,
+ "learning_rate": 1.5177839887880287e-06,
+ "loss": 0.0391,
+ "step": 30375
+ },
+ {
+ "epoch": 82.7683923705722,
+ "grad_norm": 1.769209384918213,
+ "learning_rate": 1.5173166160382692e-06,
+ "loss": 0.0286,
+ "step": 30376
+ },
+ {
+ "epoch": 82.77111716621253,
+ "grad_norm": 2.300689697265625,
+ "learning_rate": 1.5168493093513714e-06,
+ "loss": 0.0462,
+ "step": 30377
+ },
+ {
+ "epoch": 82.77384196185287,
+ "grad_norm": 5.4529948234558105,
+ "learning_rate": 1.5163820687309816e-06,
+ "loss": 0.0331,
+ "step": 30378
+ },
+ {
+ "epoch": 82.77656675749319,
+ "grad_norm": 3.395545244216919,
+ "learning_rate": 1.5159148941807323e-06,
+ "loss": 0.0498,
+ "step": 30379
+ },
+ {
+ "epoch": 82.77929155313352,
+ "grad_norm": 3.3990988731384277,
+ "learning_rate": 1.5154477857042672e-06,
+ "loss": 0.0288,
+ "step": 30380
+ },
+ {
+ "epoch": 82.78201634877384,
+ "grad_norm": 2.8645358085632324,
+ "learning_rate": 1.5149807433052222e-06,
+ "loss": 0.1668,
+ "step": 30381
+ },
+ {
+ "epoch": 82.78474114441417,
+ "grad_norm": 1.9748790264129639,
+ "learning_rate": 1.5145137669872334e-06,
+ "loss": 0.0238,
+ "step": 30382
+ },
+ {
+ "epoch": 82.7874659400545,
+ "grad_norm": 2.9800281524658203,
+ "learning_rate": 1.5140468567539357e-06,
+ "loss": 0.095,
+ "step": 30383
+ },
+ {
+ "epoch": 82.79019073569482,
+ "grad_norm": 2.9694268703460693,
+ "learning_rate": 1.5135800126089707e-06,
+ "loss": 0.0295,
+ "step": 30384
+ },
+ {
+ "epoch": 82.79291553133515,
+ "grad_norm": 2.362278699874878,
+ "learning_rate": 1.5131132345559718e-06,
+ "loss": 0.0309,
+ "step": 30385
+ },
+ {
+ "epoch": 82.79564032697547,
+ "grad_norm": 2.7103750705718994,
+ "learning_rate": 1.5126465225985731e-06,
+ "loss": 0.0697,
+ "step": 30386
+ },
+ {
+ "epoch": 82.7983651226158,
+ "grad_norm": 2.0758557319641113,
+ "learning_rate": 1.5121798767404084e-06,
+ "loss": 0.0233,
+ "step": 30387
+ },
+ {
+ "epoch": 82.80108991825612,
+ "grad_norm": 2.3000056743621826,
+ "learning_rate": 1.5117132969851156e-06,
+ "loss": 0.047,
+ "step": 30388
+ },
+ {
+ "epoch": 82.80381471389646,
+ "grad_norm": 3.21502423286438,
+ "learning_rate": 1.5112467833363265e-06,
+ "loss": 0.0957,
+ "step": 30389
+ },
+ {
+ "epoch": 82.80653950953679,
+ "grad_norm": 2.4644534587860107,
+ "learning_rate": 1.5107803357976748e-06,
+ "loss": 0.0904,
+ "step": 30390
+ },
+ {
+ "epoch": 82.80926430517711,
+ "grad_norm": 2.0804672241210938,
+ "learning_rate": 1.5103139543727895e-06,
+ "loss": 0.0291,
+ "step": 30391
+ },
+ {
+ "epoch": 82.81198910081744,
+ "grad_norm": 2.8503310680389404,
+ "learning_rate": 1.5098476390653082e-06,
+ "loss": 0.1207,
+ "step": 30392
+ },
+ {
+ "epoch": 82.81471389645776,
+ "grad_norm": 2.9527807235717773,
+ "learning_rate": 1.509381389878861e-06,
+ "loss": 0.0517,
+ "step": 30393
+ },
+ {
+ "epoch": 82.8174386920981,
+ "grad_norm": 3.389192581176758,
+ "learning_rate": 1.5089152068170755e-06,
+ "loss": 0.0401,
+ "step": 30394
+ },
+ {
+ "epoch": 82.82016348773843,
+ "grad_norm": 3.221360921859741,
+ "learning_rate": 1.5084490898835857e-06,
+ "loss": 0.0496,
+ "step": 30395
+ },
+ {
+ "epoch": 82.82288828337875,
+ "grad_norm": 2.4442756175994873,
+ "learning_rate": 1.5079830390820226e-06,
+ "loss": 0.0295,
+ "step": 30396
+ },
+ {
+ "epoch": 82.82561307901908,
+ "grad_norm": 3.3505232334136963,
+ "learning_rate": 1.5075170544160145e-06,
+ "loss": 0.0624,
+ "step": 30397
+ },
+ {
+ "epoch": 82.8283378746594,
+ "grad_norm": 1.7819381952285767,
+ "learning_rate": 1.5070511358891904e-06,
+ "loss": 0.0206,
+ "step": 30398
+ },
+ {
+ "epoch": 82.83106267029973,
+ "grad_norm": 2.8520798683166504,
+ "learning_rate": 1.5065852835051764e-06,
+ "loss": 0.031,
+ "step": 30399
+ },
+ {
+ "epoch": 82.83378746594005,
+ "grad_norm": 2.9648475646972656,
+ "learning_rate": 1.5061194972676041e-06,
+ "loss": 0.0932,
+ "step": 30400
+ },
+ {
+ "epoch": 82.83651226158038,
+ "grad_norm": 2.1956398487091064,
+ "learning_rate": 1.5056537771801016e-06,
+ "loss": 0.042,
+ "step": 30401
+ },
+ {
+ "epoch": 82.83923705722071,
+ "grad_norm": 3.113151788711548,
+ "learning_rate": 1.5051881232462928e-06,
+ "loss": 0.0357,
+ "step": 30402
+ },
+ {
+ "epoch": 82.84196185286103,
+ "grad_norm": 3.4155240058898926,
+ "learning_rate": 1.5047225354698037e-06,
+ "loss": 0.0434,
+ "step": 30403
+ },
+ {
+ "epoch": 82.84468664850137,
+ "grad_norm": 3.0014431476593018,
+ "learning_rate": 1.5042570138542645e-06,
+ "loss": 0.0336,
+ "step": 30404
+ },
+ {
+ "epoch": 82.84741144414168,
+ "grad_norm": 2.3759243488311768,
+ "learning_rate": 1.503791558403298e-06,
+ "loss": 0.0439,
+ "step": 30405
+ },
+ {
+ "epoch": 82.85013623978202,
+ "grad_norm": 3.328617572784424,
+ "learning_rate": 1.5033261691205292e-06,
+ "loss": 0.2054,
+ "step": 30406
+ },
+ {
+ "epoch": 82.85286103542235,
+ "grad_norm": 3.585984230041504,
+ "learning_rate": 1.5028608460095807e-06,
+ "loss": 0.0538,
+ "step": 30407
+ },
+ {
+ "epoch": 82.85558583106267,
+ "grad_norm": 2.3514294624328613,
+ "learning_rate": 1.5023955890740804e-06,
+ "loss": 0.0342,
+ "step": 30408
+ },
+ {
+ "epoch": 82.858310626703,
+ "grad_norm": 3.1947872638702393,
+ "learning_rate": 1.5019303983176504e-06,
+ "loss": 0.0362,
+ "step": 30409
+ },
+ {
+ "epoch": 82.86103542234332,
+ "grad_norm": 2.9419167041778564,
+ "learning_rate": 1.501465273743913e-06,
+ "loss": 0.0327,
+ "step": 30410
+ },
+ {
+ "epoch": 82.86376021798365,
+ "grad_norm": 3.953352212905884,
+ "learning_rate": 1.5010002153564873e-06,
+ "loss": 0.106,
+ "step": 30411
+ },
+ {
+ "epoch": 82.86648501362397,
+ "grad_norm": 2.5346102714538574,
+ "learning_rate": 1.5005352231589987e-06,
+ "loss": 0.0364,
+ "step": 30412
+ },
+ {
+ "epoch": 82.8692098092643,
+ "grad_norm": 1.6460795402526855,
+ "learning_rate": 1.5000702971550707e-06,
+ "loss": 0.0216,
+ "step": 30413
+ },
+ {
+ "epoch": 82.87193460490464,
+ "grad_norm": 3.1867313385009766,
+ "learning_rate": 1.4996054373483215e-06,
+ "loss": 0.1681,
+ "step": 30414
+ },
+ {
+ "epoch": 82.87465940054496,
+ "grad_norm": 2.953021764755249,
+ "learning_rate": 1.4991406437423694e-06,
+ "loss": 0.1105,
+ "step": 30415
+ },
+ {
+ "epoch": 82.87738419618529,
+ "grad_norm": 2.1132028102874756,
+ "learning_rate": 1.4986759163408393e-06,
+ "loss": 0.0472,
+ "step": 30416
+ },
+ {
+ "epoch": 82.88010899182561,
+ "grad_norm": 2.8401522636413574,
+ "learning_rate": 1.498211255147347e-06,
+ "loss": 0.1408,
+ "step": 30417
+ },
+ {
+ "epoch": 82.88283378746594,
+ "grad_norm": 2.509892702102661,
+ "learning_rate": 1.497746660165511e-06,
+ "loss": 0.0973,
+ "step": 30418
+ },
+ {
+ "epoch": 82.88555858310627,
+ "grad_norm": 2.653618097305298,
+ "learning_rate": 1.4972821313989495e-06,
+ "loss": 0.0714,
+ "step": 30419
+ },
+ {
+ "epoch": 82.88828337874659,
+ "grad_norm": 2.429211378097534,
+ "learning_rate": 1.4968176688512824e-06,
+ "loss": 0.0202,
+ "step": 30420
+ },
+ {
+ "epoch": 82.89100817438693,
+ "grad_norm": 2.8095321655273438,
+ "learning_rate": 1.4963532725261266e-06,
+ "loss": 0.0642,
+ "step": 30421
+ },
+ {
+ "epoch": 82.89373297002724,
+ "grad_norm": 3.2260658740997314,
+ "learning_rate": 1.495888942427096e-06,
+ "loss": 0.0577,
+ "step": 30422
+ },
+ {
+ "epoch": 82.89645776566758,
+ "grad_norm": 1.9967072010040283,
+ "learning_rate": 1.4954246785578085e-06,
+ "loss": 0.0706,
+ "step": 30423
+ },
+ {
+ "epoch": 82.8991825613079,
+ "grad_norm": 1.501876950263977,
+ "learning_rate": 1.4949604809218809e-06,
+ "loss": 0.0172,
+ "step": 30424
+ },
+ {
+ "epoch": 82.90190735694823,
+ "grad_norm": 6.5108819007873535,
+ "learning_rate": 1.4944963495229281e-06,
+ "loss": 0.0757,
+ "step": 30425
+ },
+ {
+ "epoch": 82.90463215258856,
+ "grad_norm": 2.5461976528167725,
+ "learning_rate": 1.4940322843645628e-06,
+ "loss": 0.0275,
+ "step": 30426
+ },
+ {
+ "epoch": 82.90735694822888,
+ "grad_norm": 2.8796920776367188,
+ "learning_rate": 1.4935682854503986e-06,
+ "loss": 0.0397,
+ "step": 30427
+ },
+ {
+ "epoch": 82.91008174386921,
+ "grad_norm": 3.414139986038208,
+ "learning_rate": 1.4931043527840538e-06,
+ "loss": 0.1772,
+ "step": 30428
+ },
+ {
+ "epoch": 82.91280653950953,
+ "grad_norm": 3.3438730239868164,
+ "learning_rate": 1.4926404863691357e-06,
+ "loss": 0.0849,
+ "step": 30429
+ },
+ {
+ "epoch": 82.91553133514986,
+ "grad_norm": 2.3764259815216064,
+ "learning_rate": 1.4921766862092612e-06,
+ "loss": 0.0252,
+ "step": 30430
+ },
+ {
+ "epoch": 82.9182561307902,
+ "grad_norm": 3.374160051345825,
+ "learning_rate": 1.491712952308042e-06,
+ "loss": 0.0494,
+ "step": 30431
+ },
+ {
+ "epoch": 82.92098092643052,
+ "grad_norm": 5.138745307922363,
+ "learning_rate": 1.4912492846690862e-06,
+ "loss": 0.0846,
+ "step": 30432
+ },
+ {
+ "epoch": 82.92370572207085,
+ "grad_norm": 2.571094512939453,
+ "learning_rate": 1.4907856832960088e-06,
+ "loss": 0.0702,
+ "step": 30433
+ },
+ {
+ "epoch": 82.92643051771117,
+ "grad_norm": 3.858018636703491,
+ "learning_rate": 1.490322148192419e-06,
+ "loss": 0.1358,
+ "step": 30434
+ },
+ {
+ "epoch": 82.9291553133515,
+ "grad_norm": 2.0177221298217773,
+ "learning_rate": 1.489858679361923e-06,
+ "loss": 0.0293,
+ "step": 30435
+ },
+ {
+ "epoch": 82.93188010899182,
+ "grad_norm": 1.7879647016525269,
+ "learning_rate": 1.4893952768081377e-06,
+ "loss": 0.0308,
+ "step": 30436
+ },
+ {
+ "epoch": 82.93460490463215,
+ "grad_norm": 2.2398107051849365,
+ "learning_rate": 1.488931940534667e-06,
+ "loss": 0.1906,
+ "step": 30437
+ },
+ {
+ "epoch": 82.93732970027249,
+ "grad_norm": 2.5204010009765625,
+ "learning_rate": 1.4884686705451213e-06,
+ "loss": 0.1873,
+ "step": 30438
+ },
+ {
+ "epoch": 82.9400544959128,
+ "grad_norm": 2.8309268951416016,
+ "learning_rate": 1.4880054668431043e-06,
+ "loss": 0.0631,
+ "step": 30439
+ },
+ {
+ "epoch": 82.94277929155314,
+ "grad_norm": 1.8874447345733643,
+ "learning_rate": 1.48754232943223e-06,
+ "loss": 0.025,
+ "step": 30440
+ },
+ {
+ "epoch": 82.94550408719346,
+ "grad_norm": 2.8392603397369385,
+ "learning_rate": 1.487079258316101e-06,
+ "loss": 0.1589,
+ "step": 30441
+ },
+ {
+ "epoch": 82.94822888283379,
+ "grad_norm": 4.089603900909424,
+ "learning_rate": 1.4866162534983252e-06,
+ "loss": 0.0425,
+ "step": 30442
+ },
+ {
+ "epoch": 82.95095367847412,
+ "grad_norm": 4.412265777587891,
+ "learning_rate": 1.4861533149825058e-06,
+ "loss": 0.0697,
+ "step": 30443
+ },
+ {
+ "epoch": 82.95367847411444,
+ "grad_norm": 2.268439292907715,
+ "learning_rate": 1.485690442772253e-06,
+ "loss": 0.0246,
+ "step": 30444
+ },
+ {
+ "epoch": 82.95640326975477,
+ "grad_norm": 2.5823121070861816,
+ "learning_rate": 1.4852276368711694e-06,
+ "loss": 0.0963,
+ "step": 30445
+ },
+ {
+ "epoch": 82.95912806539509,
+ "grad_norm": 3.604337692260742,
+ "learning_rate": 1.4847648972828554e-06,
+ "loss": 0.0265,
+ "step": 30446
+ },
+ {
+ "epoch": 82.96185286103542,
+ "grad_norm": 2.5100910663604736,
+ "learning_rate": 1.4843022240109218e-06,
+ "loss": 0.0226,
+ "step": 30447
+ },
+ {
+ "epoch": 82.96457765667574,
+ "grad_norm": 2.983286142349243,
+ "learning_rate": 1.4838396170589653e-06,
+ "loss": 0.0363,
+ "step": 30448
+ },
+ {
+ "epoch": 82.96730245231608,
+ "grad_norm": 2.635679244995117,
+ "learning_rate": 1.4833770764305944e-06,
+ "loss": 0.0891,
+ "step": 30449
+ },
+ {
+ "epoch": 82.97002724795641,
+ "grad_norm": 2.105109691619873,
+ "learning_rate": 1.4829146021294083e-06,
+ "loss": 0.0314,
+ "step": 30450
+ },
+ {
+ "epoch": 82.97275204359673,
+ "grad_norm": 3.193880558013916,
+ "learning_rate": 1.4824521941590097e-06,
+ "loss": 0.0221,
+ "step": 30451
+ },
+ {
+ "epoch": 82.97547683923706,
+ "grad_norm": 3.5505714416503906,
+ "learning_rate": 1.4819898525229958e-06,
+ "loss": 0.0597,
+ "step": 30452
+ },
+ {
+ "epoch": 82.97820163487738,
+ "grad_norm": 4.77075719833374,
+ "learning_rate": 1.4815275772249748e-06,
+ "loss": 0.0641,
+ "step": 30453
+ },
+ {
+ "epoch": 82.98092643051771,
+ "grad_norm": 3.000122308731079,
+ "learning_rate": 1.4810653682685417e-06,
+ "loss": 0.1045,
+ "step": 30454
+ },
+ {
+ "epoch": 82.98365122615803,
+ "grad_norm": 2.824181079864502,
+ "learning_rate": 1.4806032256572978e-06,
+ "loss": 0.1285,
+ "step": 30455
+ },
+ {
+ "epoch": 82.98637602179836,
+ "grad_norm": 2.2954354286193848,
+ "learning_rate": 1.4801411493948392e-06,
+ "loss": 0.1122,
+ "step": 30456
+ },
+ {
+ "epoch": 82.9891008174387,
+ "grad_norm": 2.3021657466888428,
+ "learning_rate": 1.47967913948477e-06,
+ "loss": 0.0271,
+ "step": 30457
+ },
+ {
+ "epoch": 82.99182561307902,
+ "grad_norm": 2.3377256393432617,
+ "learning_rate": 1.4792171959306844e-06,
+ "loss": 0.0824,
+ "step": 30458
+ },
+ {
+ "epoch": 82.99455040871935,
+ "grad_norm": 2.6584062576293945,
+ "learning_rate": 1.4787553187361793e-06,
+ "loss": 0.0325,
+ "step": 30459
+ },
+ {
+ "epoch": 82.99727520435967,
+ "grad_norm": 4.0611371994018555,
+ "learning_rate": 1.4782935079048567e-06,
+ "loss": 0.0837,
+ "step": 30460
+ },
+ {
+ "epoch": 83.0,
+ "grad_norm": 3.178171396255493,
+ "learning_rate": 1.4778317634403082e-06,
+ "loss": 0.0384,
+ "step": 30461
+ },
+ {
+ "epoch": 83.00272479564033,
+ "grad_norm": 2.2527153491973877,
+ "learning_rate": 1.4773700853461337e-06,
+ "loss": 0.0552,
+ "step": 30462
+ },
+ {
+ "epoch": 83.00544959128065,
+ "grad_norm": 2.4300429821014404,
+ "learning_rate": 1.4769084736259232e-06,
+ "loss": 0.0335,
+ "step": 30463
+ },
+ {
+ "epoch": 83.00817438692098,
+ "grad_norm": 2.9316818714141846,
+ "learning_rate": 1.4764469282832749e-06,
+ "loss": 0.0597,
+ "step": 30464
+ },
+ {
+ "epoch": 83.0108991825613,
+ "grad_norm": 2.5857608318328857,
+ "learning_rate": 1.4759854493217863e-06,
+ "loss": 0.0337,
+ "step": 30465
+ },
+ {
+ "epoch": 83.01362397820164,
+ "grad_norm": 3.271679639816284,
+ "learning_rate": 1.4755240367450485e-06,
+ "loss": 0.0271,
+ "step": 30466
+ },
+ {
+ "epoch": 83.01634877384195,
+ "grad_norm": 1.6700094938278198,
+ "learning_rate": 1.4750626905566557e-06,
+ "loss": 0.0189,
+ "step": 30467
+ },
+ {
+ "epoch": 83.01907356948229,
+ "grad_norm": 2.1981701850891113,
+ "learning_rate": 1.4746014107601969e-06,
+ "loss": 0.0901,
+ "step": 30468
+ },
+ {
+ "epoch": 83.02179836512262,
+ "grad_norm": 2.88409686088562,
+ "learning_rate": 1.4741401973592718e-06,
+ "loss": 0.0715,
+ "step": 30469
+ },
+ {
+ "epoch": 83.02452316076294,
+ "grad_norm": 3.3284995555877686,
+ "learning_rate": 1.4736790503574672e-06,
+ "loss": 0.019,
+ "step": 30470
+ },
+ {
+ "epoch": 83.02724795640327,
+ "grad_norm": 3.269502878189087,
+ "learning_rate": 1.473217969758376e-06,
+ "loss": 0.0818,
+ "step": 30471
+ },
+ {
+ "epoch": 83.02997275204359,
+ "grad_norm": 2.178234577178955,
+ "learning_rate": 1.4727569555655863e-06,
+ "loss": 0.0653,
+ "step": 30472
+ },
+ {
+ "epoch": 83.03269754768392,
+ "grad_norm": 2.9592747688293457,
+ "learning_rate": 1.4722960077826941e-06,
+ "loss": 0.1468,
+ "step": 30473
+ },
+ {
+ "epoch": 83.03542234332426,
+ "grad_norm": 3.2190043926239014,
+ "learning_rate": 1.4718351264132858e-06,
+ "loss": 0.0342,
+ "step": 30474
+ },
+ {
+ "epoch": 83.03814713896458,
+ "grad_norm": 2.257591485977173,
+ "learning_rate": 1.4713743114609501e-06,
+ "loss": 0.0391,
+ "step": 30475
+ },
+ {
+ "epoch": 83.04087193460491,
+ "grad_norm": 4.885451793670654,
+ "learning_rate": 1.4709135629292759e-06,
+ "loss": 0.0525,
+ "step": 30476
+ },
+ {
+ "epoch": 83.04359673024523,
+ "grad_norm": 2.8167476654052734,
+ "learning_rate": 1.4704528808218544e-06,
+ "loss": 0.1154,
+ "step": 30477
+ },
+ {
+ "epoch": 83.04632152588556,
+ "grad_norm": 2.9282259941101074,
+ "learning_rate": 1.4699922651422705e-06,
+ "loss": 0.2091,
+ "step": 30478
+ },
+ {
+ "epoch": 83.04904632152588,
+ "grad_norm": 3.9317188262939453,
+ "learning_rate": 1.4695317158941126e-06,
+ "loss": 0.0426,
+ "step": 30479
+ },
+ {
+ "epoch": 83.05177111716621,
+ "grad_norm": 2.7909698486328125,
+ "learning_rate": 1.4690712330809653e-06,
+ "loss": 0.0469,
+ "step": 30480
+ },
+ {
+ "epoch": 83.05449591280654,
+ "grad_norm": 2.0851080417633057,
+ "learning_rate": 1.4686108167064162e-06,
+ "loss": 0.1813,
+ "step": 30481
+ },
+ {
+ "epoch": 83.05722070844686,
+ "grad_norm": 2.5919992923736572,
+ "learning_rate": 1.4681504667740544e-06,
+ "loss": 0.0915,
+ "step": 30482
+ },
+ {
+ "epoch": 83.0599455040872,
+ "grad_norm": 2.0471487045288086,
+ "learning_rate": 1.4676901832874612e-06,
+ "loss": 0.0525,
+ "step": 30483
+ },
+ {
+ "epoch": 83.06267029972751,
+ "grad_norm": 2.909069776535034,
+ "learning_rate": 1.467229966250221e-06,
+ "loss": 0.0646,
+ "step": 30484
+ },
+ {
+ "epoch": 83.06539509536785,
+ "grad_norm": 3.2137203216552734,
+ "learning_rate": 1.4667698156659205e-06,
+ "loss": 0.0466,
+ "step": 30485
+ },
+ {
+ "epoch": 83.06811989100818,
+ "grad_norm": 3.1511332988739014,
+ "learning_rate": 1.4663097315381426e-06,
+ "loss": 0.1227,
+ "step": 30486
+ },
+ {
+ "epoch": 83.0708446866485,
+ "grad_norm": 3.3379552364349365,
+ "learning_rate": 1.4658497138704697e-06,
+ "loss": 0.0275,
+ "step": 30487
+ },
+ {
+ "epoch": 83.07356948228883,
+ "grad_norm": 1.6353423595428467,
+ "learning_rate": 1.4653897626664825e-06,
+ "loss": 0.111,
+ "step": 30488
+ },
+ {
+ "epoch": 83.07629427792915,
+ "grad_norm": 2.2430222034454346,
+ "learning_rate": 1.4649298779297671e-06,
+ "loss": 0.0451,
+ "step": 30489
+ },
+ {
+ "epoch": 83.07901907356948,
+ "grad_norm": 2.024216651916504,
+ "learning_rate": 1.4644700596639028e-06,
+ "loss": 0.0292,
+ "step": 30490
+ },
+ {
+ "epoch": 83.0817438692098,
+ "grad_norm": 2.4999301433563232,
+ "learning_rate": 1.4640103078724722e-06,
+ "loss": 0.1379,
+ "step": 30491
+ },
+ {
+ "epoch": 83.08446866485014,
+ "grad_norm": 2.5175302028656006,
+ "learning_rate": 1.4635506225590511e-06,
+ "loss": 0.0499,
+ "step": 30492
+ },
+ {
+ "epoch": 83.08719346049047,
+ "grad_norm": 1.646105408668518,
+ "learning_rate": 1.4630910037272262e-06,
+ "loss": 0.0364,
+ "step": 30493
+ },
+ {
+ "epoch": 83.08991825613079,
+ "grad_norm": 2.1817586421966553,
+ "learning_rate": 1.4626314513805728e-06,
+ "loss": 0.0451,
+ "step": 30494
+ },
+ {
+ "epoch": 83.09264305177112,
+ "grad_norm": 2.398751974105835,
+ "learning_rate": 1.4621719655226718e-06,
+ "loss": 0.0199,
+ "step": 30495
+ },
+ {
+ "epoch": 83.09536784741144,
+ "grad_norm": 2.215655565261841,
+ "learning_rate": 1.461712546157098e-06,
+ "loss": 0.0998,
+ "step": 30496
+ },
+ {
+ "epoch": 83.09809264305177,
+ "grad_norm": 3.4925975799560547,
+ "learning_rate": 1.461253193287434e-06,
+ "loss": 0.0876,
+ "step": 30497
+ },
+ {
+ "epoch": 83.1008174386921,
+ "grad_norm": 2.289992332458496,
+ "learning_rate": 1.4607939069172539e-06,
+ "loss": 0.0528,
+ "step": 30498
+ },
+ {
+ "epoch": 83.10354223433242,
+ "grad_norm": 3.3366615772247314,
+ "learning_rate": 1.4603346870501377e-06,
+ "loss": 0.0846,
+ "step": 30499
+ },
+ {
+ "epoch": 83.10626702997276,
+ "grad_norm": 2.611370325088501,
+ "learning_rate": 1.4598755336896575e-06,
+ "loss": 0.0329,
+ "step": 30500
+ },
+ {
+ "epoch": 83.10899182561307,
+ "grad_norm": 2.5329489707946777,
+ "learning_rate": 1.4594164468393945e-06,
+ "loss": 0.0361,
+ "step": 30501
+ },
+ {
+ "epoch": 83.11171662125341,
+ "grad_norm": 3.375791549682617,
+ "learning_rate": 1.4589574265029216e-06,
+ "loss": 0.0822,
+ "step": 30502
+ },
+ {
+ "epoch": 83.11444141689373,
+ "grad_norm": 2.672603130340576,
+ "learning_rate": 1.4584984726838136e-06,
+ "loss": 0.0269,
+ "step": 30503
+ },
+ {
+ "epoch": 83.11716621253406,
+ "grad_norm": 1.6498534679412842,
+ "learning_rate": 1.4580395853856412e-06,
+ "loss": 0.029,
+ "step": 30504
+ },
+ {
+ "epoch": 83.11989100817439,
+ "grad_norm": 3.100522994995117,
+ "learning_rate": 1.4575807646119844e-06,
+ "loss": 0.1374,
+ "step": 30505
+ },
+ {
+ "epoch": 83.12261580381471,
+ "grad_norm": 3.5831732749938965,
+ "learning_rate": 1.4571220103664142e-06,
+ "loss": 0.1449,
+ "step": 30506
+ },
+ {
+ "epoch": 83.12534059945504,
+ "grad_norm": 3.589817762374878,
+ "learning_rate": 1.4566633226525028e-06,
+ "loss": 0.1358,
+ "step": 30507
+ },
+ {
+ "epoch": 83.12806539509536,
+ "grad_norm": 3.455409526824951,
+ "learning_rate": 1.456204701473819e-06,
+ "loss": 0.0396,
+ "step": 30508
+ },
+ {
+ "epoch": 83.1307901907357,
+ "grad_norm": 2.8189685344696045,
+ "learning_rate": 1.4557461468339418e-06,
+ "loss": 0.0313,
+ "step": 30509
+ },
+ {
+ "epoch": 83.13351498637603,
+ "grad_norm": 3.691716432571411,
+ "learning_rate": 1.4552876587364373e-06,
+ "loss": 0.0425,
+ "step": 30510
+ },
+ {
+ "epoch": 83.13623978201635,
+ "grad_norm": 3.000974655151367,
+ "learning_rate": 1.4548292371848782e-06,
+ "loss": 0.0935,
+ "step": 30511
+ },
+ {
+ "epoch": 83.13896457765668,
+ "grad_norm": 1.9675675630569458,
+ "learning_rate": 1.4543708821828317e-06,
+ "loss": 0.0187,
+ "step": 30512
+ },
+ {
+ "epoch": 83.141689373297,
+ "grad_norm": 2.303309917449951,
+ "learning_rate": 1.4539125937338727e-06,
+ "loss": 0.0364,
+ "step": 30513
+ },
+ {
+ "epoch": 83.14441416893733,
+ "grad_norm": 3.037252902984619,
+ "learning_rate": 1.453454371841566e-06,
+ "loss": 0.1173,
+ "step": 30514
+ },
+ {
+ "epoch": 83.14713896457765,
+ "grad_norm": 1.996396541595459,
+ "learning_rate": 1.4529962165094803e-06,
+ "loss": 0.0722,
+ "step": 30515
+ },
+ {
+ "epoch": 83.14986376021798,
+ "grad_norm": 2.8723056316375732,
+ "learning_rate": 1.4525381277411864e-06,
+ "loss": 0.0352,
+ "step": 30516
+ },
+ {
+ "epoch": 83.15258855585832,
+ "grad_norm": 2.116116762161255,
+ "learning_rate": 1.452080105540249e-06,
+ "loss": 0.0233,
+ "step": 30517
+ },
+ {
+ "epoch": 83.15531335149863,
+ "grad_norm": 3.4875447750091553,
+ "learning_rate": 1.451622149910239e-06,
+ "loss": 0.0553,
+ "step": 30518
+ },
+ {
+ "epoch": 83.15803814713897,
+ "grad_norm": 3.095039129257202,
+ "learning_rate": 1.4511642608547195e-06,
+ "loss": 0.1883,
+ "step": 30519
+ },
+ {
+ "epoch": 83.16076294277929,
+ "grad_norm": 5.829368591308594,
+ "learning_rate": 1.4507064383772585e-06,
+ "loss": 0.1004,
+ "step": 30520
+ },
+ {
+ "epoch": 83.16348773841962,
+ "grad_norm": 2.4921467304229736,
+ "learning_rate": 1.4502486824814176e-06,
+ "loss": 0.1027,
+ "step": 30521
+ },
+ {
+ "epoch": 83.16621253405995,
+ "grad_norm": 3.3920462131500244,
+ "learning_rate": 1.4497909931707677e-06,
+ "loss": 0.0785,
+ "step": 30522
+ },
+ {
+ "epoch": 83.16893732970027,
+ "grad_norm": 1.6282061338424683,
+ "learning_rate": 1.4493333704488698e-06,
+ "loss": 0.0198,
+ "step": 30523
+ },
+ {
+ "epoch": 83.1716621253406,
+ "grad_norm": 1.7396368980407715,
+ "learning_rate": 1.4488758143192871e-06,
+ "loss": 0.0244,
+ "step": 30524
+ },
+ {
+ "epoch": 83.17438692098092,
+ "grad_norm": 2.3437485694885254,
+ "learning_rate": 1.4484183247855853e-06,
+ "loss": 0.1113,
+ "step": 30525
+ },
+ {
+ "epoch": 83.17711171662125,
+ "grad_norm": 2.6190948486328125,
+ "learning_rate": 1.4479609018513275e-06,
+ "loss": 0.0672,
+ "step": 30526
+ },
+ {
+ "epoch": 83.17983651226157,
+ "grad_norm": 2.357954502105713,
+ "learning_rate": 1.4475035455200748e-06,
+ "loss": 0.0504,
+ "step": 30527
+ },
+ {
+ "epoch": 83.1825613079019,
+ "grad_norm": 5.0774922370910645,
+ "learning_rate": 1.4470462557953869e-06,
+ "loss": 0.0404,
+ "step": 30528
+ },
+ {
+ "epoch": 83.18528610354224,
+ "grad_norm": 2.440586805343628,
+ "learning_rate": 1.4465890326808297e-06,
+ "loss": 0.0441,
+ "step": 30529
+ },
+ {
+ "epoch": 83.18801089918256,
+ "grad_norm": 1.9190253019332886,
+ "learning_rate": 1.4461318761799615e-06,
+ "loss": 0.0274,
+ "step": 30530
+ },
+ {
+ "epoch": 83.19073569482289,
+ "grad_norm": 3.7399632930755615,
+ "learning_rate": 1.4456747862963427e-06,
+ "loss": 0.0589,
+ "step": 30531
+ },
+ {
+ "epoch": 83.19346049046321,
+ "grad_norm": 2.8228495121002197,
+ "learning_rate": 1.4452177630335318e-06,
+ "loss": 0.0787,
+ "step": 30532
+ },
+ {
+ "epoch": 83.19618528610354,
+ "grad_norm": 4.243612766265869,
+ "learning_rate": 1.444760806395089e-06,
+ "loss": 0.0576,
+ "step": 30533
+ },
+ {
+ "epoch": 83.19891008174388,
+ "grad_norm": 2.3741116523742676,
+ "learning_rate": 1.4443039163845761e-06,
+ "loss": 0.0338,
+ "step": 30534
+ },
+ {
+ "epoch": 83.2016348773842,
+ "grad_norm": 2.946852684020996,
+ "learning_rate": 1.4438470930055492e-06,
+ "loss": 0.0667,
+ "step": 30535
+ },
+ {
+ "epoch": 83.20435967302453,
+ "grad_norm": 2.58840274810791,
+ "learning_rate": 1.4433903362615654e-06,
+ "loss": 0.0751,
+ "step": 30536
+ },
+ {
+ "epoch": 83.20708446866485,
+ "grad_norm": 2.3835275173187256,
+ "learning_rate": 1.4429336461561804e-06,
+ "loss": 0.1215,
+ "step": 30537
+ },
+ {
+ "epoch": 83.20980926430518,
+ "grad_norm": 1.418433666229248,
+ "learning_rate": 1.4424770226929551e-06,
+ "loss": 0.029,
+ "step": 30538
+ },
+ {
+ "epoch": 83.2125340599455,
+ "grad_norm": 3.596494436264038,
+ "learning_rate": 1.4420204658754432e-06,
+ "loss": 0.0902,
+ "step": 30539
+ },
+ {
+ "epoch": 83.21525885558583,
+ "grad_norm": 2.294933795928955,
+ "learning_rate": 1.4415639757071998e-06,
+ "loss": 0.1384,
+ "step": 30540
+ },
+ {
+ "epoch": 83.21798365122616,
+ "grad_norm": 2.1866657733917236,
+ "learning_rate": 1.4411075521917794e-06,
+ "loss": 0.0433,
+ "step": 30541
+ },
+ {
+ "epoch": 83.22070844686648,
+ "grad_norm": 1.8189126253128052,
+ "learning_rate": 1.4406511953327397e-06,
+ "loss": 0.0631,
+ "step": 30542
+ },
+ {
+ "epoch": 83.22343324250681,
+ "grad_norm": 2.6391940116882324,
+ "learning_rate": 1.4401949051336328e-06,
+ "loss": 0.1192,
+ "step": 30543
+ },
+ {
+ "epoch": 83.22615803814713,
+ "grad_norm": 4.100677967071533,
+ "learning_rate": 1.4397386815980107e-06,
+ "loss": 0.1347,
+ "step": 30544
+ },
+ {
+ "epoch": 83.22888283378747,
+ "grad_norm": 2.553624391555786,
+ "learning_rate": 1.4392825247294307e-06,
+ "loss": 0.0775,
+ "step": 30545
+ },
+ {
+ "epoch": 83.2316076294278,
+ "grad_norm": 2.033749580383301,
+ "learning_rate": 1.4388264345314419e-06,
+ "loss": 0.0284,
+ "step": 30546
+ },
+ {
+ "epoch": 83.23433242506812,
+ "grad_norm": 2.9180612564086914,
+ "learning_rate": 1.438370411007598e-06,
+ "loss": 0.0624,
+ "step": 30547
+ },
+ {
+ "epoch": 83.23705722070845,
+ "grad_norm": 1.4826465845108032,
+ "learning_rate": 1.4379144541614476e-06,
+ "loss": 0.0225,
+ "step": 30548
+ },
+ {
+ "epoch": 83.23978201634877,
+ "grad_norm": 4.95634126663208,
+ "learning_rate": 1.4374585639965433e-06,
+ "loss": 0.065,
+ "step": 30549
+ },
+ {
+ "epoch": 83.2425068119891,
+ "grad_norm": 2.916814088821411,
+ "learning_rate": 1.437002740516439e-06,
+ "loss": 0.0676,
+ "step": 30550
+ },
+ {
+ "epoch": 83.24523160762942,
+ "grad_norm": 3.431065559387207,
+ "learning_rate": 1.4365469837246816e-06,
+ "loss": 0.0545,
+ "step": 30551
+ },
+ {
+ "epoch": 83.24795640326975,
+ "grad_norm": 1.5764778852462769,
+ "learning_rate": 1.4360912936248206e-06,
+ "loss": 0.023,
+ "step": 30552
+ },
+ {
+ "epoch": 83.25068119891009,
+ "grad_norm": 2.429016590118408,
+ "learning_rate": 1.4356356702204033e-06,
+ "loss": 0.0626,
+ "step": 30553
+ },
+ {
+ "epoch": 83.2534059945504,
+ "grad_norm": 2.5421488285064697,
+ "learning_rate": 1.4351801135149812e-06,
+ "loss": 0.0632,
+ "step": 30554
+ },
+ {
+ "epoch": 83.25613079019074,
+ "grad_norm": 1.6964192390441895,
+ "learning_rate": 1.4347246235121003e-06,
+ "loss": 0.0745,
+ "step": 30555
+ },
+ {
+ "epoch": 83.25885558583106,
+ "grad_norm": 2.7233622074127197,
+ "learning_rate": 1.434269200215309e-06,
+ "loss": 0.2518,
+ "step": 30556
+ },
+ {
+ "epoch": 83.26158038147139,
+ "grad_norm": 2.3182289600372314,
+ "learning_rate": 1.4338138436281512e-06,
+ "loss": 0.0272,
+ "step": 30557
+ },
+ {
+ "epoch": 83.26430517711172,
+ "grad_norm": 2.4392614364624023,
+ "learning_rate": 1.4333585537541782e-06,
+ "loss": 0.026,
+ "step": 30558
+ },
+ {
+ "epoch": 83.26702997275204,
+ "grad_norm": 2.2778537273406982,
+ "learning_rate": 1.432903330596933e-06,
+ "loss": 0.0846,
+ "step": 30559
+ },
+ {
+ "epoch": 83.26975476839237,
+ "grad_norm": 2.0409388542175293,
+ "learning_rate": 1.4324481741599606e-06,
+ "loss": 0.0413,
+ "step": 30560
+ },
+ {
+ "epoch": 83.2724795640327,
+ "grad_norm": 2.103501081466675,
+ "learning_rate": 1.4319930844468032e-06,
+ "loss": 0.0439,
+ "step": 30561
+ },
+ {
+ "epoch": 83.27520435967303,
+ "grad_norm": 2.7763302326202393,
+ "learning_rate": 1.4315380614610109e-06,
+ "loss": 0.1452,
+ "step": 30562
+ },
+ {
+ "epoch": 83.27792915531334,
+ "grad_norm": 2.781834125518799,
+ "learning_rate": 1.4310831052061248e-06,
+ "loss": 0.0546,
+ "step": 30563
+ },
+ {
+ "epoch": 83.28065395095368,
+ "grad_norm": 2.491203784942627,
+ "learning_rate": 1.4306282156856866e-06,
+ "loss": 0.0893,
+ "step": 30564
+ },
+ {
+ "epoch": 83.28337874659401,
+ "grad_norm": 2.416351318359375,
+ "learning_rate": 1.430173392903238e-06,
+ "loss": 0.0614,
+ "step": 30565
+ },
+ {
+ "epoch": 83.28610354223433,
+ "grad_norm": 2.570690393447876,
+ "learning_rate": 1.4297186368623262e-06,
+ "loss": 0.0201,
+ "step": 30566
+ },
+ {
+ "epoch": 83.28882833787466,
+ "grad_norm": 2.3026962280273438,
+ "learning_rate": 1.4292639475664872e-06,
+ "loss": 0.089,
+ "step": 30567
+ },
+ {
+ "epoch": 83.29155313351498,
+ "grad_norm": 3.0163443088531494,
+ "learning_rate": 1.4288093250192669e-06,
+ "loss": 0.1858,
+ "step": 30568
+ },
+ {
+ "epoch": 83.29427792915531,
+ "grad_norm": 2.9206223487854004,
+ "learning_rate": 1.4283547692242017e-06,
+ "loss": 0.0482,
+ "step": 30569
+ },
+ {
+ "epoch": 83.29700272479565,
+ "grad_norm": 3.8568670749664307,
+ "learning_rate": 1.4279002801848352e-06,
+ "loss": 0.0684,
+ "step": 30570
+ },
+ {
+ "epoch": 83.29972752043597,
+ "grad_norm": 2.722461462020874,
+ "learning_rate": 1.4274458579047056e-06,
+ "loss": 0.0273,
+ "step": 30571
+ },
+ {
+ "epoch": 83.3024523160763,
+ "grad_norm": 4.237865447998047,
+ "learning_rate": 1.4269915023873526e-06,
+ "loss": 0.0704,
+ "step": 30572
+ },
+ {
+ "epoch": 83.30517711171662,
+ "grad_norm": 2.010971784591675,
+ "learning_rate": 1.4265372136363109e-06,
+ "loss": 0.0262,
+ "step": 30573
+ },
+ {
+ "epoch": 83.30790190735695,
+ "grad_norm": 1.8063124418258667,
+ "learning_rate": 1.4260829916551245e-06,
+ "loss": 0.022,
+ "step": 30574
+ },
+ {
+ "epoch": 83.31062670299727,
+ "grad_norm": 2.8567333221435547,
+ "learning_rate": 1.425628836447327e-06,
+ "loss": 0.0369,
+ "step": 30575
+ },
+ {
+ "epoch": 83.3133514986376,
+ "grad_norm": 2.1532137393951416,
+ "learning_rate": 1.4251747480164557e-06,
+ "loss": 0.0679,
+ "step": 30576
+ },
+ {
+ "epoch": 83.31607629427793,
+ "grad_norm": 4.473711967468262,
+ "learning_rate": 1.4247207263660467e-06,
+ "loss": 0.1316,
+ "step": 30577
+ },
+ {
+ "epoch": 83.31880108991825,
+ "grad_norm": 3.0395073890686035,
+ "learning_rate": 1.4242667714996371e-06,
+ "loss": 0.0936,
+ "step": 30578
+ },
+ {
+ "epoch": 83.32152588555859,
+ "grad_norm": 2.379467725753784,
+ "learning_rate": 1.4238128834207633e-06,
+ "loss": 0.046,
+ "step": 30579
+ },
+ {
+ "epoch": 83.3242506811989,
+ "grad_norm": 3.5517351627349854,
+ "learning_rate": 1.4233590621329585e-06,
+ "loss": 0.0663,
+ "step": 30580
+ },
+ {
+ "epoch": 83.32697547683924,
+ "grad_norm": 3.2514889240264893,
+ "learning_rate": 1.4229053076397547e-06,
+ "loss": 0.1059,
+ "step": 30581
+ },
+ {
+ "epoch": 83.32970027247957,
+ "grad_norm": 3.2749216556549072,
+ "learning_rate": 1.4224516199446915e-06,
+ "loss": 0.1151,
+ "step": 30582
+ },
+ {
+ "epoch": 83.33242506811989,
+ "grad_norm": 1.983525037765503,
+ "learning_rate": 1.4219979990512977e-06,
+ "loss": 0.0227,
+ "step": 30583
+ },
+ {
+ "epoch": 83.33514986376022,
+ "grad_norm": 2.9139275550842285,
+ "learning_rate": 1.4215444449631054e-06,
+ "loss": 0.0809,
+ "step": 30584
+ },
+ {
+ "epoch": 83.33787465940054,
+ "grad_norm": 2.6436755657196045,
+ "learning_rate": 1.4210909576836496e-06,
+ "loss": 0.054,
+ "step": 30585
+ },
+ {
+ "epoch": 83.34059945504087,
+ "grad_norm": 2.570117235183716,
+ "learning_rate": 1.4206375372164628e-06,
+ "loss": 0.0635,
+ "step": 30586
+ },
+ {
+ "epoch": 83.34332425068119,
+ "grad_norm": 2.180441379547119,
+ "learning_rate": 1.4201841835650755e-06,
+ "loss": 0.1727,
+ "step": 30587
+ },
+ {
+ "epoch": 83.34604904632153,
+ "grad_norm": 1.9770933389663696,
+ "learning_rate": 1.419730896733017e-06,
+ "loss": 0.0207,
+ "step": 30588
+ },
+ {
+ "epoch": 83.34877384196186,
+ "grad_norm": 2.7037570476531982,
+ "learning_rate": 1.419277676723816e-06,
+ "loss": 0.0652,
+ "step": 30589
+ },
+ {
+ "epoch": 83.35149863760218,
+ "grad_norm": 2.091167688369751,
+ "learning_rate": 1.418824523541007e-06,
+ "loss": 0.0382,
+ "step": 30590
+ },
+ {
+ "epoch": 83.35422343324251,
+ "grad_norm": 4.447286128997803,
+ "learning_rate": 1.4183714371881164e-06,
+ "loss": 0.095,
+ "step": 30591
+ },
+ {
+ "epoch": 83.35694822888283,
+ "grad_norm": 3.060070753097534,
+ "learning_rate": 1.4179184176686722e-06,
+ "loss": 0.1467,
+ "step": 30592
+ },
+ {
+ "epoch": 83.35967302452316,
+ "grad_norm": 2.0797278881073,
+ "learning_rate": 1.4174654649862007e-06,
+ "loss": 0.0241,
+ "step": 30593
+ },
+ {
+ "epoch": 83.3623978201635,
+ "grad_norm": 2.980470895767212,
+ "learning_rate": 1.4170125791442346e-06,
+ "loss": 0.0349,
+ "step": 30594
+ },
+ {
+ "epoch": 83.36512261580381,
+ "grad_norm": 2.5694875717163086,
+ "learning_rate": 1.4165597601462987e-06,
+ "loss": 0.0486,
+ "step": 30595
+ },
+ {
+ "epoch": 83.36784741144415,
+ "grad_norm": 5.260220050811768,
+ "learning_rate": 1.4161070079959193e-06,
+ "loss": 0.0368,
+ "step": 30596
+ },
+ {
+ "epoch": 83.37057220708446,
+ "grad_norm": 2.054333209991455,
+ "learning_rate": 1.4156543226966191e-06,
+ "loss": 0.0455,
+ "step": 30597
+ },
+ {
+ "epoch": 83.3732970027248,
+ "grad_norm": 2.686857223510742,
+ "learning_rate": 1.4152017042519295e-06,
+ "loss": 0.0733,
+ "step": 30598
+ },
+ {
+ "epoch": 83.37602179836512,
+ "grad_norm": 2.216090202331543,
+ "learning_rate": 1.4147491526653723e-06,
+ "loss": 0.0734,
+ "step": 30599
+ },
+ {
+ "epoch": 83.37874659400545,
+ "grad_norm": 1.8555707931518555,
+ "learning_rate": 1.4142966679404724e-06,
+ "loss": 0.0211,
+ "step": 30600
+ },
+ {
+ "epoch": 83.38147138964578,
+ "grad_norm": 3.099801778793335,
+ "learning_rate": 1.4138442500807524e-06,
+ "loss": 0.0465,
+ "step": 30601
+ },
+ {
+ "epoch": 83.3841961852861,
+ "grad_norm": 2.2599716186523438,
+ "learning_rate": 1.4133918990897366e-06,
+ "loss": 0.021,
+ "step": 30602
+ },
+ {
+ "epoch": 83.38692098092643,
+ "grad_norm": 3.633221387863159,
+ "learning_rate": 1.4129396149709496e-06,
+ "loss": 0.0861,
+ "step": 30603
+ },
+ {
+ "epoch": 83.38964577656675,
+ "grad_norm": 2.193885087966919,
+ "learning_rate": 1.412487397727914e-06,
+ "loss": 0.0466,
+ "step": 30604
+ },
+ {
+ "epoch": 83.39237057220708,
+ "grad_norm": 2.2453367710113525,
+ "learning_rate": 1.4120352473641497e-06,
+ "loss": 0.0618,
+ "step": 30605
+ },
+ {
+ "epoch": 83.39509536784742,
+ "grad_norm": 3.7001543045043945,
+ "learning_rate": 1.4115831638831756e-06,
+ "loss": 0.0586,
+ "step": 30606
+ },
+ {
+ "epoch": 83.39782016348774,
+ "grad_norm": 3.756469249725342,
+ "learning_rate": 1.411131147288518e-06,
+ "loss": 0.1001,
+ "step": 30607
+ },
+ {
+ "epoch": 83.40054495912807,
+ "grad_norm": 2.7054014205932617,
+ "learning_rate": 1.4106791975836941e-06,
+ "loss": 0.0302,
+ "step": 30608
+ },
+ {
+ "epoch": 83.40326975476839,
+ "grad_norm": 1.775532603263855,
+ "learning_rate": 1.4102273147722235e-06,
+ "loss": 0.02,
+ "step": 30609
+ },
+ {
+ "epoch": 83.40599455040872,
+ "grad_norm": 3.216789960861206,
+ "learning_rate": 1.4097754988576273e-06,
+ "loss": 0.029,
+ "step": 30610
+ },
+ {
+ "epoch": 83.40871934604904,
+ "grad_norm": 1.575819492340088,
+ "learning_rate": 1.4093237498434232e-06,
+ "loss": 0.0206,
+ "step": 30611
+ },
+ {
+ "epoch": 83.41144414168937,
+ "grad_norm": 1.5731652975082397,
+ "learning_rate": 1.408872067733128e-06,
+ "loss": 0.0312,
+ "step": 30612
+ },
+ {
+ "epoch": 83.4141689373297,
+ "grad_norm": 2.619858741760254,
+ "learning_rate": 1.4084204525302602e-06,
+ "loss": 0.0825,
+ "step": 30613
+ },
+ {
+ "epoch": 83.41689373297002,
+ "grad_norm": 2.8369081020355225,
+ "learning_rate": 1.4079689042383394e-06,
+ "loss": 0.0654,
+ "step": 30614
+ },
+ {
+ "epoch": 83.41961852861036,
+ "grad_norm": 2.1706619262695312,
+ "learning_rate": 1.407517422860879e-06,
+ "loss": 0.0266,
+ "step": 30615
+ },
+ {
+ "epoch": 83.42234332425068,
+ "grad_norm": 3.0266902446746826,
+ "learning_rate": 1.4070660084013977e-06,
+ "loss": 0.0541,
+ "step": 30616
+ },
+ {
+ "epoch": 83.42506811989101,
+ "grad_norm": 6.6772356033325195,
+ "learning_rate": 1.4066146608634068e-06,
+ "loss": 0.0365,
+ "step": 30617
+ },
+ {
+ "epoch": 83.42779291553134,
+ "grad_norm": 1.6007728576660156,
+ "learning_rate": 1.4061633802504237e-06,
+ "loss": 0.0336,
+ "step": 30618
+ },
+ {
+ "epoch": 83.43051771117166,
+ "grad_norm": 4.361444473266602,
+ "learning_rate": 1.4057121665659667e-06,
+ "loss": 0.0641,
+ "step": 30619
+ },
+ {
+ "epoch": 83.433242506812,
+ "grad_norm": 2.419548273086548,
+ "learning_rate": 1.4052610198135475e-06,
+ "loss": 0.0233,
+ "step": 30620
+ },
+ {
+ "epoch": 83.43596730245231,
+ "grad_norm": 3.443169593811035,
+ "learning_rate": 1.4048099399966774e-06,
+ "loss": 0.0995,
+ "step": 30621
+ },
+ {
+ "epoch": 83.43869209809264,
+ "grad_norm": 3.115429639816284,
+ "learning_rate": 1.4043589271188695e-06,
+ "loss": 0.0538,
+ "step": 30622
+ },
+ {
+ "epoch": 83.44141689373296,
+ "grad_norm": 3.2137451171875,
+ "learning_rate": 1.4039079811836398e-06,
+ "loss": 0.0373,
+ "step": 30623
+ },
+ {
+ "epoch": 83.4441416893733,
+ "grad_norm": 2.704097270965576,
+ "learning_rate": 1.4034571021944976e-06,
+ "loss": 0.1261,
+ "step": 30624
+ },
+ {
+ "epoch": 83.44686648501363,
+ "grad_norm": 3.3638358116149902,
+ "learning_rate": 1.4030062901549557e-06,
+ "loss": 0.0397,
+ "step": 30625
+ },
+ {
+ "epoch": 83.44959128065395,
+ "grad_norm": 1.66252863407135,
+ "learning_rate": 1.4025555450685213e-06,
+ "loss": 0.0215,
+ "step": 30626
+ },
+ {
+ "epoch": 83.45231607629428,
+ "grad_norm": 1.5898563861846924,
+ "learning_rate": 1.4021048669387094e-06,
+ "loss": 0.0215,
+ "step": 30627
+ },
+ {
+ "epoch": 83.4550408719346,
+ "grad_norm": 1.9060828685760498,
+ "learning_rate": 1.4016542557690282e-06,
+ "loss": 0.0272,
+ "step": 30628
+ },
+ {
+ "epoch": 83.45776566757493,
+ "grad_norm": 2.683668613433838,
+ "learning_rate": 1.4012037115629873e-06,
+ "loss": 0.0589,
+ "step": 30629
+ },
+ {
+ "epoch": 83.46049046321527,
+ "grad_norm": 3.511038303375244,
+ "learning_rate": 1.4007532343240936e-06,
+ "loss": 0.0573,
+ "step": 30630
+ },
+ {
+ "epoch": 83.46321525885558,
+ "grad_norm": 2.3716983795166016,
+ "learning_rate": 1.400302824055858e-06,
+ "loss": 0.0301,
+ "step": 30631
+ },
+ {
+ "epoch": 83.46594005449592,
+ "grad_norm": 2.2675628662109375,
+ "learning_rate": 1.3998524807617875e-06,
+ "loss": 0.0228,
+ "step": 30632
+ },
+ {
+ "epoch": 83.46866485013624,
+ "grad_norm": 2.15134596824646,
+ "learning_rate": 1.399402204445387e-06,
+ "loss": 0.0221,
+ "step": 30633
+ },
+ {
+ "epoch": 83.47138964577657,
+ "grad_norm": 2.639045476913452,
+ "learning_rate": 1.3989519951101682e-06,
+ "loss": 0.0328,
+ "step": 30634
+ },
+ {
+ "epoch": 83.47411444141689,
+ "grad_norm": 2.77884578704834,
+ "learning_rate": 1.3985018527596316e-06,
+ "loss": 0.0475,
+ "step": 30635
+ },
+ {
+ "epoch": 83.47683923705722,
+ "grad_norm": 1.6611262559890747,
+ "learning_rate": 1.398051777397288e-06,
+ "loss": 0.0355,
+ "step": 30636
+ },
+ {
+ "epoch": 83.47956403269755,
+ "grad_norm": 2.4296114444732666,
+ "learning_rate": 1.3976017690266397e-06,
+ "loss": 0.0592,
+ "step": 30637
+ },
+ {
+ "epoch": 83.48228882833787,
+ "grad_norm": 3.121490478515625,
+ "learning_rate": 1.3971518276511909e-06,
+ "loss": 0.0489,
+ "step": 30638
+ },
+ {
+ "epoch": 83.4850136239782,
+ "grad_norm": 3.141040325164795,
+ "learning_rate": 1.3967019532744475e-06,
+ "loss": 0.0381,
+ "step": 30639
+ },
+ {
+ "epoch": 83.48773841961852,
+ "grad_norm": 4.265635013580322,
+ "learning_rate": 1.3962521458999135e-06,
+ "loss": 0.0633,
+ "step": 30640
+ },
+ {
+ "epoch": 83.49046321525886,
+ "grad_norm": 2.9381966590881348,
+ "learning_rate": 1.3958024055310903e-06,
+ "loss": 0.0284,
+ "step": 30641
+ },
+ {
+ "epoch": 83.49318801089919,
+ "grad_norm": 4.230826377868652,
+ "learning_rate": 1.39535273217148e-06,
+ "loss": 0.1055,
+ "step": 30642
+ },
+ {
+ "epoch": 83.49591280653951,
+ "grad_norm": 2.1036412715911865,
+ "learning_rate": 1.3949031258245872e-06,
+ "loss": 0.0441,
+ "step": 30643
+ },
+ {
+ "epoch": 83.49863760217984,
+ "grad_norm": 2.635373115539551,
+ "learning_rate": 1.3944535864939112e-06,
+ "loss": 0.0543,
+ "step": 30644
+ },
+ {
+ "epoch": 83.50136239782016,
+ "grad_norm": 3.0548596382141113,
+ "learning_rate": 1.394004114182954e-06,
+ "loss": 0.1288,
+ "step": 30645
+ },
+ {
+ "epoch": 83.50408719346049,
+ "grad_norm": 3.0379130840301514,
+ "learning_rate": 1.393554708895214e-06,
+ "loss": 0.0715,
+ "step": 30646
+ },
+ {
+ "epoch": 83.50681198910081,
+ "grad_norm": 2.745727062225342,
+ "learning_rate": 1.3931053706341946e-06,
+ "loss": 0.0361,
+ "step": 30647
+ },
+ {
+ "epoch": 83.50953678474114,
+ "grad_norm": 3.432950019836426,
+ "learning_rate": 1.3926560994033945e-06,
+ "loss": 0.03,
+ "step": 30648
+ },
+ {
+ "epoch": 83.51226158038148,
+ "grad_norm": 1.986212134361267,
+ "learning_rate": 1.3922068952063107e-06,
+ "loss": 0.04,
+ "step": 30649
+ },
+ {
+ "epoch": 83.5149863760218,
+ "grad_norm": 2.554323673248291,
+ "learning_rate": 1.3917577580464414e-06,
+ "loss": 0.0786,
+ "step": 30650
+ },
+ {
+ "epoch": 83.51771117166213,
+ "grad_norm": 2.3508431911468506,
+ "learning_rate": 1.3913086879272874e-06,
+ "loss": 0.1057,
+ "step": 30651
+ },
+ {
+ "epoch": 83.52043596730245,
+ "grad_norm": 2.4980311393737793,
+ "learning_rate": 1.3908596848523436e-06,
+ "loss": 0.042,
+ "step": 30652
+ },
+ {
+ "epoch": 83.52316076294278,
+ "grad_norm": 2.53886342048645,
+ "learning_rate": 1.390410748825106e-06,
+ "loss": 0.0601,
+ "step": 30653
+ },
+ {
+ "epoch": 83.52588555858311,
+ "grad_norm": 1.843441367149353,
+ "learning_rate": 1.389961879849072e-06,
+ "loss": 0.0921,
+ "step": 30654
+ },
+ {
+ "epoch": 83.52861035422343,
+ "grad_norm": 2.445556640625,
+ "learning_rate": 1.3895130779277398e-06,
+ "loss": 0.0538,
+ "step": 30655
+ },
+ {
+ "epoch": 83.53133514986376,
+ "grad_norm": 3.4484446048736572,
+ "learning_rate": 1.3890643430646033e-06,
+ "loss": 0.0788,
+ "step": 30656
+ },
+ {
+ "epoch": 83.53405994550408,
+ "grad_norm": 1.5983630418777466,
+ "learning_rate": 1.3886156752631563e-06,
+ "loss": 0.1406,
+ "step": 30657
+ },
+ {
+ "epoch": 83.53678474114442,
+ "grad_norm": 3.125032901763916,
+ "learning_rate": 1.3881670745268904e-06,
+ "loss": 0.0841,
+ "step": 30658
+ },
+ {
+ "epoch": 83.53950953678473,
+ "grad_norm": 2.777785539627075,
+ "learning_rate": 1.3877185408593052e-06,
+ "loss": 0.035,
+ "step": 30659
+ },
+ {
+ "epoch": 83.54223433242507,
+ "grad_norm": 3.1854898929595947,
+ "learning_rate": 1.38727007426389e-06,
+ "loss": 0.0733,
+ "step": 30660
+ },
+ {
+ "epoch": 83.5449591280654,
+ "grad_norm": 3.2417075634002686,
+ "learning_rate": 1.3868216747441388e-06,
+ "loss": 0.0559,
+ "step": 30661
+ },
+ {
+ "epoch": 83.54768392370572,
+ "grad_norm": 2.797309160232544,
+ "learning_rate": 1.386373342303542e-06,
+ "loss": 0.0914,
+ "step": 30662
+ },
+ {
+ "epoch": 83.55040871934605,
+ "grad_norm": 2.2952725887298584,
+ "learning_rate": 1.3859250769455933e-06,
+ "loss": 0.043,
+ "step": 30663
+ },
+ {
+ "epoch": 83.55313351498637,
+ "grad_norm": 2.7266359329223633,
+ "learning_rate": 1.3854768786737826e-06,
+ "loss": 0.0312,
+ "step": 30664
+ },
+ {
+ "epoch": 83.5558583106267,
+ "grad_norm": 3.4587957859039307,
+ "learning_rate": 1.3850287474916013e-06,
+ "loss": 0.0401,
+ "step": 30665
+ },
+ {
+ "epoch": 83.55858310626704,
+ "grad_norm": 4.483211994171143,
+ "learning_rate": 1.3845806834025365e-06,
+ "loss": 0.0289,
+ "step": 30666
+ },
+ {
+ "epoch": 83.56130790190736,
+ "grad_norm": 2.459195852279663,
+ "learning_rate": 1.3841326864100823e-06,
+ "loss": 0.0427,
+ "step": 30667
+ },
+ {
+ "epoch": 83.56403269754769,
+ "grad_norm": 5.380830764770508,
+ "learning_rate": 1.3836847565177258e-06,
+ "loss": 0.0282,
+ "step": 30668
+ },
+ {
+ "epoch": 83.566757493188,
+ "grad_norm": 2.1368446350097656,
+ "learning_rate": 1.3832368937289543e-06,
+ "loss": 0.0287,
+ "step": 30669
+ },
+ {
+ "epoch": 83.56948228882834,
+ "grad_norm": 3.613755941390991,
+ "learning_rate": 1.3827890980472547e-06,
+ "loss": 0.0407,
+ "step": 30670
+ },
+ {
+ "epoch": 83.57220708446866,
+ "grad_norm": 3.5539443492889404,
+ "learning_rate": 1.3823413694761167e-06,
+ "loss": 0.0673,
+ "step": 30671
+ },
+ {
+ "epoch": 83.57493188010899,
+ "grad_norm": 2.5715603828430176,
+ "learning_rate": 1.3818937080190287e-06,
+ "loss": 0.0749,
+ "step": 30672
+ },
+ {
+ "epoch": 83.57765667574932,
+ "grad_norm": 2.368882894515991,
+ "learning_rate": 1.3814461136794755e-06,
+ "loss": 0.0874,
+ "step": 30673
+ },
+ {
+ "epoch": 83.58038147138964,
+ "grad_norm": 3.156682014465332,
+ "learning_rate": 1.3809985864609398e-06,
+ "loss": 0.0434,
+ "step": 30674
+ },
+ {
+ "epoch": 83.58310626702998,
+ "grad_norm": 3.6735572814941406,
+ "learning_rate": 1.3805511263669113e-06,
+ "loss": 0.1656,
+ "step": 30675
+ },
+ {
+ "epoch": 83.5858310626703,
+ "grad_norm": 2.4326329231262207,
+ "learning_rate": 1.3801037334008738e-06,
+ "loss": 0.0489,
+ "step": 30676
+ },
+ {
+ "epoch": 83.58855585831063,
+ "grad_norm": 2.5024240016937256,
+ "learning_rate": 1.379656407566311e-06,
+ "loss": 0.1442,
+ "step": 30677
+ },
+ {
+ "epoch": 83.59128065395096,
+ "grad_norm": 3.217705011367798,
+ "learning_rate": 1.3792091488667047e-06,
+ "loss": 0.038,
+ "step": 30678
+ },
+ {
+ "epoch": 83.59400544959128,
+ "grad_norm": 3.0005221366882324,
+ "learning_rate": 1.3787619573055421e-06,
+ "loss": 0.0558,
+ "step": 30679
+ },
+ {
+ "epoch": 83.59673024523161,
+ "grad_norm": 2.5085296630859375,
+ "learning_rate": 1.378314832886305e-06,
+ "loss": 0.039,
+ "step": 30680
+ },
+ {
+ "epoch": 83.59945504087193,
+ "grad_norm": 2.812469005584717,
+ "learning_rate": 1.3778677756124724e-06,
+ "loss": 0.0897,
+ "step": 30681
+ },
+ {
+ "epoch": 83.60217983651226,
+ "grad_norm": 2.7174370288848877,
+ "learning_rate": 1.3774207854875277e-06,
+ "loss": 0.1178,
+ "step": 30682
+ },
+ {
+ "epoch": 83.60490463215258,
+ "grad_norm": 2.182560682296753,
+ "learning_rate": 1.3769738625149532e-06,
+ "loss": 0.1622,
+ "step": 30683
+ },
+ {
+ "epoch": 83.60762942779292,
+ "grad_norm": 2.84898042678833,
+ "learning_rate": 1.3765270066982294e-06,
+ "loss": 0.0395,
+ "step": 30684
+ },
+ {
+ "epoch": 83.61035422343325,
+ "grad_norm": 2.567331075668335,
+ "learning_rate": 1.3760802180408362e-06,
+ "loss": 0.0294,
+ "step": 30685
+ },
+ {
+ "epoch": 83.61307901907357,
+ "grad_norm": 3.532907485961914,
+ "learning_rate": 1.3756334965462502e-06,
+ "loss": 0.0791,
+ "step": 30686
+ },
+ {
+ "epoch": 83.6158038147139,
+ "grad_norm": 3.5884735584259033,
+ "learning_rate": 1.3751868422179527e-06,
+ "loss": 0.048,
+ "step": 30687
+ },
+ {
+ "epoch": 83.61852861035422,
+ "grad_norm": 2.8066675662994385,
+ "learning_rate": 1.3747402550594246e-06,
+ "loss": 0.105,
+ "step": 30688
+ },
+ {
+ "epoch": 83.62125340599455,
+ "grad_norm": 4.59223747253418,
+ "learning_rate": 1.3742937350741414e-06,
+ "loss": 0.0326,
+ "step": 30689
+ },
+ {
+ "epoch": 83.62397820163488,
+ "grad_norm": 2.3158602714538574,
+ "learning_rate": 1.3738472822655824e-06,
+ "loss": 0.0263,
+ "step": 30690
+ },
+ {
+ "epoch": 83.6267029972752,
+ "grad_norm": 2.349701404571533,
+ "learning_rate": 1.3734008966372192e-06,
+ "loss": 0.0312,
+ "step": 30691
+ },
+ {
+ "epoch": 83.62942779291554,
+ "grad_norm": 2.4214534759521484,
+ "learning_rate": 1.3729545781925357e-06,
+ "loss": 0.0301,
+ "step": 30692
+ },
+ {
+ "epoch": 83.63215258855585,
+ "grad_norm": 2.4475653171539307,
+ "learning_rate": 1.3725083269350038e-06,
+ "loss": 0.0569,
+ "step": 30693
+ },
+ {
+ "epoch": 83.63487738419619,
+ "grad_norm": 4.429915904998779,
+ "learning_rate": 1.3720621428680991e-06,
+ "loss": 0.029,
+ "step": 30694
+ },
+ {
+ "epoch": 83.6376021798365,
+ "grad_norm": 3.721404552459717,
+ "learning_rate": 1.3716160259952948e-06,
+ "loss": 0.1161,
+ "step": 30695
+ },
+ {
+ "epoch": 83.64032697547684,
+ "grad_norm": 1.9863237142562866,
+ "learning_rate": 1.3711699763200692e-06,
+ "loss": 0.0211,
+ "step": 30696
+ },
+ {
+ "epoch": 83.64305177111717,
+ "grad_norm": 3.1300644874572754,
+ "learning_rate": 1.370723993845895e-06,
+ "loss": 0.2092,
+ "step": 30697
+ },
+ {
+ "epoch": 83.64577656675749,
+ "grad_norm": 5.223509311676025,
+ "learning_rate": 1.3702780785762415e-06,
+ "loss": 0.0372,
+ "step": 30698
+ },
+ {
+ "epoch": 83.64850136239782,
+ "grad_norm": 3.500175714492798,
+ "learning_rate": 1.3698322305145871e-06,
+ "loss": 0.0512,
+ "step": 30699
+ },
+ {
+ "epoch": 83.65122615803814,
+ "grad_norm": 2.1549646854400635,
+ "learning_rate": 1.3693864496644017e-06,
+ "loss": 0.0806,
+ "step": 30700
+ },
+ {
+ "epoch": 83.65395095367847,
+ "grad_norm": 2.5164310932159424,
+ "learning_rate": 1.3689407360291562e-06,
+ "loss": 0.0874,
+ "step": 30701
+ },
+ {
+ "epoch": 83.65667574931881,
+ "grad_norm": 2.9584224224090576,
+ "learning_rate": 1.3684950896123205e-06,
+ "loss": 0.223,
+ "step": 30702
+ },
+ {
+ "epoch": 83.65940054495913,
+ "grad_norm": 3.1741037368774414,
+ "learning_rate": 1.3680495104173697e-06,
+ "loss": 0.112,
+ "step": 30703
+ },
+ {
+ "epoch": 83.66212534059946,
+ "grad_norm": 3.3103814125061035,
+ "learning_rate": 1.3676039984477684e-06,
+ "loss": 0.045,
+ "step": 30704
+ },
+ {
+ "epoch": 83.66485013623978,
+ "grad_norm": 2.4003143310546875,
+ "learning_rate": 1.3671585537069931e-06,
+ "loss": 0.0453,
+ "step": 30705
+ },
+ {
+ "epoch": 83.66757493188011,
+ "grad_norm": 2.857621669769287,
+ "learning_rate": 1.3667131761985076e-06,
+ "loss": 0.0537,
+ "step": 30706
+ },
+ {
+ "epoch": 83.67029972752043,
+ "grad_norm": 2.950096845626831,
+ "learning_rate": 1.3662678659257811e-06,
+ "loss": 0.0477,
+ "step": 30707
+ },
+ {
+ "epoch": 83.67302452316076,
+ "grad_norm": 2.1988792419433594,
+ "learning_rate": 1.3658226228922844e-06,
+ "loss": 0.0796,
+ "step": 30708
+ },
+ {
+ "epoch": 83.6757493188011,
+ "grad_norm": 2.5007739067077637,
+ "learning_rate": 1.3653774471014825e-06,
+ "loss": 0.0622,
+ "step": 30709
+ },
+ {
+ "epoch": 83.67847411444141,
+ "grad_norm": 1.994951605796814,
+ "learning_rate": 1.3649323385568435e-06,
+ "loss": 0.0213,
+ "step": 30710
+ },
+ {
+ "epoch": 83.68119891008175,
+ "grad_norm": 2.182677745819092,
+ "learning_rate": 1.3644872972618316e-06,
+ "loss": 0.0238,
+ "step": 30711
+ },
+ {
+ "epoch": 83.68392370572207,
+ "grad_norm": 1.9833247661590576,
+ "learning_rate": 1.3640423232199174e-06,
+ "loss": 0.1247,
+ "step": 30712
+ },
+ {
+ "epoch": 83.6866485013624,
+ "grad_norm": 5.841768264770508,
+ "learning_rate": 1.3635974164345634e-06,
+ "loss": 0.0509,
+ "step": 30713
+ },
+ {
+ "epoch": 83.68937329700273,
+ "grad_norm": 2.157848834991455,
+ "learning_rate": 1.3631525769092336e-06,
+ "loss": 0.0432,
+ "step": 30714
+ },
+ {
+ "epoch": 83.69209809264305,
+ "grad_norm": 3.3198623657226562,
+ "learning_rate": 1.362707804647393e-06,
+ "loss": 0.1129,
+ "step": 30715
+ },
+ {
+ "epoch": 83.69482288828338,
+ "grad_norm": 7.962392330169678,
+ "learning_rate": 1.3622630996525067e-06,
+ "loss": 0.1005,
+ "step": 30716
+ },
+ {
+ "epoch": 83.6975476839237,
+ "grad_norm": 2.285831928253174,
+ "learning_rate": 1.3618184619280383e-06,
+ "loss": 0.141,
+ "step": 30717
+ },
+ {
+ "epoch": 83.70027247956403,
+ "grad_norm": 3.1766984462738037,
+ "learning_rate": 1.3613738914774477e-06,
+ "loss": 0.0723,
+ "step": 30718
+ },
+ {
+ "epoch": 83.70299727520435,
+ "grad_norm": 2.1154513359069824,
+ "learning_rate": 1.3609293883042007e-06,
+ "loss": 0.0608,
+ "step": 30719
+ },
+ {
+ "epoch": 83.70572207084469,
+ "grad_norm": 2.6665258407592773,
+ "learning_rate": 1.360484952411758e-06,
+ "loss": 0.101,
+ "step": 30720
+ },
+ {
+ "epoch": 83.70844686648502,
+ "grad_norm": 2.3414156436920166,
+ "learning_rate": 1.3600405838035779e-06,
+ "loss": 0.0314,
+ "step": 30721
+ },
+ {
+ "epoch": 83.71117166212534,
+ "grad_norm": 2.286808729171753,
+ "learning_rate": 1.3595962824831255e-06,
+ "loss": 0.0941,
+ "step": 30722
+ },
+ {
+ "epoch": 83.71389645776567,
+ "grad_norm": 1.7137775421142578,
+ "learning_rate": 1.3591520484538578e-06,
+ "loss": 0.0461,
+ "step": 30723
+ },
+ {
+ "epoch": 83.71662125340599,
+ "grad_norm": 2.542334794998169,
+ "learning_rate": 1.3587078817192378e-06,
+ "loss": 0.0527,
+ "step": 30724
+ },
+ {
+ "epoch": 83.71934604904632,
+ "grad_norm": 2.442690372467041,
+ "learning_rate": 1.3582637822827228e-06,
+ "loss": 0.0823,
+ "step": 30725
+ },
+ {
+ "epoch": 83.72207084468666,
+ "grad_norm": 1.598746657371521,
+ "learning_rate": 1.3578197501477708e-06,
+ "loss": 0.0205,
+ "step": 30726
+ },
+ {
+ "epoch": 83.72479564032697,
+ "grad_norm": 4.047211647033691,
+ "learning_rate": 1.3573757853178392e-06,
+ "loss": 0.1028,
+ "step": 30727
+ },
+ {
+ "epoch": 83.7275204359673,
+ "grad_norm": 2.4902350902557373,
+ "learning_rate": 1.3569318877963878e-06,
+ "loss": 0.1635,
+ "step": 30728
+ },
+ {
+ "epoch": 83.73024523160763,
+ "grad_norm": 2.145904541015625,
+ "learning_rate": 1.3564880575868734e-06,
+ "loss": 0.0409,
+ "step": 30729
+ },
+ {
+ "epoch": 83.73297002724796,
+ "grad_norm": 2.8706185817718506,
+ "learning_rate": 1.3560442946927522e-06,
+ "loss": 0.0326,
+ "step": 30730
+ },
+ {
+ "epoch": 83.73569482288828,
+ "grad_norm": 3.4135332107543945,
+ "learning_rate": 1.355600599117477e-06,
+ "loss": 0.0359,
+ "step": 30731
+ },
+ {
+ "epoch": 83.73841961852861,
+ "grad_norm": 3.3279924392700195,
+ "learning_rate": 1.3551569708645084e-06,
+ "loss": 0.1347,
+ "step": 30732
+ },
+ {
+ "epoch": 83.74114441416894,
+ "grad_norm": 3.154670000076294,
+ "learning_rate": 1.3547134099372993e-06,
+ "loss": 0.0558,
+ "step": 30733
+ },
+ {
+ "epoch": 83.74386920980926,
+ "grad_norm": 2.459663152694702,
+ "learning_rate": 1.3542699163393036e-06,
+ "loss": 0.0403,
+ "step": 30734
+ },
+ {
+ "epoch": 83.7465940054496,
+ "grad_norm": 2.3531036376953125,
+ "learning_rate": 1.353826490073974e-06,
+ "loss": 0.0515,
+ "step": 30735
+ },
+ {
+ "epoch": 83.74931880108991,
+ "grad_norm": 2.820645809173584,
+ "learning_rate": 1.3533831311447665e-06,
+ "loss": 0.0406,
+ "step": 30736
+ },
+ {
+ "epoch": 83.75204359673025,
+ "grad_norm": 2.0220279693603516,
+ "learning_rate": 1.3529398395551342e-06,
+ "loss": 0.0183,
+ "step": 30737
+ },
+ {
+ "epoch": 83.75476839237058,
+ "grad_norm": 3.94909930229187,
+ "learning_rate": 1.3524966153085272e-06,
+ "loss": 0.0858,
+ "step": 30738
+ },
+ {
+ "epoch": 83.7574931880109,
+ "grad_norm": 2.462339162826538,
+ "learning_rate": 1.3520534584083932e-06,
+ "loss": 0.0272,
+ "step": 30739
+ },
+ {
+ "epoch": 83.76021798365123,
+ "grad_norm": 2.521505832672119,
+ "learning_rate": 1.351610368858194e-06,
+ "loss": 0.0499,
+ "step": 30740
+ },
+ {
+ "epoch": 83.76294277929155,
+ "grad_norm": 3.2271714210510254,
+ "learning_rate": 1.351167346661375e-06,
+ "loss": 0.0789,
+ "step": 30741
+ },
+ {
+ "epoch": 83.76566757493188,
+ "grad_norm": 3.7426722049713135,
+ "learning_rate": 1.3507243918213864e-06,
+ "loss": 0.0493,
+ "step": 30742
+ },
+ {
+ "epoch": 83.7683923705722,
+ "grad_norm": 2.64389967918396,
+ "learning_rate": 1.3502815043416751e-06,
+ "loss": 0.1364,
+ "step": 30743
+ },
+ {
+ "epoch": 83.77111716621253,
+ "grad_norm": 2.8800723552703857,
+ "learning_rate": 1.349838684225695e-06,
+ "loss": 0.1093,
+ "step": 30744
+ },
+ {
+ "epoch": 83.77384196185287,
+ "grad_norm": 3.1709158420562744,
+ "learning_rate": 1.3493959314768934e-06,
+ "loss": 0.1316,
+ "step": 30745
+ },
+ {
+ "epoch": 83.77656675749319,
+ "grad_norm": 2.8967678546905518,
+ "learning_rate": 1.3489532460987176e-06,
+ "loss": 0.0496,
+ "step": 30746
+ },
+ {
+ "epoch": 83.77929155313352,
+ "grad_norm": 1.6467289924621582,
+ "learning_rate": 1.3485106280946137e-06,
+ "loss": 0.0194,
+ "step": 30747
+ },
+ {
+ "epoch": 83.78201634877384,
+ "grad_norm": 2.877261161804199,
+ "learning_rate": 1.348068077468032e-06,
+ "loss": 0.0649,
+ "step": 30748
+ },
+ {
+ "epoch": 83.78474114441417,
+ "grad_norm": 2.013784170150757,
+ "learning_rate": 1.3476255942224193e-06,
+ "loss": 0.1587,
+ "step": 30749
+ },
+ {
+ "epoch": 83.7874659400545,
+ "grad_norm": 2.0299766063690186,
+ "learning_rate": 1.3471831783612189e-06,
+ "loss": 0.0246,
+ "step": 30750
+ },
+ {
+ "epoch": 83.79019073569482,
+ "grad_norm": 1.8846317529678345,
+ "learning_rate": 1.3467408298878747e-06,
+ "loss": 0.0325,
+ "step": 30751
+ },
+ {
+ "epoch": 83.79291553133515,
+ "grad_norm": 2.4729061126708984,
+ "learning_rate": 1.3462985488058366e-06,
+ "loss": 0.115,
+ "step": 30752
+ },
+ {
+ "epoch": 83.79564032697547,
+ "grad_norm": 3.446141481399536,
+ "learning_rate": 1.3458563351185482e-06,
+ "loss": 0.0824,
+ "step": 30753
+ },
+ {
+ "epoch": 83.7983651226158,
+ "grad_norm": 3.2303617000579834,
+ "learning_rate": 1.3454141888294514e-06,
+ "loss": 0.0343,
+ "step": 30754
+ },
+ {
+ "epoch": 83.80108991825612,
+ "grad_norm": 2.0372912883758545,
+ "learning_rate": 1.3449721099419876e-06,
+ "loss": 0.026,
+ "step": 30755
+ },
+ {
+ "epoch": 83.80381471389646,
+ "grad_norm": 2.161118507385254,
+ "learning_rate": 1.3445300984596032e-06,
+ "loss": 0.0423,
+ "step": 30756
+ },
+ {
+ "epoch": 83.80653950953679,
+ "grad_norm": 4.139506816864014,
+ "learning_rate": 1.344088154385741e-06,
+ "loss": 0.0711,
+ "step": 30757
+ },
+ {
+ "epoch": 83.80926430517711,
+ "grad_norm": 2.070422649383545,
+ "learning_rate": 1.3436462777238424e-06,
+ "loss": 0.0359,
+ "step": 30758
+ },
+ {
+ "epoch": 83.81198910081744,
+ "grad_norm": 3.227454900741577,
+ "learning_rate": 1.343204468477346e-06,
+ "loss": 0.1504,
+ "step": 30759
+ },
+ {
+ "epoch": 83.81471389645776,
+ "grad_norm": 2.8671176433563232,
+ "learning_rate": 1.3427627266496967e-06,
+ "loss": 0.0839,
+ "step": 30760
+ },
+ {
+ "epoch": 83.8174386920981,
+ "grad_norm": 1.9733912944793701,
+ "learning_rate": 1.342321052244333e-06,
+ "loss": 0.029,
+ "step": 30761
+ },
+ {
+ "epoch": 83.82016348773843,
+ "grad_norm": 3.2461791038513184,
+ "learning_rate": 1.3418794452646932e-06,
+ "loss": 0.0461,
+ "step": 30762
+ },
+ {
+ "epoch": 83.82288828337875,
+ "grad_norm": 2.115133285522461,
+ "learning_rate": 1.3414379057142158e-06,
+ "loss": 0.1248,
+ "step": 30763
+ },
+ {
+ "epoch": 83.82561307901908,
+ "grad_norm": 1.7545677423477173,
+ "learning_rate": 1.3409964335963443e-06,
+ "loss": 0.0162,
+ "step": 30764
+ },
+ {
+ "epoch": 83.8283378746594,
+ "grad_norm": 2.0505893230438232,
+ "learning_rate": 1.3405550289145131e-06,
+ "loss": 0.0707,
+ "step": 30765
+ },
+ {
+ "epoch": 83.83106267029973,
+ "grad_norm": 2.327916383743286,
+ "learning_rate": 1.3401136916721614e-06,
+ "loss": 0.0438,
+ "step": 30766
+ },
+ {
+ "epoch": 83.83378746594005,
+ "grad_norm": 2.9162378311157227,
+ "learning_rate": 1.339672421872722e-06,
+ "loss": 0.0292,
+ "step": 30767
+ },
+ {
+ "epoch": 83.83651226158038,
+ "grad_norm": 2.5131583213806152,
+ "learning_rate": 1.339231219519639e-06,
+ "loss": 0.1061,
+ "step": 30768
+ },
+ {
+ "epoch": 83.83923705722071,
+ "grad_norm": 3.5404741764068604,
+ "learning_rate": 1.3387900846163427e-06,
+ "loss": 0.1621,
+ "step": 30769
+ },
+ {
+ "epoch": 83.84196185286103,
+ "grad_norm": 2.8070809841156006,
+ "learning_rate": 1.3383490171662717e-06,
+ "loss": 0.062,
+ "step": 30770
+ },
+ {
+ "epoch": 83.84468664850137,
+ "grad_norm": 2.572690486907959,
+ "learning_rate": 1.3379080171728575e-06,
+ "loss": 0.0701,
+ "step": 30771
+ },
+ {
+ "epoch": 83.84741144414168,
+ "grad_norm": 4.501012325286865,
+ "learning_rate": 1.3374670846395388e-06,
+ "loss": 0.0436,
+ "step": 30772
+ },
+ {
+ "epoch": 83.85013623978202,
+ "grad_norm": 3.021658182144165,
+ "learning_rate": 1.3370262195697449e-06,
+ "loss": 0.0804,
+ "step": 30773
+ },
+ {
+ "epoch": 83.85286103542235,
+ "grad_norm": 2.2155721187591553,
+ "learning_rate": 1.336585421966915e-06,
+ "loss": 0.028,
+ "step": 30774
+ },
+ {
+ "epoch": 83.85558583106267,
+ "grad_norm": 2.8366146087646484,
+ "learning_rate": 1.3361446918344789e-06,
+ "loss": 0.041,
+ "step": 30775
+ },
+ {
+ "epoch": 83.858310626703,
+ "grad_norm": 3.742677688598633,
+ "learning_rate": 1.3357040291758661e-06,
+ "loss": 0.0359,
+ "step": 30776
+ },
+ {
+ "epoch": 83.86103542234332,
+ "grad_norm": 3.1085548400878906,
+ "learning_rate": 1.3352634339945147e-06,
+ "loss": 0.1177,
+ "step": 30777
+ },
+ {
+ "epoch": 83.86376021798365,
+ "grad_norm": 2.6871159076690674,
+ "learning_rate": 1.3348229062938522e-06,
+ "loss": 0.029,
+ "step": 30778
+ },
+ {
+ "epoch": 83.86648501362397,
+ "grad_norm": 2.5326735973358154,
+ "learning_rate": 1.3343824460773103e-06,
+ "loss": 0.1137,
+ "step": 30779
+ },
+ {
+ "epoch": 83.8692098092643,
+ "grad_norm": 3.30340313911438,
+ "learning_rate": 1.3339420533483171e-06,
+ "loss": 0.047,
+ "step": 30780
+ },
+ {
+ "epoch": 83.87193460490464,
+ "grad_norm": 3.567577600479126,
+ "learning_rate": 1.3335017281103059e-06,
+ "loss": 0.1472,
+ "step": 30781
+ },
+ {
+ "epoch": 83.87465940054496,
+ "grad_norm": 1.5896742343902588,
+ "learning_rate": 1.3330614703667045e-06,
+ "loss": 0.0453,
+ "step": 30782
+ },
+ {
+ "epoch": 83.87738419618529,
+ "grad_norm": 2.422525644302368,
+ "learning_rate": 1.3326212801209392e-06,
+ "loss": 0.0347,
+ "step": 30783
+ },
+ {
+ "epoch": 83.88010899182561,
+ "grad_norm": 2.526461362838745,
+ "learning_rate": 1.332181157376442e-06,
+ "loss": 0.0426,
+ "step": 30784
+ },
+ {
+ "epoch": 83.88283378746594,
+ "grad_norm": 2.8503379821777344,
+ "learning_rate": 1.33174110213664e-06,
+ "loss": 0.0658,
+ "step": 30785
+ },
+ {
+ "epoch": 83.88555858310627,
+ "grad_norm": 2.456122636795044,
+ "learning_rate": 1.3313011144049593e-06,
+ "loss": 0.0412,
+ "step": 30786
+ },
+ {
+ "epoch": 83.88828337874659,
+ "grad_norm": 1.6854655742645264,
+ "learning_rate": 1.3308611941848237e-06,
+ "loss": 0.0227,
+ "step": 30787
+ },
+ {
+ "epoch": 83.89100817438693,
+ "grad_norm": 2.3722498416900635,
+ "learning_rate": 1.330421341479664e-06,
+ "loss": 0.0312,
+ "step": 30788
+ },
+ {
+ "epoch": 83.89373297002724,
+ "grad_norm": 2.219261646270752,
+ "learning_rate": 1.3299815562929052e-06,
+ "loss": 0.0359,
+ "step": 30789
+ },
+ {
+ "epoch": 83.89645776566758,
+ "grad_norm": 3.1999733448028564,
+ "learning_rate": 1.3295418386279679e-06,
+ "loss": 0.0357,
+ "step": 30790
+ },
+ {
+ "epoch": 83.8991825613079,
+ "grad_norm": 2.2349696159362793,
+ "learning_rate": 1.3291021884882815e-06,
+ "loss": 0.0189,
+ "step": 30791
+ },
+ {
+ "epoch": 83.90190735694823,
+ "grad_norm": 4.736440658569336,
+ "learning_rate": 1.3286626058772668e-06,
+ "loss": 0.0338,
+ "step": 30792
+ },
+ {
+ "epoch": 83.90463215258856,
+ "grad_norm": 2.3881900310516357,
+ "learning_rate": 1.3282230907983507e-06,
+ "loss": 0.1011,
+ "step": 30793
+ },
+ {
+ "epoch": 83.90735694822888,
+ "grad_norm": 2.436798095703125,
+ "learning_rate": 1.327783643254954e-06,
+ "loss": 0.1332,
+ "step": 30794
+ },
+ {
+ "epoch": 83.91008174386921,
+ "grad_norm": 3.1069788932800293,
+ "learning_rate": 1.3273442632504985e-06,
+ "loss": 0.0848,
+ "step": 30795
+ },
+ {
+ "epoch": 83.91280653950953,
+ "grad_norm": 2.8002724647521973,
+ "learning_rate": 1.3269049507884057e-06,
+ "loss": 0.1597,
+ "step": 30796
+ },
+ {
+ "epoch": 83.91553133514986,
+ "grad_norm": 4.678211212158203,
+ "learning_rate": 1.3264657058720998e-06,
+ "loss": 0.1286,
+ "step": 30797
+ },
+ {
+ "epoch": 83.9182561307902,
+ "grad_norm": 3.485680103302002,
+ "learning_rate": 1.326026528504999e-06,
+ "loss": 0.1663,
+ "step": 30798
+ },
+ {
+ "epoch": 83.92098092643052,
+ "grad_norm": 2.8237295150756836,
+ "learning_rate": 1.325587418690525e-06,
+ "loss": 0.124,
+ "step": 30799
+ },
+ {
+ "epoch": 83.92370572207085,
+ "grad_norm": 2.188760995864868,
+ "learning_rate": 1.325148376432095e-06,
+ "loss": 0.0598,
+ "step": 30800
+ },
+ {
+ "epoch": 83.92643051771117,
+ "grad_norm": 2.43650221824646,
+ "learning_rate": 1.324709401733133e-06,
+ "loss": 0.028,
+ "step": 30801
+ },
+ {
+ "epoch": 83.9291553133515,
+ "grad_norm": 1.6160179376602173,
+ "learning_rate": 1.3242704945970541e-06,
+ "loss": 0.0201,
+ "step": 30802
+ },
+ {
+ "epoch": 83.93188010899182,
+ "grad_norm": 3.291584014892578,
+ "learning_rate": 1.3238316550272767e-06,
+ "loss": 0.0403,
+ "step": 30803
+ },
+ {
+ "epoch": 83.93460490463215,
+ "grad_norm": 3.426374673843384,
+ "learning_rate": 1.323392883027218e-06,
+ "loss": 0.0413,
+ "step": 30804
+ },
+ {
+ "epoch": 83.93732970027249,
+ "grad_norm": 4.177335262298584,
+ "learning_rate": 1.3229541786002987e-06,
+ "loss": 0.0972,
+ "step": 30805
+ },
+ {
+ "epoch": 83.9400544959128,
+ "grad_norm": 3.023916006088257,
+ "learning_rate": 1.3225155417499325e-06,
+ "loss": 0.1318,
+ "step": 30806
+ },
+ {
+ "epoch": 83.94277929155314,
+ "grad_norm": 2.683013916015625,
+ "learning_rate": 1.3220769724795334e-06,
+ "loss": 0.0687,
+ "step": 30807
+ },
+ {
+ "epoch": 83.94550408719346,
+ "grad_norm": 3.029341697692871,
+ "learning_rate": 1.32163847079252e-06,
+ "loss": 0.1477,
+ "step": 30808
+ },
+ {
+ "epoch": 83.94822888283379,
+ "grad_norm": 2.1001205444335938,
+ "learning_rate": 1.3212000366923095e-06,
+ "loss": 0.0492,
+ "step": 30809
+ },
+ {
+ "epoch": 83.95095367847412,
+ "grad_norm": 1.5391870737075806,
+ "learning_rate": 1.3207616701823135e-06,
+ "loss": 0.0199,
+ "step": 30810
+ },
+ {
+ "epoch": 83.95367847411444,
+ "grad_norm": 2.2881364822387695,
+ "learning_rate": 1.3203233712659457e-06,
+ "loss": 0.0889,
+ "step": 30811
+ },
+ {
+ "epoch": 83.95640326975477,
+ "grad_norm": 3.243116855621338,
+ "learning_rate": 1.3198851399466184e-06,
+ "loss": 0.0865,
+ "step": 30812
+ },
+ {
+ "epoch": 83.95912806539509,
+ "grad_norm": 3.009913206100464,
+ "learning_rate": 1.3194469762277485e-06,
+ "loss": 0.0822,
+ "step": 30813
+ },
+ {
+ "epoch": 83.96185286103542,
+ "grad_norm": 4.149927616119385,
+ "learning_rate": 1.3190088801127454e-06,
+ "loss": 0.0555,
+ "step": 30814
+ },
+ {
+ "epoch": 83.96457765667574,
+ "grad_norm": 1.8183202743530273,
+ "learning_rate": 1.3185708516050233e-06,
+ "loss": 0.025,
+ "step": 30815
+ },
+ {
+ "epoch": 83.96730245231608,
+ "grad_norm": 2.282015800476074,
+ "learning_rate": 1.3181328907079883e-06,
+ "loss": 0.0359,
+ "step": 30816
+ },
+ {
+ "epoch": 83.97002724795641,
+ "grad_norm": 1.651680827140808,
+ "learning_rate": 1.3176949974250575e-06,
+ "loss": 0.0199,
+ "step": 30817
+ },
+ {
+ "epoch": 83.97275204359673,
+ "grad_norm": 3.44093656539917,
+ "learning_rate": 1.3172571717596393e-06,
+ "loss": 0.0732,
+ "step": 30818
+ },
+ {
+ "epoch": 83.97547683923706,
+ "grad_norm": 2.1605823040008545,
+ "learning_rate": 1.3168194137151423e-06,
+ "loss": 0.026,
+ "step": 30819
+ },
+ {
+ "epoch": 83.97820163487738,
+ "grad_norm": 2.1238672733306885,
+ "learning_rate": 1.3163817232949738e-06,
+ "loss": 0.0295,
+ "step": 30820
+ },
+ {
+ "epoch": 83.98092643051771,
+ "grad_norm": 2.07331919670105,
+ "learning_rate": 1.3159441005025475e-06,
+ "loss": 0.0894,
+ "step": 30821
+ },
+ {
+ "epoch": 83.98365122615803,
+ "grad_norm": 3.058595895767212,
+ "learning_rate": 1.3155065453412696e-06,
+ "loss": 0.1239,
+ "step": 30822
+ },
+ {
+ "epoch": 83.98637602179836,
+ "grad_norm": 5.056929588317871,
+ "learning_rate": 1.3150690578145465e-06,
+ "loss": 0.1538,
+ "step": 30823
+ },
+ {
+ "epoch": 83.9891008174387,
+ "grad_norm": 1.865096092224121,
+ "learning_rate": 1.314631637925784e-06,
+ "loss": 0.0318,
+ "step": 30824
+ },
+ {
+ "epoch": 83.99182561307902,
+ "grad_norm": 2.403432607650757,
+ "learning_rate": 1.3141942856783908e-06,
+ "loss": 0.052,
+ "step": 30825
+ },
+ {
+ "epoch": 83.99455040871935,
+ "grad_norm": 2.6325230598449707,
+ "learning_rate": 1.313757001075775e-06,
+ "loss": 0.1049,
+ "step": 30826
+ },
+ {
+ "epoch": 83.99727520435967,
+ "grad_norm": 1.7367075681686401,
+ "learning_rate": 1.3133197841213396e-06,
+ "loss": 0.1423,
+ "step": 30827
+ },
+ {
+ "epoch": 84.0,
+ "grad_norm": 2.738262414932251,
+ "learning_rate": 1.3128826348184886e-06,
+ "loss": 0.0675,
+ "step": 30828
+ },
+ {
+ "epoch": 84.00272479564033,
+ "grad_norm": 2.9976625442504883,
+ "learning_rate": 1.3124455531706304e-06,
+ "loss": 0.075,
+ "step": 30829
+ },
+ {
+ "epoch": 84.00544959128065,
+ "grad_norm": 11.635932922363281,
+ "learning_rate": 1.3120085391811666e-06,
+ "loss": 0.0366,
+ "step": 30830
+ },
+ {
+ "epoch": 84.00817438692098,
+ "grad_norm": 2.359337568283081,
+ "learning_rate": 1.3115715928535e-06,
+ "loss": 0.025,
+ "step": 30831
+ },
+ {
+ "epoch": 84.0108991825613,
+ "grad_norm": 1.7224256992340088,
+ "learning_rate": 1.3111347141910324e-06,
+ "loss": 0.0272,
+ "step": 30832
+ },
+ {
+ "epoch": 84.01362397820164,
+ "grad_norm": 2.0104165077209473,
+ "learning_rate": 1.3106979031971701e-06,
+ "loss": 0.0425,
+ "step": 30833
+ },
+ {
+ "epoch": 84.01634877384195,
+ "grad_norm": 3.3771467208862305,
+ "learning_rate": 1.3102611598753135e-06,
+ "loss": 0.1773,
+ "step": 30834
+ },
+ {
+ "epoch": 84.01907356948229,
+ "grad_norm": 2.174729108810425,
+ "learning_rate": 1.3098244842288622e-06,
+ "loss": 0.0293,
+ "step": 30835
+ },
+ {
+ "epoch": 84.02179836512262,
+ "grad_norm": 3.263211965560913,
+ "learning_rate": 1.3093878762612167e-06,
+ "loss": 0.0771,
+ "step": 30836
+ },
+ {
+ "epoch": 84.02452316076294,
+ "grad_norm": 2.6361441612243652,
+ "learning_rate": 1.308951335975781e-06,
+ "loss": 0.0822,
+ "step": 30837
+ },
+ {
+ "epoch": 84.02724795640327,
+ "grad_norm": 4.018730640411377,
+ "learning_rate": 1.3085148633759525e-06,
+ "loss": 0.1253,
+ "step": 30838
+ },
+ {
+ "epoch": 84.02997275204359,
+ "grad_norm": 2.339142084121704,
+ "learning_rate": 1.3080784584651308e-06,
+ "loss": 0.0258,
+ "step": 30839
+ },
+ {
+ "epoch": 84.03269754768392,
+ "grad_norm": 2.0447726249694824,
+ "learning_rate": 1.3076421212467117e-06,
+ "loss": 0.0882,
+ "step": 30840
+ },
+ {
+ "epoch": 84.03542234332426,
+ "grad_norm": 2.7352120876312256,
+ "learning_rate": 1.307205851724097e-06,
+ "loss": 0.0681,
+ "step": 30841
+ },
+ {
+ "epoch": 84.03814713896458,
+ "grad_norm": 2.458771228790283,
+ "learning_rate": 1.3067696499006832e-06,
+ "loss": 0.0378,
+ "step": 30842
+ },
+ {
+ "epoch": 84.04087193460491,
+ "grad_norm": 2.5709726810455322,
+ "learning_rate": 1.3063335157798685e-06,
+ "loss": 0.0618,
+ "step": 30843
+ },
+ {
+ "epoch": 84.04359673024523,
+ "grad_norm": 3.4718542098999023,
+ "learning_rate": 1.305897449365049e-06,
+ "loss": 0.0762,
+ "step": 30844
+ },
+ {
+ "epoch": 84.04632152588556,
+ "grad_norm": 2.1422181129455566,
+ "learning_rate": 1.3054614506596186e-06,
+ "loss": 0.0276,
+ "step": 30845
+ },
+ {
+ "epoch": 84.04904632152588,
+ "grad_norm": 1.9626917839050293,
+ "learning_rate": 1.305025519666976e-06,
+ "loss": 0.0225,
+ "step": 30846
+ },
+ {
+ "epoch": 84.05177111716621,
+ "grad_norm": 2.641353130340576,
+ "learning_rate": 1.3045896563905147e-06,
+ "loss": 0.1121,
+ "step": 30847
+ },
+ {
+ "epoch": 84.05449591280654,
+ "grad_norm": 3.349381923675537,
+ "learning_rate": 1.3041538608336279e-06,
+ "loss": 0.0983,
+ "step": 30848
+ },
+ {
+ "epoch": 84.05722070844686,
+ "grad_norm": 9.3013334274292,
+ "learning_rate": 1.3037181329997128e-06,
+ "loss": 0.1697,
+ "step": 30849
+ },
+ {
+ "epoch": 84.0599455040872,
+ "grad_norm": 2.1191818714141846,
+ "learning_rate": 1.3032824728921612e-06,
+ "loss": 0.0515,
+ "step": 30850
+ },
+ {
+ "epoch": 84.06267029972751,
+ "grad_norm": 2.3567941188812256,
+ "learning_rate": 1.3028468805143657e-06,
+ "loss": 0.075,
+ "step": 30851
+ },
+ {
+ "epoch": 84.06539509536785,
+ "grad_norm": 4.8907928466796875,
+ "learning_rate": 1.302411355869716e-06,
+ "loss": 0.0441,
+ "step": 30852
+ },
+ {
+ "epoch": 84.06811989100818,
+ "grad_norm": 4.172059059143066,
+ "learning_rate": 1.3019758989616094e-06,
+ "loss": 0.1561,
+ "step": 30853
+ },
+ {
+ "epoch": 84.0708446866485,
+ "grad_norm": 2.6362855434417725,
+ "learning_rate": 1.3015405097934342e-06,
+ "loss": 0.0486,
+ "step": 30854
+ },
+ {
+ "epoch": 84.07356948228883,
+ "grad_norm": 2.9769845008850098,
+ "learning_rate": 1.301105188368582e-06,
+ "loss": 0.0565,
+ "step": 30855
+ },
+ {
+ "epoch": 84.07629427792915,
+ "grad_norm": 3.011777639389038,
+ "learning_rate": 1.3006699346904406e-06,
+ "loss": 0.074,
+ "step": 30856
+ },
+ {
+ "epoch": 84.07901907356948,
+ "grad_norm": 3.191282272338867,
+ "learning_rate": 1.3002347487624035e-06,
+ "loss": 0.146,
+ "step": 30857
+ },
+ {
+ "epoch": 84.0817438692098,
+ "grad_norm": 2.3934123516082764,
+ "learning_rate": 1.299799630587858e-06,
+ "loss": 0.0353,
+ "step": 30858
+ },
+ {
+ "epoch": 84.08446866485014,
+ "grad_norm": 2.757439374923706,
+ "learning_rate": 1.2993645801701914e-06,
+ "loss": 0.0457,
+ "step": 30859
+ },
+ {
+ "epoch": 84.08719346049047,
+ "grad_norm": 2.566817283630371,
+ "learning_rate": 1.2989295975127957e-06,
+ "loss": 0.0434,
+ "step": 30860
+ },
+ {
+ "epoch": 84.08991825613079,
+ "grad_norm": 2.684659481048584,
+ "learning_rate": 1.2984946826190537e-06,
+ "loss": 0.0312,
+ "step": 30861
+ },
+ {
+ "epoch": 84.09264305177112,
+ "grad_norm": 2.3274450302124023,
+ "learning_rate": 1.2980598354923567e-06,
+ "loss": 0.124,
+ "step": 30862
+ },
+ {
+ "epoch": 84.09536784741144,
+ "grad_norm": 1.5184946060180664,
+ "learning_rate": 1.2976250561360904e-06,
+ "loss": 0.0163,
+ "step": 30863
+ },
+ {
+ "epoch": 84.09809264305177,
+ "grad_norm": 4.458086013793945,
+ "learning_rate": 1.2971903445536393e-06,
+ "loss": 0.0395,
+ "step": 30864
+ },
+ {
+ "epoch": 84.1008174386921,
+ "grad_norm": 3.278067111968994,
+ "learning_rate": 1.2967557007483888e-06,
+ "loss": 0.0714,
+ "step": 30865
+ },
+ {
+ "epoch": 84.10354223433242,
+ "grad_norm": 6.933575630187988,
+ "learning_rate": 1.296321124723726e-06,
+ "loss": 0.1478,
+ "step": 30866
+ },
+ {
+ "epoch": 84.10626702997276,
+ "grad_norm": 1.8300024271011353,
+ "learning_rate": 1.2958866164830342e-06,
+ "loss": 0.0407,
+ "step": 30867
+ },
+ {
+ "epoch": 84.10899182561307,
+ "grad_norm": 1.7332144975662231,
+ "learning_rate": 1.295452176029698e-06,
+ "loss": 0.026,
+ "step": 30868
+ },
+ {
+ "epoch": 84.11171662125341,
+ "grad_norm": 2.7168946266174316,
+ "learning_rate": 1.2950178033670969e-06,
+ "loss": 0.0295,
+ "step": 30869
+ },
+ {
+ "epoch": 84.11444141689373,
+ "grad_norm": 3.1485800743103027,
+ "learning_rate": 1.2945834984986194e-06,
+ "loss": 0.0709,
+ "step": 30870
+ },
+ {
+ "epoch": 84.11716621253406,
+ "grad_norm": 2.4771053791046143,
+ "learning_rate": 1.2941492614276463e-06,
+ "loss": 0.0236,
+ "step": 30871
+ },
+ {
+ "epoch": 84.11989100817439,
+ "grad_norm": 2.1699888706207275,
+ "learning_rate": 1.2937150921575548e-06,
+ "loss": 0.0328,
+ "step": 30872
+ },
+ {
+ "epoch": 84.12261580381471,
+ "grad_norm": 2.5949923992156982,
+ "learning_rate": 1.293280990691733e-06,
+ "loss": 0.0341,
+ "step": 30873
+ },
+ {
+ "epoch": 84.12534059945504,
+ "grad_norm": 4.152580261230469,
+ "learning_rate": 1.292846957033559e-06,
+ "loss": 0.0759,
+ "step": 30874
+ },
+ {
+ "epoch": 84.12806539509536,
+ "grad_norm": 1.6484575271606445,
+ "learning_rate": 1.2924129911864126e-06,
+ "loss": 0.02,
+ "step": 30875
+ },
+ {
+ "epoch": 84.1307901907357,
+ "grad_norm": 8.59929084777832,
+ "learning_rate": 1.2919790931536714e-06,
+ "loss": 0.1513,
+ "step": 30876
+ },
+ {
+ "epoch": 84.13351498637603,
+ "grad_norm": 2.347327709197998,
+ "learning_rate": 1.291545262938716e-06,
+ "loss": 0.0391,
+ "step": 30877
+ },
+ {
+ "epoch": 84.13623978201635,
+ "grad_norm": 2.467940330505371,
+ "learning_rate": 1.291111500544928e-06,
+ "loss": 0.1548,
+ "step": 30878
+ },
+ {
+ "epoch": 84.13896457765668,
+ "grad_norm": 3.4825150966644287,
+ "learning_rate": 1.2906778059756842e-06,
+ "loss": 0.107,
+ "step": 30879
+ },
+ {
+ "epoch": 84.141689373297,
+ "grad_norm": 2.71108078956604,
+ "learning_rate": 1.2902441792343611e-06,
+ "loss": 0.0523,
+ "step": 30880
+ },
+ {
+ "epoch": 84.14441416893733,
+ "grad_norm": 3.5202860832214355,
+ "learning_rate": 1.2898106203243343e-06,
+ "loss": 0.1405,
+ "step": 30881
+ },
+ {
+ "epoch": 84.14713896457765,
+ "grad_norm": 2.7637648582458496,
+ "learning_rate": 1.2893771292489833e-06,
+ "loss": 0.1779,
+ "step": 30882
+ },
+ {
+ "epoch": 84.14986376021798,
+ "grad_norm": 2.0411412715911865,
+ "learning_rate": 1.2889437060116827e-06,
+ "loss": 0.0222,
+ "step": 30883
+ },
+ {
+ "epoch": 84.15258855585832,
+ "grad_norm": 2.349391222000122,
+ "learning_rate": 1.2885103506158091e-06,
+ "loss": 0.0362,
+ "step": 30884
+ },
+ {
+ "epoch": 84.15531335149863,
+ "grad_norm": 2.401488780975342,
+ "learning_rate": 1.2880770630647344e-06,
+ "loss": 0.0329,
+ "step": 30885
+ },
+ {
+ "epoch": 84.15803814713897,
+ "grad_norm": 3.2894418239593506,
+ "learning_rate": 1.2876438433618365e-06,
+ "loss": 0.0998,
+ "step": 30886
+ },
+ {
+ "epoch": 84.16076294277929,
+ "grad_norm": 3.3366899490356445,
+ "learning_rate": 1.2872106915104876e-06,
+ "loss": 0.1908,
+ "step": 30887
+ },
+ {
+ "epoch": 84.16348773841962,
+ "grad_norm": 2.944432497024536,
+ "learning_rate": 1.2867776075140625e-06,
+ "loss": 0.0735,
+ "step": 30888
+ },
+ {
+ "epoch": 84.16621253405995,
+ "grad_norm": 4.728024482727051,
+ "learning_rate": 1.2863445913759299e-06,
+ "loss": 0.0296,
+ "step": 30889
+ },
+ {
+ "epoch": 84.16893732970027,
+ "grad_norm": 2.4820241928100586,
+ "learning_rate": 1.2859116430994677e-06,
+ "loss": 0.0621,
+ "step": 30890
+ },
+ {
+ "epoch": 84.1716621253406,
+ "grad_norm": 1.9522933959960938,
+ "learning_rate": 1.285478762688046e-06,
+ "loss": 0.0211,
+ "step": 30891
+ },
+ {
+ "epoch": 84.17438692098092,
+ "grad_norm": 2.085561513900757,
+ "learning_rate": 1.285045950145032e-06,
+ "loss": 0.0729,
+ "step": 30892
+ },
+ {
+ "epoch": 84.17711171662125,
+ "grad_norm": 3.332383394241333,
+ "learning_rate": 1.2846132054738026e-06,
+ "loss": 0.0444,
+ "step": 30893
+ },
+ {
+ "epoch": 84.17983651226157,
+ "grad_norm": 2.9827792644500732,
+ "learning_rate": 1.284180528677722e-06,
+ "loss": 0.0545,
+ "step": 30894
+ },
+ {
+ "epoch": 84.1825613079019,
+ "grad_norm": 4.191866874694824,
+ "learning_rate": 1.2837479197601654e-06,
+ "loss": 0.0446,
+ "step": 30895
+ },
+ {
+ "epoch": 84.18528610354224,
+ "grad_norm": 3.2883105278015137,
+ "learning_rate": 1.2833153787245e-06,
+ "loss": 0.0655,
+ "step": 30896
+ },
+ {
+ "epoch": 84.18801089918256,
+ "grad_norm": 4.032162666320801,
+ "learning_rate": 1.282882905574091e-06,
+ "loss": 0.0128,
+ "step": 30897
+ },
+ {
+ "epoch": 84.19073569482289,
+ "grad_norm": 3.0079433917999268,
+ "learning_rate": 1.2824505003123123e-06,
+ "loss": 0.0341,
+ "step": 30898
+ },
+ {
+ "epoch": 84.19346049046321,
+ "grad_norm": 2.4322404861450195,
+ "learning_rate": 1.2820181629425276e-06,
+ "loss": 0.0564,
+ "step": 30899
+ },
+ {
+ "epoch": 84.19618528610354,
+ "grad_norm": 4.670801162719727,
+ "learning_rate": 1.2815858934681059e-06,
+ "loss": 0.0239,
+ "step": 30900
+ },
+ {
+ "epoch": 84.19891008174388,
+ "grad_norm": 2.6506736278533936,
+ "learning_rate": 1.2811536918924095e-06,
+ "loss": 0.044,
+ "step": 30901
+ },
+ {
+ "epoch": 84.2016348773842,
+ "grad_norm": 2.5493180751800537,
+ "learning_rate": 1.2807215582188104e-06,
+ "loss": 0.1176,
+ "step": 30902
+ },
+ {
+ "epoch": 84.20435967302453,
+ "grad_norm": 2.146432638168335,
+ "learning_rate": 1.2802894924506703e-06,
+ "loss": 0.0423,
+ "step": 30903
+ },
+ {
+ "epoch": 84.20708446866485,
+ "grad_norm": 2.18966007232666,
+ "learning_rate": 1.2798574945913556e-06,
+ "loss": 0.0201,
+ "step": 30904
+ },
+ {
+ "epoch": 84.20980926430518,
+ "grad_norm": 3.3071603775024414,
+ "learning_rate": 1.2794255646442278e-06,
+ "loss": 0.0583,
+ "step": 30905
+ },
+ {
+ "epoch": 84.2125340599455,
+ "grad_norm": 3.4619028568267822,
+ "learning_rate": 1.2789937026126553e-06,
+ "loss": 0.1473,
+ "step": 30906
+ },
+ {
+ "epoch": 84.21525885558583,
+ "grad_norm": 2.6102943420410156,
+ "learning_rate": 1.278561908499999e-06,
+ "loss": 0.0339,
+ "step": 30907
+ },
+ {
+ "epoch": 84.21798365122616,
+ "grad_norm": 2.582096815109253,
+ "learning_rate": 1.2781301823096226e-06,
+ "loss": 0.066,
+ "step": 30908
+ },
+ {
+ "epoch": 84.22070844686648,
+ "grad_norm": 2.0452327728271484,
+ "learning_rate": 1.2776985240448847e-06,
+ "loss": 0.0834,
+ "step": 30909
+ },
+ {
+ "epoch": 84.22343324250681,
+ "grad_norm": 1.526092767715454,
+ "learning_rate": 1.2772669337091525e-06,
+ "loss": 0.0232,
+ "step": 30910
+ },
+ {
+ "epoch": 84.22615803814713,
+ "grad_norm": 2.2443490028381348,
+ "learning_rate": 1.2768354113057823e-06,
+ "loss": 0.1376,
+ "step": 30911
+ },
+ {
+ "epoch": 84.22888283378747,
+ "grad_norm": 3.8927268981933594,
+ "learning_rate": 1.2764039568381392e-06,
+ "loss": 0.1478,
+ "step": 30912
+ },
+ {
+ "epoch": 84.2316076294278,
+ "grad_norm": 2.086414098739624,
+ "learning_rate": 1.2759725703095793e-06,
+ "loss": 0.0336,
+ "step": 30913
+ },
+ {
+ "epoch": 84.23433242506812,
+ "grad_norm": 2.4165940284729004,
+ "learning_rate": 1.2755412517234667e-06,
+ "loss": 0.0211,
+ "step": 30914
+ },
+ {
+ "epoch": 84.23705722070845,
+ "grad_norm": 2.5106959342956543,
+ "learning_rate": 1.2751100010831575e-06,
+ "loss": 0.1234,
+ "step": 30915
+ },
+ {
+ "epoch": 84.23978201634877,
+ "grad_norm": 1.790252923965454,
+ "learning_rate": 1.2746788183920112e-06,
+ "loss": 0.0216,
+ "step": 30916
+ },
+ {
+ "epoch": 84.2425068119891,
+ "grad_norm": 2.535311222076416,
+ "learning_rate": 1.274247703653383e-06,
+ "loss": 0.0208,
+ "step": 30917
+ },
+ {
+ "epoch": 84.24523160762942,
+ "grad_norm": 1.900929570198059,
+ "learning_rate": 1.2738166568706345e-06,
+ "loss": 0.0211,
+ "step": 30918
+ },
+ {
+ "epoch": 84.24795640326975,
+ "grad_norm": 2.733259439468384,
+ "learning_rate": 1.273385678047122e-06,
+ "loss": 0.0845,
+ "step": 30919
+ },
+ {
+ "epoch": 84.25068119891009,
+ "grad_norm": 2.1603260040283203,
+ "learning_rate": 1.2729547671862008e-06,
+ "loss": 0.0251,
+ "step": 30920
+ },
+ {
+ "epoch": 84.2534059945504,
+ "grad_norm": 2.6811716556549072,
+ "learning_rate": 1.2725239242912246e-06,
+ "loss": 0.0393,
+ "step": 30921
+ },
+ {
+ "epoch": 84.25613079019074,
+ "grad_norm": 1.8573046922683716,
+ "learning_rate": 1.272093149365553e-06,
+ "loss": 0.0291,
+ "step": 30922
+ },
+ {
+ "epoch": 84.25885558583106,
+ "grad_norm": 1.8902552127838135,
+ "learning_rate": 1.2716624424125402e-06,
+ "loss": 0.0342,
+ "step": 30923
+ },
+ {
+ "epoch": 84.26158038147139,
+ "grad_norm": 3.814934492111206,
+ "learning_rate": 1.2712318034355387e-06,
+ "loss": 0.0434,
+ "step": 30924
+ },
+ {
+ "epoch": 84.26430517711172,
+ "grad_norm": 2.337177276611328,
+ "learning_rate": 1.2708012324379004e-06,
+ "loss": 0.0277,
+ "step": 30925
+ },
+ {
+ "epoch": 84.26702997275204,
+ "grad_norm": 3.1108927726745605,
+ "learning_rate": 1.2703707294229839e-06,
+ "loss": 0.1517,
+ "step": 30926
+ },
+ {
+ "epoch": 84.26975476839237,
+ "grad_norm": 2.411223888397217,
+ "learning_rate": 1.2699402943941386e-06,
+ "loss": 0.0433,
+ "step": 30927
+ },
+ {
+ "epoch": 84.2724795640327,
+ "grad_norm": 2.898160457611084,
+ "learning_rate": 1.2695099273547152e-06,
+ "loss": 0.0975,
+ "step": 30928
+ },
+ {
+ "epoch": 84.27520435967303,
+ "grad_norm": 2.993513584136963,
+ "learning_rate": 1.2690796283080698e-06,
+ "loss": 0.0949,
+ "step": 30929
+ },
+ {
+ "epoch": 84.27792915531334,
+ "grad_norm": 2.257850408554077,
+ "learning_rate": 1.2686493972575498e-06,
+ "loss": 0.0277,
+ "step": 30930
+ },
+ {
+ "epoch": 84.28065395095368,
+ "grad_norm": 2.626110315322876,
+ "learning_rate": 1.2682192342065093e-06,
+ "loss": 0.0405,
+ "step": 30931
+ },
+ {
+ "epoch": 84.28337874659401,
+ "grad_norm": 3.5695180892944336,
+ "learning_rate": 1.2677891391582953e-06,
+ "loss": 0.0306,
+ "step": 30932
+ },
+ {
+ "epoch": 84.28610354223433,
+ "grad_norm": 2.670917272567749,
+ "learning_rate": 1.2673591121162577e-06,
+ "loss": 0.0439,
+ "step": 30933
+ },
+ {
+ "epoch": 84.28882833787466,
+ "grad_norm": 3.586989641189575,
+ "learning_rate": 1.2669291530837469e-06,
+ "loss": 0.0845,
+ "step": 30934
+ },
+ {
+ "epoch": 84.29155313351498,
+ "grad_norm": 2.1815574169158936,
+ "learning_rate": 1.2664992620641114e-06,
+ "loss": 0.0437,
+ "step": 30935
+ },
+ {
+ "epoch": 84.29427792915531,
+ "grad_norm": 2.8163528442382812,
+ "learning_rate": 1.2660694390606986e-06,
+ "loss": 0.0634,
+ "step": 30936
+ },
+ {
+ "epoch": 84.29700272479565,
+ "grad_norm": 2.318514108657837,
+ "learning_rate": 1.2656396840768549e-06,
+ "loss": 0.0394,
+ "step": 30937
+ },
+ {
+ "epoch": 84.29972752043597,
+ "grad_norm": 4.409590244293213,
+ "learning_rate": 1.2652099971159293e-06,
+ "loss": 0.0283,
+ "step": 30938
+ },
+ {
+ "epoch": 84.3024523160763,
+ "grad_norm": 1.8094323873519897,
+ "learning_rate": 1.2647803781812673e-06,
+ "loss": 0.0297,
+ "step": 30939
+ },
+ {
+ "epoch": 84.30517711171662,
+ "grad_norm": 24.27855682373047,
+ "learning_rate": 1.264350827276214e-06,
+ "loss": 0.0663,
+ "step": 30940
+ },
+ {
+ "epoch": 84.30790190735695,
+ "grad_norm": 2.4616377353668213,
+ "learning_rate": 1.2639213444041133e-06,
+ "loss": 0.1532,
+ "step": 30941
+ },
+ {
+ "epoch": 84.31062670299727,
+ "grad_norm": 1.8487862348556519,
+ "learning_rate": 1.2634919295683145e-06,
+ "loss": 0.0305,
+ "step": 30942
+ },
+ {
+ "epoch": 84.3133514986376,
+ "grad_norm": 2.1329538822174072,
+ "learning_rate": 1.26306258277216e-06,
+ "loss": 0.0241,
+ "step": 30943
+ },
+ {
+ "epoch": 84.31607629427793,
+ "grad_norm": 2.2670230865478516,
+ "learning_rate": 1.262633304018992e-06,
+ "loss": 0.089,
+ "step": 30944
+ },
+ {
+ "epoch": 84.31880108991825,
+ "grad_norm": 2.1846530437469482,
+ "learning_rate": 1.2622040933121527e-06,
+ "loss": 0.0602,
+ "step": 30945
+ },
+ {
+ "epoch": 84.32152588555859,
+ "grad_norm": 2.693756341934204,
+ "learning_rate": 1.261774950654986e-06,
+ "loss": 0.0292,
+ "step": 30946
+ },
+ {
+ "epoch": 84.3242506811989,
+ "grad_norm": 3.18593168258667,
+ "learning_rate": 1.261345876050838e-06,
+ "loss": 0.0283,
+ "step": 30947
+ },
+ {
+ "epoch": 84.32697547683924,
+ "grad_norm": 2.7687511444091797,
+ "learning_rate": 1.2609168695030471e-06,
+ "loss": 0.0807,
+ "step": 30948
+ },
+ {
+ "epoch": 84.32970027247957,
+ "grad_norm": 3.2963898181915283,
+ "learning_rate": 1.260487931014953e-06,
+ "loss": 0.0496,
+ "step": 30949
+ },
+ {
+ "epoch": 84.33242506811989,
+ "grad_norm": 2.9117414951324463,
+ "learning_rate": 1.2600590605898966e-06,
+ "loss": 0.0457,
+ "step": 30950
+ },
+ {
+ "epoch": 84.33514986376022,
+ "grad_norm": 3.7882585525512695,
+ "learning_rate": 1.2596302582312214e-06,
+ "loss": 0.1302,
+ "step": 30951
+ },
+ {
+ "epoch": 84.33787465940054,
+ "grad_norm": 2.384852647781372,
+ "learning_rate": 1.2592015239422639e-06,
+ "loss": 0.04,
+ "step": 30952
+ },
+ {
+ "epoch": 84.34059945504087,
+ "grad_norm": 1.8089810609817505,
+ "learning_rate": 1.2587728577263636e-06,
+ "loss": 0.1188,
+ "step": 30953
+ },
+ {
+ "epoch": 84.34332425068119,
+ "grad_norm": 2.1156163215637207,
+ "learning_rate": 1.2583442595868566e-06,
+ "loss": 0.0431,
+ "step": 30954
+ },
+ {
+ "epoch": 84.34604904632153,
+ "grad_norm": 3.846061944961548,
+ "learning_rate": 1.257915729527085e-06,
+ "loss": 0.0419,
+ "step": 30955
+ },
+ {
+ "epoch": 84.34877384196186,
+ "grad_norm": 3.296739101409912,
+ "learning_rate": 1.2574872675503858e-06,
+ "loss": 0.082,
+ "step": 30956
+ },
+ {
+ "epoch": 84.35149863760218,
+ "grad_norm": 2.082808256149292,
+ "learning_rate": 1.2570588736600909e-06,
+ "loss": 0.0252,
+ "step": 30957
+ },
+ {
+ "epoch": 84.35422343324251,
+ "grad_norm": 5.212313652038574,
+ "learning_rate": 1.2566305478595431e-06,
+ "loss": 0.1072,
+ "step": 30958
+ },
+ {
+ "epoch": 84.35694822888283,
+ "grad_norm": 2.4390437602996826,
+ "learning_rate": 1.2562022901520744e-06,
+ "loss": 0.0641,
+ "step": 30959
+ },
+ {
+ "epoch": 84.35967302452316,
+ "grad_norm": 1.88674795627594,
+ "learning_rate": 1.2557741005410207e-06,
+ "loss": 0.0216,
+ "step": 30960
+ },
+ {
+ "epoch": 84.3623978201635,
+ "grad_norm": 2.0010910034179688,
+ "learning_rate": 1.255345979029715e-06,
+ "loss": 0.0391,
+ "step": 30961
+ },
+ {
+ "epoch": 84.36512261580381,
+ "grad_norm": 2.3853631019592285,
+ "learning_rate": 1.2549179256214939e-06,
+ "loss": 0.0546,
+ "step": 30962
+ },
+ {
+ "epoch": 84.36784741144415,
+ "grad_norm": 1.9459019899368286,
+ "learning_rate": 1.254489940319692e-06,
+ "loss": 0.0306,
+ "step": 30963
+ },
+ {
+ "epoch": 84.37057220708446,
+ "grad_norm": 1.6892529726028442,
+ "learning_rate": 1.2540620231276423e-06,
+ "loss": 0.0265,
+ "step": 30964
+ },
+ {
+ "epoch": 84.3732970027248,
+ "grad_norm": 3.0371382236480713,
+ "learning_rate": 1.2536341740486746e-06,
+ "loss": 0.2409,
+ "step": 30965
+ },
+ {
+ "epoch": 84.37602179836512,
+ "grad_norm": 2.210012912750244,
+ "learning_rate": 1.2532063930861205e-06,
+ "loss": 0.0375,
+ "step": 30966
+ },
+ {
+ "epoch": 84.37874659400545,
+ "grad_norm": 3.261143207550049,
+ "learning_rate": 1.2527786802433162e-06,
+ "loss": 0.1751,
+ "step": 30967
+ },
+ {
+ "epoch": 84.38147138964578,
+ "grad_norm": 5.779815673828125,
+ "learning_rate": 1.2523510355235902e-06,
+ "loss": 0.0497,
+ "step": 30968
+ },
+ {
+ "epoch": 84.3841961852861,
+ "grad_norm": 2.058689832687378,
+ "learning_rate": 1.251923458930272e-06,
+ "loss": 0.0815,
+ "step": 30969
+ },
+ {
+ "epoch": 84.38692098092643,
+ "grad_norm": 2.412895917892456,
+ "learning_rate": 1.25149595046669e-06,
+ "loss": 0.026,
+ "step": 30970
+ },
+ {
+ "epoch": 84.38964577656675,
+ "grad_norm": 2.345301389694214,
+ "learning_rate": 1.2510685101361797e-06,
+ "loss": 0.0925,
+ "step": 30971
+ },
+ {
+ "epoch": 84.39237057220708,
+ "grad_norm": 2.365218162536621,
+ "learning_rate": 1.2506411379420647e-06,
+ "loss": 0.0274,
+ "step": 30972
+ },
+ {
+ "epoch": 84.39509536784742,
+ "grad_norm": 4.25044059753418,
+ "learning_rate": 1.2502138338876757e-06,
+ "loss": 0.0877,
+ "step": 30973
+ },
+ {
+ "epoch": 84.39782016348774,
+ "grad_norm": 2.1025803089141846,
+ "learning_rate": 1.2497865979763368e-06,
+ "loss": 0.0357,
+ "step": 30974
+ },
+ {
+ "epoch": 84.40054495912807,
+ "grad_norm": 3.219825267791748,
+ "learning_rate": 1.249359430211381e-06,
+ "loss": 0.0613,
+ "step": 30975
+ },
+ {
+ "epoch": 84.40326975476839,
+ "grad_norm": 2.0448338985443115,
+ "learning_rate": 1.248932330596132e-06,
+ "loss": 0.026,
+ "step": 30976
+ },
+ {
+ "epoch": 84.40599455040872,
+ "grad_norm": 1.8425649404525757,
+ "learning_rate": 1.2485052991339174e-06,
+ "loss": 0.0208,
+ "step": 30977
+ },
+ {
+ "epoch": 84.40871934604904,
+ "grad_norm": 2.058178663253784,
+ "learning_rate": 1.248078335828059e-06,
+ "loss": 0.0329,
+ "step": 30978
+ },
+ {
+ "epoch": 84.41144414168937,
+ "grad_norm": 1.8262965679168701,
+ "learning_rate": 1.2476514406818863e-06,
+ "loss": 0.0309,
+ "step": 30979
+ },
+ {
+ "epoch": 84.4141689373297,
+ "grad_norm": 1.9117165803909302,
+ "learning_rate": 1.247224613698721e-06,
+ "loss": 0.0192,
+ "step": 30980
+ },
+ {
+ "epoch": 84.41689373297002,
+ "grad_norm": 2.8641581535339355,
+ "learning_rate": 1.2467978548818914e-06,
+ "loss": 0.1315,
+ "step": 30981
+ },
+ {
+ "epoch": 84.41961852861036,
+ "grad_norm": 2.1521008014678955,
+ "learning_rate": 1.2463711642347154e-06,
+ "loss": 0.1354,
+ "step": 30982
+ },
+ {
+ "epoch": 84.42234332425068,
+ "grad_norm": 2.883301258087158,
+ "learning_rate": 1.245944541760522e-06,
+ "loss": 0.0472,
+ "step": 30983
+ },
+ {
+ "epoch": 84.42506811989101,
+ "grad_norm": 2.296856641769409,
+ "learning_rate": 1.24551798746263e-06,
+ "loss": 0.0292,
+ "step": 30984
+ },
+ {
+ "epoch": 84.42779291553134,
+ "grad_norm": 2.1604671478271484,
+ "learning_rate": 1.245091501344362e-06,
+ "loss": 0.0354,
+ "step": 30985
+ },
+ {
+ "epoch": 84.43051771117166,
+ "grad_norm": 2.4055051803588867,
+ "learning_rate": 1.244665083409038e-06,
+ "loss": 0.0542,
+ "step": 30986
+ },
+ {
+ "epoch": 84.433242506812,
+ "grad_norm": 3.1053826808929443,
+ "learning_rate": 1.2442387336599825e-06,
+ "loss": 0.0252,
+ "step": 30987
+ },
+ {
+ "epoch": 84.43596730245231,
+ "grad_norm": 1.906609058380127,
+ "learning_rate": 1.2438124521005135e-06,
+ "loss": 0.0238,
+ "step": 30988
+ },
+ {
+ "epoch": 84.43869209809264,
+ "grad_norm": 2.015774965286255,
+ "learning_rate": 1.2433862387339524e-06,
+ "loss": 0.0274,
+ "step": 30989
+ },
+ {
+ "epoch": 84.44141689373296,
+ "grad_norm": 2.535973310470581,
+ "learning_rate": 1.2429600935636144e-06,
+ "loss": 0.0421,
+ "step": 30990
+ },
+ {
+ "epoch": 84.4441416893733,
+ "grad_norm": 2.4865448474884033,
+ "learning_rate": 1.2425340165928234e-06,
+ "loss": 0.0483,
+ "step": 30991
+ },
+ {
+ "epoch": 84.44686648501363,
+ "grad_norm": 1.868030071258545,
+ "learning_rate": 1.242108007824896e-06,
+ "loss": 0.0224,
+ "step": 30992
+ },
+ {
+ "epoch": 84.44959128065395,
+ "grad_norm": 3.9106252193450928,
+ "learning_rate": 1.2416820672631502e-06,
+ "loss": 0.0426,
+ "step": 30993
+ },
+ {
+ "epoch": 84.45231607629428,
+ "grad_norm": 1.4307934045791626,
+ "learning_rate": 1.2412561949108992e-06,
+ "loss": 0.123,
+ "step": 30994
+ },
+ {
+ "epoch": 84.4550408719346,
+ "grad_norm": 2.5642943382263184,
+ "learning_rate": 1.240830390771466e-06,
+ "loss": 0.0305,
+ "step": 30995
+ },
+ {
+ "epoch": 84.45776566757493,
+ "grad_norm": 1.859707236289978,
+ "learning_rate": 1.2404046548481641e-06,
+ "loss": 0.0277,
+ "step": 30996
+ },
+ {
+ "epoch": 84.46049046321527,
+ "grad_norm": 2.6319589614868164,
+ "learning_rate": 1.2399789871443057e-06,
+ "loss": 0.0896,
+ "step": 30997
+ },
+ {
+ "epoch": 84.46321525885558,
+ "grad_norm": 2.9149649143218994,
+ "learning_rate": 1.2395533876632094e-06,
+ "loss": 0.0246,
+ "step": 30998
+ },
+ {
+ "epoch": 84.46594005449592,
+ "grad_norm": 3.1326661109924316,
+ "learning_rate": 1.2391278564081921e-06,
+ "loss": 0.1539,
+ "step": 30999
+ },
+ {
+ "epoch": 84.46866485013624,
+ "grad_norm": 2.4415969848632812,
+ "learning_rate": 1.2387023933825637e-06,
+ "loss": 0.0405,
+ "step": 31000
+ },
+ {
+ "epoch": 84.47138964577657,
+ "grad_norm": 2.142533302307129,
+ "learning_rate": 1.2382769985896405e-06,
+ "loss": 0.0343,
+ "step": 31001
+ },
+ {
+ "epoch": 84.47411444141689,
+ "grad_norm": 3.939147472381592,
+ "learning_rate": 1.2378516720327315e-06,
+ "loss": 0.1234,
+ "step": 31002
+ },
+ {
+ "epoch": 84.47683923705722,
+ "grad_norm": 3.032827615737915,
+ "learning_rate": 1.2374264137151537e-06,
+ "loss": 0.0408,
+ "step": 31003
+ },
+ {
+ "epoch": 84.47956403269755,
+ "grad_norm": 2.321712017059326,
+ "learning_rate": 1.2370012236402162e-06,
+ "loss": 0.0873,
+ "step": 31004
+ },
+ {
+ "epoch": 84.48228882833787,
+ "grad_norm": 2.2680418491363525,
+ "learning_rate": 1.236576101811232e-06,
+ "loss": 0.0836,
+ "step": 31005
+ },
+ {
+ "epoch": 84.4850136239782,
+ "grad_norm": 2.3834011554718018,
+ "learning_rate": 1.2361510482315087e-06,
+ "loss": 0.2104,
+ "step": 31006
+ },
+ {
+ "epoch": 84.48773841961852,
+ "grad_norm": 2.9098286628723145,
+ "learning_rate": 1.235726062904361e-06,
+ "loss": 0.0476,
+ "step": 31007
+ },
+ {
+ "epoch": 84.49046321525886,
+ "grad_norm": 2.6561827659606934,
+ "learning_rate": 1.2353011458330976e-06,
+ "loss": 0.0657,
+ "step": 31008
+ },
+ {
+ "epoch": 84.49318801089919,
+ "grad_norm": 2.9487643241882324,
+ "learning_rate": 1.234876297021026e-06,
+ "loss": 0.0361,
+ "step": 31009
+ },
+ {
+ "epoch": 84.49591280653951,
+ "grad_norm": 2.6250460147857666,
+ "learning_rate": 1.2344515164714531e-06,
+ "loss": 0.0347,
+ "step": 31010
+ },
+ {
+ "epoch": 84.49863760217984,
+ "grad_norm": 2.3775174617767334,
+ "learning_rate": 1.2340268041876923e-06,
+ "loss": 0.0491,
+ "step": 31011
+ },
+ {
+ "epoch": 84.50136239782016,
+ "grad_norm": 1.9457837343215942,
+ "learning_rate": 1.2336021601730485e-06,
+ "loss": 0.0315,
+ "step": 31012
+ },
+ {
+ "epoch": 84.50408719346049,
+ "grad_norm": 2.286740779876709,
+ "learning_rate": 1.2331775844308292e-06,
+ "loss": 0.0429,
+ "step": 31013
+ },
+ {
+ "epoch": 84.50681198910081,
+ "grad_norm": 2.9992775917053223,
+ "learning_rate": 1.232753076964338e-06,
+ "loss": 0.0771,
+ "step": 31014
+ },
+ {
+ "epoch": 84.50953678474114,
+ "grad_norm": 2.1540305614471436,
+ "learning_rate": 1.2323286377768839e-06,
+ "loss": 0.0342,
+ "step": 31015
+ },
+ {
+ "epoch": 84.51226158038148,
+ "grad_norm": 2.3368608951568604,
+ "learning_rate": 1.231904266871775e-06,
+ "loss": 0.0284,
+ "step": 31016
+ },
+ {
+ "epoch": 84.5149863760218,
+ "grad_norm": 1.906496524810791,
+ "learning_rate": 1.2314799642523135e-06,
+ "loss": 0.0569,
+ "step": 31017
+ },
+ {
+ "epoch": 84.51771117166213,
+ "grad_norm": 4.40822696685791,
+ "learning_rate": 1.2310557299218029e-06,
+ "loss": 0.0353,
+ "step": 31018
+ },
+ {
+ "epoch": 84.52043596730245,
+ "grad_norm": 2.7115578651428223,
+ "learning_rate": 1.2306315638835464e-06,
+ "loss": 0.0661,
+ "step": 31019
+ },
+ {
+ "epoch": 84.52316076294278,
+ "grad_norm": 3.1134707927703857,
+ "learning_rate": 1.2302074661408502e-06,
+ "loss": 0.0421,
+ "step": 31020
+ },
+ {
+ "epoch": 84.52588555858311,
+ "grad_norm": 2.8423943519592285,
+ "learning_rate": 1.2297834366970174e-06,
+ "loss": 0.1245,
+ "step": 31021
+ },
+ {
+ "epoch": 84.52861035422343,
+ "grad_norm": 2.3413920402526855,
+ "learning_rate": 1.2293594755553462e-06,
+ "loss": 0.1918,
+ "step": 31022
+ },
+ {
+ "epoch": 84.53133514986376,
+ "grad_norm": 2.1077334880828857,
+ "learning_rate": 1.228935582719143e-06,
+ "loss": 0.0427,
+ "step": 31023
+ },
+ {
+ "epoch": 84.53405994550408,
+ "grad_norm": 2.3549013137817383,
+ "learning_rate": 1.2285117581917084e-06,
+ "loss": 0.098,
+ "step": 31024
+ },
+ {
+ "epoch": 84.53678474114442,
+ "grad_norm": 2.0314838886260986,
+ "learning_rate": 1.2280880019763407e-06,
+ "loss": 0.0216,
+ "step": 31025
+ },
+ {
+ "epoch": 84.53950953678473,
+ "grad_norm": 2.8202052116394043,
+ "learning_rate": 1.227664314076339e-06,
+ "loss": 0.079,
+ "step": 31026
+ },
+ {
+ "epoch": 84.54223433242507,
+ "grad_norm": 3.7878527641296387,
+ "learning_rate": 1.227240694495009e-06,
+ "loss": 0.0235,
+ "step": 31027
+ },
+ {
+ "epoch": 84.5449591280654,
+ "grad_norm": 6.113048076629639,
+ "learning_rate": 1.2268171432356447e-06,
+ "loss": 0.1633,
+ "step": 31028
+ },
+ {
+ "epoch": 84.54768392370572,
+ "grad_norm": 2.637174129486084,
+ "learning_rate": 1.2263936603015457e-06,
+ "loss": 0.06,
+ "step": 31029
+ },
+ {
+ "epoch": 84.55040871934605,
+ "grad_norm": 3.4079182147979736,
+ "learning_rate": 1.2259702456960099e-06,
+ "loss": 0.12,
+ "step": 31030
+ },
+ {
+ "epoch": 84.55313351498637,
+ "grad_norm": 2.9253225326538086,
+ "learning_rate": 1.2255468994223342e-06,
+ "loss": 0.1418,
+ "step": 31031
+ },
+ {
+ "epoch": 84.5558583106267,
+ "grad_norm": 2.9753916263580322,
+ "learning_rate": 1.225123621483819e-06,
+ "loss": 0.058,
+ "step": 31032
+ },
+ {
+ "epoch": 84.55858310626704,
+ "grad_norm": 2.4538822174072266,
+ "learning_rate": 1.2247004118837603e-06,
+ "loss": 0.1138,
+ "step": 31033
+ },
+ {
+ "epoch": 84.56130790190736,
+ "grad_norm": 2.228626251220703,
+ "learning_rate": 1.2242772706254502e-06,
+ "loss": 0.0296,
+ "step": 31034
+ },
+ {
+ "epoch": 84.56403269754769,
+ "grad_norm": 2.627859115600586,
+ "learning_rate": 1.2238541977121853e-06,
+ "loss": 0.1024,
+ "step": 31035
+ },
+ {
+ "epoch": 84.566757493188,
+ "grad_norm": 3.1097116470336914,
+ "learning_rate": 1.223431193147263e-06,
+ "loss": 0.188,
+ "step": 31036
+ },
+ {
+ "epoch": 84.56948228882834,
+ "grad_norm": 1.7681435346603394,
+ "learning_rate": 1.2230082569339773e-06,
+ "loss": 0.0208,
+ "step": 31037
+ },
+ {
+ "epoch": 84.57220708446866,
+ "grad_norm": 1.7119303941726685,
+ "learning_rate": 1.222585389075619e-06,
+ "loss": 0.0193,
+ "step": 31038
+ },
+ {
+ "epoch": 84.57493188010899,
+ "grad_norm": 2.7175660133361816,
+ "learning_rate": 1.222162589575483e-06,
+ "loss": 0.042,
+ "step": 31039
+ },
+ {
+ "epoch": 84.57765667574932,
+ "grad_norm": 2.8624460697174072,
+ "learning_rate": 1.2217398584368634e-06,
+ "loss": 0.1138,
+ "step": 31040
+ },
+ {
+ "epoch": 84.58038147138964,
+ "grad_norm": 1.645054578781128,
+ "learning_rate": 1.221317195663051e-06,
+ "loss": 0.1273,
+ "step": 31041
+ },
+ {
+ "epoch": 84.58310626702998,
+ "grad_norm": 1.6453557014465332,
+ "learning_rate": 1.2208946012573352e-06,
+ "loss": 0.0642,
+ "step": 31042
+ },
+ {
+ "epoch": 84.5858310626703,
+ "grad_norm": 6.238443374633789,
+ "learning_rate": 1.2204720752230126e-06,
+ "loss": 0.0368,
+ "step": 31043
+ },
+ {
+ "epoch": 84.58855585831063,
+ "grad_norm": 2.3180487155914307,
+ "learning_rate": 1.2200496175633714e-06,
+ "loss": 0.1693,
+ "step": 31044
+ },
+ {
+ "epoch": 84.59128065395096,
+ "grad_norm": 2.5004770755767822,
+ "learning_rate": 1.2196272282817e-06,
+ "loss": 0.0537,
+ "step": 31045
+ },
+ {
+ "epoch": 84.59400544959128,
+ "grad_norm": 3.1233437061309814,
+ "learning_rate": 1.2192049073812872e-06,
+ "loss": 0.0854,
+ "step": 31046
+ },
+ {
+ "epoch": 84.59673024523161,
+ "grad_norm": 1.4701508283615112,
+ "learning_rate": 1.218782654865427e-06,
+ "loss": 0.0183,
+ "step": 31047
+ },
+ {
+ "epoch": 84.59945504087193,
+ "grad_norm": 2.837486505508423,
+ "learning_rate": 1.218360470737402e-06,
+ "loss": 0.0482,
+ "step": 31048
+ },
+ {
+ "epoch": 84.60217983651226,
+ "grad_norm": 1.651308536529541,
+ "learning_rate": 1.2179383550005052e-06,
+ "loss": 0.0216,
+ "step": 31049
+ },
+ {
+ "epoch": 84.60490463215258,
+ "grad_norm": 2.7535626888275146,
+ "learning_rate": 1.2175163076580222e-06,
+ "loss": 0.0243,
+ "step": 31050
+ },
+ {
+ "epoch": 84.60762942779292,
+ "grad_norm": 2.362203598022461,
+ "learning_rate": 1.2170943287132375e-06,
+ "loss": 0.1221,
+ "step": 31051
+ },
+ {
+ "epoch": 84.61035422343325,
+ "grad_norm": 2.717883348464966,
+ "learning_rate": 1.2166724181694411e-06,
+ "loss": 0.0828,
+ "step": 31052
+ },
+ {
+ "epoch": 84.61307901907357,
+ "grad_norm": 1.5653126239776611,
+ "learning_rate": 1.2162505760299182e-06,
+ "loss": 0.0209,
+ "step": 31053
+ },
+ {
+ "epoch": 84.6158038147139,
+ "grad_norm": 3.5864832401275635,
+ "learning_rate": 1.2158288022979514e-06,
+ "loss": 0.0935,
+ "step": 31054
+ },
+ {
+ "epoch": 84.61852861035422,
+ "grad_norm": 4.0297160148620605,
+ "learning_rate": 1.215407096976826e-06,
+ "loss": 0.0945,
+ "step": 31055
+ },
+ {
+ "epoch": 84.62125340599455,
+ "grad_norm": 2.4685301780700684,
+ "learning_rate": 1.2149854600698296e-06,
+ "loss": 0.0526,
+ "step": 31056
+ },
+ {
+ "epoch": 84.62397820163488,
+ "grad_norm": 1.8899409770965576,
+ "learning_rate": 1.2145638915802438e-06,
+ "loss": 0.0241,
+ "step": 31057
+ },
+ {
+ "epoch": 84.6267029972752,
+ "grad_norm": 3.2765052318573,
+ "learning_rate": 1.2141423915113515e-06,
+ "loss": 0.0333,
+ "step": 31058
+ },
+ {
+ "epoch": 84.62942779291554,
+ "grad_norm": 2.8388254642486572,
+ "learning_rate": 1.2137209598664334e-06,
+ "loss": 0.0682,
+ "step": 31059
+ },
+ {
+ "epoch": 84.63215258855585,
+ "grad_norm": 2.8888697624206543,
+ "learning_rate": 1.213299596648776e-06,
+ "loss": 0.1235,
+ "step": 31060
+ },
+ {
+ "epoch": 84.63487738419619,
+ "grad_norm": 2.789600133895874,
+ "learning_rate": 1.2128783018616585e-06,
+ "loss": 0.1367,
+ "step": 31061
+ },
+ {
+ "epoch": 84.6376021798365,
+ "grad_norm": 2.938390016555786,
+ "learning_rate": 1.212457075508362e-06,
+ "loss": 0.0446,
+ "step": 31062
+ },
+ {
+ "epoch": 84.64032697547684,
+ "grad_norm": 2.4707260131835938,
+ "learning_rate": 1.2120359175921636e-06,
+ "loss": 0.2618,
+ "step": 31063
+ },
+ {
+ "epoch": 84.64305177111717,
+ "grad_norm": 2.305969715118408,
+ "learning_rate": 1.2116148281163497e-06,
+ "loss": 0.0809,
+ "step": 31064
+ },
+ {
+ "epoch": 84.64577656675749,
+ "grad_norm": 3.376065492630005,
+ "learning_rate": 1.2111938070841979e-06,
+ "loss": 0.0724,
+ "step": 31065
+ },
+ {
+ "epoch": 84.64850136239782,
+ "grad_norm": 3.548962116241455,
+ "learning_rate": 1.2107728544989817e-06,
+ "loss": 0.0347,
+ "step": 31066
+ },
+ {
+ "epoch": 84.65122615803814,
+ "grad_norm": 2.1145694255828857,
+ "learning_rate": 1.2103519703639844e-06,
+ "loss": 0.1118,
+ "step": 31067
+ },
+ {
+ "epoch": 84.65395095367847,
+ "grad_norm": 2.4844484329223633,
+ "learning_rate": 1.2099311546824853e-06,
+ "loss": 0.0376,
+ "step": 31068
+ },
+ {
+ "epoch": 84.65667574931881,
+ "grad_norm": 2.0232150554656982,
+ "learning_rate": 1.20951040745776e-06,
+ "loss": 0.0338,
+ "step": 31069
+ },
+ {
+ "epoch": 84.65940054495913,
+ "grad_norm": 5.746128082275391,
+ "learning_rate": 1.2090897286930837e-06,
+ "loss": 0.0821,
+ "step": 31070
+ },
+ {
+ "epoch": 84.66212534059946,
+ "grad_norm": 2.1323885917663574,
+ "learning_rate": 1.2086691183917322e-06,
+ "loss": 0.039,
+ "step": 31071
+ },
+ {
+ "epoch": 84.66485013623978,
+ "grad_norm": 3.363504648208618,
+ "learning_rate": 1.208248576556985e-06,
+ "loss": 0.0508,
+ "step": 31072
+ },
+ {
+ "epoch": 84.66757493188011,
+ "grad_norm": 3.2984578609466553,
+ "learning_rate": 1.2078281031921146e-06,
+ "loss": 0.1499,
+ "step": 31073
+ },
+ {
+ "epoch": 84.67029972752043,
+ "grad_norm": 2.885843276977539,
+ "learning_rate": 1.2074076983003956e-06,
+ "loss": 0.054,
+ "step": 31074
+ },
+ {
+ "epoch": 84.67302452316076,
+ "grad_norm": 2.0458831787109375,
+ "learning_rate": 1.2069873618851001e-06,
+ "loss": 0.038,
+ "step": 31075
+ },
+ {
+ "epoch": 84.6757493188011,
+ "grad_norm": 2.1821789741516113,
+ "learning_rate": 1.2065670939495068e-06,
+ "loss": 0.0532,
+ "step": 31076
+ },
+ {
+ "epoch": 84.67847411444141,
+ "grad_norm": 4.3712053298950195,
+ "learning_rate": 1.2061468944968857e-06,
+ "loss": 0.0278,
+ "step": 31077
+ },
+ {
+ "epoch": 84.68119891008175,
+ "grad_norm": 3.6181650161743164,
+ "learning_rate": 1.2057267635305102e-06,
+ "loss": 0.0635,
+ "step": 31078
+ },
+ {
+ "epoch": 84.68392370572207,
+ "grad_norm": 3.243540048599243,
+ "learning_rate": 1.205306701053649e-06,
+ "loss": 0.0646,
+ "step": 31079
+ },
+ {
+ "epoch": 84.6866485013624,
+ "grad_norm": 2.5232150554656982,
+ "learning_rate": 1.204886707069578e-06,
+ "loss": 0.0372,
+ "step": 31080
+ },
+ {
+ "epoch": 84.68937329700273,
+ "grad_norm": 3.703014373779297,
+ "learning_rate": 1.2044667815815668e-06,
+ "loss": 0.0549,
+ "step": 31081
+ },
+ {
+ "epoch": 84.69209809264305,
+ "grad_norm": 1.814774751663208,
+ "learning_rate": 1.2040469245928843e-06,
+ "loss": 0.0267,
+ "step": 31082
+ },
+ {
+ "epoch": 84.69482288828338,
+ "grad_norm": 2.440342664718628,
+ "learning_rate": 1.2036271361067996e-06,
+ "loss": 0.0547,
+ "step": 31083
+ },
+ {
+ "epoch": 84.6975476839237,
+ "grad_norm": 2.8584320545196533,
+ "learning_rate": 1.203207416126584e-06,
+ "loss": 0.0314,
+ "step": 31084
+ },
+ {
+ "epoch": 84.70027247956403,
+ "grad_norm": 4.247107028961182,
+ "learning_rate": 1.2027877646555087e-06,
+ "loss": 0.0472,
+ "step": 31085
+ },
+ {
+ "epoch": 84.70299727520435,
+ "grad_norm": 4.565586566925049,
+ "learning_rate": 1.202368181696838e-06,
+ "loss": 0.0707,
+ "step": 31086
+ },
+ {
+ "epoch": 84.70572207084469,
+ "grad_norm": 2.6981148719787598,
+ "learning_rate": 1.2019486672538383e-06,
+ "loss": 0.0278,
+ "step": 31087
+ },
+ {
+ "epoch": 84.70844686648502,
+ "grad_norm": 2.0777294635772705,
+ "learning_rate": 1.2015292213297824e-06,
+ "loss": 0.0635,
+ "step": 31088
+ },
+ {
+ "epoch": 84.71117166212534,
+ "grad_norm": 3.509965658187866,
+ "learning_rate": 1.2011098439279333e-06,
+ "loss": 0.0839,
+ "step": 31089
+ },
+ {
+ "epoch": 84.71389645776567,
+ "grad_norm": 2.077681541442871,
+ "learning_rate": 1.2006905350515575e-06,
+ "loss": 0.0781,
+ "step": 31090
+ },
+ {
+ "epoch": 84.71662125340599,
+ "grad_norm": 2.4037723541259766,
+ "learning_rate": 1.2002712947039185e-06,
+ "loss": 0.0282,
+ "step": 31091
+ },
+ {
+ "epoch": 84.71934604904632,
+ "grad_norm": 2.0101139545440674,
+ "learning_rate": 1.1998521228882853e-06,
+ "loss": 0.0259,
+ "step": 31092
+ },
+ {
+ "epoch": 84.72207084468666,
+ "grad_norm": 2.952502489089966,
+ "learning_rate": 1.1994330196079208e-06,
+ "loss": 0.0504,
+ "step": 31093
+ },
+ {
+ "epoch": 84.72479564032697,
+ "grad_norm": 2.8094520568847656,
+ "learning_rate": 1.1990139848660886e-06,
+ "loss": 0.107,
+ "step": 31094
+ },
+ {
+ "epoch": 84.7275204359673,
+ "grad_norm": 2.9072251319885254,
+ "learning_rate": 1.198595018666051e-06,
+ "loss": 0.0944,
+ "step": 31095
+ },
+ {
+ "epoch": 84.73024523160763,
+ "grad_norm": 3.1361992359161377,
+ "learning_rate": 1.1981761210110732e-06,
+ "loss": 0.0674,
+ "step": 31096
+ },
+ {
+ "epoch": 84.73297002724796,
+ "grad_norm": 2.763051986694336,
+ "learning_rate": 1.1977572919044166e-06,
+ "loss": 0.0265,
+ "step": 31097
+ },
+ {
+ "epoch": 84.73569482288828,
+ "grad_norm": 3.9850151538848877,
+ "learning_rate": 1.1973385313493436e-06,
+ "loss": 0.0349,
+ "step": 31098
+ },
+ {
+ "epoch": 84.73841961852861,
+ "grad_norm": 2.8541979789733887,
+ "learning_rate": 1.1969198393491123e-06,
+ "loss": 0.0525,
+ "step": 31099
+ },
+ {
+ "epoch": 84.74114441416894,
+ "grad_norm": 2.51537823677063,
+ "learning_rate": 1.1965012159069855e-06,
+ "loss": 0.0711,
+ "step": 31100
+ },
+ {
+ "epoch": 84.74386920980926,
+ "grad_norm": 2.9767189025878906,
+ "learning_rate": 1.1960826610262266e-06,
+ "loss": 0.0348,
+ "step": 31101
+ },
+ {
+ "epoch": 84.7465940054496,
+ "grad_norm": 2.8209567070007324,
+ "learning_rate": 1.1956641747100918e-06,
+ "loss": 0.0441,
+ "step": 31102
+ },
+ {
+ "epoch": 84.74931880108991,
+ "grad_norm": 2.726255178451538,
+ "learning_rate": 1.1952457569618415e-06,
+ "loss": 0.0213,
+ "step": 31103
+ },
+ {
+ "epoch": 84.75204359673025,
+ "grad_norm": 2.257753610610962,
+ "learning_rate": 1.1948274077847322e-06,
+ "loss": 0.0232,
+ "step": 31104
+ },
+ {
+ "epoch": 84.75476839237058,
+ "grad_norm": 8.945773124694824,
+ "learning_rate": 1.1944091271820258e-06,
+ "loss": 0.0518,
+ "step": 31105
+ },
+ {
+ "epoch": 84.7574931880109,
+ "grad_norm": 1.8746299743652344,
+ "learning_rate": 1.1939909151569773e-06,
+ "loss": 0.0314,
+ "step": 31106
+ },
+ {
+ "epoch": 84.76021798365123,
+ "grad_norm": 4.879593849182129,
+ "learning_rate": 1.193572771712842e-06,
+ "loss": 0.0649,
+ "step": 31107
+ },
+ {
+ "epoch": 84.76294277929155,
+ "grad_norm": 2.582674980163574,
+ "learning_rate": 1.1931546968528807e-06,
+ "loss": 0.0397,
+ "step": 31108
+ },
+ {
+ "epoch": 84.76566757493188,
+ "grad_norm": 4.804081439971924,
+ "learning_rate": 1.192736690580346e-06,
+ "loss": 0.0867,
+ "step": 31109
+ },
+ {
+ "epoch": 84.7683923705722,
+ "grad_norm": 18.874242782592773,
+ "learning_rate": 1.1923187528984958e-06,
+ "loss": 0.1046,
+ "step": 31110
+ },
+ {
+ "epoch": 84.77111716621253,
+ "grad_norm": 2.4071621894836426,
+ "learning_rate": 1.1919008838105816e-06,
+ "loss": 0.0323,
+ "step": 31111
+ },
+ {
+ "epoch": 84.77384196185287,
+ "grad_norm": 2.356154203414917,
+ "learning_rate": 1.191483083319862e-06,
+ "loss": 0.1667,
+ "step": 31112
+ },
+ {
+ "epoch": 84.77656675749319,
+ "grad_norm": 3.3072586059570312,
+ "learning_rate": 1.191065351429589e-06,
+ "loss": 0.118,
+ "step": 31113
+ },
+ {
+ "epoch": 84.77929155313352,
+ "grad_norm": 2.270320415496826,
+ "learning_rate": 1.190647688143014e-06,
+ "loss": 0.1204,
+ "step": 31114
+ },
+ {
+ "epoch": 84.78201634877384,
+ "grad_norm": 2.617692708969116,
+ "learning_rate": 1.1902300934633904e-06,
+ "loss": 0.0427,
+ "step": 31115
+ },
+ {
+ "epoch": 84.78474114441417,
+ "grad_norm": 3.325610876083374,
+ "learning_rate": 1.189812567393973e-06,
+ "loss": 0.046,
+ "step": 31116
+ },
+ {
+ "epoch": 84.7874659400545,
+ "grad_norm": 2.1286509037017822,
+ "learning_rate": 1.1893951099380097e-06,
+ "loss": 0.0273,
+ "step": 31117
+ },
+ {
+ "epoch": 84.79019073569482,
+ "grad_norm": 5.044488906860352,
+ "learning_rate": 1.1889777210987564e-06,
+ "loss": 0.058,
+ "step": 31118
+ },
+ {
+ "epoch": 84.79291553133515,
+ "grad_norm": 2.514359474182129,
+ "learning_rate": 1.1885604008794604e-06,
+ "loss": 0.0311,
+ "step": 31119
+ },
+ {
+ "epoch": 84.79564032697547,
+ "grad_norm": 2.4255313873291016,
+ "learning_rate": 1.1881431492833694e-06,
+ "loss": 0.0403,
+ "step": 31120
+ },
+ {
+ "epoch": 84.7983651226158,
+ "grad_norm": 4.272997856140137,
+ "learning_rate": 1.1877259663137398e-06,
+ "loss": 0.036,
+ "step": 31121
+ },
+ {
+ "epoch": 84.80108991825612,
+ "grad_norm": 2.7143914699554443,
+ "learning_rate": 1.1873088519738163e-06,
+ "loss": 0.0286,
+ "step": 31122
+ },
+ {
+ "epoch": 84.80381471389646,
+ "grad_norm": 1.854542851448059,
+ "learning_rate": 1.1868918062668467e-06,
+ "loss": 0.0225,
+ "step": 31123
+ },
+ {
+ "epoch": 84.80653950953679,
+ "grad_norm": 2.3984200954437256,
+ "learning_rate": 1.1864748291960793e-06,
+ "loss": 0.0614,
+ "step": 31124
+ },
+ {
+ "epoch": 84.80926430517711,
+ "grad_norm": 2.313521385192871,
+ "learning_rate": 1.1860579207647638e-06,
+ "loss": 0.0905,
+ "step": 31125
+ },
+ {
+ "epoch": 84.81198910081744,
+ "grad_norm": 3.3067080974578857,
+ "learning_rate": 1.1856410809761454e-06,
+ "loss": 0.0237,
+ "step": 31126
+ },
+ {
+ "epoch": 84.81471389645776,
+ "grad_norm": 1.8766144514083862,
+ "learning_rate": 1.1852243098334703e-06,
+ "loss": 0.034,
+ "step": 31127
+ },
+ {
+ "epoch": 84.8174386920981,
+ "grad_norm": 2.371131181716919,
+ "learning_rate": 1.1848076073399838e-06,
+ "loss": 0.041,
+ "step": 31128
+ },
+ {
+ "epoch": 84.82016348773843,
+ "grad_norm": 2.869938850402832,
+ "learning_rate": 1.1843909734989323e-06,
+ "loss": 0.0428,
+ "step": 31129
+ },
+ {
+ "epoch": 84.82288828337875,
+ "grad_norm": 5.338016033172607,
+ "learning_rate": 1.1839744083135618e-06,
+ "loss": 0.0854,
+ "step": 31130
+ },
+ {
+ "epoch": 84.82561307901908,
+ "grad_norm": 2.4351656436920166,
+ "learning_rate": 1.183557911787112e-06,
+ "loss": 0.1161,
+ "step": 31131
+ },
+ {
+ "epoch": 84.8283378746594,
+ "grad_norm": 2.4238884449005127,
+ "learning_rate": 1.1831414839228318e-06,
+ "loss": 0.0297,
+ "step": 31132
+ },
+ {
+ "epoch": 84.83106267029973,
+ "grad_norm": 2.19629168510437,
+ "learning_rate": 1.1827251247239614e-06,
+ "loss": 0.0621,
+ "step": 31133
+ },
+ {
+ "epoch": 84.83378746594005,
+ "grad_norm": 2.6091413497924805,
+ "learning_rate": 1.1823088341937416e-06,
+ "loss": 0.021,
+ "step": 31134
+ },
+ {
+ "epoch": 84.83651226158038,
+ "grad_norm": 2.723750114440918,
+ "learning_rate": 1.1818926123354201e-06,
+ "loss": 0.0998,
+ "step": 31135
+ },
+ {
+ "epoch": 84.83923705722071,
+ "grad_norm": 3.025283098220825,
+ "learning_rate": 1.181476459152232e-06,
+ "loss": 0.0399,
+ "step": 31136
+ },
+ {
+ "epoch": 84.84196185286103,
+ "grad_norm": 1.6982884407043457,
+ "learning_rate": 1.1810603746474235e-06,
+ "loss": 0.0213,
+ "step": 31137
+ },
+ {
+ "epoch": 84.84468664850137,
+ "grad_norm": 3.653689384460449,
+ "learning_rate": 1.1806443588242333e-06,
+ "loss": 0.1872,
+ "step": 31138
+ },
+ {
+ "epoch": 84.84741144414168,
+ "grad_norm": 2.5489659309387207,
+ "learning_rate": 1.1802284116859008e-06,
+ "loss": 0.1274,
+ "step": 31139
+ },
+ {
+ "epoch": 84.85013623978202,
+ "grad_norm": 2.3214521408081055,
+ "learning_rate": 1.1798125332356646e-06,
+ "loss": 0.0807,
+ "step": 31140
+ },
+ {
+ "epoch": 84.85286103542235,
+ "grad_norm": 2.6158955097198486,
+ "learning_rate": 1.1793967234767656e-06,
+ "loss": 0.0384,
+ "step": 31141
+ },
+ {
+ "epoch": 84.85558583106267,
+ "grad_norm": 7.601649761199951,
+ "learning_rate": 1.178980982412441e-06,
+ "loss": 0.1165,
+ "step": 31142
+ },
+ {
+ "epoch": 84.858310626703,
+ "grad_norm": 3.254023313522339,
+ "learning_rate": 1.1785653100459282e-06,
+ "loss": 0.0483,
+ "step": 31143
+ },
+ {
+ "epoch": 84.86103542234332,
+ "grad_norm": 3.435879945755005,
+ "learning_rate": 1.1781497063804636e-06,
+ "loss": 0.0952,
+ "step": 31144
+ },
+ {
+ "epoch": 84.86376021798365,
+ "grad_norm": 3.469769239425659,
+ "learning_rate": 1.177734171419287e-06,
+ "loss": 0.0854,
+ "step": 31145
+ },
+ {
+ "epoch": 84.86648501362397,
+ "grad_norm": 2.5312633514404297,
+ "learning_rate": 1.1773187051656332e-06,
+ "loss": 0.1277,
+ "step": 31146
+ },
+ {
+ "epoch": 84.8692098092643,
+ "grad_norm": 2.338857650756836,
+ "learning_rate": 1.1769033076227364e-06,
+ "loss": 0.0605,
+ "step": 31147
+ },
+ {
+ "epoch": 84.87193460490464,
+ "grad_norm": 1.533124566078186,
+ "learning_rate": 1.1764879787938311e-06,
+ "loss": 0.0217,
+ "step": 31148
+ },
+ {
+ "epoch": 84.87465940054496,
+ "grad_norm": 5.608811855316162,
+ "learning_rate": 1.1760727186821552e-06,
+ "loss": 0.0547,
+ "step": 31149
+ },
+ {
+ "epoch": 84.87738419618529,
+ "grad_norm": 3.0883374214172363,
+ "learning_rate": 1.175657527290941e-06,
+ "loss": 0.0475,
+ "step": 31150
+ },
+ {
+ "epoch": 84.88010899182561,
+ "grad_norm": 2.5763869285583496,
+ "learning_rate": 1.1752424046234223e-06,
+ "loss": 0.0509,
+ "step": 31151
+ },
+ {
+ "epoch": 84.88283378746594,
+ "grad_norm": 1.486336350440979,
+ "learning_rate": 1.1748273506828278e-06,
+ "loss": 0.0198,
+ "step": 31152
+ },
+ {
+ "epoch": 84.88555858310627,
+ "grad_norm": 2.8218631744384766,
+ "learning_rate": 1.174412365472397e-06,
+ "loss": 0.0547,
+ "step": 31153
+ },
+ {
+ "epoch": 84.88828337874659,
+ "grad_norm": 4.80703067779541,
+ "learning_rate": 1.1739974489953598e-06,
+ "loss": 0.0379,
+ "step": 31154
+ },
+ {
+ "epoch": 84.89100817438693,
+ "grad_norm": 7.6221208572387695,
+ "learning_rate": 1.1735826012549457e-06,
+ "loss": 0.0318,
+ "step": 31155
+ },
+ {
+ "epoch": 84.89373297002724,
+ "grad_norm": 1.7960706949234009,
+ "learning_rate": 1.1731678222543841e-06,
+ "loss": 0.061,
+ "step": 31156
+ },
+ {
+ "epoch": 84.89645776566758,
+ "grad_norm": 3.2422173023223877,
+ "learning_rate": 1.1727531119969104e-06,
+ "loss": 0.0469,
+ "step": 31157
+ },
+ {
+ "epoch": 84.8991825613079,
+ "grad_norm": 1.7906864881515503,
+ "learning_rate": 1.172338470485751e-06,
+ "loss": 0.0178,
+ "step": 31158
+ },
+ {
+ "epoch": 84.90190735694823,
+ "grad_norm": 3.061605930328369,
+ "learning_rate": 1.1719238977241343e-06,
+ "loss": 0.1223,
+ "step": 31159
+ },
+ {
+ "epoch": 84.90463215258856,
+ "grad_norm": 6.10139799118042,
+ "learning_rate": 1.1715093937152888e-06,
+ "loss": 0.1513,
+ "step": 31160
+ },
+ {
+ "epoch": 84.90735694822888,
+ "grad_norm": 1.8453673124313354,
+ "learning_rate": 1.1710949584624466e-06,
+ "loss": 0.0167,
+ "step": 31161
+ },
+ {
+ "epoch": 84.91008174386921,
+ "grad_norm": 2.165992259979248,
+ "learning_rate": 1.1706805919688323e-06,
+ "loss": 0.023,
+ "step": 31162
+ },
+ {
+ "epoch": 84.91280653950953,
+ "grad_norm": 3.98290753364563,
+ "learning_rate": 1.1702662942376742e-06,
+ "loss": 0.1148,
+ "step": 31163
+ },
+ {
+ "epoch": 84.91553133514986,
+ "grad_norm": 3.149789810180664,
+ "learning_rate": 1.1698520652721946e-06,
+ "loss": 0.131,
+ "step": 31164
+ },
+ {
+ "epoch": 84.9182561307902,
+ "grad_norm": 4.626081466674805,
+ "learning_rate": 1.1694379050756256e-06,
+ "loss": 0.0928,
+ "step": 31165
+ },
+ {
+ "epoch": 84.92098092643052,
+ "grad_norm": 2.892207622528076,
+ "learning_rate": 1.16902381365119e-06,
+ "loss": 0.0401,
+ "step": 31166
+ },
+ {
+ "epoch": 84.92370572207085,
+ "grad_norm": 2.274512529373169,
+ "learning_rate": 1.168609791002112e-06,
+ "loss": 0.0345,
+ "step": 31167
+ },
+ {
+ "epoch": 84.92643051771117,
+ "grad_norm": 2.4470462799072266,
+ "learning_rate": 1.168195837131616e-06,
+ "loss": 0.0663,
+ "step": 31168
+ },
+ {
+ "epoch": 84.9291553133515,
+ "grad_norm": 3.115577220916748,
+ "learning_rate": 1.1677819520429258e-06,
+ "loss": 0.1073,
+ "step": 31169
+ },
+ {
+ "epoch": 84.93188010899182,
+ "grad_norm": 2.0581114292144775,
+ "learning_rate": 1.1673681357392674e-06,
+ "loss": 0.1468,
+ "step": 31170
+ },
+ {
+ "epoch": 84.93460490463215,
+ "grad_norm": 2.517979145050049,
+ "learning_rate": 1.166954388223862e-06,
+ "loss": 0.0661,
+ "step": 31171
+ },
+ {
+ "epoch": 84.93732970027249,
+ "grad_norm": 2.2308521270751953,
+ "learning_rate": 1.1665407094999292e-06,
+ "loss": 0.0263,
+ "step": 31172
+ },
+ {
+ "epoch": 84.9400544959128,
+ "grad_norm": 2.980236768722534,
+ "learning_rate": 1.1661270995706953e-06,
+ "loss": 0.1513,
+ "step": 31173
+ },
+ {
+ "epoch": 84.94277929155314,
+ "grad_norm": 1.9563831090927124,
+ "learning_rate": 1.1657135584393797e-06,
+ "loss": 0.0236,
+ "step": 31174
+ },
+ {
+ "epoch": 84.94550408719346,
+ "grad_norm": 2.2078192234039307,
+ "learning_rate": 1.1653000861092012e-06,
+ "loss": 0.0337,
+ "step": 31175
+ },
+ {
+ "epoch": 84.94822888283379,
+ "grad_norm": 3.0110480785369873,
+ "learning_rate": 1.1648866825833804e-06,
+ "loss": 0.2238,
+ "step": 31176
+ },
+ {
+ "epoch": 84.95095367847412,
+ "grad_norm": 1.9992401599884033,
+ "learning_rate": 1.1644733478651394e-06,
+ "loss": 0.0192,
+ "step": 31177
+ },
+ {
+ "epoch": 84.95367847411444,
+ "grad_norm": 3.679093360900879,
+ "learning_rate": 1.1640600819576965e-06,
+ "loss": 0.0235,
+ "step": 31178
+ },
+ {
+ "epoch": 84.95640326975477,
+ "grad_norm": 3.946873664855957,
+ "learning_rate": 1.163646884864268e-06,
+ "loss": 0.0602,
+ "step": 31179
+ },
+ {
+ "epoch": 84.95912806539509,
+ "grad_norm": 3.0473928451538086,
+ "learning_rate": 1.1632337565880715e-06,
+ "loss": 0.025,
+ "step": 31180
+ },
+ {
+ "epoch": 84.96185286103542,
+ "grad_norm": 2.5463502407073975,
+ "learning_rate": 1.1628206971323287e-06,
+ "loss": 0.0283,
+ "step": 31181
+ },
+ {
+ "epoch": 84.96457765667574,
+ "grad_norm": 2.951878309249878,
+ "learning_rate": 1.1624077065002537e-06,
+ "loss": 0.0784,
+ "step": 31182
+ },
+ {
+ "epoch": 84.96730245231608,
+ "grad_norm": 2.6662778854370117,
+ "learning_rate": 1.161994784695063e-06,
+ "loss": 0.0309,
+ "step": 31183
+ },
+ {
+ "epoch": 84.97002724795641,
+ "grad_norm": 3.0899598598480225,
+ "learning_rate": 1.1615819317199696e-06,
+ "loss": 0.0242,
+ "step": 31184
+ },
+ {
+ "epoch": 84.97275204359673,
+ "grad_norm": 2.764861583709717,
+ "learning_rate": 1.161169147578195e-06,
+ "loss": 0.0521,
+ "step": 31185
+ },
+ {
+ "epoch": 84.97547683923706,
+ "grad_norm": 1.660042643547058,
+ "learning_rate": 1.160756432272947e-06,
+ "loss": 0.137,
+ "step": 31186
+ },
+ {
+ "epoch": 84.97820163487738,
+ "grad_norm": 2.3153398036956787,
+ "learning_rate": 1.1603437858074463e-06,
+ "loss": 0.0395,
+ "step": 31187
+ },
+ {
+ "epoch": 84.98092643051771,
+ "grad_norm": 5.803910732269287,
+ "learning_rate": 1.1599312081849046e-06,
+ "loss": 0.0934,
+ "step": 31188
+ },
+ {
+ "epoch": 84.98365122615803,
+ "grad_norm": 2.680100917816162,
+ "learning_rate": 1.1595186994085306e-06,
+ "loss": 0.0411,
+ "step": 31189
+ },
+ {
+ "epoch": 84.98637602179836,
+ "grad_norm": 4.34005069732666,
+ "learning_rate": 1.159106259481544e-06,
+ "loss": 0.1272,
+ "step": 31190
+ },
+ {
+ "epoch": 84.9891008174387,
+ "grad_norm": 2.859818458557129,
+ "learning_rate": 1.1586938884071519e-06,
+ "loss": 0.0697,
+ "step": 31191
+ },
+ {
+ "epoch": 84.99182561307902,
+ "grad_norm": 2.5982792377471924,
+ "learning_rate": 1.1582815861885676e-06,
+ "loss": 0.138,
+ "step": 31192
+ },
+ {
+ "epoch": 84.99455040871935,
+ "grad_norm": 4.581809997558594,
+ "learning_rate": 1.1578693528289998e-06,
+ "loss": 0.12,
+ "step": 31193
+ },
+ {
+ "epoch": 84.99727520435967,
+ "grad_norm": 2.7573812007904053,
+ "learning_rate": 1.1574571883316632e-06,
+ "loss": 0.127,
+ "step": 31194
+ },
+ {
+ "epoch": 85.0,
+ "grad_norm": 3.7230260372161865,
+ "learning_rate": 1.1570450926997657e-06,
+ "loss": 0.0482,
+ "step": 31195
+ },
+ {
+ "epoch": 85.00272479564033,
+ "grad_norm": 2.5617825984954834,
+ "learning_rate": 1.1566330659365134e-06,
+ "loss": 0.0917,
+ "step": 31196
+ },
+ {
+ "epoch": 85.00544959128065,
+ "grad_norm": 3.321756601333618,
+ "learning_rate": 1.1562211080451201e-06,
+ "loss": 0.0431,
+ "step": 31197
+ },
+ {
+ "epoch": 85.00817438692098,
+ "grad_norm": 2.9215753078460693,
+ "learning_rate": 1.155809219028794e-06,
+ "loss": 0.0309,
+ "step": 31198
+ },
+ {
+ "epoch": 85.0108991825613,
+ "grad_norm": 2.704392910003662,
+ "learning_rate": 1.1553973988907397e-06,
+ "loss": 0.0821,
+ "step": 31199
+ },
+ {
+ "epoch": 85.01362397820164,
+ "grad_norm": 1.7946335077285767,
+ "learning_rate": 1.1549856476341637e-06,
+ "loss": 0.0607,
+ "step": 31200
+ },
+ {
+ "epoch": 85.01634877384195,
+ "grad_norm": 2.6398544311523438,
+ "learning_rate": 1.1545739652622768e-06,
+ "loss": 0.0727,
+ "step": 31201
+ },
+ {
+ "epoch": 85.01907356948229,
+ "grad_norm": 2.370229959487915,
+ "learning_rate": 1.154162351778283e-06,
+ "loss": 0.03,
+ "step": 31202
+ },
+ {
+ "epoch": 85.02179836512262,
+ "grad_norm": 2.9440078735351562,
+ "learning_rate": 1.1537508071853865e-06,
+ "loss": 0.0268,
+ "step": 31203
+ },
+ {
+ "epoch": 85.02452316076294,
+ "grad_norm": 3.667236566543579,
+ "learning_rate": 1.1533393314867959e-06,
+ "loss": 0.1429,
+ "step": 31204
+ },
+ {
+ "epoch": 85.02724795640327,
+ "grad_norm": 2.9445602893829346,
+ "learning_rate": 1.1529279246857129e-06,
+ "loss": 0.1617,
+ "step": 31205
+ },
+ {
+ "epoch": 85.02997275204359,
+ "grad_norm": 2.893164873123169,
+ "learning_rate": 1.1525165867853427e-06,
+ "loss": 0.1164,
+ "step": 31206
+ },
+ {
+ "epoch": 85.03269754768392,
+ "grad_norm": 2.4880118370056152,
+ "learning_rate": 1.1521053177888897e-06,
+ "loss": 0.0347,
+ "step": 31207
+ },
+ {
+ "epoch": 85.03542234332426,
+ "grad_norm": 1.9457095861434937,
+ "learning_rate": 1.1516941176995555e-06,
+ "loss": 0.066,
+ "step": 31208
+ },
+ {
+ "epoch": 85.03814713896458,
+ "grad_norm": 2.136549234390259,
+ "learning_rate": 1.1512829865205399e-06,
+ "loss": 0.0394,
+ "step": 31209
+ },
+ {
+ "epoch": 85.04087193460491,
+ "grad_norm": 3.3046276569366455,
+ "learning_rate": 1.1508719242550504e-06,
+ "loss": 0.1154,
+ "step": 31210
+ },
+ {
+ "epoch": 85.04359673024523,
+ "grad_norm": 2.7356948852539062,
+ "learning_rate": 1.1504609309062865e-06,
+ "loss": 0.0315,
+ "step": 31211
+ },
+ {
+ "epoch": 85.04632152588556,
+ "grad_norm": 3.503849744796753,
+ "learning_rate": 1.1500500064774468e-06,
+ "loss": 0.077,
+ "step": 31212
+ },
+ {
+ "epoch": 85.04904632152588,
+ "grad_norm": 2.7946083545684814,
+ "learning_rate": 1.149639150971731e-06,
+ "loss": 0.0604,
+ "step": 31213
+ },
+ {
+ "epoch": 85.05177111716621,
+ "grad_norm": 2.3161447048187256,
+ "learning_rate": 1.149228364392343e-06,
+ "loss": 0.0505,
+ "step": 31214
+ },
+ {
+ "epoch": 85.05449591280654,
+ "grad_norm": 2.6644997596740723,
+ "learning_rate": 1.1488176467424783e-06,
+ "loss": 0.0559,
+ "step": 31215
+ },
+ {
+ "epoch": 85.05722070844686,
+ "grad_norm": 2.237291097640991,
+ "learning_rate": 1.1484069980253365e-06,
+ "loss": 0.0398,
+ "step": 31216
+ },
+ {
+ "epoch": 85.0599455040872,
+ "grad_norm": 2.0043485164642334,
+ "learning_rate": 1.1479964182441172e-06,
+ "loss": 0.1298,
+ "step": 31217
+ },
+ {
+ "epoch": 85.06267029972751,
+ "grad_norm": 2.936828851699829,
+ "learning_rate": 1.147585907402018e-06,
+ "loss": 0.0819,
+ "step": 31218
+ },
+ {
+ "epoch": 85.06539509536785,
+ "grad_norm": 2.717475652694702,
+ "learning_rate": 1.1471754655022338e-06,
+ "loss": 0.144,
+ "step": 31219
+ },
+ {
+ "epoch": 85.06811989100818,
+ "grad_norm": 2.3554444313049316,
+ "learning_rate": 1.14676509254796e-06,
+ "loss": 0.0378,
+ "step": 31220
+ },
+ {
+ "epoch": 85.0708446866485,
+ "grad_norm": 1.8457690477371216,
+ "learning_rate": 1.1463547885423953e-06,
+ "loss": 0.0201,
+ "step": 31221
+ },
+ {
+ "epoch": 85.07356948228883,
+ "grad_norm": 3.1834592819213867,
+ "learning_rate": 1.145944553488736e-06,
+ "loss": 0.2402,
+ "step": 31222
+ },
+ {
+ "epoch": 85.07629427792915,
+ "grad_norm": 2.8990871906280518,
+ "learning_rate": 1.1455343873901758e-06,
+ "loss": 0.1426,
+ "step": 31223
+ },
+ {
+ "epoch": 85.07901907356948,
+ "grad_norm": 2.236565113067627,
+ "learning_rate": 1.1451242902499093e-06,
+ "loss": 0.1035,
+ "step": 31224
+ },
+ {
+ "epoch": 85.0817438692098,
+ "grad_norm": 2.261110544204712,
+ "learning_rate": 1.1447142620711282e-06,
+ "loss": 0.0701,
+ "step": 31225
+ },
+ {
+ "epoch": 85.08446866485014,
+ "grad_norm": 2.307209014892578,
+ "learning_rate": 1.1443043028570277e-06,
+ "loss": 0.1181,
+ "step": 31226
+ },
+ {
+ "epoch": 85.08719346049047,
+ "grad_norm": 1.7935295104980469,
+ "learning_rate": 1.143894412610802e-06,
+ "loss": 0.0445,
+ "step": 31227
+ },
+ {
+ "epoch": 85.08991825613079,
+ "grad_norm": 2.47874116897583,
+ "learning_rate": 1.1434845913356407e-06,
+ "loss": 0.0458,
+ "step": 31228
+ },
+ {
+ "epoch": 85.09264305177112,
+ "grad_norm": 3.583185911178589,
+ "learning_rate": 1.1430748390347345e-06,
+ "loss": 0.0691,
+ "step": 31229
+ },
+ {
+ "epoch": 85.09536784741144,
+ "grad_norm": 2.242398262023926,
+ "learning_rate": 1.142665155711279e-06,
+ "loss": 0.03,
+ "step": 31230
+ },
+ {
+ "epoch": 85.09809264305177,
+ "grad_norm": 1.7714391946792603,
+ "learning_rate": 1.142255541368461e-06,
+ "loss": 0.03,
+ "step": 31231
+ },
+ {
+ "epoch": 85.1008174386921,
+ "grad_norm": 3.1620378494262695,
+ "learning_rate": 1.141845996009472e-06,
+ "loss": 0.1696,
+ "step": 31232
+ },
+ {
+ "epoch": 85.10354223433242,
+ "grad_norm": 7.280642986297607,
+ "learning_rate": 1.1414365196374999e-06,
+ "loss": 0.0847,
+ "step": 31233
+ },
+ {
+ "epoch": 85.10626702997276,
+ "grad_norm": 2.3759689331054688,
+ "learning_rate": 1.141027112255737e-06,
+ "loss": 0.026,
+ "step": 31234
+ },
+ {
+ "epoch": 85.10899182561307,
+ "grad_norm": 2.9072611331939697,
+ "learning_rate": 1.1406177738673697e-06,
+ "loss": 0.0734,
+ "step": 31235
+ },
+ {
+ "epoch": 85.11171662125341,
+ "grad_norm": 2.286513328552246,
+ "learning_rate": 1.1402085044755862e-06,
+ "loss": 0.0255,
+ "step": 31236
+ },
+ {
+ "epoch": 85.11444141689373,
+ "grad_norm": 3.010617733001709,
+ "learning_rate": 1.139799304083571e-06,
+ "loss": 0.0982,
+ "step": 31237
+ },
+ {
+ "epoch": 85.11716621253406,
+ "grad_norm": 2.5518136024475098,
+ "learning_rate": 1.1393901726945145e-06,
+ "loss": 0.0519,
+ "step": 31238
+ },
+ {
+ "epoch": 85.11989100817439,
+ "grad_norm": 2.2859580516815186,
+ "learning_rate": 1.1389811103116032e-06,
+ "loss": 0.047,
+ "step": 31239
+ },
+ {
+ "epoch": 85.12261580381471,
+ "grad_norm": 2.7176449298858643,
+ "learning_rate": 1.1385721169380226e-06,
+ "loss": 0.1465,
+ "step": 31240
+ },
+ {
+ "epoch": 85.12534059945504,
+ "grad_norm": 2.257220983505249,
+ "learning_rate": 1.1381631925769555e-06,
+ "loss": 0.0256,
+ "step": 31241
+ },
+ {
+ "epoch": 85.12806539509536,
+ "grad_norm": 2.7775049209594727,
+ "learning_rate": 1.1377543372315892e-06,
+ "loss": 0.1032,
+ "step": 31242
+ },
+ {
+ "epoch": 85.1307901907357,
+ "grad_norm": 2.5805413722991943,
+ "learning_rate": 1.1373455509051078e-06,
+ "loss": 0.0284,
+ "step": 31243
+ },
+ {
+ "epoch": 85.13351498637603,
+ "grad_norm": 2.0446224212646484,
+ "learning_rate": 1.1369368336006937e-06,
+ "loss": 0.0316,
+ "step": 31244
+ },
+ {
+ "epoch": 85.13623978201635,
+ "grad_norm": 3.1809558868408203,
+ "learning_rate": 1.136528185321528e-06,
+ "loss": 0.1657,
+ "step": 31245
+ },
+ {
+ "epoch": 85.13896457765668,
+ "grad_norm": 2.5956246852874756,
+ "learning_rate": 1.136119606070798e-06,
+ "loss": 0.0262,
+ "step": 31246
+ },
+ {
+ "epoch": 85.141689373297,
+ "grad_norm": 2.1996331214904785,
+ "learning_rate": 1.1357110958516826e-06,
+ "loss": 0.0258,
+ "step": 31247
+ },
+ {
+ "epoch": 85.14441416893733,
+ "grad_norm": 1.5208231210708618,
+ "learning_rate": 1.135302654667364e-06,
+ "loss": 0.1075,
+ "step": 31248
+ },
+ {
+ "epoch": 85.14713896457765,
+ "grad_norm": 2.095036029815674,
+ "learning_rate": 1.1348942825210218e-06,
+ "loss": 0.0305,
+ "step": 31249
+ },
+ {
+ "epoch": 85.14986376021798,
+ "grad_norm": 3.0639026165008545,
+ "learning_rate": 1.1344859794158391e-06,
+ "loss": 0.2263,
+ "step": 31250
+ },
+ {
+ "epoch": 85.15258855585832,
+ "grad_norm": 2.629934549331665,
+ "learning_rate": 1.1340777453549944e-06,
+ "loss": 0.0828,
+ "step": 31251
+ },
+ {
+ "epoch": 85.15531335149863,
+ "grad_norm": 2.574131488800049,
+ "learning_rate": 1.1336695803416664e-06,
+ "loss": 0.0454,
+ "step": 31252
+ },
+ {
+ "epoch": 85.15803814713897,
+ "grad_norm": 2.7287404537200928,
+ "learning_rate": 1.1332614843790325e-06,
+ "loss": 0.0228,
+ "step": 31253
+ },
+ {
+ "epoch": 85.16076294277929,
+ "grad_norm": 2.968825101852417,
+ "learning_rate": 1.1328534574702755e-06,
+ "loss": 0.106,
+ "step": 31254
+ },
+ {
+ "epoch": 85.16348773841962,
+ "grad_norm": 2.069678544998169,
+ "learning_rate": 1.1324454996185673e-06,
+ "loss": 0.0744,
+ "step": 31255
+ },
+ {
+ "epoch": 85.16621253405995,
+ "grad_norm": 2.4735465049743652,
+ "learning_rate": 1.1320376108270904e-06,
+ "loss": 0.0351,
+ "step": 31256
+ },
+ {
+ "epoch": 85.16893732970027,
+ "grad_norm": 6.014044761657715,
+ "learning_rate": 1.1316297910990203e-06,
+ "loss": 0.0474,
+ "step": 31257
+ },
+ {
+ "epoch": 85.1716621253406,
+ "grad_norm": 2.1581010818481445,
+ "learning_rate": 1.1312220404375285e-06,
+ "loss": 0.0285,
+ "step": 31258
+ },
+ {
+ "epoch": 85.17438692098092,
+ "grad_norm": 3.769885540008545,
+ "learning_rate": 1.1308143588457965e-06,
+ "loss": 0.1763,
+ "step": 31259
+ },
+ {
+ "epoch": 85.17711171662125,
+ "grad_norm": 3.3707964420318604,
+ "learning_rate": 1.1304067463269974e-06,
+ "loss": 0.071,
+ "step": 31260
+ },
+ {
+ "epoch": 85.17983651226157,
+ "grad_norm": 6.158848762512207,
+ "learning_rate": 1.129999202884302e-06,
+ "loss": 0.0274,
+ "step": 31261
+ },
+ {
+ "epoch": 85.1825613079019,
+ "grad_norm": 2.6891701221466064,
+ "learning_rate": 1.1295917285208901e-06,
+ "loss": 0.0343,
+ "step": 31262
+ },
+ {
+ "epoch": 85.18528610354224,
+ "grad_norm": 2.750530481338501,
+ "learning_rate": 1.1291843232399324e-06,
+ "loss": 0.0407,
+ "step": 31263
+ },
+ {
+ "epoch": 85.18801089918256,
+ "grad_norm": 2.945326328277588,
+ "learning_rate": 1.128776987044602e-06,
+ "loss": 0.0627,
+ "step": 31264
+ },
+ {
+ "epoch": 85.19073569482289,
+ "grad_norm": 78.27469635009766,
+ "learning_rate": 1.1283697199380683e-06,
+ "loss": 0.0397,
+ "step": 31265
+ },
+ {
+ "epoch": 85.19346049046321,
+ "grad_norm": 2.988227367401123,
+ "learning_rate": 1.1279625219235068e-06,
+ "loss": 0.1306,
+ "step": 31266
+ },
+ {
+ "epoch": 85.19618528610354,
+ "grad_norm": 2.2063028812408447,
+ "learning_rate": 1.1275553930040894e-06,
+ "loss": 0.0306,
+ "step": 31267
+ },
+ {
+ "epoch": 85.19891008174388,
+ "grad_norm": 3.1017582416534424,
+ "learning_rate": 1.1271483331829835e-06,
+ "loss": 0.0246,
+ "step": 31268
+ },
+ {
+ "epoch": 85.2016348773842,
+ "grad_norm": 3.0398337841033936,
+ "learning_rate": 1.12674134246336e-06,
+ "loss": 0.0315,
+ "step": 31269
+ },
+ {
+ "epoch": 85.20435967302453,
+ "grad_norm": 3.5283937454223633,
+ "learning_rate": 1.1263344208483906e-06,
+ "loss": 0.097,
+ "step": 31270
+ },
+ {
+ "epoch": 85.20708446866485,
+ "grad_norm": 2.1142489910125732,
+ "learning_rate": 1.125927568341244e-06,
+ "loss": 0.024,
+ "step": 31271
+ },
+ {
+ "epoch": 85.20980926430518,
+ "grad_norm": 2.6907687187194824,
+ "learning_rate": 1.1255207849450845e-06,
+ "loss": 0.0297,
+ "step": 31272
+ },
+ {
+ "epoch": 85.2125340599455,
+ "grad_norm": 1.589200496673584,
+ "learning_rate": 1.125114070663087e-06,
+ "loss": 0.0723,
+ "step": 31273
+ },
+ {
+ "epoch": 85.21525885558583,
+ "grad_norm": 1.5391526222229004,
+ "learning_rate": 1.1247074254984126e-06,
+ "loss": 0.0222,
+ "step": 31274
+ },
+ {
+ "epoch": 85.21798365122616,
+ "grad_norm": 2.298555374145508,
+ "learning_rate": 1.1243008494542328e-06,
+ "loss": 0.0267,
+ "step": 31275
+ },
+ {
+ "epoch": 85.22070844686648,
+ "grad_norm": 3.090374231338501,
+ "learning_rate": 1.1238943425337135e-06,
+ "loss": 0.0399,
+ "step": 31276
+ },
+ {
+ "epoch": 85.22343324250681,
+ "grad_norm": 1.9240354299545288,
+ "learning_rate": 1.1234879047400183e-06,
+ "loss": 0.1801,
+ "step": 31277
+ },
+ {
+ "epoch": 85.22615803814713,
+ "grad_norm": 2.856506586074829,
+ "learning_rate": 1.1230815360763126e-06,
+ "loss": 0.0693,
+ "step": 31278
+ },
+ {
+ "epoch": 85.22888283378747,
+ "grad_norm": 1.5447888374328613,
+ "learning_rate": 1.1226752365457626e-06,
+ "loss": 0.0196,
+ "step": 31279
+ },
+ {
+ "epoch": 85.2316076294278,
+ "grad_norm": 2.7791478633880615,
+ "learning_rate": 1.122269006151534e-06,
+ "loss": 0.064,
+ "step": 31280
+ },
+ {
+ "epoch": 85.23433242506812,
+ "grad_norm": 1.721009612083435,
+ "learning_rate": 1.121862844896786e-06,
+ "loss": 0.0385,
+ "step": 31281
+ },
+ {
+ "epoch": 85.23705722070845,
+ "grad_norm": 2.0161871910095215,
+ "learning_rate": 1.1214567527846854e-06,
+ "loss": 0.1422,
+ "step": 31282
+ },
+ {
+ "epoch": 85.23978201634877,
+ "grad_norm": 4.117589950561523,
+ "learning_rate": 1.1210507298183948e-06,
+ "loss": 0.0613,
+ "step": 31283
+ },
+ {
+ "epoch": 85.2425068119891,
+ "grad_norm": 2.8080499172210693,
+ "learning_rate": 1.1206447760010752e-06,
+ "loss": 0.1205,
+ "step": 31284
+ },
+ {
+ "epoch": 85.24523160762942,
+ "grad_norm": 2.301487445831299,
+ "learning_rate": 1.1202388913358863e-06,
+ "loss": 0.0329,
+ "step": 31285
+ },
+ {
+ "epoch": 85.24795640326975,
+ "grad_norm": 2.305171012878418,
+ "learning_rate": 1.1198330758259934e-06,
+ "loss": 0.0531,
+ "step": 31286
+ },
+ {
+ "epoch": 85.25068119891009,
+ "grad_norm": 2.888373374938965,
+ "learning_rate": 1.119427329474555e-06,
+ "loss": 0.0626,
+ "step": 31287
+ },
+ {
+ "epoch": 85.2534059945504,
+ "grad_norm": 3.4480016231536865,
+ "learning_rate": 1.1190216522847297e-06,
+ "loss": 0.072,
+ "step": 31288
+ },
+ {
+ "epoch": 85.25613079019074,
+ "grad_norm": 2.151869058609009,
+ "learning_rate": 1.118616044259676e-06,
+ "loss": 0.0673,
+ "step": 31289
+ },
+ {
+ "epoch": 85.25885558583106,
+ "grad_norm": 1.628497838973999,
+ "learning_rate": 1.118210505402556e-06,
+ "loss": 0.0487,
+ "step": 31290
+ },
+ {
+ "epoch": 85.26158038147139,
+ "grad_norm": 1.705924391746521,
+ "learning_rate": 1.117805035716527e-06,
+ "loss": 0.0278,
+ "step": 31291
+ },
+ {
+ "epoch": 85.26430517711172,
+ "grad_norm": 1.645024061203003,
+ "learning_rate": 1.117399635204748e-06,
+ "loss": 0.0268,
+ "step": 31292
+ },
+ {
+ "epoch": 85.26702997275204,
+ "grad_norm": 2.6714820861816406,
+ "learning_rate": 1.1169943038703734e-06,
+ "loss": 0.0263,
+ "step": 31293
+ },
+ {
+ "epoch": 85.26975476839237,
+ "grad_norm": 1.848447322845459,
+ "learning_rate": 1.1165890417165604e-06,
+ "loss": 0.0193,
+ "step": 31294
+ },
+ {
+ "epoch": 85.2724795640327,
+ "grad_norm": 2.722369909286499,
+ "learning_rate": 1.1161838487464682e-06,
+ "loss": 0.0359,
+ "step": 31295
+ },
+ {
+ "epoch": 85.27520435967303,
+ "grad_norm": 2.494370460510254,
+ "learning_rate": 1.115778724963249e-06,
+ "loss": 0.0701,
+ "step": 31296
+ },
+ {
+ "epoch": 85.27792915531334,
+ "grad_norm": 2.0855612754821777,
+ "learning_rate": 1.1153736703700602e-06,
+ "loss": 0.0211,
+ "step": 31297
+ },
+ {
+ "epoch": 85.28065395095368,
+ "grad_norm": 1.9474340677261353,
+ "learning_rate": 1.1149686849700524e-06,
+ "loss": 0.0343,
+ "step": 31298
+ },
+ {
+ "epoch": 85.28337874659401,
+ "grad_norm": 3.5660603046417236,
+ "learning_rate": 1.1145637687663856e-06,
+ "loss": 0.0623,
+ "step": 31299
+ },
+ {
+ "epoch": 85.28610354223433,
+ "grad_norm": 1.9984091520309448,
+ "learning_rate": 1.1141589217622096e-06,
+ "loss": 0.0208,
+ "step": 31300
+ },
+ {
+ "epoch": 85.28882833787466,
+ "grad_norm": 2.32194447517395,
+ "learning_rate": 1.1137541439606781e-06,
+ "loss": 0.1028,
+ "step": 31301
+ },
+ {
+ "epoch": 85.29155313351498,
+ "grad_norm": 2.6686768531799316,
+ "learning_rate": 1.113349435364941e-06,
+ "loss": 0.0389,
+ "step": 31302
+ },
+ {
+ "epoch": 85.29427792915531,
+ "grad_norm": 2.5307862758636475,
+ "learning_rate": 1.1129447959781546e-06,
+ "loss": 0.0249,
+ "step": 31303
+ },
+ {
+ "epoch": 85.29700272479565,
+ "grad_norm": 3.1726667881011963,
+ "learning_rate": 1.112540225803468e-06,
+ "loss": 0.0769,
+ "step": 31304
+ },
+ {
+ "epoch": 85.29972752043597,
+ "grad_norm": 2.270932197570801,
+ "learning_rate": 1.1121357248440301e-06,
+ "loss": 0.0247,
+ "step": 31305
+ },
+ {
+ "epoch": 85.3024523160763,
+ "grad_norm": 1.6723506450653076,
+ "learning_rate": 1.1117312931029933e-06,
+ "loss": 0.0177,
+ "step": 31306
+ },
+ {
+ "epoch": 85.30517711171662,
+ "grad_norm": 2.499312400817871,
+ "learning_rate": 1.1113269305835095e-06,
+ "loss": 0.1686,
+ "step": 31307
+ },
+ {
+ "epoch": 85.30790190735695,
+ "grad_norm": 1.9165818691253662,
+ "learning_rate": 1.110922637288725e-06,
+ "loss": 0.024,
+ "step": 31308
+ },
+ {
+ "epoch": 85.31062670299727,
+ "grad_norm": 3.382559299468994,
+ "learning_rate": 1.1105184132217894e-06,
+ "loss": 0.0561,
+ "step": 31309
+ },
+ {
+ "epoch": 85.3133514986376,
+ "grad_norm": 3.5681657791137695,
+ "learning_rate": 1.110114258385847e-06,
+ "loss": 0.144,
+ "step": 31310
+ },
+ {
+ "epoch": 85.31607629427793,
+ "grad_norm": 2.3098039627075195,
+ "learning_rate": 1.109710172784052e-06,
+ "loss": 0.0869,
+ "step": 31311
+ },
+ {
+ "epoch": 85.31880108991825,
+ "grad_norm": 5.275523662567139,
+ "learning_rate": 1.1093061564195473e-06,
+ "loss": 0.2314,
+ "step": 31312
+ },
+ {
+ "epoch": 85.32152588555859,
+ "grad_norm": 2.3177170753479004,
+ "learning_rate": 1.1089022092954804e-06,
+ "loss": 0.0722,
+ "step": 31313
+ },
+ {
+ "epoch": 85.3242506811989,
+ "grad_norm": 4.753061771392822,
+ "learning_rate": 1.1084983314149956e-06,
+ "loss": 0.0399,
+ "step": 31314
+ },
+ {
+ "epoch": 85.32697547683924,
+ "grad_norm": 2.071126937866211,
+ "learning_rate": 1.1080945227812401e-06,
+ "loss": 0.0317,
+ "step": 31315
+ },
+ {
+ "epoch": 85.32970027247957,
+ "grad_norm": 1.5893691778182983,
+ "learning_rate": 1.1076907833973594e-06,
+ "loss": 0.0224,
+ "step": 31316
+ },
+ {
+ "epoch": 85.33242506811989,
+ "grad_norm": 3.2053310871124268,
+ "learning_rate": 1.1072871132664964e-06,
+ "loss": 0.0321,
+ "step": 31317
+ },
+ {
+ "epoch": 85.33514986376022,
+ "grad_norm": 2.5301358699798584,
+ "learning_rate": 1.1068835123917932e-06,
+ "loss": 0.0318,
+ "step": 31318
+ },
+ {
+ "epoch": 85.33787465940054,
+ "grad_norm": 2.5551259517669678,
+ "learning_rate": 1.106479980776397e-06,
+ "loss": 0.0998,
+ "step": 31319
+ },
+ {
+ "epoch": 85.34059945504087,
+ "grad_norm": 2.8790533542633057,
+ "learning_rate": 1.106076518423449e-06,
+ "loss": 0.0703,
+ "step": 31320
+ },
+ {
+ "epoch": 85.34332425068119,
+ "grad_norm": 2.3201816082000732,
+ "learning_rate": 1.1056731253360896e-06,
+ "loss": 0.036,
+ "step": 31321
+ },
+ {
+ "epoch": 85.34604904632153,
+ "grad_norm": 2.061262845993042,
+ "learning_rate": 1.1052698015174601e-06,
+ "loss": 0.0563,
+ "step": 31322
+ },
+ {
+ "epoch": 85.34877384196186,
+ "grad_norm": 3.3432466983795166,
+ "learning_rate": 1.1048665469707055e-06,
+ "loss": 0.1288,
+ "step": 31323
+ },
+ {
+ "epoch": 85.35149863760218,
+ "grad_norm": 3.4909512996673584,
+ "learning_rate": 1.104463361698962e-06,
+ "loss": 0.0766,
+ "step": 31324
+ },
+ {
+ "epoch": 85.35422343324251,
+ "grad_norm": 2.3487298488616943,
+ "learning_rate": 1.1040602457053729e-06,
+ "loss": 0.0624,
+ "step": 31325
+ },
+ {
+ "epoch": 85.35694822888283,
+ "grad_norm": 2.2828550338745117,
+ "learning_rate": 1.1036571989930744e-06,
+ "loss": 0.0402,
+ "step": 31326
+ },
+ {
+ "epoch": 85.35967302452316,
+ "grad_norm": 3.2351059913635254,
+ "learning_rate": 1.1032542215652098e-06,
+ "loss": 0.1084,
+ "step": 31327
+ },
+ {
+ "epoch": 85.3623978201635,
+ "grad_norm": 1.4596086740493774,
+ "learning_rate": 1.1028513134249153e-06,
+ "loss": 0.0159,
+ "step": 31328
+ },
+ {
+ "epoch": 85.36512261580381,
+ "grad_norm": 1.4271363019943237,
+ "learning_rate": 1.1024484745753271e-06,
+ "loss": 0.0206,
+ "step": 31329
+ },
+ {
+ "epoch": 85.36784741144415,
+ "grad_norm": 1.773149847984314,
+ "learning_rate": 1.1020457050195833e-06,
+ "loss": 0.0202,
+ "step": 31330
+ },
+ {
+ "epoch": 85.37057220708446,
+ "grad_norm": 2.0291876792907715,
+ "learning_rate": 1.1016430047608218e-06,
+ "loss": 0.1331,
+ "step": 31331
+ },
+ {
+ "epoch": 85.3732970027248,
+ "grad_norm": 3.2120614051818848,
+ "learning_rate": 1.1012403738021793e-06,
+ "loss": 0.0467,
+ "step": 31332
+ },
+ {
+ "epoch": 85.37602179836512,
+ "grad_norm": 2.912571668624878,
+ "learning_rate": 1.10083781214679e-06,
+ "loss": 0.114,
+ "step": 31333
+ },
+ {
+ "epoch": 85.37874659400545,
+ "grad_norm": 2.736415386199951,
+ "learning_rate": 1.1004353197977869e-06,
+ "loss": 0.0289,
+ "step": 31334
+ },
+ {
+ "epoch": 85.38147138964578,
+ "grad_norm": 2.302786111831665,
+ "learning_rate": 1.1000328967583096e-06,
+ "loss": 0.0355,
+ "step": 31335
+ },
+ {
+ "epoch": 85.3841961852861,
+ "grad_norm": 3.136418104171753,
+ "learning_rate": 1.099630543031489e-06,
+ "loss": 0.1011,
+ "step": 31336
+ },
+ {
+ "epoch": 85.38692098092643,
+ "grad_norm": 2.4176077842712402,
+ "learning_rate": 1.0992282586204605e-06,
+ "loss": 0.023,
+ "step": 31337
+ },
+ {
+ "epoch": 85.38964577656675,
+ "grad_norm": 2.6242637634277344,
+ "learning_rate": 1.0988260435283526e-06,
+ "loss": 0.0296,
+ "step": 31338
+ },
+ {
+ "epoch": 85.39237057220708,
+ "grad_norm": 2.302511215209961,
+ "learning_rate": 1.098423897758304e-06,
+ "loss": 0.0217,
+ "step": 31339
+ },
+ {
+ "epoch": 85.39509536784742,
+ "grad_norm": 2.617093801498413,
+ "learning_rate": 1.098021821313443e-06,
+ "loss": 0.0621,
+ "step": 31340
+ },
+ {
+ "epoch": 85.39782016348774,
+ "grad_norm": 4.201938152313232,
+ "learning_rate": 1.0976198141968998e-06,
+ "loss": 0.0968,
+ "step": 31341
+ },
+ {
+ "epoch": 85.40054495912807,
+ "grad_norm": 2.8996481895446777,
+ "learning_rate": 1.097217876411808e-06,
+ "loss": 0.05,
+ "step": 31342
+ },
+ {
+ "epoch": 85.40326975476839,
+ "grad_norm": 5.1527557373046875,
+ "learning_rate": 1.0968160079612966e-06,
+ "loss": 0.1267,
+ "step": 31343
+ },
+ {
+ "epoch": 85.40599455040872,
+ "grad_norm": 2.3500819206237793,
+ "learning_rate": 1.0964142088484963e-06,
+ "loss": 0.0312,
+ "step": 31344
+ },
+ {
+ "epoch": 85.40871934604904,
+ "grad_norm": 2.4018545150756836,
+ "learning_rate": 1.0960124790765358e-06,
+ "loss": 0.0482,
+ "step": 31345
+ },
+ {
+ "epoch": 85.41144414168937,
+ "grad_norm": 3.214704751968384,
+ "learning_rate": 1.0956108186485414e-06,
+ "loss": 0.0484,
+ "step": 31346
+ },
+ {
+ "epoch": 85.4141689373297,
+ "grad_norm": 2.7772579193115234,
+ "learning_rate": 1.0952092275676461e-06,
+ "loss": 0.1192,
+ "step": 31347
+ },
+ {
+ "epoch": 85.41689373297002,
+ "grad_norm": 9.122698783874512,
+ "learning_rate": 1.0948077058369744e-06,
+ "loss": 0.0257,
+ "step": 31348
+ },
+ {
+ "epoch": 85.41961852861036,
+ "grad_norm": 2.5185344219207764,
+ "learning_rate": 1.0944062534596534e-06,
+ "loss": 0.0297,
+ "step": 31349
+ },
+ {
+ "epoch": 85.42234332425068,
+ "grad_norm": 2.5750045776367188,
+ "learning_rate": 1.0940048704388085e-06,
+ "loss": 0.1198,
+ "step": 31350
+ },
+ {
+ "epoch": 85.42506811989101,
+ "grad_norm": 2.800236701965332,
+ "learning_rate": 1.0936035567775682e-06,
+ "loss": 0.0509,
+ "step": 31351
+ },
+ {
+ "epoch": 85.42779291553134,
+ "grad_norm": 3.1607398986816406,
+ "learning_rate": 1.093202312479057e-06,
+ "loss": 0.0387,
+ "step": 31352
+ },
+ {
+ "epoch": 85.43051771117166,
+ "grad_norm": 3.0872299671173096,
+ "learning_rate": 1.0928011375464e-06,
+ "loss": 0.0855,
+ "step": 31353
+ },
+ {
+ "epoch": 85.433242506812,
+ "grad_norm": 4.9866766929626465,
+ "learning_rate": 1.0924000319827189e-06,
+ "loss": 0.0336,
+ "step": 31354
+ },
+ {
+ "epoch": 85.43596730245231,
+ "grad_norm": 2.2867190837860107,
+ "learning_rate": 1.0919989957911414e-06,
+ "loss": 0.093,
+ "step": 31355
+ },
+ {
+ "epoch": 85.43869209809264,
+ "grad_norm": 2.031414270401001,
+ "learning_rate": 1.0915980289747885e-06,
+ "loss": 0.1001,
+ "step": 31356
+ },
+ {
+ "epoch": 85.44141689373296,
+ "grad_norm": 3.1889355182647705,
+ "learning_rate": 1.0911971315367842e-06,
+ "loss": 0.0287,
+ "step": 31357
+ },
+ {
+ "epoch": 85.4441416893733,
+ "grad_norm": 1.4479886293411255,
+ "learning_rate": 1.0907963034802472e-06,
+ "loss": 0.0231,
+ "step": 31358
+ },
+ {
+ "epoch": 85.44686648501363,
+ "grad_norm": 2.1521711349487305,
+ "learning_rate": 1.0903955448083025e-06,
+ "loss": 0.0507,
+ "step": 31359
+ },
+ {
+ "epoch": 85.44959128065395,
+ "grad_norm": 2.2834932804107666,
+ "learning_rate": 1.0899948555240724e-06,
+ "loss": 0.0745,
+ "step": 31360
+ },
+ {
+ "epoch": 85.45231607629428,
+ "grad_norm": 3.421525239944458,
+ "learning_rate": 1.0895942356306754e-06,
+ "loss": 0.0495,
+ "step": 31361
+ },
+ {
+ "epoch": 85.4550408719346,
+ "grad_norm": 3.9137887954711914,
+ "learning_rate": 1.0891936851312325e-06,
+ "loss": 0.0602,
+ "step": 31362
+ },
+ {
+ "epoch": 85.45776566757493,
+ "grad_norm": 2.5682373046875,
+ "learning_rate": 1.0887932040288597e-06,
+ "loss": 0.0656,
+ "step": 31363
+ },
+ {
+ "epoch": 85.46049046321527,
+ "grad_norm": 2.6598455905914307,
+ "learning_rate": 1.0883927923266813e-06,
+ "loss": 0.1311,
+ "step": 31364
+ },
+ {
+ "epoch": 85.46321525885558,
+ "grad_norm": 2.747976541519165,
+ "learning_rate": 1.0879924500278116e-06,
+ "loss": 0.0326,
+ "step": 31365
+ },
+ {
+ "epoch": 85.46594005449592,
+ "grad_norm": 1.0858652591705322,
+ "learning_rate": 1.0875921771353714e-06,
+ "loss": 0.0143,
+ "step": 31366
+ },
+ {
+ "epoch": 85.46866485013624,
+ "grad_norm": 5.205644607543945,
+ "learning_rate": 1.0871919736524739e-06,
+ "loss": 0.0232,
+ "step": 31367
+ },
+ {
+ "epoch": 85.47138964577657,
+ "grad_norm": 2.80965256690979,
+ "learning_rate": 1.0867918395822397e-06,
+ "loss": 0.0311,
+ "step": 31368
+ },
+ {
+ "epoch": 85.47411444141689,
+ "grad_norm": 1.7131377458572388,
+ "learning_rate": 1.0863917749277852e-06,
+ "loss": 0.1043,
+ "step": 31369
+ },
+ {
+ "epoch": 85.47683923705722,
+ "grad_norm": 2.595020055770874,
+ "learning_rate": 1.0859917796922216e-06,
+ "loss": 0.0878,
+ "step": 31370
+ },
+ {
+ "epoch": 85.47956403269755,
+ "grad_norm": 1.2756234407424927,
+ "learning_rate": 1.0855918538786692e-06,
+ "loss": 0.0158,
+ "step": 31371
+ },
+ {
+ "epoch": 85.48228882833787,
+ "grad_norm": 2.4362616539001465,
+ "learning_rate": 1.0851919974902403e-06,
+ "loss": 0.027,
+ "step": 31372
+ },
+ {
+ "epoch": 85.4850136239782,
+ "grad_norm": 5.21702241897583,
+ "learning_rate": 1.0847922105300502e-06,
+ "loss": 0.0666,
+ "step": 31373
+ },
+ {
+ "epoch": 85.48773841961852,
+ "grad_norm": 2.4590508937835693,
+ "learning_rate": 1.0843924930012084e-06,
+ "loss": 0.1561,
+ "step": 31374
+ },
+ {
+ "epoch": 85.49046321525886,
+ "grad_norm": 2.4573071002960205,
+ "learning_rate": 1.0839928449068316e-06,
+ "loss": 0.0404,
+ "step": 31375
+ },
+ {
+ "epoch": 85.49318801089919,
+ "grad_norm": 4.320873737335205,
+ "learning_rate": 1.0835932662500338e-06,
+ "loss": 0.0459,
+ "step": 31376
+ },
+ {
+ "epoch": 85.49591280653951,
+ "grad_norm": 2.13910174369812,
+ "learning_rate": 1.0831937570339247e-06,
+ "loss": 0.0344,
+ "step": 31377
+ },
+ {
+ "epoch": 85.49863760217984,
+ "grad_norm": 2.389197826385498,
+ "learning_rate": 1.082794317261615e-06,
+ "loss": 0.0988,
+ "step": 31378
+ },
+ {
+ "epoch": 85.50136239782016,
+ "grad_norm": 2.4774317741394043,
+ "learning_rate": 1.0823949469362138e-06,
+ "loss": 0.1,
+ "step": 31379
+ },
+ {
+ "epoch": 85.50408719346049,
+ "grad_norm": 2.9944775104522705,
+ "learning_rate": 1.081995646060836e-06,
+ "loss": 0.041,
+ "step": 31380
+ },
+ {
+ "epoch": 85.50681198910081,
+ "grad_norm": 4.310959339141846,
+ "learning_rate": 1.0815964146385894e-06,
+ "loss": 0.0392,
+ "step": 31381
+ },
+ {
+ "epoch": 85.50953678474114,
+ "grad_norm": 2.6893749237060547,
+ "learning_rate": 1.0811972526725834e-06,
+ "loss": 0.0374,
+ "step": 31382
+ },
+ {
+ "epoch": 85.51226158038148,
+ "grad_norm": 2.7266385555267334,
+ "learning_rate": 1.0807981601659234e-06,
+ "loss": 0.0927,
+ "step": 31383
+ },
+ {
+ "epoch": 85.5149863760218,
+ "grad_norm": 2.57831072807312,
+ "learning_rate": 1.0803991371217227e-06,
+ "loss": 0.0374,
+ "step": 31384
+ },
+ {
+ "epoch": 85.51771117166213,
+ "grad_norm": 5.09738302230835,
+ "learning_rate": 1.0800001835430861e-06,
+ "loss": 0.0845,
+ "step": 31385
+ },
+ {
+ "epoch": 85.52043596730245,
+ "grad_norm": 2.6946308612823486,
+ "learning_rate": 1.0796012994331207e-06,
+ "loss": 0.0717,
+ "step": 31386
+ },
+ {
+ "epoch": 85.52316076294278,
+ "grad_norm": 2.0716943740844727,
+ "learning_rate": 1.0792024847949323e-06,
+ "loss": 0.0296,
+ "step": 31387
+ },
+ {
+ "epoch": 85.52588555858311,
+ "grad_norm": 2.4201676845550537,
+ "learning_rate": 1.0788037396316287e-06,
+ "loss": 0.0241,
+ "step": 31388
+ },
+ {
+ "epoch": 85.52861035422343,
+ "grad_norm": 2.9360971450805664,
+ "learning_rate": 1.0784050639463151e-06,
+ "loss": 0.0445,
+ "step": 31389
+ },
+ {
+ "epoch": 85.53133514986376,
+ "grad_norm": 2.013364791870117,
+ "learning_rate": 1.0780064577420935e-06,
+ "loss": 0.0189,
+ "step": 31390
+ },
+ {
+ "epoch": 85.53405994550408,
+ "grad_norm": 3.436640977859497,
+ "learning_rate": 1.0776079210220725e-06,
+ "loss": 0.1096,
+ "step": 31391
+ },
+ {
+ "epoch": 85.53678474114442,
+ "grad_norm": 2.0758986473083496,
+ "learning_rate": 1.0772094537893518e-06,
+ "loss": 0.0638,
+ "step": 31392
+ },
+ {
+ "epoch": 85.53950953678473,
+ "grad_norm": 4.707724094390869,
+ "learning_rate": 1.076811056047039e-06,
+ "loss": 0.0671,
+ "step": 31393
+ },
+ {
+ "epoch": 85.54223433242507,
+ "grad_norm": 2.8454244136810303,
+ "learning_rate": 1.076412727798234e-06,
+ "loss": 0.1167,
+ "step": 31394
+ },
+ {
+ "epoch": 85.5449591280654,
+ "grad_norm": 2.417797565460205,
+ "learning_rate": 1.0760144690460384e-06,
+ "loss": 0.0767,
+ "step": 31395
+ },
+ {
+ "epoch": 85.54768392370572,
+ "grad_norm": 1.9386225938796997,
+ "learning_rate": 1.0756162797935555e-06,
+ "loss": 0.1134,
+ "step": 31396
+ },
+ {
+ "epoch": 85.55040871934605,
+ "grad_norm": 2.14420485496521,
+ "learning_rate": 1.0752181600438872e-06,
+ "loss": 0.2065,
+ "step": 31397
+ },
+ {
+ "epoch": 85.55313351498637,
+ "grad_norm": 2.394150733947754,
+ "learning_rate": 1.0748201098001322e-06,
+ "loss": 0.0452,
+ "step": 31398
+ },
+ {
+ "epoch": 85.5558583106267,
+ "grad_norm": 2.4033522605895996,
+ "learning_rate": 1.0744221290653877e-06,
+ "loss": 0.1661,
+ "step": 31399
+ },
+ {
+ "epoch": 85.55858310626704,
+ "grad_norm": 2.9644079208374023,
+ "learning_rate": 1.0740242178427595e-06,
+ "loss": 0.028,
+ "step": 31400
+ },
+ {
+ "epoch": 85.56130790190736,
+ "grad_norm": 2.385225534439087,
+ "learning_rate": 1.0736263761353437e-06,
+ "loss": 0.1234,
+ "step": 31401
+ },
+ {
+ "epoch": 85.56403269754769,
+ "grad_norm": 3.1157336235046387,
+ "learning_rate": 1.0732286039462381e-06,
+ "loss": 0.1483,
+ "step": 31402
+ },
+ {
+ "epoch": 85.566757493188,
+ "grad_norm": 1.2751082181930542,
+ "learning_rate": 1.0728309012785386e-06,
+ "loss": 0.0175,
+ "step": 31403
+ },
+ {
+ "epoch": 85.56948228882834,
+ "grad_norm": 2.8085267543792725,
+ "learning_rate": 1.0724332681353466e-06,
+ "loss": 0.0617,
+ "step": 31404
+ },
+ {
+ "epoch": 85.57220708446866,
+ "grad_norm": 3.7019472122192383,
+ "learning_rate": 1.0720357045197572e-06,
+ "loss": 0.0338,
+ "step": 31405
+ },
+ {
+ "epoch": 85.57493188010899,
+ "grad_norm": 2.4826486110687256,
+ "learning_rate": 1.0716382104348667e-06,
+ "loss": 0.0442,
+ "step": 31406
+ },
+ {
+ "epoch": 85.57765667574932,
+ "grad_norm": 4.046591758728027,
+ "learning_rate": 1.0712407858837682e-06,
+ "loss": 0.0831,
+ "step": 31407
+ },
+ {
+ "epoch": 85.58038147138964,
+ "grad_norm": 5.646476745605469,
+ "learning_rate": 1.0708434308695604e-06,
+ "loss": 0.0908,
+ "step": 31408
+ },
+ {
+ "epoch": 85.58310626702998,
+ "grad_norm": 3.560476064682007,
+ "learning_rate": 1.0704461453953373e-06,
+ "loss": 0.0964,
+ "step": 31409
+ },
+ {
+ "epoch": 85.5858310626703,
+ "grad_norm": 2.3625431060791016,
+ "learning_rate": 1.0700489294641902e-06,
+ "loss": 0.0346,
+ "step": 31410
+ },
+ {
+ "epoch": 85.58855585831063,
+ "grad_norm": 2.201275587081909,
+ "learning_rate": 1.0696517830792141e-06,
+ "loss": 0.0345,
+ "step": 31411
+ },
+ {
+ "epoch": 85.59128065395096,
+ "grad_norm": 2.2521026134490967,
+ "learning_rate": 1.0692547062435056e-06,
+ "loss": 0.0264,
+ "step": 31412
+ },
+ {
+ "epoch": 85.59400544959128,
+ "grad_norm": 2.509371519088745,
+ "learning_rate": 1.0688576989601528e-06,
+ "loss": 0.058,
+ "step": 31413
+ },
+ {
+ "epoch": 85.59673024523161,
+ "grad_norm": 2.8696141242980957,
+ "learning_rate": 1.0684607612322495e-06,
+ "loss": 0.0323,
+ "step": 31414
+ },
+ {
+ "epoch": 85.59945504087193,
+ "grad_norm": 2.570969581604004,
+ "learning_rate": 1.068063893062884e-06,
+ "loss": 0.0933,
+ "step": 31415
+ },
+ {
+ "epoch": 85.60217983651226,
+ "grad_norm": 1.7264670133590698,
+ "learning_rate": 1.0676670944551515e-06,
+ "loss": 0.043,
+ "step": 31416
+ },
+ {
+ "epoch": 85.60490463215258,
+ "grad_norm": 6.297112941741943,
+ "learning_rate": 1.0672703654121407e-06,
+ "loss": 0.1358,
+ "step": 31417
+ },
+ {
+ "epoch": 85.60762942779292,
+ "grad_norm": 2.092822790145874,
+ "learning_rate": 1.0668737059369405e-06,
+ "loss": 0.0234,
+ "step": 31418
+ },
+ {
+ "epoch": 85.61035422343325,
+ "grad_norm": 3.4409234523773193,
+ "learning_rate": 1.0664771160326382e-06,
+ "loss": 0.0609,
+ "step": 31419
+ },
+ {
+ "epoch": 85.61307901907357,
+ "grad_norm": 2.049858808517456,
+ "learning_rate": 1.0660805957023268e-06,
+ "loss": 0.0202,
+ "step": 31420
+ },
+ {
+ "epoch": 85.6158038147139,
+ "grad_norm": 2.0648813247680664,
+ "learning_rate": 1.0656841449490918e-06,
+ "loss": 0.0257,
+ "step": 31421
+ },
+ {
+ "epoch": 85.61852861035422,
+ "grad_norm": 1.8562856912612915,
+ "learning_rate": 1.0652877637760217e-06,
+ "loss": 0.0251,
+ "step": 31422
+ },
+ {
+ "epoch": 85.62125340599455,
+ "grad_norm": 3.5806736946105957,
+ "learning_rate": 1.0648914521862008e-06,
+ "loss": 0.03,
+ "step": 31423
+ },
+ {
+ "epoch": 85.62397820163488,
+ "grad_norm": 3.132786273956299,
+ "learning_rate": 1.064495210182719e-06,
+ "loss": 0.0504,
+ "step": 31424
+ },
+ {
+ "epoch": 85.6267029972752,
+ "grad_norm": 2.8375136852264404,
+ "learning_rate": 1.0640990377686611e-06,
+ "loss": 0.0466,
+ "step": 31425
+ },
+ {
+ "epoch": 85.62942779291554,
+ "grad_norm": 2.8802056312561035,
+ "learning_rate": 1.0637029349471128e-06,
+ "loss": 0.0393,
+ "step": 31426
+ },
+ {
+ "epoch": 85.63215258855585,
+ "grad_norm": 2.7082021236419678,
+ "learning_rate": 1.0633069017211562e-06,
+ "loss": 0.0581,
+ "step": 31427
+ },
+ {
+ "epoch": 85.63487738419619,
+ "grad_norm": 2.3465468883514404,
+ "learning_rate": 1.0629109380938785e-06,
+ "loss": 0.0419,
+ "step": 31428
+ },
+ {
+ "epoch": 85.6376021798365,
+ "grad_norm": 3.680985927581787,
+ "learning_rate": 1.062515044068364e-06,
+ "loss": 0.0239,
+ "step": 31429
+ },
+ {
+ "epoch": 85.64032697547684,
+ "grad_norm": 4.25960636138916,
+ "learning_rate": 1.0621192196476949e-06,
+ "loss": 0.0475,
+ "step": 31430
+ },
+ {
+ "epoch": 85.64305177111717,
+ "grad_norm": 2.498424530029297,
+ "learning_rate": 1.0617234648349506e-06,
+ "loss": 0.0728,
+ "step": 31431
+ },
+ {
+ "epoch": 85.64577656675749,
+ "grad_norm": 3.0986287593841553,
+ "learning_rate": 1.06132777963322e-06,
+ "loss": 0.096,
+ "step": 31432
+ },
+ {
+ "epoch": 85.64850136239782,
+ "grad_norm": 2.214416265487671,
+ "learning_rate": 1.0609321640455793e-06,
+ "loss": 0.0566,
+ "step": 31433
+ },
+ {
+ "epoch": 85.65122615803814,
+ "grad_norm": 1.5452136993408203,
+ "learning_rate": 1.060536618075113e-06,
+ "loss": 0.0215,
+ "step": 31434
+ },
+ {
+ "epoch": 85.65395095367847,
+ "grad_norm": 4.361598014831543,
+ "learning_rate": 1.0601411417248964e-06,
+ "loss": 0.0395,
+ "step": 31435
+ },
+ {
+ "epoch": 85.65667574931881,
+ "grad_norm": 3.358471393585205,
+ "learning_rate": 1.0597457349980156e-06,
+ "loss": 0.0562,
+ "step": 31436
+ },
+ {
+ "epoch": 85.65940054495913,
+ "grad_norm": 2.2020375728607178,
+ "learning_rate": 1.0593503978975472e-06,
+ "loss": 0.0899,
+ "step": 31437
+ },
+ {
+ "epoch": 85.66212534059946,
+ "grad_norm": 3.1154308319091797,
+ "learning_rate": 1.05895513042657e-06,
+ "loss": 0.0459,
+ "step": 31438
+ },
+ {
+ "epoch": 85.66485013623978,
+ "grad_norm": 2.8388190269470215,
+ "learning_rate": 1.0585599325881602e-06,
+ "loss": 0.032,
+ "step": 31439
+ },
+ {
+ "epoch": 85.66757493188011,
+ "grad_norm": 2.577883005142212,
+ "learning_rate": 1.0581648043853999e-06,
+ "loss": 0.0281,
+ "step": 31440
+ },
+ {
+ "epoch": 85.67029972752043,
+ "grad_norm": 3.873203754425049,
+ "learning_rate": 1.0577697458213654e-06,
+ "loss": 0.0652,
+ "step": 31441
+ },
+ {
+ "epoch": 85.67302452316076,
+ "grad_norm": 4.001662731170654,
+ "learning_rate": 1.0573747568991311e-06,
+ "loss": 0.0791,
+ "step": 31442
+ },
+ {
+ "epoch": 85.6757493188011,
+ "grad_norm": 3.218181610107422,
+ "learning_rate": 1.0569798376217722e-06,
+ "loss": 0.1775,
+ "step": 31443
+ },
+ {
+ "epoch": 85.67847411444141,
+ "grad_norm": 1.7833396196365356,
+ "learning_rate": 1.0565849879923673e-06,
+ "loss": 0.0236,
+ "step": 31444
+ },
+ {
+ "epoch": 85.68119891008175,
+ "grad_norm": 3.1455492973327637,
+ "learning_rate": 1.056190208013993e-06,
+ "loss": 0.0829,
+ "step": 31445
+ },
+ {
+ "epoch": 85.68392370572207,
+ "grad_norm": 3.2898142337799072,
+ "learning_rate": 1.05579549768972e-06,
+ "loss": 0.037,
+ "step": 31446
+ },
+ {
+ "epoch": 85.6866485013624,
+ "grad_norm": 1.9134249687194824,
+ "learning_rate": 1.0554008570226248e-06,
+ "loss": 0.0781,
+ "step": 31447
+ },
+ {
+ "epoch": 85.68937329700273,
+ "grad_norm": 4.054567337036133,
+ "learning_rate": 1.0550062860157783e-06,
+ "loss": 0.0599,
+ "step": 31448
+ },
+ {
+ "epoch": 85.69209809264305,
+ "grad_norm": 2.6702451705932617,
+ "learning_rate": 1.054611784672256e-06,
+ "loss": 0.0755,
+ "step": 31449
+ },
+ {
+ "epoch": 85.69482288828338,
+ "grad_norm": 1.6346731185913086,
+ "learning_rate": 1.0542173529951293e-06,
+ "loss": 0.0677,
+ "step": 31450
+ },
+ {
+ "epoch": 85.6975476839237,
+ "grad_norm": 4.656773090362549,
+ "learning_rate": 1.053822990987471e-06,
+ "loss": 0.1542,
+ "step": 31451
+ },
+ {
+ "epoch": 85.70027247956403,
+ "grad_norm": 1.8992481231689453,
+ "learning_rate": 1.053428698652349e-06,
+ "loss": 0.0555,
+ "step": 31452
+ },
+ {
+ "epoch": 85.70299727520435,
+ "grad_norm": 2.108342409133911,
+ "learning_rate": 1.0530344759928369e-06,
+ "loss": 0.0293,
+ "step": 31453
+ },
+ {
+ "epoch": 85.70572207084469,
+ "grad_norm": 2.579798460006714,
+ "learning_rate": 1.0526403230120064e-06,
+ "loss": 0.0406,
+ "step": 31454
+ },
+ {
+ "epoch": 85.70844686648502,
+ "grad_norm": 3.2917730808258057,
+ "learning_rate": 1.0522462397129218e-06,
+ "loss": 0.0213,
+ "step": 31455
+ },
+ {
+ "epoch": 85.71117166212534,
+ "grad_norm": 2.3854780197143555,
+ "learning_rate": 1.0518522260986575e-06,
+ "loss": 0.0296,
+ "step": 31456
+ },
+ {
+ "epoch": 85.71389645776567,
+ "grad_norm": 3.2360236644744873,
+ "learning_rate": 1.0514582821722807e-06,
+ "loss": 0.1155,
+ "step": 31457
+ },
+ {
+ "epoch": 85.71662125340599,
+ "grad_norm": 2.146756172180176,
+ "learning_rate": 1.0510644079368582e-06,
+ "loss": 0.0276,
+ "step": 31458
+ },
+ {
+ "epoch": 85.71934604904632,
+ "grad_norm": 2.608949899673462,
+ "learning_rate": 1.0506706033954561e-06,
+ "loss": 0.0243,
+ "step": 31459
+ },
+ {
+ "epoch": 85.72207084468666,
+ "grad_norm": 2.1771044731140137,
+ "learning_rate": 1.0502768685511456e-06,
+ "loss": 0.049,
+ "step": 31460
+ },
+ {
+ "epoch": 85.72479564032697,
+ "grad_norm": 1.8936131000518799,
+ "learning_rate": 1.0498832034069884e-06,
+ "loss": 0.0223,
+ "step": 31461
+ },
+ {
+ "epoch": 85.7275204359673,
+ "grad_norm": 3.245781660079956,
+ "learning_rate": 1.0494896079660554e-06,
+ "loss": 0.0338,
+ "step": 31462
+ },
+ {
+ "epoch": 85.73024523160763,
+ "grad_norm": 2.8010880947113037,
+ "learning_rate": 1.049096082231409e-06,
+ "loss": 0.0592,
+ "step": 31463
+ },
+ {
+ "epoch": 85.73297002724796,
+ "grad_norm": 2.7403125762939453,
+ "learning_rate": 1.0487026262061117e-06,
+ "loss": 0.0214,
+ "step": 31464
+ },
+ {
+ "epoch": 85.73569482288828,
+ "grad_norm": 1.6857712268829346,
+ "learning_rate": 1.0483092398932326e-06,
+ "loss": 0.0805,
+ "step": 31465
+ },
+ {
+ "epoch": 85.73841961852861,
+ "grad_norm": 2.862874746322632,
+ "learning_rate": 1.0479159232958337e-06,
+ "loss": 0.1347,
+ "step": 31466
+ },
+ {
+ "epoch": 85.74114441416894,
+ "grad_norm": 1.8531434535980225,
+ "learning_rate": 1.0475226764169766e-06,
+ "loss": 0.0612,
+ "step": 31467
+ },
+ {
+ "epoch": 85.74386920980926,
+ "grad_norm": 2.6498937606811523,
+ "learning_rate": 1.0471294992597237e-06,
+ "loss": 0.0293,
+ "step": 31468
+ },
+ {
+ "epoch": 85.7465940054496,
+ "grad_norm": 1.5940945148468018,
+ "learning_rate": 1.046736391827139e-06,
+ "loss": 0.0169,
+ "step": 31469
+ },
+ {
+ "epoch": 85.74931880108991,
+ "grad_norm": 3.2719297409057617,
+ "learning_rate": 1.0463433541222834e-06,
+ "loss": 0.0893,
+ "step": 31470
+ },
+ {
+ "epoch": 85.75204359673025,
+ "grad_norm": 3.037069082260132,
+ "learning_rate": 1.0459503861482179e-06,
+ "loss": 0.036,
+ "step": 31471
+ },
+ {
+ "epoch": 85.75476839237058,
+ "grad_norm": 2.491203546524048,
+ "learning_rate": 1.0455574879079999e-06,
+ "loss": 0.05,
+ "step": 31472
+ },
+ {
+ "epoch": 85.7574931880109,
+ "grad_norm": 3.3718345165252686,
+ "learning_rate": 1.045164659404695e-06,
+ "loss": 0.1023,
+ "step": 31473
+ },
+ {
+ "epoch": 85.76021798365123,
+ "grad_norm": 2.3489160537719727,
+ "learning_rate": 1.0447719006413592e-06,
+ "loss": 0.0719,
+ "step": 31474
+ },
+ {
+ "epoch": 85.76294277929155,
+ "grad_norm": 4.1013383865356445,
+ "learning_rate": 1.0443792116210515e-06,
+ "loss": 0.0478,
+ "step": 31475
+ },
+ {
+ "epoch": 85.76566757493188,
+ "grad_norm": 2.5753602981567383,
+ "learning_rate": 1.0439865923468284e-06,
+ "loss": 0.0389,
+ "step": 31476
+ },
+ {
+ "epoch": 85.7683923705722,
+ "grad_norm": 2.968282461166382,
+ "learning_rate": 1.0435940428217516e-06,
+ "loss": 0.0492,
+ "step": 31477
+ },
+ {
+ "epoch": 85.77111716621253,
+ "grad_norm": 3.0301930904388428,
+ "learning_rate": 1.0432015630488756e-06,
+ "loss": 0.0941,
+ "step": 31478
+ },
+ {
+ "epoch": 85.77384196185287,
+ "grad_norm": 2.6919567584991455,
+ "learning_rate": 1.0428091530312556e-06,
+ "loss": 0.0448,
+ "step": 31479
+ },
+ {
+ "epoch": 85.77656675749319,
+ "grad_norm": 2.990431785583496,
+ "learning_rate": 1.0424168127719502e-06,
+ "loss": 0.2594,
+ "step": 31480
+ },
+ {
+ "epoch": 85.77929155313352,
+ "grad_norm": 3.8211493492126465,
+ "learning_rate": 1.042024542274016e-06,
+ "loss": 0.0489,
+ "step": 31481
+ },
+ {
+ "epoch": 85.78201634877384,
+ "grad_norm": 2.424978017807007,
+ "learning_rate": 1.0416323415405061e-06,
+ "loss": 0.1753,
+ "step": 31482
+ },
+ {
+ "epoch": 85.78474114441417,
+ "grad_norm": 2.314209222793579,
+ "learning_rate": 1.0412402105744756e-06,
+ "loss": 0.0315,
+ "step": 31483
+ },
+ {
+ "epoch": 85.7874659400545,
+ "grad_norm": 3.6571786403656006,
+ "learning_rate": 1.0408481493789758e-06,
+ "loss": 0.1508,
+ "step": 31484
+ },
+ {
+ "epoch": 85.79019073569482,
+ "grad_norm": 2.1805782318115234,
+ "learning_rate": 1.040456157957065e-06,
+ "loss": 0.0235,
+ "step": 31485
+ },
+ {
+ "epoch": 85.79291553133515,
+ "grad_norm": 2.3275468349456787,
+ "learning_rate": 1.0400642363117918e-06,
+ "loss": 0.0294,
+ "step": 31486
+ },
+ {
+ "epoch": 85.79564032697547,
+ "grad_norm": 2.6586239337921143,
+ "learning_rate": 1.039672384446211e-06,
+ "loss": 0.0275,
+ "step": 31487
+ },
+ {
+ "epoch": 85.7983651226158,
+ "grad_norm": 2.1028189659118652,
+ "learning_rate": 1.0392806023633717e-06,
+ "loss": 0.0388,
+ "step": 31488
+ },
+ {
+ "epoch": 85.80108991825612,
+ "grad_norm": 2.2674365043640137,
+ "learning_rate": 1.0388888900663274e-06,
+ "loss": 0.1472,
+ "step": 31489
+ },
+ {
+ "epoch": 85.80381471389646,
+ "grad_norm": 3.2275967597961426,
+ "learning_rate": 1.038497247558129e-06,
+ "loss": 0.0364,
+ "step": 31490
+ },
+ {
+ "epoch": 85.80653950953679,
+ "grad_norm": 2.492194652557373,
+ "learning_rate": 1.038105674841825e-06,
+ "loss": 0.0705,
+ "step": 31491
+ },
+ {
+ "epoch": 85.80926430517711,
+ "grad_norm": 2.9958271980285645,
+ "learning_rate": 1.0377141719204642e-06,
+ "loss": 0.2088,
+ "step": 31492
+ },
+ {
+ "epoch": 85.81198910081744,
+ "grad_norm": 2.5424046516418457,
+ "learning_rate": 1.0373227387970986e-06,
+ "loss": 0.027,
+ "step": 31493
+ },
+ {
+ "epoch": 85.81471389645776,
+ "grad_norm": 2.828305959701538,
+ "learning_rate": 1.0369313754747744e-06,
+ "loss": 0.076,
+ "step": 31494
+ },
+ {
+ "epoch": 85.8174386920981,
+ "grad_norm": 2.2557549476623535,
+ "learning_rate": 1.0365400819565407e-06,
+ "loss": 0.0321,
+ "step": 31495
+ },
+ {
+ "epoch": 85.82016348773843,
+ "grad_norm": 2.285198926925659,
+ "learning_rate": 1.0361488582454404e-06,
+ "loss": 0.069,
+ "step": 31496
+ },
+ {
+ "epoch": 85.82288828337875,
+ "grad_norm": 3.4394943714141846,
+ "learning_rate": 1.0357577043445287e-06,
+ "loss": 0.0373,
+ "step": 31497
+ },
+ {
+ "epoch": 85.82561307901908,
+ "grad_norm": 2.6939773559570312,
+ "learning_rate": 1.0353666202568468e-06,
+ "loss": 0.0318,
+ "step": 31498
+ },
+ {
+ "epoch": 85.8283378746594,
+ "grad_norm": 3.18467378616333,
+ "learning_rate": 1.0349756059854421e-06,
+ "loss": 0.1026,
+ "step": 31499
+ },
+ {
+ "epoch": 85.83106267029973,
+ "grad_norm": 2.1771793365478516,
+ "learning_rate": 1.0345846615333565e-06,
+ "loss": 0.0364,
+ "step": 31500
+ },
+ {
+ "epoch": 85.83378746594005,
+ "grad_norm": 4.8560662269592285,
+ "learning_rate": 1.034193786903639e-06,
+ "loss": 0.1635,
+ "step": 31501
+ },
+ {
+ "epoch": 85.83651226158038,
+ "grad_norm": 2.727335214614868,
+ "learning_rate": 1.033802982099331e-06,
+ "loss": 0.0716,
+ "step": 31502
+ },
+ {
+ "epoch": 85.83923705722071,
+ "grad_norm": 2.5315072536468506,
+ "learning_rate": 1.0334122471234775e-06,
+ "loss": 0.1616,
+ "step": 31503
+ },
+ {
+ "epoch": 85.84196185286103,
+ "grad_norm": 2.0643715858459473,
+ "learning_rate": 1.033021581979118e-06,
+ "loss": 0.0664,
+ "step": 31504
+ },
+ {
+ "epoch": 85.84468664850137,
+ "grad_norm": 3.0063178539276123,
+ "learning_rate": 1.0326309866693007e-06,
+ "loss": 0.2104,
+ "step": 31505
+ },
+ {
+ "epoch": 85.84741144414168,
+ "grad_norm": 3.5163540840148926,
+ "learning_rate": 1.032240461197065e-06,
+ "loss": 0.0269,
+ "step": 31506
+ },
+ {
+ "epoch": 85.85013623978202,
+ "grad_norm": 2.4701731204986572,
+ "learning_rate": 1.0318500055654513e-06,
+ "loss": 0.0315,
+ "step": 31507
+ },
+ {
+ "epoch": 85.85286103542235,
+ "grad_norm": 3.7995245456695557,
+ "learning_rate": 1.0314596197774985e-06,
+ "loss": 0.1136,
+ "step": 31508
+ },
+ {
+ "epoch": 85.85558583106267,
+ "grad_norm": 2.90480375289917,
+ "learning_rate": 1.0310693038362518e-06,
+ "loss": 0.0612,
+ "step": 31509
+ },
+ {
+ "epoch": 85.858310626703,
+ "grad_norm": 2.6373202800750732,
+ "learning_rate": 1.03067905774475e-06,
+ "loss": 0.0476,
+ "step": 31510
+ },
+ {
+ "epoch": 85.86103542234332,
+ "grad_norm": 2.086611747741699,
+ "learning_rate": 1.0302888815060297e-06,
+ "loss": 0.0798,
+ "step": 31511
+ },
+ {
+ "epoch": 85.86376021798365,
+ "grad_norm": 2.0838420391082764,
+ "learning_rate": 1.0298987751231293e-06,
+ "loss": 0.0282,
+ "step": 31512
+ },
+ {
+ "epoch": 85.86648501362397,
+ "grad_norm": 2.5717296600341797,
+ "learning_rate": 1.0295087385990888e-06,
+ "loss": 0.2165,
+ "step": 31513
+ },
+ {
+ "epoch": 85.8692098092643,
+ "grad_norm": 4.200585842132568,
+ "learning_rate": 1.0291187719369466e-06,
+ "loss": 0.0344,
+ "step": 31514
+ },
+ {
+ "epoch": 85.87193460490464,
+ "grad_norm": 2.4633283615112305,
+ "learning_rate": 1.0287288751397395e-06,
+ "loss": 0.0529,
+ "step": 31515
+ },
+ {
+ "epoch": 85.87465940054496,
+ "grad_norm": 3.0095136165618896,
+ "learning_rate": 1.0283390482105037e-06,
+ "loss": 0.0295,
+ "step": 31516
+ },
+ {
+ "epoch": 85.87738419618529,
+ "grad_norm": 2.8084800243377686,
+ "learning_rate": 1.0279492911522714e-06,
+ "loss": 0.0425,
+ "step": 31517
+ },
+ {
+ "epoch": 85.88010899182561,
+ "grad_norm": 2.4964981079101562,
+ "learning_rate": 1.0275596039680835e-06,
+ "loss": 0.0404,
+ "step": 31518
+ },
+ {
+ "epoch": 85.88283378746594,
+ "grad_norm": 2.2275397777557373,
+ "learning_rate": 1.027169986660973e-06,
+ "loss": 0.0281,
+ "step": 31519
+ },
+ {
+ "epoch": 85.88555858310627,
+ "grad_norm": 2.452439785003662,
+ "learning_rate": 1.026780439233972e-06,
+ "loss": 0.0469,
+ "step": 31520
+ },
+ {
+ "epoch": 85.88828337874659,
+ "grad_norm": 2.2140159606933594,
+ "learning_rate": 1.026390961690118e-06,
+ "loss": 0.0178,
+ "step": 31521
+ },
+ {
+ "epoch": 85.89100817438693,
+ "grad_norm": 2.875448703765869,
+ "learning_rate": 1.026001554032443e-06,
+ "loss": 0.0587,
+ "step": 31522
+ },
+ {
+ "epoch": 85.89373297002724,
+ "grad_norm": 2.641120672225952,
+ "learning_rate": 1.025612216263978e-06,
+ "loss": 0.0683,
+ "step": 31523
+ },
+ {
+ "epoch": 85.89645776566758,
+ "grad_norm": 1.6421146392822266,
+ "learning_rate": 1.0252229483877551e-06,
+ "loss": 0.0227,
+ "step": 31524
+ },
+ {
+ "epoch": 85.8991825613079,
+ "grad_norm": 2.881132125854492,
+ "learning_rate": 1.0248337504068085e-06,
+ "loss": 0.0413,
+ "step": 31525
+ },
+ {
+ "epoch": 85.90190735694823,
+ "grad_norm": 2.6686294078826904,
+ "learning_rate": 1.0244446223241677e-06,
+ "loss": 0.0603,
+ "step": 31526
+ },
+ {
+ "epoch": 85.90463215258856,
+ "grad_norm": 1.8666067123413086,
+ "learning_rate": 1.024055564142863e-06,
+ "loss": 0.0174,
+ "step": 31527
+ },
+ {
+ "epoch": 85.90735694822888,
+ "grad_norm": 2.5336527824401855,
+ "learning_rate": 1.0236665758659237e-06,
+ "loss": 0.0888,
+ "step": 31528
+ },
+ {
+ "epoch": 85.91008174386921,
+ "grad_norm": 2.7427446842193604,
+ "learning_rate": 1.023277657496381e-06,
+ "loss": 0.0374,
+ "step": 31529
+ },
+ {
+ "epoch": 85.91280653950953,
+ "grad_norm": 2.498741388320923,
+ "learning_rate": 1.0228888090372613e-06,
+ "loss": 0.0218,
+ "step": 31530
+ },
+ {
+ "epoch": 85.91553133514986,
+ "grad_norm": 2.7943947315216064,
+ "learning_rate": 1.0225000304915977e-06,
+ "loss": 0.0419,
+ "step": 31531
+ },
+ {
+ "epoch": 85.9182561307902,
+ "grad_norm": 6.141363143920898,
+ "learning_rate": 1.0221113218624134e-06,
+ "loss": 0.1079,
+ "step": 31532
+ },
+ {
+ "epoch": 85.92098092643052,
+ "grad_norm": 2.3486995697021484,
+ "learning_rate": 1.021722683152736e-06,
+ "loss": 0.046,
+ "step": 31533
+ },
+ {
+ "epoch": 85.92370572207085,
+ "grad_norm": 2.334148645401001,
+ "learning_rate": 1.0213341143655952e-06,
+ "loss": 0.0354,
+ "step": 31534
+ },
+ {
+ "epoch": 85.92643051771117,
+ "grad_norm": 2.234052896499634,
+ "learning_rate": 1.0209456155040166e-06,
+ "loss": 0.1401,
+ "step": 31535
+ },
+ {
+ "epoch": 85.9291553133515,
+ "grad_norm": 5.003220558166504,
+ "learning_rate": 1.020557186571023e-06,
+ "loss": 0.0345,
+ "step": 31536
+ },
+ {
+ "epoch": 85.93188010899182,
+ "grad_norm": 2.0255320072174072,
+ "learning_rate": 1.0201688275696397e-06,
+ "loss": 0.0686,
+ "step": 31537
+ },
+ {
+ "epoch": 85.93460490463215,
+ "grad_norm": 2.026007652282715,
+ "learning_rate": 1.0197805385028935e-06,
+ "loss": 0.0272,
+ "step": 31538
+ },
+ {
+ "epoch": 85.93732970027249,
+ "grad_norm": 2.777132749557495,
+ "learning_rate": 1.0193923193738087e-06,
+ "loss": 0.045,
+ "step": 31539
+ },
+ {
+ "epoch": 85.9400544959128,
+ "grad_norm": 2.49111008644104,
+ "learning_rate": 1.019004170185407e-06,
+ "loss": 0.0387,
+ "step": 31540
+ },
+ {
+ "epoch": 85.94277929155314,
+ "grad_norm": 2.2162814140319824,
+ "learning_rate": 1.0186160909407095e-06,
+ "loss": 0.0233,
+ "step": 31541
+ },
+ {
+ "epoch": 85.94550408719346,
+ "grad_norm": 2.7575600147247314,
+ "learning_rate": 1.0182280816427436e-06,
+ "loss": 0.1483,
+ "step": 31542
+ },
+ {
+ "epoch": 85.94822888283379,
+ "grad_norm": 3.0144386291503906,
+ "learning_rate": 1.0178401422945273e-06,
+ "loss": 0.0549,
+ "step": 31543
+ },
+ {
+ "epoch": 85.95095367847412,
+ "grad_norm": 3.633289098739624,
+ "learning_rate": 1.0174522728990821e-06,
+ "loss": 0.0442,
+ "step": 31544
+ },
+ {
+ "epoch": 85.95367847411444,
+ "grad_norm": 2.7940962314605713,
+ "learning_rate": 1.0170644734594304e-06,
+ "loss": 0.0675,
+ "step": 31545
+ },
+ {
+ "epoch": 85.95640326975477,
+ "grad_norm": 2.4861257076263428,
+ "learning_rate": 1.0166767439785917e-06,
+ "loss": 0.0333,
+ "step": 31546
+ },
+ {
+ "epoch": 85.95912806539509,
+ "grad_norm": 2.6529250144958496,
+ "learning_rate": 1.016289084459584e-06,
+ "loss": 0.0348,
+ "step": 31547
+ },
+ {
+ "epoch": 85.96185286103542,
+ "grad_norm": 3.331308364868164,
+ "learning_rate": 1.015901494905429e-06,
+ "loss": 0.0411,
+ "step": 31548
+ },
+ {
+ "epoch": 85.96457765667574,
+ "grad_norm": 2.4053611755371094,
+ "learning_rate": 1.0155139753191424e-06,
+ "loss": 0.053,
+ "step": 31549
+ },
+ {
+ "epoch": 85.96730245231608,
+ "grad_norm": 2.1256680488586426,
+ "learning_rate": 1.0151265257037457e-06,
+ "loss": 0.0401,
+ "step": 31550
+ },
+ {
+ "epoch": 85.97002724795641,
+ "grad_norm": 3.6913411617279053,
+ "learning_rate": 1.0147391460622547e-06,
+ "loss": 0.1061,
+ "step": 31551
+ },
+ {
+ "epoch": 85.97275204359673,
+ "grad_norm": 2.2901344299316406,
+ "learning_rate": 1.0143518363976857e-06,
+ "loss": 0.0257,
+ "step": 31552
+ },
+ {
+ "epoch": 85.97547683923706,
+ "grad_norm": 3.701040744781494,
+ "learning_rate": 1.013964596713053e-06,
+ "loss": 0.1472,
+ "step": 31553
+ },
+ {
+ "epoch": 85.97820163487738,
+ "grad_norm": 2.446267604827881,
+ "learning_rate": 1.0135774270113774e-06,
+ "loss": 0.0359,
+ "step": 31554
+ },
+ {
+ "epoch": 85.98092643051771,
+ "grad_norm": 7.176121234893799,
+ "learning_rate": 1.0131903272956722e-06,
+ "loss": 0.0816,
+ "step": 31555
+ },
+ {
+ "epoch": 85.98365122615803,
+ "grad_norm": 1.4883784055709839,
+ "learning_rate": 1.0128032975689506e-06,
+ "loss": 0.0185,
+ "step": 31556
+ },
+ {
+ "epoch": 85.98637602179836,
+ "grad_norm": 2.5638229846954346,
+ "learning_rate": 1.0124163378342255e-06,
+ "loss": 0.0256,
+ "step": 31557
+ },
+ {
+ "epoch": 85.9891008174387,
+ "grad_norm": 3.9347333908081055,
+ "learning_rate": 1.0120294480945148e-06,
+ "loss": 0.0617,
+ "step": 31558
+ },
+ {
+ "epoch": 85.99182561307902,
+ "grad_norm": 2.0129220485687256,
+ "learning_rate": 1.0116426283528301e-06,
+ "loss": 0.0208,
+ "step": 31559
+ },
+ {
+ "epoch": 85.99455040871935,
+ "grad_norm": 2.478191614151001,
+ "learning_rate": 1.0112558786121829e-06,
+ "loss": 0.1113,
+ "step": 31560
+ },
+ {
+ "epoch": 85.99727520435967,
+ "grad_norm": 2.614762783050537,
+ "learning_rate": 1.0108691988755837e-06,
+ "loss": 0.1372,
+ "step": 31561
+ },
+ {
+ "epoch": 86.0,
+ "grad_norm": 2.7023041248321533,
+ "learning_rate": 1.010482589146048e-06,
+ "loss": 0.0381,
+ "step": 31562
+ },
+ {
+ "epoch": 86.00272479564033,
+ "grad_norm": 3.757795572280884,
+ "learning_rate": 1.0100960494265843e-06,
+ "loss": 0.1278,
+ "step": 31563
+ },
+ {
+ "epoch": 86.00544959128065,
+ "grad_norm": 1.8841562271118164,
+ "learning_rate": 1.0097095797202016e-06,
+ "loss": 0.0246,
+ "step": 31564
+ },
+ {
+ "epoch": 86.00817438692098,
+ "grad_norm": 2.0132946968078613,
+ "learning_rate": 1.0093231800299109e-06,
+ "loss": 0.0715,
+ "step": 31565
+ },
+ {
+ "epoch": 86.0108991825613,
+ "grad_norm": 3.5072214603424072,
+ "learning_rate": 1.0089368503587238e-06,
+ "loss": 0.0303,
+ "step": 31566
+ },
+ {
+ "epoch": 86.01362397820164,
+ "grad_norm": 2.2425694465637207,
+ "learning_rate": 1.008550590709647e-06,
+ "loss": 0.0373,
+ "step": 31567
+ },
+ {
+ "epoch": 86.01634877384195,
+ "grad_norm": 2.0086355209350586,
+ "learning_rate": 1.0081644010856895e-06,
+ "loss": 0.0391,
+ "step": 31568
+ },
+ {
+ "epoch": 86.01907356948229,
+ "grad_norm": 3.336557626724243,
+ "learning_rate": 1.0077782814898563e-06,
+ "loss": 0.0402,
+ "step": 31569
+ },
+ {
+ "epoch": 86.02179836512262,
+ "grad_norm": 2.4130775928497314,
+ "learning_rate": 1.0073922319251584e-06,
+ "loss": 0.0249,
+ "step": 31570
+ },
+ {
+ "epoch": 86.02452316076294,
+ "grad_norm": 2.9354212284088135,
+ "learning_rate": 1.0070062523946001e-06,
+ "loss": 0.0931,
+ "step": 31571
+ },
+ {
+ "epoch": 86.02724795640327,
+ "grad_norm": 3.061462163925171,
+ "learning_rate": 1.006620342901188e-06,
+ "loss": 0.0888,
+ "step": 31572
+ },
+ {
+ "epoch": 86.02997275204359,
+ "grad_norm": 3.5965375900268555,
+ "learning_rate": 1.0062345034479236e-06,
+ "loss": 0.0609,
+ "step": 31573
+ },
+ {
+ "epoch": 86.03269754768392,
+ "grad_norm": 2.9291248321533203,
+ "learning_rate": 1.0058487340378187e-06,
+ "loss": 0.1035,
+ "step": 31574
+ },
+ {
+ "epoch": 86.03542234332426,
+ "grad_norm": 1.810512900352478,
+ "learning_rate": 1.0054630346738747e-06,
+ "loss": 0.0278,
+ "step": 31575
+ },
+ {
+ "epoch": 86.03814713896458,
+ "grad_norm": 2.29118275642395,
+ "learning_rate": 1.005077405359095e-06,
+ "loss": 0.0427,
+ "step": 31576
+ },
+ {
+ "epoch": 86.04087193460491,
+ "grad_norm": 1.8794190883636475,
+ "learning_rate": 1.0046918460964806e-06,
+ "loss": 0.0446,
+ "step": 31577
+ },
+ {
+ "epoch": 86.04359673024523,
+ "grad_norm": 2.5822699069976807,
+ "learning_rate": 1.0043063568890388e-06,
+ "loss": 0.0974,
+ "step": 31578
+ },
+ {
+ "epoch": 86.04632152588556,
+ "grad_norm": 7.6384663581848145,
+ "learning_rate": 1.0039209377397696e-06,
+ "loss": 0.0791,
+ "step": 31579
+ },
+ {
+ "epoch": 86.04904632152588,
+ "grad_norm": 2.6081624031066895,
+ "learning_rate": 1.003535588651674e-06,
+ "loss": 0.0252,
+ "step": 31580
+ },
+ {
+ "epoch": 86.05177111716621,
+ "grad_norm": 4.446021556854248,
+ "learning_rate": 1.0031503096277529e-06,
+ "loss": 0.0521,
+ "step": 31581
+ },
+ {
+ "epoch": 86.05449591280654,
+ "grad_norm": 3.872101068496704,
+ "learning_rate": 1.002765100671007e-06,
+ "loss": 0.0657,
+ "step": 31582
+ },
+ {
+ "epoch": 86.05722070844686,
+ "grad_norm": 3.703188896179199,
+ "learning_rate": 1.0023799617844387e-06,
+ "loss": 0.1037,
+ "step": 31583
+ },
+ {
+ "epoch": 86.0599455040872,
+ "grad_norm": 3.0919201374053955,
+ "learning_rate": 1.0019948929710456e-06,
+ "loss": 0.0465,
+ "step": 31584
+ },
+ {
+ "epoch": 86.06267029972751,
+ "grad_norm": 2.5964608192443848,
+ "learning_rate": 1.0016098942338249e-06,
+ "loss": 0.1445,
+ "step": 31585
+ },
+ {
+ "epoch": 86.06539509536785,
+ "grad_norm": 3.06375789642334,
+ "learning_rate": 1.0012249655757788e-06,
+ "loss": 0.047,
+ "step": 31586
+ },
+ {
+ "epoch": 86.06811989100818,
+ "grad_norm": 2.214186668395996,
+ "learning_rate": 1.000840106999903e-06,
+ "loss": 0.0228,
+ "step": 31587
+ },
+ {
+ "epoch": 86.0708446866485,
+ "grad_norm": 2.7507073879241943,
+ "learning_rate": 1.0004553185091948e-06,
+ "loss": 0.0348,
+ "step": 31588
+ },
+ {
+ "epoch": 86.07356948228883,
+ "grad_norm": 5.628101348876953,
+ "learning_rate": 1.0000706001066485e-06,
+ "loss": 0.2528,
+ "step": 31589
+ },
+ {
+ "epoch": 86.07629427792915,
+ "grad_norm": 1.5397335290908813,
+ "learning_rate": 9.996859517952652e-07,
+ "loss": 0.0209,
+ "step": 31590
+ },
+ {
+ "epoch": 86.07901907356948,
+ "grad_norm": 2.0383923053741455,
+ "learning_rate": 9.993013735780376e-07,
+ "loss": 0.1154,
+ "step": 31591
+ },
+ {
+ "epoch": 86.0817438692098,
+ "grad_norm": 2.6254165172576904,
+ "learning_rate": 9.989168654579617e-07,
+ "loss": 0.0374,
+ "step": 31592
+ },
+ {
+ "epoch": 86.08446866485014,
+ "grad_norm": 2.1478607654571533,
+ "learning_rate": 9.985324274380292e-07,
+ "loss": 0.0405,
+ "step": 31593
+ },
+ {
+ "epoch": 86.08719346049047,
+ "grad_norm": 5.356241703033447,
+ "learning_rate": 9.981480595212389e-07,
+ "loss": 0.1077,
+ "step": 31594
+ },
+ {
+ "epoch": 86.08991825613079,
+ "grad_norm": 2.7925865650177,
+ "learning_rate": 9.977637617105818e-07,
+ "loss": 0.0503,
+ "step": 31595
+ },
+ {
+ "epoch": 86.09264305177112,
+ "grad_norm": 2.177604913711548,
+ "learning_rate": 9.973795340090498e-07,
+ "loss": 0.2251,
+ "step": 31596
+ },
+ {
+ "epoch": 86.09536784741144,
+ "grad_norm": 2.89493989944458,
+ "learning_rate": 9.96995376419635e-07,
+ "loss": 0.0238,
+ "step": 31597
+ },
+ {
+ "epoch": 86.09809264305177,
+ "grad_norm": 2.561154842376709,
+ "learning_rate": 9.966112889453328e-07,
+ "loss": 0.0974,
+ "step": 31598
+ },
+ {
+ "epoch": 86.1008174386921,
+ "grad_norm": 2.3899598121643066,
+ "learning_rate": 9.962272715891296e-07,
+ "loss": 0.0529,
+ "step": 31599
+ },
+ {
+ "epoch": 86.10354223433242,
+ "grad_norm": 2.1979386806488037,
+ "learning_rate": 9.958433243540211e-07,
+ "loss": 0.0818,
+ "step": 31600
+ },
+ {
+ "epoch": 86.10626702997276,
+ "grad_norm": 1.9779709577560425,
+ "learning_rate": 9.954594472429947e-07,
+ "loss": 0.0222,
+ "step": 31601
+ },
+ {
+ "epoch": 86.10899182561307,
+ "grad_norm": 6.739572525024414,
+ "learning_rate": 9.950756402590379e-07,
+ "loss": 0.0601,
+ "step": 31602
+ },
+ {
+ "epoch": 86.11171662125341,
+ "grad_norm": 2.4656660556793213,
+ "learning_rate": 9.94691903405145e-07,
+ "loss": 0.0442,
+ "step": 31603
+ },
+ {
+ "epoch": 86.11444141689373,
+ "grad_norm": 1.7424670457839966,
+ "learning_rate": 9.943082366843005e-07,
+ "loss": 0.1101,
+ "step": 31604
+ },
+ {
+ "epoch": 86.11716621253406,
+ "grad_norm": 1.816726803779602,
+ "learning_rate": 9.939246400994929e-07,
+ "loss": 0.1181,
+ "step": 31605
+ },
+ {
+ "epoch": 86.11989100817439,
+ "grad_norm": 2.8455731868743896,
+ "learning_rate": 9.935411136537121e-07,
+ "loss": 0.0796,
+ "step": 31606
+ },
+ {
+ "epoch": 86.12261580381471,
+ "grad_norm": 1.9792871475219727,
+ "learning_rate": 9.931576573499425e-07,
+ "loss": 0.0303,
+ "step": 31607
+ },
+ {
+ "epoch": 86.12534059945504,
+ "grad_norm": 2.497490882873535,
+ "learning_rate": 9.927742711911715e-07,
+ "loss": 0.1184,
+ "step": 31608
+ },
+ {
+ "epoch": 86.12806539509536,
+ "grad_norm": 2.35503888130188,
+ "learning_rate": 9.923909551803824e-07,
+ "loss": 0.0634,
+ "step": 31609
+ },
+ {
+ "epoch": 86.1307901907357,
+ "grad_norm": 2.9196982383728027,
+ "learning_rate": 9.920077093205648e-07,
+ "loss": 0.0273,
+ "step": 31610
+ },
+ {
+ "epoch": 86.13351498637603,
+ "grad_norm": 3.038902521133423,
+ "learning_rate": 9.916245336147023e-07,
+ "loss": 0.0262,
+ "step": 31611
+ },
+ {
+ "epoch": 86.13623978201635,
+ "grad_norm": 2.693570852279663,
+ "learning_rate": 9.912414280657766e-07,
+ "loss": 0.0563,
+ "step": 31612
+ },
+ {
+ "epoch": 86.13896457765668,
+ "grad_norm": 2.607591390609741,
+ "learning_rate": 9.908583926767712e-07,
+ "loss": 0.1106,
+ "step": 31613
+ },
+ {
+ "epoch": 86.141689373297,
+ "grad_norm": 2.580155372619629,
+ "learning_rate": 9.904754274506723e-07,
+ "loss": 0.0608,
+ "step": 31614
+ },
+ {
+ "epoch": 86.14441416893733,
+ "grad_norm": 3.828810453414917,
+ "learning_rate": 9.90092532390462e-07,
+ "loss": 0.1573,
+ "step": 31615
+ },
+ {
+ "epoch": 86.14713896457765,
+ "grad_norm": 2.2987725734710693,
+ "learning_rate": 9.89709707499118e-07,
+ "loss": 0.0311,
+ "step": 31616
+ },
+ {
+ "epoch": 86.14986376021798,
+ "grad_norm": 2.210296630859375,
+ "learning_rate": 9.893269527796268e-07,
+ "loss": 0.0528,
+ "step": 31617
+ },
+ {
+ "epoch": 86.15258855585832,
+ "grad_norm": 4.510499954223633,
+ "learning_rate": 9.88944268234966e-07,
+ "loss": 0.1065,
+ "step": 31618
+ },
+ {
+ "epoch": 86.15531335149863,
+ "grad_norm": 2.624666452407837,
+ "learning_rate": 9.885616538681186e-07,
+ "loss": 0.0655,
+ "step": 31619
+ },
+ {
+ "epoch": 86.15803814713897,
+ "grad_norm": 3.6263275146484375,
+ "learning_rate": 9.881791096820625e-07,
+ "loss": 0.0242,
+ "step": 31620
+ },
+ {
+ "epoch": 86.16076294277929,
+ "grad_norm": 2.314969062805176,
+ "learning_rate": 9.877966356797785e-07,
+ "loss": 0.0376,
+ "step": 31621
+ },
+ {
+ "epoch": 86.16348773841962,
+ "grad_norm": 2.3886630535125732,
+ "learning_rate": 9.87414231864242e-07,
+ "loss": 0.0185,
+ "step": 31622
+ },
+ {
+ "epoch": 86.16621253405995,
+ "grad_norm": 3.664731502532959,
+ "learning_rate": 9.870318982384352e-07,
+ "loss": 0.035,
+ "step": 31623
+ },
+ {
+ "epoch": 86.16893732970027,
+ "grad_norm": 6.761654376983643,
+ "learning_rate": 9.866496348053334e-07,
+ "loss": 0.0874,
+ "step": 31624
+ },
+ {
+ "epoch": 86.1716621253406,
+ "grad_norm": 2.344679594039917,
+ "learning_rate": 9.862674415679152e-07,
+ "loss": 0.0234,
+ "step": 31625
+ },
+ {
+ "epoch": 86.17438692098092,
+ "grad_norm": 2.3501219749450684,
+ "learning_rate": 9.858853185291538e-07,
+ "loss": 0.0343,
+ "step": 31626
+ },
+ {
+ "epoch": 86.17711171662125,
+ "grad_norm": 2.972172260284424,
+ "learning_rate": 9.855032656920283e-07,
+ "loss": 0.0427,
+ "step": 31627
+ },
+ {
+ "epoch": 86.17983651226157,
+ "grad_norm": 2.6144793033599854,
+ "learning_rate": 9.851212830595148e-07,
+ "loss": 0.0368,
+ "step": 31628
+ },
+ {
+ "epoch": 86.1825613079019,
+ "grad_norm": 1.8932509422302246,
+ "learning_rate": 9.847393706345843e-07,
+ "loss": 0.023,
+ "step": 31629
+ },
+ {
+ "epoch": 86.18528610354224,
+ "grad_norm": 2.38089919090271,
+ "learning_rate": 9.843575284202145e-07,
+ "loss": 0.0579,
+ "step": 31630
+ },
+ {
+ "epoch": 86.18801089918256,
+ "grad_norm": 3.900752544403076,
+ "learning_rate": 9.839757564193787e-07,
+ "loss": 0.1188,
+ "step": 31631
+ },
+ {
+ "epoch": 86.19073569482289,
+ "grad_norm": 2.6539125442504883,
+ "learning_rate": 9.835940546350498e-07,
+ "loss": 0.0752,
+ "step": 31632
+ },
+ {
+ "epoch": 86.19346049046321,
+ "grad_norm": 2.0343661308288574,
+ "learning_rate": 9.832124230701979e-07,
+ "loss": 0.0365,
+ "step": 31633
+ },
+ {
+ "epoch": 86.19618528610354,
+ "grad_norm": 2.7909703254699707,
+ "learning_rate": 9.828308617277971e-07,
+ "loss": 0.0272,
+ "step": 31634
+ },
+ {
+ "epoch": 86.19891008174388,
+ "grad_norm": 2.19333815574646,
+ "learning_rate": 9.824493706108218e-07,
+ "loss": 0.0705,
+ "step": 31635
+ },
+ {
+ "epoch": 86.2016348773842,
+ "grad_norm": 1.797225832939148,
+ "learning_rate": 9.820679497222396e-07,
+ "loss": 0.0279,
+ "step": 31636
+ },
+ {
+ "epoch": 86.20435967302453,
+ "grad_norm": 2.0403614044189453,
+ "learning_rate": 9.816865990650238e-07,
+ "loss": 0.0642,
+ "step": 31637
+ },
+ {
+ "epoch": 86.20708446866485,
+ "grad_norm": 3.0743956565856934,
+ "learning_rate": 9.813053186421395e-07,
+ "loss": 0.028,
+ "step": 31638
+ },
+ {
+ "epoch": 86.20980926430518,
+ "grad_norm": 1.8789576292037964,
+ "learning_rate": 9.8092410845656e-07,
+ "loss": 0.1133,
+ "step": 31639
+ },
+ {
+ "epoch": 86.2125340599455,
+ "grad_norm": 2.5614380836486816,
+ "learning_rate": 9.805429685112555e-07,
+ "loss": 0.1739,
+ "step": 31640
+ },
+ {
+ "epoch": 86.21525885558583,
+ "grad_norm": 2.94986629486084,
+ "learning_rate": 9.80161898809191e-07,
+ "loss": 0.1197,
+ "step": 31641
+ },
+ {
+ "epoch": 86.21798365122616,
+ "grad_norm": 8.736162185668945,
+ "learning_rate": 9.79780899353333e-07,
+ "loss": 0.0333,
+ "step": 31642
+ },
+ {
+ "epoch": 86.22070844686648,
+ "grad_norm": 2.2208738327026367,
+ "learning_rate": 9.793999701466527e-07,
+ "loss": 0.1297,
+ "step": 31643
+ },
+ {
+ "epoch": 86.22343324250681,
+ "grad_norm": 2.76037859916687,
+ "learning_rate": 9.790191111921166e-07,
+ "loss": 0.102,
+ "step": 31644
+ },
+ {
+ "epoch": 86.22615803814713,
+ "grad_norm": 2.774686098098755,
+ "learning_rate": 9.786383224926877e-07,
+ "loss": 0.0749,
+ "step": 31645
+ },
+ {
+ "epoch": 86.22888283378747,
+ "grad_norm": 2.381895065307617,
+ "learning_rate": 9.782576040513325e-07,
+ "loss": 0.0385,
+ "step": 31646
+ },
+ {
+ "epoch": 86.2316076294278,
+ "grad_norm": 2.5969865322113037,
+ "learning_rate": 9.778769558710177e-07,
+ "loss": 0.0536,
+ "step": 31647
+ },
+ {
+ "epoch": 86.23433242506812,
+ "grad_norm": 2.099355697631836,
+ "learning_rate": 9.774963779547076e-07,
+ "loss": 0.0508,
+ "step": 31648
+ },
+ {
+ "epoch": 86.23705722070845,
+ "grad_norm": 2.1510770320892334,
+ "learning_rate": 9.771158703053652e-07,
+ "loss": 0.03,
+ "step": 31649
+ },
+ {
+ "epoch": 86.23978201634877,
+ "grad_norm": 3.3781051635742188,
+ "learning_rate": 9.767354329259515e-07,
+ "loss": 0.0821,
+ "step": 31650
+ },
+ {
+ "epoch": 86.2425068119891,
+ "grad_norm": 2.2429616451263428,
+ "learning_rate": 9.76355065819432e-07,
+ "loss": 0.035,
+ "step": 31651
+ },
+ {
+ "epoch": 86.24523160762942,
+ "grad_norm": 3.0349185466766357,
+ "learning_rate": 9.75974768988771e-07,
+ "loss": 0.1015,
+ "step": 31652
+ },
+ {
+ "epoch": 86.24795640326975,
+ "grad_norm": 2.058422565460205,
+ "learning_rate": 9.755945424369283e-07,
+ "loss": 0.0319,
+ "step": 31653
+ },
+ {
+ "epoch": 86.25068119891009,
+ "grad_norm": 2.664964199066162,
+ "learning_rate": 9.752143861668628e-07,
+ "loss": 0.0303,
+ "step": 31654
+ },
+ {
+ "epoch": 86.2534059945504,
+ "grad_norm": 2.0678510665893555,
+ "learning_rate": 9.748343001815385e-07,
+ "loss": 0.0316,
+ "step": 31655
+ },
+ {
+ "epoch": 86.25613079019074,
+ "grad_norm": 2.756922960281372,
+ "learning_rate": 9.744542844839145e-07,
+ "loss": 0.0724,
+ "step": 31656
+ },
+ {
+ "epoch": 86.25885558583106,
+ "grad_norm": 2.7466092109680176,
+ "learning_rate": 9.740743390769503e-07,
+ "loss": 0.0384,
+ "step": 31657
+ },
+ {
+ "epoch": 86.26158038147139,
+ "grad_norm": 2.183837652206421,
+ "learning_rate": 9.736944639636025e-07,
+ "loss": 0.061,
+ "step": 31658
+ },
+ {
+ "epoch": 86.26430517711172,
+ "grad_norm": 2.141596794128418,
+ "learning_rate": 9.733146591468334e-07,
+ "loss": 0.0342,
+ "step": 31659
+ },
+ {
+ "epoch": 86.26702997275204,
+ "grad_norm": 1.158841848373413,
+ "learning_rate": 9.729349246296005e-07,
+ "loss": 0.0144,
+ "step": 31660
+ },
+ {
+ "epoch": 86.26975476839237,
+ "grad_norm": 3.59151029586792,
+ "learning_rate": 9.72555260414858e-07,
+ "loss": 0.1706,
+ "step": 31661
+ },
+ {
+ "epoch": 86.2724795640327,
+ "grad_norm": 2.8652048110961914,
+ "learning_rate": 9.721756665055637e-07,
+ "loss": 0.113,
+ "step": 31662
+ },
+ {
+ "epoch": 86.27520435967303,
+ "grad_norm": 2.286719560623169,
+ "learning_rate": 9.717961429046773e-07,
+ "loss": 0.0691,
+ "step": 31663
+ },
+ {
+ "epoch": 86.27792915531334,
+ "grad_norm": 3.3621742725372314,
+ "learning_rate": 9.714166896151511e-07,
+ "loss": 0.051,
+ "step": 31664
+ },
+ {
+ "epoch": 86.28065395095368,
+ "grad_norm": 7.1724677085876465,
+ "learning_rate": 9.710373066399413e-07,
+ "loss": 0.0445,
+ "step": 31665
+ },
+ {
+ "epoch": 86.28337874659401,
+ "grad_norm": 2.8919363021850586,
+ "learning_rate": 9.706579939820005e-07,
+ "loss": 0.1347,
+ "step": 31666
+ },
+ {
+ "epoch": 86.28610354223433,
+ "grad_norm": 3.9138731956481934,
+ "learning_rate": 9.702787516442858e-07,
+ "loss": 0.0484,
+ "step": 31667
+ },
+ {
+ "epoch": 86.28882833787466,
+ "grad_norm": 2.2986462116241455,
+ "learning_rate": 9.698995796297483e-07,
+ "loss": 0.0996,
+ "step": 31668
+ },
+ {
+ "epoch": 86.29155313351498,
+ "grad_norm": 2.9334826469421387,
+ "learning_rate": 9.695204779413448e-07,
+ "loss": 0.173,
+ "step": 31669
+ },
+ {
+ "epoch": 86.29427792915531,
+ "grad_norm": 1.976965069770813,
+ "learning_rate": 9.691414465820226e-07,
+ "loss": 0.0242,
+ "step": 31670
+ },
+ {
+ "epoch": 86.29700272479565,
+ "grad_norm": 3.205742120742798,
+ "learning_rate": 9.687624855547372e-07,
+ "loss": 0.0263,
+ "step": 31671
+ },
+ {
+ "epoch": 86.29972752043597,
+ "grad_norm": 2.6435394287109375,
+ "learning_rate": 9.683835948624397e-07,
+ "loss": 0.0585,
+ "step": 31672
+ },
+ {
+ "epoch": 86.3024523160763,
+ "grad_norm": 2.673785924911499,
+ "learning_rate": 9.680047745080811e-07,
+ "loss": 0.1645,
+ "step": 31673
+ },
+ {
+ "epoch": 86.30517711171662,
+ "grad_norm": 2.2024083137512207,
+ "learning_rate": 9.676260244946078e-07,
+ "loss": 0.052,
+ "step": 31674
+ },
+ {
+ "epoch": 86.30790190735695,
+ "grad_norm": 1.9879213571548462,
+ "learning_rate": 9.672473448249741e-07,
+ "loss": 0.1141,
+ "step": 31675
+ },
+ {
+ "epoch": 86.31062670299727,
+ "grad_norm": 2.3783514499664307,
+ "learning_rate": 9.668687355021266e-07,
+ "loss": 0.0229,
+ "step": 31676
+ },
+ {
+ "epoch": 86.3133514986376,
+ "grad_norm": 2.5844457149505615,
+ "learning_rate": 9.664901965290163e-07,
+ "loss": 0.0403,
+ "step": 31677
+ },
+ {
+ "epoch": 86.31607629427793,
+ "grad_norm": 2.5226974487304688,
+ "learning_rate": 9.661117279085862e-07,
+ "loss": 0.0565,
+ "step": 31678
+ },
+ {
+ "epoch": 86.31880108991825,
+ "grad_norm": 2.8497304916381836,
+ "learning_rate": 9.6573332964379e-07,
+ "loss": 0.0582,
+ "step": 31679
+ },
+ {
+ "epoch": 86.32152588555859,
+ "grad_norm": 2.5396921634674072,
+ "learning_rate": 9.653550017375724e-07,
+ "loss": 0.0564,
+ "step": 31680
+ },
+ {
+ "epoch": 86.3242506811989,
+ "grad_norm": 2.415186643600464,
+ "learning_rate": 9.64976744192878e-07,
+ "loss": 0.0755,
+ "step": 31681
+ },
+ {
+ "epoch": 86.32697547683924,
+ "grad_norm": 2.5656049251556396,
+ "learning_rate": 9.645985570126526e-07,
+ "loss": 0.0437,
+ "step": 31682
+ },
+ {
+ "epoch": 86.32970027247957,
+ "grad_norm": 2.18369197845459,
+ "learning_rate": 9.642204401998446e-07,
+ "loss": 0.0396,
+ "step": 31683
+ },
+ {
+ "epoch": 86.33242506811989,
+ "grad_norm": 2.092224359512329,
+ "learning_rate": 9.63842393757397e-07,
+ "loss": 0.0344,
+ "step": 31684
+ },
+ {
+ "epoch": 86.33514986376022,
+ "grad_norm": 2.9330737590789795,
+ "learning_rate": 9.634644176882523e-07,
+ "loss": 0.1577,
+ "step": 31685
+ },
+ {
+ "epoch": 86.33787465940054,
+ "grad_norm": 4.163845062255859,
+ "learning_rate": 9.63086511995358e-07,
+ "loss": 0.0517,
+ "step": 31686
+ },
+ {
+ "epoch": 86.34059945504087,
+ "grad_norm": 1.6118370294570923,
+ "learning_rate": 9.62708676681653e-07,
+ "loss": 0.022,
+ "step": 31687
+ },
+ {
+ "epoch": 86.34332425068119,
+ "grad_norm": 1.8610044717788696,
+ "learning_rate": 9.623309117500833e-07,
+ "loss": 0.0326,
+ "step": 31688
+ },
+ {
+ "epoch": 86.34604904632153,
+ "grad_norm": 2.1245548725128174,
+ "learning_rate": 9.619532172035906e-07,
+ "loss": 0.1534,
+ "step": 31689
+ },
+ {
+ "epoch": 86.34877384196186,
+ "grad_norm": 3.2282018661499023,
+ "learning_rate": 9.615755930451144e-07,
+ "loss": 0.0527,
+ "step": 31690
+ },
+ {
+ "epoch": 86.35149863760218,
+ "grad_norm": 2.665231227874756,
+ "learning_rate": 9.611980392775956e-07,
+ "loss": 0.027,
+ "step": 31691
+ },
+ {
+ "epoch": 86.35422343324251,
+ "grad_norm": 1.7034244537353516,
+ "learning_rate": 9.608205559039763e-07,
+ "loss": 0.0215,
+ "step": 31692
+ },
+ {
+ "epoch": 86.35694822888283,
+ "grad_norm": 2.240299940109253,
+ "learning_rate": 9.604431429271965e-07,
+ "loss": 0.0431,
+ "step": 31693
+ },
+ {
+ "epoch": 86.35967302452316,
+ "grad_norm": 2.746917963027954,
+ "learning_rate": 9.600658003501928e-07,
+ "loss": 0.031,
+ "step": 31694
+ },
+ {
+ "epoch": 86.3623978201635,
+ "grad_norm": 3.9302194118499756,
+ "learning_rate": 9.596885281759071e-07,
+ "loss": 0.097,
+ "step": 31695
+ },
+ {
+ "epoch": 86.36512261580381,
+ "grad_norm": 2.550478458404541,
+ "learning_rate": 9.593113264072762e-07,
+ "loss": 0.0354,
+ "step": 31696
+ },
+ {
+ "epoch": 86.36784741144415,
+ "grad_norm": 2.1466379165649414,
+ "learning_rate": 9.589341950472374e-07,
+ "loss": 0.0285,
+ "step": 31697
+ },
+ {
+ "epoch": 86.37057220708446,
+ "grad_norm": 2.9122791290283203,
+ "learning_rate": 9.585571340987265e-07,
+ "loss": 0.0986,
+ "step": 31698
+ },
+ {
+ "epoch": 86.3732970027248,
+ "grad_norm": 2.4622130393981934,
+ "learning_rate": 9.581801435646843e-07,
+ "loss": 0.0646,
+ "step": 31699
+ },
+ {
+ "epoch": 86.37602179836512,
+ "grad_norm": 2.4040420055389404,
+ "learning_rate": 9.578032234480428e-07,
+ "loss": 0.0262,
+ "step": 31700
+ },
+ {
+ "epoch": 86.37874659400545,
+ "grad_norm": 2.9493465423583984,
+ "learning_rate": 9.574263737517398e-07,
+ "loss": 0.087,
+ "step": 31701
+ },
+ {
+ "epoch": 86.38147138964578,
+ "grad_norm": 3.674093008041382,
+ "learning_rate": 9.570495944787062e-07,
+ "loss": 0.0902,
+ "step": 31702
+ },
+ {
+ "epoch": 86.3841961852861,
+ "grad_norm": 1.984806776046753,
+ "learning_rate": 9.566728856318807e-07,
+ "loss": 0.0305,
+ "step": 31703
+ },
+ {
+ "epoch": 86.38692098092643,
+ "grad_norm": 1.5852702856063843,
+ "learning_rate": 9.562962472141967e-07,
+ "loss": 0.0221,
+ "step": 31704
+ },
+ {
+ "epoch": 86.38964577656675,
+ "grad_norm": 3.671549081802368,
+ "learning_rate": 9.559196792285864e-07,
+ "loss": 0.0425,
+ "step": 31705
+ },
+ {
+ "epoch": 86.39237057220708,
+ "grad_norm": 2.510288715362549,
+ "learning_rate": 9.555431816779836e-07,
+ "loss": 0.0349,
+ "step": 31706
+ },
+ {
+ "epoch": 86.39509536784742,
+ "grad_norm": 2.7061891555786133,
+ "learning_rate": 9.551667545653164e-07,
+ "loss": 0.0582,
+ "step": 31707
+ },
+ {
+ "epoch": 86.39782016348774,
+ "grad_norm": 3.321589946746826,
+ "learning_rate": 9.547903978935214e-07,
+ "loss": 0.0523,
+ "step": 31708
+ },
+ {
+ "epoch": 86.40054495912807,
+ "grad_norm": 2.741774797439575,
+ "learning_rate": 9.544141116655282e-07,
+ "loss": 0.0353,
+ "step": 31709
+ },
+ {
+ "epoch": 86.40326975476839,
+ "grad_norm": 2.553030252456665,
+ "learning_rate": 9.540378958842666e-07,
+ "loss": 0.0639,
+ "step": 31710
+ },
+ {
+ "epoch": 86.40599455040872,
+ "grad_norm": 2.1983866691589355,
+ "learning_rate": 9.536617505526647e-07,
+ "loss": 0.0264,
+ "step": 31711
+ },
+ {
+ "epoch": 86.40871934604904,
+ "grad_norm": 3.1577227115631104,
+ "learning_rate": 9.532856756736552e-07,
+ "loss": 0.0671,
+ "step": 31712
+ },
+ {
+ "epoch": 86.41144414168937,
+ "grad_norm": 2.494140625,
+ "learning_rate": 9.529096712501662e-07,
+ "loss": 0.0475,
+ "step": 31713
+ },
+ {
+ "epoch": 86.4141689373297,
+ "grad_norm": 1.940166711807251,
+ "learning_rate": 9.525337372851262e-07,
+ "loss": 0.0286,
+ "step": 31714
+ },
+ {
+ "epoch": 86.41689373297002,
+ "grad_norm": 1.5205905437469482,
+ "learning_rate": 9.521578737814596e-07,
+ "loss": 0.0274,
+ "step": 31715
+ },
+ {
+ "epoch": 86.41961852861036,
+ "grad_norm": 3.7131528854370117,
+ "learning_rate": 9.517820807420985e-07,
+ "loss": 0.1935,
+ "step": 31716
+ },
+ {
+ "epoch": 86.42234332425068,
+ "grad_norm": 3.8278331756591797,
+ "learning_rate": 9.514063581699673e-07,
+ "loss": 0.0605,
+ "step": 31717
+ },
+ {
+ "epoch": 86.42506811989101,
+ "grad_norm": 3.2751076221466064,
+ "learning_rate": 9.510307060679902e-07,
+ "loss": 0.057,
+ "step": 31718
+ },
+ {
+ "epoch": 86.42779291553134,
+ "grad_norm": 1.6732395887374878,
+ "learning_rate": 9.506551244390949e-07,
+ "loss": 0.0163,
+ "step": 31719
+ },
+ {
+ "epoch": 86.43051771117166,
+ "grad_norm": 2.4423439502716064,
+ "learning_rate": 9.50279613286208e-07,
+ "loss": 0.0477,
+ "step": 31720
+ },
+ {
+ "epoch": 86.433242506812,
+ "grad_norm": 2.7212328910827637,
+ "learning_rate": 9.499041726122515e-07,
+ "loss": 0.0534,
+ "step": 31721
+ },
+ {
+ "epoch": 86.43596730245231,
+ "grad_norm": 1.925323247909546,
+ "learning_rate": 9.49528802420151e-07,
+ "loss": 0.0355,
+ "step": 31722
+ },
+ {
+ "epoch": 86.43869209809264,
+ "grad_norm": 3.1092705726623535,
+ "learning_rate": 9.491535027128262e-07,
+ "loss": 0.0569,
+ "step": 31723
+ },
+ {
+ "epoch": 86.44141689373296,
+ "grad_norm": 3.6347572803497314,
+ "learning_rate": 9.487782734932049e-07,
+ "loss": 0.0532,
+ "step": 31724
+ },
+ {
+ "epoch": 86.4441416893733,
+ "grad_norm": 2.326617956161499,
+ "learning_rate": 9.48403114764207e-07,
+ "loss": 0.098,
+ "step": 31725
+ },
+ {
+ "epoch": 86.44686648501363,
+ "grad_norm": 2.7363393306732178,
+ "learning_rate": 9.480280265287545e-07,
+ "loss": 0.0788,
+ "step": 31726
+ },
+ {
+ "epoch": 86.44959128065395,
+ "grad_norm": 2.173239231109619,
+ "learning_rate": 9.476530087897673e-07,
+ "loss": 0.0289,
+ "step": 31727
+ },
+ {
+ "epoch": 86.45231607629428,
+ "grad_norm": 1.6472687721252441,
+ "learning_rate": 9.472780615501675e-07,
+ "loss": 0.0239,
+ "step": 31728
+ },
+ {
+ "epoch": 86.4550408719346,
+ "grad_norm": 2.5682032108306885,
+ "learning_rate": 9.469031848128762e-07,
+ "loss": 0.0379,
+ "step": 31729
+ },
+ {
+ "epoch": 86.45776566757493,
+ "grad_norm": 2.8013603687286377,
+ "learning_rate": 9.4652837858081e-07,
+ "loss": 0.1393,
+ "step": 31730
+ },
+ {
+ "epoch": 86.46049046321527,
+ "grad_norm": 7.143606662750244,
+ "learning_rate": 9.461536428568885e-07,
+ "loss": 0.0311,
+ "step": 31731
+ },
+ {
+ "epoch": 86.46321525885558,
+ "grad_norm": 2.643972396850586,
+ "learning_rate": 9.457789776440329e-07,
+ "loss": 0.044,
+ "step": 31732
+ },
+ {
+ "epoch": 86.46594005449592,
+ "grad_norm": 3.4036853313446045,
+ "learning_rate": 9.454043829451586e-07,
+ "loss": 0.2029,
+ "step": 31733
+ },
+ {
+ "epoch": 86.46866485013624,
+ "grad_norm": 2.121493101119995,
+ "learning_rate": 9.450298587631846e-07,
+ "loss": 0.0646,
+ "step": 31734
+ },
+ {
+ "epoch": 86.47138964577657,
+ "grad_norm": 2.426875591278076,
+ "learning_rate": 9.446554051010238e-07,
+ "loss": 0.0377,
+ "step": 31735
+ },
+ {
+ "epoch": 86.47411444141689,
+ "grad_norm": 2.656691312789917,
+ "learning_rate": 9.442810219615984e-07,
+ "loss": 0.0436,
+ "step": 31736
+ },
+ {
+ "epoch": 86.47683923705722,
+ "grad_norm": 2.8276569843292236,
+ "learning_rate": 9.439067093478171e-07,
+ "loss": 0.039,
+ "step": 31737
+ },
+ {
+ "epoch": 86.47956403269755,
+ "grad_norm": 2.29971981048584,
+ "learning_rate": 9.435324672626023e-07,
+ "loss": 0.0758,
+ "step": 31738
+ },
+ {
+ "epoch": 86.48228882833787,
+ "grad_norm": 2.5507752895355225,
+ "learning_rate": 9.431582957088625e-07,
+ "loss": 0.0374,
+ "step": 31739
+ },
+ {
+ "epoch": 86.4850136239782,
+ "grad_norm": 2.6894922256469727,
+ "learning_rate": 9.427841946895166e-07,
+ "loss": 0.0278,
+ "step": 31740
+ },
+ {
+ "epoch": 86.48773841961852,
+ "grad_norm": 2.1117866039276123,
+ "learning_rate": 9.424101642074756e-07,
+ "loss": 0.0237,
+ "step": 31741
+ },
+ {
+ "epoch": 86.49046321525886,
+ "grad_norm": 2.634681463241577,
+ "learning_rate": 9.420362042656539e-07,
+ "loss": 0.0397,
+ "step": 31742
+ },
+ {
+ "epoch": 86.49318801089919,
+ "grad_norm": 2.8264572620391846,
+ "learning_rate": 9.41662314866959e-07,
+ "loss": 0.0305,
+ "step": 31743
+ },
+ {
+ "epoch": 86.49591280653951,
+ "grad_norm": 2.0114846229553223,
+ "learning_rate": 9.412884960143099e-07,
+ "loss": 0.0215,
+ "step": 31744
+ },
+ {
+ "epoch": 86.49863760217984,
+ "grad_norm": 2.80314302444458,
+ "learning_rate": 9.409147477106139e-07,
+ "loss": 0.0903,
+ "step": 31745
+ },
+ {
+ "epoch": 86.50136239782016,
+ "grad_norm": 2.1577348709106445,
+ "learning_rate": 9.405410699587825e-07,
+ "loss": 0.0736,
+ "step": 31746
+ },
+ {
+ "epoch": 86.50408719346049,
+ "grad_norm": 1.879530906677246,
+ "learning_rate": 9.40167462761723e-07,
+ "loss": 0.0269,
+ "step": 31747
+ },
+ {
+ "epoch": 86.50681198910081,
+ "grad_norm": 5.320206165313721,
+ "learning_rate": 9.397939261223499e-07,
+ "loss": 0.0373,
+ "step": 31748
+ },
+ {
+ "epoch": 86.50953678474114,
+ "grad_norm": 4.1179423332214355,
+ "learning_rate": 9.394204600435708e-07,
+ "loss": 0.0325,
+ "step": 31749
+ },
+ {
+ "epoch": 86.51226158038148,
+ "grad_norm": 3.245192050933838,
+ "learning_rate": 9.390470645282923e-07,
+ "loss": 0.0913,
+ "step": 31750
+ },
+ {
+ "epoch": 86.5149863760218,
+ "grad_norm": 4.733980178833008,
+ "learning_rate": 9.386737395794232e-07,
+ "loss": 0.0546,
+ "step": 31751
+ },
+ {
+ "epoch": 86.51771117166213,
+ "grad_norm": 2.638227701187134,
+ "learning_rate": 9.383004851998723e-07,
+ "loss": 0.0668,
+ "step": 31752
+ },
+ {
+ "epoch": 86.52043596730245,
+ "grad_norm": 3.1194350719451904,
+ "learning_rate": 9.379273013925449e-07,
+ "loss": 0.1016,
+ "step": 31753
+ },
+ {
+ "epoch": 86.52316076294278,
+ "grad_norm": 2.7698941230773926,
+ "learning_rate": 9.375541881603479e-07,
+ "loss": 0.0289,
+ "step": 31754
+ },
+ {
+ "epoch": 86.52588555858311,
+ "grad_norm": 2.454678773880005,
+ "learning_rate": 9.371811455061874e-07,
+ "loss": 0.1671,
+ "step": 31755
+ },
+ {
+ "epoch": 86.52861035422343,
+ "grad_norm": 2.9940426349639893,
+ "learning_rate": 9.368081734329682e-07,
+ "loss": 0.0616,
+ "step": 31756
+ },
+ {
+ "epoch": 86.53133514986376,
+ "grad_norm": 3.0953903198242188,
+ "learning_rate": 9.364352719435965e-07,
+ "loss": 0.0616,
+ "step": 31757
+ },
+ {
+ "epoch": 86.53405994550408,
+ "grad_norm": 2.4276750087738037,
+ "learning_rate": 9.360624410409746e-07,
+ "loss": 0.0549,
+ "step": 31758
+ },
+ {
+ "epoch": 86.53678474114442,
+ "grad_norm": 3.2068097591400146,
+ "learning_rate": 9.356896807280047e-07,
+ "loss": 0.0746,
+ "step": 31759
+ },
+ {
+ "epoch": 86.53950953678473,
+ "grad_norm": 2.9232585430145264,
+ "learning_rate": 9.353169910075944e-07,
+ "loss": 0.203,
+ "step": 31760
+ },
+ {
+ "epoch": 86.54223433242507,
+ "grad_norm": 2.7625324726104736,
+ "learning_rate": 9.349443718826434e-07,
+ "loss": 0.1773,
+ "step": 31761
+ },
+ {
+ "epoch": 86.5449591280654,
+ "grad_norm": 2.888930082321167,
+ "learning_rate": 9.345718233560541e-07,
+ "loss": 0.0292,
+ "step": 31762
+ },
+ {
+ "epoch": 86.54768392370572,
+ "grad_norm": 2.8343310356140137,
+ "learning_rate": 9.341993454307252e-07,
+ "loss": 0.0463,
+ "step": 31763
+ },
+ {
+ "epoch": 86.55040871934605,
+ "grad_norm": 1.7458686828613281,
+ "learning_rate": 9.338269381095632e-07,
+ "loss": 0.0531,
+ "step": 31764
+ },
+ {
+ "epoch": 86.55313351498637,
+ "grad_norm": 1.3781216144561768,
+ "learning_rate": 9.334546013954637e-07,
+ "loss": 0.0244,
+ "step": 31765
+ },
+ {
+ "epoch": 86.5558583106267,
+ "grad_norm": 3.210026741027832,
+ "learning_rate": 9.330823352913287e-07,
+ "loss": 0.1514,
+ "step": 31766
+ },
+ {
+ "epoch": 86.55858310626704,
+ "grad_norm": 2.650787353515625,
+ "learning_rate": 9.327101398000548e-07,
+ "loss": 0.0203,
+ "step": 31767
+ },
+ {
+ "epoch": 86.56130790190736,
+ "grad_norm": 2.5487656593322754,
+ "learning_rate": 9.323380149245442e-07,
+ "loss": 0.031,
+ "step": 31768
+ },
+ {
+ "epoch": 86.56403269754769,
+ "grad_norm": 2.2274551391601562,
+ "learning_rate": 9.319659606676934e-07,
+ "loss": 0.0447,
+ "step": 31769
+ },
+ {
+ "epoch": 86.566757493188,
+ "grad_norm": 2.514932870864868,
+ "learning_rate": 9.315939770324e-07,
+ "loss": 0.0397,
+ "step": 31770
+ },
+ {
+ "epoch": 86.56948228882834,
+ "grad_norm": 2.385927438735962,
+ "learning_rate": 9.312220640215585e-07,
+ "loss": 0.0283,
+ "step": 31771
+ },
+ {
+ "epoch": 86.57220708446866,
+ "grad_norm": 3.0768346786499023,
+ "learning_rate": 9.308502216380677e-07,
+ "loss": 0.048,
+ "step": 31772
+ },
+ {
+ "epoch": 86.57493188010899,
+ "grad_norm": 3.3297297954559326,
+ "learning_rate": 9.304784498848263e-07,
+ "loss": 0.0755,
+ "step": 31773
+ },
+ {
+ "epoch": 86.57765667574932,
+ "grad_norm": 2.2790002822875977,
+ "learning_rate": 9.301067487647253e-07,
+ "loss": 0.0339,
+ "step": 31774
+ },
+ {
+ "epoch": 86.58038147138964,
+ "grad_norm": 3.9251515865325928,
+ "learning_rate": 9.297351182806624e-07,
+ "loss": 0.0542,
+ "step": 31775
+ },
+ {
+ "epoch": 86.58310626702998,
+ "grad_norm": 2.3171865940093994,
+ "learning_rate": 9.293635584355276e-07,
+ "loss": 0.0292,
+ "step": 31776
+ },
+ {
+ "epoch": 86.5858310626703,
+ "grad_norm": 2.964221239089966,
+ "learning_rate": 9.289920692322196e-07,
+ "loss": 0.147,
+ "step": 31777
+ },
+ {
+ "epoch": 86.58855585831063,
+ "grad_norm": 2.2152185440063477,
+ "learning_rate": 9.286206506736306e-07,
+ "loss": 0.0949,
+ "step": 31778
+ },
+ {
+ "epoch": 86.59128065395096,
+ "grad_norm": 1.898727297782898,
+ "learning_rate": 9.282493027626482e-07,
+ "loss": 0.0271,
+ "step": 31779
+ },
+ {
+ "epoch": 86.59400544959128,
+ "grad_norm": 3.3184823989868164,
+ "learning_rate": 9.278780255021713e-07,
+ "loss": 0.0466,
+ "step": 31780
+ },
+ {
+ "epoch": 86.59673024523161,
+ "grad_norm": 1.897197961807251,
+ "learning_rate": 9.275068188950887e-07,
+ "loss": 0.0414,
+ "step": 31781
+ },
+ {
+ "epoch": 86.59945504087193,
+ "grad_norm": 2.450909376144409,
+ "learning_rate": 9.271356829442902e-07,
+ "loss": 0.2228,
+ "step": 31782
+ },
+ {
+ "epoch": 86.60217983651226,
+ "grad_norm": 2.1270909309387207,
+ "learning_rate": 9.267646176526657e-07,
+ "loss": 0.0239,
+ "step": 31783
+ },
+ {
+ "epoch": 86.60490463215258,
+ "grad_norm": 2.101029872894287,
+ "learning_rate": 9.263936230231075e-07,
+ "loss": 0.0234,
+ "step": 31784
+ },
+ {
+ "epoch": 86.60762942779292,
+ "grad_norm": 2.107457160949707,
+ "learning_rate": 9.260226990585042e-07,
+ "loss": 0.0371,
+ "step": 31785
+ },
+ {
+ "epoch": 86.61035422343325,
+ "grad_norm": 2.3350908756256104,
+ "learning_rate": 9.256518457617436e-07,
+ "loss": 0.0318,
+ "step": 31786
+ },
+ {
+ "epoch": 86.61307901907357,
+ "grad_norm": 2.550260305404663,
+ "learning_rate": 9.252810631357134e-07,
+ "loss": 0.0377,
+ "step": 31787
+ },
+ {
+ "epoch": 86.6158038147139,
+ "grad_norm": 2.5874295234680176,
+ "learning_rate": 9.249103511833013e-07,
+ "loss": 0.1504,
+ "step": 31788
+ },
+ {
+ "epoch": 86.61852861035422,
+ "grad_norm": 2.730004072189331,
+ "learning_rate": 9.245397099073971e-07,
+ "loss": 0.0446,
+ "step": 31789
+ },
+ {
+ "epoch": 86.62125340599455,
+ "grad_norm": 7.804656028747559,
+ "learning_rate": 9.241691393108864e-07,
+ "loss": 0.044,
+ "step": 31790
+ },
+ {
+ "epoch": 86.62397820163488,
+ "grad_norm": 5.257740497589111,
+ "learning_rate": 9.237986393966536e-07,
+ "loss": 0.0382,
+ "step": 31791
+ },
+ {
+ "epoch": 86.6267029972752,
+ "grad_norm": 1.4204128980636597,
+ "learning_rate": 9.23428210167584e-07,
+ "loss": 0.0195,
+ "step": 31792
+ },
+ {
+ "epoch": 86.62942779291554,
+ "grad_norm": 1.9685324430465698,
+ "learning_rate": 9.230578516265642e-07,
+ "loss": 0.0283,
+ "step": 31793
+ },
+ {
+ "epoch": 86.63215258855585,
+ "grad_norm": 2.91001558303833,
+ "learning_rate": 9.226875637764788e-07,
+ "loss": 0.0483,
+ "step": 31794
+ },
+ {
+ "epoch": 86.63487738419619,
+ "grad_norm": 2.7391185760498047,
+ "learning_rate": 9.223173466202096e-07,
+ "loss": 0.105,
+ "step": 31795
+ },
+ {
+ "epoch": 86.6376021798365,
+ "grad_norm": 2.036832094192505,
+ "learning_rate": 9.219472001606389e-07,
+ "loss": 0.0445,
+ "step": 31796
+ },
+ {
+ "epoch": 86.64032697547684,
+ "grad_norm": 2.2425432205200195,
+ "learning_rate": 9.215771244006533e-07,
+ "loss": 0.0974,
+ "step": 31797
+ },
+ {
+ "epoch": 86.64305177111717,
+ "grad_norm": 4.180068492889404,
+ "learning_rate": 9.212071193431327e-07,
+ "loss": 0.1271,
+ "step": 31798
+ },
+ {
+ "epoch": 86.64577656675749,
+ "grad_norm": 2.0754756927490234,
+ "learning_rate": 9.208371849909592e-07,
+ "loss": 0.0266,
+ "step": 31799
+ },
+ {
+ "epoch": 86.64850136239782,
+ "grad_norm": 2.5021541118621826,
+ "learning_rate": 9.204673213470105e-07,
+ "loss": 0.0259,
+ "step": 31800
+ },
+ {
+ "epoch": 86.65122615803814,
+ "grad_norm": 2.7732303142547607,
+ "learning_rate": 9.200975284141733e-07,
+ "loss": 0.0308,
+ "step": 31801
+ },
+ {
+ "epoch": 86.65395095367847,
+ "grad_norm": 2.38616943359375,
+ "learning_rate": 9.197278061953241e-07,
+ "loss": 0.0898,
+ "step": 31802
+ },
+ {
+ "epoch": 86.65667574931881,
+ "grad_norm": 2.6551296710968018,
+ "learning_rate": 9.193581546933406e-07,
+ "loss": 0.0683,
+ "step": 31803
+ },
+ {
+ "epoch": 86.65940054495913,
+ "grad_norm": 2.102505922317505,
+ "learning_rate": 9.189885739111048e-07,
+ "loss": 0.0332,
+ "step": 31804
+ },
+ {
+ "epoch": 86.66212534059946,
+ "grad_norm": 3.7889506816864014,
+ "learning_rate": 9.186190638514925e-07,
+ "loss": 0.141,
+ "step": 31805
+ },
+ {
+ "epoch": 86.66485013623978,
+ "grad_norm": 1.921257495880127,
+ "learning_rate": 9.182496245173844e-07,
+ "loss": 0.0322,
+ "step": 31806
+ },
+ {
+ "epoch": 86.66757493188011,
+ "grad_norm": 3.020113229751587,
+ "learning_rate": 9.178802559116551e-07,
+ "loss": 0.1434,
+ "step": 31807
+ },
+ {
+ "epoch": 86.67029972752043,
+ "grad_norm": 2.542175531387329,
+ "learning_rate": 9.175109580371811e-07,
+ "loss": 0.0213,
+ "step": 31808
+ },
+ {
+ "epoch": 86.67302452316076,
+ "grad_norm": 2.8657314777374268,
+ "learning_rate": 9.171417308968411e-07,
+ "loss": 0.0614,
+ "step": 31809
+ },
+ {
+ "epoch": 86.6757493188011,
+ "grad_norm": 1.7940597534179688,
+ "learning_rate": 9.167725744935097e-07,
+ "loss": 0.0244,
+ "step": 31810
+ },
+ {
+ "epoch": 86.67847411444141,
+ "grad_norm": 2.6655895709991455,
+ "learning_rate": 9.1640348883006e-07,
+ "loss": 0.1663,
+ "step": 31811
+ },
+ {
+ "epoch": 86.68119891008175,
+ "grad_norm": 3.1102259159088135,
+ "learning_rate": 9.160344739093663e-07,
+ "loss": 0.1017,
+ "step": 31812
+ },
+ {
+ "epoch": 86.68392370572207,
+ "grad_norm": 2.133916139602661,
+ "learning_rate": 9.156655297343053e-07,
+ "loss": 0.0239,
+ "step": 31813
+ },
+ {
+ "epoch": 86.6866485013624,
+ "grad_norm": 2.9862277507781982,
+ "learning_rate": 9.152966563077492e-07,
+ "loss": 0.0505,
+ "step": 31814
+ },
+ {
+ "epoch": 86.68937329700273,
+ "grad_norm": 3.5533385276794434,
+ "learning_rate": 9.149278536325701e-07,
+ "loss": 0.0312,
+ "step": 31815
+ },
+ {
+ "epoch": 86.69209809264305,
+ "grad_norm": 2.2575623989105225,
+ "learning_rate": 9.145591217116378e-07,
+ "loss": 0.115,
+ "step": 31816
+ },
+ {
+ "epoch": 86.69482288828338,
+ "grad_norm": 2.2151005268096924,
+ "learning_rate": 9.141904605478291e-07,
+ "loss": 0.0812,
+ "step": 31817
+ },
+ {
+ "epoch": 86.6975476839237,
+ "grad_norm": 1.6522341966629028,
+ "learning_rate": 9.138218701440138e-07,
+ "loss": 0.0297,
+ "step": 31818
+ },
+ {
+ "epoch": 86.70027247956403,
+ "grad_norm": 2.0549027919769287,
+ "learning_rate": 9.134533505030596e-07,
+ "loss": 0.0254,
+ "step": 31819
+ },
+ {
+ "epoch": 86.70299727520435,
+ "grad_norm": 2.8211066722869873,
+ "learning_rate": 9.130849016278376e-07,
+ "loss": 0.1104,
+ "step": 31820
+ },
+ {
+ "epoch": 86.70572207084469,
+ "grad_norm": 11.08095932006836,
+ "learning_rate": 9.127165235212199e-07,
+ "loss": 0.0874,
+ "step": 31821
+ },
+ {
+ "epoch": 86.70844686648502,
+ "grad_norm": 2.0970847606658936,
+ "learning_rate": 9.12348216186072e-07,
+ "loss": 0.0357,
+ "step": 31822
+ },
+ {
+ "epoch": 86.71117166212534,
+ "grad_norm": 3.2193431854248047,
+ "learning_rate": 9.119799796252626e-07,
+ "loss": 0.0341,
+ "step": 31823
+ },
+ {
+ "epoch": 86.71389645776567,
+ "grad_norm": 3.7054831981658936,
+ "learning_rate": 9.116118138416619e-07,
+ "loss": 0.0803,
+ "step": 31824
+ },
+ {
+ "epoch": 86.71662125340599,
+ "grad_norm": 2.5147147178649902,
+ "learning_rate": 9.112437188381362e-07,
+ "loss": 0.0582,
+ "step": 31825
+ },
+ {
+ "epoch": 86.71934604904632,
+ "grad_norm": 2.2300379276275635,
+ "learning_rate": 9.108756946175523e-07,
+ "loss": 0.1179,
+ "step": 31826
+ },
+ {
+ "epoch": 86.72207084468666,
+ "grad_norm": 4.37146520614624,
+ "learning_rate": 9.105077411827757e-07,
+ "loss": 0.1824,
+ "step": 31827
+ },
+ {
+ "epoch": 86.72479564032697,
+ "grad_norm": 3.2096545696258545,
+ "learning_rate": 9.101398585366705e-07,
+ "loss": 0.1223,
+ "step": 31828
+ },
+ {
+ "epoch": 86.7275204359673,
+ "grad_norm": 3.0343284606933594,
+ "learning_rate": 9.097720466821059e-07,
+ "loss": 0.0778,
+ "step": 31829
+ },
+ {
+ "epoch": 86.73024523160763,
+ "grad_norm": 2.826237678527832,
+ "learning_rate": 9.094043056219437e-07,
+ "loss": 0.0406,
+ "step": 31830
+ },
+ {
+ "epoch": 86.73297002724796,
+ "grad_norm": 3.87508487701416,
+ "learning_rate": 9.090366353590485e-07,
+ "loss": 0.0679,
+ "step": 31831
+ },
+ {
+ "epoch": 86.73569482288828,
+ "grad_norm": 2.8609530925750732,
+ "learning_rate": 9.086690358962813e-07,
+ "loss": 0.0408,
+ "step": 31832
+ },
+ {
+ "epoch": 86.73841961852861,
+ "grad_norm": 3.1503353118896484,
+ "learning_rate": 9.083015072365087e-07,
+ "loss": 0.034,
+ "step": 31833
+ },
+ {
+ "epoch": 86.74114441416894,
+ "grad_norm": 2.6293821334838867,
+ "learning_rate": 9.079340493825916e-07,
+ "loss": 0.0878,
+ "step": 31834
+ },
+ {
+ "epoch": 86.74386920980926,
+ "grad_norm": 1.9450099468231201,
+ "learning_rate": 9.075666623373913e-07,
+ "loss": 0.1136,
+ "step": 31835
+ },
+ {
+ "epoch": 86.7465940054496,
+ "grad_norm": 2.772766351699829,
+ "learning_rate": 9.071993461037676e-07,
+ "loss": 0.097,
+ "step": 31836
+ },
+ {
+ "epoch": 86.74931880108991,
+ "grad_norm": 2.1210412979125977,
+ "learning_rate": 9.068321006845837e-07,
+ "loss": 0.0933,
+ "step": 31837
+ },
+ {
+ "epoch": 86.75204359673025,
+ "grad_norm": 3.3114240169525146,
+ "learning_rate": 9.064649260826997e-07,
+ "loss": 0.047,
+ "step": 31838
+ },
+ {
+ "epoch": 86.75476839237058,
+ "grad_norm": 1.7541974782943726,
+ "learning_rate": 9.060978223009742e-07,
+ "loss": 0.0447,
+ "step": 31839
+ },
+ {
+ "epoch": 86.7574931880109,
+ "grad_norm": 2.293485164642334,
+ "learning_rate": 9.05730789342264e-07,
+ "loss": 0.0547,
+ "step": 31840
+ },
+ {
+ "epoch": 86.76021798365123,
+ "grad_norm": 2.6151113510131836,
+ "learning_rate": 9.053638272094301e-07,
+ "loss": 0.0627,
+ "step": 31841
+ },
+ {
+ "epoch": 86.76294277929155,
+ "grad_norm": 3.138340473175049,
+ "learning_rate": 9.049969359053312e-07,
+ "loss": 0.0391,
+ "step": 31842
+ },
+ {
+ "epoch": 86.76566757493188,
+ "grad_norm": 2.081235647201538,
+ "learning_rate": 9.046301154328241e-07,
+ "loss": 0.1178,
+ "step": 31843
+ },
+ {
+ "epoch": 86.7683923705722,
+ "grad_norm": 2.535001516342163,
+ "learning_rate": 9.04263365794762e-07,
+ "loss": 0.0547,
+ "step": 31844
+ },
+ {
+ "epoch": 86.77111716621253,
+ "grad_norm": 3.6016337871551514,
+ "learning_rate": 9.038966869940069e-07,
+ "loss": 0.0424,
+ "step": 31845
+ },
+ {
+ "epoch": 86.77384196185287,
+ "grad_norm": 2.7954092025756836,
+ "learning_rate": 9.035300790334112e-07,
+ "loss": 0.1006,
+ "step": 31846
+ },
+ {
+ "epoch": 86.77656675749319,
+ "grad_norm": 2.7124500274658203,
+ "learning_rate": 9.031635419158314e-07,
+ "loss": 0.0766,
+ "step": 31847
+ },
+ {
+ "epoch": 86.77929155313352,
+ "grad_norm": 2.300968885421753,
+ "learning_rate": 9.027970756441184e-07,
+ "loss": 0.0377,
+ "step": 31848
+ },
+ {
+ "epoch": 86.78201634877384,
+ "grad_norm": 2.9123425483703613,
+ "learning_rate": 9.024306802211313e-07,
+ "loss": 0.0479,
+ "step": 31849
+ },
+ {
+ "epoch": 86.78474114441417,
+ "grad_norm": 2.441084861755371,
+ "learning_rate": 9.020643556497211e-07,
+ "loss": 0.0496,
+ "step": 31850
+ },
+ {
+ "epoch": 86.7874659400545,
+ "grad_norm": 3.1042938232421875,
+ "learning_rate": 9.016981019327397e-07,
+ "loss": 0.085,
+ "step": 31851
+ },
+ {
+ "epoch": 86.79019073569482,
+ "grad_norm": 2.328429698944092,
+ "learning_rate": 9.013319190730407e-07,
+ "loss": 0.0209,
+ "step": 31852
+ },
+ {
+ "epoch": 86.79291553133515,
+ "grad_norm": 4.259504318237305,
+ "learning_rate": 9.009658070734762e-07,
+ "loss": 0.1889,
+ "step": 31853
+ },
+ {
+ "epoch": 86.79564032697547,
+ "grad_norm": 2.216219902038574,
+ "learning_rate": 9.005997659368982e-07,
+ "loss": 0.0207,
+ "step": 31854
+ },
+ {
+ "epoch": 86.7983651226158,
+ "grad_norm": 2.459240674972534,
+ "learning_rate": 9.002337956661556e-07,
+ "loss": 0.0843,
+ "step": 31855
+ },
+ {
+ "epoch": 86.80108991825612,
+ "grad_norm": 2.159674882888794,
+ "learning_rate": 8.998678962640983e-07,
+ "loss": 0.0467,
+ "step": 31856
+ },
+ {
+ "epoch": 86.80381471389646,
+ "grad_norm": 2.2981133460998535,
+ "learning_rate": 8.995020677335764e-07,
+ "loss": 0.0356,
+ "step": 31857
+ },
+ {
+ "epoch": 86.80653950953679,
+ "grad_norm": 2.905636787414551,
+ "learning_rate": 8.99136310077442e-07,
+ "loss": 0.1357,
+ "step": 31858
+ },
+ {
+ "epoch": 86.80926430517711,
+ "grad_norm": 3.5976691246032715,
+ "learning_rate": 8.987706232985405e-07,
+ "loss": 0.0505,
+ "step": 31859
+ },
+ {
+ "epoch": 86.81198910081744,
+ "grad_norm": 3.997267961502075,
+ "learning_rate": 8.984050073997197e-07,
+ "loss": 0.0659,
+ "step": 31860
+ },
+ {
+ "epoch": 86.81471389645776,
+ "grad_norm": 3.3631575107574463,
+ "learning_rate": 8.980394623838273e-07,
+ "loss": 0.0684,
+ "step": 31861
+ },
+ {
+ "epoch": 86.8174386920981,
+ "grad_norm": 4.546899318695068,
+ "learning_rate": 8.976739882537122e-07,
+ "loss": 0.104,
+ "step": 31862
+ },
+ {
+ "epoch": 86.82016348773843,
+ "grad_norm": 2.5868873596191406,
+ "learning_rate": 8.973085850122187e-07,
+ "loss": 0.0408,
+ "step": 31863
+ },
+ {
+ "epoch": 86.82288828337875,
+ "grad_norm": 4.059663772583008,
+ "learning_rate": 8.969432526621924e-07,
+ "loss": 0.0644,
+ "step": 31864
+ },
+ {
+ "epoch": 86.82561307901908,
+ "grad_norm": 1.9142038822174072,
+ "learning_rate": 8.965779912064787e-07,
+ "loss": 0.0543,
+ "step": 31865
+ },
+ {
+ "epoch": 86.8283378746594,
+ "grad_norm": 2.3329153060913086,
+ "learning_rate": 8.962128006479232e-07,
+ "loss": 0.0354,
+ "step": 31866
+ },
+ {
+ "epoch": 86.83106267029973,
+ "grad_norm": 3.1029655933380127,
+ "learning_rate": 8.958476809893702e-07,
+ "loss": 0.0397,
+ "step": 31867
+ },
+ {
+ "epoch": 86.83378746594005,
+ "grad_norm": 2.926924705505371,
+ "learning_rate": 8.954826322336596e-07,
+ "loss": 0.0825,
+ "step": 31868
+ },
+ {
+ "epoch": 86.83651226158038,
+ "grad_norm": 2.328819513320923,
+ "learning_rate": 8.951176543836404e-07,
+ "loss": 0.0427,
+ "step": 31869
+ },
+ {
+ "epoch": 86.83923705722071,
+ "grad_norm": 1.3802648782730103,
+ "learning_rate": 8.947527474421513e-07,
+ "loss": 0.0187,
+ "step": 31870
+ },
+ {
+ "epoch": 86.84196185286103,
+ "grad_norm": 3.1059184074401855,
+ "learning_rate": 8.943879114120347e-07,
+ "loss": 0.0925,
+ "step": 31871
+ },
+ {
+ "epoch": 86.84468664850137,
+ "grad_norm": 3.1488611698150635,
+ "learning_rate": 8.940231462961302e-07,
+ "loss": 0.0365,
+ "step": 31872
+ },
+ {
+ "epoch": 86.84741144414168,
+ "grad_norm": 3.2357780933380127,
+ "learning_rate": 8.936584520972824e-07,
+ "loss": 0.0765,
+ "step": 31873
+ },
+ {
+ "epoch": 86.85013623978202,
+ "grad_norm": 4.385752201080322,
+ "learning_rate": 8.932938288183268e-07,
+ "loss": 0.1023,
+ "step": 31874
+ },
+ {
+ "epoch": 86.85286103542235,
+ "grad_norm": 1.538090705871582,
+ "learning_rate": 8.929292764621078e-07,
+ "loss": 0.0219,
+ "step": 31875
+ },
+ {
+ "epoch": 86.85558583106267,
+ "grad_norm": 3.7086973190307617,
+ "learning_rate": 8.925647950314631e-07,
+ "loss": 0.0296,
+ "step": 31876
+ },
+ {
+ "epoch": 86.858310626703,
+ "grad_norm": 1.9129804372787476,
+ "learning_rate": 8.922003845292293e-07,
+ "loss": 0.0354,
+ "step": 31877
+ },
+ {
+ "epoch": 86.86103542234332,
+ "grad_norm": 2.6988542079925537,
+ "learning_rate": 8.918360449582464e-07,
+ "loss": 0.0794,
+ "step": 31878
+ },
+ {
+ "epoch": 86.86376021798365,
+ "grad_norm": 2.3943700790405273,
+ "learning_rate": 8.914717763213521e-07,
+ "loss": 0.0245,
+ "step": 31879
+ },
+ {
+ "epoch": 86.86648501362397,
+ "grad_norm": 2.104721784591675,
+ "learning_rate": 8.911075786213819e-07,
+ "loss": 0.1231,
+ "step": 31880
+ },
+ {
+ "epoch": 86.8692098092643,
+ "grad_norm": 2.727410316467285,
+ "learning_rate": 8.907434518611713e-07,
+ "loss": 0.0293,
+ "step": 31881
+ },
+ {
+ "epoch": 86.87193460490464,
+ "grad_norm": 5.318673133850098,
+ "learning_rate": 8.903793960435592e-07,
+ "loss": 0.1412,
+ "step": 31882
+ },
+ {
+ "epoch": 86.87465940054496,
+ "grad_norm": 2.8119523525238037,
+ "learning_rate": 8.900154111713787e-07,
+ "loss": 0.0371,
+ "step": 31883
+ },
+ {
+ "epoch": 86.87738419618529,
+ "grad_norm": 3.3595151901245117,
+ "learning_rate": 8.896514972474657e-07,
+ "loss": 0.0228,
+ "step": 31884
+ },
+ {
+ "epoch": 86.88010899182561,
+ "grad_norm": 2.101471185684204,
+ "learning_rate": 8.892876542746509e-07,
+ "loss": 0.0845,
+ "step": 31885
+ },
+ {
+ "epoch": 86.88283378746594,
+ "grad_norm": 4.005616188049316,
+ "learning_rate": 8.889238822557733e-07,
+ "loss": 0.056,
+ "step": 31886
+ },
+ {
+ "epoch": 86.88555858310627,
+ "grad_norm": 2.5760974884033203,
+ "learning_rate": 8.885601811936628e-07,
+ "loss": 0.1622,
+ "step": 31887
+ },
+ {
+ "epoch": 86.88828337874659,
+ "grad_norm": 1.8493988513946533,
+ "learning_rate": 8.881965510911506e-07,
+ "loss": 0.0256,
+ "step": 31888
+ },
+ {
+ "epoch": 86.89100817438693,
+ "grad_norm": 4.823277950286865,
+ "learning_rate": 8.87832991951072e-07,
+ "loss": 0.0253,
+ "step": 31889
+ },
+ {
+ "epoch": 86.89373297002724,
+ "grad_norm": 2.7438676357269287,
+ "learning_rate": 8.874695037762571e-07,
+ "loss": 0.1183,
+ "step": 31890
+ },
+ {
+ "epoch": 86.89645776566758,
+ "grad_norm": 2.3376359939575195,
+ "learning_rate": 8.871060865695347e-07,
+ "loss": 0.0327,
+ "step": 31891
+ },
+ {
+ "epoch": 86.8991825613079,
+ "grad_norm": 2.2812001705169678,
+ "learning_rate": 8.867427403337392e-07,
+ "loss": 0.0224,
+ "step": 31892
+ },
+ {
+ "epoch": 86.90190735694823,
+ "grad_norm": 1.6706823110580444,
+ "learning_rate": 8.86379465071695e-07,
+ "loss": 0.0216,
+ "step": 31893
+ },
+ {
+ "epoch": 86.90463215258856,
+ "grad_norm": 5.328125,
+ "learning_rate": 8.860162607862366e-07,
+ "loss": 0.0358,
+ "step": 31894
+ },
+ {
+ "epoch": 86.90735694822888,
+ "grad_norm": 2.010127544403076,
+ "learning_rate": 8.856531274801904e-07,
+ "loss": 0.1028,
+ "step": 31895
+ },
+ {
+ "epoch": 86.91008174386921,
+ "grad_norm": 2.0606815814971924,
+ "learning_rate": 8.852900651563833e-07,
+ "loss": 0.0237,
+ "step": 31896
+ },
+ {
+ "epoch": 86.91280653950953,
+ "grad_norm": 2.7134268283843994,
+ "learning_rate": 8.84927073817643e-07,
+ "loss": 0.0866,
+ "step": 31897
+ },
+ {
+ "epoch": 86.91553133514986,
+ "grad_norm": 2.1887168884277344,
+ "learning_rate": 8.845641534667993e-07,
+ "loss": 0.0237,
+ "step": 31898
+ },
+ {
+ "epoch": 86.9182561307902,
+ "grad_norm": 2.4767327308654785,
+ "learning_rate": 8.842013041066754e-07,
+ "loss": 0.1119,
+ "step": 31899
+ },
+ {
+ "epoch": 86.92098092643052,
+ "grad_norm": 3.3079845905303955,
+ "learning_rate": 8.838385257400994e-07,
+ "loss": 0.043,
+ "step": 31900
+ },
+ {
+ "epoch": 86.92370572207085,
+ "grad_norm": 1.898982048034668,
+ "learning_rate": 8.834758183698933e-07,
+ "loss": 0.0299,
+ "step": 31901
+ },
+ {
+ "epoch": 86.92643051771117,
+ "grad_norm": 2.012143611907959,
+ "learning_rate": 8.831131819988859e-07,
+ "loss": 0.0359,
+ "step": 31902
+ },
+ {
+ "epoch": 86.9291553133515,
+ "grad_norm": 2.660198926925659,
+ "learning_rate": 8.827506166298994e-07,
+ "loss": 0.1469,
+ "step": 31903
+ },
+ {
+ "epoch": 86.93188010899182,
+ "grad_norm": 2.0650031566619873,
+ "learning_rate": 8.823881222657582e-07,
+ "loss": 0.0967,
+ "step": 31904
+ },
+ {
+ "epoch": 86.93460490463215,
+ "grad_norm": 2.527787208557129,
+ "learning_rate": 8.820256989092824e-07,
+ "loss": 0.07,
+ "step": 31905
+ },
+ {
+ "epoch": 86.93732970027249,
+ "grad_norm": 2.7898435592651367,
+ "learning_rate": 8.816633465632996e-07,
+ "loss": 0.1494,
+ "step": 31906
+ },
+ {
+ "epoch": 86.9400544959128,
+ "grad_norm": 1.7793904542922974,
+ "learning_rate": 8.813010652306286e-07,
+ "loss": 0.0227,
+ "step": 31907
+ },
+ {
+ "epoch": 86.94277929155314,
+ "grad_norm": 3.2279844284057617,
+ "learning_rate": 8.809388549140918e-07,
+ "loss": 0.0329,
+ "step": 31908
+ },
+ {
+ "epoch": 86.94550408719346,
+ "grad_norm": 1.4497243165969849,
+ "learning_rate": 8.805767156165057e-07,
+ "loss": 0.0203,
+ "step": 31909
+ },
+ {
+ "epoch": 86.94822888283379,
+ "grad_norm": 4.106661319732666,
+ "learning_rate": 8.802146473406991e-07,
+ "loss": 0.1039,
+ "step": 31910
+ },
+ {
+ "epoch": 86.95095367847412,
+ "grad_norm": 2.7305715084075928,
+ "learning_rate": 8.798526500894866e-07,
+ "loss": 0.0335,
+ "step": 31911
+ },
+ {
+ "epoch": 86.95367847411444,
+ "grad_norm": 2.0169501304626465,
+ "learning_rate": 8.79490723865688e-07,
+ "loss": 0.0247,
+ "step": 31912
+ },
+ {
+ "epoch": 86.95640326975477,
+ "grad_norm": 3.3821303844451904,
+ "learning_rate": 8.7912886867212e-07,
+ "loss": 0.0529,
+ "step": 31913
+ },
+ {
+ "epoch": 86.95912806539509,
+ "grad_norm": 4.41207218170166,
+ "learning_rate": 8.787670845116059e-07,
+ "loss": 0.1172,
+ "step": 31914
+ },
+ {
+ "epoch": 86.96185286103542,
+ "grad_norm": 2.8587772846221924,
+ "learning_rate": 8.784053713869589e-07,
+ "loss": 0.0516,
+ "step": 31915
+ },
+ {
+ "epoch": 86.96457765667574,
+ "grad_norm": 3.60770320892334,
+ "learning_rate": 8.78043729300998e-07,
+ "loss": 0.0603,
+ "step": 31916
+ },
+ {
+ "epoch": 86.96730245231608,
+ "grad_norm": 3.2521111965179443,
+ "learning_rate": 8.776821582565365e-07,
+ "loss": 0.0331,
+ "step": 31917
+ },
+ {
+ "epoch": 86.97002724795641,
+ "grad_norm": 2.495760917663574,
+ "learning_rate": 8.773206582563953e-07,
+ "loss": 0.0235,
+ "step": 31918
+ },
+ {
+ "epoch": 86.97275204359673,
+ "grad_norm": 4.632887363433838,
+ "learning_rate": 8.769592293033868e-07,
+ "loss": 0.036,
+ "step": 31919
+ },
+ {
+ "epoch": 86.97547683923706,
+ "grad_norm": 1.7221351861953735,
+ "learning_rate": 8.765978714003265e-07,
+ "loss": 0.0354,
+ "step": 31920
+ },
+ {
+ "epoch": 86.97820163487738,
+ "grad_norm": 2.451761245727539,
+ "learning_rate": 8.762365845500265e-07,
+ "loss": 0.0454,
+ "step": 31921
+ },
+ {
+ "epoch": 86.98092643051771,
+ "grad_norm": 4.969675064086914,
+ "learning_rate": 8.758753687553035e-07,
+ "loss": 0.1991,
+ "step": 31922
+ },
+ {
+ "epoch": 86.98365122615803,
+ "grad_norm": 1.9271904230117798,
+ "learning_rate": 8.755142240189706e-07,
+ "loss": 0.0205,
+ "step": 31923
+ },
+ {
+ "epoch": 86.98637602179836,
+ "grad_norm": 2.6992568969726562,
+ "learning_rate": 8.751531503438382e-07,
+ "loss": 0.041,
+ "step": 31924
+ },
+ {
+ "epoch": 86.9891008174387,
+ "grad_norm": 2.373265266418457,
+ "learning_rate": 8.747921477327182e-07,
+ "loss": 0.1707,
+ "step": 31925
+ },
+ {
+ "epoch": 86.99182561307902,
+ "grad_norm": 2.343313455581665,
+ "learning_rate": 8.744312161884228e-07,
+ "loss": 0.0607,
+ "step": 31926
+ },
+ {
+ "epoch": 86.99455040871935,
+ "grad_norm": 1.9195460081100464,
+ "learning_rate": 8.740703557137653e-07,
+ "loss": 0.0277,
+ "step": 31927
+ },
+ {
+ "epoch": 86.99727520435967,
+ "grad_norm": 1.5488792657852173,
+ "learning_rate": 8.737095663115547e-07,
+ "loss": 0.1361,
+ "step": 31928
+ },
+ {
+ "epoch": 87.0,
+ "grad_norm": 2.9402854442596436,
+ "learning_rate": 8.733488479845997e-07,
+ "loss": 0.0556,
+ "step": 31929
+ },
+ {
+ "epoch": 87.00272479564033,
+ "grad_norm": 2.30751895904541,
+ "learning_rate": 8.729882007357083e-07,
+ "loss": 0.026,
+ "step": 31930
+ },
+ {
+ "epoch": 87.00544959128065,
+ "grad_norm": 2.3755152225494385,
+ "learning_rate": 8.726276245676934e-07,
+ "loss": 0.1469,
+ "step": 31931
+ },
+ {
+ "epoch": 87.00817438692098,
+ "grad_norm": 2.6640377044677734,
+ "learning_rate": 8.722671194833598e-07,
+ "loss": 0.038,
+ "step": 31932
+ },
+ {
+ "epoch": 87.0108991825613,
+ "grad_norm": 2.6814212799072266,
+ "learning_rate": 8.719066854855151e-07,
+ "loss": 0.1313,
+ "step": 31933
+ },
+ {
+ "epoch": 87.01362397820164,
+ "grad_norm": 2.758610248565674,
+ "learning_rate": 8.715463225769693e-07,
+ "loss": 0.0336,
+ "step": 31934
+ },
+ {
+ "epoch": 87.01634877384195,
+ "grad_norm": 3.4616310596466064,
+ "learning_rate": 8.711860307605257e-07,
+ "loss": 0.1166,
+ "step": 31935
+ },
+ {
+ "epoch": 87.01907356948229,
+ "grad_norm": 1.5524550676345825,
+ "learning_rate": 8.708258100389933e-07,
+ "loss": 0.0221,
+ "step": 31936
+ },
+ {
+ "epoch": 87.02179836512262,
+ "grad_norm": 2.028284788131714,
+ "learning_rate": 8.704656604151729e-07,
+ "loss": 0.0186,
+ "step": 31937
+ },
+ {
+ "epoch": 87.02452316076294,
+ "grad_norm": 3.196913480758667,
+ "learning_rate": 8.701055818918736e-07,
+ "loss": 0.0307,
+ "step": 31938
+ },
+ {
+ "epoch": 87.02724795640327,
+ "grad_norm": 3.3685288429260254,
+ "learning_rate": 8.697455744718985e-07,
+ "loss": 0.0929,
+ "step": 31939
+ },
+ {
+ "epoch": 87.02997275204359,
+ "grad_norm": 2.4672834873199463,
+ "learning_rate": 8.693856381580512e-07,
+ "loss": 0.1396,
+ "step": 31940
+ },
+ {
+ "epoch": 87.03269754768392,
+ "grad_norm": 2.7180583477020264,
+ "learning_rate": 8.690257729531326e-07,
+ "loss": 0.0294,
+ "step": 31941
+ },
+ {
+ "epoch": 87.03542234332426,
+ "grad_norm": 1.4101189374923706,
+ "learning_rate": 8.686659788599494e-07,
+ "loss": 0.0237,
+ "step": 31942
+ },
+ {
+ "epoch": 87.03814713896458,
+ "grad_norm": 13.789135932922363,
+ "learning_rate": 8.683062558812994e-07,
+ "loss": 0.0596,
+ "step": 31943
+ },
+ {
+ "epoch": 87.04087193460491,
+ "grad_norm": 3.0247530937194824,
+ "learning_rate": 8.679466040199891e-07,
+ "loss": 0.0793,
+ "step": 31944
+ },
+ {
+ "epoch": 87.04359673024523,
+ "grad_norm": 3.7759997844696045,
+ "learning_rate": 8.675870232788164e-07,
+ "loss": 0.1435,
+ "step": 31945
+ },
+ {
+ "epoch": 87.04632152588556,
+ "grad_norm": 3.1340579986572266,
+ "learning_rate": 8.672275136605801e-07,
+ "loss": 0.1152,
+ "step": 31946
+ },
+ {
+ "epoch": 87.04904632152588,
+ "grad_norm": 2.5545504093170166,
+ "learning_rate": 8.668680751680836e-07,
+ "loss": 0.0429,
+ "step": 31947
+ },
+ {
+ "epoch": 87.05177111716621,
+ "grad_norm": 2.539555549621582,
+ "learning_rate": 8.665087078041245e-07,
+ "loss": 0.0214,
+ "step": 31948
+ },
+ {
+ "epoch": 87.05449591280654,
+ "grad_norm": 1.6589235067367554,
+ "learning_rate": 8.661494115715019e-07,
+ "loss": 0.0223,
+ "step": 31949
+ },
+ {
+ "epoch": 87.05722070844686,
+ "grad_norm": 2.8541224002838135,
+ "learning_rate": 8.657901864730112e-07,
+ "loss": 0.0499,
+ "step": 31950
+ },
+ {
+ "epoch": 87.0599455040872,
+ "grad_norm": 3.6259543895721436,
+ "learning_rate": 8.654310325114557e-07,
+ "loss": 0.0718,
+ "step": 31951
+ },
+ {
+ "epoch": 87.06267029972751,
+ "grad_norm": 6.198474407196045,
+ "learning_rate": 8.650719496896287e-07,
+ "loss": 0.0982,
+ "step": 31952
+ },
+ {
+ "epoch": 87.06539509536785,
+ "grad_norm": 2.609693765640259,
+ "learning_rate": 8.647129380103248e-07,
+ "loss": 0.0179,
+ "step": 31953
+ },
+ {
+ "epoch": 87.06811989100818,
+ "grad_norm": 2.1050493717193604,
+ "learning_rate": 8.643539974763449e-07,
+ "loss": 0.0784,
+ "step": 31954
+ },
+ {
+ "epoch": 87.0708446866485,
+ "grad_norm": 1.9728049039840698,
+ "learning_rate": 8.639951280904824e-07,
+ "loss": 0.1097,
+ "step": 31955
+ },
+ {
+ "epoch": 87.07356948228883,
+ "grad_norm": 2.081594467163086,
+ "learning_rate": 8.636363298555317e-07,
+ "loss": 0.0273,
+ "step": 31956
+ },
+ {
+ "epoch": 87.07629427792915,
+ "grad_norm": 1.9430947303771973,
+ "learning_rate": 8.632776027742851e-07,
+ "loss": 0.1135,
+ "step": 31957
+ },
+ {
+ "epoch": 87.07901907356948,
+ "grad_norm": 2.7454442977905273,
+ "learning_rate": 8.629189468495402e-07,
+ "loss": 0.0389,
+ "step": 31958
+ },
+ {
+ "epoch": 87.0817438692098,
+ "grad_norm": 5.959187984466553,
+ "learning_rate": 8.625603620840894e-07,
+ "loss": 0.0393,
+ "step": 31959
+ },
+ {
+ "epoch": 87.08446866485014,
+ "grad_norm": 1.8962658643722534,
+ "learning_rate": 8.622018484807215e-07,
+ "loss": 0.0295,
+ "step": 31960
+ },
+ {
+ "epoch": 87.08719346049047,
+ "grad_norm": 10.90555477142334,
+ "learning_rate": 8.618434060422331e-07,
+ "loss": 0.057,
+ "step": 31961
+ },
+ {
+ "epoch": 87.08991825613079,
+ "grad_norm": 2.2312071323394775,
+ "learning_rate": 8.614850347714132e-07,
+ "loss": 0.0691,
+ "step": 31962
+ },
+ {
+ "epoch": 87.09264305177112,
+ "grad_norm": 2.277768850326538,
+ "learning_rate": 8.61126734671055e-07,
+ "loss": 0.0458,
+ "step": 31963
+ },
+ {
+ "epoch": 87.09536784741144,
+ "grad_norm": 2.634031057357788,
+ "learning_rate": 8.607685057439486e-07,
+ "loss": 0.044,
+ "step": 31964
+ },
+ {
+ "epoch": 87.09809264305177,
+ "grad_norm": 1.797587275505066,
+ "learning_rate": 8.604103479928815e-07,
+ "loss": 0.0279,
+ "step": 31965
+ },
+ {
+ "epoch": 87.1008174386921,
+ "grad_norm": 3.5806045532226562,
+ "learning_rate": 8.600522614206442e-07,
+ "loss": 0.1663,
+ "step": 31966
+ },
+ {
+ "epoch": 87.10354223433242,
+ "grad_norm": 1.9146403074264526,
+ "learning_rate": 8.596942460300261e-07,
+ "loss": 0.0673,
+ "step": 31967
+ },
+ {
+ "epoch": 87.10626702997276,
+ "grad_norm": 3.6403446197509766,
+ "learning_rate": 8.593363018238154e-07,
+ "loss": 0.0812,
+ "step": 31968
+ },
+ {
+ "epoch": 87.10899182561307,
+ "grad_norm": 2.977989912033081,
+ "learning_rate": 8.589784288047997e-07,
+ "loss": 0.0325,
+ "step": 31969
+ },
+ {
+ "epoch": 87.11171662125341,
+ "grad_norm": 1.993374228477478,
+ "learning_rate": 8.586206269757647e-07,
+ "loss": 0.0668,
+ "step": 31970
+ },
+ {
+ "epoch": 87.11444141689373,
+ "grad_norm": 2.3206489086151123,
+ "learning_rate": 8.58262896339499e-07,
+ "loss": 0.0424,
+ "step": 31971
+ },
+ {
+ "epoch": 87.11716621253406,
+ "grad_norm": 3.1360924243927,
+ "learning_rate": 8.579052368987872e-07,
+ "loss": 0.0473,
+ "step": 31972
+ },
+ {
+ "epoch": 87.11989100817439,
+ "grad_norm": 2.342132329940796,
+ "learning_rate": 8.57547648656416e-07,
+ "loss": 0.1698,
+ "step": 31973
+ },
+ {
+ "epoch": 87.12261580381471,
+ "grad_norm": 2.187732458114624,
+ "learning_rate": 8.571901316151676e-07,
+ "loss": 0.0246,
+ "step": 31974
+ },
+ {
+ "epoch": 87.12534059945504,
+ "grad_norm": 1.0331571102142334,
+ "learning_rate": 8.568326857778297e-07,
+ "loss": 0.0133,
+ "step": 31975
+ },
+ {
+ "epoch": 87.12806539509536,
+ "grad_norm": 2.2067832946777344,
+ "learning_rate": 8.564753111471847e-07,
+ "loss": 0.0335,
+ "step": 31976
+ },
+ {
+ "epoch": 87.1307901907357,
+ "grad_norm": 2.947394609451294,
+ "learning_rate": 8.561180077260134e-07,
+ "loss": 0.0362,
+ "step": 31977
+ },
+ {
+ "epoch": 87.13351498637603,
+ "grad_norm": 2.036851406097412,
+ "learning_rate": 8.557607755171016e-07,
+ "loss": 0.024,
+ "step": 31978
+ },
+ {
+ "epoch": 87.13623978201635,
+ "grad_norm": 1.8236857652664185,
+ "learning_rate": 8.554036145232314e-07,
+ "loss": 0.0243,
+ "step": 31979
+ },
+ {
+ "epoch": 87.13896457765668,
+ "grad_norm": 1.9249520301818848,
+ "learning_rate": 8.550465247471839e-07,
+ "loss": 0.0346,
+ "step": 31980
+ },
+ {
+ "epoch": 87.141689373297,
+ "grad_norm": 2.917386770248413,
+ "learning_rate": 8.546895061917404e-07,
+ "loss": 0.0836,
+ "step": 31981
+ },
+ {
+ "epoch": 87.14441416893733,
+ "grad_norm": 3.850255250930786,
+ "learning_rate": 8.543325588596785e-07,
+ "loss": 0.0261,
+ "step": 31982
+ },
+ {
+ "epoch": 87.14713896457765,
+ "grad_norm": 2.069046974182129,
+ "learning_rate": 8.539756827537815e-07,
+ "loss": 0.0389,
+ "step": 31983
+ },
+ {
+ "epoch": 87.14986376021798,
+ "grad_norm": 9.028697967529297,
+ "learning_rate": 8.536188778768284e-07,
+ "loss": 0.0376,
+ "step": 31984
+ },
+ {
+ "epoch": 87.15258855585832,
+ "grad_norm": 4.243398666381836,
+ "learning_rate": 8.53262144231597e-07,
+ "loss": 0.0577,
+ "step": 31985
+ },
+ {
+ "epoch": 87.15531335149863,
+ "grad_norm": 2.879706382751465,
+ "learning_rate": 8.529054818208638e-07,
+ "loss": 0.0732,
+ "step": 31986
+ },
+ {
+ "epoch": 87.15803814713897,
+ "grad_norm": 2.511085033416748,
+ "learning_rate": 8.525488906474089e-07,
+ "loss": 0.1094,
+ "step": 31987
+ },
+ {
+ "epoch": 87.16076294277929,
+ "grad_norm": 1.7432821989059448,
+ "learning_rate": 8.521923707140101e-07,
+ "loss": 0.0207,
+ "step": 31988
+ },
+ {
+ "epoch": 87.16348773841962,
+ "grad_norm": 3.6034116744995117,
+ "learning_rate": 8.518359220234429e-07,
+ "loss": 0.0448,
+ "step": 31989
+ },
+ {
+ "epoch": 87.16621253405995,
+ "grad_norm": 1.8865264654159546,
+ "learning_rate": 8.514795445784807e-07,
+ "loss": 0.0292,
+ "step": 31990
+ },
+ {
+ "epoch": 87.16893732970027,
+ "grad_norm": 5.443391799926758,
+ "learning_rate": 8.511232383819024e-07,
+ "loss": 0.1571,
+ "step": 31991
+ },
+ {
+ "epoch": 87.1716621253406,
+ "grad_norm": 3.189753293991089,
+ "learning_rate": 8.507670034364834e-07,
+ "loss": 0.0864,
+ "step": 31992
+ },
+ {
+ "epoch": 87.17438692098092,
+ "grad_norm": 2.250596046447754,
+ "learning_rate": 8.504108397449962e-07,
+ "loss": 0.025,
+ "step": 31993
+ },
+ {
+ "epoch": 87.17711171662125,
+ "grad_norm": 2.4600954055786133,
+ "learning_rate": 8.500547473102116e-07,
+ "loss": 0.0389,
+ "step": 31994
+ },
+ {
+ "epoch": 87.17983651226157,
+ "grad_norm": 3.1625146865844727,
+ "learning_rate": 8.496987261349077e-07,
+ "loss": 0.0632,
+ "step": 31995
+ },
+ {
+ "epoch": 87.1825613079019,
+ "grad_norm": 3.342609167098999,
+ "learning_rate": 8.493427762218575e-07,
+ "loss": 0.0461,
+ "step": 31996
+ },
+ {
+ "epoch": 87.18528610354224,
+ "grad_norm": 4.623934268951416,
+ "learning_rate": 8.489868975738303e-07,
+ "loss": 0.0715,
+ "step": 31997
+ },
+ {
+ "epoch": 87.18801089918256,
+ "grad_norm": 2.85520601272583,
+ "learning_rate": 8.486310901935968e-07,
+ "loss": 0.0348,
+ "step": 31998
+ },
+ {
+ "epoch": 87.19073569482289,
+ "grad_norm": 2.3970866203308105,
+ "learning_rate": 8.482753540839328e-07,
+ "loss": 0.0296,
+ "step": 31999
+ },
+ {
+ "epoch": 87.19346049046321,
+ "grad_norm": 4.5319342613220215,
+ "learning_rate": 8.479196892476049e-07,
+ "loss": 0.0769,
+ "step": 32000
+ },
+ {
+ "epoch": 87.19618528610354,
+ "grad_norm": 3.3380751609802246,
+ "learning_rate": 8.475640956873843e-07,
+ "loss": 0.077,
+ "step": 32001
+ },
+ {
+ "epoch": 87.19891008174388,
+ "grad_norm": 2.58056640625,
+ "learning_rate": 8.472085734060376e-07,
+ "loss": 0.0666,
+ "step": 32002
+ },
+ {
+ "epoch": 87.2016348773842,
+ "grad_norm": 2.57891845703125,
+ "learning_rate": 8.468531224063381e-07,
+ "loss": 0.0326,
+ "step": 32003
+ },
+ {
+ "epoch": 87.20435967302453,
+ "grad_norm": 2.006296157836914,
+ "learning_rate": 8.464977426910514e-07,
+ "loss": 0.0281,
+ "step": 32004
+ },
+ {
+ "epoch": 87.20708446866485,
+ "grad_norm": 2.3370838165283203,
+ "learning_rate": 8.461424342629465e-07,
+ "loss": 0.0364,
+ "step": 32005
+ },
+ {
+ "epoch": 87.20980926430518,
+ "grad_norm": 2.5445826053619385,
+ "learning_rate": 8.457871971247877e-07,
+ "loss": 0.1144,
+ "step": 32006
+ },
+ {
+ "epoch": 87.2125340599455,
+ "grad_norm": 2.2657854557037354,
+ "learning_rate": 8.454320312793451e-07,
+ "loss": 0.0289,
+ "step": 32007
+ },
+ {
+ "epoch": 87.21525885558583,
+ "grad_norm": 6.7753825187683105,
+ "learning_rate": 8.450769367293832e-07,
+ "loss": 0.0304,
+ "step": 32008
+ },
+ {
+ "epoch": 87.21798365122616,
+ "grad_norm": 1.9065998792648315,
+ "learning_rate": 8.447219134776674e-07,
+ "loss": 0.0217,
+ "step": 32009
+ },
+ {
+ "epoch": 87.22070844686648,
+ "grad_norm": 2.338294744491577,
+ "learning_rate": 8.443669615269611e-07,
+ "loss": 0.1282,
+ "step": 32010
+ },
+ {
+ "epoch": 87.22343324250681,
+ "grad_norm": 2.3199870586395264,
+ "learning_rate": 8.440120808800323e-07,
+ "loss": 0.0515,
+ "step": 32011
+ },
+ {
+ "epoch": 87.22615803814713,
+ "grad_norm": 2.0141749382019043,
+ "learning_rate": 8.436572715396407e-07,
+ "loss": 0.0718,
+ "step": 32012
+ },
+ {
+ "epoch": 87.22888283378747,
+ "grad_norm": 2.863680362701416,
+ "learning_rate": 8.433025335085532e-07,
+ "loss": 0.0327,
+ "step": 32013
+ },
+ {
+ "epoch": 87.2316076294278,
+ "grad_norm": 2.172550916671753,
+ "learning_rate": 8.429478667895307e-07,
+ "loss": 0.0244,
+ "step": 32014
+ },
+ {
+ "epoch": 87.23433242506812,
+ "grad_norm": 3.00764799118042,
+ "learning_rate": 8.425932713853346e-07,
+ "loss": 0.0572,
+ "step": 32015
+ },
+ {
+ "epoch": 87.23705722070845,
+ "grad_norm": 15.083392143249512,
+ "learning_rate": 8.422387472987281e-07,
+ "loss": 0.0299,
+ "step": 32016
+ },
+ {
+ "epoch": 87.23978201634877,
+ "grad_norm": 2.5588722229003906,
+ "learning_rate": 8.418842945324724e-07,
+ "loss": 0.0271,
+ "step": 32017
+ },
+ {
+ "epoch": 87.2425068119891,
+ "grad_norm": 4.644388198852539,
+ "learning_rate": 8.415299130893251e-07,
+ "loss": 0.0737,
+ "step": 32018
+ },
+ {
+ "epoch": 87.24523160762942,
+ "grad_norm": 2.2760121822357178,
+ "learning_rate": 8.411756029720497e-07,
+ "loss": 0.0431,
+ "step": 32019
+ },
+ {
+ "epoch": 87.24795640326975,
+ "grad_norm": 2.807145118713379,
+ "learning_rate": 8.408213641834029e-07,
+ "loss": 0.0366,
+ "step": 32020
+ },
+ {
+ "epoch": 87.25068119891009,
+ "grad_norm": 1.9172195196151733,
+ "learning_rate": 8.404671967261457e-07,
+ "loss": 0.0674,
+ "step": 32021
+ },
+ {
+ "epoch": 87.2534059945504,
+ "grad_norm": 2.739680528640747,
+ "learning_rate": 8.401131006030327e-07,
+ "loss": 0.0451,
+ "step": 32022
+ },
+ {
+ "epoch": 87.25613079019074,
+ "grad_norm": 3.617414951324463,
+ "learning_rate": 8.397590758168272e-07,
+ "loss": 0.128,
+ "step": 32023
+ },
+ {
+ "epoch": 87.25885558583106,
+ "grad_norm": 2.3763816356658936,
+ "learning_rate": 8.394051223702815e-07,
+ "loss": 0.0491,
+ "step": 32024
+ },
+ {
+ "epoch": 87.26158038147139,
+ "grad_norm": 3.6216704845428467,
+ "learning_rate": 8.390512402661555e-07,
+ "loss": 0.1775,
+ "step": 32025
+ },
+ {
+ "epoch": 87.26430517711172,
+ "grad_norm": 2.240335464477539,
+ "learning_rate": 8.386974295072004e-07,
+ "loss": 0.025,
+ "step": 32026
+ },
+ {
+ "epoch": 87.26702997275204,
+ "grad_norm": 2.863473653793335,
+ "learning_rate": 8.383436900961772e-07,
+ "loss": 0.072,
+ "step": 32027
+ },
+ {
+ "epoch": 87.26975476839237,
+ "grad_norm": 3.8904831409454346,
+ "learning_rate": 8.379900220358384e-07,
+ "loss": 0.0481,
+ "step": 32028
+ },
+ {
+ "epoch": 87.2724795640327,
+ "grad_norm": 2.4198544025421143,
+ "learning_rate": 8.376364253289371e-07,
+ "loss": 0.1564,
+ "step": 32029
+ },
+ {
+ "epoch": 87.27520435967303,
+ "grad_norm": 2.7671501636505127,
+ "learning_rate": 8.372828999782301e-07,
+ "loss": 0.0377,
+ "step": 32030
+ },
+ {
+ "epoch": 87.27792915531334,
+ "grad_norm": 2.004340887069702,
+ "learning_rate": 8.369294459864663e-07,
+ "loss": 0.0227,
+ "step": 32031
+ },
+ {
+ "epoch": 87.28065395095368,
+ "grad_norm": 2.9251890182495117,
+ "learning_rate": 8.365760633564035e-07,
+ "loss": 0.0939,
+ "step": 32032
+ },
+ {
+ "epoch": 87.28337874659401,
+ "grad_norm": 4.655163764953613,
+ "learning_rate": 8.362227520907918e-07,
+ "loss": 0.0331,
+ "step": 32033
+ },
+ {
+ "epoch": 87.28610354223433,
+ "grad_norm": 3.044646978378296,
+ "learning_rate": 8.35869512192381e-07,
+ "loss": 0.035,
+ "step": 32034
+ },
+ {
+ "epoch": 87.28882833787466,
+ "grad_norm": 2.171783924102783,
+ "learning_rate": 8.355163436639236e-07,
+ "loss": 0.0323,
+ "step": 32035
+ },
+ {
+ "epoch": 87.29155313351498,
+ "grad_norm": 1.5490366220474243,
+ "learning_rate": 8.351632465081705e-07,
+ "loss": 0.2205,
+ "step": 32036
+ },
+ {
+ "epoch": 87.29427792915531,
+ "grad_norm": 2.554487466812134,
+ "learning_rate": 8.348102207278708e-07,
+ "loss": 0.1241,
+ "step": 32037
+ },
+ {
+ "epoch": 87.29700272479565,
+ "grad_norm": 1.847252607345581,
+ "learning_rate": 8.344572663257755e-07,
+ "loss": 0.0343,
+ "step": 32038
+ },
+ {
+ "epoch": 87.29972752043597,
+ "grad_norm": 2.1390950679779053,
+ "learning_rate": 8.341043833046292e-07,
+ "loss": 0.0283,
+ "step": 32039
+ },
+ {
+ "epoch": 87.3024523160763,
+ "grad_norm": 3.2583892345428467,
+ "learning_rate": 8.337515716671851e-07,
+ "loss": 0.1564,
+ "step": 32040
+ },
+ {
+ "epoch": 87.30517711171662,
+ "grad_norm": 3.5399813652038574,
+ "learning_rate": 8.333988314161879e-07,
+ "loss": 0.0613,
+ "step": 32041
+ },
+ {
+ "epoch": 87.30790190735695,
+ "grad_norm": 3.7903201580047607,
+ "learning_rate": 8.33046162554385e-07,
+ "loss": 0.0641,
+ "step": 32042
+ },
+ {
+ "epoch": 87.31062670299727,
+ "grad_norm": 5.673577308654785,
+ "learning_rate": 8.326935650845247e-07,
+ "loss": 0.0978,
+ "step": 32043
+ },
+ {
+ "epoch": 87.3133514986376,
+ "grad_norm": 2.934593915939331,
+ "learning_rate": 8.323410390093523e-07,
+ "loss": 0.0689,
+ "step": 32044
+ },
+ {
+ "epoch": 87.31607629427793,
+ "grad_norm": 3.9851810932159424,
+ "learning_rate": 8.319885843316123e-07,
+ "loss": 0.0618,
+ "step": 32045
+ },
+ {
+ "epoch": 87.31880108991825,
+ "grad_norm": 3.383972644805908,
+ "learning_rate": 8.316362010540479e-07,
+ "loss": 0.1647,
+ "step": 32046
+ },
+ {
+ "epoch": 87.32152588555859,
+ "grad_norm": 2.7322640419006348,
+ "learning_rate": 8.312838891794073e-07,
+ "loss": 0.0832,
+ "step": 32047
+ },
+ {
+ "epoch": 87.3242506811989,
+ "grad_norm": 3.392420768737793,
+ "learning_rate": 8.309316487104335e-07,
+ "loss": 0.0846,
+ "step": 32048
+ },
+ {
+ "epoch": 87.32697547683924,
+ "grad_norm": 3.0945212841033936,
+ "learning_rate": 8.305794796498689e-07,
+ "loss": 0.0451,
+ "step": 32049
+ },
+ {
+ "epoch": 87.32970027247957,
+ "grad_norm": 2.9162776470184326,
+ "learning_rate": 8.302273820004558e-07,
+ "loss": 0.1233,
+ "step": 32050
+ },
+ {
+ "epoch": 87.33242506811989,
+ "grad_norm": 3.2233474254608154,
+ "learning_rate": 8.298753557649353e-07,
+ "loss": 0.0765,
+ "step": 32051
+ },
+ {
+ "epoch": 87.33514986376022,
+ "grad_norm": 1.705782413482666,
+ "learning_rate": 8.295234009460529e-07,
+ "loss": 0.027,
+ "step": 32052
+ },
+ {
+ "epoch": 87.33787465940054,
+ "grad_norm": 2.5130674839019775,
+ "learning_rate": 8.291715175465453e-07,
+ "loss": 0.0302,
+ "step": 32053
+ },
+ {
+ "epoch": 87.34059945504087,
+ "grad_norm": 4.544942855834961,
+ "learning_rate": 8.288197055691561e-07,
+ "loss": 0.0852,
+ "step": 32054
+ },
+ {
+ "epoch": 87.34332425068119,
+ "grad_norm": 3.1552555561065674,
+ "learning_rate": 8.284679650166227e-07,
+ "loss": 0.1218,
+ "step": 32055
+ },
+ {
+ "epoch": 87.34604904632153,
+ "grad_norm": 2.733889579772949,
+ "learning_rate": 8.281162958916866e-07,
+ "loss": 0.116,
+ "step": 32056
+ },
+ {
+ "epoch": 87.34877384196186,
+ "grad_norm": 3.0717015266418457,
+ "learning_rate": 8.277646981970855e-07,
+ "loss": 0.1185,
+ "step": 32057
+ },
+ {
+ "epoch": 87.35149863760218,
+ "grad_norm": 2.7397303581237793,
+ "learning_rate": 8.274131719355571e-07,
+ "loss": 0.0383,
+ "step": 32058
+ },
+ {
+ "epoch": 87.35422343324251,
+ "grad_norm": 2.4850943088531494,
+ "learning_rate": 8.270617171098383e-07,
+ "loss": 0.0369,
+ "step": 32059
+ },
+ {
+ "epoch": 87.35694822888283,
+ "grad_norm": 5.439486503601074,
+ "learning_rate": 8.2671033372267e-07,
+ "loss": 0.0525,
+ "step": 32060
+ },
+ {
+ "epoch": 87.35967302452316,
+ "grad_norm": 2.633753538131714,
+ "learning_rate": 8.263590217767858e-07,
+ "loss": 0.1182,
+ "step": 32061
+ },
+ {
+ "epoch": 87.3623978201635,
+ "grad_norm": 3.2475616931915283,
+ "learning_rate": 8.260077812749212e-07,
+ "loss": 0.1208,
+ "step": 32062
+ },
+ {
+ "epoch": 87.36512261580381,
+ "grad_norm": 2.1586110591888428,
+ "learning_rate": 8.25656612219814e-07,
+ "loss": 0.1158,
+ "step": 32063
+ },
+ {
+ "epoch": 87.36784741144415,
+ "grad_norm": 2.7510464191436768,
+ "learning_rate": 8.253055146141964e-07,
+ "loss": 0.0754,
+ "step": 32064
+ },
+ {
+ "epoch": 87.37057220708446,
+ "grad_norm": 3.917447805404663,
+ "learning_rate": 8.249544884608052e-07,
+ "loss": 0.1799,
+ "step": 32065
+ },
+ {
+ "epoch": 87.3732970027248,
+ "grad_norm": 2.3031461238861084,
+ "learning_rate": 8.246035337623737e-07,
+ "loss": 0.0312,
+ "step": 32066
+ },
+ {
+ "epoch": 87.37602179836512,
+ "grad_norm": 10.528989791870117,
+ "learning_rate": 8.24252650521633e-07,
+ "loss": 0.031,
+ "step": 32067
+ },
+ {
+ "epoch": 87.37874659400545,
+ "grad_norm": 2.054379940032959,
+ "learning_rate": 8.23901838741319e-07,
+ "loss": 0.019,
+ "step": 32068
+ },
+ {
+ "epoch": 87.38147138964578,
+ "grad_norm": 1.4419647455215454,
+ "learning_rate": 8.235510984241623e-07,
+ "loss": 0.0164,
+ "step": 32069
+ },
+ {
+ "epoch": 87.3841961852861,
+ "grad_norm": 3.174726963043213,
+ "learning_rate": 8.232004295728935e-07,
+ "loss": 0.0544,
+ "step": 32070
+ },
+ {
+ "epoch": 87.38692098092643,
+ "grad_norm": 1.9841511249542236,
+ "learning_rate": 8.228498321902434e-07,
+ "loss": 0.1894,
+ "step": 32071
+ },
+ {
+ "epoch": 87.38964577656675,
+ "grad_norm": 3.0590014457702637,
+ "learning_rate": 8.224993062789443e-07,
+ "loss": 0.0258,
+ "step": 32072
+ },
+ {
+ "epoch": 87.39237057220708,
+ "grad_norm": 2.2886037826538086,
+ "learning_rate": 8.221488518417264e-07,
+ "loss": 0.0314,
+ "step": 32073
+ },
+ {
+ "epoch": 87.39509536784742,
+ "grad_norm": 2.3827927112579346,
+ "learning_rate": 8.217984688813174e-07,
+ "loss": 0.0601,
+ "step": 32074
+ },
+ {
+ "epoch": 87.39782016348774,
+ "grad_norm": 3.274296760559082,
+ "learning_rate": 8.21448157400444e-07,
+ "loss": 0.0284,
+ "step": 32075
+ },
+ {
+ "epoch": 87.40054495912807,
+ "grad_norm": 2.597504138946533,
+ "learning_rate": 8.210979174018397e-07,
+ "loss": 0.0489,
+ "step": 32076
+ },
+ {
+ "epoch": 87.40326975476839,
+ "grad_norm": 3.3759877681732178,
+ "learning_rate": 8.207477488882287e-07,
+ "loss": 0.0261,
+ "step": 32077
+ },
+ {
+ "epoch": 87.40599455040872,
+ "grad_norm": 2.5323102474212646,
+ "learning_rate": 8.203976518623402e-07,
+ "loss": 0.0358,
+ "step": 32078
+ },
+ {
+ "epoch": 87.40871934604904,
+ "grad_norm": 2.9436633586883545,
+ "learning_rate": 8.200476263268964e-07,
+ "loss": 0.1111,
+ "step": 32079
+ },
+ {
+ "epoch": 87.41144414168937,
+ "grad_norm": 2.8936707973480225,
+ "learning_rate": 8.196976722846273e-07,
+ "loss": 0.1125,
+ "step": 32080
+ },
+ {
+ "epoch": 87.4141689373297,
+ "grad_norm": 1.7252203226089478,
+ "learning_rate": 8.193477897382574e-07,
+ "loss": 0.0308,
+ "step": 32081
+ },
+ {
+ "epoch": 87.41689373297002,
+ "grad_norm": 2.6562628746032715,
+ "learning_rate": 8.189979786905111e-07,
+ "loss": 0.0883,
+ "step": 32082
+ },
+ {
+ "epoch": 87.41961852861036,
+ "grad_norm": 3.75610089302063,
+ "learning_rate": 8.186482391441131e-07,
+ "loss": 0.0711,
+ "step": 32083
+ },
+ {
+ "epoch": 87.42234332425068,
+ "grad_norm": 4.6357316970825195,
+ "learning_rate": 8.182985711017877e-07,
+ "loss": 0.0534,
+ "step": 32084
+ },
+ {
+ "epoch": 87.42506811989101,
+ "grad_norm": 2.3157403469085693,
+ "learning_rate": 8.179489745662583e-07,
+ "loss": 0.0459,
+ "step": 32085
+ },
+ {
+ "epoch": 87.42779291553134,
+ "grad_norm": 2.565436601638794,
+ "learning_rate": 8.175994495402462e-07,
+ "loss": 0.0541,
+ "step": 32086
+ },
+ {
+ "epoch": 87.43051771117166,
+ "grad_norm": 5.693440914154053,
+ "learning_rate": 8.172499960264724e-07,
+ "loss": 0.0571,
+ "step": 32087
+ },
+ {
+ "epoch": 87.433242506812,
+ "grad_norm": 2.6509525775909424,
+ "learning_rate": 8.169006140276614e-07,
+ "loss": 0.0276,
+ "step": 32088
+ },
+ {
+ "epoch": 87.43596730245231,
+ "grad_norm": 2.344193458557129,
+ "learning_rate": 8.165513035465345e-07,
+ "loss": 0.0299,
+ "step": 32089
+ },
+ {
+ "epoch": 87.43869209809264,
+ "grad_norm": 1.9711655378341675,
+ "learning_rate": 8.162020645858093e-07,
+ "loss": 0.0234,
+ "step": 32090
+ },
+ {
+ "epoch": 87.44141689373296,
+ "grad_norm": 2.739438056945801,
+ "learning_rate": 8.15852897148205e-07,
+ "loss": 0.0367,
+ "step": 32091
+ },
+ {
+ "epoch": 87.4441416893733,
+ "grad_norm": 3.3594422340393066,
+ "learning_rate": 8.155038012364447e-07,
+ "loss": 0.0476,
+ "step": 32092
+ },
+ {
+ "epoch": 87.44686648501363,
+ "grad_norm": 1.8658385276794434,
+ "learning_rate": 8.151547768532453e-07,
+ "loss": 0.0268,
+ "step": 32093
+ },
+ {
+ "epoch": 87.44959128065395,
+ "grad_norm": 4.355685234069824,
+ "learning_rate": 8.148058240013246e-07,
+ "loss": 0.0499,
+ "step": 32094
+ },
+ {
+ "epoch": 87.45231607629428,
+ "grad_norm": 3.1923887729644775,
+ "learning_rate": 8.144569426833981e-07,
+ "loss": 0.0757,
+ "step": 32095
+ },
+ {
+ "epoch": 87.4550408719346,
+ "grad_norm": 2.8732986450195312,
+ "learning_rate": 8.141081329021883e-07,
+ "loss": 0.0535,
+ "step": 32096
+ },
+ {
+ "epoch": 87.45776566757493,
+ "grad_norm": 2.132540702819824,
+ "learning_rate": 8.137593946604083e-07,
+ "loss": 0.0213,
+ "step": 32097
+ },
+ {
+ "epoch": 87.46049046321527,
+ "grad_norm": 1.7454577684402466,
+ "learning_rate": 8.134107279607728e-07,
+ "loss": 0.0297,
+ "step": 32098
+ },
+ {
+ "epoch": 87.46321525885558,
+ "grad_norm": 2.77207088470459,
+ "learning_rate": 8.130621328060006e-07,
+ "loss": 0.0528,
+ "step": 32099
+ },
+ {
+ "epoch": 87.46594005449592,
+ "grad_norm": 3.1678285598754883,
+ "learning_rate": 8.127136091988031e-07,
+ "loss": 0.0408,
+ "step": 32100
+ },
+ {
+ "epoch": 87.46866485013624,
+ "grad_norm": 2.4710707664489746,
+ "learning_rate": 8.123651571418978e-07,
+ "loss": 0.0288,
+ "step": 32101
+ },
+ {
+ "epoch": 87.47138964577657,
+ "grad_norm": 2.966733455657959,
+ "learning_rate": 8.120167766379972e-07,
+ "loss": 0.0286,
+ "step": 32102
+ },
+ {
+ "epoch": 87.47411444141689,
+ "grad_norm": 3.19575572013855,
+ "learning_rate": 8.116684676898134e-07,
+ "loss": 0.0757,
+ "step": 32103
+ },
+ {
+ "epoch": 87.47683923705722,
+ "grad_norm": 1.9228724241256714,
+ "learning_rate": 8.113202303000589e-07,
+ "loss": 0.0222,
+ "step": 32104
+ },
+ {
+ "epoch": 87.47956403269755,
+ "grad_norm": 1.4114537239074707,
+ "learning_rate": 8.109720644714492e-07,
+ "loss": 0.0157,
+ "step": 32105
+ },
+ {
+ "epoch": 87.48228882833787,
+ "grad_norm": 3.4534709453582764,
+ "learning_rate": 8.106239702066921e-07,
+ "loss": 0.0638,
+ "step": 32106
+ },
+ {
+ "epoch": 87.4850136239782,
+ "grad_norm": 2.5079915523529053,
+ "learning_rate": 8.102759475084986e-07,
+ "loss": 0.036,
+ "step": 32107
+ },
+ {
+ "epoch": 87.48773841961852,
+ "grad_norm": 2.964305877685547,
+ "learning_rate": 8.099279963795814e-07,
+ "loss": 0.0323,
+ "step": 32108
+ },
+ {
+ "epoch": 87.49046321525886,
+ "grad_norm": 2.582146406173706,
+ "learning_rate": 8.095801168226503e-07,
+ "loss": 0.0841,
+ "step": 32109
+ },
+ {
+ "epoch": 87.49318801089919,
+ "grad_norm": 2.275869369506836,
+ "learning_rate": 8.092323088404119e-07,
+ "loss": 0.0303,
+ "step": 32110
+ },
+ {
+ "epoch": 87.49591280653951,
+ "grad_norm": 2.0972752571105957,
+ "learning_rate": 8.088845724355765e-07,
+ "loss": 0.0321,
+ "step": 32111
+ },
+ {
+ "epoch": 87.49863760217984,
+ "grad_norm": 2.659170150756836,
+ "learning_rate": 8.085369076108529e-07,
+ "loss": 0.0449,
+ "step": 32112
+ },
+ {
+ "epoch": 87.50136239782016,
+ "grad_norm": 1.7420847415924072,
+ "learning_rate": 8.081893143689479e-07,
+ "loss": 0.0208,
+ "step": 32113
+ },
+ {
+ "epoch": 87.50408719346049,
+ "grad_norm": 3.0050289630889893,
+ "learning_rate": 8.078417927125692e-07,
+ "loss": 0.0508,
+ "step": 32114
+ },
+ {
+ "epoch": 87.50681198910081,
+ "grad_norm": 2.8802103996276855,
+ "learning_rate": 8.074943426444204e-07,
+ "loss": 0.0572,
+ "step": 32115
+ },
+ {
+ "epoch": 87.50953678474114,
+ "grad_norm": 2.531992197036743,
+ "learning_rate": 8.071469641672103e-07,
+ "loss": 0.0895,
+ "step": 32116
+ },
+ {
+ "epoch": 87.51226158038148,
+ "grad_norm": 2.5337300300598145,
+ "learning_rate": 8.067996572836456e-07,
+ "loss": 0.0654,
+ "step": 32117
+ },
+ {
+ "epoch": 87.5149863760218,
+ "grad_norm": 2.8185200691223145,
+ "learning_rate": 8.064524219964298e-07,
+ "loss": 0.0458,
+ "step": 32118
+ },
+ {
+ "epoch": 87.51771117166213,
+ "grad_norm": 1.8498786687850952,
+ "learning_rate": 8.061052583082652e-07,
+ "loss": 0.0232,
+ "step": 32119
+ },
+ {
+ "epoch": 87.52043596730245,
+ "grad_norm": 3.859872579574585,
+ "learning_rate": 8.057581662218561e-07,
+ "loss": 0.0749,
+ "step": 32120
+ },
+ {
+ "epoch": 87.52316076294278,
+ "grad_norm": 3.3445465564727783,
+ "learning_rate": 8.054111457399083e-07,
+ "loss": 0.0546,
+ "step": 32121
+ },
+ {
+ "epoch": 87.52588555858311,
+ "grad_norm": 2.920300006866455,
+ "learning_rate": 8.050641968651218e-07,
+ "loss": 0.0415,
+ "step": 32122
+ },
+ {
+ "epoch": 87.52861035422343,
+ "grad_norm": 2.1514246463775635,
+ "learning_rate": 8.047173196002001e-07,
+ "loss": 0.0347,
+ "step": 32123
+ },
+ {
+ "epoch": 87.53133514986376,
+ "grad_norm": 2.5154616832733154,
+ "learning_rate": 8.043705139478431e-07,
+ "loss": 0.0405,
+ "step": 32124
+ },
+ {
+ "epoch": 87.53405994550408,
+ "grad_norm": 2.2705025672912598,
+ "learning_rate": 8.040237799107531e-07,
+ "loss": 0.0333,
+ "step": 32125
+ },
+ {
+ "epoch": 87.53678474114442,
+ "grad_norm": 2.769376277923584,
+ "learning_rate": 8.036771174916302e-07,
+ "loss": 0.1692,
+ "step": 32126
+ },
+ {
+ "epoch": 87.53950953678473,
+ "grad_norm": 2.183717727661133,
+ "learning_rate": 8.033305266931712e-07,
+ "loss": 0.0616,
+ "step": 32127
+ },
+ {
+ "epoch": 87.54223433242507,
+ "grad_norm": 2.682685375213623,
+ "learning_rate": 8.029840075180817e-07,
+ "loss": 0.0854,
+ "step": 32128
+ },
+ {
+ "epoch": 87.5449591280654,
+ "grad_norm": 4.025137424468994,
+ "learning_rate": 8.026375599690551e-07,
+ "loss": 0.0759,
+ "step": 32129
+ },
+ {
+ "epoch": 87.54768392370572,
+ "grad_norm": 2.4038383960723877,
+ "learning_rate": 8.022911840487924e-07,
+ "loss": 0.0318,
+ "step": 32130
+ },
+ {
+ "epoch": 87.55040871934605,
+ "grad_norm": 2.478999614715576,
+ "learning_rate": 8.019448797599871e-07,
+ "loss": 0.047,
+ "step": 32131
+ },
+ {
+ "epoch": 87.55313351498637,
+ "grad_norm": 6.368683815002441,
+ "learning_rate": 8.015986471053394e-07,
+ "loss": 0.0592,
+ "step": 32132
+ },
+ {
+ "epoch": 87.5558583106267,
+ "grad_norm": 2.918562650680542,
+ "learning_rate": 8.012524860875481e-07,
+ "loss": 0.0561,
+ "step": 32133
+ },
+ {
+ "epoch": 87.55858310626704,
+ "grad_norm": 2.6399192810058594,
+ "learning_rate": 8.009063967093055e-07,
+ "loss": 0.0298,
+ "step": 32134
+ },
+ {
+ "epoch": 87.56130790190736,
+ "grad_norm": 2.8267951011657715,
+ "learning_rate": 8.005603789733074e-07,
+ "loss": 0.0333,
+ "step": 32135
+ },
+ {
+ "epoch": 87.56403269754769,
+ "grad_norm": 4.2104363441467285,
+ "learning_rate": 8.00214432882248e-07,
+ "loss": 0.1008,
+ "step": 32136
+ },
+ {
+ "epoch": 87.566757493188,
+ "grad_norm": 2.6444315910339355,
+ "learning_rate": 7.998685584388244e-07,
+ "loss": 0.0539,
+ "step": 32137
+ },
+ {
+ "epoch": 87.56948228882834,
+ "grad_norm": 3.156651020050049,
+ "learning_rate": 7.995227556457274e-07,
+ "loss": 0.1323,
+ "step": 32138
+ },
+ {
+ "epoch": 87.57220708446866,
+ "grad_norm": 2.1488776206970215,
+ "learning_rate": 7.991770245056519e-07,
+ "loss": 0.0454,
+ "step": 32139
+ },
+ {
+ "epoch": 87.57493188010899,
+ "grad_norm": 2.564025402069092,
+ "learning_rate": 7.988313650212876e-07,
+ "loss": 0.0574,
+ "step": 32140
+ },
+ {
+ "epoch": 87.57765667574932,
+ "grad_norm": 2.330198287963867,
+ "learning_rate": 7.984857771953303e-07,
+ "loss": 0.0727,
+ "step": 32141
+ },
+ {
+ "epoch": 87.58038147138964,
+ "grad_norm": 2.864098310470581,
+ "learning_rate": 7.981402610304689e-07,
+ "loss": 0.0481,
+ "step": 32142
+ },
+ {
+ "epoch": 87.58310626702998,
+ "grad_norm": 1.646061897277832,
+ "learning_rate": 7.977948165293959e-07,
+ "loss": 0.018,
+ "step": 32143
+ },
+ {
+ "epoch": 87.5858310626703,
+ "grad_norm": 5.705280780792236,
+ "learning_rate": 7.974494436947989e-07,
+ "loss": 0.1504,
+ "step": 32144
+ },
+ {
+ "epoch": 87.58855585831063,
+ "grad_norm": 2.3666508197784424,
+ "learning_rate": 7.971041425293713e-07,
+ "loss": 0.1041,
+ "step": 32145
+ },
+ {
+ "epoch": 87.59128065395096,
+ "grad_norm": 2.5445120334625244,
+ "learning_rate": 7.967589130358e-07,
+ "loss": 0.0336,
+ "step": 32146
+ },
+ {
+ "epoch": 87.59400544959128,
+ "grad_norm": 3.171571969985962,
+ "learning_rate": 7.964137552167739e-07,
+ "loss": 0.0631,
+ "step": 32147
+ },
+ {
+ "epoch": 87.59673024523161,
+ "grad_norm": 2.541062831878662,
+ "learning_rate": 7.960686690749797e-07,
+ "loss": 0.0292,
+ "step": 32148
+ },
+ {
+ "epoch": 87.59945504087193,
+ "grad_norm": 1.9698750972747803,
+ "learning_rate": 7.957236546131086e-07,
+ "loss": 0.0192,
+ "step": 32149
+ },
+ {
+ "epoch": 87.60217983651226,
+ "grad_norm": 3.2101454734802246,
+ "learning_rate": 7.95378711833843e-07,
+ "loss": 0.0677,
+ "step": 32150
+ },
+ {
+ "epoch": 87.60490463215258,
+ "grad_norm": 2.757845878601074,
+ "learning_rate": 7.950338407398739e-07,
+ "loss": 0.1025,
+ "step": 32151
+ },
+ {
+ "epoch": 87.60762942779292,
+ "grad_norm": 14.851627349853516,
+ "learning_rate": 7.946890413338837e-07,
+ "loss": 0.1651,
+ "step": 32152
+ },
+ {
+ "epoch": 87.61035422343325,
+ "grad_norm": 2.203108310699463,
+ "learning_rate": 7.943443136185602e-07,
+ "loss": 0.0231,
+ "step": 32153
+ },
+ {
+ "epoch": 87.61307901907357,
+ "grad_norm": 1.8596984148025513,
+ "learning_rate": 7.93999657596587e-07,
+ "loss": 0.0218,
+ "step": 32154
+ },
+ {
+ "epoch": 87.6158038147139,
+ "grad_norm": 2.512727975845337,
+ "learning_rate": 7.936550732706483e-07,
+ "loss": 0.1162,
+ "step": 32155
+ },
+ {
+ "epoch": 87.61852861035422,
+ "grad_norm": 2.3046913146972656,
+ "learning_rate": 7.933105606434255e-07,
+ "loss": 0.1044,
+ "step": 32156
+ },
+ {
+ "epoch": 87.62125340599455,
+ "grad_norm": 2.938237190246582,
+ "learning_rate": 7.929661197176052e-07,
+ "loss": 0.0777,
+ "step": 32157
+ },
+ {
+ "epoch": 87.62397820163488,
+ "grad_norm": 2.446826457977295,
+ "learning_rate": 7.926217504958688e-07,
+ "loss": 0.1203,
+ "step": 32158
+ },
+ {
+ "epoch": 87.6267029972752,
+ "grad_norm": 3.3570597171783447,
+ "learning_rate": 7.922774529808985e-07,
+ "loss": 0.1578,
+ "step": 32159
+ },
+ {
+ "epoch": 87.62942779291554,
+ "grad_norm": 2.6146492958068848,
+ "learning_rate": 7.919332271753722e-07,
+ "loss": 0.1479,
+ "step": 32160
+ },
+ {
+ "epoch": 87.63215258855585,
+ "grad_norm": 3.064115047454834,
+ "learning_rate": 7.915890730819764e-07,
+ "loss": 0.0384,
+ "step": 32161
+ },
+ {
+ "epoch": 87.63487738419619,
+ "grad_norm": 1.6859407424926758,
+ "learning_rate": 7.912449907033881e-07,
+ "loss": 0.031,
+ "step": 32162
+ },
+ {
+ "epoch": 87.6376021798365,
+ "grad_norm": 2.9649910926818848,
+ "learning_rate": 7.909009800422874e-07,
+ "loss": 0.0326,
+ "step": 32163
+ },
+ {
+ "epoch": 87.64032697547684,
+ "grad_norm": 2.7740511894226074,
+ "learning_rate": 7.905570411013519e-07,
+ "loss": 0.0332,
+ "step": 32164
+ },
+ {
+ "epoch": 87.64305177111717,
+ "grad_norm": 2.3737103939056396,
+ "learning_rate": 7.90213173883263e-07,
+ "loss": 0.0304,
+ "step": 32165
+ },
+ {
+ "epoch": 87.64577656675749,
+ "grad_norm": 5.280933856964111,
+ "learning_rate": 7.898693783906975e-07,
+ "loss": 0.0484,
+ "step": 32166
+ },
+ {
+ "epoch": 87.64850136239782,
+ "grad_norm": 1.931410551071167,
+ "learning_rate": 7.895256546263319e-07,
+ "loss": 0.055,
+ "step": 32167
+ },
+ {
+ "epoch": 87.65122615803814,
+ "grad_norm": 4.705388069152832,
+ "learning_rate": 7.891820025928432e-07,
+ "loss": 0.0601,
+ "step": 32168
+ },
+ {
+ "epoch": 87.65395095367847,
+ "grad_norm": 2.216409206390381,
+ "learning_rate": 7.888384222929101e-07,
+ "loss": 0.1683,
+ "step": 32169
+ },
+ {
+ "epoch": 87.65667574931881,
+ "grad_norm": 3.612227201461792,
+ "learning_rate": 7.884949137292075e-07,
+ "loss": 0.0587,
+ "step": 32170
+ },
+ {
+ "epoch": 87.65940054495913,
+ "grad_norm": 2.983952522277832,
+ "learning_rate": 7.881514769044107e-07,
+ "loss": 0.1444,
+ "step": 32171
+ },
+ {
+ "epoch": 87.66212534059946,
+ "grad_norm": 2.391012668609619,
+ "learning_rate": 7.878081118211911e-07,
+ "loss": 0.038,
+ "step": 32172
+ },
+ {
+ "epoch": 87.66485013623978,
+ "grad_norm": 3.45635724067688,
+ "learning_rate": 7.874648184822275e-07,
+ "loss": 0.0657,
+ "step": 32173
+ },
+ {
+ "epoch": 87.66757493188011,
+ "grad_norm": 1.6082489490509033,
+ "learning_rate": 7.871215968901913e-07,
+ "loss": 0.0208,
+ "step": 32174
+ },
+ {
+ "epoch": 87.67029972752043,
+ "grad_norm": 2.6080129146575928,
+ "learning_rate": 7.867784470477557e-07,
+ "loss": 0.1196,
+ "step": 32175
+ },
+ {
+ "epoch": 87.67302452316076,
+ "grad_norm": 2.555482864379883,
+ "learning_rate": 7.864353689575909e-07,
+ "loss": 0.0296,
+ "step": 32176
+ },
+ {
+ "epoch": 87.6757493188011,
+ "grad_norm": 2.4604551792144775,
+ "learning_rate": 7.860923626223726e-07,
+ "loss": 0.0606,
+ "step": 32177
+ },
+ {
+ "epoch": 87.67847411444141,
+ "grad_norm": 3.1521799564361572,
+ "learning_rate": 7.857494280447709e-07,
+ "loss": 0.1531,
+ "step": 32178
+ },
+ {
+ "epoch": 87.68119891008175,
+ "grad_norm": 4.707701683044434,
+ "learning_rate": 7.854065652274556e-07,
+ "loss": 0.0546,
+ "step": 32179
+ },
+ {
+ "epoch": 87.68392370572207,
+ "grad_norm": 1.743828535079956,
+ "learning_rate": 7.850637741730959e-07,
+ "loss": 0.087,
+ "step": 32180
+ },
+ {
+ "epoch": 87.6866485013624,
+ "grad_norm": 2.3071610927581787,
+ "learning_rate": 7.847210548843653e-07,
+ "loss": 0.05,
+ "step": 32181
+ },
+ {
+ "epoch": 87.68937329700273,
+ "grad_norm": 2.3715646266937256,
+ "learning_rate": 7.843784073639304e-07,
+ "loss": 0.0733,
+ "step": 32182
+ },
+ {
+ "epoch": 87.69209809264305,
+ "grad_norm": 7.41796875,
+ "learning_rate": 7.840358316144592e-07,
+ "loss": 0.023,
+ "step": 32183
+ },
+ {
+ "epoch": 87.69482288828338,
+ "grad_norm": 2.684610605239868,
+ "learning_rate": 7.836933276386183e-07,
+ "loss": 0.119,
+ "step": 32184
+ },
+ {
+ "epoch": 87.6975476839237,
+ "grad_norm": 2.3460471630096436,
+ "learning_rate": 7.833508954390778e-07,
+ "loss": 0.0304,
+ "step": 32185
+ },
+ {
+ "epoch": 87.70027247956403,
+ "grad_norm": 2.5405545234680176,
+ "learning_rate": 7.830085350185057e-07,
+ "loss": 0.0744,
+ "step": 32186
+ },
+ {
+ "epoch": 87.70299727520435,
+ "grad_norm": 3.223616123199463,
+ "learning_rate": 7.826662463795665e-07,
+ "loss": 0.1763,
+ "step": 32187
+ },
+ {
+ "epoch": 87.70572207084469,
+ "grad_norm": 3.933316707611084,
+ "learning_rate": 7.823240295249257e-07,
+ "loss": 0.0526,
+ "step": 32188
+ },
+ {
+ "epoch": 87.70844686648502,
+ "grad_norm": 2.4163014888763428,
+ "learning_rate": 7.819818844572468e-07,
+ "loss": 0.0845,
+ "step": 32189
+ },
+ {
+ "epoch": 87.71117166212534,
+ "grad_norm": 2.0288498401641846,
+ "learning_rate": 7.81639811179199e-07,
+ "loss": 0.0315,
+ "step": 32190
+ },
+ {
+ "epoch": 87.71389645776567,
+ "grad_norm": 2.184022903442383,
+ "learning_rate": 7.812978096934421e-07,
+ "loss": 0.109,
+ "step": 32191
+ },
+ {
+ "epoch": 87.71662125340599,
+ "grad_norm": 4.986965656280518,
+ "learning_rate": 7.809558800026407e-07,
+ "loss": 0.1037,
+ "step": 32192
+ },
+ {
+ "epoch": 87.71934604904632,
+ "grad_norm": 1.883907437324524,
+ "learning_rate": 7.806140221094593e-07,
+ "loss": 0.0278,
+ "step": 32193
+ },
+ {
+ "epoch": 87.72207084468666,
+ "grad_norm": 3.1499037742614746,
+ "learning_rate": 7.802722360165593e-07,
+ "loss": 0.0463,
+ "step": 32194
+ },
+ {
+ "epoch": 87.72479564032697,
+ "grad_norm": 1.8229411840438843,
+ "learning_rate": 7.799305217266018e-07,
+ "loss": 0.0257,
+ "step": 32195
+ },
+ {
+ "epoch": 87.7275204359673,
+ "grad_norm": 2.774632215499878,
+ "learning_rate": 7.795888792422479e-07,
+ "loss": 0.0601,
+ "step": 32196
+ },
+ {
+ "epoch": 87.73024523160763,
+ "grad_norm": 2.2164721488952637,
+ "learning_rate": 7.792473085661601e-07,
+ "loss": 0.0566,
+ "step": 32197
+ },
+ {
+ "epoch": 87.73297002724796,
+ "grad_norm": 2.9088759422302246,
+ "learning_rate": 7.789058097009983e-07,
+ "loss": 0.0343,
+ "step": 32198
+ },
+ {
+ "epoch": 87.73569482288828,
+ "grad_norm": 3.0221238136291504,
+ "learning_rate": 7.785643826494205e-07,
+ "loss": 0.0394,
+ "step": 32199
+ },
+ {
+ "epoch": 87.73841961852861,
+ "grad_norm": 3.420117139816284,
+ "learning_rate": 7.782230274140845e-07,
+ "loss": 0.0813,
+ "step": 32200
+ },
+ {
+ "epoch": 87.74114441416894,
+ "grad_norm": 2.453206777572632,
+ "learning_rate": 7.778817439976515e-07,
+ "loss": 0.0588,
+ "step": 32201
+ },
+ {
+ "epoch": 87.74386920980926,
+ "grad_norm": 2.2068138122558594,
+ "learning_rate": 7.775405324027807e-07,
+ "loss": 0.0209,
+ "step": 32202
+ },
+ {
+ "epoch": 87.7465940054496,
+ "grad_norm": 1.9418346881866455,
+ "learning_rate": 7.771993926321264e-07,
+ "loss": 0.0213,
+ "step": 32203
+ },
+ {
+ "epoch": 87.74931880108991,
+ "grad_norm": 2.20292592048645,
+ "learning_rate": 7.768583246883476e-07,
+ "loss": 0.1205,
+ "step": 32204
+ },
+ {
+ "epoch": 87.75204359673025,
+ "grad_norm": 2.0393476486206055,
+ "learning_rate": 7.765173285740968e-07,
+ "loss": 0.0307,
+ "step": 32205
+ },
+ {
+ "epoch": 87.75476839237058,
+ "grad_norm": 2.3173751831054688,
+ "learning_rate": 7.761764042920339e-07,
+ "loss": 0.0358,
+ "step": 32206
+ },
+ {
+ "epoch": 87.7574931880109,
+ "grad_norm": 2.642428159713745,
+ "learning_rate": 7.758355518448124e-07,
+ "loss": 0.0936,
+ "step": 32207
+ },
+ {
+ "epoch": 87.76021798365123,
+ "grad_norm": 1.9830187559127808,
+ "learning_rate": 7.754947712350869e-07,
+ "loss": 0.1085,
+ "step": 32208
+ },
+ {
+ "epoch": 87.76294277929155,
+ "grad_norm": 2.271312952041626,
+ "learning_rate": 7.751540624655085e-07,
+ "loss": 0.0237,
+ "step": 32209
+ },
+ {
+ "epoch": 87.76566757493188,
+ "grad_norm": 2.239161491394043,
+ "learning_rate": 7.748134255387363e-07,
+ "loss": 0.0584,
+ "step": 32210
+ },
+ {
+ "epoch": 87.7683923705722,
+ "grad_norm": 3.01596999168396,
+ "learning_rate": 7.744728604574203e-07,
+ "loss": 0.0421,
+ "step": 32211
+ },
+ {
+ "epoch": 87.77111716621253,
+ "grad_norm": 3.220775604248047,
+ "learning_rate": 7.741323672242118e-07,
+ "loss": 0.1589,
+ "step": 32212
+ },
+ {
+ "epoch": 87.77384196185287,
+ "grad_norm": 3.0501341819763184,
+ "learning_rate": 7.73791945841762e-07,
+ "loss": 0.1608,
+ "step": 32213
+ },
+ {
+ "epoch": 87.77656675749319,
+ "grad_norm": 2.0995032787323,
+ "learning_rate": 7.734515963127254e-07,
+ "loss": 0.0573,
+ "step": 32214
+ },
+ {
+ "epoch": 87.77929155313352,
+ "grad_norm": 3.8837478160858154,
+ "learning_rate": 7.73111318639751e-07,
+ "loss": 0.055,
+ "step": 32215
+ },
+ {
+ "epoch": 87.78201634877384,
+ "grad_norm": 3.704047203063965,
+ "learning_rate": 7.727711128254878e-07,
+ "loss": 0.0661,
+ "step": 32216
+ },
+ {
+ "epoch": 87.78474114441417,
+ "grad_norm": 2.4582417011260986,
+ "learning_rate": 7.72430978872587e-07,
+ "loss": 0.0637,
+ "step": 32217
+ },
+ {
+ "epoch": 87.7874659400545,
+ "grad_norm": 2.763697385787964,
+ "learning_rate": 7.720909167836943e-07,
+ "loss": 0.0205,
+ "step": 32218
+ },
+ {
+ "epoch": 87.79019073569482,
+ "grad_norm": 2.093129873275757,
+ "learning_rate": 7.717509265614631e-07,
+ "loss": 0.0347,
+ "step": 32219
+ },
+ {
+ "epoch": 87.79291553133515,
+ "grad_norm": 2.884716033935547,
+ "learning_rate": 7.714110082085391e-07,
+ "loss": 0.0815,
+ "step": 32220
+ },
+ {
+ "epoch": 87.79564032697547,
+ "grad_norm": 3.5441763401031494,
+ "learning_rate": 7.710711617275668e-07,
+ "loss": 0.0954,
+ "step": 32221
+ },
+ {
+ "epoch": 87.7983651226158,
+ "grad_norm": 2.7222464084625244,
+ "learning_rate": 7.707313871211974e-07,
+ "loss": 0.11,
+ "step": 32222
+ },
+ {
+ "epoch": 87.80108991825612,
+ "grad_norm": 1.983210563659668,
+ "learning_rate": 7.703916843920745e-07,
+ "loss": 0.0309,
+ "step": 32223
+ },
+ {
+ "epoch": 87.80381471389646,
+ "grad_norm": 1.9344252347946167,
+ "learning_rate": 7.700520535428435e-07,
+ "loss": 0.0193,
+ "step": 32224
+ },
+ {
+ "epoch": 87.80653950953679,
+ "grad_norm": 2.7835206985473633,
+ "learning_rate": 7.697124945761492e-07,
+ "loss": 0.147,
+ "step": 32225
+ },
+ {
+ "epoch": 87.80926430517711,
+ "grad_norm": 2.15885066986084,
+ "learning_rate": 7.693730074946393e-07,
+ "loss": 0.0991,
+ "step": 32226
+ },
+ {
+ "epoch": 87.81198910081744,
+ "grad_norm": 2.10834002494812,
+ "learning_rate": 7.690335923009539e-07,
+ "loss": 0.0279,
+ "step": 32227
+ },
+ {
+ "epoch": 87.81471389645776,
+ "grad_norm": 1.8662948608398438,
+ "learning_rate": 7.686942489977389e-07,
+ "loss": 0.063,
+ "step": 32228
+ },
+ {
+ "epoch": 87.8174386920981,
+ "grad_norm": 1.5790742635726929,
+ "learning_rate": 7.683549775876331e-07,
+ "loss": 0.0248,
+ "step": 32229
+ },
+ {
+ "epoch": 87.82016348773843,
+ "grad_norm": 3.244419813156128,
+ "learning_rate": 7.680157780732844e-07,
+ "loss": 0.0337,
+ "step": 32230
+ },
+ {
+ "epoch": 87.82288828337875,
+ "grad_norm": 1.9691389799118042,
+ "learning_rate": 7.676766504573319e-07,
+ "loss": 0.0315,
+ "step": 32231
+ },
+ {
+ "epoch": 87.82561307901908,
+ "grad_norm": 2.6122236251831055,
+ "learning_rate": 7.673375947424155e-07,
+ "loss": 0.0434,
+ "step": 32232
+ },
+ {
+ "epoch": 87.8283378746594,
+ "grad_norm": 2.582932710647583,
+ "learning_rate": 7.669986109311756e-07,
+ "loss": 0.1578,
+ "step": 32233
+ },
+ {
+ "epoch": 87.83106267029973,
+ "grad_norm": 1.9818381071090698,
+ "learning_rate": 7.666596990262542e-07,
+ "loss": 0.1266,
+ "step": 32234
+ },
+ {
+ "epoch": 87.83378746594005,
+ "grad_norm": 2.519568681716919,
+ "learning_rate": 7.663208590302907e-07,
+ "loss": 0.0409,
+ "step": 32235
+ },
+ {
+ "epoch": 87.83651226158038,
+ "grad_norm": 2.1832003593444824,
+ "learning_rate": 7.659820909459215e-07,
+ "loss": 0.0245,
+ "step": 32236
+ },
+ {
+ "epoch": 87.83923705722071,
+ "grad_norm": 3.458500385284424,
+ "learning_rate": 7.656433947757869e-07,
+ "loss": 0.1296,
+ "step": 32237
+ },
+ {
+ "epoch": 87.84196185286103,
+ "grad_norm": 2.5669286251068115,
+ "learning_rate": 7.653047705225258e-07,
+ "loss": 0.0553,
+ "step": 32238
+ },
+ {
+ "epoch": 87.84468664850137,
+ "grad_norm": 2.642077922821045,
+ "learning_rate": 7.649662181887729e-07,
+ "loss": 0.0323,
+ "step": 32239
+ },
+ {
+ "epoch": 87.84741144414168,
+ "grad_norm": 2.2836034297943115,
+ "learning_rate": 7.646277377771671e-07,
+ "loss": 0.0755,
+ "step": 32240
+ },
+ {
+ "epoch": 87.85013623978202,
+ "grad_norm": 1.9051963090896606,
+ "learning_rate": 7.642893292903408e-07,
+ "loss": 0.025,
+ "step": 32241
+ },
+ {
+ "epoch": 87.85286103542235,
+ "grad_norm": 3.2509732246398926,
+ "learning_rate": 7.639509927309341e-07,
+ "loss": 0.0227,
+ "step": 32242
+ },
+ {
+ "epoch": 87.85558583106267,
+ "grad_norm": 1.6330887079238892,
+ "learning_rate": 7.636127281015804e-07,
+ "loss": 0.0413,
+ "step": 32243
+ },
+ {
+ "epoch": 87.858310626703,
+ "grad_norm": 6.737751483917236,
+ "learning_rate": 7.63274535404912e-07,
+ "loss": 0.0305,
+ "step": 32244
+ },
+ {
+ "epoch": 87.86103542234332,
+ "grad_norm": 3.404038667678833,
+ "learning_rate": 7.629364146435636e-07,
+ "loss": 0.0403,
+ "step": 32245
+ },
+ {
+ "epoch": 87.86376021798365,
+ "grad_norm": 2.899501085281372,
+ "learning_rate": 7.625983658201708e-07,
+ "loss": 0.0215,
+ "step": 32246
+ },
+ {
+ "epoch": 87.86648501362397,
+ "grad_norm": 4.718465328216553,
+ "learning_rate": 7.622603889373648e-07,
+ "loss": 0.0831,
+ "step": 32247
+ },
+ {
+ "epoch": 87.8692098092643,
+ "grad_norm": 2.426079511642456,
+ "learning_rate": 7.619224839977767e-07,
+ "loss": 0.0834,
+ "step": 32248
+ },
+ {
+ "epoch": 87.87193460490464,
+ "grad_norm": 1.613516926765442,
+ "learning_rate": 7.615846510040381e-07,
+ "loss": 0.0174,
+ "step": 32249
+ },
+ {
+ "epoch": 87.87465940054496,
+ "grad_norm": 2.838158369064331,
+ "learning_rate": 7.612468899587822e-07,
+ "loss": 0.1398,
+ "step": 32250
+ },
+ {
+ "epoch": 87.87738419618529,
+ "grad_norm": 3.891223907470703,
+ "learning_rate": 7.609092008646379e-07,
+ "loss": 0.0727,
+ "step": 32251
+ },
+ {
+ "epoch": 87.88010899182561,
+ "grad_norm": 2.4520819187164307,
+ "learning_rate": 7.605715837242355e-07,
+ "loss": 0.0407,
+ "step": 32252
+ },
+ {
+ "epoch": 87.88283378746594,
+ "grad_norm": 3.366380453109741,
+ "learning_rate": 7.60234038540203e-07,
+ "loss": 0.0707,
+ "step": 32253
+ },
+ {
+ "epoch": 87.88555858310627,
+ "grad_norm": 4.714087009429932,
+ "learning_rate": 7.598965653151702e-07,
+ "loss": 0.0802,
+ "step": 32254
+ },
+ {
+ "epoch": 87.88828337874659,
+ "grad_norm": 2.2426202297210693,
+ "learning_rate": 7.595591640517663e-07,
+ "loss": 0.0403,
+ "step": 32255
+ },
+ {
+ "epoch": 87.89100817438693,
+ "grad_norm": 3.1924262046813965,
+ "learning_rate": 7.592218347526192e-07,
+ "loss": 0.0907,
+ "step": 32256
+ },
+ {
+ "epoch": 87.89373297002724,
+ "grad_norm": 2.122835636138916,
+ "learning_rate": 7.588845774203535e-07,
+ "loss": 0.0807,
+ "step": 32257
+ },
+ {
+ "epoch": 87.89645776566758,
+ "grad_norm": 2.4528744220733643,
+ "learning_rate": 7.585473920575992e-07,
+ "loss": 0.2641,
+ "step": 32258
+ },
+ {
+ "epoch": 87.8991825613079,
+ "grad_norm": 2.00410532951355,
+ "learning_rate": 7.582102786669798e-07,
+ "loss": 0.0358,
+ "step": 32259
+ },
+ {
+ "epoch": 87.90190735694823,
+ "grad_norm": 2.9289979934692383,
+ "learning_rate": 7.57873237251121e-07,
+ "loss": 0.0928,
+ "step": 32260
+ },
+ {
+ "epoch": 87.90463215258856,
+ "grad_norm": 3.34232759475708,
+ "learning_rate": 7.575362678126474e-07,
+ "loss": 0.096,
+ "step": 32261
+ },
+ {
+ "epoch": 87.90735694822888,
+ "grad_norm": 1.7234410047531128,
+ "learning_rate": 7.571993703541847e-07,
+ "loss": 0.0208,
+ "step": 32262
+ },
+ {
+ "epoch": 87.91008174386921,
+ "grad_norm": 2.5581438541412354,
+ "learning_rate": 7.568625448783562e-07,
+ "loss": 0.0578,
+ "step": 32263
+ },
+ {
+ "epoch": 87.91280653950953,
+ "grad_norm": 2.0092294216156006,
+ "learning_rate": 7.565257913877843e-07,
+ "loss": 0.0506,
+ "step": 32264
+ },
+ {
+ "epoch": 87.91553133514986,
+ "grad_norm": 1.4506932497024536,
+ "learning_rate": 7.561891098850904e-07,
+ "loss": 0.0207,
+ "step": 32265
+ },
+ {
+ "epoch": 87.9182561307902,
+ "grad_norm": 3.2845566272735596,
+ "learning_rate": 7.558525003729e-07,
+ "loss": 0.0319,
+ "step": 32266
+ },
+ {
+ "epoch": 87.92098092643052,
+ "grad_norm": 2.6187777519226074,
+ "learning_rate": 7.555159628538322e-07,
+ "loss": 0.1014,
+ "step": 32267
+ },
+ {
+ "epoch": 87.92370572207085,
+ "grad_norm": 4.789071083068848,
+ "learning_rate": 7.551794973305093e-07,
+ "loss": 0.1189,
+ "step": 32268
+ },
+ {
+ "epoch": 87.92643051771117,
+ "grad_norm": 3.519306182861328,
+ "learning_rate": 7.548431038055492e-07,
+ "loss": 0.04,
+ "step": 32269
+ },
+ {
+ "epoch": 87.9291553133515,
+ "grad_norm": 3.2069647312164307,
+ "learning_rate": 7.545067822815733e-07,
+ "loss": 0.0404,
+ "step": 32270
+ },
+ {
+ "epoch": 87.93188010899182,
+ "grad_norm": 3.5142273902893066,
+ "learning_rate": 7.541705327612037e-07,
+ "loss": 0.0307,
+ "step": 32271
+ },
+ {
+ "epoch": 87.93460490463215,
+ "grad_norm": 1.9941633939743042,
+ "learning_rate": 7.53834355247055e-07,
+ "loss": 0.0918,
+ "step": 32272
+ },
+ {
+ "epoch": 87.93732970027249,
+ "grad_norm": 2.765315055847168,
+ "learning_rate": 7.534982497417476e-07,
+ "loss": 0.0282,
+ "step": 32273
+ },
+ {
+ "epoch": 87.9400544959128,
+ "grad_norm": 2.1391522884368896,
+ "learning_rate": 7.531622162478957e-07,
+ "loss": 0.0342,
+ "step": 32274
+ },
+ {
+ "epoch": 87.94277929155314,
+ "grad_norm": 2.1447854042053223,
+ "learning_rate": 7.528262547681209e-07,
+ "loss": 0.0224,
+ "step": 32275
+ },
+ {
+ "epoch": 87.94550408719346,
+ "grad_norm": 1.431930661201477,
+ "learning_rate": 7.524903653050386e-07,
+ "loss": 0.0176,
+ "step": 32276
+ },
+ {
+ "epoch": 87.94822888283379,
+ "grad_norm": 3.4243528842926025,
+ "learning_rate": 7.521545478612624e-07,
+ "loss": 0.0597,
+ "step": 32277
+ },
+ {
+ "epoch": 87.95095367847412,
+ "grad_norm": 2.164825439453125,
+ "learning_rate": 7.518188024394079e-07,
+ "loss": 0.1031,
+ "step": 32278
+ },
+ {
+ "epoch": 87.95367847411444,
+ "grad_norm": 2.4001989364624023,
+ "learning_rate": 7.514831290420921e-07,
+ "loss": 0.0545,
+ "step": 32279
+ },
+ {
+ "epoch": 87.95640326975477,
+ "grad_norm": 2.551877975463867,
+ "learning_rate": 7.511475276719282e-07,
+ "loss": 0.0361,
+ "step": 32280
+ },
+ {
+ "epoch": 87.95912806539509,
+ "grad_norm": 3.5497496128082275,
+ "learning_rate": 7.508119983315288e-07,
+ "loss": 0.1386,
+ "step": 32281
+ },
+ {
+ "epoch": 87.96185286103542,
+ "grad_norm": 2.0387940406799316,
+ "learning_rate": 7.504765410235082e-07,
+ "loss": 0.0973,
+ "step": 32282
+ },
+ {
+ "epoch": 87.96457765667574,
+ "grad_norm": 1.8813186883926392,
+ "learning_rate": 7.501411557504801e-07,
+ "loss": 0.0243,
+ "step": 32283
+ },
+ {
+ "epoch": 87.96730245231608,
+ "grad_norm": 1.5467861890792847,
+ "learning_rate": 7.498058425150534e-07,
+ "loss": 0.015,
+ "step": 32284
+ },
+ {
+ "epoch": 87.97002724795641,
+ "grad_norm": 3.1045641899108887,
+ "learning_rate": 7.494706013198406e-07,
+ "loss": 0.0716,
+ "step": 32285
+ },
+ {
+ "epoch": 87.97275204359673,
+ "grad_norm": 2.660520553588867,
+ "learning_rate": 7.491354321674538e-07,
+ "loss": 0.0736,
+ "step": 32286
+ },
+ {
+ "epoch": 87.97547683923706,
+ "grad_norm": 2.425281524658203,
+ "learning_rate": 7.488003350605022e-07,
+ "loss": 0.0285,
+ "step": 32287
+ },
+ {
+ "epoch": 87.97820163487738,
+ "grad_norm": 1.9388577938079834,
+ "learning_rate": 7.48465310001596e-07,
+ "loss": 0.0358,
+ "step": 32288
+ },
+ {
+ "epoch": 87.98092643051771,
+ "grad_norm": 2.165494441986084,
+ "learning_rate": 7.481303569933452e-07,
+ "loss": 0.0271,
+ "step": 32289
+ },
+ {
+ "epoch": 87.98365122615803,
+ "grad_norm": 1.887526512145996,
+ "learning_rate": 7.477954760383554e-07,
+ "loss": 0.0485,
+ "step": 32290
+ },
+ {
+ "epoch": 87.98637602179836,
+ "grad_norm": 3.798539400100708,
+ "learning_rate": 7.474606671392381e-07,
+ "loss": 0.1476,
+ "step": 32291
+ },
+ {
+ "epoch": 87.9891008174387,
+ "grad_norm": 2.9195845127105713,
+ "learning_rate": 7.471259302986e-07,
+ "loss": 0.2573,
+ "step": 32292
+ },
+ {
+ "epoch": 87.99182561307902,
+ "grad_norm": 5.432840347290039,
+ "learning_rate": 7.467912655190468e-07,
+ "loss": 0.0782,
+ "step": 32293
+ },
+ {
+ "epoch": 87.99455040871935,
+ "grad_norm": 1.555138111114502,
+ "learning_rate": 7.46456672803183e-07,
+ "loss": 0.0223,
+ "step": 32294
+ },
+ {
+ "epoch": 87.99727520435967,
+ "grad_norm": 2.1178574562072754,
+ "learning_rate": 7.461221521536199e-07,
+ "loss": 0.1377,
+ "step": 32295
+ },
+ {
+ "epoch": 88.0,
+ "grad_norm": 2.321068525314331,
+ "learning_rate": 7.457877035729588e-07,
+ "loss": 0.031,
+ "step": 32296
+ },
+ {
+ "epoch": 88.00272479564033,
+ "grad_norm": 2.299448251724243,
+ "learning_rate": 7.454533270638054e-07,
+ "loss": 0.0275,
+ "step": 32297
+ },
+ {
+ "epoch": 88.00544959128065,
+ "grad_norm": 2.3229076862335205,
+ "learning_rate": 7.451190226287619e-07,
+ "loss": 0.0418,
+ "step": 32298
+ },
+ {
+ "epoch": 88.00817438692098,
+ "grad_norm": 3.0564043521881104,
+ "learning_rate": 7.447847902704364e-07,
+ "loss": 0.0577,
+ "step": 32299
+ },
+ {
+ "epoch": 88.0108991825613,
+ "grad_norm": 2.5883285999298096,
+ "learning_rate": 7.444506299914278e-07,
+ "loss": 0.125,
+ "step": 32300
+ },
+ {
+ "epoch": 88.01362397820164,
+ "grad_norm": 3.360523223876953,
+ "learning_rate": 7.441165417943386e-07,
+ "loss": 0.1188,
+ "step": 32301
+ },
+ {
+ "epoch": 88.01634877384195,
+ "grad_norm": 2.566993236541748,
+ "learning_rate": 7.437825256817732e-07,
+ "loss": 0.0786,
+ "step": 32302
+ },
+ {
+ "epoch": 88.01907356948229,
+ "grad_norm": 2.3333346843719482,
+ "learning_rate": 7.434485816563319e-07,
+ "loss": 0.0771,
+ "step": 32303
+ },
+ {
+ "epoch": 88.02179836512262,
+ "grad_norm": 2.5192739963531494,
+ "learning_rate": 7.431147097206126e-07,
+ "loss": 0.0413,
+ "step": 32304
+ },
+ {
+ "epoch": 88.02452316076294,
+ "grad_norm": 1.8936649560928345,
+ "learning_rate": 7.42780909877221e-07,
+ "loss": 0.02,
+ "step": 32305
+ },
+ {
+ "epoch": 88.02724795640327,
+ "grad_norm": 2.71415638923645,
+ "learning_rate": 7.424471821287516e-07,
+ "loss": 0.025,
+ "step": 32306
+ },
+ {
+ "epoch": 88.02997275204359,
+ "grad_norm": 1.6457340717315674,
+ "learning_rate": 7.421135264778067e-07,
+ "loss": 0.02,
+ "step": 32307
+ },
+ {
+ "epoch": 88.03269754768392,
+ "grad_norm": 1.7237062454223633,
+ "learning_rate": 7.417799429269835e-07,
+ "loss": 0.0206,
+ "step": 32308
+ },
+ {
+ "epoch": 88.03542234332426,
+ "grad_norm": 2.5964341163635254,
+ "learning_rate": 7.414464314788816e-07,
+ "loss": 0.0346,
+ "step": 32309
+ },
+ {
+ "epoch": 88.03814713896458,
+ "grad_norm": 2.292182683944702,
+ "learning_rate": 7.411129921360937e-07,
+ "loss": 0.0524,
+ "step": 32310
+ },
+ {
+ "epoch": 88.04087193460491,
+ "grad_norm": 2.4391493797302246,
+ "learning_rate": 7.407796249012223e-07,
+ "loss": 0.1095,
+ "step": 32311
+ },
+ {
+ "epoch": 88.04359673024523,
+ "grad_norm": 2.506728172302246,
+ "learning_rate": 7.404463297768616e-07,
+ "loss": 0.1574,
+ "step": 32312
+ },
+ {
+ "epoch": 88.04632152588556,
+ "grad_norm": 2.8812003135681152,
+ "learning_rate": 7.401131067656054e-07,
+ "loss": 0.1881,
+ "step": 32313
+ },
+ {
+ "epoch": 88.04904632152588,
+ "grad_norm": 2.4724903106689453,
+ "learning_rate": 7.397799558700502e-07,
+ "loss": 0.1441,
+ "step": 32314
+ },
+ {
+ "epoch": 88.05177111716621,
+ "grad_norm": 2.306126594543457,
+ "learning_rate": 7.394468770927909e-07,
+ "loss": 0.1513,
+ "step": 32315
+ },
+ {
+ "epoch": 88.05449591280654,
+ "grad_norm": 4.2841105461120605,
+ "learning_rate": 7.39113870436422e-07,
+ "loss": 0.083,
+ "step": 32316
+ },
+ {
+ "epoch": 88.05722070844686,
+ "grad_norm": 2.380880832672119,
+ "learning_rate": 7.387809359035369e-07,
+ "loss": 0.0379,
+ "step": 32317
+ },
+ {
+ "epoch": 88.0599455040872,
+ "grad_norm": 3.122007369995117,
+ "learning_rate": 7.384480734967248e-07,
+ "loss": 0.0279,
+ "step": 32318
+ },
+ {
+ "epoch": 88.06267029972751,
+ "grad_norm": 1.5502064228057861,
+ "learning_rate": 7.381152832185833e-07,
+ "loss": 0.0201,
+ "step": 32319
+ },
+ {
+ "epoch": 88.06539509536785,
+ "grad_norm": 2.653925657272339,
+ "learning_rate": 7.377825650717029e-07,
+ "loss": 0.0635,
+ "step": 32320
+ },
+ {
+ "epoch": 88.06811989100818,
+ "grad_norm": 2.0360612869262695,
+ "learning_rate": 7.374499190586725e-07,
+ "loss": 0.0219,
+ "step": 32321
+ },
+ {
+ "epoch": 88.0708446866485,
+ "grad_norm": 2.081451416015625,
+ "learning_rate": 7.371173451820812e-07,
+ "loss": 0.022,
+ "step": 32322
+ },
+ {
+ "epoch": 88.07356948228883,
+ "grad_norm": 3.6597652435302734,
+ "learning_rate": 7.367848434445246e-07,
+ "loss": 0.0615,
+ "step": 32323
+ },
+ {
+ "epoch": 88.07629427792915,
+ "grad_norm": 1.9606828689575195,
+ "learning_rate": 7.364524138485896e-07,
+ "loss": 0.0705,
+ "step": 32324
+ },
+ {
+ "epoch": 88.07901907356948,
+ "grad_norm": 3.023667335510254,
+ "learning_rate": 7.361200563968662e-07,
+ "loss": 0.0405,
+ "step": 32325
+ },
+ {
+ "epoch": 88.0817438692098,
+ "grad_norm": 1.8557109832763672,
+ "learning_rate": 7.357877710919392e-07,
+ "loss": 0.0492,
+ "step": 32326
+ },
+ {
+ "epoch": 88.08446866485014,
+ "grad_norm": 1.7654945850372314,
+ "learning_rate": 7.354555579363998e-07,
+ "loss": 0.0295,
+ "step": 32327
+ },
+ {
+ "epoch": 88.08719346049047,
+ "grad_norm": 1.9492478370666504,
+ "learning_rate": 7.351234169328359e-07,
+ "loss": 0.0215,
+ "step": 32328
+ },
+ {
+ "epoch": 88.08991825613079,
+ "grad_norm": 3.418755292892456,
+ "learning_rate": 7.34791348083831e-07,
+ "loss": 0.0381,
+ "step": 32329
+ },
+ {
+ "epoch": 88.09264305177112,
+ "grad_norm": 3.9958670139312744,
+ "learning_rate": 7.344593513919718e-07,
+ "loss": 0.038,
+ "step": 32330
+ },
+ {
+ "epoch": 88.09536784741144,
+ "grad_norm": 3.9633195400238037,
+ "learning_rate": 7.341274268598476e-07,
+ "loss": 0.2505,
+ "step": 32331
+ },
+ {
+ "epoch": 88.09809264305177,
+ "grad_norm": 2.639070510864258,
+ "learning_rate": 7.337955744900394e-07,
+ "loss": 0.036,
+ "step": 32332
+ },
+ {
+ "epoch": 88.1008174386921,
+ "grad_norm": 2.3801422119140625,
+ "learning_rate": 7.334637942851342e-07,
+ "loss": 0.0592,
+ "step": 32333
+ },
+ {
+ "epoch": 88.10354223433242,
+ "grad_norm": 2.8734068870544434,
+ "learning_rate": 7.331320862477121e-07,
+ "loss": 0.0909,
+ "step": 32334
+ },
+ {
+ "epoch": 88.10626702997276,
+ "grad_norm": 2.515087127685547,
+ "learning_rate": 7.328004503803609e-07,
+ "loss": 0.0249,
+ "step": 32335
+ },
+ {
+ "epoch": 88.10899182561307,
+ "grad_norm": 1.818914532661438,
+ "learning_rate": 7.324688866856621e-07,
+ "loss": 0.0232,
+ "step": 32336
+ },
+ {
+ "epoch": 88.11171662125341,
+ "grad_norm": 2.735673189163208,
+ "learning_rate": 7.321373951661969e-07,
+ "loss": 0.0587,
+ "step": 32337
+ },
+ {
+ "epoch": 88.11444141689373,
+ "grad_norm": 3.4093174934387207,
+ "learning_rate": 7.318059758245455e-07,
+ "loss": 0.1008,
+ "step": 32338
+ },
+ {
+ "epoch": 88.11716621253406,
+ "grad_norm": 2.8783583641052246,
+ "learning_rate": 7.314746286632913e-07,
+ "loss": 0.0341,
+ "step": 32339
+ },
+ {
+ "epoch": 88.11989100817439,
+ "grad_norm": 2.247035026550293,
+ "learning_rate": 7.311433536850165e-07,
+ "loss": 0.0234,
+ "step": 32340
+ },
+ {
+ "epoch": 88.12261580381471,
+ "grad_norm": 1.9902700185775757,
+ "learning_rate": 7.308121508922983e-07,
+ "loss": 0.0204,
+ "step": 32341
+ },
+ {
+ "epoch": 88.12534059945504,
+ "grad_norm": 2.9673802852630615,
+ "learning_rate": 7.304810202877144e-07,
+ "loss": 0.0478,
+ "step": 32342
+ },
+ {
+ "epoch": 88.12806539509536,
+ "grad_norm": 2.6950340270996094,
+ "learning_rate": 7.301499618738484e-07,
+ "loss": 0.0414,
+ "step": 32343
+ },
+ {
+ "epoch": 88.1307901907357,
+ "grad_norm": 2.5807995796203613,
+ "learning_rate": 7.29818975653277e-07,
+ "loss": 0.0248,
+ "step": 32344
+ },
+ {
+ "epoch": 88.13351498637603,
+ "grad_norm": 2.492432117462158,
+ "learning_rate": 7.29488061628576e-07,
+ "loss": 0.0307,
+ "step": 32345
+ },
+ {
+ "epoch": 88.13623978201635,
+ "grad_norm": 2.092982530593872,
+ "learning_rate": 7.291572198023223e-07,
+ "loss": 0.037,
+ "step": 32346
+ },
+ {
+ "epoch": 88.13896457765668,
+ "grad_norm": 2.8097760677337646,
+ "learning_rate": 7.288264501770947e-07,
+ "loss": 0.0783,
+ "step": 32347
+ },
+ {
+ "epoch": 88.141689373297,
+ "grad_norm": 2.8103179931640625,
+ "learning_rate": 7.284957527554693e-07,
+ "loss": 0.0889,
+ "step": 32348
+ },
+ {
+ "epoch": 88.14441416893733,
+ "grad_norm": 2.2878992557525635,
+ "learning_rate": 7.281651275400203e-07,
+ "loss": 0.0328,
+ "step": 32349
+ },
+ {
+ "epoch": 88.14713896457765,
+ "grad_norm": 2.0587637424468994,
+ "learning_rate": 7.278345745333204e-07,
+ "loss": 0.0832,
+ "step": 32350
+ },
+ {
+ "epoch": 88.14986376021798,
+ "grad_norm": 1.798496127128601,
+ "learning_rate": 7.275040937379485e-07,
+ "loss": 0.0194,
+ "step": 32351
+ },
+ {
+ "epoch": 88.15258855585832,
+ "grad_norm": 2.808852195739746,
+ "learning_rate": 7.27173685156477e-07,
+ "loss": 0.0619,
+ "step": 32352
+ },
+ {
+ "epoch": 88.15531335149863,
+ "grad_norm": 2.5652859210968018,
+ "learning_rate": 7.268433487914784e-07,
+ "loss": 0.1185,
+ "step": 32353
+ },
+ {
+ "epoch": 88.15803814713897,
+ "grad_norm": 2.514193058013916,
+ "learning_rate": 7.265130846455226e-07,
+ "loss": 0.0447,
+ "step": 32354
+ },
+ {
+ "epoch": 88.16076294277929,
+ "grad_norm": 4.0318121910095215,
+ "learning_rate": 7.261828927211867e-07,
+ "loss": 0.1139,
+ "step": 32355
+ },
+ {
+ "epoch": 88.16348773841962,
+ "grad_norm": 2.110468626022339,
+ "learning_rate": 7.258527730210385e-07,
+ "loss": 0.0774,
+ "step": 32356
+ },
+ {
+ "epoch": 88.16621253405995,
+ "grad_norm": 4.696341514587402,
+ "learning_rate": 7.255227255476516e-07,
+ "loss": 0.1724,
+ "step": 32357
+ },
+ {
+ "epoch": 88.16893732970027,
+ "grad_norm": 2.1733508110046387,
+ "learning_rate": 7.25192750303596e-07,
+ "loss": 0.0339,
+ "step": 32358
+ },
+ {
+ "epoch": 88.1716621253406,
+ "grad_norm": 1.6791229248046875,
+ "learning_rate": 7.248628472914388e-07,
+ "loss": 0.1437,
+ "step": 32359
+ },
+ {
+ "epoch": 88.17438692098092,
+ "grad_norm": 2.093832015991211,
+ "learning_rate": 7.245330165137521e-07,
+ "loss": 0.0719,
+ "step": 32360
+ },
+ {
+ "epoch": 88.17711171662125,
+ "grad_norm": 2.7660741806030273,
+ "learning_rate": 7.24203257973104e-07,
+ "loss": 0.0756,
+ "step": 32361
+ },
+ {
+ "epoch": 88.17983651226157,
+ "grad_norm": 2.537230968475342,
+ "learning_rate": 7.238735716720635e-07,
+ "loss": 0.0526,
+ "step": 32362
+ },
+ {
+ "epoch": 88.1825613079019,
+ "grad_norm": 2.3053700923919678,
+ "learning_rate": 7.235439576131942e-07,
+ "loss": 0.0202,
+ "step": 32363
+ },
+ {
+ "epoch": 88.18528610354224,
+ "grad_norm": 1.8766133785247803,
+ "learning_rate": 7.232144157990683e-07,
+ "loss": 0.0264,
+ "step": 32364
+ },
+ {
+ "epoch": 88.18801089918256,
+ "grad_norm": 2.5794596672058105,
+ "learning_rate": 7.228849462322496e-07,
+ "loss": 0.049,
+ "step": 32365
+ },
+ {
+ "epoch": 88.19073569482289,
+ "grad_norm": 2.2495250701904297,
+ "learning_rate": 7.225555489153024e-07,
+ "loss": 0.0662,
+ "step": 32366
+ },
+ {
+ "epoch": 88.19346049046321,
+ "grad_norm": 2.3065366744995117,
+ "learning_rate": 7.22226223850796e-07,
+ "loss": 0.1619,
+ "step": 32367
+ },
+ {
+ "epoch": 88.19618528610354,
+ "grad_norm": 1.8450549840927124,
+ "learning_rate": 7.218969710412938e-07,
+ "loss": 0.0533,
+ "step": 32368
+ },
+ {
+ "epoch": 88.19891008174388,
+ "grad_norm": 2.7415997982025146,
+ "learning_rate": 7.215677904893593e-07,
+ "loss": 0.1223,
+ "step": 32369
+ },
+ {
+ "epoch": 88.2016348773842,
+ "grad_norm": 2.997288465499878,
+ "learning_rate": 7.212386821975537e-07,
+ "loss": 0.0674,
+ "step": 32370
+ },
+ {
+ "epoch": 88.20435967302453,
+ "grad_norm": 3.6610023975372314,
+ "learning_rate": 7.209096461684451e-07,
+ "loss": 0.0831,
+ "step": 32371
+ },
+ {
+ "epoch": 88.20708446866485,
+ "grad_norm": 2.011756420135498,
+ "learning_rate": 7.205806824045924e-07,
+ "loss": 0.0334,
+ "step": 32372
+ },
+ {
+ "epoch": 88.20980926430518,
+ "grad_norm": 3.1290664672851562,
+ "learning_rate": 7.202517909085583e-07,
+ "loss": 0.1391,
+ "step": 32373
+ },
+ {
+ "epoch": 88.2125340599455,
+ "grad_norm": 5.271706581115723,
+ "learning_rate": 7.199229716829048e-07,
+ "loss": 0.0294,
+ "step": 32374
+ },
+ {
+ "epoch": 88.21525885558583,
+ "grad_norm": 4.0691142082214355,
+ "learning_rate": 7.195942247301923e-07,
+ "loss": 0.0679,
+ "step": 32375
+ },
+ {
+ "epoch": 88.21798365122616,
+ "grad_norm": 5.225517749786377,
+ "learning_rate": 7.192655500529821e-07,
+ "loss": 0.0513,
+ "step": 32376
+ },
+ {
+ "epoch": 88.22070844686648,
+ "grad_norm": 2.8964128494262695,
+ "learning_rate": 7.189369476538333e-07,
+ "loss": 0.0522,
+ "step": 32377
+ },
+ {
+ "epoch": 88.22343324250681,
+ "grad_norm": 2.045886754989624,
+ "learning_rate": 7.186084175353047e-07,
+ "loss": 0.0229,
+ "step": 32378
+ },
+ {
+ "epoch": 88.22615803814713,
+ "grad_norm": 2.279428243637085,
+ "learning_rate": 7.182799596999534e-07,
+ "loss": 0.0516,
+ "step": 32379
+ },
+ {
+ "epoch": 88.22888283378747,
+ "grad_norm": 1.5180741548538208,
+ "learning_rate": 7.179515741503418e-07,
+ "loss": 0.0172,
+ "step": 32380
+ },
+ {
+ "epoch": 88.2316076294278,
+ "grad_norm": 2.6171324253082275,
+ "learning_rate": 7.176232608890232e-07,
+ "loss": 0.0245,
+ "step": 32381
+ },
+ {
+ "epoch": 88.23433242506812,
+ "grad_norm": 2.1556520462036133,
+ "learning_rate": 7.172950199185569e-07,
+ "loss": 0.0244,
+ "step": 32382
+ },
+ {
+ "epoch": 88.23705722070845,
+ "grad_norm": 2.845304489135742,
+ "learning_rate": 7.169668512414951e-07,
+ "loss": 0.0274,
+ "step": 32383
+ },
+ {
+ "epoch": 88.23978201634877,
+ "grad_norm": 2.633047103881836,
+ "learning_rate": 7.166387548603993e-07,
+ "loss": 0.0269,
+ "step": 32384
+ },
+ {
+ "epoch": 88.2425068119891,
+ "grad_norm": 3.4355244636535645,
+ "learning_rate": 7.163107307778227e-07,
+ "loss": 0.1012,
+ "step": 32385
+ },
+ {
+ "epoch": 88.24523160762942,
+ "grad_norm": 1.8461685180664062,
+ "learning_rate": 7.159827789963181e-07,
+ "loss": 0.0284,
+ "step": 32386
+ },
+ {
+ "epoch": 88.24795640326975,
+ "grad_norm": 2.820727825164795,
+ "learning_rate": 7.156548995184398e-07,
+ "loss": 0.0233,
+ "step": 32387
+ },
+ {
+ "epoch": 88.25068119891009,
+ "grad_norm": 6.894948482513428,
+ "learning_rate": 7.153270923467437e-07,
+ "loss": 0.1378,
+ "step": 32388
+ },
+ {
+ "epoch": 88.2534059945504,
+ "grad_norm": 2.133219003677368,
+ "learning_rate": 7.149993574837822e-07,
+ "loss": 0.0366,
+ "step": 32389
+ },
+ {
+ "epoch": 88.25613079019074,
+ "grad_norm": 2.540095090866089,
+ "learning_rate": 7.146716949321042e-07,
+ "loss": 0.0585,
+ "step": 32390
+ },
+ {
+ "epoch": 88.25885558583106,
+ "grad_norm": 2.4622929096221924,
+ "learning_rate": 7.143441046942645e-07,
+ "loss": 0.0401,
+ "step": 32391
+ },
+ {
+ "epoch": 88.26158038147139,
+ "grad_norm": 2.0890092849731445,
+ "learning_rate": 7.140165867728166e-07,
+ "loss": 0.0298,
+ "step": 32392
+ },
+ {
+ "epoch": 88.26430517711172,
+ "grad_norm": 1.8422714471817017,
+ "learning_rate": 7.136891411703073e-07,
+ "loss": 0.0353,
+ "step": 32393
+ },
+ {
+ "epoch": 88.26702997275204,
+ "grad_norm": 3.064406394958496,
+ "learning_rate": 7.13361767889289e-07,
+ "loss": 0.0589,
+ "step": 32394
+ },
+ {
+ "epoch": 88.26975476839237,
+ "grad_norm": 2.9960241317749023,
+ "learning_rate": 7.130344669323086e-07,
+ "loss": 0.0678,
+ "step": 32395
+ },
+ {
+ "epoch": 88.2724795640327,
+ "grad_norm": 1.6039263010025024,
+ "learning_rate": 7.127072383019185e-07,
+ "loss": 0.0176,
+ "step": 32396
+ },
+ {
+ "epoch": 88.27520435967303,
+ "grad_norm": 2.260348081588745,
+ "learning_rate": 7.123800820006643e-07,
+ "loss": 0.076,
+ "step": 32397
+ },
+ {
+ "epoch": 88.27792915531334,
+ "grad_norm": 4.56273889541626,
+ "learning_rate": 7.120529980310964e-07,
+ "loss": 0.0361,
+ "step": 32398
+ },
+ {
+ "epoch": 88.28065395095368,
+ "grad_norm": 2.5440008640289307,
+ "learning_rate": 7.117259863957593e-07,
+ "loss": 0.0676,
+ "step": 32399
+ },
+ {
+ "epoch": 88.28337874659401,
+ "grad_norm": 2.3230483531951904,
+ "learning_rate": 7.113990470972021e-07,
+ "loss": 0.0304,
+ "step": 32400
+ },
+ {
+ "epoch": 88.28610354223433,
+ "grad_norm": 5.4216461181640625,
+ "learning_rate": 7.110721801379705e-07,
+ "loss": 0.0302,
+ "step": 32401
+ },
+ {
+ "epoch": 88.28882833787466,
+ "grad_norm": 1.4944161176681519,
+ "learning_rate": 7.107453855206103e-07,
+ "loss": 0.0178,
+ "step": 32402
+ },
+ {
+ "epoch": 88.29155313351498,
+ "grad_norm": 2.5314242839813232,
+ "learning_rate": 7.104186632476639e-07,
+ "loss": 0.0691,
+ "step": 32403
+ },
+ {
+ "epoch": 88.29427792915531,
+ "grad_norm": 2.4386959075927734,
+ "learning_rate": 7.100920133216793e-07,
+ "loss": 0.0376,
+ "step": 32404
+ },
+ {
+ "epoch": 88.29700272479565,
+ "grad_norm": 2.228200674057007,
+ "learning_rate": 7.097654357451999e-07,
+ "loss": 0.031,
+ "step": 32405
+ },
+ {
+ "epoch": 88.29972752043597,
+ "grad_norm": 1.8890329599380493,
+ "learning_rate": 7.094389305207683e-07,
+ "loss": 0.0435,
+ "step": 32406
+ },
+ {
+ "epoch": 88.3024523160763,
+ "grad_norm": 3.7059457302093506,
+ "learning_rate": 7.091124976509245e-07,
+ "loss": 0.0433,
+ "step": 32407
+ },
+ {
+ "epoch": 88.30517711171662,
+ "grad_norm": 3.3551275730133057,
+ "learning_rate": 7.087861371382143e-07,
+ "loss": 0.1015,
+ "step": 32408
+ },
+ {
+ "epoch": 88.30790190735695,
+ "grad_norm": 3.033982515335083,
+ "learning_rate": 7.084598489851813e-07,
+ "loss": 0.1362,
+ "step": 32409
+ },
+ {
+ "epoch": 88.31062670299727,
+ "grad_norm": 2.023897647857666,
+ "learning_rate": 7.081336331943623e-07,
+ "loss": 0.035,
+ "step": 32410
+ },
+ {
+ "epoch": 88.3133514986376,
+ "grad_norm": 3.2727036476135254,
+ "learning_rate": 7.078074897682985e-07,
+ "loss": 0.0595,
+ "step": 32411
+ },
+ {
+ "epoch": 88.31607629427793,
+ "grad_norm": 2.589975357055664,
+ "learning_rate": 7.074814187095324e-07,
+ "loss": 0.1007,
+ "step": 32412
+ },
+ {
+ "epoch": 88.31880108991825,
+ "grad_norm": 2.6098878383636475,
+ "learning_rate": 7.071554200206021e-07,
+ "loss": 0.0549,
+ "step": 32413
+ },
+ {
+ "epoch": 88.32152588555859,
+ "grad_norm": 1.8974101543426514,
+ "learning_rate": 7.068294937040465e-07,
+ "loss": 0.1426,
+ "step": 32414
+ },
+ {
+ "epoch": 88.3242506811989,
+ "grad_norm": 1.4538369178771973,
+ "learning_rate": 7.065036397624014e-07,
+ "loss": 0.015,
+ "step": 32415
+ },
+ {
+ "epoch": 88.32697547683924,
+ "grad_norm": 5.012216567993164,
+ "learning_rate": 7.061778581982093e-07,
+ "loss": 0.0572,
+ "step": 32416
+ },
+ {
+ "epoch": 88.32970027247957,
+ "grad_norm": 2.0124173164367676,
+ "learning_rate": 7.058521490140047e-07,
+ "loss": 0.0234,
+ "step": 32417
+ },
+ {
+ "epoch": 88.33242506811989,
+ "grad_norm": 2.1418280601501465,
+ "learning_rate": 7.055265122123245e-07,
+ "loss": 0.024,
+ "step": 32418
+ },
+ {
+ "epoch": 88.33514986376022,
+ "grad_norm": 1.74332857131958,
+ "learning_rate": 7.052009477957022e-07,
+ "loss": 0.0237,
+ "step": 32419
+ },
+ {
+ "epoch": 88.33787465940054,
+ "grad_norm": 2.2411975860595703,
+ "learning_rate": 7.048754557666781e-07,
+ "loss": 0.027,
+ "step": 32420
+ },
+ {
+ "epoch": 88.34059945504087,
+ "grad_norm": 2.1045470237731934,
+ "learning_rate": 7.045500361277846e-07,
+ "loss": 0.0547,
+ "step": 32421
+ },
+ {
+ "epoch": 88.34332425068119,
+ "grad_norm": 2.1541929244995117,
+ "learning_rate": 7.042246888815563e-07,
+ "loss": 0.0974,
+ "step": 32422
+ },
+ {
+ "epoch": 88.34604904632153,
+ "grad_norm": 2.5627400875091553,
+ "learning_rate": 7.038994140305255e-07,
+ "loss": 0.0273,
+ "step": 32423
+ },
+ {
+ "epoch": 88.34877384196186,
+ "grad_norm": 4.022182464599609,
+ "learning_rate": 7.035742115772281e-07,
+ "loss": 0.0455,
+ "step": 32424
+ },
+ {
+ "epoch": 88.35149863760218,
+ "grad_norm": 3.07271671295166,
+ "learning_rate": 7.032490815241943e-07,
+ "loss": 0.0936,
+ "step": 32425
+ },
+ {
+ "epoch": 88.35422343324251,
+ "grad_norm": 2.802013397216797,
+ "learning_rate": 7.029240238739587e-07,
+ "loss": 0.0806,
+ "step": 32426
+ },
+ {
+ "epoch": 88.35694822888283,
+ "grad_norm": 2.2961838245391846,
+ "learning_rate": 7.025990386290527e-07,
+ "loss": 0.1447,
+ "step": 32427
+ },
+ {
+ "epoch": 88.35967302452316,
+ "grad_norm": 2.2719388008117676,
+ "learning_rate": 7.022741257920029e-07,
+ "loss": 0.0492,
+ "step": 32428
+ },
+ {
+ "epoch": 88.3623978201635,
+ "grad_norm": 2.973801851272583,
+ "learning_rate": 7.019492853653454e-07,
+ "loss": 0.0564,
+ "step": 32429
+ },
+ {
+ "epoch": 88.36512261580381,
+ "grad_norm": 2.531278371810913,
+ "learning_rate": 7.016245173516079e-07,
+ "loss": 0.1216,
+ "step": 32430
+ },
+ {
+ "epoch": 88.36784741144415,
+ "grad_norm": 3.1131370067596436,
+ "learning_rate": 7.012998217533174e-07,
+ "loss": 0.2001,
+ "step": 32431
+ },
+ {
+ "epoch": 88.37057220708446,
+ "grad_norm": 3.001033306121826,
+ "learning_rate": 7.009751985730062e-07,
+ "loss": 0.062,
+ "step": 32432
+ },
+ {
+ "epoch": 88.3732970027248,
+ "grad_norm": 2.2466847896575928,
+ "learning_rate": 7.006506478132003e-07,
+ "loss": 0.0268,
+ "step": 32433
+ },
+ {
+ "epoch": 88.37602179836512,
+ "grad_norm": 2.386246919631958,
+ "learning_rate": 7.003261694764286e-07,
+ "loss": 0.024,
+ "step": 32434
+ },
+ {
+ "epoch": 88.37874659400545,
+ "grad_norm": 2.3541605472564697,
+ "learning_rate": 7.000017635652157e-07,
+ "loss": 0.0307,
+ "step": 32435
+ },
+ {
+ "epoch": 88.38147138964578,
+ "grad_norm": 3.0564053058624268,
+ "learning_rate": 6.996774300820919e-07,
+ "loss": 0.0902,
+ "step": 32436
+ },
+ {
+ "epoch": 88.3841961852861,
+ "grad_norm": 2.4900553226470947,
+ "learning_rate": 6.993531690295796e-07,
+ "loss": 0.0354,
+ "step": 32437
+ },
+ {
+ "epoch": 88.38692098092643,
+ "grad_norm": 3.019763469696045,
+ "learning_rate": 6.990289804102068e-07,
+ "loss": 0.245,
+ "step": 32438
+ },
+ {
+ "epoch": 88.38964577656675,
+ "grad_norm": 2.5645194053649902,
+ "learning_rate": 6.987048642264938e-07,
+ "loss": 0.0164,
+ "step": 32439
+ },
+ {
+ "epoch": 88.39237057220708,
+ "grad_norm": 2.028104305267334,
+ "learning_rate": 6.983808204809706e-07,
+ "loss": 0.0277,
+ "step": 32440
+ },
+ {
+ "epoch": 88.39509536784742,
+ "grad_norm": 3.1489453315734863,
+ "learning_rate": 6.980568491761586e-07,
+ "loss": 0.1471,
+ "step": 32441
+ },
+ {
+ "epoch": 88.39782016348774,
+ "grad_norm": 1.981988549232483,
+ "learning_rate": 6.97732950314578e-07,
+ "loss": 0.0334,
+ "step": 32442
+ },
+ {
+ "epoch": 88.40054495912807,
+ "grad_norm": 2.9888768196105957,
+ "learning_rate": 6.974091238987557e-07,
+ "loss": 0.1154,
+ "step": 32443
+ },
+ {
+ "epoch": 88.40326975476839,
+ "grad_norm": 2.751434564590454,
+ "learning_rate": 6.970853699312108e-07,
+ "loss": 0.0654,
+ "step": 32444
+ },
+ {
+ "epoch": 88.40599455040872,
+ "grad_norm": 3.876380681991577,
+ "learning_rate": 6.967616884144668e-07,
+ "loss": 0.0257,
+ "step": 32445
+ },
+ {
+ "epoch": 88.40871934604904,
+ "grad_norm": 2.447319746017456,
+ "learning_rate": 6.964380793510428e-07,
+ "loss": 0.057,
+ "step": 32446
+ },
+ {
+ "epoch": 88.41144414168937,
+ "grad_norm": 4.316874027252197,
+ "learning_rate": 6.961145427434601e-07,
+ "loss": 0.0249,
+ "step": 32447
+ },
+ {
+ "epoch": 88.4141689373297,
+ "grad_norm": 2.9538207054138184,
+ "learning_rate": 6.957910785942357e-07,
+ "loss": 0.2019,
+ "step": 32448
+ },
+ {
+ "epoch": 88.41689373297002,
+ "grad_norm": 2.0260610580444336,
+ "learning_rate": 6.95467686905893e-07,
+ "loss": 0.0491,
+ "step": 32449
+ },
+ {
+ "epoch": 88.41961852861036,
+ "grad_norm": 2.5340194702148438,
+ "learning_rate": 6.951443676809489e-07,
+ "loss": 0.0746,
+ "step": 32450
+ },
+ {
+ "epoch": 88.42234332425068,
+ "grad_norm": 2.870420455932617,
+ "learning_rate": 6.948211209219191e-07,
+ "loss": 0.0373,
+ "step": 32451
+ },
+ {
+ "epoch": 88.42506811989101,
+ "grad_norm": 2.812525749206543,
+ "learning_rate": 6.94497946631324e-07,
+ "loss": 0.0916,
+ "step": 32452
+ },
+ {
+ "epoch": 88.42779291553134,
+ "grad_norm": 2.9845118522644043,
+ "learning_rate": 6.941748448116803e-07,
+ "loss": 0.114,
+ "step": 32453
+ },
+ {
+ "epoch": 88.43051771117166,
+ "grad_norm": 2.2237348556518555,
+ "learning_rate": 6.938518154655027e-07,
+ "loss": 0.0196,
+ "step": 32454
+ },
+ {
+ "epoch": 88.433242506812,
+ "grad_norm": 1.488059401512146,
+ "learning_rate": 6.93528858595306e-07,
+ "loss": 0.025,
+ "step": 32455
+ },
+ {
+ "epoch": 88.43596730245231,
+ "grad_norm": 1.537386417388916,
+ "learning_rate": 6.93205974203609e-07,
+ "loss": 0.0183,
+ "step": 32456
+ },
+ {
+ "epoch": 88.43869209809264,
+ "grad_norm": 2.6214711666107178,
+ "learning_rate": 6.928831622929244e-07,
+ "loss": 0.0319,
+ "step": 32457
+ },
+ {
+ "epoch": 88.44141689373296,
+ "grad_norm": 1.4960311651229858,
+ "learning_rate": 6.925604228657657e-07,
+ "loss": 0.0173,
+ "step": 32458
+ },
+ {
+ "epoch": 88.4441416893733,
+ "grad_norm": 3.0551717281341553,
+ "learning_rate": 6.922377559246462e-07,
+ "loss": 0.0503,
+ "step": 32459
+ },
+ {
+ "epoch": 88.44686648501363,
+ "grad_norm": 4.646723747253418,
+ "learning_rate": 6.919151614720787e-07,
+ "loss": 0.0295,
+ "step": 32460
+ },
+ {
+ "epoch": 88.44959128065395,
+ "grad_norm": 1.8327277898788452,
+ "learning_rate": 6.915926395105776e-07,
+ "loss": 0.1291,
+ "step": 32461
+ },
+ {
+ "epoch": 88.45231607629428,
+ "grad_norm": 2.9880619049072266,
+ "learning_rate": 6.912701900426544e-07,
+ "loss": 0.0687,
+ "step": 32462
+ },
+ {
+ "epoch": 88.4550408719346,
+ "grad_norm": 3.8878345489501953,
+ "learning_rate": 6.909478130708192e-07,
+ "loss": 0.0314,
+ "step": 32463
+ },
+ {
+ "epoch": 88.45776566757493,
+ "grad_norm": 2.996694564819336,
+ "learning_rate": 6.906255085975799e-07,
+ "loss": 0.0989,
+ "step": 32464
+ },
+ {
+ "epoch": 88.46049046321527,
+ "grad_norm": 3.5452499389648438,
+ "learning_rate": 6.903032766254525e-07,
+ "loss": 0.0565,
+ "step": 32465
+ },
+ {
+ "epoch": 88.46321525885558,
+ "grad_norm": 4.170506000518799,
+ "learning_rate": 6.899811171569437e-07,
+ "loss": 0.1153,
+ "step": 32466
+ },
+ {
+ "epoch": 88.46594005449592,
+ "grad_norm": 2.7486510276794434,
+ "learning_rate": 6.896590301945616e-07,
+ "loss": 0.0625,
+ "step": 32467
+ },
+ {
+ "epoch": 88.46866485013624,
+ "grad_norm": 2.1080689430236816,
+ "learning_rate": 6.893370157408141e-07,
+ "loss": 0.0404,
+ "step": 32468
+ },
+ {
+ "epoch": 88.47138964577657,
+ "grad_norm": 2.5748252868652344,
+ "learning_rate": 6.890150737982115e-07,
+ "loss": 0.0474,
+ "step": 32469
+ },
+ {
+ "epoch": 88.47411444141689,
+ "grad_norm": 1.9797866344451904,
+ "learning_rate": 6.886932043692596e-07,
+ "loss": 0.0227,
+ "step": 32470
+ },
+ {
+ "epoch": 88.47683923705722,
+ "grad_norm": 2.369738817214966,
+ "learning_rate": 6.883714074564663e-07,
+ "loss": 0.0889,
+ "step": 32471
+ },
+ {
+ "epoch": 88.47956403269755,
+ "grad_norm": 4.690642833709717,
+ "learning_rate": 6.88049683062334e-07,
+ "loss": 0.0421,
+ "step": 32472
+ },
+ {
+ "epoch": 88.48228882833787,
+ "grad_norm": 2.9402341842651367,
+ "learning_rate": 6.87728031189373e-07,
+ "loss": 0.1101,
+ "step": 32473
+ },
+ {
+ "epoch": 88.4850136239782,
+ "grad_norm": 1.914718508720398,
+ "learning_rate": 6.874064518400869e-07,
+ "loss": 0.0365,
+ "step": 32474
+ },
+ {
+ "epoch": 88.48773841961852,
+ "grad_norm": 2.57735276222229,
+ "learning_rate": 6.870849450169781e-07,
+ "loss": 0.0219,
+ "step": 32475
+ },
+ {
+ "epoch": 88.49046321525886,
+ "grad_norm": 2.4926013946533203,
+ "learning_rate": 6.867635107225512e-07,
+ "loss": 0.0797,
+ "step": 32476
+ },
+ {
+ "epoch": 88.49318801089919,
+ "grad_norm": 3.515141010284424,
+ "learning_rate": 6.864421489593132e-07,
+ "loss": 0.0284,
+ "step": 32477
+ },
+ {
+ "epoch": 88.49591280653951,
+ "grad_norm": 3.1314024925231934,
+ "learning_rate": 6.861208597297631e-07,
+ "loss": 0.079,
+ "step": 32478
+ },
+ {
+ "epoch": 88.49863760217984,
+ "grad_norm": 2.2189550399780273,
+ "learning_rate": 6.857996430364045e-07,
+ "loss": 0.0621,
+ "step": 32479
+ },
+ {
+ "epoch": 88.50136239782016,
+ "grad_norm": 1.7627149820327759,
+ "learning_rate": 6.854784988817365e-07,
+ "loss": 0.0193,
+ "step": 32480
+ },
+ {
+ "epoch": 88.50408719346049,
+ "grad_norm": 1.8683980703353882,
+ "learning_rate": 6.851574272682638e-07,
+ "loss": 0.1362,
+ "step": 32481
+ },
+ {
+ "epoch": 88.50681198910081,
+ "grad_norm": 1.919998288154602,
+ "learning_rate": 6.848364281984843e-07,
+ "loss": 0.0213,
+ "step": 32482
+ },
+ {
+ "epoch": 88.50953678474114,
+ "grad_norm": 2.2226004600524902,
+ "learning_rate": 6.845155016749006e-07,
+ "loss": 0.0477,
+ "step": 32483
+ },
+ {
+ "epoch": 88.51226158038148,
+ "grad_norm": 2.1266064643859863,
+ "learning_rate": 6.841946477000072e-07,
+ "loss": 0.0384,
+ "step": 32484
+ },
+ {
+ "epoch": 88.5149863760218,
+ "grad_norm": 2.8746864795684814,
+ "learning_rate": 6.838738662763089e-07,
+ "loss": 0.0883,
+ "step": 32485
+ },
+ {
+ "epoch": 88.51771117166213,
+ "grad_norm": 3.0734643936157227,
+ "learning_rate": 6.835531574063003e-07,
+ "loss": 0.1,
+ "step": 32486
+ },
+ {
+ "epoch": 88.52043596730245,
+ "grad_norm": 1.7114530801773071,
+ "learning_rate": 6.832325210924806e-07,
+ "loss": 0.0313,
+ "step": 32487
+ },
+ {
+ "epoch": 88.52316076294278,
+ "grad_norm": 2.248533248901367,
+ "learning_rate": 6.829119573373443e-07,
+ "loss": 0.1137,
+ "step": 32488
+ },
+ {
+ "epoch": 88.52588555858311,
+ "grad_norm": 5.388162612915039,
+ "learning_rate": 6.825914661433908e-07,
+ "loss": 0.1057,
+ "step": 32489
+ },
+ {
+ "epoch": 88.52861035422343,
+ "grad_norm": 2.2857561111450195,
+ "learning_rate": 6.822710475131155e-07,
+ "loss": 0.0471,
+ "step": 32490
+ },
+ {
+ "epoch": 88.53133514986376,
+ "grad_norm": 3.316270112991333,
+ "learning_rate": 6.819507014490134e-07,
+ "loss": 0.0884,
+ "step": 32491
+ },
+ {
+ "epoch": 88.53405994550408,
+ "grad_norm": 2.7123632431030273,
+ "learning_rate": 6.81630427953578e-07,
+ "loss": 0.0441,
+ "step": 32492
+ },
+ {
+ "epoch": 88.53678474114442,
+ "grad_norm": 2.2796952724456787,
+ "learning_rate": 6.81310227029307e-07,
+ "loss": 0.0667,
+ "step": 32493
+ },
+ {
+ "epoch": 88.53950953678473,
+ "grad_norm": 2.4223263263702393,
+ "learning_rate": 6.809900986786889e-07,
+ "loss": 0.122,
+ "step": 32494
+ },
+ {
+ "epoch": 88.54223433242507,
+ "grad_norm": 1.859542727470398,
+ "learning_rate": 6.806700429042223e-07,
+ "loss": 0.0206,
+ "step": 32495
+ },
+ {
+ "epoch": 88.5449591280654,
+ "grad_norm": 2.8135170936584473,
+ "learning_rate": 6.803500597083967e-07,
+ "loss": 0.114,
+ "step": 32496
+ },
+ {
+ "epoch": 88.54768392370572,
+ "grad_norm": 2.5066561698913574,
+ "learning_rate": 6.800301490937056e-07,
+ "loss": 0.0545,
+ "step": 32497
+ },
+ {
+ "epoch": 88.55040871934605,
+ "grad_norm": 2.343372344970703,
+ "learning_rate": 6.797103110626402e-07,
+ "loss": 0.0327,
+ "step": 32498
+ },
+ {
+ "epoch": 88.55313351498637,
+ "grad_norm": 3.180253505706787,
+ "learning_rate": 6.793905456176909e-07,
+ "loss": 0.0798,
+ "step": 32499
+ },
+ {
+ "epoch": 88.5558583106267,
+ "grad_norm": 2.0128023624420166,
+ "learning_rate": 6.790708527613454e-07,
+ "loss": 0.086,
+ "step": 32500
+ },
+ {
+ "epoch": 88.55858310626704,
+ "grad_norm": 2.8150742053985596,
+ "learning_rate": 6.787512324960987e-07,
+ "loss": 0.0298,
+ "step": 32501
+ },
+ {
+ "epoch": 88.56130790190736,
+ "grad_norm": 2.445643424987793,
+ "learning_rate": 6.784316848244377e-07,
+ "loss": 0.0359,
+ "step": 32502
+ },
+ {
+ "epoch": 88.56403269754769,
+ "grad_norm": 1.6584358215332031,
+ "learning_rate": 6.781122097488501e-07,
+ "loss": 0.0202,
+ "step": 32503
+ },
+ {
+ "epoch": 88.566757493188,
+ "grad_norm": 2.5261402130126953,
+ "learning_rate": 6.777928072718232e-07,
+ "loss": 0.0983,
+ "step": 32504
+ },
+ {
+ "epoch": 88.56948228882834,
+ "grad_norm": 2.7514688968658447,
+ "learning_rate": 6.774734773958469e-07,
+ "loss": 0.0786,
+ "step": 32505
+ },
+ {
+ "epoch": 88.57220708446866,
+ "grad_norm": 2.7484543323516846,
+ "learning_rate": 6.771542201234071e-07,
+ "loss": 0.0911,
+ "step": 32506
+ },
+ {
+ "epoch": 88.57493188010899,
+ "grad_norm": 1.4559698104858398,
+ "learning_rate": 6.768350354569909e-07,
+ "loss": 0.0155,
+ "step": 32507
+ },
+ {
+ "epoch": 88.57765667574932,
+ "grad_norm": 5.5457658767700195,
+ "learning_rate": 6.765159233990814e-07,
+ "loss": 0.0483,
+ "step": 32508
+ },
+ {
+ "epoch": 88.58038147138964,
+ "grad_norm": 2.0925986766815186,
+ "learning_rate": 6.761968839521682e-07,
+ "loss": 0.0364,
+ "step": 32509
+ },
+ {
+ "epoch": 88.58310626702998,
+ "grad_norm": 3.045254707336426,
+ "learning_rate": 6.758779171187324e-07,
+ "loss": 0.0305,
+ "step": 32510
+ },
+ {
+ "epoch": 88.5858310626703,
+ "grad_norm": 7.752040863037109,
+ "learning_rate": 6.755590229012588e-07,
+ "loss": 0.0869,
+ "step": 32511
+ },
+ {
+ "epoch": 88.58855585831063,
+ "grad_norm": 5.426023483276367,
+ "learning_rate": 6.752402013022319e-07,
+ "loss": 0.1346,
+ "step": 32512
+ },
+ {
+ "epoch": 88.59128065395096,
+ "grad_norm": 3.487820625305176,
+ "learning_rate": 6.749214523241332e-07,
+ "loss": 0.0764,
+ "step": 32513
+ },
+ {
+ "epoch": 88.59400544959128,
+ "grad_norm": 2.4322376251220703,
+ "learning_rate": 6.746027759694474e-07,
+ "loss": 0.1689,
+ "step": 32514
+ },
+ {
+ "epoch": 88.59673024523161,
+ "grad_norm": 2.054391622543335,
+ "learning_rate": 6.742841722406556e-07,
+ "loss": 0.025,
+ "step": 32515
+ },
+ {
+ "epoch": 88.59945504087193,
+ "grad_norm": 2.9714245796203613,
+ "learning_rate": 6.739656411402363e-07,
+ "loss": 0.1152,
+ "step": 32516
+ },
+ {
+ "epoch": 88.60217983651226,
+ "grad_norm": 1.3651752471923828,
+ "learning_rate": 6.736471826706747e-07,
+ "loss": 0.0147,
+ "step": 32517
+ },
+ {
+ "epoch": 88.60490463215258,
+ "grad_norm": 2.0237410068511963,
+ "learning_rate": 6.733287968344482e-07,
+ "loss": 0.0799,
+ "step": 32518
+ },
+ {
+ "epoch": 88.60762942779292,
+ "grad_norm": 2.2222201824188232,
+ "learning_rate": 6.730104836340367e-07,
+ "loss": 0.0456,
+ "step": 32519
+ },
+ {
+ "epoch": 88.61035422343325,
+ "grad_norm": 2.871119260787964,
+ "learning_rate": 6.726922430719185e-07,
+ "loss": 0.0737,
+ "step": 32520
+ },
+ {
+ "epoch": 88.61307901907357,
+ "grad_norm": 1.9032843112945557,
+ "learning_rate": 6.723740751505736e-07,
+ "loss": 0.0749,
+ "step": 32521
+ },
+ {
+ "epoch": 88.6158038147139,
+ "grad_norm": 2.381385564804077,
+ "learning_rate": 6.720559798724801e-07,
+ "loss": 0.0239,
+ "step": 32522
+ },
+ {
+ "epoch": 88.61852861035422,
+ "grad_norm": 2.4233813285827637,
+ "learning_rate": 6.717379572401139e-07,
+ "loss": 0.043,
+ "step": 32523
+ },
+ {
+ "epoch": 88.62125340599455,
+ "grad_norm": 3.771385431289673,
+ "learning_rate": 6.714200072559507e-07,
+ "loss": 0.0514,
+ "step": 32524
+ },
+ {
+ "epoch": 88.62397820163488,
+ "grad_norm": 7.224627494812012,
+ "learning_rate": 6.711021299224696e-07,
+ "loss": 0.0377,
+ "step": 32525
+ },
+ {
+ "epoch": 88.6267029972752,
+ "grad_norm": 2.9198646545410156,
+ "learning_rate": 6.707843252421453e-07,
+ "loss": 0.1455,
+ "step": 32526
+ },
+ {
+ "epoch": 88.62942779291554,
+ "grad_norm": 4.023635387420654,
+ "learning_rate": 6.704665932174525e-07,
+ "loss": 0.1044,
+ "step": 32527
+ },
+ {
+ "epoch": 88.63215258855585,
+ "grad_norm": 2.3568904399871826,
+ "learning_rate": 6.701489338508638e-07,
+ "loss": 0.0357,
+ "step": 32528
+ },
+ {
+ "epoch": 88.63487738419619,
+ "grad_norm": 1.82301926612854,
+ "learning_rate": 6.698313471448547e-07,
+ "loss": 0.0942,
+ "step": 32529
+ },
+ {
+ "epoch": 88.6376021798365,
+ "grad_norm": 2.3839166164398193,
+ "learning_rate": 6.695138331019002e-07,
+ "loss": 0.1733,
+ "step": 32530
+ },
+ {
+ "epoch": 88.64032697547684,
+ "grad_norm": 2.619131088256836,
+ "learning_rate": 6.691963917244726e-07,
+ "loss": 0.0795,
+ "step": 32531
+ },
+ {
+ "epoch": 88.64305177111717,
+ "grad_norm": 2.787616014480591,
+ "learning_rate": 6.688790230150421e-07,
+ "loss": 0.0362,
+ "step": 32532
+ },
+ {
+ "epoch": 88.64577656675749,
+ "grad_norm": 2.427051067352295,
+ "learning_rate": 6.685617269760802e-07,
+ "loss": 0.025,
+ "step": 32533
+ },
+ {
+ "epoch": 88.64850136239782,
+ "grad_norm": 2.578310489654541,
+ "learning_rate": 6.682445036100616e-07,
+ "loss": 0.0972,
+ "step": 32534
+ },
+ {
+ "epoch": 88.65122615803814,
+ "grad_norm": 1.6142969131469727,
+ "learning_rate": 6.679273529194541e-07,
+ "loss": 0.0187,
+ "step": 32535
+ },
+ {
+ "epoch": 88.65395095367847,
+ "grad_norm": 4.000240802764893,
+ "learning_rate": 6.67610274906727e-07,
+ "loss": 0.1039,
+ "step": 32536
+ },
+ {
+ "epoch": 88.65667574931881,
+ "grad_norm": 2.3971710205078125,
+ "learning_rate": 6.672932695743506e-07,
+ "loss": 0.0202,
+ "step": 32537
+ },
+ {
+ "epoch": 88.65940054495913,
+ "grad_norm": 2.449756622314453,
+ "learning_rate": 6.669763369247939e-07,
+ "loss": 0.0776,
+ "step": 32538
+ },
+ {
+ "epoch": 88.66212534059946,
+ "grad_norm": 1.5375303030014038,
+ "learning_rate": 6.666594769605261e-07,
+ "loss": 0.0149,
+ "step": 32539
+ },
+ {
+ "epoch": 88.66485013623978,
+ "grad_norm": 3.071993827819824,
+ "learning_rate": 6.66342689684012e-07,
+ "loss": 0.047,
+ "step": 32540
+ },
+ {
+ "epoch": 88.66757493188011,
+ "grad_norm": 2.8569655418395996,
+ "learning_rate": 6.660259750977227e-07,
+ "loss": 0.0233,
+ "step": 32541
+ },
+ {
+ "epoch": 88.67029972752043,
+ "grad_norm": 2.814210891723633,
+ "learning_rate": 6.65709333204122e-07,
+ "loss": 0.0423,
+ "step": 32542
+ },
+ {
+ "epoch": 88.67302452316076,
+ "grad_norm": 2.6103148460388184,
+ "learning_rate": 6.653927640056779e-07,
+ "loss": 0.0371,
+ "step": 32543
+ },
+ {
+ "epoch": 88.6757493188011,
+ "grad_norm": 1.996567726135254,
+ "learning_rate": 6.650762675048516e-07,
+ "loss": 0.0309,
+ "step": 32544
+ },
+ {
+ "epoch": 88.67847411444141,
+ "grad_norm": 1.3965378999710083,
+ "learning_rate": 6.647598437041114e-07,
+ "loss": 0.0221,
+ "step": 32545
+ },
+ {
+ "epoch": 88.68119891008175,
+ "grad_norm": 2.909156322479248,
+ "learning_rate": 6.644434926059228e-07,
+ "loss": 0.031,
+ "step": 32546
+ },
+ {
+ "epoch": 88.68392370572207,
+ "grad_norm": 2.3875527381896973,
+ "learning_rate": 6.641272142127475e-07,
+ "loss": 0.0394,
+ "step": 32547
+ },
+ {
+ "epoch": 88.6866485013624,
+ "grad_norm": 1.9616997241973877,
+ "learning_rate": 6.638110085270488e-07,
+ "loss": 0.0276,
+ "step": 32548
+ },
+ {
+ "epoch": 88.68937329700273,
+ "grad_norm": 2.376124858856201,
+ "learning_rate": 6.634948755512882e-07,
+ "loss": 0.0341,
+ "step": 32549
+ },
+ {
+ "epoch": 88.69209809264305,
+ "grad_norm": 3.137643337249756,
+ "learning_rate": 6.631788152879304e-07,
+ "loss": 0.106,
+ "step": 32550
+ },
+ {
+ "epoch": 88.69482288828338,
+ "grad_norm": 3.1571850776672363,
+ "learning_rate": 6.628628277394356e-07,
+ "loss": 0.0565,
+ "step": 32551
+ },
+ {
+ "epoch": 88.6975476839237,
+ "grad_norm": 3.1629316806793213,
+ "learning_rate": 6.625469129082651e-07,
+ "loss": 0.137,
+ "step": 32552
+ },
+ {
+ "epoch": 88.70027247956403,
+ "grad_norm": 2.550363540649414,
+ "learning_rate": 6.62231070796876e-07,
+ "loss": 0.0909,
+ "step": 32553
+ },
+ {
+ "epoch": 88.70299727520435,
+ "grad_norm": 2.6861281394958496,
+ "learning_rate": 6.619153014077328e-07,
+ "loss": 0.0411,
+ "step": 32554
+ },
+ {
+ "epoch": 88.70572207084469,
+ "grad_norm": 1.8477747440338135,
+ "learning_rate": 6.615996047432937e-07,
+ "loss": 0.0589,
+ "step": 32555
+ },
+ {
+ "epoch": 88.70844686648502,
+ "grad_norm": 3.0497498512268066,
+ "learning_rate": 6.612839808060146e-07,
+ "loss": 0.061,
+ "step": 32556
+ },
+ {
+ "epoch": 88.71117166212534,
+ "grad_norm": 2.910400867462158,
+ "learning_rate": 6.609684295983553e-07,
+ "loss": 0.0485,
+ "step": 32557
+ },
+ {
+ "epoch": 88.71389645776567,
+ "grad_norm": 4.672149658203125,
+ "learning_rate": 6.606529511227743e-07,
+ "loss": 0.0623,
+ "step": 32558
+ },
+ {
+ "epoch": 88.71662125340599,
+ "grad_norm": 2.9744796752929688,
+ "learning_rate": 6.603375453817273e-07,
+ "loss": 0.094,
+ "step": 32559
+ },
+ {
+ "epoch": 88.71934604904632,
+ "grad_norm": 3.9777817726135254,
+ "learning_rate": 6.600222123776712e-07,
+ "loss": 0.0494,
+ "step": 32560
+ },
+ {
+ "epoch": 88.72207084468666,
+ "grad_norm": 2.20937442779541,
+ "learning_rate": 6.597069521130594e-07,
+ "loss": 0.0667,
+ "step": 32561
+ },
+ {
+ "epoch": 88.72479564032697,
+ "grad_norm": 2.979435443878174,
+ "learning_rate": 6.593917645903491e-07,
+ "loss": 0.0806,
+ "step": 32562
+ },
+ {
+ "epoch": 88.7275204359673,
+ "grad_norm": 1.8783541917800903,
+ "learning_rate": 6.590766498119983e-07,
+ "loss": 0.0202,
+ "step": 32563
+ },
+ {
+ "epoch": 88.73024523160763,
+ "grad_norm": 4.087584018707275,
+ "learning_rate": 6.58761607780456e-07,
+ "loss": 0.0829,
+ "step": 32564
+ },
+ {
+ "epoch": 88.73297002724796,
+ "grad_norm": 2.5798182487487793,
+ "learning_rate": 6.584466384981769e-07,
+ "loss": 0.0248,
+ "step": 32565
+ },
+ {
+ "epoch": 88.73569482288828,
+ "grad_norm": 3.663706064224243,
+ "learning_rate": 6.58131741967617e-07,
+ "loss": 0.1457,
+ "step": 32566
+ },
+ {
+ "epoch": 88.73841961852861,
+ "grad_norm": 3.7107369899749756,
+ "learning_rate": 6.578169181912252e-07,
+ "loss": 0.0469,
+ "step": 32567
+ },
+ {
+ "epoch": 88.74114441416894,
+ "grad_norm": 2.8559722900390625,
+ "learning_rate": 6.575021671714554e-07,
+ "loss": 0.0285,
+ "step": 32568
+ },
+ {
+ "epoch": 88.74386920980926,
+ "grad_norm": 1.462720513343811,
+ "learning_rate": 6.571874889107554e-07,
+ "loss": 0.0192,
+ "step": 32569
+ },
+ {
+ "epoch": 88.7465940054496,
+ "grad_norm": 1.8686283826828003,
+ "learning_rate": 6.568728834115812e-07,
+ "loss": 0.0382,
+ "step": 32570
+ },
+ {
+ "epoch": 88.74931880108991,
+ "grad_norm": 4.0126566886901855,
+ "learning_rate": 6.565583506763795e-07,
+ "loss": 0.0472,
+ "step": 32571
+ },
+ {
+ "epoch": 88.75204359673025,
+ "grad_norm": 2.335212230682373,
+ "learning_rate": 6.562438907076018e-07,
+ "loss": 0.0407,
+ "step": 32572
+ },
+ {
+ "epoch": 88.75476839237058,
+ "grad_norm": 2.825334310531616,
+ "learning_rate": 6.559295035076929e-07,
+ "loss": 0.0724,
+ "step": 32573
+ },
+ {
+ "epoch": 88.7574931880109,
+ "grad_norm": 2.296994924545288,
+ "learning_rate": 6.556151890791073e-07,
+ "loss": 0.0274,
+ "step": 32574
+ },
+ {
+ "epoch": 88.76021798365123,
+ "grad_norm": 3.0914974212646484,
+ "learning_rate": 6.553009474242888e-07,
+ "loss": 0.0387,
+ "step": 32575
+ },
+ {
+ "epoch": 88.76294277929155,
+ "grad_norm": 2.1979379653930664,
+ "learning_rate": 6.549867785456864e-07,
+ "loss": 0.0975,
+ "step": 32576
+ },
+ {
+ "epoch": 88.76566757493188,
+ "grad_norm": 3.263225555419922,
+ "learning_rate": 6.546726824457438e-07,
+ "loss": 0.0783,
+ "step": 32577
+ },
+ {
+ "epoch": 88.7683923705722,
+ "grad_norm": 3.954967975616455,
+ "learning_rate": 6.543586591269124e-07,
+ "loss": 0.1224,
+ "step": 32578
+ },
+ {
+ "epoch": 88.77111716621253,
+ "grad_norm": 2.4080593585968018,
+ "learning_rate": 6.540447085916346e-07,
+ "loss": 0.0678,
+ "step": 32579
+ },
+ {
+ "epoch": 88.77384196185287,
+ "grad_norm": 2.408904790878296,
+ "learning_rate": 6.537308308423529e-07,
+ "loss": 0.0414,
+ "step": 32580
+ },
+ {
+ "epoch": 88.77656675749319,
+ "grad_norm": 3.955139398574829,
+ "learning_rate": 6.534170258815165e-07,
+ "loss": 0.1601,
+ "step": 32581
+ },
+ {
+ "epoch": 88.77929155313352,
+ "grad_norm": 2.4776837825775146,
+ "learning_rate": 6.531032937115677e-07,
+ "loss": 0.0286,
+ "step": 32582
+ },
+ {
+ "epoch": 88.78201634877384,
+ "grad_norm": 2.7745254039764404,
+ "learning_rate": 6.527896343349505e-07,
+ "loss": 0.2462,
+ "step": 32583
+ },
+ {
+ "epoch": 88.78474114441417,
+ "grad_norm": 16.306833267211914,
+ "learning_rate": 6.52476047754107e-07,
+ "loss": 0.0215,
+ "step": 32584
+ },
+ {
+ "epoch": 88.7874659400545,
+ "grad_norm": 2.210672378540039,
+ "learning_rate": 6.521625339714765e-07,
+ "loss": 0.0875,
+ "step": 32585
+ },
+ {
+ "epoch": 88.79019073569482,
+ "grad_norm": 2.5565500259399414,
+ "learning_rate": 6.51849092989506e-07,
+ "loss": 0.0517,
+ "step": 32586
+ },
+ {
+ "epoch": 88.79291553133515,
+ "grad_norm": 3.453659772872925,
+ "learning_rate": 6.515357248106325e-07,
+ "loss": 0.1878,
+ "step": 32587
+ },
+ {
+ "epoch": 88.79564032697547,
+ "grad_norm": 2.9403576850891113,
+ "learning_rate": 6.512224294372993e-07,
+ "loss": 0.0333,
+ "step": 32588
+ },
+ {
+ "epoch": 88.7983651226158,
+ "grad_norm": 3.5595004558563232,
+ "learning_rate": 6.509092068719425e-07,
+ "loss": 0.0309,
+ "step": 32589
+ },
+ {
+ "epoch": 88.80108991825612,
+ "grad_norm": 2.377322196960449,
+ "learning_rate": 6.505960571170056e-07,
+ "loss": 0.0456,
+ "step": 32590
+ },
+ {
+ "epoch": 88.80381471389646,
+ "grad_norm": 2.6467015743255615,
+ "learning_rate": 6.502829801749266e-07,
+ "loss": 0.0956,
+ "step": 32591
+ },
+ {
+ "epoch": 88.80653950953679,
+ "grad_norm": 2.7683017253875732,
+ "learning_rate": 6.499699760481415e-07,
+ "loss": 0.069,
+ "step": 32592
+ },
+ {
+ "epoch": 88.80926430517711,
+ "grad_norm": 5.441568851470947,
+ "learning_rate": 6.496570447390893e-07,
+ "loss": 0.0245,
+ "step": 32593
+ },
+ {
+ "epoch": 88.81198910081744,
+ "grad_norm": 2.438164472579956,
+ "learning_rate": 6.49344186250207e-07,
+ "loss": 0.0317,
+ "step": 32594
+ },
+ {
+ "epoch": 88.81471389645776,
+ "grad_norm": 2.7427258491516113,
+ "learning_rate": 6.490314005839327e-07,
+ "loss": 0.082,
+ "step": 32595
+ },
+ {
+ "epoch": 88.8174386920981,
+ "grad_norm": 3.3365774154663086,
+ "learning_rate": 6.487186877426998e-07,
+ "loss": 0.0434,
+ "step": 32596
+ },
+ {
+ "epoch": 88.82016348773843,
+ "grad_norm": 6.6274542808532715,
+ "learning_rate": 6.484060477289433e-07,
+ "loss": 0.0313,
+ "step": 32597
+ },
+ {
+ "epoch": 88.82288828337875,
+ "grad_norm": 2.2954092025756836,
+ "learning_rate": 6.480934805451001e-07,
+ "loss": 0.0643,
+ "step": 32598
+ },
+ {
+ "epoch": 88.82561307901908,
+ "grad_norm": 2.240321636199951,
+ "learning_rate": 6.477809861936047e-07,
+ "loss": 0.0309,
+ "step": 32599
+ },
+ {
+ "epoch": 88.8283378746594,
+ "grad_norm": 3.0100510120391846,
+ "learning_rate": 6.474685646768908e-07,
+ "loss": 0.1114,
+ "step": 32600
+ },
+ {
+ "epoch": 88.83106267029973,
+ "grad_norm": 3.1723432540893555,
+ "learning_rate": 6.471562159973899e-07,
+ "loss": 0.0271,
+ "step": 32601
+ },
+ {
+ "epoch": 88.83378746594005,
+ "grad_norm": 1.8667747974395752,
+ "learning_rate": 6.468439401575344e-07,
+ "loss": 0.1159,
+ "step": 32602
+ },
+ {
+ "epoch": 88.83651226158038,
+ "grad_norm": 1.8212648630142212,
+ "learning_rate": 6.46531737159759e-07,
+ "loss": 0.0195,
+ "step": 32603
+ },
+ {
+ "epoch": 88.83923705722071,
+ "grad_norm": 1.2121655941009521,
+ "learning_rate": 6.46219607006493e-07,
+ "loss": 0.0145,
+ "step": 32604
+ },
+ {
+ "epoch": 88.84196185286103,
+ "grad_norm": 3.006887435913086,
+ "learning_rate": 6.459075497001655e-07,
+ "loss": 0.0489,
+ "step": 32605
+ },
+ {
+ "epoch": 88.84468664850137,
+ "grad_norm": 2.8322653770446777,
+ "learning_rate": 6.455955652432111e-07,
+ "loss": 0.021,
+ "step": 32606
+ },
+ {
+ "epoch": 88.84741144414168,
+ "grad_norm": 2.9975996017456055,
+ "learning_rate": 6.45283653638058e-07,
+ "loss": 0.0737,
+ "step": 32607
+ },
+ {
+ "epoch": 88.85013623978202,
+ "grad_norm": 3.215750217437744,
+ "learning_rate": 6.449718148871342e-07,
+ "loss": 0.1501,
+ "step": 32608
+ },
+ {
+ "epoch": 88.85286103542235,
+ "grad_norm": 3.315380096435547,
+ "learning_rate": 6.446600489928667e-07,
+ "loss": 0.0647,
+ "step": 32609
+ },
+ {
+ "epoch": 88.85558583106267,
+ "grad_norm": 2.2998287677764893,
+ "learning_rate": 6.443483559576879e-07,
+ "loss": 0.0519,
+ "step": 32610
+ },
+ {
+ "epoch": 88.858310626703,
+ "grad_norm": 3.173992872238159,
+ "learning_rate": 6.440367357840228e-07,
+ "loss": 0.0286,
+ "step": 32611
+ },
+ {
+ "epoch": 88.86103542234332,
+ "grad_norm": 3.3180930614471436,
+ "learning_rate": 6.43725188474299e-07,
+ "loss": 0.0357,
+ "step": 32612
+ },
+ {
+ "epoch": 88.86376021798365,
+ "grad_norm": 4.685422897338867,
+ "learning_rate": 6.434137140309393e-07,
+ "loss": 0.0883,
+ "step": 32613
+ },
+ {
+ "epoch": 88.86648501362397,
+ "grad_norm": 2.7520151138305664,
+ "learning_rate": 6.43102312456374e-07,
+ "loss": 0.0362,
+ "step": 32614
+ },
+ {
+ "epoch": 88.8692098092643,
+ "grad_norm": 2.7013070583343506,
+ "learning_rate": 6.427909837530278e-07,
+ "loss": 0.0324,
+ "step": 32615
+ },
+ {
+ "epoch": 88.87193460490464,
+ "grad_norm": 1.632001280784607,
+ "learning_rate": 6.424797279233242e-07,
+ "loss": 0.03,
+ "step": 32616
+ },
+ {
+ "epoch": 88.87465940054496,
+ "grad_norm": 2.813481092453003,
+ "learning_rate": 6.421685449696868e-07,
+ "loss": 0.0352,
+ "step": 32617
+ },
+ {
+ "epoch": 88.87738419618529,
+ "grad_norm": 2.818861246109009,
+ "learning_rate": 6.418574348945384e-07,
+ "loss": 0.0523,
+ "step": 32618
+ },
+ {
+ "epoch": 88.88010899182561,
+ "grad_norm": 2.4353575706481934,
+ "learning_rate": 6.415463977003045e-07,
+ "loss": 0.1397,
+ "step": 32619
+ },
+ {
+ "epoch": 88.88283378746594,
+ "grad_norm": 3.076411724090576,
+ "learning_rate": 6.412354333894067e-07,
+ "loss": 0.0355,
+ "step": 32620
+ },
+ {
+ "epoch": 88.88555858310627,
+ "grad_norm": 2.091139793395996,
+ "learning_rate": 6.409245419642663e-07,
+ "loss": 0.0232,
+ "step": 32621
+ },
+ {
+ "epoch": 88.88828337874659,
+ "grad_norm": 2.2614316940307617,
+ "learning_rate": 6.406137234273013e-07,
+ "loss": 0.0869,
+ "step": 32622
+ },
+ {
+ "epoch": 88.89100817438693,
+ "grad_norm": 3.105689525604248,
+ "learning_rate": 6.403029777809377e-07,
+ "loss": 0.0956,
+ "step": 32623
+ },
+ {
+ "epoch": 88.89373297002724,
+ "grad_norm": 5.176424503326416,
+ "learning_rate": 6.399923050275935e-07,
+ "loss": 0.0207,
+ "step": 32624
+ },
+ {
+ "epoch": 88.89645776566758,
+ "grad_norm": 2.1554253101348877,
+ "learning_rate": 6.396817051696869e-07,
+ "loss": 0.0654,
+ "step": 32625
+ },
+ {
+ "epoch": 88.8991825613079,
+ "grad_norm": 2.6068801879882812,
+ "learning_rate": 6.39371178209639e-07,
+ "loss": 0.0411,
+ "step": 32626
+ },
+ {
+ "epoch": 88.90190735694823,
+ "grad_norm": 3.9998323917388916,
+ "learning_rate": 6.39060724149867e-07,
+ "loss": 0.0851,
+ "step": 32627
+ },
+ {
+ "epoch": 88.90463215258856,
+ "grad_norm": 2.202383518218994,
+ "learning_rate": 6.387503429927888e-07,
+ "loss": 0.0947,
+ "step": 32628
+ },
+ {
+ "epoch": 88.90735694822888,
+ "grad_norm": 1.9589344263076782,
+ "learning_rate": 6.384400347408204e-07,
+ "loss": 0.0257,
+ "step": 32629
+ },
+ {
+ "epoch": 88.91008174386921,
+ "grad_norm": 4.329192638397217,
+ "learning_rate": 6.381297993963809e-07,
+ "loss": 0.1002,
+ "step": 32630
+ },
+ {
+ "epoch": 88.91280653950953,
+ "grad_norm": 3.230823516845703,
+ "learning_rate": 6.378196369618828e-07,
+ "loss": 0.0496,
+ "step": 32631
+ },
+ {
+ "epoch": 88.91553133514986,
+ "grad_norm": 2.3963263034820557,
+ "learning_rate": 6.375095474397475e-07,
+ "loss": 0.0968,
+ "step": 32632
+ },
+ {
+ "epoch": 88.9182561307902,
+ "grad_norm": 2.2858119010925293,
+ "learning_rate": 6.371995308323853e-07,
+ "loss": 0.0712,
+ "step": 32633
+ },
+ {
+ "epoch": 88.92098092643052,
+ "grad_norm": 5.101203918457031,
+ "learning_rate": 6.368895871422099e-07,
+ "loss": 0.0385,
+ "step": 32634
+ },
+ {
+ "epoch": 88.92370572207085,
+ "grad_norm": 2.0538389682769775,
+ "learning_rate": 6.365797163716392e-07,
+ "loss": 0.1404,
+ "step": 32635
+ },
+ {
+ "epoch": 88.92643051771117,
+ "grad_norm": 2.3281009197235107,
+ "learning_rate": 6.362699185230848e-07,
+ "loss": 0.0459,
+ "step": 32636
+ },
+ {
+ "epoch": 88.9291553133515,
+ "grad_norm": 2.309115409851074,
+ "learning_rate": 6.359601935989579e-07,
+ "loss": 0.0777,
+ "step": 32637
+ },
+ {
+ "epoch": 88.93188010899182,
+ "grad_norm": 2.052091598510742,
+ "learning_rate": 6.356505416016712e-07,
+ "loss": 0.029,
+ "step": 32638
+ },
+ {
+ "epoch": 88.93460490463215,
+ "grad_norm": 4.119014263153076,
+ "learning_rate": 6.353409625336371e-07,
+ "loss": 0.1418,
+ "step": 32639
+ },
+ {
+ "epoch": 88.93732970027249,
+ "grad_norm": 1.9511654376983643,
+ "learning_rate": 6.350314563972671e-07,
+ "loss": 0.1573,
+ "step": 32640
+ },
+ {
+ "epoch": 88.9400544959128,
+ "grad_norm": 2.795783758163452,
+ "learning_rate": 6.347220231949702e-07,
+ "loss": 0.0499,
+ "step": 32641
+ },
+ {
+ "epoch": 88.94277929155314,
+ "grad_norm": 3.338364601135254,
+ "learning_rate": 6.344126629291559e-07,
+ "loss": 0.1038,
+ "step": 32642
+ },
+ {
+ "epoch": 88.94550408719346,
+ "grad_norm": 3.1988728046417236,
+ "learning_rate": 6.341033756022352e-07,
+ "loss": 0.1616,
+ "step": 32643
+ },
+ {
+ "epoch": 88.94822888283379,
+ "grad_norm": 2.0884668827056885,
+ "learning_rate": 6.337941612166154e-07,
+ "loss": 0.0275,
+ "step": 32644
+ },
+ {
+ "epoch": 88.95095367847412,
+ "grad_norm": 2.2075607776641846,
+ "learning_rate": 6.334850197747066e-07,
+ "loss": 0.0252,
+ "step": 32645
+ },
+ {
+ "epoch": 88.95367847411444,
+ "grad_norm": 5.519400596618652,
+ "learning_rate": 6.331759512789126e-07,
+ "loss": 0.1259,
+ "step": 32646
+ },
+ {
+ "epoch": 88.95640326975477,
+ "grad_norm": 1.751410961151123,
+ "learning_rate": 6.328669557316447e-07,
+ "loss": 0.0471,
+ "step": 32647
+ },
+ {
+ "epoch": 88.95912806539509,
+ "grad_norm": 2.8046438694000244,
+ "learning_rate": 6.325580331353065e-07,
+ "loss": 0.0349,
+ "step": 32648
+ },
+ {
+ "epoch": 88.96185286103542,
+ "grad_norm": 2.2592806816101074,
+ "learning_rate": 6.32249183492305e-07,
+ "loss": 0.0233,
+ "step": 32649
+ },
+ {
+ "epoch": 88.96457765667574,
+ "grad_norm": 2.1258723735809326,
+ "learning_rate": 6.319404068050439e-07,
+ "loss": 0.0625,
+ "step": 32650
+ },
+ {
+ "epoch": 88.96730245231608,
+ "grad_norm": 3.519087076187134,
+ "learning_rate": 6.316317030759322e-07,
+ "loss": 0.067,
+ "step": 32651
+ },
+ {
+ "epoch": 88.97002724795641,
+ "grad_norm": 2.198286533355713,
+ "learning_rate": 6.313230723073704e-07,
+ "loss": 0.0326,
+ "step": 32652
+ },
+ {
+ "epoch": 88.97275204359673,
+ "grad_norm": 4.731808662414551,
+ "learning_rate": 6.310145145017633e-07,
+ "loss": 0.052,
+ "step": 32653
+ },
+ {
+ "epoch": 88.97547683923706,
+ "grad_norm": 1.3734490871429443,
+ "learning_rate": 6.30706029661512e-07,
+ "loss": 0.0265,
+ "step": 32654
+ },
+ {
+ "epoch": 88.97820163487738,
+ "grad_norm": 2.5870254039764404,
+ "learning_rate": 6.303976177890214e-07,
+ "loss": 0.0681,
+ "step": 32655
+ },
+ {
+ "epoch": 88.98092643051771,
+ "grad_norm": 2.2474260330200195,
+ "learning_rate": 6.300892788866942e-07,
+ "loss": 0.0476,
+ "step": 32656
+ },
+ {
+ "epoch": 88.98365122615803,
+ "grad_norm": 5.296260833740234,
+ "learning_rate": 6.297810129569282e-07,
+ "loss": 0.056,
+ "step": 32657
+ },
+ {
+ "epoch": 88.98637602179836,
+ "grad_norm": 2.11629056930542,
+ "learning_rate": 6.294728200021261e-07,
+ "loss": 0.0226,
+ "step": 32658
+ },
+ {
+ "epoch": 88.9891008174387,
+ "grad_norm": 2.8374900817871094,
+ "learning_rate": 6.291647000246892e-07,
+ "loss": 0.0688,
+ "step": 32659
+ },
+ {
+ "epoch": 88.99182561307902,
+ "grad_norm": 2.699063539505005,
+ "learning_rate": 6.288566530270157e-07,
+ "loss": 0.1188,
+ "step": 32660
+ },
+ {
+ "epoch": 88.99455040871935,
+ "grad_norm": 2.0384888648986816,
+ "learning_rate": 6.285486790115047e-07,
+ "loss": 0.0287,
+ "step": 32661
+ },
+ {
+ "epoch": 88.99727520435967,
+ "grad_norm": 2.511185884475708,
+ "learning_rate": 6.282407779805544e-07,
+ "loss": 0.1725,
+ "step": 32662
+ },
+ {
+ "epoch": 89.0,
+ "grad_norm": 2.5621845722198486,
+ "learning_rate": 6.279329499365649e-07,
+ "loss": 0.0365,
+ "step": 32663
+ },
+ {
+ "epoch": 89.00272479564033,
+ "grad_norm": 2.2070326805114746,
+ "learning_rate": 6.276251948819312e-07,
+ "loss": 0.1821,
+ "step": 32664
+ },
+ {
+ "epoch": 89.00544959128065,
+ "grad_norm": 9.901810646057129,
+ "learning_rate": 6.273175128190512e-07,
+ "loss": 0.0916,
+ "step": 32665
+ },
+ {
+ "epoch": 89.00817438692098,
+ "grad_norm": 2.8300845623016357,
+ "learning_rate": 6.270099037503185e-07,
+ "loss": 0.0399,
+ "step": 32666
+ },
+ {
+ "epoch": 89.0108991825613,
+ "grad_norm": 1.4365792274475098,
+ "learning_rate": 6.267023676781314e-07,
+ "loss": 0.0178,
+ "step": 32667
+ },
+ {
+ "epoch": 89.01362397820164,
+ "grad_norm": 3.269904136657715,
+ "learning_rate": 6.263949046048868e-07,
+ "loss": 0.1554,
+ "step": 32668
+ },
+ {
+ "epoch": 89.01634877384195,
+ "grad_norm": 2.946486234664917,
+ "learning_rate": 6.260875145329759e-07,
+ "loss": 0.0316,
+ "step": 32669
+ },
+ {
+ "epoch": 89.01907356948229,
+ "grad_norm": 1.9456405639648438,
+ "learning_rate": 6.257801974647937e-07,
+ "loss": 0.0381,
+ "step": 32670
+ },
+ {
+ "epoch": 89.02179836512262,
+ "grad_norm": 4.5912957191467285,
+ "learning_rate": 6.254729534027337e-07,
+ "loss": 0.1149,
+ "step": 32671
+ },
+ {
+ "epoch": 89.02452316076294,
+ "grad_norm": 2.9190385341644287,
+ "learning_rate": 6.251657823491897e-07,
+ "loss": 0.0414,
+ "step": 32672
+ },
+ {
+ "epoch": 89.02724795640327,
+ "grad_norm": 1.9378341436386108,
+ "learning_rate": 6.248586843065518e-07,
+ "loss": 0.037,
+ "step": 32673
+ },
+ {
+ "epoch": 89.02997275204359,
+ "grad_norm": 2.1198220252990723,
+ "learning_rate": 6.245516592772116e-07,
+ "loss": 0.0262,
+ "step": 32674
+ },
+ {
+ "epoch": 89.03269754768392,
+ "grad_norm": 2.846665382385254,
+ "learning_rate": 6.242447072635626e-07,
+ "loss": 0.1463,
+ "step": 32675
+ },
+ {
+ "epoch": 89.03542234332426,
+ "grad_norm": 1.989553689956665,
+ "learning_rate": 6.239378282679953e-07,
+ "loss": 0.0202,
+ "step": 32676
+ },
+ {
+ "epoch": 89.03814713896458,
+ "grad_norm": 4.744172096252441,
+ "learning_rate": 6.236310222928977e-07,
+ "loss": 0.0194,
+ "step": 32677
+ },
+ {
+ "epoch": 89.04087193460491,
+ "grad_norm": 2.6994283199310303,
+ "learning_rate": 6.233242893406577e-07,
+ "loss": 0.0284,
+ "step": 32678
+ },
+ {
+ "epoch": 89.04359673024523,
+ "grad_norm": 2.5558924674987793,
+ "learning_rate": 6.23017629413668e-07,
+ "loss": 0.0686,
+ "step": 32679
+ },
+ {
+ "epoch": 89.04632152588556,
+ "grad_norm": 2.528228521347046,
+ "learning_rate": 6.227110425143157e-07,
+ "loss": 0.0458,
+ "step": 32680
+ },
+ {
+ "epoch": 89.04904632152588,
+ "grad_norm": 2.8393657207489014,
+ "learning_rate": 6.224045286449887e-07,
+ "loss": 0.0368,
+ "step": 32681
+ },
+ {
+ "epoch": 89.05177111716621,
+ "grad_norm": 2.4981143474578857,
+ "learning_rate": 6.220980878080707e-07,
+ "loss": 0.0534,
+ "step": 32682
+ },
+ {
+ "epoch": 89.05449591280654,
+ "grad_norm": 3.4097540378570557,
+ "learning_rate": 6.217917200059509e-07,
+ "loss": 0.0827,
+ "step": 32683
+ },
+ {
+ "epoch": 89.05722070844686,
+ "grad_norm": 2.685373306274414,
+ "learning_rate": 6.214854252410174e-07,
+ "loss": 0.029,
+ "step": 32684
+ },
+ {
+ "epoch": 89.0599455040872,
+ "grad_norm": 1.9985028505325317,
+ "learning_rate": 6.211792035156539e-07,
+ "loss": 0.0213,
+ "step": 32685
+ },
+ {
+ "epoch": 89.06267029972751,
+ "grad_norm": 2.6448488235473633,
+ "learning_rate": 6.208730548322439e-07,
+ "loss": 0.0171,
+ "step": 32686
+ },
+ {
+ "epoch": 89.06539509536785,
+ "grad_norm": 2.493192195892334,
+ "learning_rate": 6.205669791931723e-07,
+ "loss": 0.0428,
+ "step": 32687
+ },
+ {
+ "epoch": 89.06811989100818,
+ "grad_norm": 2.4542465209960938,
+ "learning_rate": 6.202609766008239e-07,
+ "loss": 0.0311,
+ "step": 32688
+ },
+ {
+ "epoch": 89.0708446866485,
+ "grad_norm": 2.34928822517395,
+ "learning_rate": 6.199550470575821e-07,
+ "loss": 0.0509,
+ "step": 32689
+ },
+ {
+ "epoch": 89.07356948228883,
+ "grad_norm": 5.120890140533447,
+ "learning_rate": 6.196491905658264e-07,
+ "loss": 0.0955,
+ "step": 32690
+ },
+ {
+ "epoch": 89.07629427792915,
+ "grad_norm": 2.2139899730682373,
+ "learning_rate": 6.193434071279414e-07,
+ "loss": 0.1122,
+ "step": 32691
+ },
+ {
+ "epoch": 89.07901907356948,
+ "grad_norm": 1.9536000490188599,
+ "learning_rate": 6.190376967463097e-07,
+ "loss": 0.0192,
+ "step": 32692
+ },
+ {
+ "epoch": 89.0817438692098,
+ "grad_norm": 1.561396837234497,
+ "learning_rate": 6.187320594233093e-07,
+ "loss": 0.0187,
+ "step": 32693
+ },
+ {
+ "epoch": 89.08446866485014,
+ "grad_norm": 2.2661666870117188,
+ "learning_rate": 6.184264951613206e-07,
+ "loss": 0.1571,
+ "step": 32694
+ },
+ {
+ "epoch": 89.08719346049047,
+ "grad_norm": 4.047026634216309,
+ "learning_rate": 6.181210039627261e-07,
+ "loss": 0.1483,
+ "step": 32695
+ },
+ {
+ "epoch": 89.08991825613079,
+ "grad_norm": 3.3938167095184326,
+ "learning_rate": 6.178155858299029e-07,
+ "loss": 0.0966,
+ "step": 32696
+ },
+ {
+ "epoch": 89.09264305177112,
+ "grad_norm": 2.6834189891815186,
+ "learning_rate": 6.1751024076523e-07,
+ "loss": 0.0762,
+ "step": 32697
+ },
+ {
+ "epoch": 89.09536784741144,
+ "grad_norm": 2.593212842941284,
+ "learning_rate": 6.172049687710846e-07,
+ "loss": 0.049,
+ "step": 32698
+ },
+ {
+ "epoch": 89.09809264305177,
+ "grad_norm": 2.224918842315674,
+ "learning_rate": 6.168997698498458e-07,
+ "loss": 0.063,
+ "step": 32699
+ },
+ {
+ "epoch": 89.1008174386921,
+ "grad_norm": 3.1200671195983887,
+ "learning_rate": 6.165946440038883e-07,
+ "loss": 0.0706,
+ "step": 32700
+ },
+ {
+ "epoch": 89.10354223433242,
+ "grad_norm": 2.4436869621276855,
+ "learning_rate": 6.162895912355904e-07,
+ "loss": 0.0462,
+ "step": 32701
+ },
+ {
+ "epoch": 89.10626702997276,
+ "grad_norm": 1.949854850769043,
+ "learning_rate": 6.159846115473278e-07,
+ "loss": 0.0257,
+ "step": 32702
+ },
+ {
+ "epoch": 89.10899182561307,
+ "grad_norm": 2.124957323074341,
+ "learning_rate": 6.156797049414742e-07,
+ "loss": 0.0265,
+ "step": 32703
+ },
+ {
+ "epoch": 89.11171662125341,
+ "grad_norm": 3.6889209747314453,
+ "learning_rate": 6.153748714204055e-07,
+ "loss": 0.1115,
+ "step": 32704
+ },
+ {
+ "epoch": 89.11444141689373,
+ "grad_norm": 2.025499105453491,
+ "learning_rate": 6.150701109864954e-07,
+ "loss": 0.0258,
+ "step": 32705
+ },
+ {
+ "epoch": 89.11716621253406,
+ "grad_norm": 2.7911789417266846,
+ "learning_rate": 6.147654236421174e-07,
+ "loss": 0.0648,
+ "step": 32706
+ },
+ {
+ "epoch": 89.11989100817439,
+ "grad_norm": 1.8968440294265747,
+ "learning_rate": 6.144608093896431e-07,
+ "loss": 0.0244,
+ "step": 32707
+ },
+ {
+ "epoch": 89.12261580381471,
+ "grad_norm": 2.548025131225586,
+ "learning_rate": 6.141562682314473e-07,
+ "loss": 0.0776,
+ "step": 32708
+ },
+ {
+ "epoch": 89.12534059945504,
+ "grad_norm": 1.5753182172775269,
+ "learning_rate": 6.138518001699001e-07,
+ "loss": 0.0197,
+ "step": 32709
+ },
+ {
+ "epoch": 89.12806539509536,
+ "grad_norm": 2.8098111152648926,
+ "learning_rate": 6.135474052073731e-07,
+ "loss": 0.0239,
+ "step": 32710
+ },
+ {
+ "epoch": 89.1307901907357,
+ "grad_norm": 2.4336137771606445,
+ "learning_rate": 6.132430833462344e-07,
+ "loss": 0.0474,
+ "step": 32711
+ },
+ {
+ "epoch": 89.13351498637603,
+ "grad_norm": 2.1622588634490967,
+ "learning_rate": 6.129388345888598e-07,
+ "loss": 0.0456,
+ "step": 32712
+ },
+ {
+ "epoch": 89.13623978201635,
+ "grad_norm": 2.102802038192749,
+ "learning_rate": 6.126346589376142e-07,
+ "loss": 0.0259,
+ "step": 32713
+ },
+ {
+ "epoch": 89.13896457765668,
+ "grad_norm": 2.271444082260132,
+ "learning_rate": 6.123305563948667e-07,
+ "loss": 0.0731,
+ "step": 32714
+ },
+ {
+ "epoch": 89.141689373297,
+ "grad_norm": 2.9211630821228027,
+ "learning_rate": 6.120265269629877e-07,
+ "loss": 0.1062,
+ "step": 32715
+ },
+ {
+ "epoch": 89.14441416893733,
+ "grad_norm": 2.3627302646636963,
+ "learning_rate": 6.117225706443441e-07,
+ "loss": 0.1202,
+ "step": 32716
+ },
+ {
+ "epoch": 89.14713896457765,
+ "grad_norm": 2.4656448364257812,
+ "learning_rate": 6.11418687441302e-07,
+ "loss": 0.0507,
+ "step": 32717
+ },
+ {
+ "epoch": 89.14986376021798,
+ "grad_norm": 2.1551454067230225,
+ "learning_rate": 6.111148773562303e-07,
+ "loss": 0.0582,
+ "step": 32718
+ },
+ {
+ "epoch": 89.15258855585832,
+ "grad_norm": 2.709928274154663,
+ "learning_rate": 6.108111403914919e-07,
+ "loss": 0.0601,
+ "step": 32719
+ },
+ {
+ "epoch": 89.15531335149863,
+ "grad_norm": 4.146137237548828,
+ "learning_rate": 6.105074765494556e-07,
+ "loss": 0.0416,
+ "step": 32720
+ },
+ {
+ "epoch": 89.15803814713897,
+ "grad_norm": 4.809267997741699,
+ "learning_rate": 6.102038858324855e-07,
+ "loss": 0.0658,
+ "step": 32721
+ },
+ {
+ "epoch": 89.16076294277929,
+ "grad_norm": 10.87790584564209,
+ "learning_rate": 6.09900368242945e-07,
+ "loss": 0.0338,
+ "step": 32722
+ },
+ {
+ "epoch": 89.16348773841962,
+ "grad_norm": 3.1182589530944824,
+ "learning_rate": 6.095969237831956e-07,
+ "loss": 0.0901,
+ "step": 32723
+ },
+ {
+ "epoch": 89.16621253405995,
+ "grad_norm": 3.3349595069885254,
+ "learning_rate": 6.092935524556065e-07,
+ "loss": 0.0775,
+ "step": 32724
+ },
+ {
+ "epoch": 89.16893732970027,
+ "grad_norm": 2.543630599975586,
+ "learning_rate": 6.089902542625359e-07,
+ "loss": 0.0615,
+ "step": 32725
+ },
+ {
+ "epoch": 89.1716621253406,
+ "grad_norm": 3.363832712173462,
+ "learning_rate": 6.086870292063473e-07,
+ "loss": 0.0519,
+ "step": 32726
+ },
+ {
+ "epoch": 89.17438692098092,
+ "grad_norm": 3.0619161128997803,
+ "learning_rate": 6.083838772894002e-07,
+ "loss": 0.0495,
+ "step": 32727
+ },
+ {
+ "epoch": 89.17711171662125,
+ "grad_norm": 2.945568323135376,
+ "learning_rate": 6.080807985140591e-07,
+ "loss": 0.0461,
+ "step": 32728
+ },
+ {
+ "epoch": 89.17983651226157,
+ "grad_norm": 1.8759384155273438,
+ "learning_rate": 6.077777928826811e-07,
+ "loss": 0.025,
+ "step": 32729
+ },
+ {
+ "epoch": 89.1825613079019,
+ "grad_norm": 2.955927610397339,
+ "learning_rate": 6.074748603976288e-07,
+ "loss": 0.0773,
+ "step": 32730
+ },
+ {
+ "epoch": 89.18528610354224,
+ "grad_norm": 2.0474166870117188,
+ "learning_rate": 6.07172001061258e-07,
+ "loss": 0.0966,
+ "step": 32731
+ },
+ {
+ "epoch": 89.18801089918256,
+ "grad_norm": 4.1849493980407715,
+ "learning_rate": 6.068692148759314e-07,
+ "loss": 0.0876,
+ "step": 32732
+ },
+ {
+ "epoch": 89.19073569482289,
+ "grad_norm": 1.793718695640564,
+ "learning_rate": 6.065665018440037e-07,
+ "loss": 0.0181,
+ "step": 32733
+ },
+ {
+ "epoch": 89.19346049046321,
+ "grad_norm": 2.2312920093536377,
+ "learning_rate": 6.062638619678352e-07,
+ "loss": 0.0449,
+ "step": 32734
+ },
+ {
+ "epoch": 89.19618528610354,
+ "grad_norm": 3.3801324367523193,
+ "learning_rate": 6.059612952497773e-07,
+ "loss": 0.0439,
+ "step": 32735
+ },
+ {
+ "epoch": 89.19891008174388,
+ "grad_norm": 3.0099101066589355,
+ "learning_rate": 6.056588016921949e-07,
+ "loss": 0.0379,
+ "step": 32736
+ },
+ {
+ "epoch": 89.2016348773842,
+ "grad_norm": 2.1082236766815186,
+ "learning_rate": 6.053563812974384e-07,
+ "loss": 0.0338,
+ "step": 32737
+ },
+ {
+ "epoch": 89.20435967302453,
+ "grad_norm": 2.8980274200439453,
+ "learning_rate": 6.050540340678635e-07,
+ "loss": 0.0331,
+ "step": 32738
+ },
+ {
+ "epoch": 89.20708446866485,
+ "grad_norm": 2.985513687133789,
+ "learning_rate": 6.04751760005825e-07,
+ "loss": 0.0504,
+ "step": 32739
+ },
+ {
+ "epoch": 89.20980926430518,
+ "grad_norm": 2.653040647506714,
+ "learning_rate": 6.044495591136778e-07,
+ "loss": 0.0242,
+ "step": 32740
+ },
+ {
+ "epoch": 89.2125340599455,
+ "grad_norm": 2.725943088531494,
+ "learning_rate": 6.041474313937756e-07,
+ "loss": 0.0619,
+ "step": 32741
+ },
+ {
+ "epoch": 89.21525885558583,
+ "grad_norm": 1.5715361833572388,
+ "learning_rate": 6.038453768484709e-07,
+ "loss": 0.0226,
+ "step": 32742
+ },
+ {
+ "epoch": 89.21798365122616,
+ "grad_norm": 1.7930307388305664,
+ "learning_rate": 6.035433954801151e-07,
+ "loss": 0.0795,
+ "step": 32743
+ },
+ {
+ "epoch": 89.22070844686648,
+ "grad_norm": 3.3262786865234375,
+ "learning_rate": 6.03241487291062e-07,
+ "loss": 0.0284,
+ "step": 32744
+ },
+ {
+ "epoch": 89.22343324250681,
+ "grad_norm": 2.5820655822753906,
+ "learning_rate": 6.029396522836617e-07,
+ "loss": 0.0195,
+ "step": 32745
+ },
+ {
+ "epoch": 89.22615803814713,
+ "grad_norm": 18.499683380126953,
+ "learning_rate": 6.026378904602648e-07,
+ "loss": 0.0504,
+ "step": 32746
+ },
+ {
+ "epoch": 89.22888283378747,
+ "grad_norm": 2.052060604095459,
+ "learning_rate": 6.023362018232193e-07,
+ "loss": 0.0534,
+ "step": 32747
+ },
+ {
+ "epoch": 89.2316076294278,
+ "grad_norm": 2.4382376670837402,
+ "learning_rate": 6.0203458637488e-07,
+ "loss": 0.0599,
+ "step": 32748
+ },
+ {
+ "epoch": 89.23433242506812,
+ "grad_norm": 1.8200987577438354,
+ "learning_rate": 6.017330441175917e-07,
+ "loss": 0.0282,
+ "step": 32749
+ },
+ {
+ "epoch": 89.23705722070845,
+ "grad_norm": 2.2123477458953857,
+ "learning_rate": 6.014315750537048e-07,
+ "loss": 0.0412,
+ "step": 32750
+ },
+ {
+ "epoch": 89.23978201634877,
+ "grad_norm": 2.306133270263672,
+ "learning_rate": 6.011301791855639e-07,
+ "loss": 0.1808,
+ "step": 32751
+ },
+ {
+ "epoch": 89.2425068119891,
+ "grad_norm": 3.1010894775390625,
+ "learning_rate": 6.008288565155196e-07,
+ "loss": 0.0461,
+ "step": 32752
+ },
+ {
+ "epoch": 89.24523160762942,
+ "grad_norm": 2.197079658508301,
+ "learning_rate": 6.005276070459187e-07,
+ "loss": 0.0397,
+ "step": 32753
+ },
+ {
+ "epoch": 89.24795640326975,
+ "grad_norm": 4.151401996612549,
+ "learning_rate": 6.002264307791061e-07,
+ "loss": 0.0743,
+ "step": 32754
+ },
+ {
+ "epoch": 89.25068119891009,
+ "grad_norm": 2.712472677230835,
+ "learning_rate": 5.999253277174255e-07,
+ "loss": 0.0796,
+ "step": 32755
+ },
+ {
+ "epoch": 89.2534059945504,
+ "grad_norm": 2.7949860095977783,
+ "learning_rate": 5.996242978632271e-07,
+ "loss": 0.041,
+ "step": 32756
+ },
+ {
+ "epoch": 89.25613079019074,
+ "grad_norm": 2.4863429069519043,
+ "learning_rate": 5.993233412188504e-07,
+ "loss": 0.0537,
+ "step": 32757
+ },
+ {
+ "epoch": 89.25885558583106,
+ "grad_norm": 2.821411609649658,
+ "learning_rate": 5.990224577866422e-07,
+ "loss": 0.0728,
+ "step": 32758
+ },
+ {
+ "epoch": 89.26158038147139,
+ "grad_norm": 2.6806938648223877,
+ "learning_rate": 5.987216475689428e-07,
+ "loss": 0.039,
+ "step": 32759
+ },
+ {
+ "epoch": 89.26430517711172,
+ "grad_norm": 2.995911121368408,
+ "learning_rate": 5.984209105680972e-07,
+ "loss": 0.0403,
+ "step": 32760
+ },
+ {
+ "epoch": 89.26702997275204,
+ "grad_norm": 2.1803905963897705,
+ "learning_rate": 5.981202467864478e-07,
+ "loss": 0.0241,
+ "step": 32761
+ },
+ {
+ "epoch": 89.26975476839237,
+ "grad_norm": 2.5929770469665527,
+ "learning_rate": 5.97819656226335e-07,
+ "loss": 0.0323,
+ "step": 32762
+ },
+ {
+ "epoch": 89.2724795640327,
+ "grad_norm": 2.173696756362915,
+ "learning_rate": 5.975191388900991e-07,
+ "loss": 0.0647,
+ "step": 32763
+ },
+ {
+ "epoch": 89.27520435967303,
+ "grad_norm": 2.4097962379455566,
+ "learning_rate": 5.972186947800829e-07,
+ "loss": 0.0335,
+ "step": 32764
+ },
+ {
+ "epoch": 89.27792915531334,
+ "grad_norm": 3.4600203037261963,
+ "learning_rate": 5.969183238986243e-07,
+ "loss": 0.1017,
+ "step": 32765
+ },
+ {
+ "epoch": 89.28065395095368,
+ "grad_norm": 2.4017767906188965,
+ "learning_rate": 5.966180262480636e-07,
+ "loss": 0.0634,
+ "step": 32766
+ },
+ {
+ "epoch": 89.28337874659401,
+ "grad_norm": 2.3255603313446045,
+ "learning_rate": 5.96317801830737e-07,
+ "loss": 0.0643,
+ "step": 32767
+ },
+ {
+ "epoch": 89.28610354223433,
+ "grad_norm": 2.5896341800689697,
+ "learning_rate": 5.960176506489868e-07,
+ "loss": 0.0682,
+ "step": 32768
+ },
+ {
+ "epoch": 89.28882833787466,
+ "grad_norm": 2.865616798400879,
+ "learning_rate": 5.957175727051467e-07,
+ "loss": 0.0579,
+ "step": 32769
+ },
+ {
+ "epoch": 89.29155313351498,
+ "grad_norm": 2.599228858947754,
+ "learning_rate": 5.954175680015572e-07,
+ "loss": 0.0493,
+ "step": 32770
+ },
+ {
+ "epoch": 89.29427792915531,
+ "grad_norm": 2.905381679534912,
+ "learning_rate": 5.951176365405531e-07,
+ "loss": 0.1078,
+ "step": 32771
+ },
+ {
+ "epoch": 89.29700272479565,
+ "grad_norm": 2.6210904121398926,
+ "learning_rate": 5.948177783244691e-07,
+ "loss": 0.0334,
+ "step": 32772
+ },
+ {
+ "epoch": 89.29972752043597,
+ "grad_norm": 2.3333895206451416,
+ "learning_rate": 5.945179933556422e-07,
+ "loss": 0.1201,
+ "step": 32773
+ },
+ {
+ "epoch": 89.3024523160763,
+ "grad_norm": 2.521071672439575,
+ "learning_rate": 5.942182816364061e-07,
+ "loss": 0.0431,
+ "step": 32774
+ },
+ {
+ "epoch": 89.30517711171662,
+ "grad_norm": 3.2333972454071045,
+ "learning_rate": 5.939186431690957e-07,
+ "loss": 0.0611,
+ "step": 32775
+ },
+ {
+ "epoch": 89.30790190735695,
+ "grad_norm": 1.64311683177948,
+ "learning_rate": 5.936190779560435e-07,
+ "loss": 0.081,
+ "step": 32776
+ },
+ {
+ "epoch": 89.31062670299727,
+ "grad_norm": 2.312652349472046,
+ "learning_rate": 5.933195859995833e-07,
+ "loss": 0.0696,
+ "step": 32777
+ },
+ {
+ "epoch": 89.3133514986376,
+ "grad_norm": 2.7373828887939453,
+ "learning_rate": 5.930201673020486e-07,
+ "loss": 0.1133,
+ "step": 32778
+ },
+ {
+ "epoch": 89.31607629427793,
+ "grad_norm": 2.6825835704803467,
+ "learning_rate": 5.927208218657676e-07,
+ "loss": 0.1092,
+ "step": 32779
+ },
+ {
+ "epoch": 89.31880108991825,
+ "grad_norm": 2.91965913772583,
+ "learning_rate": 5.924215496930763e-07,
+ "loss": 0.0297,
+ "step": 32780
+ },
+ {
+ "epoch": 89.32152588555859,
+ "grad_norm": 1.9278688430786133,
+ "learning_rate": 5.921223507863028e-07,
+ "loss": 0.0203,
+ "step": 32781
+ },
+ {
+ "epoch": 89.3242506811989,
+ "grad_norm": 2.232983350753784,
+ "learning_rate": 5.918232251477784e-07,
+ "loss": 0.1147,
+ "step": 32782
+ },
+ {
+ "epoch": 89.32697547683924,
+ "grad_norm": 2.1401584148406982,
+ "learning_rate": 5.915241727798293e-07,
+ "loss": 0.029,
+ "step": 32783
+ },
+ {
+ "epoch": 89.32970027247957,
+ "grad_norm": 3.384432792663574,
+ "learning_rate": 5.91225193684789e-07,
+ "loss": 0.033,
+ "step": 32784
+ },
+ {
+ "epoch": 89.33242506811989,
+ "grad_norm": 2.4877140522003174,
+ "learning_rate": 5.909262878649846e-07,
+ "loss": 0.0331,
+ "step": 32785
+ },
+ {
+ "epoch": 89.33514986376022,
+ "grad_norm": 2.889374256134033,
+ "learning_rate": 5.90627455322742e-07,
+ "loss": 0.0335,
+ "step": 32786
+ },
+ {
+ "epoch": 89.33787465940054,
+ "grad_norm": 2.776301860809326,
+ "learning_rate": 5.903286960603905e-07,
+ "loss": 0.0567,
+ "step": 32787
+ },
+ {
+ "epoch": 89.34059945504087,
+ "grad_norm": 2.3320226669311523,
+ "learning_rate": 5.900300100802558e-07,
+ "loss": 0.0274,
+ "step": 32788
+ },
+ {
+ "epoch": 89.34332425068119,
+ "grad_norm": 2.927804946899414,
+ "learning_rate": 5.897313973846652e-07,
+ "loss": 0.1109,
+ "step": 32789
+ },
+ {
+ "epoch": 89.34604904632153,
+ "grad_norm": 1.7589563131332397,
+ "learning_rate": 5.894328579759434e-07,
+ "loss": 0.0797,
+ "step": 32790
+ },
+ {
+ "epoch": 89.34877384196186,
+ "grad_norm": 3.696570873260498,
+ "learning_rate": 5.891343918564163e-07,
+ "loss": 0.1422,
+ "step": 32791
+ },
+ {
+ "epoch": 89.35149863760218,
+ "grad_norm": 1.8898727893829346,
+ "learning_rate": 5.888359990284065e-07,
+ "loss": 0.0294,
+ "step": 32792
+ },
+ {
+ "epoch": 89.35422343324251,
+ "grad_norm": 1.7833526134490967,
+ "learning_rate": 5.885376794942399e-07,
+ "loss": 0.0138,
+ "step": 32793
+ },
+ {
+ "epoch": 89.35694822888283,
+ "grad_norm": 2.947908639907837,
+ "learning_rate": 5.882394332562392e-07,
+ "loss": 0.035,
+ "step": 32794
+ },
+ {
+ "epoch": 89.35967302452316,
+ "grad_norm": 1.8422151803970337,
+ "learning_rate": 5.879412603167267e-07,
+ "loss": 0.0899,
+ "step": 32795
+ },
+ {
+ "epoch": 89.3623978201635,
+ "grad_norm": 2.5154712200164795,
+ "learning_rate": 5.87643160678023e-07,
+ "loss": 0.1249,
+ "step": 32796
+ },
+ {
+ "epoch": 89.36512261580381,
+ "grad_norm": 4.435185432434082,
+ "learning_rate": 5.87345134342453e-07,
+ "loss": 0.0288,
+ "step": 32797
+ },
+ {
+ "epoch": 89.36784741144415,
+ "grad_norm": 2.7728612422943115,
+ "learning_rate": 5.870471813123368e-07,
+ "loss": 0.1315,
+ "step": 32798
+ },
+ {
+ "epoch": 89.37057220708446,
+ "grad_norm": 3.42110538482666,
+ "learning_rate": 5.867493015899916e-07,
+ "loss": 0.0632,
+ "step": 32799
+ },
+ {
+ "epoch": 89.3732970027248,
+ "grad_norm": 3.111011266708374,
+ "learning_rate": 5.864514951777423e-07,
+ "loss": 0.0719,
+ "step": 32800
+ },
+ {
+ "epoch": 89.37602179836512,
+ "grad_norm": 1.8426586389541626,
+ "learning_rate": 5.861537620779056e-07,
+ "loss": 0.0244,
+ "step": 32801
+ },
+ {
+ "epoch": 89.37874659400545,
+ "grad_norm": 3.0814948081970215,
+ "learning_rate": 5.858561022928e-07,
+ "loss": 0.112,
+ "step": 32802
+ },
+ {
+ "epoch": 89.38147138964578,
+ "grad_norm": 2.558114528656006,
+ "learning_rate": 5.855585158247434e-07,
+ "loss": 0.0428,
+ "step": 32803
+ },
+ {
+ "epoch": 89.3841961852861,
+ "grad_norm": 2.08484148979187,
+ "learning_rate": 5.852610026760541e-07,
+ "loss": 0.027,
+ "step": 32804
+ },
+ {
+ "epoch": 89.38692098092643,
+ "grad_norm": 3.1211516857147217,
+ "learning_rate": 5.849635628490502e-07,
+ "loss": 0.117,
+ "step": 32805
+ },
+ {
+ "epoch": 89.38964577656675,
+ "grad_norm": 1.9015812873840332,
+ "learning_rate": 5.846661963460465e-07,
+ "loss": 0.1303,
+ "step": 32806
+ },
+ {
+ "epoch": 89.39237057220708,
+ "grad_norm": 1.7309904098510742,
+ "learning_rate": 5.8436890316936e-07,
+ "loss": 0.0252,
+ "step": 32807
+ },
+ {
+ "epoch": 89.39509536784742,
+ "grad_norm": 1.7384289503097534,
+ "learning_rate": 5.840716833213033e-07,
+ "loss": 0.0389,
+ "step": 32808
+ },
+ {
+ "epoch": 89.39782016348774,
+ "grad_norm": 2.4681620597839355,
+ "learning_rate": 5.837745368041958e-07,
+ "loss": 0.0398,
+ "step": 32809
+ },
+ {
+ "epoch": 89.40054495912807,
+ "grad_norm": 2.519777774810791,
+ "learning_rate": 5.834774636203488e-07,
+ "loss": 0.0523,
+ "step": 32810
+ },
+ {
+ "epoch": 89.40326975476839,
+ "grad_norm": 1.971938133239746,
+ "learning_rate": 5.831804637720762e-07,
+ "loss": 0.0243,
+ "step": 32811
+ },
+ {
+ "epoch": 89.40599455040872,
+ "grad_norm": 4.039462089538574,
+ "learning_rate": 5.828835372616892e-07,
+ "loss": 0.0792,
+ "step": 32812
+ },
+ {
+ "epoch": 89.40871934604904,
+ "grad_norm": 2.5203163623809814,
+ "learning_rate": 5.82586684091504e-07,
+ "loss": 0.1002,
+ "step": 32813
+ },
+ {
+ "epoch": 89.41144414168937,
+ "grad_norm": 1.8804906606674194,
+ "learning_rate": 5.822899042638297e-07,
+ "loss": 0.1174,
+ "step": 32814
+ },
+ {
+ "epoch": 89.4141689373297,
+ "grad_norm": 3.847694158554077,
+ "learning_rate": 5.8199319778098e-07,
+ "loss": 0.0779,
+ "step": 32815
+ },
+ {
+ "epoch": 89.41689373297002,
+ "grad_norm": 2.758211612701416,
+ "learning_rate": 5.816965646452622e-07,
+ "loss": 0.0592,
+ "step": 32816
+ },
+ {
+ "epoch": 89.41961852861036,
+ "grad_norm": 2.610078811645508,
+ "learning_rate": 5.814000048589896e-07,
+ "loss": 0.0995,
+ "step": 32817
+ },
+ {
+ "epoch": 89.42234332425068,
+ "grad_norm": 4.977338790893555,
+ "learning_rate": 5.811035184244706e-07,
+ "loss": 0.0934,
+ "step": 32818
+ },
+ {
+ "epoch": 89.42506811989101,
+ "grad_norm": 4.272146701812744,
+ "learning_rate": 5.808071053440145e-07,
+ "loss": 0.0891,
+ "step": 32819
+ },
+ {
+ "epoch": 89.42779291553134,
+ "grad_norm": 1.384609341621399,
+ "learning_rate": 5.805107656199272e-07,
+ "loss": 0.0177,
+ "step": 32820
+ },
+ {
+ "epoch": 89.43051771117166,
+ "grad_norm": 2.0737600326538086,
+ "learning_rate": 5.8021449925452e-07,
+ "loss": 0.016,
+ "step": 32821
+ },
+ {
+ "epoch": 89.433242506812,
+ "grad_norm": 3.2330639362335205,
+ "learning_rate": 5.799183062501001e-07,
+ "loss": 0.069,
+ "step": 32822
+ },
+ {
+ "epoch": 89.43596730245231,
+ "grad_norm": 2.6659324169158936,
+ "learning_rate": 5.796221866089735e-07,
+ "loss": 0.0446,
+ "step": 32823
+ },
+ {
+ "epoch": 89.43869209809264,
+ "grad_norm": 3.4410345554351807,
+ "learning_rate": 5.79326140333445e-07,
+ "loss": 0.0375,
+ "step": 32824
+ },
+ {
+ "epoch": 89.44141689373296,
+ "grad_norm": 3.1975862979888916,
+ "learning_rate": 5.790301674258214e-07,
+ "loss": 0.0577,
+ "step": 32825
+ },
+ {
+ "epoch": 89.4441416893733,
+ "grad_norm": 2.658019781112671,
+ "learning_rate": 5.787342678884089e-07,
+ "loss": 0.1726,
+ "step": 32826
+ },
+ {
+ "epoch": 89.44686648501363,
+ "grad_norm": 1.9277862310409546,
+ "learning_rate": 5.784384417235101e-07,
+ "loss": 0.0254,
+ "step": 32827
+ },
+ {
+ "epoch": 89.44959128065395,
+ "grad_norm": 3.593170166015625,
+ "learning_rate": 5.781426889334285e-07,
+ "loss": 0.0748,
+ "step": 32828
+ },
+ {
+ "epoch": 89.45231607629428,
+ "grad_norm": 2.957268714904785,
+ "learning_rate": 5.778470095204691e-07,
+ "loss": 0.0733,
+ "step": 32829
+ },
+ {
+ "epoch": 89.4550408719346,
+ "grad_norm": 3.954479217529297,
+ "learning_rate": 5.775514034869345e-07,
+ "loss": 0.0798,
+ "step": 32830
+ },
+ {
+ "epoch": 89.45776566757493,
+ "grad_norm": 2.9770193099975586,
+ "learning_rate": 5.772558708351262e-07,
+ "loss": 0.0762,
+ "step": 32831
+ },
+ {
+ "epoch": 89.46049046321527,
+ "grad_norm": 2.866166591644287,
+ "learning_rate": 5.769604115673444e-07,
+ "loss": 0.0399,
+ "step": 32832
+ },
+ {
+ "epoch": 89.46321525885558,
+ "grad_norm": 2.224769353866577,
+ "learning_rate": 5.76665025685893e-07,
+ "loss": 0.0307,
+ "step": 32833
+ },
+ {
+ "epoch": 89.46594005449592,
+ "grad_norm": 2.5665481090545654,
+ "learning_rate": 5.763697131930712e-07,
+ "loss": 0.0352,
+ "step": 32834
+ },
+ {
+ "epoch": 89.46866485013624,
+ "grad_norm": 1.5102972984313965,
+ "learning_rate": 5.760744740911794e-07,
+ "loss": 0.0183,
+ "step": 32835
+ },
+ {
+ "epoch": 89.47138964577657,
+ "grad_norm": 2.10481595993042,
+ "learning_rate": 5.757793083825147e-07,
+ "loss": 0.0552,
+ "step": 32836
+ },
+ {
+ "epoch": 89.47411444141689,
+ "grad_norm": 4.771435260772705,
+ "learning_rate": 5.754842160693785e-07,
+ "loss": 0.0833,
+ "step": 32837
+ },
+ {
+ "epoch": 89.47683923705722,
+ "grad_norm": 2.789193868637085,
+ "learning_rate": 5.751891971540658e-07,
+ "loss": 0.0639,
+ "step": 32838
+ },
+ {
+ "epoch": 89.47956403269755,
+ "grad_norm": 2.961798906326294,
+ "learning_rate": 5.748942516388789e-07,
+ "loss": 0.1006,
+ "step": 32839
+ },
+ {
+ "epoch": 89.48228882833787,
+ "grad_norm": 3.6757514476776123,
+ "learning_rate": 5.745993795261096e-07,
+ "loss": 0.0284,
+ "step": 32840
+ },
+ {
+ "epoch": 89.4850136239782,
+ "grad_norm": 2.3897275924682617,
+ "learning_rate": 5.743045808180592e-07,
+ "loss": 0.0339,
+ "step": 32841
+ },
+ {
+ "epoch": 89.48773841961852,
+ "grad_norm": 2.893338918685913,
+ "learning_rate": 5.740098555170215e-07,
+ "loss": 0.1059,
+ "step": 32842
+ },
+ {
+ "epoch": 89.49046321525886,
+ "grad_norm": 2.3885364532470703,
+ "learning_rate": 5.737152036252914e-07,
+ "loss": 0.1679,
+ "step": 32843
+ },
+ {
+ "epoch": 89.49318801089919,
+ "grad_norm": 2.1282293796539307,
+ "learning_rate": 5.734206251451624e-07,
+ "loss": 0.0418,
+ "step": 32844
+ },
+ {
+ "epoch": 89.49591280653951,
+ "grad_norm": 2.4373741149902344,
+ "learning_rate": 5.731261200789318e-07,
+ "loss": 0.0537,
+ "step": 32845
+ },
+ {
+ "epoch": 89.49863760217984,
+ "grad_norm": 3.325336217880249,
+ "learning_rate": 5.728316884288909e-07,
+ "loss": 0.0233,
+ "step": 32846
+ },
+ {
+ "epoch": 89.50136239782016,
+ "grad_norm": 2.2183892726898193,
+ "learning_rate": 5.725373301973336e-07,
+ "loss": 0.0456,
+ "step": 32847
+ },
+ {
+ "epoch": 89.50408719346049,
+ "grad_norm": 1.9245525598526,
+ "learning_rate": 5.722430453865513e-07,
+ "loss": 0.0171,
+ "step": 32848
+ },
+ {
+ "epoch": 89.50681198910081,
+ "grad_norm": 1.6682052612304688,
+ "learning_rate": 5.719488339988378e-07,
+ "loss": 0.0232,
+ "step": 32849
+ },
+ {
+ "epoch": 89.50953678474114,
+ "grad_norm": 2.2161269187927246,
+ "learning_rate": 5.716546960364844e-07,
+ "loss": 0.0538,
+ "step": 32850
+ },
+ {
+ "epoch": 89.51226158038148,
+ "grad_norm": 14.691620826721191,
+ "learning_rate": 5.713606315017794e-07,
+ "loss": 0.0448,
+ "step": 32851
+ },
+ {
+ "epoch": 89.5149863760218,
+ "grad_norm": 2.354126453399658,
+ "learning_rate": 5.710666403970133e-07,
+ "loss": 0.0698,
+ "step": 32852
+ },
+ {
+ "epoch": 89.51771117166213,
+ "grad_norm": 3.4341745376586914,
+ "learning_rate": 5.707727227244786e-07,
+ "loss": 0.0202,
+ "step": 32853
+ },
+ {
+ "epoch": 89.52043596730245,
+ "grad_norm": 2.4215874671936035,
+ "learning_rate": 5.704788784864612e-07,
+ "loss": 0.1346,
+ "step": 32854
+ },
+ {
+ "epoch": 89.52316076294278,
+ "grad_norm": 2.959627628326416,
+ "learning_rate": 5.701851076852504e-07,
+ "loss": 0.1062,
+ "step": 32855
+ },
+ {
+ "epoch": 89.52588555858311,
+ "grad_norm": 1.748242735862732,
+ "learning_rate": 5.698914103231357e-07,
+ "loss": 0.0253,
+ "step": 32856
+ },
+ {
+ "epoch": 89.52861035422343,
+ "grad_norm": 3.1157803535461426,
+ "learning_rate": 5.695977864024016e-07,
+ "loss": 0.226,
+ "step": 32857
+ },
+ {
+ "epoch": 89.53133514986376,
+ "grad_norm": 3.9220938682556152,
+ "learning_rate": 5.693042359253387e-07,
+ "loss": 0.0638,
+ "step": 32858
+ },
+ {
+ "epoch": 89.53405994550408,
+ "grad_norm": 3.532024621963501,
+ "learning_rate": 5.690107588942306e-07,
+ "loss": 0.1261,
+ "step": 32859
+ },
+ {
+ "epoch": 89.53678474114442,
+ "grad_norm": 2.2799363136291504,
+ "learning_rate": 5.687173553113623e-07,
+ "loss": 0.0352,
+ "step": 32860
+ },
+ {
+ "epoch": 89.53950953678473,
+ "grad_norm": 2.646981954574585,
+ "learning_rate": 5.684240251790186e-07,
+ "loss": 0.0389,
+ "step": 32861
+ },
+ {
+ "epoch": 89.54223433242507,
+ "grad_norm": 2.868276357650757,
+ "learning_rate": 5.681307684994874e-07,
+ "loss": 0.0541,
+ "step": 32862
+ },
+ {
+ "epoch": 89.5449591280654,
+ "grad_norm": 3.010094165802002,
+ "learning_rate": 5.678375852750496e-07,
+ "loss": 0.1429,
+ "step": 32863
+ },
+ {
+ "epoch": 89.54768392370572,
+ "grad_norm": 2.4626591205596924,
+ "learning_rate": 5.675444755079873e-07,
+ "loss": 0.0528,
+ "step": 32864
+ },
+ {
+ "epoch": 89.55040871934605,
+ "grad_norm": 5.357175350189209,
+ "learning_rate": 5.672514392005868e-07,
+ "loss": 0.2043,
+ "step": 32865
+ },
+ {
+ "epoch": 89.55313351498637,
+ "grad_norm": 2.567004919052124,
+ "learning_rate": 5.669584763551284e-07,
+ "loss": 0.0909,
+ "step": 32866
+ },
+ {
+ "epoch": 89.5558583106267,
+ "grad_norm": 5.483394622802734,
+ "learning_rate": 5.666655869738935e-07,
+ "loss": 0.0738,
+ "step": 32867
+ },
+ {
+ "epoch": 89.55858310626704,
+ "grad_norm": 2.470198154449463,
+ "learning_rate": 5.663727710591627e-07,
+ "loss": 0.0701,
+ "step": 32868
+ },
+ {
+ "epoch": 89.56130790190736,
+ "grad_norm": 3.3590195178985596,
+ "learning_rate": 5.660800286132173e-07,
+ "loss": 0.2203,
+ "step": 32869
+ },
+ {
+ "epoch": 89.56403269754769,
+ "grad_norm": 2.435865640640259,
+ "learning_rate": 5.657873596383378e-07,
+ "loss": 0.1519,
+ "step": 32870
+ },
+ {
+ "epoch": 89.566757493188,
+ "grad_norm": 2.570725202560425,
+ "learning_rate": 5.654947641368036e-07,
+ "loss": 0.0366,
+ "step": 32871
+ },
+ {
+ "epoch": 89.56948228882834,
+ "grad_norm": 1.5694717168807983,
+ "learning_rate": 5.652022421108894e-07,
+ "loss": 0.024,
+ "step": 32872
+ },
+ {
+ "epoch": 89.57220708446866,
+ "grad_norm": 2.274602174758911,
+ "learning_rate": 5.649097935628778e-07,
+ "loss": 0.0638,
+ "step": 32873
+ },
+ {
+ "epoch": 89.57493188010899,
+ "grad_norm": 2.2057981491088867,
+ "learning_rate": 5.646174184950459e-07,
+ "loss": 0.0829,
+ "step": 32874
+ },
+ {
+ "epoch": 89.57765667574932,
+ "grad_norm": 3.423875570297241,
+ "learning_rate": 5.643251169096698e-07,
+ "loss": 0.1163,
+ "step": 32875
+ },
+ {
+ "epoch": 89.58038147138964,
+ "grad_norm": 1.4155492782592773,
+ "learning_rate": 5.640328888090263e-07,
+ "loss": 0.0162,
+ "step": 32876
+ },
+ {
+ "epoch": 89.58310626702998,
+ "grad_norm": 2.519733190536499,
+ "learning_rate": 5.637407341953893e-07,
+ "loss": 0.0652,
+ "step": 32877
+ },
+ {
+ "epoch": 89.5858310626703,
+ "grad_norm": 2.3193299770355225,
+ "learning_rate": 5.634486530710382e-07,
+ "loss": 0.0406,
+ "step": 32878
+ },
+ {
+ "epoch": 89.58855585831063,
+ "grad_norm": 3.3823933601379395,
+ "learning_rate": 5.631566454382442e-07,
+ "loss": 0.022,
+ "step": 32879
+ },
+ {
+ "epoch": 89.59128065395096,
+ "grad_norm": 2.3177411556243896,
+ "learning_rate": 5.628647112992824e-07,
+ "loss": 0.0357,
+ "step": 32880
+ },
+ {
+ "epoch": 89.59400544959128,
+ "grad_norm": 2.8449323177337646,
+ "learning_rate": 5.625728506564254e-07,
+ "loss": 0.0537,
+ "step": 32881
+ },
+ {
+ "epoch": 89.59673024523161,
+ "grad_norm": 3.5362963676452637,
+ "learning_rate": 5.622810635119491e-07,
+ "loss": 0.1477,
+ "step": 32882
+ },
+ {
+ "epoch": 89.59945504087193,
+ "grad_norm": 3.34096622467041,
+ "learning_rate": 5.61989349868124e-07,
+ "loss": 0.0932,
+ "step": 32883
+ },
+ {
+ "epoch": 89.60217983651226,
+ "grad_norm": 2.2542879581451416,
+ "learning_rate": 5.616977097272214e-07,
+ "loss": 0.0302,
+ "step": 32884
+ },
+ {
+ "epoch": 89.60490463215258,
+ "grad_norm": 2.017786741256714,
+ "learning_rate": 5.614061430915118e-07,
+ "loss": 0.0296,
+ "step": 32885
+ },
+ {
+ "epoch": 89.60762942779292,
+ "grad_norm": 2.867518186569214,
+ "learning_rate": 5.611146499632692e-07,
+ "loss": 0.0371,
+ "step": 32886
+ },
+ {
+ "epoch": 89.61035422343325,
+ "grad_norm": 2.4117448329925537,
+ "learning_rate": 5.608232303447625e-07,
+ "loss": 0.051,
+ "step": 32887
+ },
+ {
+ "epoch": 89.61307901907357,
+ "grad_norm": 4.533914566040039,
+ "learning_rate": 5.605318842382589e-07,
+ "loss": 0.0869,
+ "step": 32888
+ },
+ {
+ "epoch": 89.6158038147139,
+ "grad_norm": 2.6035053730010986,
+ "learning_rate": 5.60240611646029e-07,
+ "loss": 0.0285,
+ "step": 32889
+ },
+ {
+ "epoch": 89.61852861035422,
+ "grad_norm": 1.7373334169387817,
+ "learning_rate": 5.599494125703431e-07,
+ "loss": 0.0671,
+ "step": 32890
+ },
+ {
+ "epoch": 89.62125340599455,
+ "grad_norm": 4.364772796630859,
+ "learning_rate": 5.59658287013467e-07,
+ "loss": 0.0485,
+ "step": 32891
+ },
+ {
+ "epoch": 89.62397820163488,
+ "grad_norm": 3.0294835567474365,
+ "learning_rate": 5.59367234977668e-07,
+ "loss": 0.0429,
+ "step": 32892
+ },
+ {
+ "epoch": 89.6267029972752,
+ "grad_norm": 2.105394124984741,
+ "learning_rate": 5.590762564652119e-07,
+ "loss": 0.1594,
+ "step": 32893
+ },
+ {
+ "epoch": 89.62942779291554,
+ "grad_norm": 2.268779754638672,
+ "learning_rate": 5.587853514783681e-07,
+ "loss": 0.0267,
+ "step": 32894
+ },
+ {
+ "epoch": 89.63215258855585,
+ "grad_norm": 1.684410572052002,
+ "learning_rate": 5.584945200193992e-07,
+ "loss": 0.0327,
+ "step": 32895
+ },
+ {
+ "epoch": 89.63487738419619,
+ "grad_norm": 2.1431210041046143,
+ "learning_rate": 5.582037620905723e-07,
+ "loss": 0.025,
+ "step": 32896
+ },
+ {
+ "epoch": 89.6376021798365,
+ "grad_norm": 3.0194146633148193,
+ "learning_rate": 5.579130776941488e-07,
+ "loss": 0.0322,
+ "step": 32897
+ },
+ {
+ "epoch": 89.64032697547684,
+ "grad_norm": 1.8627034425735474,
+ "learning_rate": 5.576224668323949e-07,
+ "loss": 0.0215,
+ "step": 32898
+ },
+ {
+ "epoch": 89.64305177111717,
+ "grad_norm": 1.5820367336273193,
+ "learning_rate": 5.57331929507574e-07,
+ "loss": 0.0902,
+ "step": 32899
+ },
+ {
+ "epoch": 89.64577656675749,
+ "grad_norm": 5.083982467651367,
+ "learning_rate": 5.570414657219481e-07,
+ "loss": 0.021,
+ "step": 32900
+ },
+ {
+ "epoch": 89.64850136239782,
+ "grad_norm": 1.6487438678741455,
+ "learning_rate": 5.567510754777782e-07,
+ "loss": 0.0175,
+ "step": 32901
+ },
+ {
+ "epoch": 89.65122615803814,
+ "grad_norm": 2.657700538635254,
+ "learning_rate": 5.564607587773274e-07,
+ "loss": 0.0336,
+ "step": 32902
+ },
+ {
+ "epoch": 89.65395095367847,
+ "grad_norm": 2.9634604454040527,
+ "learning_rate": 5.561705156228569e-07,
+ "loss": 0.0368,
+ "step": 32903
+ },
+ {
+ "epoch": 89.65667574931881,
+ "grad_norm": 1.4109307527542114,
+ "learning_rate": 5.558803460166274e-07,
+ "loss": 0.0159,
+ "step": 32904
+ },
+ {
+ "epoch": 89.65940054495913,
+ "grad_norm": 3.901301383972168,
+ "learning_rate": 5.555902499608956e-07,
+ "loss": 0.0363,
+ "step": 32905
+ },
+ {
+ "epoch": 89.66212534059946,
+ "grad_norm": 2.360651731491089,
+ "learning_rate": 5.553002274579244e-07,
+ "loss": 0.0452,
+ "step": 32906
+ },
+ {
+ "epoch": 89.66485013623978,
+ "grad_norm": 3.332643508911133,
+ "learning_rate": 5.550102785099687e-07,
+ "loss": 0.0926,
+ "step": 32907
+ },
+ {
+ "epoch": 89.66757493188011,
+ "grad_norm": 3.7273032665252686,
+ "learning_rate": 5.547204031192921e-07,
+ "loss": 0.1203,
+ "step": 32908
+ },
+ {
+ "epoch": 89.67029972752043,
+ "grad_norm": 2.0486652851104736,
+ "learning_rate": 5.544306012881462e-07,
+ "loss": 0.2535,
+ "step": 32909
+ },
+ {
+ "epoch": 89.67302452316076,
+ "grad_norm": 3.2788918018341064,
+ "learning_rate": 5.541408730187925e-07,
+ "loss": 0.0579,
+ "step": 32910
+ },
+ {
+ "epoch": 89.6757493188011,
+ "grad_norm": 2.957430601119995,
+ "learning_rate": 5.538512183134859e-07,
+ "loss": 0.1201,
+ "step": 32911
+ },
+ {
+ "epoch": 89.67847411444141,
+ "grad_norm": 5.769819259643555,
+ "learning_rate": 5.535616371744823e-07,
+ "loss": 0.0732,
+ "step": 32912
+ },
+ {
+ "epoch": 89.68119891008175,
+ "grad_norm": 2.5564122200012207,
+ "learning_rate": 5.532721296040344e-07,
+ "loss": 0.0898,
+ "step": 32913
+ },
+ {
+ "epoch": 89.68392370572207,
+ "grad_norm": 2.6478564739227295,
+ "learning_rate": 5.529826956044016e-07,
+ "loss": 0.0967,
+ "step": 32914
+ },
+ {
+ "epoch": 89.6866485013624,
+ "grad_norm": 2.3558647632598877,
+ "learning_rate": 5.526933351778352e-07,
+ "loss": 0.0333,
+ "step": 32915
+ },
+ {
+ "epoch": 89.68937329700273,
+ "grad_norm": 2.0492758750915527,
+ "learning_rate": 5.52404048326588e-07,
+ "loss": 0.0197,
+ "step": 32916
+ },
+ {
+ "epoch": 89.69209809264305,
+ "grad_norm": 1.885439157485962,
+ "learning_rate": 5.521148350529137e-07,
+ "loss": 0.0267,
+ "step": 32917
+ },
+ {
+ "epoch": 89.69482288828338,
+ "grad_norm": 2.625890016555786,
+ "learning_rate": 5.518256953590661e-07,
+ "loss": 0.083,
+ "step": 32918
+ },
+ {
+ "epoch": 89.6975476839237,
+ "grad_norm": 2.996981382369995,
+ "learning_rate": 5.515366292472956e-07,
+ "loss": 0.1002,
+ "step": 32919
+ },
+ {
+ "epoch": 89.70027247956403,
+ "grad_norm": 2.68178653717041,
+ "learning_rate": 5.512476367198538e-07,
+ "loss": 0.0501,
+ "step": 32920
+ },
+ {
+ "epoch": 89.70299727520435,
+ "grad_norm": 2.323176860809326,
+ "learning_rate": 5.509587177789911e-07,
+ "loss": 0.0574,
+ "step": 32921
+ },
+ {
+ "epoch": 89.70572207084469,
+ "grad_norm": 2.613534927368164,
+ "learning_rate": 5.506698724269577e-07,
+ "loss": 0.0295,
+ "step": 32922
+ },
+ {
+ "epoch": 89.70844686648502,
+ "grad_norm": 2.291454315185547,
+ "learning_rate": 5.503811006660032e-07,
+ "loss": 0.1754,
+ "step": 32923
+ },
+ {
+ "epoch": 89.71117166212534,
+ "grad_norm": 2.5666966438293457,
+ "learning_rate": 5.500924024983756e-07,
+ "loss": 0.0284,
+ "step": 32924
+ },
+ {
+ "epoch": 89.71389645776567,
+ "grad_norm": 2.7875821590423584,
+ "learning_rate": 5.498037779263265e-07,
+ "loss": 0.1326,
+ "step": 32925
+ },
+ {
+ "epoch": 89.71662125340599,
+ "grad_norm": 2.7814249992370605,
+ "learning_rate": 5.495152269520987e-07,
+ "loss": 0.097,
+ "step": 32926
+ },
+ {
+ "epoch": 89.71934604904632,
+ "grad_norm": 4.380067348480225,
+ "learning_rate": 5.492267495779447e-07,
+ "loss": 0.0491,
+ "step": 32927
+ },
+ {
+ "epoch": 89.72207084468666,
+ "grad_norm": 2.6277806758880615,
+ "learning_rate": 5.489383458061071e-07,
+ "loss": 0.0769,
+ "step": 32928
+ },
+ {
+ "epoch": 89.72479564032697,
+ "grad_norm": 3.794962167739868,
+ "learning_rate": 5.48650015638833e-07,
+ "loss": 0.0611,
+ "step": 32929
+ },
+ {
+ "epoch": 89.7275204359673,
+ "grad_norm": 2.078131914138794,
+ "learning_rate": 5.483617590783696e-07,
+ "loss": 0.1018,
+ "step": 32930
+ },
+ {
+ "epoch": 89.73024523160763,
+ "grad_norm": 2.3437399864196777,
+ "learning_rate": 5.480735761269607e-07,
+ "loss": 0.0845,
+ "step": 32931
+ },
+ {
+ "epoch": 89.73297002724796,
+ "grad_norm": 3.3094420433044434,
+ "learning_rate": 5.477854667868509e-07,
+ "loss": 0.1088,
+ "step": 32932
+ },
+ {
+ "epoch": 89.73569482288828,
+ "grad_norm": 5.927574634552002,
+ "learning_rate": 5.474974310602821e-07,
+ "loss": 0.0262,
+ "step": 32933
+ },
+ {
+ "epoch": 89.73841961852861,
+ "grad_norm": 2.4199492931365967,
+ "learning_rate": 5.472094689495e-07,
+ "loss": 0.039,
+ "step": 32934
+ },
+ {
+ "epoch": 89.74114441416894,
+ "grad_norm": 2.1367902755737305,
+ "learning_rate": 5.469215804567474e-07,
+ "loss": 0.033,
+ "step": 32935
+ },
+ {
+ "epoch": 89.74386920980926,
+ "grad_norm": 2.1038002967834473,
+ "learning_rate": 5.466337655842647e-07,
+ "loss": 0.0301,
+ "step": 32936
+ },
+ {
+ "epoch": 89.7465940054496,
+ "grad_norm": 1.8601211309432983,
+ "learning_rate": 5.463460243342922e-07,
+ "loss": 0.0213,
+ "step": 32937
+ },
+ {
+ "epoch": 89.74931880108991,
+ "grad_norm": 2.783090114593506,
+ "learning_rate": 5.460583567090738e-07,
+ "loss": 0.0622,
+ "step": 32938
+ },
+ {
+ "epoch": 89.75204359673025,
+ "grad_norm": 2.488863229751587,
+ "learning_rate": 5.457707627108489e-07,
+ "loss": 0.0536,
+ "step": 32939
+ },
+ {
+ "epoch": 89.75476839237058,
+ "grad_norm": 2.3114936351776123,
+ "learning_rate": 5.454832423418577e-07,
+ "loss": 0.1343,
+ "step": 32940
+ },
+ {
+ "epoch": 89.7574931880109,
+ "grad_norm": 2.3771212100982666,
+ "learning_rate": 5.451957956043363e-07,
+ "loss": 0.0267,
+ "step": 32941
+ },
+ {
+ "epoch": 89.76021798365123,
+ "grad_norm": 2.1391761302948,
+ "learning_rate": 5.449084225005263e-07,
+ "loss": 0.026,
+ "step": 32942
+ },
+ {
+ "epoch": 89.76294277929155,
+ "grad_norm": 3.2617347240448,
+ "learning_rate": 5.44621123032667e-07,
+ "loss": 0.2307,
+ "step": 32943
+ },
+ {
+ "epoch": 89.76566757493188,
+ "grad_norm": 1.751294493675232,
+ "learning_rate": 5.443338972029932e-07,
+ "loss": 0.0131,
+ "step": 32944
+ },
+ {
+ "epoch": 89.7683923705722,
+ "grad_norm": 3.4908711910247803,
+ "learning_rate": 5.440467450137432e-07,
+ "loss": 0.1128,
+ "step": 32945
+ },
+ {
+ "epoch": 89.77111716621253,
+ "grad_norm": 2.7195677757263184,
+ "learning_rate": 5.437596664671518e-07,
+ "loss": 0.0578,
+ "step": 32946
+ },
+ {
+ "epoch": 89.77384196185287,
+ "grad_norm": 3.3138933181762695,
+ "learning_rate": 5.434726615654562e-07,
+ "loss": 0.1062,
+ "step": 32947
+ },
+ {
+ "epoch": 89.77656675749319,
+ "grad_norm": 2.702662467956543,
+ "learning_rate": 5.431857303108923e-07,
+ "loss": 0.0457,
+ "step": 32948
+ },
+ {
+ "epoch": 89.77929155313352,
+ "grad_norm": 2.3171818256378174,
+ "learning_rate": 5.428988727056928e-07,
+ "loss": 0.081,
+ "step": 32949
+ },
+ {
+ "epoch": 89.78201634877384,
+ "grad_norm": 4.419804573059082,
+ "learning_rate": 5.426120887520914e-07,
+ "loss": 0.1153,
+ "step": 32950
+ },
+ {
+ "epoch": 89.78474114441417,
+ "grad_norm": 2.3891665935516357,
+ "learning_rate": 5.423253784523241e-07,
+ "loss": 0.0311,
+ "step": 32951
+ },
+ {
+ "epoch": 89.7874659400545,
+ "grad_norm": 2.4410691261291504,
+ "learning_rate": 5.420387418086215e-07,
+ "loss": 0.0289,
+ "step": 32952
+ },
+ {
+ "epoch": 89.79019073569482,
+ "grad_norm": 2.494887351989746,
+ "learning_rate": 5.417521788232161e-07,
+ "loss": 0.0427,
+ "step": 32953
+ },
+ {
+ "epoch": 89.79291553133515,
+ "grad_norm": 2.5476417541503906,
+ "learning_rate": 5.414656894983416e-07,
+ "loss": 0.0401,
+ "step": 32954
+ },
+ {
+ "epoch": 89.79564032697547,
+ "grad_norm": 3.26421856880188,
+ "learning_rate": 5.411792738362275e-07,
+ "loss": 0.1295,
+ "step": 32955
+ },
+ {
+ "epoch": 89.7983651226158,
+ "grad_norm": 2.7946064472198486,
+ "learning_rate": 5.408929318391054e-07,
+ "loss": 0.0589,
+ "step": 32956
+ },
+ {
+ "epoch": 89.80108991825612,
+ "grad_norm": 1.8081120252609253,
+ "learning_rate": 5.406066635092034e-07,
+ "loss": 0.0244,
+ "step": 32957
+ },
+ {
+ "epoch": 89.80381471389646,
+ "grad_norm": 1.8078542947769165,
+ "learning_rate": 5.403204688487517e-07,
+ "loss": 0.0253,
+ "step": 32958
+ },
+ {
+ "epoch": 89.80653950953679,
+ "grad_norm": 1.895068883895874,
+ "learning_rate": 5.400343478599812e-07,
+ "loss": 0.0264,
+ "step": 32959
+ },
+ {
+ "epoch": 89.80926430517711,
+ "grad_norm": 2.275346040725708,
+ "learning_rate": 5.397483005451199e-07,
+ "loss": 0.0461,
+ "step": 32960
+ },
+ {
+ "epoch": 89.81198910081744,
+ "grad_norm": 4.531795024871826,
+ "learning_rate": 5.394623269063926e-07,
+ "loss": 0.0252,
+ "step": 32961
+ },
+ {
+ "epoch": 89.81471389645776,
+ "grad_norm": 3.631432294845581,
+ "learning_rate": 5.391764269460276e-07,
+ "loss": 0.1023,
+ "step": 32962
+ },
+ {
+ "epoch": 89.8174386920981,
+ "grad_norm": 3.0109949111938477,
+ "learning_rate": 5.388906006662542e-07,
+ "loss": 0.0214,
+ "step": 32963
+ },
+ {
+ "epoch": 89.82016348773843,
+ "grad_norm": 3.0166165828704834,
+ "learning_rate": 5.386048480692952e-07,
+ "loss": 0.0717,
+ "step": 32964
+ },
+ {
+ "epoch": 89.82288828337875,
+ "grad_norm": 1.6970953941345215,
+ "learning_rate": 5.383191691573775e-07,
+ "loss": 0.0299,
+ "step": 32965
+ },
+ {
+ "epoch": 89.82561307901908,
+ "grad_norm": 2.4598007202148438,
+ "learning_rate": 5.380335639327238e-07,
+ "loss": 0.0297,
+ "step": 32966
+ },
+ {
+ "epoch": 89.8283378746594,
+ "grad_norm": 2.238889694213867,
+ "learning_rate": 5.377480323975626e-07,
+ "loss": 0.0941,
+ "step": 32967
+ },
+ {
+ "epoch": 89.83106267029973,
+ "grad_norm": 2.525719165802002,
+ "learning_rate": 5.37462574554114e-07,
+ "loss": 0.112,
+ "step": 32968
+ },
+ {
+ "epoch": 89.83378746594005,
+ "grad_norm": 1.9318571090698242,
+ "learning_rate": 5.37177190404603e-07,
+ "loss": 0.0241,
+ "step": 32969
+ },
+ {
+ "epoch": 89.83651226158038,
+ "grad_norm": 2.7263565063476562,
+ "learning_rate": 5.368918799512502e-07,
+ "loss": 0.089,
+ "step": 32970
+ },
+ {
+ "epoch": 89.83923705722071,
+ "grad_norm": 2.8696954250335693,
+ "learning_rate": 5.366066431962802e-07,
+ "loss": 0.151,
+ "step": 32971
+ },
+ {
+ "epoch": 89.84196185286103,
+ "grad_norm": 2.8988192081451416,
+ "learning_rate": 5.363214801419126e-07,
+ "loss": 0.1698,
+ "step": 32972
+ },
+ {
+ "epoch": 89.84468664850137,
+ "grad_norm": 2.658188581466675,
+ "learning_rate": 5.360363907903676e-07,
+ "loss": 0.1053,
+ "step": 32973
+ },
+ {
+ "epoch": 89.84741144414168,
+ "grad_norm": 3.5899264812469482,
+ "learning_rate": 5.357513751438682e-07,
+ "loss": 0.0692,
+ "step": 32974
+ },
+ {
+ "epoch": 89.85013623978202,
+ "grad_norm": 2.681520938873291,
+ "learning_rate": 5.354664332046311e-07,
+ "loss": 0.0356,
+ "step": 32975
+ },
+ {
+ "epoch": 89.85286103542235,
+ "grad_norm": 2.867356300354004,
+ "learning_rate": 5.351815649748782e-07,
+ "loss": 0.0275,
+ "step": 32976
+ },
+ {
+ "epoch": 89.85558583106267,
+ "grad_norm": 2.661987543106079,
+ "learning_rate": 5.348967704568265e-07,
+ "loss": 0.0327,
+ "step": 32977
+ },
+ {
+ "epoch": 89.858310626703,
+ "grad_norm": 3.018894910812378,
+ "learning_rate": 5.34612049652693e-07,
+ "loss": 0.1273,
+ "step": 32978
+ },
+ {
+ "epoch": 89.86103542234332,
+ "grad_norm": 2.4152638912200928,
+ "learning_rate": 5.343274025646972e-07,
+ "loss": 0.0289,
+ "step": 32979
+ },
+ {
+ "epoch": 89.86376021798365,
+ "grad_norm": 2.1353743076324463,
+ "learning_rate": 5.34042829195055e-07,
+ "loss": 0.0716,
+ "step": 32980
+ },
+ {
+ "epoch": 89.86648501362397,
+ "grad_norm": 2.2595503330230713,
+ "learning_rate": 5.337583295459825e-07,
+ "loss": 0.1349,
+ "step": 32981
+ },
+ {
+ "epoch": 89.8692098092643,
+ "grad_norm": 2.7043895721435547,
+ "learning_rate": 5.334739036196945e-07,
+ "loss": 0.0464,
+ "step": 32982
+ },
+ {
+ "epoch": 89.87193460490464,
+ "grad_norm": 1.942264199256897,
+ "learning_rate": 5.331895514184083e-07,
+ "loss": 0.0253,
+ "step": 32983
+ },
+ {
+ "epoch": 89.87465940054496,
+ "grad_norm": 1.7817914485931396,
+ "learning_rate": 5.329052729443363e-07,
+ "loss": 0.0239,
+ "step": 32984
+ },
+ {
+ "epoch": 89.87738419618529,
+ "grad_norm": 2.8188374042510986,
+ "learning_rate": 5.326210681996947e-07,
+ "loss": 0.054,
+ "step": 32985
+ },
+ {
+ "epoch": 89.88010899182561,
+ "grad_norm": 3.5125081539154053,
+ "learning_rate": 5.323369371866926e-07,
+ "loss": 0.04,
+ "step": 32986
+ },
+ {
+ "epoch": 89.88283378746594,
+ "grad_norm": 2.6244945526123047,
+ "learning_rate": 5.320528799075486e-07,
+ "loss": 0.0191,
+ "step": 32987
+ },
+ {
+ "epoch": 89.88555858310627,
+ "grad_norm": 3.1844279766082764,
+ "learning_rate": 5.317688963644718e-07,
+ "loss": 0.1572,
+ "step": 32988
+ },
+ {
+ "epoch": 89.88828337874659,
+ "grad_norm": 4.102267742156982,
+ "learning_rate": 5.314849865596738e-07,
+ "loss": 0.0503,
+ "step": 32989
+ },
+ {
+ "epoch": 89.89100817438693,
+ "grad_norm": 3.608659029006958,
+ "learning_rate": 5.312011504953641e-07,
+ "loss": 0.0674,
+ "step": 32990
+ },
+ {
+ "epoch": 89.89373297002724,
+ "grad_norm": 2.702633857727051,
+ "learning_rate": 5.309173881737573e-07,
+ "loss": 0.0263,
+ "step": 32991
+ },
+ {
+ "epoch": 89.89645776566758,
+ "grad_norm": 3.237031936645508,
+ "learning_rate": 5.306336995970607e-07,
+ "loss": 0.0351,
+ "step": 32992
+ },
+ {
+ "epoch": 89.8991825613079,
+ "grad_norm": 2.228076219558716,
+ "learning_rate": 5.303500847674825e-07,
+ "loss": 0.1762,
+ "step": 32993
+ },
+ {
+ "epoch": 89.90190735694823,
+ "grad_norm": 2.669952630996704,
+ "learning_rate": 5.300665436872332e-07,
+ "loss": 0.0774,
+ "step": 32994
+ },
+ {
+ "epoch": 89.90463215258856,
+ "grad_norm": 1.98214852809906,
+ "learning_rate": 5.297830763585221e-07,
+ "loss": 0.0528,
+ "step": 32995
+ },
+ {
+ "epoch": 89.90735694822888,
+ "grad_norm": 2.620363473892212,
+ "learning_rate": 5.294996827835564e-07,
+ "loss": 0.0258,
+ "step": 32996
+ },
+ {
+ "epoch": 89.91008174386921,
+ "grad_norm": 2.039790153503418,
+ "learning_rate": 5.292163629645419e-07,
+ "loss": 0.0275,
+ "step": 32997
+ },
+ {
+ "epoch": 89.91280653950953,
+ "grad_norm": 2.1500163078308105,
+ "learning_rate": 5.289331169036838e-07,
+ "loss": 0.035,
+ "step": 32998
+ },
+ {
+ "epoch": 89.91553133514986,
+ "grad_norm": 1.4995557069778442,
+ "learning_rate": 5.286499446031912e-07,
+ "loss": 0.016,
+ "step": 32999
+ },
+ {
+ "epoch": 89.9182561307902,
+ "grad_norm": 3.5196704864501953,
+ "learning_rate": 5.28366846065268e-07,
+ "loss": 0.1035,
+ "step": 33000
+ },
+ {
+ "epoch": 89.92098092643052,
+ "grad_norm": 2.2869179248809814,
+ "learning_rate": 5.280838212921192e-07,
+ "loss": 0.0532,
+ "step": 33001
+ },
+ {
+ "epoch": 89.92370572207085,
+ "grad_norm": 2.1659247875213623,
+ "learning_rate": 5.278008702859471e-07,
+ "loss": 0.0358,
+ "step": 33002
+ },
+ {
+ "epoch": 89.92643051771117,
+ "grad_norm": 2.7991530895233154,
+ "learning_rate": 5.275179930489593e-07,
+ "loss": 0.0675,
+ "step": 33003
+ },
+ {
+ "epoch": 89.9291553133515,
+ "grad_norm": 3.941906452178955,
+ "learning_rate": 5.272351895833561e-07,
+ "loss": 0.187,
+ "step": 33004
+ },
+ {
+ "epoch": 89.93188010899182,
+ "grad_norm": 2.4331722259521484,
+ "learning_rate": 5.2695245989134e-07,
+ "loss": 0.0365,
+ "step": 33005
+ },
+ {
+ "epoch": 89.93460490463215,
+ "grad_norm": 2.5806493759155273,
+ "learning_rate": 5.266698039751117e-07,
+ "loss": 0.0153,
+ "step": 33006
+ },
+ {
+ "epoch": 89.93732970027249,
+ "grad_norm": 2.010847568511963,
+ "learning_rate": 5.263872218368759e-07,
+ "loss": 0.0286,
+ "step": 33007
+ },
+ {
+ "epoch": 89.9400544959128,
+ "grad_norm": 1.869657039642334,
+ "learning_rate": 5.261047134788311e-07,
+ "loss": 0.034,
+ "step": 33008
+ },
+ {
+ "epoch": 89.94277929155314,
+ "grad_norm": 6.215493202209473,
+ "learning_rate": 5.258222789031775e-07,
+ "loss": 0.0331,
+ "step": 33009
+ },
+ {
+ "epoch": 89.94550408719346,
+ "grad_norm": 3.4132604598999023,
+ "learning_rate": 5.255399181121146e-07,
+ "loss": 0.0513,
+ "step": 33010
+ },
+ {
+ "epoch": 89.94822888283379,
+ "grad_norm": 2.238222360610962,
+ "learning_rate": 5.252576311078417e-07,
+ "loss": 0.0507,
+ "step": 33011
+ },
+ {
+ "epoch": 89.95095367847412,
+ "grad_norm": 2.523106336593628,
+ "learning_rate": 5.249754178925581e-07,
+ "loss": 0.029,
+ "step": 33012
+ },
+ {
+ "epoch": 89.95367847411444,
+ "grad_norm": 2.9947681427001953,
+ "learning_rate": 5.246932784684622e-07,
+ "loss": 0.0417,
+ "step": 33013
+ },
+ {
+ "epoch": 89.95640326975477,
+ "grad_norm": 3.382309913635254,
+ "learning_rate": 5.244112128377477e-07,
+ "loss": 0.0535,
+ "step": 33014
+ },
+ {
+ "epoch": 89.95912806539509,
+ "grad_norm": 1.5899206399917603,
+ "learning_rate": 5.241292210026161e-07,
+ "loss": 0.1373,
+ "step": 33015
+ },
+ {
+ "epoch": 89.96185286103542,
+ "grad_norm": 1.6889121532440186,
+ "learning_rate": 5.238473029652602e-07,
+ "loss": 0.0222,
+ "step": 33016
+ },
+ {
+ "epoch": 89.96457765667574,
+ "grad_norm": 2.2443130016326904,
+ "learning_rate": 5.235654587278771e-07,
+ "loss": 0.0392,
+ "step": 33017
+ },
+ {
+ "epoch": 89.96730245231608,
+ "grad_norm": 2.3111021518707275,
+ "learning_rate": 5.232836882926596e-07,
+ "loss": 0.0418,
+ "step": 33018
+ },
+ {
+ "epoch": 89.97002724795641,
+ "grad_norm": 2.983551263809204,
+ "learning_rate": 5.230019916618046e-07,
+ "loss": 0.0503,
+ "step": 33019
+ },
+ {
+ "epoch": 89.97275204359673,
+ "grad_norm": 2.7868733406066895,
+ "learning_rate": 5.227203688375049e-07,
+ "loss": 0.1354,
+ "step": 33020
+ },
+ {
+ "epoch": 89.97547683923706,
+ "grad_norm": 2.1836066246032715,
+ "learning_rate": 5.224388198219554e-07,
+ "loss": 0.0221,
+ "step": 33021
+ },
+ {
+ "epoch": 89.97820163487738,
+ "grad_norm": 3.358785629272461,
+ "learning_rate": 5.221573446173444e-07,
+ "loss": 0.0671,
+ "step": 33022
+ },
+ {
+ "epoch": 89.98092643051771,
+ "grad_norm": 3.126645803451538,
+ "learning_rate": 5.218759432258691e-07,
+ "loss": 0.0469,
+ "step": 33023
+ },
+ {
+ "epoch": 89.98365122615803,
+ "grad_norm": 2.0958292484283447,
+ "learning_rate": 5.215946156497187e-07,
+ "loss": 0.018,
+ "step": 33024
+ },
+ {
+ "epoch": 89.98637602179836,
+ "grad_norm": 2.102900505065918,
+ "learning_rate": 5.213133618910849e-07,
+ "loss": 0.0749,
+ "step": 33025
+ },
+ {
+ "epoch": 89.9891008174387,
+ "grad_norm": 1.6311944723129272,
+ "learning_rate": 5.210321819521558e-07,
+ "loss": 0.032,
+ "step": 33026
+ },
+ {
+ "epoch": 89.99182561307902,
+ "grad_norm": 1.8994883298873901,
+ "learning_rate": 5.207510758351231e-07,
+ "loss": 0.0353,
+ "step": 33027
+ },
+ {
+ "epoch": 89.99455040871935,
+ "grad_norm": 1.4795035123825073,
+ "learning_rate": 5.204700435421772e-07,
+ "loss": 0.0137,
+ "step": 33028
+ },
+ {
+ "epoch": 89.99727520435967,
+ "grad_norm": 2.647529363632202,
+ "learning_rate": 5.201890850755054e-07,
+ "loss": 0.0511,
+ "step": 33029
+ },
+ {
+ "epoch": 90.0,
+ "grad_norm": 2.3613972663879395,
+ "learning_rate": 5.199082004372958e-07,
+ "loss": 0.0328,
+ "step": 33030
+ },
+ {
+ "epoch": 90.00272479564033,
+ "grad_norm": 2.134033679962158,
+ "learning_rate": 5.196273896297354e-07,
+ "loss": 0.0479,
+ "step": 33031
+ },
+ {
+ "epoch": 90.00544959128065,
+ "grad_norm": 2.578030824661255,
+ "learning_rate": 5.193466526550117e-07,
+ "loss": 0.0362,
+ "step": 33032
+ },
+ {
+ "epoch": 90.00817438692098,
+ "grad_norm": 3.1712164878845215,
+ "learning_rate": 5.190659895153127e-07,
+ "loss": 0.0901,
+ "step": 33033
+ },
+ {
+ "epoch": 90.0108991825613,
+ "grad_norm": 2.9159908294677734,
+ "learning_rate": 5.187854002128223e-07,
+ "loss": 0.0516,
+ "step": 33034
+ },
+ {
+ "epoch": 90.01362397820164,
+ "grad_norm": 6.015149116516113,
+ "learning_rate": 5.185048847497242e-07,
+ "loss": 0.0363,
+ "step": 33035
+ },
+ {
+ "epoch": 90.01634877384195,
+ "grad_norm": 2.3716206550598145,
+ "learning_rate": 5.182244431282058e-07,
+ "loss": 0.0229,
+ "step": 33036
+ },
+ {
+ "epoch": 90.01907356948229,
+ "grad_norm": 3.414368152618408,
+ "learning_rate": 5.179440753504517e-07,
+ "loss": 0.0395,
+ "step": 33037
+ },
+ {
+ "epoch": 90.02179836512262,
+ "grad_norm": 2.8145992755889893,
+ "learning_rate": 5.176637814186414e-07,
+ "loss": 0.0249,
+ "step": 33038
+ },
+ {
+ "epoch": 90.02452316076294,
+ "grad_norm": 3.2736363410949707,
+ "learning_rate": 5.17383561334962e-07,
+ "loss": 0.0338,
+ "step": 33039
+ },
+ {
+ "epoch": 90.02724795640327,
+ "grad_norm": 2.978874921798706,
+ "learning_rate": 5.171034151015941e-07,
+ "loss": 0.0396,
+ "step": 33040
+ },
+ {
+ "epoch": 90.02997275204359,
+ "grad_norm": 2.7185943126678467,
+ "learning_rate": 5.168233427207204e-07,
+ "loss": 0.084,
+ "step": 33041
+ },
+ {
+ "epoch": 90.03269754768392,
+ "grad_norm": 2.609410285949707,
+ "learning_rate": 5.165433441945189e-07,
+ "loss": 0.0838,
+ "step": 33042
+ },
+ {
+ "epoch": 90.03542234332426,
+ "grad_norm": 1.7382959127426147,
+ "learning_rate": 5.162634195251748e-07,
+ "loss": 0.0211,
+ "step": 33043
+ },
+ {
+ "epoch": 90.03814713896458,
+ "grad_norm": 2.75905179977417,
+ "learning_rate": 5.15983568714864e-07,
+ "loss": 0.034,
+ "step": 33044
+ },
+ {
+ "epoch": 90.04087193460491,
+ "grad_norm": 1.7357958555221558,
+ "learning_rate": 5.157037917657692e-07,
+ "loss": 0.0248,
+ "step": 33045
+ },
+ {
+ "epoch": 90.04359673024523,
+ "grad_norm": 2.1174702644348145,
+ "learning_rate": 5.154240886800688e-07,
+ "loss": 0.0367,
+ "step": 33046
+ },
+ {
+ "epoch": 90.04632152588556,
+ "grad_norm": 6.2968878746032715,
+ "learning_rate": 5.151444594599386e-07,
+ "loss": 0.05,
+ "step": 33047
+ },
+ {
+ "epoch": 90.04904632152588,
+ "grad_norm": 1.8036682605743408,
+ "learning_rate": 5.148649041075593e-07,
+ "loss": 0.0173,
+ "step": 33048
+ },
+ {
+ "epoch": 90.05177111716621,
+ "grad_norm": 2.6650938987731934,
+ "learning_rate": 5.145854226251068e-07,
+ "loss": 0.057,
+ "step": 33049
+ },
+ {
+ "epoch": 90.05449591280654,
+ "grad_norm": 27.12366485595703,
+ "learning_rate": 5.143060150147583e-07,
+ "loss": 0.0246,
+ "step": 33050
+ },
+ {
+ "epoch": 90.05722070844686,
+ "grad_norm": 2.7090585231781006,
+ "learning_rate": 5.140266812786865e-07,
+ "loss": 0.035,
+ "step": 33051
+ },
+ {
+ "epoch": 90.0599455040872,
+ "grad_norm": 2.360356569290161,
+ "learning_rate": 5.137474214190719e-07,
+ "loss": 0.081,
+ "step": 33052
+ },
+ {
+ "epoch": 90.06267029972751,
+ "grad_norm": 2.3694264888763428,
+ "learning_rate": 5.134682354380871e-07,
+ "loss": 0.0348,
+ "step": 33053
+ },
+ {
+ "epoch": 90.06539509536785,
+ "grad_norm": 2.62050199508667,
+ "learning_rate": 5.131891233379071e-07,
+ "loss": 0.0666,
+ "step": 33054
+ },
+ {
+ "epoch": 90.06811989100818,
+ "grad_norm": 11.05138874053955,
+ "learning_rate": 5.129100851207025e-07,
+ "loss": 0.321,
+ "step": 33055
+ },
+ {
+ "epoch": 90.0708446866485,
+ "grad_norm": 3.2369446754455566,
+ "learning_rate": 5.126311207886503e-07,
+ "loss": 0.1585,
+ "step": 33056
+ },
+ {
+ "epoch": 90.07356948228883,
+ "grad_norm": 3.03149676322937,
+ "learning_rate": 5.123522303439222e-07,
+ "loss": 0.0489,
+ "step": 33057
+ },
+ {
+ "epoch": 90.07629427792915,
+ "grad_norm": 3.8002331256866455,
+ "learning_rate": 5.120734137886884e-07,
+ "loss": 0.0504,
+ "step": 33058
+ },
+ {
+ "epoch": 90.07901907356948,
+ "grad_norm": 2.704076051712036,
+ "learning_rate": 5.117946711251209e-07,
+ "loss": 0.0787,
+ "step": 33059
+ },
+ {
+ "epoch": 90.0817438692098,
+ "grad_norm": 3.1726512908935547,
+ "learning_rate": 5.115160023553922e-07,
+ "loss": 0.1538,
+ "step": 33060
+ },
+ {
+ "epoch": 90.08446866485014,
+ "grad_norm": 2.7844386100769043,
+ "learning_rate": 5.112374074816706e-07,
+ "loss": 0.0571,
+ "step": 33061
+ },
+ {
+ "epoch": 90.08719346049047,
+ "grad_norm": 3.116177797317505,
+ "learning_rate": 5.109588865061277e-07,
+ "loss": 0.0287,
+ "step": 33062
+ },
+ {
+ "epoch": 90.08991825613079,
+ "grad_norm": 2.319117307662964,
+ "learning_rate": 5.106804394309306e-07,
+ "loss": 0.0217,
+ "step": 33063
+ },
+ {
+ "epoch": 90.09264305177112,
+ "grad_norm": 2.8059732913970947,
+ "learning_rate": 5.104020662582499e-07,
+ "loss": 0.0293,
+ "step": 33064
+ },
+ {
+ "epoch": 90.09536784741144,
+ "grad_norm": 2.308300733566284,
+ "learning_rate": 5.101237669902526e-07,
+ "loss": 0.1803,
+ "step": 33065
+ },
+ {
+ "epoch": 90.09809264305177,
+ "grad_norm": 2.789944887161255,
+ "learning_rate": 5.09845541629106e-07,
+ "loss": 0.0535,
+ "step": 33066
+ },
+ {
+ "epoch": 90.1008174386921,
+ "grad_norm": 2.59648060798645,
+ "learning_rate": 5.095673901769749e-07,
+ "loss": 0.1116,
+ "step": 33067
+ },
+ {
+ "epoch": 90.10354223433242,
+ "grad_norm": 1.695949673652649,
+ "learning_rate": 5.092893126360288e-07,
+ "loss": 0.0651,
+ "step": 33068
+ },
+ {
+ "epoch": 90.10626702997276,
+ "grad_norm": 2.5341873168945312,
+ "learning_rate": 5.090113090084325e-07,
+ "loss": 0.0886,
+ "step": 33069
+ },
+ {
+ "epoch": 90.10899182561307,
+ "grad_norm": 6.12711763381958,
+ "learning_rate": 5.087333792963512e-07,
+ "loss": 0.0248,
+ "step": 33070
+ },
+ {
+ "epoch": 90.11171662125341,
+ "grad_norm": 3.309462547302246,
+ "learning_rate": 5.084555235019473e-07,
+ "loss": 0.1271,
+ "step": 33071
+ },
+ {
+ "epoch": 90.11444141689373,
+ "grad_norm": 2.403449535369873,
+ "learning_rate": 5.081777416273869e-07,
+ "loss": 0.0511,
+ "step": 33072
+ },
+ {
+ "epoch": 90.11716621253406,
+ "grad_norm": 3.0937139987945557,
+ "learning_rate": 5.079000336748341e-07,
+ "loss": 0.0382,
+ "step": 33073
+ },
+ {
+ "epoch": 90.11989100817439,
+ "grad_norm": 5.334840774536133,
+ "learning_rate": 5.076223996464491e-07,
+ "loss": 0.0422,
+ "step": 33074
+ },
+ {
+ "epoch": 90.12261580381471,
+ "grad_norm": 3.4917781352996826,
+ "learning_rate": 5.073448395443948e-07,
+ "loss": 0.131,
+ "step": 33075
+ },
+ {
+ "epoch": 90.12534059945504,
+ "grad_norm": 2.161721706390381,
+ "learning_rate": 5.070673533708337e-07,
+ "loss": 0.0455,
+ "step": 33076
+ },
+ {
+ "epoch": 90.12806539509536,
+ "grad_norm": 2.2415032386779785,
+ "learning_rate": 5.067899411279276e-07,
+ "loss": 0.0374,
+ "step": 33077
+ },
+ {
+ "epoch": 90.1307901907357,
+ "grad_norm": 3.1583940982818604,
+ "learning_rate": 5.065126028178357e-07,
+ "loss": 0.081,
+ "step": 33078
+ },
+ {
+ "epoch": 90.13351498637603,
+ "grad_norm": 2.8492276668548584,
+ "learning_rate": 5.062353384427144e-07,
+ "loss": 0.0925,
+ "step": 33079
+ },
+ {
+ "epoch": 90.13623978201635,
+ "grad_norm": 3.782942295074463,
+ "learning_rate": 5.059581480047304e-07,
+ "loss": 0.1233,
+ "step": 33080
+ },
+ {
+ "epoch": 90.13896457765668,
+ "grad_norm": 2.2050328254699707,
+ "learning_rate": 5.05681031506039e-07,
+ "loss": 0.0781,
+ "step": 33081
+ },
+ {
+ "epoch": 90.141689373297,
+ "grad_norm": 2.3911116123199463,
+ "learning_rate": 5.054039889487972e-07,
+ "loss": 0.0867,
+ "step": 33082
+ },
+ {
+ "epoch": 90.14441416893733,
+ "grad_norm": 2.5510473251342773,
+ "learning_rate": 5.051270203351632e-07,
+ "loss": 0.0259,
+ "step": 33083
+ },
+ {
+ "epoch": 90.14713896457765,
+ "grad_norm": 2.6050610542297363,
+ "learning_rate": 5.048501256672955e-07,
+ "loss": 0.198,
+ "step": 33084
+ },
+ {
+ "epoch": 90.14986376021798,
+ "grad_norm": 4.228565692901611,
+ "learning_rate": 5.045733049473489e-07,
+ "loss": 0.0959,
+ "step": 33085
+ },
+ {
+ "epoch": 90.15258855585832,
+ "grad_norm": 2.5402660369873047,
+ "learning_rate": 5.042965581774794e-07,
+ "loss": 0.1167,
+ "step": 33086
+ },
+ {
+ "epoch": 90.15531335149863,
+ "grad_norm": 2.778419256210327,
+ "learning_rate": 5.040198853598421e-07,
+ "loss": 0.0978,
+ "step": 33087
+ },
+ {
+ "epoch": 90.15803814713897,
+ "grad_norm": 3.5623526573181152,
+ "learning_rate": 5.037432864965941e-07,
+ "loss": 0.0295,
+ "step": 33088
+ },
+ {
+ "epoch": 90.16076294277929,
+ "grad_norm": 2.1568751335144043,
+ "learning_rate": 5.034667615898869e-07,
+ "loss": 0.0753,
+ "step": 33089
+ },
+ {
+ "epoch": 90.16348773841962,
+ "grad_norm": 3.8411865234375,
+ "learning_rate": 5.031903106418756e-07,
+ "loss": 0.0773,
+ "step": 33090
+ },
+ {
+ "epoch": 90.16621253405995,
+ "grad_norm": 2.954439163208008,
+ "learning_rate": 5.029139336547106e-07,
+ "loss": 0.1143,
+ "step": 33091
+ },
+ {
+ "epoch": 90.16893732970027,
+ "grad_norm": 3.459062099456787,
+ "learning_rate": 5.02637630630548e-07,
+ "loss": 0.0978,
+ "step": 33092
+ },
+ {
+ "epoch": 90.1716621253406,
+ "grad_norm": 2.2669992446899414,
+ "learning_rate": 5.023614015715372e-07,
+ "loss": 0.0756,
+ "step": 33093
+ },
+ {
+ "epoch": 90.17438692098092,
+ "grad_norm": 2.870089530944824,
+ "learning_rate": 5.020852464798309e-07,
+ "loss": 0.0579,
+ "step": 33094
+ },
+ {
+ "epoch": 90.17711171662125,
+ "grad_norm": 2.030543565750122,
+ "learning_rate": 5.018091653575774e-07,
+ "loss": 0.0234,
+ "step": 33095
+ },
+ {
+ "epoch": 90.17983651226157,
+ "grad_norm": 3.0314953327178955,
+ "learning_rate": 5.015331582069282e-07,
+ "loss": 0.0378,
+ "step": 33096
+ },
+ {
+ "epoch": 90.1825613079019,
+ "grad_norm": 2.4393393993377686,
+ "learning_rate": 5.01257225030034e-07,
+ "loss": 0.0844,
+ "step": 33097
+ },
+ {
+ "epoch": 90.18528610354224,
+ "grad_norm": 3.483377456665039,
+ "learning_rate": 5.009813658290441e-07,
+ "loss": 0.0524,
+ "step": 33098
+ },
+ {
+ "epoch": 90.18801089918256,
+ "grad_norm": 3.7955992221832275,
+ "learning_rate": 5.007055806061045e-07,
+ "loss": 0.0236,
+ "step": 33099
+ },
+ {
+ "epoch": 90.19073569482289,
+ "grad_norm": 2.5338237285614014,
+ "learning_rate": 5.004298693633625e-07,
+ "loss": 0.046,
+ "step": 33100
+ },
+ {
+ "epoch": 90.19346049046321,
+ "grad_norm": 2.2801761627197266,
+ "learning_rate": 5.001542321029695e-07,
+ "loss": 0.0709,
+ "step": 33101
+ },
+ {
+ "epoch": 90.19618528610354,
+ "grad_norm": 2.7014200687408447,
+ "learning_rate": 4.998786688270685e-07,
+ "loss": 0.0285,
+ "step": 33102
+ },
+ {
+ "epoch": 90.19891008174388,
+ "grad_norm": 2.956639289855957,
+ "learning_rate": 4.996031795378065e-07,
+ "loss": 0.0345,
+ "step": 33103
+ },
+ {
+ "epoch": 90.2016348773842,
+ "grad_norm": 2.349761486053467,
+ "learning_rate": 4.993277642373296e-07,
+ "loss": 0.1865,
+ "step": 33104
+ },
+ {
+ "epoch": 90.20435967302453,
+ "grad_norm": 1.7927157878875732,
+ "learning_rate": 4.990524229277826e-07,
+ "loss": 0.0331,
+ "step": 33105
+ },
+ {
+ "epoch": 90.20708446866485,
+ "grad_norm": 1.8765418529510498,
+ "learning_rate": 4.987771556113096e-07,
+ "loss": 0.0277,
+ "step": 33106
+ },
+ {
+ "epoch": 90.20980926430518,
+ "grad_norm": 1.8036874532699585,
+ "learning_rate": 4.985019622900522e-07,
+ "loss": 0.0833,
+ "step": 33107
+ },
+ {
+ "epoch": 90.2125340599455,
+ "grad_norm": 3.2392690181732178,
+ "learning_rate": 4.982268429661575e-07,
+ "loss": 0.0361,
+ "step": 33108
+ },
+ {
+ "epoch": 90.21525885558583,
+ "grad_norm": 3.99721622467041,
+ "learning_rate": 4.979517976417669e-07,
+ "loss": 0.0561,
+ "step": 33109
+ },
+ {
+ "epoch": 90.21798365122616,
+ "grad_norm": 2.079462766647339,
+ "learning_rate": 4.976768263190212e-07,
+ "loss": 0.0234,
+ "step": 33110
+ },
+ {
+ "epoch": 90.22070844686648,
+ "grad_norm": 1.9858804941177368,
+ "learning_rate": 4.97401929000062e-07,
+ "loss": 0.1116,
+ "step": 33111
+ },
+ {
+ "epoch": 90.22343324250681,
+ "grad_norm": 2.7112207412719727,
+ "learning_rate": 4.971271056870308e-07,
+ "loss": 0.1189,
+ "step": 33112
+ },
+ {
+ "epoch": 90.22615803814713,
+ "grad_norm": 2.296314001083374,
+ "learning_rate": 4.968523563820682e-07,
+ "loss": 0.0404,
+ "step": 33113
+ },
+ {
+ "epoch": 90.22888283378747,
+ "grad_norm": 2.176239252090454,
+ "learning_rate": 4.965776810873135e-07,
+ "loss": 0.0473,
+ "step": 33114
+ },
+ {
+ "epoch": 90.2316076294278,
+ "grad_norm": 2.048495292663574,
+ "learning_rate": 4.963030798049063e-07,
+ "loss": 0.0205,
+ "step": 33115
+ },
+ {
+ "epoch": 90.23433242506812,
+ "grad_norm": 2.07379412651062,
+ "learning_rate": 4.960285525369834e-07,
+ "loss": 0.0272,
+ "step": 33116
+ },
+ {
+ "epoch": 90.23705722070845,
+ "grad_norm": 2.025475025177002,
+ "learning_rate": 4.957540992856869e-07,
+ "loss": 0.0797,
+ "step": 33117
+ },
+ {
+ "epoch": 90.23978201634877,
+ "grad_norm": 2.2327964305877686,
+ "learning_rate": 4.954797200531502e-07,
+ "loss": 0.0743,
+ "step": 33118
+ },
+ {
+ "epoch": 90.2425068119891,
+ "grad_norm": 2.112105131149292,
+ "learning_rate": 4.95205414841512e-07,
+ "loss": 0.044,
+ "step": 33119
+ },
+ {
+ "epoch": 90.24523160762942,
+ "grad_norm": 2.899749755859375,
+ "learning_rate": 4.949311836529059e-07,
+ "loss": 0.0462,
+ "step": 33120
+ },
+ {
+ "epoch": 90.24795640326975,
+ "grad_norm": 2.9915671348571777,
+ "learning_rate": 4.946570264894724e-07,
+ "loss": 0.0679,
+ "step": 33121
+ },
+ {
+ "epoch": 90.25068119891009,
+ "grad_norm": 3.773315668106079,
+ "learning_rate": 4.943829433533431e-07,
+ "loss": 0.1619,
+ "step": 33122
+ },
+ {
+ "epoch": 90.2534059945504,
+ "grad_norm": 2.1987504959106445,
+ "learning_rate": 4.941089342466543e-07,
+ "loss": 0.0253,
+ "step": 33123
+ },
+ {
+ "epoch": 90.25613079019074,
+ "grad_norm": 1.9298509359359741,
+ "learning_rate": 4.938349991715375e-07,
+ "loss": 0.0744,
+ "step": 33124
+ },
+ {
+ "epoch": 90.25885558583106,
+ "grad_norm": 2.095750570297241,
+ "learning_rate": 4.935611381301298e-07,
+ "loss": 0.0176,
+ "step": 33125
+ },
+ {
+ "epoch": 90.26158038147139,
+ "grad_norm": 2.950507402420044,
+ "learning_rate": 4.932873511245606e-07,
+ "loss": 0.027,
+ "step": 33126
+ },
+ {
+ "epoch": 90.26430517711172,
+ "grad_norm": 1.4579638242721558,
+ "learning_rate": 4.930136381569628e-07,
+ "loss": 0.1051,
+ "step": 33127
+ },
+ {
+ "epoch": 90.26702997275204,
+ "grad_norm": 1.8372451066970825,
+ "learning_rate": 4.927399992294701e-07,
+ "loss": 0.1445,
+ "step": 33128
+ },
+ {
+ "epoch": 90.26975476839237,
+ "grad_norm": 2.2512099742889404,
+ "learning_rate": 4.924664343442132e-07,
+ "loss": 0.0766,
+ "step": 33129
+ },
+ {
+ "epoch": 90.2724795640327,
+ "grad_norm": 2.2136800289154053,
+ "learning_rate": 4.92192943503319e-07,
+ "loss": 0.0802,
+ "step": 33130
+ },
+ {
+ "epoch": 90.27520435967303,
+ "grad_norm": 3.093181848526001,
+ "learning_rate": 4.919195267089227e-07,
+ "loss": 0.0328,
+ "step": 33131
+ },
+ {
+ "epoch": 90.27792915531334,
+ "grad_norm": 2.9186415672302246,
+ "learning_rate": 4.916461839631492e-07,
+ "loss": 0.1646,
+ "step": 33132
+ },
+ {
+ "epoch": 90.28065395095368,
+ "grad_norm": 2.292050838470459,
+ "learning_rate": 4.913729152681302e-07,
+ "loss": 0.0657,
+ "step": 33133
+ },
+ {
+ "epoch": 90.28337874659401,
+ "grad_norm": 2.6327805519104004,
+ "learning_rate": 4.910997206259927e-07,
+ "loss": 0.0357,
+ "step": 33134
+ },
+ {
+ "epoch": 90.28610354223433,
+ "grad_norm": 1.9433643817901611,
+ "learning_rate": 4.908266000388651e-07,
+ "loss": 0.0195,
+ "step": 33135
+ },
+ {
+ "epoch": 90.28882833787466,
+ "grad_norm": 2.821531057357788,
+ "learning_rate": 4.905535535088724e-07,
+ "loss": 0.0333,
+ "step": 33136
+ },
+ {
+ "epoch": 90.29155313351498,
+ "grad_norm": 2.54772686958313,
+ "learning_rate": 4.902805810381439e-07,
+ "loss": 0.0794,
+ "step": 33137
+ },
+ {
+ "epoch": 90.29427792915531,
+ "grad_norm": 1.4708597660064697,
+ "learning_rate": 4.900076826288047e-07,
+ "loss": 0.0215,
+ "step": 33138
+ },
+ {
+ "epoch": 90.29700272479565,
+ "grad_norm": 1.879388451576233,
+ "learning_rate": 4.897348582829797e-07,
+ "loss": 0.0272,
+ "step": 33139
+ },
+ {
+ "epoch": 90.29972752043597,
+ "grad_norm": 14.01826000213623,
+ "learning_rate": 4.894621080027906e-07,
+ "loss": 0.0364,
+ "step": 33140
+ },
+ {
+ "epoch": 90.3024523160763,
+ "grad_norm": 2.1911098957061768,
+ "learning_rate": 4.891894317903678e-07,
+ "loss": 0.1552,
+ "step": 33141
+ },
+ {
+ "epoch": 90.30517711171662,
+ "grad_norm": 2.230325222015381,
+ "learning_rate": 4.889168296478309e-07,
+ "loss": 0.093,
+ "step": 33142
+ },
+ {
+ "epoch": 90.30790190735695,
+ "grad_norm": 3.2192161083221436,
+ "learning_rate": 4.886443015773023e-07,
+ "loss": 0.0432,
+ "step": 33143
+ },
+ {
+ "epoch": 90.31062670299727,
+ "grad_norm": 2.402613878250122,
+ "learning_rate": 4.883718475809063e-07,
+ "loss": 0.0865,
+ "step": 33144
+ },
+ {
+ "epoch": 90.3133514986376,
+ "grad_norm": 3.3279948234558105,
+ "learning_rate": 4.880994676607642e-07,
+ "loss": 0.1136,
+ "step": 33145
+ },
+ {
+ "epoch": 90.31607629427793,
+ "grad_norm": 2.0511176586151123,
+ "learning_rate": 4.878271618189978e-07,
+ "loss": 0.0278,
+ "step": 33146
+ },
+ {
+ "epoch": 90.31880108991825,
+ "grad_norm": 3.2558493614196777,
+ "learning_rate": 4.875549300577264e-07,
+ "loss": 0.0614,
+ "step": 33147
+ },
+ {
+ "epoch": 90.32152588555859,
+ "grad_norm": 2.5872344970703125,
+ "learning_rate": 4.872827723790707e-07,
+ "loss": 0.1026,
+ "step": 33148
+ },
+ {
+ "epoch": 90.3242506811989,
+ "grad_norm": 3.384432077407837,
+ "learning_rate": 4.870106887851522e-07,
+ "loss": 0.0583,
+ "step": 33149
+ },
+ {
+ "epoch": 90.32697547683924,
+ "grad_norm": 3.299123764038086,
+ "learning_rate": 4.867386792780882e-07,
+ "loss": 0.0501,
+ "step": 33150
+ },
+ {
+ "epoch": 90.32970027247957,
+ "grad_norm": 2.722965955734253,
+ "learning_rate": 4.864667438599968e-07,
+ "loss": 0.0472,
+ "step": 33151
+ },
+ {
+ "epoch": 90.33242506811989,
+ "grad_norm": 2.200094699859619,
+ "learning_rate": 4.861948825329954e-07,
+ "loss": 0.0862,
+ "step": 33152
+ },
+ {
+ "epoch": 90.33514986376022,
+ "grad_norm": 2.139737844467163,
+ "learning_rate": 4.859230952992022e-07,
+ "loss": 0.0257,
+ "step": 33153
+ },
+ {
+ "epoch": 90.33787465940054,
+ "grad_norm": 3.265510082244873,
+ "learning_rate": 4.856513821607356e-07,
+ "loss": 0.1213,
+ "step": 33154
+ },
+ {
+ "epoch": 90.34059945504087,
+ "grad_norm": 2.391695976257324,
+ "learning_rate": 4.853797431197082e-07,
+ "loss": 0.1046,
+ "step": 33155
+ },
+ {
+ "epoch": 90.34332425068119,
+ "grad_norm": 2.397998571395874,
+ "learning_rate": 4.851081781782363e-07,
+ "loss": 0.0173,
+ "step": 33156
+ },
+ {
+ "epoch": 90.34604904632153,
+ "grad_norm": 2.9855945110321045,
+ "learning_rate": 4.84836687338438e-07,
+ "loss": 0.0661,
+ "step": 33157
+ },
+ {
+ "epoch": 90.34877384196186,
+ "grad_norm": 3.025181293487549,
+ "learning_rate": 4.84565270602424e-07,
+ "loss": 0.194,
+ "step": 33158
+ },
+ {
+ "epoch": 90.35149863760218,
+ "grad_norm": 3.4120302200317383,
+ "learning_rate": 4.842939279723102e-07,
+ "loss": 0.0836,
+ "step": 33159
+ },
+ {
+ "epoch": 90.35422343324251,
+ "grad_norm": 2.47977876663208,
+ "learning_rate": 4.840226594502073e-07,
+ "loss": 0.1062,
+ "step": 33160
+ },
+ {
+ "epoch": 90.35694822888283,
+ "grad_norm": 3.055844306945801,
+ "learning_rate": 4.837514650382313e-07,
+ "loss": 0.0697,
+ "step": 33161
+ },
+ {
+ "epoch": 90.35967302452316,
+ "grad_norm": 4.376160144805908,
+ "learning_rate": 4.834803447384917e-07,
+ "loss": 0.0312,
+ "step": 33162
+ },
+ {
+ "epoch": 90.3623978201635,
+ "grad_norm": 3.98852276802063,
+ "learning_rate": 4.832092985531023e-07,
+ "loss": 0.1487,
+ "step": 33163
+ },
+ {
+ "epoch": 90.36512261580381,
+ "grad_norm": 2.69901442527771,
+ "learning_rate": 4.829383264841703e-07,
+ "loss": 0.0318,
+ "step": 33164
+ },
+ {
+ "epoch": 90.36784741144415,
+ "grad_norm": 1.9195072650909424,
+ "learning_rate": 4.826674285338085e-07,
+ "loss": 0.029,
+ "step": 33165
+ },
+ {
+ "epoch": 90.37057220708446,
+ "grad_norm": 13.976252555847168,
+ "learning_rate": 4.823966047041273e-07,
+ "loss": 0.036,
+ "step": 33166
+ },
+ {
+ "epoch": 90.3732970027248,
+ "grad_norm": 1.4326947927474976,
+ "learning_rate": 4.821258549972363e-07,
+ "loss": 0.017,
+ "step": 33167
+ },
+ {
+ "epoch": 90.37602179836512,
+ "grad_norm": 1.6718900203704834,
+ "learning_rate": 4.818551794152404e-07,
+ "loss": 0.0183,
+ "step": 33168
+ },
+ {
+ "epoch": 90.37874659400545,
+ "grad_norm": 2.5900321006774902,
+ "learning_rate": 4.815845779602512e-07,
+ "loss": 0.0364,
+ "step": 33169
+ },
+ {
+ "epoch": 90.38147138964578,
+ "grad_norm": 1.4867286682128906,
+ "learning_rate": 4.813140506343761e-07,
+ "loss": 0.0152,
+ "step": 33170
+ },
+ {
+ "epoch": 90.3841961852861,
+ "grad_norm": 2.70233416557312,
+ "learning_rate": 4.810435974397199e-07,
+ "loss": 0.0428,
+ "step": 33171
+ },
+ {
+ "epoch": 90.38692098092643,
+ "grad_norm": 2.667961359024048,
+ "learning_rate": 4.807732183783886e-07,
+ "loss": 0.0329,
+ "step": 33172
+ },
+ {
+ "epoch": 90.38964577656675,
+ "grad_norm": 8.53109073638916,
+ "learning_rate": 4.805029134524908e-07,
+ "loss": 0.0294,
+ "step": 33173
+ },
+ {
+ "epoch": 90.39237057220708,
+ "grad_norm": 2.219076633453369,
+ "learning_rate": 4.80232682664129e-07,
+ "loss": 0.0242,
+ "step": 33174
+ },
+ {
+ "epoch": 90.39509536784742,
+ "grad_norm": 2.394843578338623,
+ "learning_rate": 4.799625260154095e-07,
+ "loss": 0.0703,
+ "step": 33175
+ },
+ {
+ "epoch": 90.39782016348774,
+ "grad_norm": 2.4840338230133057,
+ "learning_rate": 4.796924435084338e-07,
+ "loss": 0.1506,
+ "step": 33176
+ },
+ {
+ "epoch": 90.40054495912807,
+ "grad_norm": 2.4439096450805664,
+ "learning_rate": 4.794224351453092e-07,
+ "loss": 0.0293,
+ "step": 33177
+ },
+ {
+ "epoch": 90.40326975476839,
+ "grad_norm": 2.4611148834228516,
+ "learning_rate": 4.79152500928135e-07,
+ "loss": 0.0281,
+ "step": 33178
+ },
+ {
+ "epoch": 90.40599455040872,
+ "grad_norm": 2.7731146812438965,
+ "learning_rate": 4.788826408590153e-07,
+ "loss": 0.1032,
+ "step": 33179
+ },
+ {
+ "epoch": 90.40871934604904,
+ "grad_norm": 3.252362012863159,
+ "learning_rate": 4.786128549400492e-07,
+ "loss": 0.1381,
+ "step": 33180
+ },
+ {
+ "epoch": 90.41144414168937,
+ "grad_norm": 2.8525171279907227,
+ "learning_rate": 4.783431431733421e-07,
+ "loss": 0.057,
+ "step": 33181
+ },
+ {
+ "epoch": 90.4141689373297,
+ "grad_norm": 3.271495819091797,
+ "learning_rate": 4.780735055609908e-07,
+ "loss": 0.0342,
+ "step": 33182
+ },
+ {
+ "epoch": 90.41689373297002,
+ "grad_norm": 2.9020233154296875,
+ "learning_rate": 4.778039421050973e-07,
+ "loss": 0.0522,
+ "step": 33183
+ },
+ {
+ "epoch": 90.41961852861036,
+ "grad_norm": 2.4161126613616943,
+ "learning_rate": 4.775344528077596e-07,
+ "loss": 0.0938,
+ "step": 33184
+ },
+ {
+ "epoch": 90.42234332425068,
+ "grad_norm": 2.141167640686035,
+ "learning_rate": 4.772650376710775e-07,
+ "loss": 0.0195,
+ "step": 33185
+ },
+ {
+ "epoch": 90.42506811989101,
+ "grad_norm": 2.094120502471924,
+ "learning_rate": 4.76995696697149e-07,
+ "loss": 0.0517,
+ "step": 33186
+ },
+ {
+ "epoch": 90.42779291553134,
+ "grad_norm": 2.9432313442230225,
+ "learning_rate": 4.767264298880714e-07,
+ "loss": 0.0285,
+ "step": 33187
+ },
+ {
+ "epoch": 90.43051771117166,
+ "grad_norm": 2.2481791973114014,
+ "learning_rate": 4.7645723724594084e-07,
+ "loss": 0.0209,
+ "step": 33188
+ },
+ {
+ "epoch": 90.433242506812,
+ "grad_norm": 2.260496139526367,
+ "learning_rate": 4.7618811877285566e-07,
+ "loss": 0.1094,
+ "step": 33189
+ },
+ {
+ "epoch": 90.43596730245231,
+ "grad_norm": 1.7597731351852417,
+ "learning_rate": 4.759190744709119e-07,
+ "loss": 0.0279,
+ "step": 33190
+ },
+ {
+ "epoch": 90.43869209809264,
+ "grad_norm": 1.820627212524414,
+ "learning_rate": 4.756501043422024e-07,
+ "loss": 0.0206,
+ "step": 33191
+ },
+ {
+ "epoch": 90.44141689373296,
+ "grad_norm": 1.9359986782073975,
+ "learning_rate": 4.7538120838882317e-07,
+ "loss": 0.0673,
+ "step": 33192
+ },
+ {
+ "epoch": 90.4441416893733,
+ "grad_norm": 1.9540246725082397,
+ "learning_rate": 4.751123866128693e-07,
+ "loss": 0.0265,
+ "step": 33193
+ },
+ {
+ "epoch": 90.44686648501363,
+ "grad_norm": 1.3852287530899048,
+ "learning_rate": 4.748436390164346e-07,
+ "loss": 0.0168,
+ "step": 33194
+ },
+ {
+ "epoch": 90.44959128065395,
+ "grad_norm": 2.3974239826202393,
+ "learning_rate": 4.7457496560160966e-07,
+ "loss": 0.0339,
+ "step": 33195
+ },
+ {
+ "epoch": 90.45231607629428,
+ "grad_norm": 3.4479024410247803,
+ "learning_rate": 4.743063663704883e-07,
+ "loss": 0.0371,
+ "step": 33196
+ },
+ {
+ "epoch": 90.4550408719346,
+ "grad_norm": 2.633267402648926,
+ "learning_rate": 4.740378413251634e-07,
+ "loss": 0.0262,
+ "step": 33197
+ },
+ {
+ "epoch": 90.45776566757493,
+ "grad_norm": 2.8179562091827393,
+ "learning_rate": 4.737693904677243e-07,
+ "loss": 0.0523,
+ "step": 33198
+ },
+ {
+ "epoch": 90.46049046321527,
+ "grad_norm": 4.019863128662109,
+ "learning_rate": 4.735010138002616e-07,
+ "loss": 0.0303,
+ "step": 33199
+ },
+ {
+ "epoch": 90.46321525885558,
+ "grad_norm": 3.3150060176849365,
+ "learning_rate": 4.7323271132486805e-07,
+ "loss": 0.0812,
+ "step": 33200
+ },
+ {
+ "epoch": 90.46594005449592,
+ "grad_norm": 2.257672071456909,
+ "learning_rate": 4.7296448304363086e-07,
+ "loss": 0.1424,
+ "step": 33201
+ },
+ {
+ "epoch": 90.46866485013624,
+ "grad_norm": 1.8890174627304077,
+ "learning_rate": 4.726963289586395e-07,
+ "loss": 0.0244,
+ "step": 33202
+ },
+ {
+ "epoch": 90.47138964577657,
+ "grad_norm": 2.707345962524414,
+ "learning_rate": 4.7242824907198335e-07,
+ "loss": 0.0507,
+ "step": 33203
+ },
+ {
+ "epoch": 90.47411444141689,
+ "grad_norm": 2.1585302352905273,
+ "learning_rate": 4.721602433857497e-07,
+ "loss": 0.0332,
+ "step": 33204
+ },
+ {
+ "epoch": 90.47683923705722,
+ "grad_norm": 3.414416790008545,
+ "learning_rate": 4.7189231190202353e-07,
+ "loss": 0.0402,
+ "step": 33205
+ },
+ {
+ "epoch": 90.47956403269755,
+ "grad_norm": 3.5887913703918457,
+ "learning_rate": 4.716244546228943e-07,
+ "loss": 0.1115,
+ "step": 33206
+ },
+ {
+ "epoch": 90.48228882833787,
+ "grad_norm": 2.6446781158447266,
+ "learning_rate": 4.7135667155044807e-07,
+ "loss": 0.0781,
+ "step": 33207
+ },
+ {
+ "epoch": 90.4850136239782,
+ "grad_norm": 2.568363904953003,
+ "learning_rate": 4.710889626867687e-07,
+ "loss": 0.0355,
+ "step": 33208
+ },
+ {
+ "epoch": 90.48773841961852,
+ "grad_norm": 3.135401725769043,
+ "learning_rate": 4.7082132803394133e-07,
+ "loss": 0.1715,
+ "step": 33209
+ },
+ {
+ "epoch": 90.49046321525886,
+ "grad_norm": 2.086153030395508,
+ "learning_rate": 4.7055376759405083e-07,
+ "loss": 0.0418,
+ "step": 33210
+ },
+ {
+ "epoch": 90.49318801089919,
+ "grad_norm": 2.0694377422332764,
+ "learning_rate": 4.702862813691822e-07,
+ "loss": 0.032,
+ "step": 33211
+ },
+ {
+ "epoch": 90.49591280653951,
+ "grad_norm": 3.0108795166015625,
+ "learning_rate": 4.700188693614149e-07,
+ "loss": 0.0358,
+ "step": 33212
+ },
+ {
+ "epoch": 90.49863760217984,
+ "grad_norm": 2.128230333328247,
+ "learning_rate": 4.6975153157283624e-07,
+ "loss": 0.0269,
+ "step": 33213
+ },
+ {
+ "epoch": 90.50136239782016,
+ "grad_norm": 2.0283594131469727,
+ "learning_rate": 4.6948426800552447e-07,
+ "loss": 0.0262,
+ "step": 33214
+ },
+ {
+ "epoch": 90.50408719346049,
+ "grad_norm": 2.122006416320801,
+ "learning_rate": 4.692170786615635e-07,
+ "loss": 0.0266,
+ "step": 33215
+ },
+ {
+ "epoch": 90.50681198910081,
+ "grad_norm": 2.366952896118164,
+ "learning_rate": 4.689499635430317e-07,
+ "loss": 0.0328,
+ "step": 33216
+ },
+ {
+ "epoch": 90.50953678474114,
+ "grad_norm": 4.551375865936279,
+ "learning_rate": 4.6868292265201176e-07,
+ "loss": 0.1529,
+ "step": 33217
+ },
+ {
+ "epoch": 90.51226158038148,
+ "grad_norm": 3.2515320777893066,
+ "learning_rate": 4.684159559905821e-07,
+ "loss": 0.089,
+ "step": 33218
+ },
+ {
+ "epoch": 90.5149863760218,
+ "grad_norm": 2.7918386459350586,
+ "learning_rate": 4.681490635608232e-07,
+ "loss": 0.0421,
+ "step": 33219
+ },
+ {
+ "epoch": 90.51771117166213,
+ "grad_norm": 2.5816855430603027,
+ "learning_rate": 4.678822453648124e-07,
+ "loss": 0.1112,
+ "step": 33220
+ },
+ {
+ "epoch": 90.52043596730245,
+ "grad_norm": 3.7270753383636475,
+ "learning_rate": 4.676155014046269e-07,
+ "loss": 0.0949,
+ "step": 33221
+ },
+ {
+ "epoch": 90.52316076294278,
+ "grad_norm": 1.7641098499298096,
+ "learning_rate": 4.6734883168234603e-07,
+ "loss": 0.0251,
+ "step": 33222
+ },
+ {
+ "epoch": 90.52588555858311,
+ "grad_norm": 2.6046302318573,
+ "learning_rate": 4.67082236200046e-07,
+ "loss": 0.2202,
+ "step": 33223
+ },
+ {
+ "epoch": 90.52861035422343,
+ "grad_norm": 2.0669286251068115,
+ "learning_rate": 4.6681571495980184e-07,
+ "loss": 0.0338,
+ "step": 33224
+ },
+ {
+ "epoch": 90.53133514986376,
+ "grad_norm": 2.0476019382476807,
+ "learning_rate": 4.665492679636896e-07,
+ "loss": 0.0939,
+ "step": 33225
+ },
+ {
+ "epoch": 90.53405994550408,
+ "grad_norm": 1.4179803133010864,
+ "learning_rate": 4.6628289521378543e-07,
+ "loss": 0.0189,
+ "step": 33226
+ },
+ {
+ "epoch": 90.53678474114442,
+ "grad_norm": 1.2024822235107422,
+ "learning_rate": 4.6601659671216325e-07,
+ "loss": 0.0137,
+ "step": 33227
+ },
+ {
+ "epoch": 90.53950953678473,
+ "grad_norm": 2.3939061164855957,
+ "learning_rate": 4.6575037246089807e-07,
+ "loss": 0.0314,
+ "step": 33228
+ },
+ {
+ "epoch": 90.54223433242507,
+ "grad_norm": 3.4228403568267822,
+ "learning_rate": 4.6548422246206036e-07,
+ "loss": 0.0695,
+ "step": 33229
+ },
+ {
+ "epoch": 90.5449591280654,
+ "grad_norm": 3.3970940113067627,
+ "learning_rate": 4.6521814671772525e-07,
+ "loss": 0.0558,
+ "step": 33230
+ },
+ {
+ "epoch": 90.54768392370572,
+ "grad_norm": 2.596010446548462,
+ "learning_rate": 4.6495214522996435e-07,
+ "loss": 0.0431,
+ "step": 33231
+ },
+ {
+ "epoch": 90.55040871934605,
+ "grad_norm": 2.1344926357269287,
+ "learning_rate": 4.6468621800085043e-07,
+ "loss": 0.0554,
+ "step": 33232
+ },
+ {
+ "epoch": 90.55313351498637,
+ "grad_norm": 2.735389232635498,
+ "learning_rate": 4.644203650324508e-07,
+ "loss": 0.0426,
+ "step": 33233
+ },
+ {
+ "epoch": 90.5558583106267,
+ "grad_norm": 2.161064624786377,
+ "learning_rate": 4.641545863268393e-07,
+ "loss": 0.0639,
+ "step": 33234
+ },
+ {
+ "epoch": 90.55858310626704,
+ "grad_norm": 1.9047894477844238,
+ "learning_rate": 4.6388888188608537e-07,
+ "loss": 0.169,
+ "step": 33235
+ },
+ {
+ "epoch": 90.56130790190736,
+ "grad_norm": 2.8913934230804443,
+ "learning_rate": 4.636232517122585e-07,
+ "loss": 0.0823,
+ "step": 33236
+ },
+ {
+ "epoch": 90.56403269754769,
+ "grad_norm": 3.5276243686676025,
+ "learning_rate": 4.6335769580742594e-07,
+ "loss": 0.0984,
+ "step": 33237
+ },
+ {
+ "epoch": 90.566757493188,
+ "grad_norm": 3.1056935787200928,
+ "learning_rate": 4.6309221417365826e-07,
+ "loss": 0.0543,
+ "step": 33238
+ },
+ {
+ "epoch": 90.56948228882834,
+ "grad_norm": 2.3912622928619385,
+ "learning_rate": 4.6282680681302037e-07,
+ "loss": 0.0452,
+ "step": 33239
+ },
+ {
+ "epoch": 90.57220708446866,
+ "grad_norm": 2.9406867027282715,
+ "learning_rate": 4.6256147372758074e-07,
+ "loss": 0.0303,
+ "step": 33240
+ },
+ {
+ "epoch": 90.57493188010899,
+ "grad_norm": 2.1630442142486572,
+ "learning_rate": 4.622962149194044e-07,
+ "loss": 0.0268,
+ "step": 33241
+ },
+ {
+ "epoch": 90.57765667574932,
+ "grad_norm": 2.3760886192321777,
+ "learning_rate": 4.620310303905584e-07,
+ "loss": 0.0304,
+ "step": 33242
+ },
+ {
+ "epoch": 90.58038147138964,
+ "grad_norm": 1.802119255065918,
+ "learning_rate": 4.617659201431091e-07,
+ "loss": 0.0811,
+ "step": 33243
+ },
+ {
+ "epoch": 90.58310626702998,
+ "grad_norm": 1.9501885175704956,
+ "learning_rate": 4.6150088417911907e-07,
+ "loss": 0.0422,
+ "step": 33244
+ },
+ {
+ "epoch": 90.5858310626703,
+ "grad_norm": 2.0498251914978027,
+ "learning_rate": 4.612359225006524e-07,
+ "loss": 0.0322,
+ "step": 33245
+ },
+ {
+ "epoch": 90.58855585831063,
+ "grad_norm": 2.3923566341400146,
+ "learning_rate": 4.60971035109774e-07,
+ "loss": 0.024,
+ "step": 33246
+ },
+ {
+ "epoch": 90.59128065395096,
+ "grad_norm": 1.9519447088241577,
+ "learning_rate": 4.6070622200854673e-07,
+ "loss": 0.0396,
+ "step": 33247
+ },
+ {
+ "epoch": 90.59400544959128,
+ "grad_norm": 5.094139575958252,
+ "learning_rate": 4.6044148319903225e-07,
+ "loss": 0.0344,
+ "step": 33248
+ },
+ {
+ "epoch": 90.59673024523161,
+ "grad_norm": 1.788164496421814,
+ "learning_rate": 4.6017681868329114e-07,
+ "loss": 0.0995,
+ "step": 33249
+ },
+ {
+ "epoch": 90.59945504087193,
+ "grad_norm": 2.2989003658294678,
+ "learning_rate": 4.5991222846338724e-07,
+ "loss": 0.1095,
+ "step": 33250
+ },
+ {
+ "epoch": 90.60217983651226,
+ "grad_norm": 2.3944873809814453,
+ "learning_rate": 4.5964771254137785e-07,
+ "loss": 0.0313,
+ "step": 33251
+ },
+ {
+ "epoch": 90.60490463215258,
+ "grad_norm": 3.388947010040283,
+ "learning_rate": 4.5938327091932687e-07,
+ "loss": 0.1775,
+ "step": 33252
+ },
+ {
+ "epoch": 90.60762942779292,
+ "grad_norm": 3.04106068611145,
+ "learning_rate": 4.591189035992916e-07,
+ "loss": 0.1037,
+ "step": 33253
+ },
+ {
+ "epoch": 90.61035422343325,
+ "grad_norm": 3.9841744899749756,
+ "learning_rate": 4.5885461058333137e-07,
+ "loss": 0.0915,
+ "step": 33254
+ },
+ {
+ "epoch": 90.61307901907357,
+ "grad_norm": 2.1753439903259277,
+ "learning_rate": 4.585903918735046e-07,
+ "loss": 0.0271,
+ "step": 33255
+ },
+ {
+ "epoch": 90.6158038147139,
+ "grad_norm": 2.460171937942505,
+ "learning_rate": 4.583262474718686e-07,
+ "loss": 0.0358,
+ "step": 33256
+ },
+ {
+ "epoch": 90.61852861035422,
+ "grad_norm": 1.941246747970581,
+ "learning_rate": 4.5806217738047944e-07,
+ "loss": 0.0189,
+ "step": 33257
+ },
+ {
+ "epoch": 90.62125340599455,
+ "grad_norm": 2.2588279247283936,
+ "learning_rate": 4.5779818160139657e-07,
+ "loss": 0.0527,
+ "step": 33258
+ },
+ {
+ "epoch": 90.62397820163488,
+ "grad_norm": 2.660083293914795,
+ "learning_rate": 4.575342601366739e-07,
+ "loss": 0.1105,
+ "step": 33259
+ },
+ {
+ "epoch": 90.6267029972752,
+ "grad_norm": 2.6605067253112793,
+ "learning_rate": 4.572704129883676e-07,
+ "loss": 0.1001,
+ "step": 33260
+ },
+ {
+ "epoch": 90.62942779291554,
+ "grad_norm": 3.0070695877075195,
+ "learning_rate": 4.5700664015853045e-07,
+ "loss": 0.045,
+ "step": 33261
+ },
+ {
+ "epoch": 90.63215258855585,
+ "grad_norm": 2.5714046955108643,
+ "learning_rate": 4.567429416492208e-07,
+ "loss": 0.0329,
+ "step": 33262
+ },
+ {
+ "epoch": 90.63487738419619,
+ "grad_norm": 2.4974591732025146,
+ "learning_rate": 4.564793174624893e-07,
+ "loss": 0.0388,
+ "step": 33263
+ },
+ {
+ "epoch": 90.6376021798365,
+ "grad_norm": 2.819182872772217,
+ "learning_rate": 4.5621576760038975e-07,
+ "loss": 0.0227,
+ "step": 33264
+ },
+ {
+ "epoch": 90.64032697547684,
+ "grad_norm": 2.4309027194976807,
+ "learning_rate": 4.5595229206497283e-07,
+ "loss": 0.0433,
+ "step": 33265
+ },
+ {
+ "epoch": 90.64305177111717,
+ "grad_norm": 2.3355817794799805,
+ "learning_rate": 4.556888908582946e-07,
+ "loss": 0.0586,
+ "step": 33266
+ },
+ {
+ "epoch": 90.64577656675749,
+ "grad_norm": 3.9397144317626953,
+ "learning_rate": 4.5542556398240347e-07,
+ "loss": 0.0755,
+ "step": 33267
+ },
+ {
+ "epoch": 90.64850136239782,
+ "grad_norm": 2.4091289043426514,
+ "learning_rate": 4.5516231143935e-07,
+ "loss": 0.0391,
+ "step": 33268
+ },
+ {
+ "epoch": 90.65122615803814,
+ "grad_norm": 1.3573044538497925,
+ "learning_rate": 4.5489913323118585e-07,
+ "loss": 0.0272,
+ "step": 33269
+ },
+ {
+ "epoch": 90.65395095367847,
+ "grad_norm": 1.8493995666503906,
+ "learning_rate": 4.546360293599594e-07,
+ "loss": 0.0203,
+ "step": 33270
+ },
+ {
+ "epoch": 90.65667574931881,
+ "grad_norm": 4.400302410125732,
+ "learning_rate": 4.543729998277213e-07,
+ "loss": 0.0481,
+ "step": 33271
+ },
+ {
+ "epoch": 90.65940054495913,
+ "grad_norm": 2.390752077102661,
+ "learning_rate": 4.5411004463651877e-07,
+ "loss": 0.1424,
+ "step": 33272
+ },
+ {
+ "epoch": 90.66212534059946,
+ "grad_norm": 2.43003511428833,
+ "learning_rate": 4.538471637884001e-07,
+ "loss": 0.0527,
+ "step": 33273
+ },
+ {
+ "epoch": 90.66485013623978,
+ "grad_norm": 2.8040931224823,
+ "learning_rate": 4.535843572854115e-07,
+ "loss": 0.0502,
+ "step": 33274
+ },
+ {
+ "epoch": 90.66757493188011,
+ "grad_norm": 2.7672746181488037,
+ "learning_rate": 4.5332162512960245e-07,
+ "loss": 0.0543,
+ "step": 33275
+ },
+ {
+ "epoch": 90.67029972752043,
+ "grad_norm": 2.0645103454589844,
+ "learning_rate": 4.5305896732301566e-07,
+ "loss": 0.0863,
+ "step": 33276
+ },
+ {
+ "epoch": 90.67302452316076,
+ "grad_norm": 4.056310653686523,
+ "learning_rate": 4.527963838676985e-07,
+ "loss": 0.0236,
+ "step": 33277
+ },
+ {
+ "epoch": 90.6757493188011,
+ "grad_norm": 1.9052339792251587,
+ "learning_rate": 4.525338747656971e-07,
+ "loss": 0.0204,
+ "step": 33278
+ },
+ {
+ "epoch": 90.67847411444141,
+ "grad_norm": 3.4017715454101562,
+ "learning_rate": 4.522714400190542e-07,
+ "loss": 0.1799,
+ "step": 33279
+ },
+ {
+ "epoch": 90.68119891008175,
+ "grad_norm": 1.9250975847244263,
+ "learning_rate": 4.5200907962981376e-07,
+ "loss": 0.0192,
+ "step": 33280
+ },
+ {
+ "epoch": 90.68392370572207,
+ "grad_norm": 2.553457260131836,
+ "learning_rate": 4.517467936000186e-07,
+ "loss": 0.0503,
+ "step": 33281
+ },
+ {
+ "epoch": 90.6866485013624,
+ "grad_norm": 2.4489798545837402,
+ "learning_rate": 4.5148458193171264e-07,
+ "loss": 0.0429,
+ "step": 33282
+ },
+ {
+ "epoch": 90.68937329700273,
+ "grad_norm": 2.2490460872650146,
+ "learning_rate": 4.5122244462693865e-07,
+ "loss": 0.0753,
+ "step": 33283
+ },
+ {
+ "epoch": 90.69209809264305,
+ "grad_norm": 2.6086504459381104,
+ "learning_rate": 4.5096038168773613e-07,
+ "loss": 0.1151,
+ "step": 33284
+ },
+ {
+ "epoch": 90.69482288828338,
+ "grad_norm": 2.2189416885375977,
+ "learning_rate": 4.506983931161457e-07,
+ "loss": 0.1018,
+ "step": 33285
+ },
+ {
+ "epoch": 90.6975476839237,
+ "grad_norm": 1.7940874099731445,
+ "learning_rate": 4.5043647891420794e-07,
+ "loss": 0.0262,
+ "step": 33286
+ },
+ {
+ "epoch": 90.70027247956403,
+ "grad_norm": 1.604964256286621,
+ "learning_rate": 4.5017463908396564e-07,
+ "loss": 0.015,
+ "step": 33287
+ },
+ {
+ "epoch": 90.70299727520435,
+ "grad_norm": 2.4309797286987305,
+ "learning_rate": 4.4991287362745604e-07,
+ "loss": 0.051,
+ "step": 33288
+ },
+ {
+ "epoch": 90.70572207084469,
+ "grad_norm": 2.2586495876312256,
+ "learning_rate": 4.496511825467176e-07,
+ "loss": 0.0343,
+ "step": 33289
+ },
+ {
+ "epoch": 90.70844686648502,
+ "grad_norm": 3.711592197418213,
+ "learning_rate": 4.493895658437875e-07,
+ "loss": 0.0437,
+ "step": 33290
+ },
+ {
+ "epoch": 90.71117166212534,
+ "grad_norm": 2.5330240726470947,
+ "learning_rate": 4.4912802352070406e-07,
+ "loss": 0.0431,
+ "step": 33291
+ },
+ {
+ "epoch": 90.71389645776567,
+ "grad_norm": 2.8791136741638184,
+ "learning_rate": 4.4886655557950576e-07,
+ "loss": 0.0315,
+ "step": 33292
+ },
+ {
+ "epoch": 90.71662125340599,
+ "grad_norm": 2.8156704902648926,
+ "learning_rate": 4.486051620222265e-07,
+ "loss": 0.0554,
+ "step": 33293
+ },
+ {
+ "epoch": 90.71934604904632,
+ "grad_norm": 1.548614501953125,
+ "learning_rate": 4.4834384285090126e-07,
+ "loss": 0.027,
+ "step": 33294
+ },
+ {
+ "epoch": 90.72207084468666,
+ "grad_norm": 2.3263797760009766,
+ "learning_rate": 4.480825980675685e-07,
+ "loss": 0.0552,
+ "step": 33295
+ },
+ {
+ "epoch": 90.72479564032697,
+ "grad_norm": 1.9418562650680542,
+ "learning_rate": 4.47821427674261e-07,
+ "loss": 0.2023,
+ "step": 33296
+ },
+ {
+ "epoch": 90.7275204359673,
+ "grad_norm": 3.4640796184539795,
+ "learning_rate": 4.475603316730115e-07,
+ "loss": 0.0359,
+ "step": 33297
+ },
+ {
+ "epoch": 90.73024523160763,
+ "grad_norm": 2.2104876041412354,
+ "learning_rate": 4.4729931006585514e-07,
+ "loss": 0.0195,
+ "step": 33298
+ },
+ {
+ "epoch": 90.73297002724796,
+ "grad_norm": 2.9146504402160645,
+ "learning_rate": 4.470383628548247e-07,
+ "loss": 0.0797,
+ "step": 33299
+ },
+ {
+ "epoch": 90.73569482288828,
+ "grad_norm": 2.01104736328125,
+ "learning_rate": 4.4677749004195305e-07,
+ "loss": 0.0232,
+ "step": 33300
+ },
+ {
+ "epoch": 90.73841961852861,
+ "grad_norm": 2.4689102172851562,
+ "learning_rate": 4.4651669162926847e-07,
+ "loss": 0.0239,
+ "step": 33301
+ },
+ {
+ "epoch": 90.74114441416894,
+ "grad_norm": 2.313556671142578,
+ "learning_rate": 4.4625596761880496e-07,
+ "loss": 0.0345,
+ "step": 33302
+ },
+ {
+ "epoch": 90.74386920980926,
+ "grad_norm": 3.654481887817383,
+ "learning_rate": 4.459953180125931e-07,
+ "loss": 0.0701,
+ "step": 33303
+ },
+ {
+ "epoch": 90.7465940054496,
+ "grad_norm": 3.117694616317749,
+ "learning_rate": 4.457347428126635e-07,
+ "loss": 0.0298,
+ "step": 33304
+ },
+ {
+ "epoch": 90.74931880108991,
+ "grad_norm": 2.7887511253356934,
+ "learning_rate": 4.454742420210434e-07,
+ "loss": 0.0302,
+ "step": 33305
+ },
+ {
+ "epoch": 90.75204359673025,
+ "grad_norm": 1.46806001663208,
+ "learning_rate": 4.452138156397612e-07,
+ "loss": 0.0195,
+ "step": 33306
+ },
+ {
+ "epoch": 90.75476839237058,
+ "grad_norm": 2.515507459640503,
+ "learning_rate": 4.449534636708475e-07,
+ "loss": 0.1116,
+ "step": 33307
+ },
+ {
+ "epoch": 90.7574931880109,
+ "grad_norm": 2.274747848510742,
+ "learning_rate": 4.446931861163284e-07,
+ "loss": 0.0289,
+ "step": 33308
+ },
+ {
+ "epoch": 90.76021798365123,
+ "grad_norm": 1.96199631690979,
+ "learning_rate": 4.4443298297823124e-07,
+ "loss": 0.0757,
+ "step": 33309
+ },
+ {
+ "epoch": 90.76294277929155,
+ "grad_norm": 2.8164730072021484,
+ "learning_rate": 4.4417285425858213e-07,
+ "loss": 0.0958,
+ "step": 33310
+ },
+ {
+ "epoch": 90.76566757493188,
+ "grad_norm": 2.6038970947265625,
+ "learning_rate": 4.4391279995940727e-07,
+ "loss": 0.1446,
+ "step": 33311
+ },
+ {
+ "epoch": 90.7683923705722,
+ "grad_norm": 4.647005081176758,
+ "learning_rate": 4.436528200827328e-07,
+ "loss": 0.0769,
+ "step": 33312
+ },
+ {
+ "epoch": 90.77111716621253,
+ "grad_norm": 2.5276827812194824,
+ "learning_rate": 4.4339291463058266e-07,
+ "loss": 0.0724,
+ "step": 33313
+ },
+ {
+ "epoch": 90.77384196185287,
+ "grad_norm": 2.7569687366485596,
+ "learning_rate": 4.4313308360497855e-07,
+ "loss": 0.0411,
+ "step": 33314
+ },
+ {
+ "epoch": 90.77656675749319,
+ "grad_norm": 3.9350979328155518,
+ "learning_rate": 4.428733270079488e-07,
+ "loss": 0.0261,
+ "step": 33315
+ },
+ {
+ "epoch": 90.77929155313352,
+ "grad_norm": 3.995311737060547,
+ "learning_rate": 4.4261364484151416e-07,
+ "loss": 0.0485,
+ "step": 33316
+ },
+ {
+ "epoch": 90.78201634877384,
+ "grad_norm": 2.352081775665283,
+ "learning_rate": 4.423540371076962e-07,
+ "loss": 0.0359,
+ "step": 33317
+ },
+ {
+ "epoch": 90.78474114441417,
+ "grad_norm": 1.513340950012207,
+ "learning_rate": 4.420945038085156e-07,
+ "loss": 0.1367,
+ "step": 33318
+ },
+ {
+ "epoch": 90.7874659400545,
+ "grad_norm": 2.9075117111206055,
+ "learning_rate": 4.418350449459974e-07,
+ "loss": 0.0439,
+ "step": 33319
+ },
+ {
+ "epoch": 90.79019073569482,
+ "grad_norm": 2.7996304035186768,
+ "learning_rate": 4.4157566052215885e-07,
+ "loss": 0.0388,
+ "step": 33320
+ },
+ {
+ "epoch": 90.79291553133515,
+ "grad_norm": 2.642317533493042,
+ "learning_rate": 4.413163505390228e-07,
+ "loss": 0.0463,
+ "step": 33321
+ },
+ {
+ "epoch": 90.79564032697547,
+ "grad_norm": 2.271878957748413,
+ "learning_rate": 4.410571149986065e-07,
+ "loss": 0.0385,
+ "step": 33322
+ },
+ {
+ "epoch": 90.7983651226158,
+ "grad_norm": 3.982398271560669,
+ "learning_rate": 4.4079795390293057e-07,
+ "loss": 0.062,
+ "step": 33323
+ },
+ {
+ "epoch": 90.80108991825612,
+ "grad_norm": 2.5257749557495117,
+ "learning_rate": 4.405388672540123e-07,
+ "loss": 0.1699,
+ "step": 33324
+ },
+ {
+ "epoch": 90.80381471389646,
+ "grad_norm": 1.8141134977340698,
+ "learning_rate": 4.4027985505387005e-07,
+ "loss": 0.0563,
+ "step": 33325
+ },
+ {
+ "epoch": 90.80653950953679,
+ "grad_norm": 2.4545209407806396,
+ "learning_rate": 4.400209173045189e-07,
+ "loss": 0.061,
+ "step": 33326
+ },
+ {
+ "epoch": 90.80926430517711,
+ "grad_norm": 2.4928431510925293,
+ "learning_rate": 4.397620540079794e-07,
+ "loss": 0.1313,
+ "step": 33327
+ },
+ {
+ "epoch": 90.81198910081744,
+ "grad_norm": 2.2530672550201416,
+ "learning_rate": 4.395032651662645e-07,
+ "loss": 0.1197,
+ "step": 33328
+ },
+ {
+ "epoch": 90.81471389645776,
+ "grad_norm": 3.323392152786255,
+ "learning_rate": 4.3924455078139027e-07,
+ "loss": 0.0545,
+ "step": 33329
+ },
+ {
+ "epoch": 90.8174386920981,
+ "grad_norm": 3.538079261779785,
+ "learning_rate": 4.389859108553707e-07,
+ "loss": 0.043,
+ "step": 33330
+ },
+ {
+ "epoch": 90.82016348773843,
+ "grad_norm": 2.706392526626587,
+ "learning_rate": 4.38727345390223e-07,
+ "loss": 0.1092,
+ "step": 33331
+ },
+ {
+ "epoch": 90.82288828337875,
+ "grad_norm": 2.1860039234161377,
+ "learning_rate": 4.384688543879578e-07,
+ "loss": 0.0803,
+ "step": 33332
+ },
+ {
+ "epoch": 90.82561307901908,
+ "grad_norm": 2.5086474418640137,
+ "learning_rate": 4.382104378505903e-07,
+ "loss": 0.0513,
+ "step": 33333
+ },
+ {
+ "epoch": 90.8283378746594,
+ "grad_norm": 2.532987356185913,
+ "learning_rate": 4.3795209578013085e-07,
+ "loss": 0.0891,
+ "step": 33334
+ },
+ {
+ "epoch": 90.83106267029973,
+ "grad_norm": 3.6119742393493652,
+ "learning_rate": 4.3769382817859363e-07,
+ "loss": 0.1391,
+ "step": 33335
+ },
+ {
+ "epoch": 90.83378746594005,
+ "grad_norm": 2.609095335006714,
+ "learning_rate": 4.3743563504799027e-07,
+ "loss": 0.0496,
+ "step": 33336
+ },
+ {
+ "epoch": 90.83651226158038,
+ "grad_norm": 2.4013712406158447,
+ "learning_rate": 4.37177516390328e-07,
+ "loss": 0.0557,
+ "step": 33337
+ },
+ {
+ "epoch": 90.83923705722071,
+ "grad_norm": 2.670222043991089,
+ "learning_rate": 4.3691947220762087e-07,
+ "loss": 0.0429,
+ "step": 33338
+ },
+ {
+ "epoch": 90.84196185286103,
+ "grad_norm": 2.525219202041626,
+ "learning_rate": 4.366615025018761e-07,
+ "loss": 0.0419,
+ "step": 33339
+ },
+ {
+ "epoch": 90.84468664850137,
+ "grad_norm": 1.774667501449585,
+ "learning_rate": 4.364036072751043e-07,
+ "loss": 0.0353,
+ "step": 33340
+ },
+ {
+ "epoch": 90.84741144414168,
+ "grad_norm": 2.6277847290039062,
+ "learning_rate": 4.361457865293139e-07,
+ "loss": 0.089,
+ "step": 33341
+ },
+ {
+ "epoch": 90.85013623978202,
+ "grad_norm": 3.0051229000091553,
+ "learning_rate": 4.358880402665111e-07,
+ "loss": 0.0772,
+ "step": 33342
+ },
+ {
+ "epoch": 90.85286103542235,
+ "grad_norm": 2.5538885593414307,
+ "learning_rate": 4.3563036848870535e-07,
+ "loss": 0.0836,
+ "step": 33343
+ },
+ {
+ "epoch": 90.85558583106267,
+ "grad_norm": 2.340928077697754,
+ "learning_rate": 4.353727711979028e-07,
+ "loss": 0.0471,
+ "step": 33344
+ },
+ {
+ "epoch": 90.858310626703,
+ "grad_norm": 2.7762279510498047,
+ "learning_rate": 4.351152483961096e-07,
+ "loss": 0.0334,
+ "step": 33345
+ },
+ {
+ "epoch": 90.86103542234332,
+ "grad_norm": 3.309253215789795,
+ "learning_rate": 4.3485780008532987e-07,
+ "loss": 0.2737,
+ "step": 33346
+ },
+ {
+ "epoch": 90.86376021798365,
+ "grad_norm": 1.7336481809616089,
+ "learning_rate": 4.346004262675707e-07,
+ "loss": 0.0176,
+ "step": 33347
+ },
+ {
+ "epoch": 90.86648501362397,
+ "grad_norm": 3.786724805831909,
+ "learning_rate": 4.3434312694483504e-07,
+ "loss": 0.1904,
+ "step": 33348
+ },
+ {
+ "epoch": 90.8692098092643,
+ "grad_norm": 2.521250009536743,
+ "learning_rate": 4.3408590211912793e-07,
+ "loss": 0.0308,
+ "step": 33349
+ },
+ {
+ "epoch": 90.87193460490464,
+ "grad_norm": 4.147480010986328,
+ "learning_rate": 4.3382875179244997e-07,
+ "loss": 0.0684,
+ "step": 33350
+ },
+ {
+ "epoch": 90.87465940054496,
+ "grad_norm": 3.3927242755889893,
+ "learning_rate": 4.335716759668074e-07,
+ "loss": 0.0555,
+ "step": 33351
+ },
+ {
+ "epoch": 90.87738419618529,
+ "grad_norm": 3.3246638774871826,
+ "learning_rate": 4.3331467464420076e-07,
+ "loss": 0.0367,
+ "step": 33352
+ },
+ {
+ "epoch": 90.88010899182561,
+ "grad_norm": 3.043524742126465,
+ "learning_rate": 4.330577478266318e-07,
+ "loss": 0.0418,
+ "step": 33353
+ },
+ {
+ "epoch": 90.88283378746594,
+ "grad_norm": 2.6775705814361572,
+ "learning_rate": 4.3280089551609895e-07,
+ "loss": 0.0372,
+ "step": 33354
+ },
+ {
+ "epoch": 90.88555858310627,
+ "grad_norm": 2.337829351425171,
+ "learning_rate": 4.3254411771460616e-07,
+ "loss": 0.0257,
+ "step": 33355
+ },
+ {
+ "epoch": 90.88828337874659,
+ "grad_norm": 2.7748048305511475,
+ "learning_rate": 4.322874144241518e-07,
+ "loss": 0.0877,
+ "step": 33356
+ },
+ {
+ "epoch": 90.89100817438693,
+ "grad_norm": 2.3835325241088867,
+ "learning_rate": 4.320307856467365e-07,
+ "loss": 0.0485,
+ "step": 33357
+ },
+ {
+ "epoch": 90.89373297002724,
+ "grad_norm": 3.358006477355957,
+ "learning_rate": 4.317742313843565e-07,
+ "loss": 0.0338,
+ "step": 33358
+ },
+ {
+ "epoch": 90.89645776566758,
+ "grad_norm": 2.6560401916503906,
+ "learning_rate": 4.315177516390101e-07,
+ "loss": 0.0605,
+ "step": 33359
+ },
+ {
+ "epoch": 90.8991825613079,
+ "grad_norm": 1.7317368984222412,
+ "learning_rate": 4.312613464126958e-07,
+ "loss": 0.0275,
+ "step": 33360
+ },
+ {
+ "epoch": 90.90190735694823,
+ "grad_norm": 3.597325086593628,
+ "learning_rate": 4.310050157074108e-07,
+ "loss": 0.1089,
+ "step": 33361
+ },
+ {
+ "epoch": 90.90463215258856,
+ "grad_norm": 1.9957163333892822,
+ "learning_rate": 4.307487595251503e-07,
+ "loss": 0.0344,
+ "step": 33362
+ },
+ {
+ "epoch": 90.90735694822888,
+ "grad_norm": 2.671257734298706,
+ "learning_rate": 4.304925778679103e-07,
+ "loss": 0.029,
+ "step": 33363
+ },
+ {
+ "epoch": 90.91008174386921,
+ "grad_norm": 2.490180730819702,
+ "learning_rate": 4.3023647073768716e-07,
+ "loss": 0.0937,
+ "step": 33364
+ },
+ {
+ "epoch": 90.91280653950953,
+ "grad_norm": 3.191882848739624,
+ "learning_rate": 4.299804381364736e-07,
+ "loss": 0.0824,
+ "step": 33365
+ },
+ {
+ "epoch": 90.91553133514986,
+ "grad_norm": 2.27536678314209,
+ "learning_rate": 4.2972448006626366e-07,
+ "loss": 0.0944,
+ "step": 33366
+ },
+ {
+ "epoch": 90.9182561307902,
+ "grad_norm": 1.630289912223816,
+ "learning_rate": 4.294685965290535e-07,
+ "loss": 0.02,
+ "step": 33367
+ },
+ {
+ "epoch": 90.92098092643052,
+ "grad_norm": 2.409642219543457,
+ "learning_rate": 4.292127875268326e-07,
+ "loss": 0.054,
+ "step": 33368
+ },
+ {
+ "epoch": 90.92370572207085,
+ "grad_norm": 2.299753189086914,
+ "learning_rate": 4.2895705306159497e-07,
+ "loss": 0.0938,
+ "step": 33369
+ },
+ {
+ "epoch": 90.92643051771117,
+ "grad_norm": 2.03139066696167,
+ "learning_rate": 4.2870139313533013e-07,
+ "loss": 0.0332,
+ "step": 33370
+ },
+ {
+ "epoch": 90.9291553133515,
+ "grad_norm": 2.4000296592712402,
+ "learning_rate": 4.284458077500309e-07,
+ "loss": 0.0326,
+ "step": 33371
+ },
+ {
+ "epoch": 90.93188010899182,
+ "grad_norm": 2.0949079990386963,
+ "learning_rate": 4.2819029690768896e-07,
+ "loss": 0.0334,
+ "step": 33372
+ },
+ {
+ "epoch": 90.93460490463215,
+ "grad_norm": 1.8479863405227661,
+ "learning_rate": 4.27934860610294e-07,
+ "loss": 0.0391,
+ "step": 33373
+ },
+ {
+ "epoch": 90.93732970027249,
+ "grad_norm": 3.3907392024993896,
+ "learning_rate": 4.2767949885983316e-07,
+ "loss": 0.0548,
+ "step": 33374
+ },
+ {
+ "epoch": 90.9400544959128,
+ "grad_norm": 5.232072830200195,
+ "learning_rate": 4.27424211658295e-07,
+ "loss": 0.0527,
+ "step": 33375
+ },
+ {
+ "epoch": 90.94277929155314,
+ "grad_norm": 6.1928277015686035,
+ "learning_rate": 4.2716899900766994e-07,
+ "loss": 0.0623,
+ "step": 33376
+ },
+ {
+ "epoch": 90.94550408719346,
+ "grad_norm": 2.1101908683776855,
+ "learning_rate": 4.2691386090994545e-07,
+ "loss": 0.0787,
+ "step": 33377
+ },
+ {
+ "epoch": 90.94822888283379,
+ "grad_norm": 2.824894666671753,
+ "learning_rate": 4.266587973671077e-07,
+ "loss": 0.0559,
+ "step": 33378
+ },
+ {
+ "epoch": 90.95095367847412,
+ "grad_norm": 2.098055839538574,
+ "learning_rate": 4.264038083811417e-07,
+ "loss": 0.0314,
+ "step": 33379
+ },
+ {
+ "epoch": 90.95367847411444,
+ "grad_norm": 1.8382599353790283,
+ "learning_rate": 4.261488939540348e-07,
+ "loss": 0.0219,
+ "step": 33380
+ },
+ {
+ "epoch": 90.95640326975477,
+ "grad_norm": 1.9304697513580322,
+ "learning_rate": 4.2589405408777426e-07,
+ "loss": 0.041,
+ "step": 33381
+ },
+ {
+ "epoch": 90.95912806539509,
+ "grad_norm": 1.5916671752929688,
+ "learning_rate": 4.256392887843408e-07,
+ "loss": 0.0181,
+ "step": 33382
+ },
+ {
+ "epoch": 90.96185286103542,
+ "grad_norm": 3.523991584777832,
+ "learning_rate": 4.2538459804572053e-07,
+ "loss": 0.0605,
+ "step": 33383
+ },
+ {
+ "epoch": 90.96457765667574,
+ "grad_norm": 2.8593709468841553,
+ "learning_rate": 4.251299818738974e-07,
+ "loss": 0.0684,
+ "step": 33384
+ },
+ {
+ "epoch": 90.96730245231608,
+ "grad_norm": 1.5864038467407227,
+ "learning_rate": 4.2487544027085435e-07,
+ "loss": 0.021,
+ "step": 33385
+ },
+ {
+ "epoch": 90.97002724795641,
+ "grad_norm": 2.613136053085327,
+ "learning_rate": 4.246209732385709e-07,
+ "loss": 0.0299,
+ "step": 33386
+ },
+ {
+ "epoch": 90.97275204359673,
+ "grad_norm": 2.5730583667755127,
+ "learning_rate": 4.2436658077903316e-07,
+ "loss": 0.0347,
+ "step": 33387
+ },
+ {
+ "epoch": 90.97547683923706,
+ "grad_norm": 2.8248631954193115,
+ "learning_rate": 4.2411226289421846e-07,
+ "loss": 0.0812,
+ "step": 33388
+ },
+ {
+ "epoch": 90.97820163487738,
+ "grad_norm": 1.930606484413147,
+ "learning_rate": 4.2385801958611196e-07,
+ "loss": 0.0202,
+ "step": 33389
+ },
+ {
+ "epoch": 90.98092643051771,
+ "grad_norm": 2.477756977081299,
+ "learning_rate": 4.2360385085668976e-07,
+ "loss": 0.083,
+ "step": 33390
+ },
+ {
+ "epoch": 90.98365122615803,
+ "grad_norm": 2.007246494293213,
+ "learning_rate": 4.2334975670793145e-07,
+ "loss": 0.093,
+ "step": 33391
+ },
+ {
+ "epoch": 90.98637602179836,
+ "grad_norm": 2.4395124912261963,
+ "learning_rate": 4.2309573714181763e-07,
+ "loss": 0.0392,
+ "step": 33392
+ },
+ {
+ "epoch": 90.9891008174387,
+ "grad_norm": 1.9157994985580444,
+ "learning_rate": 4.2284179216032675e-07,
+ "loss": 0.0248,
+ "step": 33393
+ },
+ {
+ "epoch": 90.99182561307902,
+ "grad_norm": 2.822202444076538,
+ "learning_rate": 4.2258792176543604e-07,
+ "loss": 0.0293,
+ "step": 33394
+ },
+ {
+ "epoch": 90.99455040871935,
+ "grad_norm": 2.7082839012145996,
+ "learning_rate": 4.223341259591207e-07,
+ "loss": 0.1149,
+ "step": 33395
+ },
+ {
+ "epoch": 90.99727520435967,
+ "grad_norm": 1.8892465829849243,
+ "learning_rate": 4.220804047433602e-07,
+ "loss": 0.0301,
+ "step": 33396
+ },
+ {
+ "epoch": 91.0,
+ "grad_norm": 2.780186653137207,
+ "learning_rate": 4.218267581201296e-07,
+ "loss": 0.0568,
+ "step": 33397
+ },
+ {
+ "epoch": 91.00272479564033,
+ "grad_norm": 1.4437553882598877,
+ "learning_rate": 4.2157318609140407e-07,
+ "loss": 0.0134,
+ "step": 33398
+ },
+ {
+ "epoch": 91.00544959128065,
+ "grad_norm": 3.407665491104126,
+ "learning_rate": 4.213196886591564e-07,
+ "loss": 0.0875,
+ "step": 33399
+ },
+ {
+ "epoch": 91.00817438692098,
+ "grad_norm": 2.379626512527466,
+ "learning_rate": 4.2106626582536394e-07,
+ "loss": 0.0695,
+ "step": 33400
+ },
+ {
+ "epoch": 91.0108991825613,
+ "grad_norm": 2.8182828426361084,
+ "learning_rate": 4.208129175919995e-07,
+ "loss": 0.0438,
+ "step": 33401
+ },
+ {
+ "epoch": 91.01362397820164,
+ "grad_norm": 3.4735851287841797,
+ "learning_rate": 4.205596439610349e-07,
+ "loss": 0.0233,
+ "step": 33402
+ },
+ {
+ "epoch": 91.01634877384195,
+ "grad_norm": 2.151665687561035,
+ "learning_rate": 4.2030644493444294e-07,
+ "loss": 0.0711,
+ "step": 33403
+ },
+ {
+ "epoch": 91.01907356948229,
+ "grad_norm": 2.8269784450531006,
+ "learning_rate": 4.200533205141977e-07,
+ "loss": 0.0331,
+ "step": 33404
+ },
+ {
+ "epoch": 91.02179836512262,
+ "grad_norm": 2.588975191116333,
+ "learning_rate": 4.1980027070226857e-07,
+ "loss": 0.1352,
+ "step": 33405
+ },
+ {
+ "epoch": 91.02452316076294,
+ "grad_norm": 2.4744315147399902,
+ "learning_rate": 4.195472955006252e-07,
+ "loss": 0.1165,
+ "step": 33406
+ },
+ {
+ "epoch": 91.02724795640327,
+ "grad_norm": 3.606994867324829,
+ "learning_rate": 4.1929439491123936e-07,
+ "loss": 0.0979,
+ "step": 33407
+ },
+ {
+ "epoch": 91.02997275204359,
+ "grad_norm": 2.223158359527588,
+ "learning_rate": 4.190415689360816e-07,
+ "loss": 0.0704,
+ "step": 33408
+ },
+ {
+ "epoch": 91.03269754768392,
+ "grad_norm": 2.95735502243042,
+ "learning_rate": 4.187888175771193e-07,
+ "loss": 0.1644,
+ "step": 33409
+ },
+ {
+ "epoch": 91.03542234332426,
+ "grad_norm": 2.433638095855713,
+ "learning_rate": 4.1853614083632197e-07,
+ "loss": 0.144,
+ "step": 33410
+ },
+ {
+ "epoch": 91.03814713896458,
+ "grad_norm": 2.4552266597747803,
+ "learning_rate": 4.1828353871565473e-07,
+ "loss": 0.0506,
+ "step": 33411
+ },
+ {
+ "epoch": 91.04087193460491,
+ "grad_norm": 3.9573609828948975,
+ "learning_rate": 4.180310112170882e-07,
+ "loss": 0.1673,
+ "step": 33412
+ },
+ {
+ "epoch": 91.04359673024523,
+ "grad_norm": 3.0006465911865234,
+ "learning_rate": 4.177785583425886e-07,
+ "loss": 0.0325,
+ "step": 33413
+ },
+ {
+ "epoch": 91.04632152588556,
+ "grad_norm": 2.318074941635132,
+ "learning_rate": 4.1752618009412105e-07,
+ "loss": 0.1645,
+ "step": 33414
+ },
+ {
+ "epoch": 91.04904632152588,
+ "grad_norm": 3.8660340309143066,
+ "learning_rate": 4.1727387647364945e-07,
+ "loss": 0.0506,
+ "step": 33415
+ },
+ {
+ "epoch": 91.05177111716621,
+ "grad_norm": 2.045443296432495,
+ "learning_rate": 4.1702164748314236e-07,
+ "loss": 0.0262,
+ "step": 33416
+ },
+ {
+ "epoch": 91.05449591280654,
+ "grad_norm": 2.0326268672943115,
+ "learning_rate": 4.167694931245614e-07,
+ "loss": 0.0406,
+ "step": 33417
+ },
+ {
+ "epoch": 91.05722070844686,
+ "grad_norm": 2.635942220687866,
+ "learning_rate": 4.165174133998717e-07,
+ "loss": 0.0441,
+ "step": 33418
+ },
+ {
+ "epoch": 91.0599455040872,
+ "grad_norm": 2.3526809215545654,
+ "learning_rate": 4.1626540831103513e-07,
+ "loss": 0.1848,
+ "step": 33419
+ },
+ {
+ "epoch": 91.06267029972751,
+ "grad_norm": 2.0343103408813477,
+ "learning_rate": 4.1601347786001557e-07,
+ "loss": 0.0459,
+ "step": 33420
+ },
+ {
+ "epoch": 91.06539509536785,
+ "grad_norm": 2.195220947265625,
+ "learning_rate": 4.1576162204877477e-07,
+ "loss": 0.0446,
+ "step": 33421
+ },
+ {
+ "epoch": 91.06811989100818,
+ "grad_norm": 2.0926713943481445,
+ "learning_rate": 4.155098408792735e-07,
+ "loss": 0.0235,
+ "step": 33422
+ },
+ {
+ "epoch": 91.0708446866485,
+ "grad_norm": 2.789863109588623,
+ "learning_rate": 4.152581343534734e-07,
+ "loss": 0.0288,
+ "step": 33423
+ },
+ {
+ "epoch": 91.07356948228883,
+ "grad_norm": 3.174238920211792,
+ "learning_rate": 4.1500650247333294e-07,
+ "loss": 0.131,
+ "step": 33424
+ },
+ {
+ "epoch": 91.07629427792915,
+ "grad_norm": 2.6352181434631348,
+ "learning_rate": 4.1475494524081504e-07,
+ "loss": 0.1396,
+ "step": 33425
+ },
+ {
+ "epoch": 91.07901907356948,
+ "grad_norm": 2.5747056007385254,
+ "learning_rate": 4.14503462657877e-07,
+ "loss": 0.0291,
+ "step": 33426
+ },
+ {
+ "epoch": 91.0817438692098,
+ "grad_norm": 1.8077361583709717,
+ "learning_rate": 4.142520547264772e-07,
+ "loss": 0.0832,
+ "step": 33427
+ },
+ {
+ "epoch": 91.08446866485014,
+ "grad_norm": 5.838677406311035,
+ "learning_rate": 4.140007214485742e-07,
+ "loss": 0.0286,
+ "step": 33428
+ },
+ {
+ "epoch": 91.08719346049047,
+ "grad_norm": 2.1196765899658203,
+ "learning_rate": 4.1374946282612517e-07,
+ "loss": 0.0281,
+ "step": 33429
+ },
+ {
+ "epoch": 91.08991825613079,
+ "grad_norm": 2.8270084857940674,
+ "learning_rate": 4.134982788610875e-07,
+ "loss": 0.1324,
+ "step": 33430
+ },
+ {
+ "epoch": 91.09264305177112,
+ "grad_norm": 2.859435796737671,
+ "learning_rate": 4.132471695554141e-07,
+ "loss": 0.0835,
+ "step": 33431
+ },
+ {
+ "epoch": 91.09536784741144,
+ "grad_norm": 1.551326036453247,
+ "learning_rate": 4.1299613491106563e-07,
+ "loss": 0.057,
+ "step": 33432
+ },
+ {
+ "epoch": 91.09809264305177,
+ "grad_norm": 2.9040513038635254,
+ "learning_rate": 4.127451749299938e-07,
+ "loss": 0.1105,
+ "step": 33433
+ },
+ {
+ "epoch": 91.1008174386921,
+ "grad_norm": 3.816948175430298,
+ "learning_rate": 4.1249428961415485e-07,
+ "loss": 0.0303,
+ "step": 33434
+ },
+ {
+ "epoch": 91.10354223433242,
+ "grad_norm": 2.374884605407715,
+ "learning_rate": 4.122434789655005e-07,
+ "loss": 0.0507,
+ "step": 33435
+ },
+ {
+ "epoch": 91.10626702997276,
+ "grad_norm": 2.461409330368042,
+ "learning_rate": 4.11992742985986e-07,
+ "loss": 0.1273,
+ "step": 33436
+ },
+ {
+ "epoch": 91.10899182561307,
+ "grad_norm": 2.029978036880493,
+ "learning_rate": 4.1174208167756414e-07,
+ "loss": 0.0329,
+ "step": 33437
+ },
+ {
+ "epoch": 91.11171662125341,
+ "grad_norm": 2.182032823562622,
+ "learning_rate": 4.1149149504218553e-07,
+ "loss": 0.0626,
+ "step": 33438
+ },
+ {
+ "epoch": 91.11444141689373,
+ "grad_norm": 2.0493831634521484,
+ "learning_rate": 4.1124098308180204e-07,
+ "loss": 0.0948,
+ "step": 33439
+ },
+ {
+ "epoch": 91.11716621253406,
+ "grad_norm": 5.559768199920654,
+ "learning_rate": 4.109905457983643e-07,
+ "loss": 0.0607,
+ "step": 33440
+ },
+ {
+ "epoch": 91.11989100817439,
+ "grad_norm": 3.1644163131713867,
+ "learning_rate": 4.1074018319382513e-07,
+ "loss": 0.0151,
+ "step": 33441
+ },
+ {
+ "epoch": 91.12261580381471,
+ "grad_norm": 2.7557992935180664,
+ "learning_rate": 4.1048989527013306e-07,
+ "loss": 0.0219,
+ "step": 33442
+ },
+ {
+ "epoch": 91.12534059945504,
+ "grad_norm": 2.05183744430542,
+ "learning_rate": 4.102396820292376e-07,
+ "loss": 0.0322,
+ "step": 33443
+ },
+ {
+ "epoch": 91.12806539509536,
+ "grad_norm": 2.707655429840088,
+ "learning_rate": 4.0998954347308496e-07,
+ "loss": 0.0763,
+ "step": 33444
+ },
+ {
+ "epoch": 91.1307901907357,
+ "grad_norm": 4.005188941955566,
+ "learning_rate": 4.0973947960362583e-07,
+ "loss": 0.1092,
+ "step": 33445
+ },
+ {
+ "epoch": 91.13351498637603,
+ "grad_norm": 2.3927321434020996,
+ "learning_rate": 4.094894904228075e-07,
+ "loss": 0.0331,
+ "step": 33446
+ },
+ {
+ "epoch": 91.13623978201635,
+ "grad_norm": 2.6593899726867676,
+ "learning_rate": 4.0923957593257626e-07,
+ "loss": 0.1845,
+ "step": 33447
+ },
+ {
+ "epoch": 91.13896457765668,
+ "grad_norm": 5.125622749328613,
+ "learning_rate": 4.0898973613487714e-07,
+ "loss": 0.0479,
+ "step": 33448
+ },
+ {
+ "epoch": 91.141689373297,
+ "grad_norm": 2.3418519496917725,
+ "learning_rate": 4.0873997103165976e-07,
+ "loss": 0.0268,
+ "step": 33449
+ },
+ {
+ "epoch": 91.14441416893733,
+ "grad_norm": 2.0520389080047607,
+ "learning_rate": 4.084902806248647e-07,
+ "loss": 0.056,
+ "step": 33450
+ },
+ {
+ "epoch": 91.14713896457765,
+ "grad_norm": 1.4824223518371582,
+ "learning_rate": 4.0824066491643944e-07,
+ "loss": 0.0185,
+ "step": 33451
+ },
+ {
+ "epoch": 91.14986376021798,
+ "grad_norm": 1.5708297491073608,
+ "learning_rate": 4.079911239083267e-07,
+ "loss": 0.0176,
+ "step": 33452
+ },
+ {
+ "epoch": 91.15258855585832,
+ "grad_norm": 2.229505777359009,
+ "learning_rate": 4.0774165760247177e-07,
+ "loss": 0.0347,
+ "step": 33453
+ },
+ {
+ "epoch": 91.15531335149863,
+ "grad_norm": 2.8612000942230225,
+ "learning_rate": 4.0749226600081513e-07,
+ "loss": 0.1015,
+ "step": 33454
+ },
+ {
+ "epoch": 91.15803814713897,
+ "grad_norm": 6.5360002517700195,
+ "learning_rate": 4.0724294910529873e-07,
+ "loss": 0.0984,
+ "step": 33455
+ },
+ {
+ "epoch": 91.16076294277929,
+ "grad_norm": 2.2636289596557617,
+ "learning_rate": 4.069937069178675e-07,
+ "loss": 0.0405,
+ "step": 33456
+ },
+ {
+ "epoch": 91.16348773841962,
+ "grad_norm": 2.311821699142456,
+ "learning_rate": 4.06744539440459e-07,
+ "loss": 0.0265,
+ "step": 33457
+ },
+ {
+ "epoch": 91.16621253405995,
+ "grad_norm": 2.3678250312805176,
+ "learning_rate": 4.0649544667501595e-07,
+ "loss": 0.0243,
+ "step": 33458
+ },
+ {
+ "epoch": 91.16893732970027,
+ "grad_norm": 2.6175408363342285,
+ "learning_rate": 4.0624642862347796e-07,
+ "loss": 0.1141,
+ "step": 33459
+ },
+ {
+ "epoch": 91.1716621253406,
+ "grad_norm": 2.510948896408081,
+ "learning_rate": 4.059974852877824e-07,
+ "loss": 0.0226,
+ "step": 33460
+ },
+ {
+ "epoch": 91.17438692098092,
+ "grad_norm": 5.691770553588867,
+ "learning_rate": 4.057486166698721e-07,
+ "loss": 0.0702,
+ "step": 33461
+ },
+ {
+ "epoch": 91.17711171662125,
+ "grad_norm": 2.44684100151062,
+ "learning_rate": 4.054998227716822e-07,
+ "loss": 0.0304,
+ "step": 33462
+ },
+ {
+ "epoch": 91.17983651226157,
+ "grad_norm": 5.354679584503174,
+ "learning_rate": 4.0525110359515005e-07,
+ "loss": 0.0891,
+ "step": 33463
+ },
+ {
+ "epoch": 91.1825613079019,
+ "grad_norm": 2.2572429180145264,
+ "learning_rate": 4.0500245914221303e-07,
+ "loss": 0.0472,
+ "step": 33464
+ },
+ {
+ "epoch": 91.18528610354224,
+ "grad_norm": 2.445316791534424,
+ "learning_rate": 4.0475388941480955e-07,
+ "loss": 0.099,
+ "step": 33465
+ },
+ {
+ "epoch": 91.18801089918256,
+ "grad_norm": 2.737708568572998,
+ "learning_rate": 4.045053944148736e-07,
+ "loss": 0.1087,
+ "step": 33466
+ },
+ {
+ "epoch": 91.19073569482289,
+ "grad_norm": 7.153319835662842,
+ "learning_rate": 4.0425697414434027e-07,
+ "loss": 0.0616,
+ "step": 33467
+ },
+ {
+ "epoch": 91.19346049046321,
+ "grad_norm": 3.299309730529785,
+ "learning_rate": 4.0400862860514366e-07,
+ "loss": 0.0564,
+ "step": 33468
+ },
+ {
+ "epoch": 91.19618528610354,
+ "grad_norm": 1.737561583518982,
+ "learning_rate": 4.037603577992211e-07,
+ "loss": 0.0378,
+ "step": 33469
+ },
+ {
+ "epoch": 91.19891008174388,
+ "grad_norm": 3.6247615814208984,
+ "learning_rate": 4.035121617285032e-07,
+ "loss": 0.1782,
+ "step": 33470
+ },
+ {
+ "epoch": 91.2016348773842,
+ "grad_norm": 1.6658930778503418,
+ "learning_rate": 4.0326404039492283e-07,
+ "loss": 0.0205,
+ "step": 33471
+ },
+ {
+ "epoch": 91.20435967302453,
+ "grad_norm": 2.3101959228515625,
+ "learning_rate": 4.030159938004141e-07,
+ "loss": 0.052,
+ "step": 33472
+ },
+ {
+ "epoch": 91.20708446866485,
+ "grad_norm": 3.1363327503204346,
+ "learning_rate": 4.027680219469088e-07,
+ "loss": 0.0296,
+ "step": 33473
+ },
+ {
+ "epoch": 91.20980926430518,
+ "grad_norm": 2.6599698066711426,
+ "learning_rate": 4.025201248363353e-07,
+ "loss": 0.0759,
+ "step": 33474
+ },
+ {
+ "epoch": 91.2125340599455,
+ "grad_norm": 3.1961421966552734,
+ "learning_rate": 4.0227230247062765e-07,
+ "loss": 0.0918,
+ "step": 33475
+ },
+ {
+ "epoch": 91.21525885558583,
+ "grad_norm": 2.746758222579956,
+ "learning_rate": 4.020245548517132e-07,
+ "loss": 0.0485,
+ "step": 33476
+ },
+ {
+ "epoch": 91.21798365122616,
+ "grad_norm": 1.916736125946045,
+ "learning_rate": 4.017768819815238e-07,
+ "loss": 0.0269,
+ "step": 33477
+ },
+ {
+ "epoch": 91.22070844686648,
+ "grad_norm": 2.2074666023254395,
+ "learning_rate": 4.0152928386198775e-07,
+ "loss": 0.0681,
+ "step": 33478
+ },
+ {
+ "epoch": 91.22343324250681,
+ "grad_norm": 2.259948968887329,
+ "learning_rate": 4.0128176049503145e-07,
+ "loss": 0.0316,
+ "step": 33479
+ },
+ {
+ "epoch": 91.22615803814713,
+ "grad_norm": 2.186495780944824,
+ "learning_rate": 4.0103431188258324e-07,
+ "loss": 0.0496,
+ "step": 33480
+ },
+ {
+ "epoch": 91.22888283378747,
+ "grad_norm": 2.4739370346069336,
+ "learning_rate": 4.0078693802657273e-07,
+ "loss": 0.0324,
+ "step": 33481
+ },
+ {
+ "epoch": 91.2316076294278,
+ "grad_norm": 2.4121856689453125,
+ "learning_rate": 4.00539638928924e-07,
+ "loss": 0.0351,
+ "step": 33482
+ },
+ {
+ "epoch": 91.23433242506812,
+ "grad_norm": 1.9716999530792236,
+ "learning_rate": 4.002924145915632e-07,
+ "loss": 0.0273,
+ "step": 33483
+ },
+ {
+ "epoch": 91.23705722070845,
+ "grad_norm": 8.593786239624023,
+ "learning_rate": 4.000452650164155e-07,
+ "loss": 0.0512,
+ "step": 33484
+ },
+ {
+ "epoch": 91.23978201634877,
+ "grad_norm": 2.205383777618408,
+ "learning_rate": 3.997981902054071e-07,
+ "loss": 0.0648,
+ "step": 33485
+ },
+ {
+ "epoch": 91.2425068119891,
+ "grad_norm": 2.3848838806152344,
+ "learning_rate": 3.9955119016046206e-07,
+ "loss": 0.0469,
+ "step": 33486
+ },
+ {
+ "epoch": 91.24523160762942,
+ "grad_norm": 2.675579071044922,
+ "learning_rate": 3.9930426488350215e-07,
+ "loss": 0.0393,
+ "step": 33487
+ },
+ {
+ "epoch": 91.24795640326975,
+ "grad_norm": 2.5658624172210693,
+ "learning_rate": 3.990574143764514e-07,
+ "loss": 0.061,
+ "step": 33488
+ },
+ {
+ "epoch": 91.25068119891009,
+ "grad_norm": 4.218019485473633,
+ "learning_rate": 3.988106386412338e-07,
+ "loss": 0.1922,
+ "step": 33489
+ },
+ {
+ "epoch": 91.2534059945504,
+ "grad_norm": 4.758276462554932,
+ "learning_rate": 3.9856393767976896e-07,
+ "loss": 0.0652,
+ "step": 33490
+ },
+ {
+ "epoch": 91.25613079019074,
+ "grad_norm": 2.8237547874450684,
+ "learning_rate": 3.983173114939798e-07,
+ "loss": 0.147,
+ "step": 33491
+ },
+ {
+ "epoch": 91.25885558583106,
+ "grad_norm": 3.6301066875457764,
+ "learning_rate": 3.980707600857847e-07,
+ "loss": 0.0747,
+ "step": 33492
+ },
+ {
+ "epoch": 91.26158038147139,
+ "grad_norm": 3.5691137313842773,
+ "learning_rate": 3.9782428345710665e-07,
+ "loss": 0.0587,
+ "step": 33493
+ },
+ {
+ "epoch": 91.26430517711172,
+ "grad_norm": 1.843849778175354,
+ "learning_rate": 3.9757788160986524e-07,
+ "loss": 0.0175,
+ "step": 33494
+ },
+ {
+ "epoch": 91.26702997275204,
+ "grad_norm": 2.163905143737793,
+ "learning_rate": 3.9733155454597774e-07,
+ "loss": 0.0555,
+ "step": 33495
+ },
+ {
+ "epoch": 91.26975476839237,
+ "grad_norm": 2.266207456588745,
+ "learning_rate": 3.970853022673615e-07,
+ "loss": 0.0617,
+ "step": 33496
+ },
+ {
+ "epoch": 91.2724795640327,
+ "grad_norm": 2.2678987979888916,
+ "learning_rate": 3.9683912477593734e-07,
+ "loss": 0.1042,
+ "step": 33497
+ },
+ {
+ "epoch": 91.27520435967303,
+ "grad_norm": 3.014303684234619,
+ "learning_rate": 3.965930220736203e-07,
+ "loss": 0.099,
+ "step": 33498
+ },
+ {
+ "epoch": 91.27792915531334,
+ "grad_norm": 2.7640128135681152,
+ "learning_rate": 3.963469941623288e-07,
+ "loss": 0.0359,
+ "step": 33499
+ },
+ {
+ "epoch": 91.28065395095368,
+ "grad_norm": 3.1587300300598145,
+ "learning_rate": 3.9610104104397586e-07,
+ "loss": 0.0582,
+ "step": 33500
+ },
+ {
+ "epoch": 91.28337874659401,
+ "grad_norm": 2.873241901397705,
+ "learning_rate": 3.9585516272047984e-07,
+ "loss": 0.051,
+ "step": 33501
+ },
+ {
+ "epoch": 91.28610354223433,
+ "grad_norm": 1.3458555936813354,
+ "learning_rate": 3.9560935919375597e-07,
+ "loss": 0.0152,
+ "step": 33502
+ },
+ {
+ "epoch": 91.28882833787466,
+ "grad_norm": 1.8848713636398315,
+ "learning_rate": 3.95363630465716e-07,
+ "loss": 0.0282,
+ "step": 33503
+ },
+ {
+ "epoch": 91.29155313351498,
+ "grad_norm": 3.7567384243011475,
+ "learning_rate": 3.95117976538274e-07,
+ "loss": 0.0269,
+ "step": 33504
+ },
+ {
+ "epoch": 91.29427792915531,
+ "grad_norm": 1.807776689529419,
+ "learning_rate": 3.9487239741334615e-07,
+ "loss": 0.0602,
+ "step": 33505
+ },
+ {
+ "epoch": 91.29700272479565,
+ "grad_norm": 2.626446485519409,
+ "learning_rate": 3.946268930928421e-07,
+ "loss": 0.035,
+ "step": 33506
+ },
+ {
+ "epoch": 91.29972752043597,
+ "grad_norm": 2.3312532901763916,
+ "learning_rate": 3.9438146357867467e-07,
+ "loss": 0.0379,
+ "step": 33507
+ },
+ {
+ "epoch": 91.3024523160763,
+ "grad_norm": 2.165179967880249,
+ "learning_rate": 3.9413610887275466e-07,
+ "loss": 0.0512,
+ "step": 33508
+ },
+ {
+ "epoch": 91.30517711171662,
+ "grad_norm": 6.76454496383667,
+ "learning_rate": 3.938908289769927e-07,
+ "loss": 0.0985,
+ "step": 33509
+ },
+ {
+ "epoch": 91.30790190735695,
+ "grad_norm": 1.9388389587402344,
+ "learning_rate": 3.9364562389330174e-07,
+ "loss": 0.0325,
+ "step": 33510
+ },
+ {
+ "epoch": 91.31062670299727,
+ "grad_norm": 3.389204978942871,
+ "learning_rate": 3.934004936235891e-07,
+ "loss": 0.1059,
+ "step": 33511
+ },
+ {
+ "epoch": 91.3133514986376,
+ "grad_norm": 3.885791540145874,
+ "learning_rate": 3.9315543816976444e-07,
+ "loss": 0.1031,
+ "step": 33512
+ },
+ {
+ "epoch": 91.31607629427793,
+ "grad_norm": 5.326609134674072,
+ "learning_rate": 3.92910457533735e-07,
+ "loss": 0.0411,
+ "step": 33513
+ },
+ {
+ "epoch": 91.31880108991825,
+ "grad_norm": 3.149608850479126,
+ "learning_rate": 3.926655517174105e-07,
+ "loss": 0.0509,
+ "step": 33514
+ },
+ {
+ "epoch": 91.32152588555859,
+ "grad_norm": 2.390986919403076,
+ "learning_rate": 3.924207207226971e-07,
+ "loss": 0.0467,
+ "step": 33515
+ },
+ {
+ "epoch": 91.3242506811989,
+ "grad_norm": 4.05216121673584,
+ "learning_rate": 3.9217596455150107e-07,
+ "loss": 0.0544,
+ "step": 33516
+ },
+ {
+ "epoch": 91.32697547683924,
+ "grad_norm": 2.684932231903076,
+ "learning_rate": 3.9193128320573095e-07,
+ "loss": 0.036,
+ "step": 33517
+ },
+ {
+ "epoch": 91.32970027247957,
+ "grad_norm": 3.469726085662842,
+ "learning_rate": 3.916866766872907e-07,
+ "loss": 0.0539,
+ "step": 33518
+ },
+ {
+ "epoch": 91.33242506811989,
+ "grad_norm": 4.65806245803833,
+ "learning_rate": 3.914421449980854e-07,
+ "loss": 0.1012,
+ "step": 33519
+ },
+ {
+ "epoch": 91.33514986376022,
+ "grad_norm": 1.6177089214324951,
+ "learning_rate": 3.9119768814001813e-07,
+ "loss": 0.0148,
+ "step": 33520
+ },
+ {
+ "epoch": 91.33787465940054,
+ "grad_norm": 2.87542462348938,
+ "learning_rate": 3.9095330611499506e-07,
+ "loss": 0.0337,
+ "step": 33521
+ },
+ {
+ "epoch": 91.34059945504087,
+ "grad_norm": 2.579695701599121,
+ "learning_rate": 3.90708998924918e-07,
+ "loss": 0.0322,
+ "step": 33522
+ },
+ {
+ "epoch": 91.34332425068119,
+ "grad_norm": 1.7988877296447754,
+ "learning_rate": 3.9046476657168985e-07,
+ "loss": 0.018,
+ "step": 33523
+ },
+ {
+ "epoch": 91.34604904632153,
+ "grad_norm": 4.781064510345459,
+ "learning_rate": 3.9022060905721246e-07,
+ "loss": 0.1467,
+ "step": 33524
+ },
+ {
+ "epoch": 91.34877384196186,
+ "grad_norm": 3.165649652481079,
+ "learning_rate": 3.8997652638338876e-07,
+ "loss": 0.0347,
+ "step": 33525
+ },
+ {
+ "epoch": 91.35149863760218,
+ "grad_norm": 2.6371865272521973,
+ "learning_rate": 3.8973251855211726e-07,
+ "loss": 0.0762,
+ "step": 33526
+ },
+ {
+ "epoch": 91.35422343324251,
+ "grad_norm": 1.6691075563430786,
+ "learning_rate": 3.8948858556530077e-07,
+ "loss": 0.1173,
+ "step": 33527
+ },
+ {
+ "epoch": 91.35694822888283,
+ "grad_norm": 2.2323529720306396,
+ "learning_rate": 3.8924472742483785e-07,
+ "loss": 0.0237,
+ "step": 33528
+ },
+ {
+ "epoch": 91.35967302452316,
+ "grad_norm": 2.1835381984710693,
+ "learning_rate": 3.890009441326259e-07,
+ "loss": 0.1515,
+ "step": 33529
+ },
+ {
+ "epoch": 91.3623978201635,
+ "grad_norm": 1.8728735446929932,
+ "learning_rate": 3.887572356905678e-07,
+ "loss": 0.096,
+ "step": 33530
+ },
+ {
+ "epoch": 91.36512261580381,
+ "grad_norm": 2.2562313079833984,
+ "learning_rate": 3.8851360210055755e-07,
+ "loss": 0.0289,
+ "step": 33531
+ },
+ {
+ "epoch": 91.36784741144415,
+ "grad_norm": 2.5280210971832275,
+ "learning_rate": 3.882700433644948e-07,
+ "loss": 0.0519,
+ "step": 33532
+ },
+ {
+ "epoch": 91.37057220708446,
+ "grad_norm": 2.778721809387207,
+ "learning_rate": 3.880265594842747e-07,
+ "loss": 0.0577,
+ "step": 33533
+ },
+ {
+ "epoch": 91.3732970027248,
+ "grad_norm": 3.2019004821777344,
+ "learning_rate": 3.877831504617946e-07,
+ "loss": 0.0572,
+ "step": 33534
+ },
+ {
+ "epoch": 91.37602179836512,
+ "grad_norm": 2.290388584136963,
+ "learning_rate": 3.8753981629895076e-07,
+ "loss": 0.0806,
+ "step": 33535
+ },
+ {
+ "epoch": 91.37874659400545,
+ "grad_norm": 8.816770553588867,
+ "learning_rate": 3.8729655699763613e-07,
+ "loss": 0.0885,
+ "step": 33536
+ },
+ {
+ "epoch": 91.38147138964578,
+ "grad_norm": 3.0813393592834473,
+ "learning_rate": 3.8705337255974697e-07,
+ "loss": 0.0245,
+ "step": 33537
+ },
+ {
+ "epoch": 91.3841961852861,
+ "grad_norm": 2.967586040496826,
+ "learning_rate": 3.8681026298717836e-07,
+ "loss": 0.0285,
+ "step": 33538
+ },
+ {
+ "epoch": 91.38692098092643,
+ "grad_norm": 2.6449077129364014,
+ "learning_rate": 3.8656722828182115e-07,
+ "loss": 0.0307,
+ "step": 33539
+ },
+ {
+ "epoch": 91.38964577656675,
+ "grad_norm": 2.673945426940918,
+ "learning_rate": 3.86324268445567e-07,
+ "loss": 0.0283,
+ "step": 33540
+ },
+ {
+ "epoch": 91.39237057220708,
+ "grad_norm": 3.387751579284668,
+ "learning_rate": 3.860813834803123e-07,
+ "loss": 0.0396,
+ "step": 33541
+ },
+ {
+ "epoch": 91.39509536784742,
+ "grad_norm": 2.536093235015869,
+ "learning_rate": 3.858385733879455e-07,
+ "loss": 0.0341,
+ "step": 33542
+ },
+ {
+ "epoch": 91.39782016348774,
+ "grad_norm": 2.1067984104156494,
+ "learning_rate": 3.855958381703584e-07,
+ "loss": 0.0208,
+ "step": 33543
+ },
+ {
+ "epoch": 91.40054495912807,
+ "grad_norm": 2.023822069168091,
+ "learning_rate": 3.853531778294417e-07,
+ "loss": 0.024,
+ "step": 33544
+ },
+ {
+ "epoch": 91.40326975476839,
+ "grad_norm": 14.900796890258789,
+ "learning_rate": 3.851105923670839e-07,
+ "loss": 0.024,
+ "step": 33545
+ },
+ {
+ "epoch": 91.40599455040872,
+ "grad_norm": 1.3199199438095093,
+ "learning_rate": 3.848680817851769e-07,
+ "loss": 0.0131,
+ "step": 33546
+ },
+ {
+ "epoch": 91.40871934604904,
+ "grad_norm": 2.8630051612854004,
+ "learning_rate": 3.8462564608560793e-07,
+ "loss": 0.0668,
+ "step": 33547
+ },
+ {
+ "epoch": 91.41144414168937,
+ "grad_norm": 2.70255970954895,
+ "learning_rate": 3.8438328527026445e-07,
+ "loss": 0.1183,
+ "step": 33548
+ },
+ {
+ "epoch": 91.4141689373297,
+ "grad_norm": 1.9144985675811768,
+ "learning_rate": 3.8414099934103386e-07,
+ "loss": 0.0836,
+ "step": 33549
+ },
+ {
+ "epoch": 91.41689373297002,
+ "grad_norm": 1.8344573974609375,
+ "learning_rate": 3.8389878829980465e-07,
+ "loss": 0.028,
+ "step": 33550
+ },
+ {
+ "epoch": 91.41961852861036,
+ "grad_norm": 2.180424690246582,
+ "learning_rate": 3.836566521484619e-07,
+ "loss": 0.0435,
+ "step": 33551
+ },
+ {
+ "epoch": 91.42234332425068,
+ "grad_norm": 2.846090793609619,
+ "learning_rate": 3.83414590888892e-07,
+ "loss": 0.0677,
+ "step": 33552
+ },
+ {
+ "epoch": 91.42506811989101,
+ "grad_norm": 3.0681021213531494,
+ "learning_rate": 3.8317260452297776e-07,
+ "loss": 0.051,
+ "step": 33553
+ },
+ {
+ "epoch": 91.42779291553134,
+ "grad_norm": 2.614234447479248,
+ "learning_rate": 3.8293069305260776e-07,
+ "loss": 0.0422,
+ "step": 33554
+ },
+ {
+ "epoch": 91.43051771117166,
+ "grad_norm": 2.4826254844665527,
+ "learning_rate": 3.826888564796638e-07,
+ "loss": 0.1028,
+ "step": 33555
+ },
+ {
+ "epoch": 91.433242506812,
+ "grad_norm": 2.5016932487487793,
+ "learning_rate": 3.824470948060299e-07,
+ "loss": 0.031,
+ "step": 33556
+ },
+ {
+ "epoch": 91.43596730245231,
+ "grad_norm": 1.9077481031417847,
+ "learning_rate": 3.8220540803358687e-07,
+ "loss": 0.0524,
+ "step": 33557
+ },
+ {
+ "epoch": 91.43869209809264,
+ "grad_norm": 2.917414426803589,
+ "learning_rate": 3.8196379616421975e-07,
+ "loss": 0.1687,
+ "step": 33558
+ },
+ {
+ "epoch": 91.44141689373296,
+ "grad_norm": 2.3211934566497803,
+ "learning_rate": 3.817222591998093e-07,
+ "loss": 0.0548,
+ "step": 33559
+ },
+ {
+ "epoch": 91.4441416893733,
+ "grad_norm": 1.7042837142944336,
+ "learning_rate": 3.8148079714223407e-07,
+ "loss": 0.018,
+ "step": 33560
+ },
+ {
+ "epoch": 91.44686648501363,
+ "grad_norm": 3.297069549560547,
+ "learning_rate": 3.812394099933781e-07,
+ "loss": 0.0708,
+ "step": 33561
+ },
+ {
+ "epoch": 91.44959128065395,
+ "grad_norm": 2.1418566703796387,
+ "learning_rate": 3.809980977551209e-07,
+ "loss": 0.041,
+ "step": 33562
+ },
+ {
+ "epoch": 91.45231607629428,
+ "grad_norm": 1.7914178371429443,
+ "learning_rate": 3.80756860429341e-07,
+ "loss": 0.0184,
+ "step": 33563
+ },
+ {
+ "epoch": 91.4550408719346,
+ "grad_norm": 2.666574239730835,
+ "learning_rate": 3.80515698017917e-07,
+ "loss": 0.168,
+ "step": 33564
+ },
+ {
+ "epoch": 91.45776566757493,
+ "grad_norm": 2.6954071521759033,
+ "learning_rate": 3.802746105227251e-07,
+ "loss": 0.0319,
+ "step": 33565
+ },
+ {
+ "epoch": 91.46049046321527,
+ "grad_norm": 2.6725752353668213,
+ "learning_rate": 3.800335979456471e-07,
+ "loss": 0.0334,
+ "step": 33566
+ },
+ {
+ "epoch": 91.46321525885558,
+ "grad_norm": 2.1421608924865723,
+ "learning_rate": 3.797926602885582e-07,
+ "loss": 0.0235,
+ "step": 33567
+ },
+ {
+ "epoch": 91.46594005449592,
+ "grad_norm": 2.6930532455444336,
+ "learning_rate": 3.795517975533336e-07,
+ "loss": 0.0431,
+ "step": 33568
+ },
+ {
+ "epoch": 91.46866485013624,
+ "grad_norm": 1.8473962545394897,
+ "learning_rate": 3.7931100974184843e-07,
+ "loss": 0.0312,
+ "step": 33569
+ },
+ {
+ "epoch": 91.47138964577657,
+ "grad_norm": 2.257495641708374,
+ "learning_rate": 3.790702968559812e-07,
+ "loss": 0.0495,
+ "step": 33570
+ },
+ {
+ "epoch": 91.47411444141689,
+ "grad_norm": 5.894565105438232,
+ "learning_rate": 3.788296588976048e-07,
+ "loss": 0.1056,
+ "step": 33571
+ },
+ {
+ "epoch": 91.47683923705722,
+ "grad_norm": 1.855755090713501,
+ "learning_rate": 3.785890958685945e-07,
+ "loss": 0.024,
+ "step": 33572
+ },
+ {
+ "epoch": 91.47956403269755,
+ "grad_norm": 1.4998773336410522,
+ "learning_rate": 3.783486077708198e-07,
+ "loss": 0.0202,
+ "step": 33573
+ },
+ {
+ "epoch": 91.48228882833787,
+ "grad_norm": 2.37126088142395,
+ "learning_rate": 3.781081946061582e-07,
+ "loss": 0.075,
+ "step": 33574
+ },
+ {
+ "epoch": 91.4850136239782,
+ "grad_norm": 2.227522373199463,
+ "learning_rate": 3.778678563764804e-07,
+ "loss": 0.0289,
+ "step": 33575
+ },
+ {
+ "epoch": 91.48773841961852,
+ "grad_norm": 2.0605151653289795,
+ "learning_rate": 3.7762759308365814e-07,
+ "loss": 0.0328,
+ "step": 33576
+ },
+ {
+ "epoch": 91.49046321525886,
+ "grad_norm": 3.265958786010742,
+ "learning_rate": 3.7738740472956115e-07,
+ "loss": 0.0554,
+ "step": 33577
+ },
+ {
+ "epoch": 91.49318801089919,
+ "grad_norm": 2.8525846004486084,
+ "learning_rate": 3.771472913160612e-07,
+ "loss": 0.0791,
+ "step": 33578
+ },
+ {
+ "epoch": 91.49591280653951,
+ "grad_norm": 2.7092018127441406,
+ "learning_rate": 3.769072528450302e-07,
+ "loss": 0.1028,
+ "step": 33579
+ },
+ {
+ "epoch": 91.49863760217984,
+ "grad_norm": 2.29067325592041,
+ "learning_rate": 3.766672893183354e-07,
+ "loss": 0.0203,
+ "step": 33580
+ },
+ {
+ "epoch": 91.50136239782016,
+ "grad_norm": 1.9763702154159546,
+ "learning_rate": 3.7642740073784435e-07,
+ "loss": 0.0196,
+ "step": 33581
+ },
+ {
+ "epoch": 91.50408719346049,
+ "grad_norm": 4.412403583526611,
+ "learning_rate": 3.761875871054288e-07,
+ "loss": 0.046,
+ "step": 33582
+ },
+ {
+ "epoch": 91.50681198910081,
+ "grad_norm": 2.6487820148468018,
+ "learning_rate": 3.7594784842295505e-07,
+ "loss": 0.1694,
+ "step": 33583
+ },
+ {
+ "epoch": 91.50953678474114,
+ "grad_norm": 4.80283260345459,
+ "learning_rate": 3.7570818469228834e-07,
+ "loss": 0.1223,
+ "step": 33584
+ },
+ {
+ "epoch": 91.51226158038148,
+ "grad_norm": 2.7220542430877686,
+ "learning_rate": 3.754685959152971e-07,
+ "loss": 0.1134,
+ "step": 33585
+ },
+ {
+ "epoch": 91.5149863760218,
+ "grad_norm": 3.8485357761383057,
+ "learning_rate": 3.7522908209384644e-07,
+ "loss": 0.2028,
+ "step": 33586
+ },
+ {
+ "epoch": 91.51771117166213,
+ "grad_norm": 2.6554503440856934,
+ "learning_rate": 3.749896432298017e-07,
+ "loss": 0.1133,
+ "step": 33587
+ },
+ {
+ "epoch": 91.52043596730245,
+ "grad_norm": 2.0981926918029785,
+ "learning_rate": 3.7475027932502904e-07,
+ "loss": 0.0922,
+ "step": 33588
+ },
+ {
+ "epoch": 91.52316076294278,
+ "grad_norm": 3.087574005126953,
+ "learning_rate": 3.7451099038138926e-07,
+ "loss": 0.0973,
+ "step": 33589
+ },
+ {
+ "epoch": 91.52588555858311,
+ "grad_norm": 3.2297282218933105,
+ "learning_rate": 3.742717764007497e-07,
+ "loss": 0.0312,
+ "step": 33590
+ },
+ {
+ "epoch": 91.52861035422343,
+ "grad_norm": 3.242899179458618,
+ "learning_rate": 3.740326373849723e-07,
+ "loss": 0.0356,
+ "step": 33591
+ },
+ {
+ "epoch": 91.53133514986376,
+ "grad_norm": 2.4582908153533936,
+ "learning_rate": 3.737935733359177e-07,
+ "loss": 0.0553,
+ "step": 33592
+ },
+ {
+ "epoch": 91.53405994550408,
+ "grad_norm": 3.2118515968322754,
+ "learning_rate": 3.735545842554489e-07,
+ "loss": 0.1782,
+ "step": 33593
+ },
+ {
+ "epoch": 91.53678474114442,
+ "grad_norm": 2.3374011516571045,
+ "learning_rate": 3.733156701454277e-07,
+ "loss": 0.0223,
+ "step": 33594
+ },
+ {
+ "epoch": 91.53950953678473,
+ "grad_norm": 1.7692631483078003,
+ "learning_rate": 3.7307683100771377e-07,
+ "loss": 0.0255,
+ "step": 33595
+ },
+ {
+ "epoch": 91.54223433242507,
+ "grad_norm": 2.864637851715088,
+ "learning_rate": 3.7283806684416777e-07,
+ "loss": 0.0542,
+ "step": 33596
+ },
+ {
+ "epoch": 91.5449591280654,
+ "grad_norm": 3.0823960304260254,
+ "learning_rate": 3.7259937765664943e-07,
+ "loss": 0.0928,
+ "step": 33597
+ },
+ {
+ "epoch": 91.54768392370572,
+ "grad_norm": 2.6931047439575195,
+ "learning_rate": 3.7236076344701613e-07,
+ "loss": 0.0545,
+ "step": 33598
+ },
+ {
+ "epoch": 91.55040871934605,
+ "grad_norm": 3.286928415298462,
+ "learning_rate": 3.721222242171285e-07,
+ "loss": 0.1571,
+ "step": 33599
+ },
+ {
+ "epoch": 91.55313351498637,
+ "grad_norm": 2.4106199741363525,
+ "learning_rate": 3.7188375996884295e-07,
+ "loss": 0.027,
+ "step": 33600
+ },
+ {
+ "epoch": 91.5558583106267,
+ "grad_norm": 2.004592180252075,
+ "learning_rate": 3.7164537070401573e-07,
+ "loss": 0.0409,
+ "step": 33601
+ },
+ {
+ "epoch": 91.55858310626704,
+ "grad_norm": 2.57600998878479,
+ "learning_rate": 3.7140705642450647e-07,
+ "loss": 0.0441,
+ "step": 33602
+ },
+ {
+ "epoch": 91.56130790190736,
+ "grad_norm": 3.2495641708374023,
+ "learning_rate": 3.711688171321681e-07,
+ "loss": 0.0579,
+ "step": 33603
+ },
+ {
+ "epoch": 91.56403269754769,
+ "grad_norm": 2.7735214233398438,
+ "learning_rate": 3.709306528288581e-07,
+ "loss": 0.1541,
+ "step": 33604
+ },
+ {
+ "epoch": 91.566757493188,
+ "grad_norm": 2.1506876945495605,
+ "learning_rate": 3.7069256351642823e-07,
+ "loss": 0.0256,
+ "step": 33605
+ },
+ {
+ "epoch": 91.56948228882834,
+ "grad_norm": 1.6449873447418213,
+ "learning_rate": 3.7045454919673597e-07,
+ "loss": 0.0372,
+ "step": 33606
+ },
+ {
+ "epoch": 91.57220708446866,
+ "grad_norm": 2.3814804553985596,
+ "learning_rate": 3.702166098716342e-07,
+ "loss": 0.0548,
+ "step": 33607
+ },
+ {
+ "epoch": 91.57493188010899,
+ "grad_norm": 2.2766847610473633,
+ "learning_rate": 3.6997874554297484e-07,
+ "loss": 0.0293,
+ "step": 33608
+ },
+ {
+ "epoch": 91.57765667574932,
+ "grad_norm": 2.326969861984253,
+ "learning_rate": 3.697409562126109e-07,
+ "loss": 0.0851,
+ "step": 33609
+ },
+ {
+ "epoch": 91.58038147138964,
+ "grad_norm": 2.594961166381836,
+ "learning_rate": 3.6950324188239517e-07,
+ "loss": 0.0711,
+ "step": 33610
+ },
+ {
+ "epoch": 91.58310626702998,
+ "grad_norm": 3.5385637283325195,
+ "learning_rate": 3.6926560255417745e-07,
+ "loss": 0.0458,
+ "step": 33611
+ },
+ {
+ "epoch": 91.5858310626703,
+ "grad_norm": 2.9375243186950684,
+ "learning_rate": 3.690280382298095e-07,
+ "loss": 0.11,
+ "step": 33612
+ },
+ {
+ "epoch": 91.58855585831063,
+ "grad_norm": 2.3595938682556152,
+ "learning_rate": 3.68790548911141e-07,
+ "loss": 0.1431,
+ "step": 33613
+ },
+ {
+ "epoch": 91.59128065395096,
+ "grad_norm": 3.097893238067627,
+ "learning_rate": 3.685531346000215e-07,
+ "loss": 0.1205,
+ "step": 33614
+ },
+ {
+ "epoch": 91.59400544959128,
+ "grad_norm": 2.1998302936553955,
+ "learning_rate": 3.6831579529830076e-07,
+ "loss": 0.0663,
+ "step": 33615
+ },
+ {
+ "epoch": 91.59673024523161,
+ "grad_norm": 2.487896203994751,
+ "learning_rate": 3.680785310078272e-07,
+ "loss": 0.0908,
+ "step": 33616
+ },
+ {
+ "epoch": 91.59945504087193,
+ "grad_norm": 2.552617311477661,
+ "learning_rate": 3.6784134173044716e-07,
+ "loss": 0.1584,
+ "step": 33617
+ },
+ {
+ "epoch": 91.60217983651226,
+ "grad_norm": 3.077333688735962,
+ "learning_rate": 3.6760422746800806e-07,
+ "loss": 0.0641,
+ "step": 33618
+ },
+ {
+ "epoch": 91.60490463215258,
+ "grad_norm": 2.582639455795288,
+ "learning_rate": 3.673671882223595e-07,
+ "loss": 0.0266,
+ "step": 33619
+ },
+ {
+ "epoch": 91.60762942779292,
+ "grad_norm": 1.9093434810638428,
+ "learning_rate": 3.671302239953434e-07,
+ "loss": 0.0241,
+ "step": 33620
+ },
+ {
+ "epoch": 91.61035422343325,
+ "grad_norm": 2.607896566390991,
+ "learning_rate": 3.6689333478880816e-07,
+ "loss": 0.0547,
+ "step": 33621
+ },
+ {
+ "epoch": 91.61307901907357,
+ "grad_norm": 2.725715398788452,
+ "learning_rate": 3.6665652060459576e-07,
+ "loss": 0.0311,
+ "step": 33622
+ },
+ {
+ "epoch": 91.6158038147139,
+ "grad_norm": 3.2464728355407715,
+ "learning_rate": 3.664197814445547e-07,
+ "loss": 0.0368,
+ "step": 33623
+ },
+ {
+ "epoch": 91.61852861035422,
+ "grad_norm": 2.1419646739959717,
+ "learning_rate": 3.661831173105257e-07,
+ "loss": 0.0655,
+ "step": 33624
+ },
+ {
+ "epoch": 91.62125340599455,
+ "grad_norm": 2.5510311126708984,
+ "learning_rate": 3.6594652820435064e-07,
+ "loss": 0.0382,
+ "step": 33625
+ },
+ {
+ "epoch": 91.62397820163488,
+ "grad_norm": 3.1216113567352295,
+ "learning_rate": 3.657100141278758e-07,
+ "loss": 0.1129,
+ "step": 33626
+ },
+ {
+ "epoch": 91.6267029972752,
+ "grad_norm": 2.985828399658203,
+ "learning_rate": 3.654735750829408e-07,
+ "loss": 0.0323,
+ "step": 33627
+ },
+ {
+ "epoch": 91.62942779291554,
+ "grad_norm": 2.9723455905914307,
+ "learning_rate": 3.652372110713887e-07,
+ "loss": 0.0374,
+ "step": 33628
+ },
+ {
+ "epoch": 91.63215258855585,
+ "grad_norm": 1.8881319761276245,
+ "learning_rate": 3.650009220950568e-07,
+ "loss": 0.0244,
+ "step": 33629
+ },
+ {
+ "epoch": 91.63487738419619,
+ "grad_norm": 3.5544631481170654,
+ "learning_rate": 3.647647081557881e-07,
+ "loss": 0.0679,
+ "step": 33630
+ },
+ {
+ "epoch": 91.6376021798365,
+ "grad_norm": 2.0359060764312744,
+ "learning_rate": 3.6452856925542235e-07,
+ "loss": 0.1462,
+ "step": 33631
+ },
+ {
+ "epoch": 91.64032697547684,
+ "grad_norm": 5.320764541625977,
+ "learning_rate": 3.642925053957991e-07,
+ "loss": 0.0766,
+ "step": 33632
+ },
+ {
+ "epoch": 91.64305177111717,
+ "grad_norm": 3.1832618713378906,
+ "learning_rate": 3.6405651657875464e-07,
+ "loss": 0.1352,
+ "step": 33633
+ },
+ {
+ "epoch": 91.64577656675749,
+ "grad_norm": 2.471998929977417,
+ "learning_rate": 3.638206028061264e-07,
+ "loss": 0.0287,
+ "step": 33634
+ },
+ {
+ "epoch": 91.64850136239782,
+ "grad_norm": 2.826984405517578,
+ "learning_rate": 3.635847640797552e-07,
+ "loss": 0.0576,
+ "step": 33635
+ },
+ {
+ "epoch": 91.65122615803814,
+ "grad_norm": 2.281329393386841,
+ "learning_rate": 3.6334900040147615e-07,
+ "loss": 0.0428,
+ "step": 33636
+ },
+ {
+ "epoch": 91.65395095367847,
+ "grad_norm": 2.644656181335449,
+ "learning_rate": 3.6311331177312447e-07,
+ "loss": 0.0397,
+ "step": 33637
+ },
+ {
+ "epoch": 91.65667574931881,
+ "grad_norm": 2.2187631130218506,
+ "learning_rate": 3.628776981965343e-07,
+ "loss": 0.0267,
+ "step": 33638
+ },
+ {
+ "epoch": 91.65940054495913,
+ "grad_norm": 3.246809720993042,
+ "learning_rate": 3.626421596735441e-07,
+ "loss": 0.1343,
+ "step": 33639
+ },
+ {
+ "epoch": 91.66212534059946,
+ "grad_norm": 3.6670730113983154,
+ "learning_rate": 3.624066962059869e-07,
+ "loss": 0.0282,
+ "step": 33640
+ },
+ {
+ "epoch": 91.66485013623978,
+ "grad_norm": 2.6588709354400635,
+ "learning_rate": 3.6217130779569565e-07,
+ "loss": 0.1344,
+ "step": 33641
+ },
+ {
+ "epoch": 91.66757493188011,
+ "grad_norm": 2.7214791774749756,
+ "learning_rate": 3.6193599444450335e-07,
+ "loss": 0.0726,
+ "step": 33642
+ },
+ {
+ "epoch": 91.67029972752043,
+ "grad_norm": 2.9262428283691406,
+ "learning_rate": 3.6170075615424407e-07,
+ "loss": 0.0926,
+ "step": 33643
+ },
+ {
+ "epoch": 91.67302452316076,
+ "grad_norm": 2.1330814361572266,
+ "learning_rate": 3.6146559292674967e-07,
+ "loss": 0.0458,
+ "step": 33644
+ },
+ {
+ "epoch": 91.6757493188011,
+ "grad_norm": 5.586047172546387,
+ "learning_rate": 3.612305047638487e-07,
+ "loss": 0.0862,
+ "step": 33645
+ },
+ {
+ "epoch": 91.67847411444141,
+ "grad_norm": 4.77297306060791,
+ "learning_rate": 3.6099549166737527e-07,
+ "loss": 0.0338,
+ "step": 33646
+ },
+ {
+ "epoch": 91.68119891008175,
+ "grad_norm": 2.5954415798187256,
+ "learning_rate": 3.6076055363916005e-07,
+ "loss": 0.0248,
+ "step": 33647
+ },
+ {
+ "epoch": 91.68392370572207,
+ "grad_norm": 1.8317947387695312,
+ "learning_rate": 3.605256906810306e-07,
+ "loss": 0.053,
+ "step": 33648
+ },
+ {
+ "epoch": 91.6866485013624,
+ "grad_norm": 2.3642208576202393,
+ "learning_rate": 3.602909027948176e-07,
+ "loss": 0.0615,
+ "step": 33649
+ },
+ {
+ "epoch": 91.68937329700273,
+ "grad_norm": 1.713407278060913,
+ "learning_rate": 3.6005618998234736e-07,
+ "loss": 0.02,
+ "step": 33650
+ },
+ {
+ "epoch": 91.69209809264305,
+ "grad_norm": 2.612757682800293,
+ "learning_rate": 3.598215522454507e-07,
+ "loss": 0.0179,
+ "step": 33651
+ },
+ {
+ "epoch": 91.69482288828338,
+ "grad_norm": 2.575063467025757,
+ "learning_rate": 3.595869895859527e-07,
+ "loss": 0.0919,
+ "step": 33652
+ },
+ {
+ "epoch": 91.6975476839237,
+ "grad_norm": 3.129669189453125,
+ "learning_rate": 3.593525020056821e-07,
+ "loss": 0.0883,
+ "step": 33653
+ },
+ {
+ "epoch": 91.70027247956403,
+ "grad_norm": 2.1432507038116455,
+ "learning_rate": 3.5911808950646165e-07,
+ "loss": 0.0318,
+ "step": 33654
+ },
+ {
+ "epoch": 91.70299727520435,
+ "grad_norm": 2.2757797241210938,
+ "learning_rate": 3.588837520901212e-07,
+ "loss": 0.0857,
+ "step": 33655
+ },
+ {
+ "epoch": 91.70572207084469,
+ "grad_norm": 1.5385581254959106,
+ "learning_rate": 3.586494897584836e-07,
+ "loss": 0.0671,
+ "step": 33656
+ },
+ {
+ "epoch": 91.70844686648502,
+ "grad_norm": 2.107974052429199,
+ "learning_rate": 3.5841530251337297e-07,
+ "loss": 0.034,
+ "step": 33657
+ },
+ {
+ "epoch": 91.71117166212534,
+ "grad_norm": 1.6791565418243408,
+ "learning_rate": 3.581811903566135e-07,
+ "loss": 0.0604,
+ "step": 33658
+ },
+ {
+ "epoch": 91.71389645776567,
+ "grad_norm": 2.79116153717041,
+ "learning_rate": 3.5794715329002805e-07,
+ "loss": 0.0358,
+ "step": 33659
+ },
+ {
+ "epoch": 91.71662125340599,
+ "grad_norm": 1.8962323665618896,
+ "learning_rate": 3.577131913154419e-07,
+ "loss": 0.0316,
+ "step": 33660
+ },
+ {
+ "epoch": 91.71934604904632,
+ "grad_norm": 3.239900827407837,
+ "learning_rate": 3.574793044346736e-07,
+ "loss": 0.0465,
+ "step": 33661
+ },
+ {
+ "epoch": 91.72207084468666,
+ "grad_norm": 2.495074510574341,
+ "learning_rate": 3.57245492649545e-07,
+ "loss": 0.0499,
+ "step": 33662
+ },
+ {
+ "epoch": 91.72479564032697,
+ "grad_norm": 1.73086416721344,
+ "learning_rate": 3.570117559618802e-07,
+ "loss": 0.0188,
+ "step": 33663
+ },
+ {
+ "epoch": 91.7275204359673,
+ "grad_norm": 2.6486928462982178,
+ "learning_rate": 3.5677809437349554e-07,
+ "loss": 0.0922,
+ "step": 33664
+ },
+ {
+ "epoch": 91.73024523160763,
+ "grad_norm": 4.095842361450195,
+ "learning_rate": 3.565445078862151e-07,
+ "loss": 0.0817,
+ "step": 33665
+ },
+ {
+ "epoch": 91.73297002724796,
+ "grad_norm": 2.5894007682800293,
+ "learning_rate": 3.5631099650185294e-07,
+ "loss": 0.1523,
+ "step": 33666
+ },
+ {
+ "epoch": 91.73569482288828,
+ "grad_norm": 3.8926684856414795,
+ "learning_rate": 3.5607756022223216e-07,
+ "loss": 0.0471,
+ "step": 33667
+ },
+ {
+ "epoch": 91.73841961852861,
+ "grad_norm": 1.8081189393997192,
+ "learning_rate": 3.55844199049169e-07,
+ "loss": 0.0228,
+ "step": 33668
+ },
+ {
+ "epoch": 91.74114441416894,
+ "grad_norm": 2.48095703125,
+ "learning_rate": 3.556109129844809e-07,
+ "loss": 0.0646,
+ "step": 33669
+ },
+ {
+ "epoch": 91.74386920980926,
+ "grad_norm": 1.7749342918395996,
+ "learning_rate": 3.5537770202998314e-07,
+ "loss": 0.0618,
+ "step": 33670
+ },
+ {
+ "epoch": 91.7465940054496,
+ "grad_norm": 2.6271684169769287,
+ "learning_rate": 3.551445661874953e-07,
+ "loss": 0.0256,
+ "step": 33671
+ },
+ {
+ "epoch": 91.74931880108991,
+ "grad_norm": 2.2914161682128906,
+ "learning_rate": 3.5491150545883034e-07,
+ "loss": 0.0509,
+ "step": 33672
+ },
+ {
+ "epoch": 91.75204359673025,
+ "grad_norm": 2.0748889446258545,
+ "learning_rate": 3.546785198458047e-07,
+ "loss": 0.0317,
+ "step": 33673
+ },
+ {
+ "epoch": 91.75476839237058,
+ "grad_norm": 3.947211742401123,
+ "learning_rate": 3.544456093502313e-07,
+ "loss": 0.0782,
+ "step": 33674
+ },
+ {
+ "epoch": 91.7574931880109,
+ "grad_norm": 3.420990228652954,
+ "learning_rate": 3.542127739739254e-07,
+ "loss": 0.1598,
+ "step": 33675
+ },
+ {
+ "epoch": 91.76021798365123,
+ "grad_norm": 2.767961263656616,
+ "learning_rate": 3.5398001371870104e-07,
+ "loss": 0.1616,
+ "step": 33676
+ },
+ {
+ "epoch": 91.76294277929155,
+ "grad_norm": 2.000896692276001,
+ "learning_rate": 3.537473285863691e-07,
+ "loss": 0.0293,
+ "step": 33677
+ },
+ {
+ "epoch": 91.76566757493188,
+ "grad_norm": 2.8828723430633545,
+ "learning_rate": 3.535147185787413e-07,
+ "loss": 0.0387,
+ "step": 33678
+ },
+ {
+ "epoch": 91.7683923705722,
+ "grad_norm": 2.0531177520751953,
+ "learning_rate": 3.532821836976319e-07,
+ "loss": 0.0248,
+ "step": 33679
+ },
+ {
+ "epoch": 91.77111716621253,
+ "grad_norm": 2.825890064239502,
+ "learning_rate": 3.530497239448505e-07,
+ "loss": 0.0398,
+ "step": 33680
+ },
+ {
+ "epoch": 91.77384196185287,
+ "grad_norm": 3.0841400623321533,
+ "learning_rate": 3.5281733932220566e-07,
+ "loss": 0.079,
+ "step": 33681
+ },
+ {
+ "epoch": 91.77656675749319,
+ "grad_norm": 2.8627307415008545,
+ "learning_rate": 3.525850298315103e-07,
+ "loss": 0.0676,
+ "step": 33682
+ },
+ {
+ "epoch": 91.77929155313352,
+ "grad_norm": 2.518963575363159,
+ "learning_rate": 3.523527954745709e-07,
+ "loss": 0.0749,
+ "step": 33683
+ },
+ {
+ "epoch": 91.78201634877384,
+ "grad_norm": 3.7561941146850586,
+ "learning_rate": 3.5212063625319925e-07,
+ "loss": 0.102,
+ "step": 33684
+ },
+ {
+ "epoch": 91.78474114441417,
+ "grad_norm": 1.9617749452590942,
+ "learning_rate": 3.518885521692006e-07,
+ "loss": 0.0882,
+ "step": 33685
+ },
+ {
+ "epoch": 91.7874659400545,
+ "grad_norm": 2.847410202026367,
+ "learning_rate": 3.516565432243824e-07,
+ "loss": 0.0457,
+ "step": 33686
+ },
+ {
+ "epoch": 91.79019073569482,
+ "grad_norm": 2.5235135555267334,
+ "learning_rate": 3.5142460942055424e-07,
+ "loss": 0.0293,
+ "step": 33687
+ },
+ {
+ "epoch": 91.79291553133515,
+ "grad_norm": 1.7744661569595337,
+ "learning_rate": 3.511927507595203e-07,
+ "loss": 0.0175,
+ "step": 33688
+ },
+ {
+ "epoch": 91.79564032697547,
+ "grad_norm": 3.418145179748535,
+ "learning_rate": 3.5096096724308694e-07,
+ "loss": 0.1074,
+ "step": 33689
+ },
+ {
+ "epoch": 91.7983651226158,
+ "grad_norm": 3.91782283782959,
+ "learning_rate": 3.507292588730582e-07,
+ "loss": 0.0572,
+ "step": 33690
+ },
+ {
+ "epoch": 91.80108991825612,
+ "grad_norm": 2.7733798027038574,
+ "learning_rate": 3.5049762565123936e-07,
+ "loss": 0.0856,
+ "step": 33691
+ },
+ {
+ "epoch": 91.80381471389646,
+ "grad_norm": 2.2111968994140625,
+ "learning_rate": 3.502660675794356e-07,
+ "loss": 0.0317,
+ "step": 33692
+ },
+ {
+ "epoch": 91.80653950953679,
+ "grad_norm": 2.8142967224121094,
+ "learning_rate": 3.5003458465944884e-07,
+ "loss": 0.0327,
+ "step": 33693
+ },
+ {
+ "epoch": 91.80926430517711,
+ "grad_norm": 3.807567596435547,
+ "learning_rate": 3.4980317689308094e-07,
+ "loss": 0.0731,
+ "step": 33694
+ },
+ {
+ "epoch": 91.81198910081744,
+ "grad_norm": 2.0858969688415527,
+ "learning_rate": 3.495718442821361e-07,
+ "loss": 0.0324,
+ "step": 33695
+ },
+ {
+ "epoch": 91.81471389645776,
+ "grad_norm": 3.3685550689697266,
+ "learning_rate": 3.493405868284161e-07,
+ "loss": 0.0615,
+ "step": 33696
+ },
+ {
+ "epoch": 91.8174386920981,
+ "grad_norm": 2.0874626636505127,
+ "learning_rate": 3.491094045337196e-07,
+ "loss": 0.0597,
+ "step": 33697
+ },
+ {
+ "epoch": 91.82016348773843,
+ "grad_norm": 2.850393295288086,
+ "learning_rate": 3.4887829739984836e-07,
+ "loss": 0.0755,
+ "step": 33698
+ },
+ {
+ "epoch": 91.82288828337875,
+ "grad_norm": 2.832606792449951,
+ "learning_rate": 3.486472654286022e-07,
+ "loss": 0.0285,
+ "step": 33699
+ },
+ {
+ "epoch": 91.82561307901908,
+ "grad_norm": 2.2394144535064697,
+ "learning_rate": 3.484163086217818e-07,
+ "loss": 0.0505,
+ "step": 33700
+ },
+ {
+ "epoch": 91.8283378746594,
+ "grad_norm": 2.5283920764923096,
+ "learning_rate": 3.481854269811835e-07,
+ "loss": 0.0438,
+ "step": 33701
+ },
+ {
+ "epoch": 91.83106267029973,
+ "grad_norm": 2.624202251434326,
+ "learning_rate": 3.4795462050860704e-07,
+ "loss": 0.0469,
+ "step": 33702
+ },
+ {
+ "epoch": 91.83378746594005,
+ "grad_norm": 2.273449182510376,
+ "learning_rate": 3.4772388920584877e-07,
+ "loss": 0.0507,
+ "step": 33703
+ },
+ {
+ "epoch": 91.83651226158038,
+ "grad_norm": 2.364443063735962,
+ "learning_rate": 3.4749323307470717e-07,
+ "loss": 0.0252,
+ "step": 33704
+ },
+ {
+ "epoch": 91.83923705722071,
+ "grad_norm": 1.9928584098815918,
+ "learning_rate": 3.472626521169775e-07,
+ "loss": 0.027,
+ "step": 33705
+ },
+ {
+ "epoch": 91.84196185286103,
+ "grad_norm": 1.871195912361145,
+ "learning_rate": 3.4703214633445504e-07,
+ "loss": 0.0257,
+ "step": 33706
+ },
+ {
+ "epoch": 91.84468664850137,
+ "grad_norm": 3.812786102294922,
+ "learning_rate": 3.4680171572893494e-07,
+ "loss": 0.0723,
+ "step": 33707
+ },
+ {
+ "epoch": 91.84741144414168,
+ "grad_norm": 1.8385227918624878,
+ "learning_rate": 3.465713603022136e-07,
+ "loss": 0.0223,
+ "step": 33708
+ },
+ {
+ "epoch": 91.85013623978202,
+ "grad_norm": 2.821190357208252,
+ "learning_rate": 3.463410800560829e-07,
+ "loss": 0.0453,
+ "step": 33709
+ },
+ {
+ "epoch": 91.85286103542235,
+ "grad_norm": 1.599543809890747,
+ "learning_rate": 3.4611087499233696e-07,
+ "loss": 0.0168,
+ "step": 33710
+ },
+ {
+ "epoch": 91.85558583106267,
+ "grad_norm": 3.0530357360839844,
+ "learning_rate": 3.458807451127699e-07,
+ "loss": 0.1428,
+ "step": 33711
+ },
+ {
+ "epoch": 91.858310626703,
+ "grad_norm": 2.7457163333892822,
+ "learning_rate": 3.4565069041917256e-07,
+ "loss": 0.0344,
+ "step": 33712
+ },
+ {
+ "epoch": 91.86103542234332,
+ "grad_norm": 3.1225500106811523,
+ "learning_rate": 3.4542071091333674e-07,
+ "loss": 0.0873,
+ "step": 33713
+ },
+ {
+ "epoch": 91.86376021798365,
+ "grad_norm": 2.1477506160736084,
+ "learning_rate": 3.451908065970533e-07,
+ "loss": 0.0194,
+ "step": 33714
+ },
+ {
+ "epoch": 91.86648501362397,
+ "grad_norm": 2.862032175064087,
+ "learning_rate": 3.44960977472113e-07,
+ "loss": 0.0379,
+ "step": 33715
+ },
+ {
+ "epoch": 91.8692098092643,
+ "grad_norm": 2.6753666400909424,
+ "learning_rate": 3.4473122354030663e-07,
+ "loss": 0.0976,
+ "step": 33716
+ },
+ {
+ "epoch": 91.87193460490464,
+ "grad_norm": 2.248840093612671,
+ "learning_rate": 3.445015448034228e-07,
+ "loss": 0.0481,
+ "step": 33717
+ },
+ {
+ "epoch": 91.87465940054496,
+ "grad_norm": 3.4635705947875977,
+ "learning_rate": 3.4427194126325006e-07,
+ "loss": 0.0485,
+ "step": 33718
+ },
+ {
+ "epoch": 91.87738419618529,
+ "grad_norm": 3.2419512271881104,
+ "learning_rate": 3.4404241292157583e-07,
+ "loss": 0.0752,
+ "step": 33719
+ },
+ {
+ "epoch": 91.88010899182561,
+ "grad_norm": 2.5881309509277344,
+ "learning_rate": 3.438129597801898e-07,
+ "loss": 0.0365,
+ "step": 33720
+ },
+ {
+ "epoch": 91.88283378746594,
+ "grad_norm": 1.7208349704742432,
+ "learning_rate": 3.4358358184087727e-07,
+ "loss": 0.0199,
+ "step": 33721
+ },
+ {
+ "epoch": 91.88555858310627,
+ "grad_norm": 2.5771822929382324,
+ "learning_rate": 3.433542791054245e-07,
+ "loss": 0.0535,
+ "step": 33722
+ },
+ {
+ "epoch": 91.88828337874659,
+ "grad_norm": 3.0956103801727295,
+ "learning_rate": 3.4312505157561794e-07,
+ "loss": 0.0918,
+ "step": 33723
+ },
+ {
+ "epoch": 91.89100817438693,
+ "grad_norm": 4.567342758178711,
+ "learning_rate": 3.428958992532427e-07,
+ "loss": 0.0456,
+ "step": 33724
+ },
+ {
+ "epoch": 91.89373297002724,
+ "grad_norm": 2.660275936126709,
+ "learning_rate": 3.4266682214008416e-07,
+ "loss": 0.0622,
+ "step": 33725
+ },
+ {
+ "epoch": 91.89645776566758,
+ "grad_norm": 2.371448278427124,
+ "learning_rate": 3.424378202379253e-07,
+ "loss": 0.1388,
+ "step": 33726
+ },
+ {
+ "epoch": 91.8991825613079,
+ "grad_norm": 2.8419129848480225,
+ "learning_rate": 3.422088935485479e-07,
+ "loss": 0.0684,
+ "step": 33727
+ },
+ {
+ "epoch": 91.90190735694823,
+ "grad_norm": 2.1045830249786377,
+ "learning_rate": 3.419800420737396e-07,
+ "loss": 0.0243,
+ "step": 33728
+ },
+ {
+ "epoch": 91.90463215258856,
+ "grad_norm": 2.5817203521728516,
+ "learning_rate": 3.4175126581527883e-07,
+ "loss": 0.0577,
+ "step": 33729
+ },
+ {
+ "epoch": 91.90735694822888,
+ "grad_norm": 3.000640869140625,
+ "learning_rate": 3.4152256477494874e-07,
+ "loss": 0.0625,
+ "step": 33730
+ },
+ {
+ "epoch": 91.91008174386921,
+ "grad_norm": 2.578950881958008,
+ "learning_rate": 3.412939389545289e-07,
+ "loss": 0.0262,
+ "step": 33731
+ },
+ {
+ "epoch": 91.91280653950953,
+ "grad_norm": 3.0867624282836914,
+ "learning_rate": 3.410653883558002e-07,
+ "loss": 0.0719,
+ "step": 33732
+ },
+ {
+ "epoch": 91.91553133514986,
+ "grad_norm": 3.0393404960632324,
+ "learning_rate": 3.4083691298054556e-07,
+ "loss": 0.0374,
+ "step": 33733
+ },
+ {
+ "epoch": 91.9182561307902,
+ "grad_norm": 1.9768339395523071,
+ "learning_rate": 3.406085128305414e-07,
+ "loss": 0.1099,
+ "step": 33734
+ },
+ {
+ "epoch": 91.92098092643052,
+ "grad_norm": 1.7287859916687012,
+ "learning_rate": 3.4038018790756634e-07,
+ "loss": 0.0207,
+ "step": 33735
+ },
+ {
+ "epoch": 91.92370572207085,
+ "grad_norm": 2.799020290374756,
+ "learning_rate": 3.401519382134011e-07,
+ "loss": 0.026,
+ "step": 33736
+ },
+ {
+ "epoch": 91.92643051771117,
+ "grad_norm": 2.3542044162750244,
+ "learning_rate": 3.3992376374982097e-07,
+ "loss": 0.0261,
+ "step": 33737
+ },
+ {
+ "epoch": 91.9291553133515,
+ "grad_norm": 2.599226236343384,
+ "learning_rate": 3.396956645186045e-07,
+ "loss": 0.1167,
+ "step": 33738
+ },
+ {
+ "epoch": 91.93188010899182,
+ "grad_norm": 3.9881465435028076,
+ "learning_rate": 3.3946764052152583e-07,
+ "loss": 0.0425,
+ "step": 33739
+ },
+ {
+ "epoch": 91.93460490463215,
+ "grad_norm": 2.5314364433288574,
+ "learning_rate": 3.392396917603624e-07,
+ "loss": 0.096,
+ "step": 33740
+ },
+ {
+ "epoch": 91.93732970027249,
+ "grad_norm": 3.1245369911193848,
+ "learning_rate": 3.3901181823689065e-07,
+ "loss": 0.1295,
+ "step": 33741
+ },
+ {
+ "epoch": 91.9400544959128,
+ "grad_norm": 2.1980035305023193,
+ "learning_rate": 3.3878401995288357e-07,
+ "loss": 0.0631,
+ "step": 33742
+ },
+ {
+ "epoch": 91.94277929155314,
+ "grad_norm": 4.632396221160889,
+ "learning_rate": 3.385562969101142e-07,
+ "loss": 0.0321,
+ "step": 33743
+ },
+ {
+ "epoch": 91.94550408719346,
+ "grad_norm": 2.9690186977386475,
+ "learning_rate": 3.3832864911035877e-07,
+ "loss": 0.0629,
+ "step": 33744
+ },
+ {
+ "epoch": 91.94822888283379,
+ "grad_norm": 4.375700950622559,
+ "learning_rate": 3.3810107655538826e-07,
+ "loss": 0.0235,
+ "step": 33745
+ },
+ {
+ "epoch": 91.95095367847412,
+ "grad_norm": 2.0469024181365967,
+ "learning_rate": 3.378735792469756e-07,
+ "loss": 0.1086,
+ "step": 33746
+ },
+ {
+ "epoch": 91.95367847411444,
+ "grad_norm": 2.8312370777130127,
+ "learning_rate": 3.3764615718689273e-07,
+ "loss": 0.039,
+ "step": 33747
+ },
+ {
+ "epoch": 91.95640326975477,
+ "grad_norm": 2.2449893951416016,
+ "learning_rate": 3.374188103769105e-07,
+ "loss": 0.0656,
+ "step": 33748
+ },
+ {
+ "epoch": 91.95912806539509,
+ "grad_norm": 1.5328950881958008,
+ "learning_rate": 3.3719153881879963e-07,
+ "loss": 0.0206,
+ "step": 33749
+ },
+ {
+ "epoch": 91.96185286103542,
+ "grad_norm": 2.7683541774749756,
+ "learning_rate": 3.3696434251432984e-07,
+ "loss": 0.0481,
+ "step": 33750
+ },
+ {
+ "epoch": 91.96457765667574,
+ "grad_norm": 2.1966023445129395,
+ "learning_rate": 3.3673722146526976e-07,
+ "loss": 0.0204,
+ "step": 33751
+ },
+ {
+ "epoch": 91.96730245231608,
+ "grad_norm": 2.9148166179656982,
+ "learning_rate": 3.365101756733913e-07,
+ "loss": 0.138,
+ "step": 33752
+ },
+ {
+ "epoch": 91.97002724795641,
+ "grad_norm": 1.3568527698516846,
+ "learning_rate": 3.3628320514045963e-07,
+ "loss": 0.0172,
+ "step": 33753
+ },
+ {
+ "epoch": 91.97275204359673,
+ "grad_norm": 2.014632225036621,
+ "learning_rate": 3.3605630986824346e-07,
+ "loss": 0.0262,
+ "step": 33754
+ },
+ {
+ "epoch": 91.97547683923706,
+ "grad_norm": 2.359649181365967,
+ "learning_rate": 3.3582948985850904e-07,
+ "loss": 0.0657,
+ "step": 33755
+ },
+ {
+ "epoch": 91.97820163487738,
+ "grad_norm": 2.4967103004455566,
+ "learning_rate": 3.35602745113025e-07,
+ "loss": 0.0798,
+ "step": 33756
+ },
+ {
+ "epoch": 91.98092643051771,
+ "grad_norm": 3.5767691135406494,
+ "learning_rate": 3.3537607563355447e-07,
+ "loss": 0.1311,
+ "step": 33757
+ },
+ {
+ "epoch": 91.98365122615803,
+ "grad_norm": 2.6671438217163086,
+ "learning_rate": 3.3514948142186476e-07,
+ "loss": 0.0781,
+ "step": 33758
+ },
+ {
+ "epoch": 91.98637602179836,
+ "grad_norm": 2.795790195465088,
+ "learning_rate": 3.34922962479719e-07,
+ "loss": 0.0394,
+ "step": 33759
+ },
+ {
+ "epoch": 91.9891008174387,
+ "grad_norm": 2.46382737159729,
+ "learning_rate": 3.3469651880888245e-07,
+ "loss": 0.0613,
+ "step": 33760
+ },
+ {
+ "epoch": 91.99182561307902,
+ "grad_norm": 2.0662951469421387,
+ "learning_rate": 3.344701504111192e-07,
+ "loss": 0.0232,
+ "step": 33761
+ },
+ {
+ "epoch": 91.99455040871935,
+ "grad_norm": 3.3746325969696045,
+ "learning_rate": 3.342438572881912e-07,
+ "loss": 0.0299,
+ "step": 33762
+ },
+ {
+ "epoch": 91.99727520435967,
+ "grad_norm": 2.9933717250823975,
+ "learning_rate": 3.3401763944185927e-07,
+ "loss": 0.0388,
+ "step": 33763
+ },
+ {
+ "epoch": 92.0,
+ "grad_norm": 2.1233444213867188,
+ "learning_rate": 3.3379149687388866e-07,
+ "loss": 0.0288,
+ "step": 33764
+ },
+ {
+ "epoch": 92.00272479564033,
+ "grad_norm": 1.8295189142227173,
+ "learning_rate": 3.33565429586038e-07,
+ "loss": 0.0429,
+ "step": 33765
+ },
+ {
+ "epoch": 92.00544959128065,
+ "grad_norm": 2.276864528656006,
+ "learning_rate": 3.3333943758006914e-07,
+ "loss": 0.024,
+ "step": 33766
+ },
+ {
+ "epoch": 92.00817438692098,
+ "grad_norm": 1.9273000955581665,
+ "learning_rate": 3.331135208577407e-07,
+ "loss": 0.023,
+ "step": 33767
+ },
+ {
+ "epoch": 92.0108991825613,
+ "grad_norm": 3.3115742206573486,
+ "learning_rate": 3.3288767942081244e-07,
+ "loss": 0.047,
+ "step": 33768
+ },
+ {
+ "epoch": 92.01362397820164,
+ "grad_norm": 2.849778652191162,
+ "learning_rate": 3.326619132710451e-07,
+ "loss": 0.1022,
+ "step": 33769
+ },
+ {
+ "epoch": 92.01634877384195,
+ "grad_norm": 6.2739152908325195,
+ "learning_rate": 3.3243622241019623e-07,
+ "loss": 0.0394,
+ "step": 33770
+ },
+ {
+ "epoch": 92.01907356948229,
+ "grad_norm": 2.2515010833740234,
+ "learning_rate": 3.3221060684002217e-07,
+ "loss": 0.0365,
+ "step": 33771
+ },
+ {
+ "epoch": 92.02179836512262,
+ "grad_norm": 2.3634426593780518,
+ "learning_rate": 3.3198506656228037e-07,
+ "loss": 0.0382,
+ "step": 33772
+ },
+ {
+ "epoch": 92.02452316076294,
+ "grad_norm": 2.7536566257476807,
+ "learning_rate": 3.317596015787283e-07,
+ "loss": 0.1642,
+ "step": 33773
+ },
+ {
+ "epoch": 92.02724795640327,
+ "grad_norm": 2.3946402072906494,
+ "learning_rate": 3.3153421189112136e-07,
+ "loss": 0.0194,
+ "step": 33774
+ },
+ {
+ "epoch": 92.02997275204359,
+ "grad_norm": 4.876133441925049,
+ "learning_rate": 3.313088975012135e-07,
+ "loss": 0.081,
+ "step": 33775
+ },
+ {
+ "epoch": 92.03269754768392,
+ "grad_norm": 2.2528655529022217,
+ "learning_rate": 3.310836584107624e-07,
+ "loss": 0.0558,
+ "step": 33776
+ },
+ {
+ "epoch": 92.03542234332426,
+ "grad_norm": 4.052096843719482,
+ "learning_rate": 3.308584946215199e-07,
+ "loss": 0.1273,
+ "step": 33777
+ },
+ {
+ "epoch": 92.03814713896458,
+ "grad_norm": 2.179211139678955,
+ "learning_rate": 3.306334061352401e-07,
+ "loss": 0.0219,
+ "step": 33778
+ },
+ {
+ "epoch": 92.04087193460491,
+ "grad_norm": 3.1627750396728516,
+ "learning_rate": 3.304083929536761e-07,
+ "loss": 0.0674,
+ "step": 33779
+ },
+ {
+ "epoch": 92.04359673024523,
+ "grad_norm": 1.9695805311203003,
+ "learning_rate": 3.3018345507858094e-07,
+ "loss": 0.0354,
+ "step": 33780
+ },
+ {
+ "epoch": 92.04632152588556,
+ "grad_norm": 2.447617530822754,
+ "learning_rate": 3.2995859251170547e-07,
+ "loss": 0.0315,
+ "step": 33781
+ },
+ {
+ "epoch": 92.04904632152588,
+ "grad_norm": 2.6950347423553467,
+ "learning_rate": 3.297338052548016e-07,
+ "loss": 0.0234,
+ "step": 33782
+ },
+ {
+ "epoch": 92.05177111716621,
+ "grad_norm": 2.954461097717285,
+ "learning_rate": 3.295090933096179e-07,
+ "loss": 0.03,
+ "step": 33783
+ },
+ {
+ "epoch": 92.05449591280654,
+ "grad_norm": 2.3865628242492676,
+ "learning_rate": 3.292844566779063e-07,
+ "loss": 0.0267,
+ "step": 33784
+ },
+ {
+ "epoch": 92.05722070844686,
+ "grad_norm": 2.331212043762207,
+ "learning_rate": 3.290598953614177e-07,
+ "loss": 0.0233,
+ "step": 33785
+ },
+ {
+ "epoch": 92.0599455040872,
+ "grad_norm": 3.273543357849121,
+ "learning_rate": 3.288354093618995e-07,
+ "loss": 0.0275,
+ "step": 33786
+ },
+ {
+ "epoch": 92.06267029972751,
+ "grad_norm": 2.712019443511963,
+ "learning_rate": 3.2861099868109924e-07,
+ "loss": 0.0686,
+ "step": 33787
+ },
+ {
+ "epoch": 92.06539509536785,
+ "grad_norm": 3.1281256675720215,
+ "learning_rate": 3.283866633207644e-07,
+ "loss": 0.0644,
+ "step": 33788
+ },
+ {
+ "epoch": 92.06811989100818,
+ "grad_norm": 2.5526158809661865,
+ "learning_rate": 3.281624032826447e-07,
+ "loss": 0.1136,
+ "step": 33789
+ },
+ {
+ "epoch": 92.0708446866485,
+ "grad_norm": 7.320584297180176,
+ "learning_rate": 3.279382185684843e-07,
+ "loss": 0.1053,
+ "step": 33790
+ },
+ {
+ "epoch": 92.07356948228883,
+ "grad_norm": 2.609349489212036,
+ "learning_rate": 3.2771410918002954e-07,
+ "loss": 0.1718,
+ "step": 33791
+ },
+ {
+ "epoch": 92.07629427792915,
+ "grad_norm": 3.035057544708252,
+ "learning_rate": 3.2749007511902463e-07,
+ "loss": 0.1156,
+ "step": 33792
+ },
+ {
+ "epoch": 92.07901907356948,
+ "grad_norm": 2.4524147510528564,
+ "learning_rate": 3.272661163872182e-07,
+ "loss": 0.0752,
+ "step": 33793
+ },
+ {
+ "epoch": 92.0817438692098,
+ "grad_norm": 2.105128526687622,
+ "learning_rate": 3.2704223298635096e-07,
+ "loss": 0.0281,
+ "step": 33794
+ },
+ {
+ "epoch": 92.08446866485014,
+ "grad_norm": 1.708139419555664,
+ "learning_rate": 3.2681842491816716e-07,
+ "loss": 0.0242,
+ "step": 33795
+ },
+ {
+ "epoch": 92.08719346049047,
+ "grad_norm": 2.3079190254211426,
+ "learning_rate": 3.2659469218440986e-07,
+ "loss": 0.0351,
+ "step": 33796
+ },
+ {
+ "epoch": 92.08991825613079,
+ "grad_norm": 3.039968967437744,
+ "learning_rate": 3.263710347868221e-07,
+ "loss": 0.0407,
+ "step": 33797
+ },
+ {
+ "epoch": 92.09264305177112,
+ "grad_norm": 1.8194310665130615,
+ "learning_rate": 3.2614745272714577e-07,
+ "loss": 0.2152,
+ "step": 33798
+ },
+ {
+ "epoch": 92.09536784741144,
+ "grad_norm": 2.3963255882263184,
+ "learning_rate": 3.2592394600712065e-07,
+ "loss": 0.0882,
+ "step": 33799
+ },
+ {
+ "epoch": 92.09809264305177,
+ "grad_norm": 2.6452293395996094,
+ "learning_rate": 3.2570051462848973e-07,
+ "loss": 0.1105,
+ "step": 33800
+ },
+ {
+ "epoch": 92.1008174386921,
+ "grad_norm": 4.206119060516357,
+ "learning_rate": 3.2547715859299055e-07,
+ "loss": 0.0643,
+ "step": 33801
+ },
+ {
+ "epoch": 92.10354223433242,
+ "grad_norm": 3.5175535678863525,
+ "learning_rate": 3.2525387790236507e-07,
+ "loss": 0.14,
+ "step": 33802
+ },
+ {
+ "epoch": 92.10626702997276,
+ "grad_norm": 2.516937255859375,
+ "learning_rate": 3.250306725583507e-07,
+ "loss": 0.0917,
+ "step": 33803
+ },
+ {
+ "epoch": 92.10899182561307,
+ "grad_norm": 2.569063186645508,
+ "learning_rate": 3.248075425626851e-07,
+ "loss": 0.0828,
+ "step": 33804
+ },
+ {
+ "epoch": 92.11171662125341,
+ "grad_norm": 4.731888771057129,
+ "learning_rate": 3.2458448791710786e-07,
+ "loss": 0.0611,
+ "step": 33805
+ },
+ {
+ "epoch": 92.11444141689373,
+ "grad_norm": 3.3217012882232666,
+ "learning_rate": 3.2436150862335536e-07,
+ "loss": 0.1254,
+ "step": 33806
+ },
+ {
+ "epoch": 92.11716621253406,
+ "grad_norm": 1.359853982925415,
+ "learning_rate": 3.2413860468316517e-07,
+ "loss": 0.0155,
+ "step": 33807
+ },
+ {
+ "epoch": 92.11989100817439,
+ "grad_norm": 3.0055317878723145,
+ "learning_rate": 3.239157760982692e-07,
+ "loss": 0.0317,
+ "step": 33808
+ },
+ {
+ "epoch": 92.12261580381471,
+ "grad_norm": 2.7368526458740234,
+ "learning_rate": 3.2369302287040826e-07,
+ "loss": 0.0179,
+ "step": 33809
+ },
+ {
+ "epoch": 92.12534059945504,
+ "grad_norm": 2.9150002002716064,
+ "learning_rate": 3.234703450013132e-07,
+ "loss": 0.0273,
+ "step": 33810
+ },
+ {
+ "epoch": 92.12806539509536,
+ "grad_norm": 3.0399937629699707,
+ "learning_rate": 3.232477424927205e-07,
+ "loss": 0.03,
+ "step": 33811
+ },
+ {
+ "epoch": 92.1307901907357,
+ "grad_norm": 2.771402597427368,
+ "learning_rate": 3.23025215346362e-07,
+ "loss": 0.0927,
+ "step": 33812
+ },
+ {
+ "epoch": 92.13351498637603,
+ "grad_norm": 3.0156381130218506,
+ "learning_rate": 3.22802763563973e-07,
+ "loss": 0.0229,
+ "step": 33813
+ },
+ {
+ "epoch": 92.13623978201635,
+ "grad_norm": 4.398390769958496,
+ "learning_rate": 3.2258038714728436e-07,
+ "loss": 0.0324,
+ "step": 33814
+ },
+ {
+ "epoch": 92.13896457765668,
+ "grad_norm": 2.441612958908081,
+ "learning_rate": 3.22358086098028e-07,
+ "loss": 0.077,
+ "step": 33815
+ },
+ {
+ "epoch": 92.141689373297,
+ "grad_norm": 3.5289855003356934,
+ "learning_rate": 3.2213586041793364e-07,
+ "loss": 0.0612,
+ "step": 33816
+ },
+ {
+ "epoch": 92.14441416893733,
+ "grad_norm": 4.272944927215576,
+ "learning_rate": 3.219137101087355e-07,
+ "loss": 0.1212,
+ "step": 33817
+ },
+ {
+ "epoch": 92.14713896457765,
+ "grad_norm": 2.395763874053955,
+ "learning_rate": 3.2169163517216217e-07,
+ "loss": 0.0767,
+ "step": 33818
+ },
+ {
+ "epoch": 92.14986376021798,
+ "grad_norm": 2.5885632038116455,
+ "learning_rate": 3.2146963560994226e-07,
+ "loss": 0.0385,
+ "step": 33819
+ },
+ {
+ "epoch": 92.15258855585832,
+ "grad_norm": 2.7076330184936523,
+ "learning_rate": 3.212477114238044e-07,
+ "loss": 0.0864,
+ "step": 33820
+ },
+ {
+ "epoch": 92.15531335149863,
+ "grad_norm": 1.8669532537460327,
+ "learning_rate": 3.210258626154794e-07,
+ "loss": 0.0355,
+ "step": 33821
+ },
+ {
+ "epoch": 92.15803814713897,
+ "grad_norm": 2.4068408012390137,
+ "learning_rate": 3.208040891866926e-07,
+ "loss": 0.085,
+ "step": 33822
+ },
+ {
+ "epoch": 92.16076294277929,
+ "grad_norm": 1.6939899921417236,
+ "learning_rate": 3.2058239113917256e-07,
+ "loss": 0.0219,
+ "step": 33823
+ },
+ {
+ "epoch": 92.16348773841962,
+ "grad_norm": 2.367842435836792,
+ "learning_rate": 3.2036076847464457e-07,
+ "loss": 0.0448,
+ "step": 33824
+ },
+ {
+ "epoch": 92.16621253405995,
+ "grad_norm": 2.184643030166626,
+ "learning_rate": 3.201392211948362e-07,
+ "loss": 0.1056,
+ "step": 33825
+ },
+ {
+ "epoch": 92.16893732970027,
+ "grad_norm": 1.9597187042236328,
+ "learning_rate": 3.199177493014716e-07,
+ "loss": 0.019,
+ "step": 33826
+ },
+ {
+ "epoch": 92.1716621253406,
+ "grad_norm": 2.8972485065460205,
+ "learning_rate": 3.196963527962771e-07,
+ "loss": 0.0623,
+ "step": 33827
+ },
+ {
+ "epoch": 92.17438692098092,
+ "grad_norm": 1.8783094882965088,
+ "learning_rate": 3.194750316809736e-07,
+ "loss": 0.0487,
+ "step": 33828
+ },
+ {
+ "epoch": 92.17711171662125,
+ "grad_norm": 2.029810905456543,
+ "learning_rate": 3.192537859572886e-07,
+ "loss": 0.0499,
+ "step": 33829
+ },
+ {
+ "epoch": 92.17983651226157,
+ "grad_norm": 1.5199320316314697,
+ "learning_rate": 3.190326156269441e-07,
+ "loss": 0.0205,
+ "step": 33830
+ },
+ {
+ "epoch": 92.1825613079019,
+ "grad_norm": 2.1136865615844727,
+ "learning_rate": 3.188115206916609e-07,
+ "loss": 0.0296,
+ "step": 33831
+ },
+ {
+ "epoch": 92.18528610354224,
+ "grad_norm": 4.115062713623047,
+ "learning_rate": 3.1859050115316205e-07,
+ "loss": 0.1639,
+ "step": 33832
+ },
+ {
+ "epoch": 92.18801089918256,
+ "grad_norm": 2.2568817138671875,
+ "learning_rate": 3.183695570131695e-07,
+ "loss": 0.028,
+ "step": 33833
+ },
+ {
+ "epoch": 92.19073569482289,
+ "grad_norm": 2.664994239807129,
+ "learning_rate": 3.1814868827340194e-07,
+ "loss": 0.0336,
+ "step": 33834
+ },
+ {
+ "epoch": 92.19346049046321,
+ "grad_norm": 2.2303590774536133,
+ "learning_rate": 3.179278949355824e-07,
+ "loss": 0.0771,
+ "step": 33835
+ },
+ {
+ "epoch": 92.19618528610354,
+ "grad_norm": 2.1022610664367676,
+ "learning_rate": 3.177071770014273e-07,
+ "loss": 0.0669,
+ "step": 33836
+ },
+ {
+ "epoch": 92.19891008174388,
+ "grad_norm": 2.6430466175079346,
+ "learning_rate": 3.1748653447265634e-07,
+ "loss": 0.1713,
+ "step": 33837
+ },
+ {
+ "epoch": 92.2016348773842,
+ "grad_norm": 2.0570852756500244,
+ "learning_rate": 3.1726596735099035e-07,
+ "loss": 0.0271,
+ "step": 33838
+ },
+ {
+ "epoch": 92.20435967302453,
+ "grad_norm": 3.03989315032959,
+ "learning_rate": 3.1704547563814583e-07,
+ "loss": 0.0814,
+ "step": 33839
+ },
+ {
+ "epoch": 92.20708446866485,
+ "grad_norm": 2.5764822959899902,
+ "learning_rate": 3.1682505933583796e-07,
+ "loss": 0.0468,
+ "step": 33840
+ },
+ {
+ "epoch": 92.20980926430518,
+ "grad_norm": 1.3078769445419312,
+ "learning_rate": 3.166047184457854e-07,
+ "loss": 0.014,
+ "step": 33841
+ },
+ {
+ "epoch": 92.2125340599455,
+ "grad_norm": 2.423530340194702,
+ "learning_rate": 3.1638445296970463e-07,
+ "loss": 0.0674,
+ "step": 33842
+ },
+ {
+ "epoch": 92.21525885558583,
+ "grad_norm": 2.24601149559021,
+ "learning_rate": 3.1616426290930977e-07,
+ "loss": 0.0497,
+ "step": 33843
+ },
+ {
+ "epoch": 92.21798365122616,
+ "grad_norm": 2.4931259155273438,
+ "learning_rate": 3.159441482663139e-07,
+ "loss": 0.0338,
+ "step": 33844
+ },
+ {
+ "epoch": 92.22070844686648,
+ "grad_norm": 2.9073128700256348,
+ "learning_rate": 3.1572410904243566e-07,
+ "loss": 0.025,
+ "step": 33845
+ },
+ {
+ "epoch": 92.22343324250681,
+ "grad_norm": 2.2473936080932617,
+ "learning_rate": 3.155041452393859e-07,
+ "loss": 0.0278,
+ "step": 33846
+ },
+ {
+ "epoch": 92.22615803814713,
+ "grad_norm": 2.516573429107666,
+ "learning_rate": 3.1528425685887874e-07,
+ "loss": 0.0929,
+ "step": 33847
+ },
+ {
+ "epoch": 92.22888283378747,
+ "grad_norm": 1.886380910873413,
+ "learning_rate": 3.15064443902624e-07,
+ "loss": 0.0492,
+ "step": 33848
+ },
+ {
+ "epoch": 92.2316076294278,
+ "grad_norm": 2.5071778297424316,
+ "learning_rate": 3.14844706372337e-07,
+ "loss": 0.0298,
+ "step": 33849
+ },
+ {
+ "epoch": 92.23433242506812,
+ "grad_norm": 2.0962769985198975,
+ "learning_rate": 3.146250442697285e-07,
+ "loss": 0.0935,
+ "step": 33850
+ },
+ {
+ "epoch": 92.23705722070845,
+ "grad_norm": 1.873889446258545,
+ "learning_rate": 3.144054575965072e-07,
+ "loss": 0.131,
+ "step": 33851
+ },
+ {
+ "epoch": 92.23978201634877,
+ "grad_norm": 2.5482842922210693,
+ "learning_rate": 3.141859463543839e-07,
+ "loss": 0.0302,
+ "step": 33852
+ },
+ {
+ "epoch": 92.2425068119891,
+ "grad_norm": 2.989535331726074,
+ "learning_rate": 3.1396651054506956e-07,
+ "loss": 0.0689,
+ "step": 33853
+ },
+ {
+ "epoch": 92.24523160762942,
+ "grad_norm": 4.189667701721191,
+ "learning_rate": 3.137471501702727e-07,
+ "loss": 0.1763,
+ "step": 33854
+ },
+ {
+ "epoch": 92.24795640326975,
+ "grad_norm": 2.7423295974731445,
+ "learning_rate": 3.1352786523170085e-07,
+ "loss": 0.0604,
+ "step": 33855
+ },
+ {
+ "epoch": 92.25068119891009,
+ "grad_norm": 2.076279640197754,
+ "learning_rate": 3.1330865573106274e-07,
+ "loss": 0.0995,
+ "step": 33856
+ },
+ {
+ "epoch": 92.2534059945504,
+ "grad_norm": 3.0084567070007324,
+ "learning_rate": 3.130895216700636e-07,
+ "loss": 0.0348,
+ "step": 33857
+ },
+ {
+ "epoch": 92.25613079019074,
+ "grad_norm": 2.3064050674438477,
+ "learning_rate": 3.1287046305041313e-07,
+ "loss": 0.0329,
+ "step": 33858
+ },
+ {
+ "epoch": 92.25885558583106,
+ "grad_norm": 2.7155561447143555,
+ "learning_rate": 3.126514798738156e-07,
+ "loss": 0.0493,
+ "step": 33859
+ },
+ {
+ "epoch": 92.26158038147139,
+ "grad_norm": 2.3363630771636963,
+ "learning_rate": 3.124325721419752e-07,
+ "loss": 0.1445,
+ "step": 33860
+ },
+ {
+ "epoch": 92.26430517711172,
+ "grad_norm": 2.6246142387390137,
+ "learning_rate": 3.122137398565994e-07,
+ "loss": 0.0325,
+ "step": 33861
+ },
+ {
+ "epoch": 92.26702997275204,
+ "grad_norm": 2.3935251235961914,
+ "learning_rate": 3.119949830193902e-07,
+ "loss": 0.0408,
+ "step": 33862
+ },
+ {
+ "epoch": 92.26975476839237,
+ "grad_norm": 2.4321534633636475,
+ "learning_rate": 3.1177630163205406e-07,
+ "loss": 0.0187,
+ "step": 33863
+ },
+ {
+ "epoch": 92.2724795640327,
+ "grad_norm": 2.471033811569214,
+ "learning_rate": 3.115576956962896e-07,
+ "loss": 0.0168,
+ "step": 33864
+ },
+ {
+ "epoch": 92.27520435967303,
+ "grad_norm": 3.132131576538086,
+ "learning_rate": 3.1133916521380427e-07,
+ "loss": 0.0318,
+ "step": 33865
+ },
+ {
+ "epoch": 92.27792915531334,
+ "grad_norm": 1.8041948080062866,
+ "learning_rate": 3.111207101862968e-07,
+ "loss": 0.1519,
+ "step": 33866
+ },
+ {
+ "epoch": 92.28065395095368,
+ "grad_norm": 2.8425796031951904,
+ "learning_rate": 3.1090233061547017e-07,
+ "loss": 0.0531,
+ "step": 33867
+ },
+ {
+ "epoch": 92.28337874659401,
+ "grad_norm": 2.4926719665527344,
+ "learning_rate": 3.106840265030231e-07,
+ "loss": 0.0273,
+ "step": 33868
+ },
+ {
+ "epoch": 92.28610354223433,
+ "grad_norm": 2.3687140941619873,
+ "learning_rate": 3.1046579785065756e-07,
+ "loss": 0.0198,
+ "step": 33869
+ },
+ {
+ "epoch": 92.28882833787466,
+ "grad_norm": 2.088261604309082,
+ "learning_rate": 3.1024764466007106e-07,
+ "loss": 0.1923,
+ "step": 33870
+ },
+ {
+ "epoch": 92.29155313351498,
+ "grad_norm": 1.6418927907943726,
+ "learning_rate": 3.100295669329667e-07,
+ "loss": 0.0157,
+ "step": 33871
+ },
+ {
+ "epoch": 92.29427792915531,
+ "grad_norm": 2.099968671798706,
+ "learning_rate": 3.0981156467103867e-07,
+ "loss": 0.0943,
+ "step": 33872
+ },
+ {
+ "epoch": 92.29700272479565,
+ "grad_norm": 2.534358024597168,
+ "learning_rate": 3.095936378759856e-07,
+ "loss": 0.0436,
+ "step": 33873
+ },
+ {
+ "epoch": 92.29972752043597,
+ "grad_norm": 1.4658430814743042,
+ "learning_rate": 3.0937578654950727e-07,
+ "loss": 0.0202,
+ "step": 33874
+ },
+ {
+ "epoch": 92.3024523160763,
+ "grad_norm": 1.372265338897705,
+ "learning_rate": 3.091580106932979e-07,
+ "loss": 0.0189,
+ "step": 33875
+ },
+ {
+ "epoch": 92.30517711171662,
+ "grad_norm": 2.6411492824554443,
+ "learning_rate": 3.089403103090538e-07,
+ "loss": 0.0938,
+ "step": 33876
+ },
+ {
+ "epoch": 92.30790190735695,
+ "grad_norm": 2.502680778503418,
+ "learning_rate": 3.0872268539846926e-07,
+ "loss": 0.0486,
+ "step": 33877
+ },
+ {
+ "epoch": 92.31062670299727,
+ "grad_norm": 2.4906811714172363,
+ "learning_rate": 3.0850513596324294e-07,
+ "loss": 0.0482,
+ "step": 33878
+ },
+ {
+ "epoch": 92.3133514986376,
+ "grad_norm": 2.694629430770874,
+ "learning_rate": 3.0828766200506563e-07,
+ "loss": 0.0248,
+ "step": 33879
+ },
+ {
+ "epoch": 92.31607629427793,
+ "grad_norm": 2.9682085514068604,
+ "learning_rate": 3.0807026352563273e-07,
+ "loss": 0.0943,
+ "step": 33880
+ },
+ {
+ "epoch": 92.31880108991825,
+ "grad_norm": 2.0423824787139893,
+ "learning_rate": 3.078529405266351e-07,
+ "loss": 0.0683,
+ "step": 33881
+ },
+ {
+ "epoch": 92.32152588555859,
+ "grad_norm": 2.5169155597686768,
+ "learning_rate": 3.0763569300976794e-07,
+ "loss": 0.0746,
+ "step": 33882
+ },
+ {
+ "epoch": 92.3242506811989,
+ "grad_norm": 3.171461820602417,
+ "learning_rate": 3.074185209767222e-07,
+ "loss": 0.0347,
+ "step": 33883
+ },
+ {
+ "epoch": 92.32697547683924,
+ "grad_norm": 1.595274567604065,
+ "learning_rate": 3.0720142442918765e-07,
+ "loss": 0.0359,
+ "step": 33884
+ },
+ {
+ "epoch": 92.32970027247957,
+ "grad_norm": 2.9492576122283936,
+ "learning_rate": 3.069844033688574e-07,
+ "loss": 0.0247,
+ "step": 33885
+ },
+ {
+ "epoch": 92.33242506811989,
+ "grad_norm": 2.830124616622925,
+ "learning_rate": 3.0676745779742114e-07,
+ "loss": 0.0705,
+ "step": 33886
+ },
+ {
+ "epoch": 92.33514986376022,
+ "grad_norm": 1.7882606983184814,
+ "learning_rate": 3.0655058771656755e-07,
+ "loss": 0.024,
+ "step": 33887
+ },
+ {
+ "epoch": 92.33787465940054,
+ "grad_norm": 3.2372705936431885,
+ "learning_rate": 3.0633379312798637e-07,
+ "loss": 0.1056,
+ "step": 33888
+ },
+ {
+ "epoch": 92.34059945504087,
+ "grad_norm": 2.8747408390045166,
+ "learning_rate": 3.061170740333641e-07,
+ "loss": 0.0396,
+ "step": 33889
+ },
+ {
+ "epoch": 92.34332425068119,
+ "grad_norm": 3.1066174507141113,
+ "learning_rate": 3.0590043043439156e-07,
+ "loss": 0.0566,
+ "step": 33890
+ },
+ {
+ "epoch": 92.34604904632153,
+ "grad_norm": 2.6151490211486816,
+ "learning_rate": 3.0568386233275404e-07,
+ "loss": 0.0434,
+ "step": 33891
+ },
+ {
+ "epoch": 92.34877384196186,
+ "grad_norm": 2.095111131668091,
+ "learning_rate": 3.0546736973013915e-07,
+ "loss": 0.0364,
+ "step": 33892
+ },
+ {
+ "epoch": 92.35149863760218,
+ "grad_norm": 2.777678966522217,
+ "learning_rate": 3.05250952628231e-07,
+ "loss": 0.1083,
+ "step": 33893
+ },
+ {
+ "epoch": 92.35422343324251,
+ "grad_norm": 4.020278453826904,
+ "learning_rate": 3.0503461102871836e-07,
+ "loss": 0.0248,
+ "step": 33894
+ },
+ {
+ "epoch": 92.35694822888283,
+ "grad_norm": 2.4880988597869873,
+ "learning_rate": 3.048183449332831e-07,
+ "loss": 0.1197,
+ "step": 33895
+ },
+ {
+ "epoch": 92.35967302452316,
+ "grad_norm": 2.075143575668335,
+ "learning_rate": 3.046021543436106e-07,
+ "loss": 0.0303,
+ "step": 33896
+ },
+ {
+ "epoch": 92.3623978201635,
+ "grad_norm": 2.5300533771514893,
+ "learning_rate": 3.04386039261384e-07,
+ "loss": 0.0272,
+ "step": 33897
+ },
+ {
+ "epoch": 92.36512261580381,
+ "grad_norm": 2.7739245891571045,
+ "learning_rate": 3.0416999968828743e-07,
+ "loss": 0.0377,
+ "step": 33898
+ },
+ {
+ "epoch": 92.36784741144415,
+ "grad_norm": 3.773585557937622,
+ "learning_rate": 3.039540356260029e-07,
+ "loss": 0.2318,
+ "step": 33899
+ },
+ {
+ "epoch": 92.37057220708446,
+ "grad_norm": 7.179575443267822,
+ "learning_rate": 3.037381470762124e-07,
+ "loss": 0.0426,
+ "step": 33900
+ },
+ {
+ "epoch": 92.3732970027248,
+ "grad_norm": 3.2828152179718018,
+ "learning_rate": 3.035223340405957e-07,
+ "loss": 0.0307,
+ "step": 33901
+ },
+ {
+ "epoch": 92.37602179836512,
+ "grad_norm": 1.574810266494751,
+ "learning_rate": 3.033065965208359e-07,
+ "loss": 0.0183,
+ "step": 33902
+ },
+ {
+ "epoch": 92.37874659400545,
+ "grad_norm": 3.448099374771118,
+ "learning_rate": 3.030909345186128e-07,
+ "loss": 0.0909,
+ "step": 33903
+ },
+ {
+ "epoch": 92.38147138964578,
+ "grad_norm": 2.6964199542999268,
+ "learning_rate": 3.028753480356061e-07,
+ "loss": 0.0343,
+ "step": 33904
+ },
+ {
+ "epoch": 92.3841961852861,
+ "grad_norm": 3.373821973800659,
+ "learning_rate": 3.026598370734912e-07,
+ "loss": 0.0957,
+ "step": 33905
+ },
+ {
+ "epoch": 92.38692098092643,
+ "grad_norm": 2.0266878604888916,
+ "learning_rate": 3.0244440163395115e-07,
+ "loss": 0.0232,
+ "step": 33906
+ },
+ {
+ "epoch": 92.38964577656675,
+ "grad_norm": 2.847181558609009,
+ "learning_rate": 3.022290417186624e-07,
+ "loss": 0.0471,
+ "step": 33907
+ },
+ {
+ "epoch": 92.39237057220708,
+ "grad_norm": 2.4669415950775146,
+ "learning_rate": 3.020137573293014e-07,
+ "loss": 0.0267,
+ "step": 33908
+ },
+ {
+ "epoch": 92.39509536784742,
+ "grad_norm": 2.3490042686462402,
+ "learning_rate": 3.0179854846754455e-07,
+ "loss": 0.1935,
+ "step": 33909
+ },
+ {
+ "epoch": 92.39782016348774,
+ "grad_norm": 2.1643900871276855,
+ "learning_rate": 3.015834151350694e-07,
+ "loss": 0.0982,
+ "step": 33910
+ },
+ {
+ "epoch": 92.40054495912807,
+ "grad_norm": 2.525986671447754,
+ "learning_rate": 3.0136835733355017e-07,
+ "loss": 0.1271,
+ "step": 33911
+ },
+ {
+ "epoch": 92.40326975476839,
+ "grad_norm": 2.159219264984131,
+ "learning_rate": 3.0115337506466226e-07,
+ "loss": 0.034,
+ "step": 33912
+ },
+ {
+ "epoch": 92.40599455040872,
+ "grad_norm": 1.880326271057129,
+ "learning_rate": 3.009384683300787e-07,
+ "loss": 0.0264,
+ "step": 33913
+ },
+ {
+ "epoch": 92.40871934604904,
+ "grad_norm": 2.5172228813171387,
+ "learning_rate": 3.007236371314748e-07,
+ "loss": 0.0838,
+ "step": 33914
+ },
+ {
+ "epoch": 92.41144414168937,
+ "grad_norm": 2.4819085597991943,
+ "learning_rate": 3.0050888147052373e-07,
+ "loss": 0.0646,
+ "step": 33915
+ },
+ {
+ "epoch": 92.4141689373297,
+ "grad_norm": 2.8474478721618652,
+ "learning_rate": 3.002942013488974e-07,
+ "loss": 0.1233,
+ "step": 33916
+ },
+ {
+ "epoch": 92.41689373297002,
+ "grad_norm": 3.8018252849578857,
+ "learning_rate": 3.000795967682657e-07,
+ "loss": 0.0632,
+ "step": 33917
+ },
+ {
+ "epoch": 92.41961852861036,
+ "grad_norm": 2.0780482292175293,
+ "learning_rate": 2.9986506773030386e-07,
+ "loss": 0.0195,
+ "step": 33918
+ },
+ {
+ "epoch": 92.42234332425068,
+ "grad_norm": 2.081063985824585,
+ "learning_rate": 2.996506142366795e-07,
+ "loss": 0.0369,
+ "step": 33919
+ },
+ {
+ "epoch": 92.42506811989101,
+ "grad_norm": 2.663294553756714,
+ "learning_rate": 2.994362362890657e-07,
+ "loss": 0.105,
+ "step": 33920
+ },
+ {
+ "epoch": 92.42779291553134,
+ "grad_norm": 6.76279354095459,
+ "learning_rate": 2.992219338891278e-07,
+ "loss": 0.0461,
+ "step": 33921
+ },
+ {
+ "epoch": 92.43051771117166,
+ "grad_norm": 7.834489345550537,
+ "learning_rate": 2.9900770703853774e-07,
+ "loss": 0.1696,
+ "step": 33922
+ },
+ {
+ "epoch": 92.433242506812,
+ "grad_norm": 2.504335880279541,
+ "learning_rate": 2.9879355573896427e-07,
+ "loss": 0.0169,
+ "step": 33923
+ },
+ {
+ "epoch": 92.43596730245231,
+ "grad_norm": 3.097688674926758,
+ "learning_rate": 2.9857947999207493e-07,
+ "loss": 0.114,
+ "step": 33924
+ },
+ {
+ "epoch": 92.43869209809264,
+ "grad_norm": 2.420255184173584,
+ "learning_rate": 2.98365479799535e-07,
+ "loss": 0.1299,
+ "step": 33925
+ },
+ {
+ "epoch": 92.44141689373296,
+ "grad_norm": 1.806056261062622,
+ "learning_rate": 2.981515551630132e-07,
+ "loss": 0.1179,
+ "step": 33926
+ },
+ {
+ "epoch": 92.4441416893733,
+ "grad_norm": 2.9265284538269043,
+ "learning_rate": 2.979377060841748e-07,
+ "loss": 0.0961,
+ "step": 33927
+ },
+ {
+ "epoch": 92.44686648501363,
+ "grad_norm": 1.9160208702087402,
+ "learning_rate": 2.9772393256468634e-07,
+ "loss": 0.0191,
+ "step": 33928
+ },
+ {
+ "epoch": 92.44959128065395,
+ "grad_norm": 4.044418811798096,
+ "learning_rate": 2.9751023460620975e-07,
+ "loss": 0.0364,
+ "step": 33929
+ },
+ {
+ "epoch": 92.45231607629428,
+ "grad_norm": 1.8257092237472534,
+ "learning_rate": 2.972966122104115e-07,
+ "loss": 0.0263,
+ "step": 33930
+ },
+ {
+ "epoch": 92.4550408719346,
+ "grad_norm": 4.9430084228515625,
+ "learning_rate": 2.9708306537895583e-07,
+ "loss": 0.0443,
+ "step": 33931
+ },
+ {
+ "epoch": 92.45776566757493,
+ "grad_norm": 2.891047716140747,
+ "learning_rate": 2.968695941135047e-07,
+ "loss": 0.0549,
+ "step": 33932
+ },
+ {
+ "epoch": 92.46049046321527,
+ "grad_norm": 2.730832576751709,
+ "learning_rate": 2.9665619841572015e-07,
+ "loss": 0.057,
+ "step": 33933
+ },
+ {
+ "epoch": 92.46321525885558,
+ "grad_norm": 2.0785939693450928,
+ "learning_rate": 2.964428782872664e-07,
+ "loss": 0.0262,
+ "step": 33934
+ },
+ {
+ "epoch": 92.46594005449592,
+ "grad_norm": 2.5021350383758545,
+ "learning_rate": 2.9622963372980204e-07,
+ "loss": 0.1014,
+ "step": 33935
+ },
+ {
+ "epoch": 92.46866485013624,
+ "grad_norm": 4.288695335388184,
+ "learning_rate": 2.9601646474498926e-07,
+ "loss": 0.089,
+ "step": 33936
+ },
+ {
+ "epoch": 92.47138964577657,
+ "grad_norm": 1.9641176462173462,
+ "learning_rate": 2.958033713344877e-07,
+ "loss": 0.0488,
+ "step": 33937
+ },
+ {
+ "epoch": 92.47411444141689,
+ "grad_norm": 1.865676999092102,
+ "learning_rate": 2.9559035349995715e-07,
+ "loss": 0.0206,
+ "step": 33938
+ },
+ {
+ "epoch": 92.47683923705722,
+ "grad_norm": 3.2440242767333984,
+ "learning_rate": 2.953774112430563e-07,
+ "loss": 0.0937,
+ "step": 33939
+ },
+ {
+ "epoch": 92.47956403269755,
+ "grad_norm": 3.238081932067871,
+ "learning_rate": 2.9516454456544386e-07,
+ "loss": 0.0362,
+ "step": 33940
+ },
+ {
+ "epoch": 92.48228882833787,
+ "grad_norm": 2.4168434143066406,
+ "learning_rate": 2.9495175346877846e-07,
+ "loss": 0.0429,
+ "step": 33941
+ },
+ {
+ "epoch": 92.4850136239782,
+ "grad_norm": 2.8645784854888916,
+ "learning_rate": 2.9473903795471546e-07,
+ "loss": 0.0703,
+ "step": 33942
+ },
+ {
+ "epoch": 92.48773841961852,
+ "grad_norm": 1.7716959714889526,
+ "learning_rate": 2.9452639802491356e-07,
+ "loss": 0.1213,
+ "step": 33943
+ },
+ {
+ "epoch": 92.49046321525886,
+ "grad_norm": 1.8242135047912598,
+ "learning_rate": 2.9431383368102696e-07,
+ "loss": 0.0413,
+ "step": 33944
+ },
+ {
+ "epoch": 92.49318801089919,
+ "grad_norm": 5.517455101013184,
+ "learning_rate": 2.941013449247132e-07,
+ "loss": 0.0914,
+ "step": 33945
+ },
+ {
+ "epoch": 92.49591280653951,
+ "grad_norm": 1.8510369062423706,
+ "learning_rate": 2.9388893175762325e-07,
+ "loss": 0.0972,
+ "step": 33946
+ },
+ {
+ "epoch": 92.49863760217984,
+ "grad_norm": 9.689813613891602,
+ "learning_rate": 2.936765941814157e-07,
+ "loss": 0.2035,
+ "step": 33947
+ },
+ {
+ "epoch": 92.50136239782016,
+ "grad_norm": 4.921730995178223,
+ "learning_rate": 2.934643321977426e-07,
+ "loss": 0.0542,
+ "step": 33948
+ },
+ {
+ "epoch": 92.50408719346049,
+ "grad_norm": 2.1656479835510254,
+ "learning_rate": 2.932521458082549e-07,
+ "loss": 0.0777,
+ "step": 33949
+ },
+ {
+ "epoch": 92.50681198910081,
+ "grad_norm": 1.4755820035934448,
+ "learning_rate": 2.93040035014609e-07,
+ "loss": 0.0167,
+ "step": 33950
+ },
+ {
+ "epoch": 92.50953678474114,
+ "grad_norm": 1.8112258911132812,
+ "learning_rate": 2.9282799981845464e-07,
+ "loss": 0.0222,
+ "step": 33951
+ },
+ {
+ "epoch": 92.51226158038148,
+ "grad_norm": 2.7130534648895264,
+ "learning_rate": 2.9261604022144397e-07,
+ "loss": 0.0382,
+ "step": 33952
+ },
+ {
+ "epoch": 92.5149863760218,
+ "grad_norm": 3.03053879737854,
+ "learning_rate": 2.9240415622522557e-07,
+ "loss": 0.0258,
+ "step": 33953
+ },
+ {
+ "epoch": 92.51771117166213,
+ "grad_norm": 2.6802375316619873,
+ "learning_rate": 2.9219234783145147e-07,
+ "loss": 0.042,
+ "step": 33954
+ },
+ {
+ "epoch": 92.52043596730245,
+ "grad_norm": 1.7798711061477661,
+ "learning_rate": 2.9198061504177144e-07,
+ "loss": 0.0275,
+ "step": 33955
+ },
+ {
+ "epoch": 92.52316076294278,
+ "grad_norm": 2.7639007568359375,
+ "learning_rate": 2.917689578578331e-07,
+ "loss": 0.0403,
+ "step": 33956
+ },
+ {
+ "epoch": 92.52588555858311,
+ "grad_norm": 2.2817227840423584,
+ "learning_rate": 2.915573762812873e-07,
+ "loss": 0.0218,
+ "step": 33957
+ },
+ {
+ "epoch": 92.52861035422343,
+ "grad_norm": 2.4043657779693604,
+ "learning_rate": 2.9134587031377835e-07,
+ "loss": 0.037,
+ "step": 33958
+ },
+ {
+ "epoch": 92.53133514986376,
+ "grad_norm": 2.5717053413391113,
+ "learning_rate": 2.91134439956956e-07,
+ "loss": 0.0334,
+ "step": 33959
+ },
+ {
+ "epoch": 92.53405994550408,
+ "grad_norm": 1.61574387550354,
+ "learning_rate": 2.909230852124667e-07,
+ "loss": 0.0585,
+ "step": 33960
+ },
+ {
+ "epoch": 92.53678474114442,
+ "grad_norm": 5.058300495147705,
+ "learning_rate": 2.907118060819569e-07,
+ "loss": 0.0487,
+ "step": 33961
+ },
+ {
+ "epoch": 92.53950953678473,
+ "grad_norm": 8.652349472045898,
+ "learning_rate": 2.905006025670687e-07,
+ "loss": 0.051,
+ "step": 33962
+ },
+ {
+ "epoch": 92.54223433242507,
+ "grad_norm": 1.8410452604293823,
+ "learning_rate": 2.902894746694507e-07,
+ "loss": 0.0222,
+ "step": 33963
+ },
+ {
+ "epoch": 92.5449591280654,
+ "grad_norm": 2.593010902404785,
+ "learning_rate": 2.90078422390746e-07,
+ "loss": 0.1177,
+ "step": 33964
+ },
+ {
+ "epoch": 92.54768392370572,
+ "grad_norm": 2.5542678833007812,
+ "learning_rate": 2.898674457325967e-07,
+ "loss": 0.0236,
+ "step": 33965
+ },
+ {
+ "epoch": 92.55040871934605,
+ "grad_norm": 2.2600033283233643,
+ "learning_rate": 2.8965654469664815e-07,
+ "loss": 0.0518,
+ "step": 33966
+ },
+ {
+ "epoch": 92.55313351498637,
+ "grad_norm": 3.8037288188934326,
+ "learning_rate": 2.8944571928454126e-07,
+ "loss": 0.034,
+ "step": 33967
+ },
+ {
+ "epoch": 92.5558583106267,
+ "grad_norm": 2.4722979068756104,
+ "learning_rate": 2.892349694979202e-07,
+ "loss": 0.0835,
+ "step": 33968
+ },
+ {
+ "epoch": 92.55858310626704,
+ "grad_norm": 2.584477424621582,
+ "learning_rate": 2.890242953384237e-07,
+ "loss": 0.0879,
+ "step": 33969
+ },
+ {
+ "epoch": 92.56130790190736,
+ "grad_norm": 3.628197431564331,
+ "learning_rate": 2.888136968076927e-07,
+ "loss": 0.0753,
+ "step": 33970
+ },
+ {
+ "epoch": 92.56403269754769,
+ "grad_norm": 4.6860456466674805,
+ "learning_rate": 2.88603173907368e-07,
+ "loss": 0.028,
+ "step": 33971
+ },
+ {
+ "epoch": 92.566757493188,
+ "grad_norm": 2.555469512939453,
+ "learning_rate": 2.883927266390907e-07,
+ "loss": 0.1143,
+ "step": 33972
+ },
+ {
+ "epoch": 92.56948228882834,
+ "grad_norm": 2.003568410873413,
+ "learning_rate": 2.88182355004496e-07,
+ "loss": 0.0231,
+ "step": 33973
+ },
+ {
+ "epoch": 92.57220708446866,
+ "grad_norm": 2.3181540966033936,
+ "learning_rate": 2.8797205900522594e-07,
+ "loss": 0.0463,
+ "step": 33974
+ },
+ {
+ "epoch": 92.57493188010899,
+ "grad_norm": 2.0930943489074707,
+ "learning_rate": 2.877618386429171e-07,
+ "loss": 0.0286,
+ "step": 33975
+ },
+ {
+ "epoch": 92.57765667574932,
+ "grad_norm": 3.4334566593170166,
+ "learning_rate": 2.875516939192069e-07,
+ "loss": 0.1159,
+ "step": 33976
+ },
+ {
+ "epoch": 92.58038147138964,
+ "grad_norm": 2.914374589920044,
+ "learning_rate": 2.873416248357308e-07,
+ "loss": 0.0362,
+ "step": 33977
+ },
+ {
+ "epoch": 92.58310626702998,
+ "grad_norm": 2.764923572540283,
+ "learning_rate": 2.8713163139412527e-07,
+ "loss": 0.0882,
+ "step": 33978
+ },
+ {
+ "epoch": 92.5858310626703,
+ "grad_norm": 2.67028546333313,
+ "learning_rate": 2.869217135960267e-07,
+ "loss": 0.0173,
+ "step": 33979
+ },
+ {
+ "epoch": 92.58855585831063,
+ "grad_norm": 3.2267072200775146,
+ "learning_rate": 2.8671187144306834e-07,
+ "loss": 0.1514,
+ "step": 33980
+ },
+ {
+ "epoch": 92.59128065395096,
+ "grad_norm": 3.0317184925079346,
+ "learning_rate": 2.8650210493688656e-07,
+ "loss": 0.0301,
+ "step": 33981
+ },
+ {
+ "epoch": 92.59400544959128,
+ "grad_norm": 2.4306561946868896,
+ "learning_rate": 2.862924140791123e-07,
+ "loss": 0.0282,
+ "step": 33982
+ },
+ {
+ "epoch": 92.59673024523161,
+ "grad_norm": 3.262852668762207,
+ "learning_rate": 2.8608279887138103e-07,
+ "loss": 0.1281,
+ "step": 33983
+ },
+ {
+ "epoch": 92.59945504087193,
+ "grad_norm": 1.7691593170166016,
+ "learning_rate": 2.858732593153246e-07,
+ "loss": 0.0888,
+ "step": 33984
+ },
+ {
+ "epoch": 92.60217983651226,
+ "grad_norm": 2.297663450241089,
+ "learning_rate": 2.8566379541257406e-07,
+ "loss": 0.0638,
+ "step": 33985
+ },
+ {
+ "epoch": 92.60490463215258,
+ "grad_norm": 2.7999699115753174,
+ "learning_rate": 2.8545440716476025e-07,
+ "loss": 0.0363,
+ "step": 33986
+ },
+ {
+ "epoch": 92.60762942779292,
+ "grad_norm": 2.7875518798828125,
+ "learning_rate": 2.8524509457351635e-07,
+ "loss": 0.2239,
+ "step": 33987
+ },
+ {
+ "epoch": 92.61035422343325,
+ "grad_norm": 2.7598700523376465,
+ "learning_rate": 2.85035857640471e-07,
+ "loss": 0.066,
+ "step": 33988
+ },
+ {
+ "epoch": 92.61307901907357,
+ "grad_norm": 2.471369743347168,
+ "learning_rate": 2.84826696367253e-07,
+ "loss": 0.0293,
+ "step": 33989
+ },
+ {
+ "epoch": 92.6158038147139,
+ "grad_norm": 4.669155597686768,
+ "learning_rate": 2.846176107554921e-07,
+ "loss": 0.1098,
+ "step": 33990
+ },
+ {
+ "epoch": 92.61852861035422,
+ "grad_norm": 3.655745029449463,
+ "learning_rate": 2.8440860080681587e-07,
+ "loss": 0.053,
+ "step": 33991
+ },
+ {
+ "epoch": 92.62125340599455,
+ "grad_norm": 4.2164387702941895,
+ "learning_rate": 2.8419966652285303e-07,
+ "loss": 0.0607,
+ "step": 33992
+ },
+ {
+ "epoch": 92.62397820163488,
+ "grad_norm": 2.9698784351348877,
+ "learning_rate": 2.8399080790523227e-07,
+ "loss": 0.0811,
+ "step": 33993
+ },
+ {
+ "epoch": 92.6267029972752,
+ "grad_norm": 2.3326776027679443,
+ "learning_rate": 2.837820249555756e-07,
+ "loss": 0.0591,
+ "step": 33994
+ },
+ {
+ "epoch": 92.62942779291554,
+ "grad_norm": 2.5954360961914062,
+ "learning_rate": 2.8357331767551397e-07,
+ "loss": 0.1233,
+ "step": 33995
+ },
+ {
+ "epoch": 92.63215258855585,
+ "grad_norm": 2.092036485671997,
+ "learning_rate": 2.8336468606667057e-07,
+ "loss": 0.0322,
+ "step": 33996
+ },
+ {
+ "epoch": 92.63487738419619,
+ "grad_norm": 2.1663055419921875,
+ "learning_rate": 2.8315613013066954e-07,
+ "loss": 0.0681,
+ "step": 33997
+ },
+ {
+ "epoch": 92.6376021798365,
+ "grad_norm": 3.1835341453552246,
+ "learning_rate": 2.8294764986913524e-07,
+ "loss": 0.0715,
+ "step": 33998
+ },
+ {
+ "epoch": 92.64032697547684,
+ "grad_norm": 2.3628365993499756,
+ "learning_rate": 2.82739245283693e-07,
+ "loss": 0.0383,
+ "step": 33999
+ },
+ {
+ "epoch": 92.64305177111717,
+ "grad_norm": 2.6618759632110596,
+ "learning_rate": 2.8253091637596485e-07,
+ "loss": 0.0366,
+ "step": 34000
+ },
+ {
+ "epoch": 92.64577656675749,
+ "grad_norm": 1.9609527587890625,
+ "learning_rate": 2.8232266314757286e-07,
+ "loss": 0.0268,
+ "step": 34001
+ },
+ {
+ "epoch": 92.64850136239782,
+ "grad_norm": 2.5003442764282227,
+ "learning_rate": 2.8211448560013787e-07,
+ "loss": 0.0296,
+ "step": 34002
+ },
+ {
+ "epoch": 92.65122615803814,
+ "grad_norm": 2.237795829772949,
+ "learning_rate": 2.8190638373528423e-07,
+ "loss": 0.1536,
+ "step": 34003
+ },
+ {
+ "epoch": 92.65395095367847,
+ "grad_norm": 1.9150476455688477,
+ "learning_rate": 2.816983575546306e-07,
+ "loss": 0.0887,
+ "step": 34004
+ },
+ {
+ "epoch": 92.65667574931881,
+ "grad_norm": 1.8825595378875732,
+ "learning_rate": 2.814904070597979e-07,
+ "loss": 0.0742,
+ "step": 34005
+ },
+ {
+ "epoch": 92.65940054495913,
+ "grad_norm": 2.8478167057037354,
+ "learning_rate": 2.8128253225240376e-07,
+ "loss": 0.0588,
+ "step": 34006
+ },
+ {
+ "epoch": 92.66212534059946,
+ "grad_norm": 2.597182035446167,
+ "learning_rate": 2.810747331340691e-07,
+ "loss": 0.0318,
+ "step": 34007
+ },
+ {
+ "epoch": 92.66485013623978,
+ "grad_norm": 2.7154324054718018,
+ "learning_rate": 2.8086700970641034e-07,
+ "loss": 0.0613,
+ "step": 34008
+ },
+ {
+ "epoch": 92.66757493188011,
+ "grad_norm": 1.348683476448059,
+ "learning_rate": 2.806593619710485e-07,
+ "loss": 0.0579,
+ "step": 34009
+ },
+ {
+ "epoch": 92.67029972752043,
+ "grad_norm": 2.6856653690338135,
+ "learning_rate": 2.804517899295978e-07,
+ "loss": 0.0467,
+ "step": 34010
+ },
+ {
+ "epoch": 92.67302452316076,
+ "grad_norm": 2.5943455696105957,
+ "learning_rate": 2.802442935836758e-07,
+ "loss": 0.0436,
+ "step": 34011
+ },
+ {
+ "epoch": 92.6757493188011,
+ "grad_norm": 2.033085346221924,
+ "learning_rate": 2.800368729348979e-07,
+ "loss": 0.0649,
+ "step": 34012
+ },
+ {
+ "epoch": 92.67847411444141,
+ "grad_norm": 2.114762783050537,
+ "learning_rate": 2.798295279848817e-07,
+ "loss": 0.0651,
+ "step": 34013
+ },
+ {
+ "epoch": 92.68119891008175,
+ "grad_norm": 1.8358843326568604,
+ "learning_rate": 2.796222587352382e-07,
+ "loss": 0.0417,
+ "step": 34014
+ },
+ {
+ "epoch": 92.68392370572207,
+ "grad_norm": 2.147197961807251,
+ "learning_rate": 2.7941506518758486e-07,
+ "loss": 0.0844,
+ "step": 34015
+ },
+ {
+ "epoch": 92.6866485013624,
+ "grad_norm": 3.4548144340515137,
+ "learning_rate": 2.7920794734353384e-07,
+ "loss": 0.1095,
+ "step": 34016
+ },
+ {
+ "epoch": 92.68937329700273,
+ "grad_norm": 2.261824607849121,
+ "learning_rate": 2.790009052046994e-07,
+ "loss": 0.0237,
+ "step": 34017
+ },
+ {
+ "epoch": 92.69209809264305,
+ "grad_norm": 3.58293080329895,
+ "learning_rate": 2.787939387726912e-07,
+ "loss": 0.1708,
+ "step": 34018
+ },
+ {
+ "epoch": 92.69482288828338,
+ "grad_norm": 2.4535138607025146,
+ "learning_rate": 2.7858704804912483e-07,
+ "loss": 0.0762,
+ "step": 34019
+ },
+ {
+ "epoch": 92.6975476839237,
+ "grad_norm": 2.3390798568725586,
+ "learning_rate": 2.7838023303560893e-07,
+ "loss": 0.0258,
+ "step": 34020
+ },
+ {
+ "epoch": 92.70027247956403,
+ "grad_norm": 3.6526169776916504,
+ "learning_rate": 2.7817349373375545e-07,
+ "loss": 0.1148,
+ "step": 34021
+ },
+ {
+ "epoch": 92.70299727520435,
+ "grad_norm": 3.0535171031951904,
+ "learning_rate": 2.779668301451721e-07,
+ "loss": 0.1209,
+ "step": 34022
+ },
+ {
+ "epoch": 92.70572207084469,
+ "grad_norm": 2.691586971282959,
+ "learning_rate": 2.7776024227147093e-07,
+ "loss": 0.1376,
+ "step": 34023
+ },
+ {
+ "epoch": 92.70844686648502,
+ "grad_norm": 2.9899306297302246,
+ "learning_rate": 2.775537301142617e-07,
+ "loss": 0.0464,
+ "step": 34024
+ },
+ {
+ "epoch": 92.71117166212534,
+ "grad_norm": 2.928201675415039,
+ "learning_rate": 2.773472936751487e-07,
+ "loss": 0.0454,
+ "step": 34025
+ },
+ {
+ "epoch": 92.71389645776567,
+ "grad_norm": 2.3313519954681396,
+ "learning_rate": 2.7714093295574285e-07,
+ "loss": 0.0542,
+ "step": 34026
+ },
+ {
+ "epoch": 92.71662125340599,
+ "grad_norm": 2.7227885723114014,
+ "learning_rate": 2.769346479576507e-07,
+ "loss": 0.0309,
+ "step": 34027
+ },
+ {
+ "epoch": 92.71934604904632,
+ "grad_norm": 2.697957992553711,
+ "learning_rate": 2.7672843868247865e-07,
+ "loss": 0.0889,
+ "step": 34028
+ },
+ {
+ "epoch": 92.72207084468666,
+ "grad_norm": 2.8073959350585938,
+ "learning_rate": 2.765223051318333e-07,
+ "loss": 0.0918,
+ "step": 34029
+ },
+ {
+ "epoch": 92.72479564032697,
+ "grad_norm": 2.9638912677764893,
+ "learning_rate": 2.7631624730731887e-07,
+ "loss": 0.0469,
+ "step": 34030
+ },
+ {
+ "epoch": 92.7275204359673,
+ "grad_norm": 2.047313928604126,
+ "learning_rate": 2.7611026521053963e-07,
+ "loss": 0.0369,
+ "step": 34031
+ },
+ {
+ "epoch": 92.73024523160763,
+ "grad_norm": 2.096829414367676,
+ "learning_rate": 2.75904358843101e-07,
+ "loss": 0.178,
+ "step": 34032
+ },
+ {
+ "epoch": 92.73297002724796,
+ "grad_norm": 1.9505131244659424,
+ "learning_rate": 2.7569852820660713e-07,
+ "loss": 0.0207,
+ "step": 34033
+ },
+ {
+ "epoch": 92.73569482288828,
+ "grad_norm": 2.60426664352417,
+ "learning_rate": 2.754927733026591e-07,
+ "loss": 0.0933,
+ "step": 34034
+ },
+ {
+ "epoch": 92.73841961852861,
+ "grad_norm": 2.333433151245117,
+ "learning_rate": 2.7528709413286116e-07,
+ "loss": 0.0694,
+ "step": 34035
+ },
+ {
+ "epoch": 92.74114441416894,
+ "grad_norm": 5.702267646789551,
+ "learning_rate": 2.750814906988142e-07,
+ "loss": 0.0833,
+ "step": 34036
+ },
+ {
+ "epoch": 92.74386920980926,
+ "grad_norm": 2.6554129123687744,
+ "learning_rate": 2.748759630021203e-07,
+ "loss": 0.0762,
+ "step": 34037
+ },
+ {
+ "epoch": 92.7465940054496,
+ "grad_norm": 2.1196606159210205,
+ "learning_rate": 2.74670511044377e-07,
+ "loss": 0.0267,
+ "step": 34038
+ },
+ {
+ "epoch": 92.74931880108991,
+ "grad_norm": 3.2828564643859863,
+ "learning_rate": 2.7446513482718874e-07,
+ "loss": 0.0958,
+ "step": 34039
+ },
+ {
+ "epoch": 92.75204359673025,
+ "grad_norm": 1.9908270835876465,
+ "learning_rate": 2.74259834352153e-07,
+ "loss": 0.0813,
+ "step": 34040
+ },
+ {
+ "epoch": 92.75476839237058,
+ "grad_norm": 2.8551061153411865,
+ "learning_rate": 2.740546096208685e-07,
+ "loss": 0.0485,
+ "step": 34041
+ },
+ {
+ "epoch": 92.7574931880109,
+ "grad_norm": 2.666900634765625,
+ "learning_rate": 2.738494606349329e-07,
+ "loss": 0.1288,
+ "step": 34042
+ },
+ {
+ "epoch": 92.76021798365123,
+ "grad_norm": 2.8463668823242188,
+ "learning_rate": 2.736443873959449e-07,
+ "loss": 0.0801,
+ "step": 34043
+ },
+ {
+ "epoch": 92.76294277929155,
+ "grad_norm": 2.9144234657287598,
+ "learning_rate": 2.73439389905501e-07,
+ "loss": 0.1398,
+ "step": 34044
+ },
+ {
+ "epoch": 92.76566757493188,
+ "grad_norm": 3.478212833404541,
+ "learning_rate": 2.7323446816519993e-07,
+ "loss": 0.0857,
+ "step": 34045
+ },
+ {
+ "epoch": 92.7683923705722,
+ "grad_norm": 2.7649264335632324,
+ "learning_rate": 2.7302962217663486e-07,
+ "loss": 0.0933,
+ "step": 34046
+ },
+ {
+ "epoch": 92.77111716621253,
+ "grad_norm": 1.8461920022964478,
+ "learning_rate": 2.728248519414001e-07,
+ "loss": 0.0556,
+ "step": 34047
+ },
+ {
+ "epoch": 92.77384196185287,
+ "grad_norm": 1.3719723224639893,
+ "learning_rate": 2.7262015746109425e-07,
+ "loss": 0.0191,
+ "step": 34048
+ },
+ {
+ "epoch": 92.77656675749319,
+ "grad_norm": 1.9794155359268188,
+ "learning_rate": 2.7241553873730953e-07,
+ "loss": 0.0377,
+ "step": 34049
+ },
+ {
+ "epoch": 92.77929155313352,
+ "grad_norm": 2.6414873600006104,
+ "learning_rate": 2.722109957716401e-07,
+ "loss": 0.0381,
+ "step": 34050
+ },
+ {
+ "epoch": 92.78201634877384,
+ "grad_norm": 1.8735049962997437,
+ "learning_rate": 2.72006528565677e-07,
+ "loss": 0.0307,
+ "step": 34051
+ },
+ {
+ "epoch": 92.78474114441417,
+ "grad_norm": 2.5010695457458496,
+ "learning_rate": 2.7180213712101444e-07,
+ "loss": 0.0549,
+ "step": 34052
+ },
+ {
+ "epoch": 92.7874659400545,
+ "grad_norm": 3.3076906204223633,
+ "learning_rate": 2.715978214392434e-07,
+ "loss": 0.0963,
+ "step": 34053
+ },
+ {
+ "epoch": 92.79019073569482,
+ "grad_norm": 2.291006088256836,
+ "learning_rate": 2.7139358152195707e-07,
+ "loss": 0.0794,
+ "step": 34054
+ },
+ {
+ "epoch": 92.79291553133515,
+ "grad_norm": 2.7565507888793945,
+ "learning_rate": 2.711894173707419e-07,
+ "loss": 0.0644,
+ "step": 34055
+ },
+ {
+ "epoch": 92.79564032697547,
+ "grad_norm": 2.482112169265747,
+ "learning_rate": 2.709853289871922e-07,
+ "loss": 0.0345,
+ "step": 34056
+ },
+ {
+ "epoch": 92.7983651226158,
+ "grad_norm": 4.1855974197387695,
+ "learning_rate": 2.707813163728945e-07,
+ "loss": 0.0315,
+ "step": 34057
+ },
+ {
+ "epoch": 92.80108991825612,
+ "grad_norm": 3.153151512145996,
+ "learning_rate": 2.7057737952943863e-07,
+ "loss": 0.0973,
+ "step": 34058
+ },
+ {
+ "epoch": 92.80381471389646,
+ "grad_norm": 2.8204071521759033,
+ "learning_rate": 2.703735184584133e-07,
+ "loss": 0.1251,
+ "step": 34059
+ },
+ {
+ "epoch": 92.80653950953679,
+ "grad_norm": 2.1790354251861572,
+ "learning_rate": 2.701697331614062e-07,
+ "loss": 0.0381,
+ "step": 34060
+ },
+ {
+ "epoch": 92.80926430517711,
+ "grad_norm": 1.5505914688110352,
+ "learning_rate": 2.699660236400048e-07,
+ "loss": 0.0189,
+ "step": 34061
+ },
+ {
+ "epoch": 92.81198910081744,
+ "grad_norm": 2.216620445251465,
+ "learning_rate": 2.697623898957946e-07,
+ "loss": 0.037,
+ "step": 34062
+ },
+ {
+ "epoch": 92.81471389645776,
+ "grad_norm": 2.371647834777832,
+ "learning_rate": 2.695588319303599e-07,
+ "loss": 0.0263,
+ "step": 34063
+ },
+ {
+ "epoch": 92.8174386920981,
+ "grad_norm": 4.299121856689453,
+ "learning_rate": 2.693553497452905e-07,
+ "loss": 0.0937,
+ "step": 34064
+ },
+ {
+ "epoch": 92.82016348773843,
+ "grad_norm": 2.558760643005371,
+ "learning_rate": 2.6915194334216743e-07,
+ "loss": 0.1025,
+ "step": 34065
+ },
+ {
+ "epoch": 92.82288828337875,
+ "grad_norm": 2.4167726039886475,
+ "learning_rate": 2.68948612722576e-07,
+ "loss": 0.0633,
+ "step": 34066
+ },
+ {
+ "epoch": 92.82561307901908,
+ "grad_norm": 5.8445634841918945,
+ "learning_rate": 2.687453578880983e-07,
+ "loss": 0.0416,
+ "step": 34067
+ },
+ {
+ "epoch": 92.8283378746594,
+ "grad_norm": 2.8583555221557617,
+ "learning_rate": 2.6854217884031974e-07,
+ "loss": 0.0557,
+ "step": 34068
+ },
+ {
+ "epoch": 92.83106267029973,
+ "grad_norm": 2.0511131286621094,
+ "learning_rate": 2.683390755808213e-07,
+ "loss": 0.0339,
+ "step": 34069
+ },
+ {
+ "epoch": 92.83378746594005,
+ "grad_norm": 2.37980055809021,
+ "learning_rate": 2.68136048111185e-07,
+ "loss": 0.0433,
+ "step": 34070
+ },
+ {
+ "epoch": 92.83651226158038,
+ "grad_norm": 2.8480749130249023,
+ "learning_rate": 2.679330964329907e-07,
+ "loss": 0.0747,
+ "step": 34071
+ },
+ {
+ "epoch": 92.83923705722071,
+ "grad_norm": 2.049267053604126,
+ "learning_rate": 2.677302205478216e-07,
+ "loss": 0.0238,
+ "step": 34072
+ },
+ {
+ "epoch": 92.84196185286103,
+ "grad_norm": 2.4598608016967773,
+ "learning_rate": 2.675274204572564e-07,
+ "loss": 0.0273,
+ "step": 34073
+ },
+ {
+ "epoch": 92.84468664850137,
+ "grad_norm": 2.6839537620544434,
+ "learning_rate": 2.6732469616287393e-07,
+ "loss": 0.043,
+ "step": 34074
+ },
+ {
+ "epoch": 92.84741144414168,
+ "grad_norm": 1.7694298028945923,
+ "learning_rate": 2.671220476662528e-07,
+ "loss": 0.0244,
+ "step": 34075
+ },
+ {
+ "epoch": 92.85013623978202,
+ "grad_norm": 4.0129547119140625,
+ "learning_rate": 2.66919474968973e-07,
+ "loss": 0.0408,
+ "step": 34076
+ },
+ {
+ "epoch": 92.85286103542235,
+ "grad_norm": 2.5996809005737305,
+ "learning_rate": 2.667169780726109e-07,
+ "loss": 0.031,
+ "step": 34077
+ },
+ {
+ "epoch": 92.85558583106267,
+ "grad_norm": 1.9990999698638916,
+ "learning_rate": 2.6651455697874306e-07,
+ "loss": 0.0315,
+ "step": 34078
+ },
+ {
+ "epoch": 92.858310626703,
+ "grad_norm": 3.263554811477661,
+ "learning_rate": 2.6631221168894603e-07,
+ "loss": 0.0862,
+ "step": 34079
+ },
+ {
+ "epoch": 92.86103542234332,
+ "grad_norm": 3.1881675720214844,
+ "learning_rate": 2.661099422047986e-07,
+ "loss": 0.0491,
+ "step": 34080
+ },
+ {
+ "epoch": 92.86376021798365,
+ "grad_norm": 2.8475282192230225,
+ "learning_rate": 2.659077485278716e-07,
+ "loss": 0.1043,
+ "step": 34081
+ },
+ {
+ "epoch": 92.86648501362397,
+ "grad_norm": 2.2266502380371094,
+ "learning_rate": 2.6570563065974273e-07,
+ "loss": 0.0251,
+ "step": 34082
+ },
+ {
+ "epoch": 92.8692098092643,
+ "grad_norm": 2.85383677482605,
+ "learning_rate": 2.655035886019841e-07,
+ "loss": 0.0694,
+ "step": 34083
+ },
+ {
+ "epoch": 92.87193460490464,
+ "grad_norm": 2.5152273178100586,
+ "learning_rate": 2.653016223561722e-07,
+ "loss": 0.0277,
+ "step": 34084
+ },
+ {
+ "epoch": 92.87465940054496,
+ "grad_norm": 2.0699732303619385,
+ "learning_rate": 2.650997319238768e-07,
+ "loss": 0.0297,
+ "step": 34085
+ },
+ {
+ "epoch": 92.87738419618529,
+ "grad_norm": 2.2521121501922607,
+ "learning_rate": 2.6489791730667125e-07,
+ "loss": 0.0556,
+ "step": 34086
+ },
+ {
+ "epoch": 92.88010899182561,
+ "grad_norm": 4.227232933044434,
+ "learning_rate": 2.6469617850612637e-07,
+ "loss": 0.0309,
+ "step": 34087
+ },
+ {
+ "epoch": 92.88283378746594,
+ "grad_norm": 3.299978494644165,
+ "learning_rate": 2.6449451552381653e-07,
+ "loss": 0.042,
+ "step": 34088
+ },
+ {
+ "epoch": 92.88555858310627,
+ "grad_norm": 1.921689510345459,
+ "learning_rate": 2.642929283613094e-07,
+ "loss": 0.0245,
+ "step": 34089
+ },
+ {
+ "epoch": 92.88828337874659,
+ "grad_norm": 2.025585174560547,
+ "learning_rate": 2.640914170201747e-07,
+ "loss": 0.0316,
+ "step": 34090
+ },
+ {
+ "epoch": 92.89100817438693,
+ "grad_norm": 3.765036106109619,
+ "learning_rate": 2.6388998150198243e-07,
+ "loss": 0.0277,
+ "step": 34091
+ },
+ {
+ "epoch": 92.89373297002724,
+ "grad_norm": 2.3546907901763916,
+ "learning_rate": 2.6368862180830234e-07,
+ "loss": 0.0305,
+ "step": 34092
+ },
+ {
+ "epoch": 92.89645776566758,
+ "grad_norm": 3.1595547199249268,
+ "learning_rate": 2.6348733794070215e-07,
+ "loss": 0.0391,
+ "step": 34093
+ },
+ {
+ "epoch": 92.8991825613079,
+ "grad_norm": 2.0853705406188965,
+ "learning_rate": 2.632861299007483e-07,
+ "loss": 0.0227,
+ "step": 34094
+ },
+ {
+ "epoch": 92.90190735694823,
+ "grad_norm": 2.2090907096862793,
+ "learning_rate": 2.6308499769000963e-07,
+ "loss": 0.1551,
+ "step": 34095
+ },
+ {
+ "epoch": 92.90463215258856,
+ "grad_norm": 2.1396069526672363,
+ "learning_rate": 2.6288394131005147e-07,
+ "loss": 0.0316,
+ "step": 34096
+ },
+ {
+ "epoch": 92.90735694822888,
+ "grad_norm": 1.9962027072906494,
+ "learning_rate": 2.6268296076243925e-07,
+ "loss": 0.0397,
+ "step": 34097
+ },
+ {
+ "epoch": 92.91008174386921,
+ "grad_norm": 3.098529815673828,
+ "learning_rate": 2.6248205604873955e-07,
+ "loss": 0.0372,
+ "step": 34098
+ },
+ {
+ "epoch": 92.91280653950953,
+ "grad_norm": 1.867499828338623,
+ "learning_rate": 2.622812271705155e-07,
+ "loss": 0.0802,
+ "step": 34099
+ },
+ {
+ "epoch": 92.91553133514986,
+ "grad_norm": 3.4928348064422607,
+ "learning_rate": 2.6208047412933145e-07,
+ "loss": 0.0863,
+ "step": 34100
+ },
+ {
+ "epoch": 92.9182561307902,
+ "grad_norm": 2.3808937072753906,
+ "learning_rate": 2.618797969267528e-07,
+ "loss": 0.134,
+ "step": 34101
+ },
+ {
+ "epoch": 92.92098092643052,
+ "grad_norm": 2.0302734375,
+ "learning_rate": 2.616791955643405e-07,
+ "loss": 0.0347,
+ "step": 34102
+ },
+ {
+ "epoch": 92.92370572207085,
+ "grad_norm": 3.0014467239379883,
+ "learning_rate": 2.614786700436556e-07,
+ "loss": 0.0685,
+ "step": 34103
+ },
+ {
+ "epoch": 92.92643051771117,
+ "grad_norm": 2.118467092514038,
+ "learning_rate": 2.6127822036626337e-07,
+ "loss": 0.0334,
+ "step": 34104
+ },
+ {
+ "epoch": 92.9291553133515,
+ "grad_norm": 2.6980319023132324,
+ "learning_rate": 2.610778465337216e-07,
+ "loss": 0.0775,
+ "step": 34105
+ },
+ {
+ "epoch": 92.93188010899182,
+ "grad_norm": 2.85756254196167,
+ "learning_rate": 2.608775485475934e-07,
+ "loss": 0.0507,
+ "step": 34106
+ },
+ {
+ "epoch": 92.93460490463215,
+ "grad_norm": 2.651165723800659,
+ "learning_rate": 2.606773264094353e-07,
+ "loss": 0.0421,
+ "step": 34107
+ },
+ {
+ "epoch": 92.93732970027249,
+ "grad_norm": 2.8043205738067627,
+ "learning_rate": 2.6047718012081056e-07,
+ "loss": 0.0273,
+ "step": 34108
+ },
+ {
+ "epoch": 92.9400544959128,
+ "grad_norm": 1.5109548568725586,
+ "learning_rate": 2.602771096832757e-07,
+ "loss": 0.0216,
+ "step": 34109
+ },
+ {
+ "epoch": 92.94277929155314,
+ "grad_norm": 3.034245491027832,
+ "learning_rate": 2.600771150983894e-07,
+ "loss": 0.0412,
+ "step": 34110
+ },
+ {
+ "epoch": 92.94550408719346,
+ "grad_norm": 1.7956622838974,
+ "learning_rate": 2.5987719636770824e-07,
+ "loss": 0.0181,
+ "step": 34111
+ },
+ {
+ "epoch": 92.94822888283379,
+ "grad_norm": 2.136606216430664,
+ "learning_rate": 2.5967735349278877e-07,
+ "loss": 0.0679,
+ "step": 34112
+ },
+ {
+ "epoch": 92.95095367847412,
+ "grad_norm": 6.898420810699463,
+ "learning_rate": 2.5947758647519085e-07,
+ "loss": 0.0742,
+ "step": 34113
+ },
+ {
+ "epoch": 92.95367847411444,
+ "grad_norm": 2.685142755508423,
+ "learning_rate": 2.592778953164676e-07,
+ "loss": 0.0492,
+ "step": 34114
+ },
+ {
+ "epoch": 92.95640326975477,
+ "grad_norm": 2.132816791534424,
+ "learning_rate": 2.590782800181746e-07,
+ "loss": 0.0309,
+ "step": 34115
+ },
+ {
+ "epoch": 92.95912806539509,
+ "grad_norm": 2.2591047286987305,
+ "learning_rate": 2.5887874058186604e-07,
+ "loss": 0.0847,
+ "step": 34116
+ },
+ {
+ "epoch": 92.96185286103542,
+ "grad_norm": 2.0352091789245605,
+ "learning_rate": 2.5867927700909624e-07,
+ "loss": 0.0544,
+ "step": 34117
+ },
+ {
+ "epoch": 92.96457765667574,
+ "grad_norm": 1.5847419500350952,
+ "learning_rate": 2.584798893014195e-07,
+ "loss": 0.0198,
+ "step": 34118
+ },
+ {
+ "epoch": 92.96730245231608,
+ "grad_norm": 2.906217336654663,
+ "learning_rate": 2.58280577460388e-07,
+ "loss": 0.0427,
+ "step": 34119
+ },
+ {
+ "epoch": 92.97002724795641,
+ "grad_norm": 1.7440987825393677,
+ "learning_rate": 2.580813414875516e-07,
+ "loss": 0.0764,
+ "step": 34120
+ },
+ {
+ "epoch": 92.97275204359673,
+ "grad_norm": 1.9244767427444458,
+ "learning_rate": 2.578821813844667e-07,
+ "loss": 0.0396,
+ "step": 34121
+ },
+ {
+ "epoch": 92.97547683923706,
+ "grad_norm": 2.3534650802612305,
+ "learning_rate": 2.5768309715268116e-07,
+ "loss": 0.0735,
+ "step": 34122
+ },
+ {
+ "epoch": 92.97820163487738,
+ "grad_norm": 3.1908464431762695,
+ "learning_rate": 2.5748408879374463e-07,
+ "loss": 0.0278,
+ "step": 34123
+ },
+ {
+ "epoch": 92.98092643051771,
+ "grad_norm": 2.015676498413086,
+ "learning_rate": 2.572851563092105e-07,
+ "loss": 0.0538,
+ "step": 34124
+ },
+ {
+ "epoch": 92.98365122615803,
+ "grad_norm": 2.5479812622070312,
+ "learning_rate": 2.5708629970062516e-07,
+ "loss": 0.0211,
+ "step": 34125
+ },
+ {
+ "epoch": 92.98637602179836,
+ "grad_norm": 2.6128368377685547,
+ "learning_rate": 2.5688751896953854e-07,
+ "loss": 0.0451,
+ "step": 34126
+ },
+ {
+ "epoch": 92.9891008174387,
+ "grad_norm": 2.622509717941284,
+ "learning_rate": 2.566888141174972e-07,
+ "loss": 0.0434,
+ "step": 34127
+ },
+ {
+ "epoch": 92.99182561307902,
+ "grad_norm": 2.1178672313690186,
+ "learning_rate": 2.5649018514604995e-07,
+ "loss": 0.0419,
+ "step": 34128
+ },
+ {
+ "epoch": 92.99455040871935,
+ "grad_norm": 2.688542604446411,
+ "learning_rate": 2.5629163205674434e-07,
+ "loss": 0.0435,
+ "step": 34129
+ },
+ {
+ "epoch": 92.99727520435967,
+ "grad_norm": 3.2054944038391113,
+ "learning_rate": 2.5609315485112583e-07,
+ "loss": 0.0137,
+ "step": 34130
+ },
+ {
+ "epoch": 93.0,
+ "grad_norm": 2.3210439682006836,
+ "learning_rate": 2.5589475353073987e-07,
+ "loss": 0.0262,
+ "step": 34131
+ },
+ {
+ "epoch": 93.00272479564033,
+ "grad_norm": 4.622258186340332,
+ "learning_rate": 2.556964280971319e-07,
+ "loss": 0.0309,
+ "step": 34132
+ },
+ {
+ "epoch": 93.00544959128065,
+ "grad_norm": 2.673596143722534,
+ "learning_rate": 2.5549817855184624e-07,
+ "loss": 0.0432,
+ "step": 34133
+ },
+ {
+ "epoch": 93.00817438692098,
+ "grad_norm": 1.615040898323059,
+ "learning_rate": 2.5530000489642823e-07,
+ "loss": 0.0253,
+ "step": 34134
+ },
+ {
+ "epoch": 93.0108991825613,
+ "grad_norm": 3.2961864471435547,
+ "learning_rate": 2.5510190713242014e-07,
+ "loss": 0.0502,
+ "step": 34135
+ },
+ {
+ "epoch": 93.01362397820164,
+ "grad_norm": 2.0259194374084473,
+ "learning_rate": 2.5490388526136387e-07,
+ "loss": 0.069,
+ "step": 34136
+ },
+ {
+ "epoch": 93.01634877384195,
+ "grad_norm": 3.0652382373809814,
+ "learning_rate": 2.547059392848028e-07,
+ "loss": 0.1025,
+ "step": 34137
+ },
+ {
+ "epoch": 93.01907356948229,
+ "grad_norm": 1.6499525308609009,
+ "learning_rate": 2.5450806920427783e-07,
+ "loss": 0.0217,
+ "step": 34138
+ },
+ {
+ "epoch": 93.02179836512262,
+ "grad_norm": 2.7060530185699463,
+ "learning_rate": 2.543102750213311e-07,
+ "loss": 0.1126,
+ "step": 34139
+ },
+ {
+ "epoch": 93.02452316076294,
+ "grad_norm": 1.6776399612426758,
+ "learning_rate": 2.5411255673750137e-07,
+ "loss": 0.1076,
+ "step": 34140
+ },
+ {
+ "epoch": 93.02724795640327,
+ "grad_norm": 2.6825172901153564,
+ "learning_rate": 2.539149143543307e-07,
+ "loss": 0.1334,
+ "step": 34141
+ },
+ {
+ "epoch": 93.02997275204359,
+ "grad_norm": 2.8298847675323486,
+ "learning_rate": 2.5371734787335676e-07,
+ "loss": 0.0385,
+ "step": 34142
+ },
+ {
+ "epoch": 93.03269754768392,
+ "grad_norm": 2.77170991897583,
+ "learning_rate": 2.535198572961173e-07,
+ "loss": 0.1052,
+ "step": 34143
+ },
+ {
+ "epoch": 93.03542234332426,
+ "grad_norm": 4.709928512573242,
+ "learning_rate": 2.5332244262415207e-07,
+ "loss": 0.1541,
+ "step": 34144
+ },
+ {
+ "epoch": 93.03814713896458,
+ "grad_norm": 2.9608826637268066,
+ "learning_rate": 2.5312510385899767e-07,
+ "loss": 0.0999,
+ "step": 34145
+ },
+ {
+ "epoch": 93.04087193460491,
+ "grad_norm": 3.854839324951172,
+ "learning_rate": 2.5292784100219184e-07,
+ "loss": 0.0419,
+ "step": 34146
+ },
+ {
+ "epoch": 93.04359673024523,
+ "grad_norm": 2.5647788047790527,
+ "learning_rate": 2.5273065405526986e-07,
+ "loss": 0.0319,
+ "step": 34147
+ },
+ {
+ "epoch": 93.04632152588556,
+ "grad_norm": 2.588716506958008,
+ "learning_rate": 2.525335430197673e-07,
+ "loss": 0.0529,
+ "step": 34148
+ },
+ {
+ "epoch": 93.04904632152588,
+ "grad_norm": 2.4272661209106445,
+ "learning_rate": 2.5233650789722063e-07,
+ "loss": 0.0329,
+ "step": 34149
+ },
+ {
+ "epoch": 93.05177111716621,
+ "grad_norm": 2.615199565887451,
+ "learning_rate": 2.5213954868916425e-07,
+ "loss": 0.0225,
+ "step": 34150
+ },
+ {
+ "epoch": 93.05449591280654,
+ "grad_norm": 1.897565245628357,
+ "learning_rate": 2.519426653971302e-07,
+ "loss": 0.074,
+ "step": 34151
+ },
+ {
+ "epoch": 93.05722070844686,
+ "grad_norm": 2.6388299465179443,
+ "learning_rate": 2.517458580226528e-07,
+ "loss": 0.0837,
+ "step": 34152
+ },
+ {
+ "epoch": 93.0599455040872,
+ "grad_norm": 1.9054664373397827,
+ "learning_rate": 2.515491265672654e-07,
+ "loss": 0.0197,
+ "step": 34153
+ },
+ {
+ "epoch": 93.06267029972751,
+ "grad_norm": 2.1602330207824707,
+ "learning_rate": 2.513524710324999e-07,
+ "loss": 0.0283,
+ "step": 34154
+ },
+ {
+ "epoch": 93.06539509536785,
+ "grad_norm": 2.7745659351348877,
+ "learning_rate": 2.511558914198875e-07,
+ "loss": 0.1196,
+ "step": 34155
+ },
+ {
+ "epoch": 93.06811989100818,
+ "grad_norm": 2.5935699939727783,
+ "learning_rate": 2.5095938773095906e-07,
+ "loss": 0.0422,
+ "step": 34156
+ },
+ {
+ "epoch": 93.0708446866485,
+ "grad_norm": 2.0105862617492676,
+ "learning_rate": 2.5076295996724454e-07,
+ "loss": 0.0292,
+ "step": 34157
+ },
+ {
+ "epoch": 93.07356948228883,
+ "grad_norm": 2.6986520290374756,
+ "learning_rate": 2.5056660813027603e-07,
+ "loss": 0.0456,
+ "step": 34158
+ },
+ {
+ "epoch": 93.07629427792915,
+ "grad_norm": 3.2956032752990723,
+ "learning_rate": 2.5037033222158003e-07,
+ "loss": 0.1097,
+ "step": 34159
+ },
+ {
+ "epoch": 93.07901907356948,
+ "grad_norm": 2.2541451454162598,
+ "learning_rate": 2.501741322426854e-07,
+ "loss": 0.0521,
+ "step": 34160
+ },
+ {
+ "epoch": 93.0817438692098,
+ "grad_norm": 3.0680980682373047,
+ "learning_rate": 2.4997800819512086e-07,
+ "loss": 0.1117,
+ "step": 34161
+ },
+ {
+ "epoch": 93.08446866485014,
+ "grad_norm": 1.7472697496414185,
+ "learning_rate": 2.497819600804152e-07,
+ "loss": 0.0215,
+ "step": 34162
+ },
+ {
+ "epoch": 93.08719346049047,
+ "grad_norm": 2.953049421310425,
+ "learning_rate": 2.495859879000917e-07,
+ "loss": 0.0596,
+ "step": 34163
+ },
+ {
+ "epoch": 93.08991825613079,
+ "grad_norm": 2.394619941711426,
+ "learning_rate": 2.4939009165567904e-07,
+ "loss": 0.158,
+ "step": 34164
+ },
+ {
+ "epoch": 93.09264305177112,
+ "grad_norm": 2.5953469276428223,
+ "learning_rate": 2.491942713487039e-07,
+ "loss": 0.0652,
+ "step": 34165
+ },
+ {
+ "epoch": 93.09536784741144,
+ "grad_norm": 2.1170380115509033,
+ "learning_rate": 2.4899852698068937e-07,
+ "loss": 0.0165,
+ "step": 34166
+ },
+ {
+ "epoch": 93.09809264305177,
+ "grad_norm": 2.6129448413848877,
+ "learning_rate": 2.48802858553161e-07,
+ "loss": 0.0543,
+ "step": 34167
+ },
+ {
+ "epoch": 93.1008174386921,
+ "grad_norm": 2.3921217918395996,
+ "learning_rate": 2.4860726606764086e-07,
+ "loss": 0.1412,
+ "step": 34168
+ },
+ {
+ "epoch": 93.10354223433242,
+ "grad_norm": 2.644024133682251,
+ "learning_rate": 2.484117495256544e-07,
+ "loss": 0.1369,
+ "step": 34169
+ },
+ {
+ "epoch": 93.10626702997276,
+ "grad_norm": 2.567168951034546,
+ "learning_rate": 2.4821630892872375e-07,
+ "loss": 0.0346,
+ "step": 34170
+ },
+ {
+ "epoch": 93.10899182561307,
+ "grad_norm": 2.645113945007324,
+ "learning_rate": 2.48020944278371e-07,
+ "loss": 0.0458,
+ "step": 34171
+ },
+ {
+ "epoch": 93.11171662125341,
+ "grad_norm": 4.088079452514648,
+ "learning_rate": 2.4782565557611494e-07,
+ "loss": 0.0426,
+ "step": 34172
+ },
+ {
+ "epoch": 93.11444141689373,
+ "grad_norm": 3.1976189613342285,
+ "learning_rate": 2.4763044282348105e-07,
+ "loss": 0.1211,
+ "step": 34173
+ },
+ {
+ "epoch": 93.11716621253406,
+ "grad_norm": 1.549565076828003,
+ "learning_rate": 2.47435306021987e-07,
+ "loss": 0.056,
+ "step": 34174
+ },
+ {
+ "epoch": 93.11989100817439,
+ "grad_norm": 2.4160778522491455,
+ "learning_rate": 2.472402451731526e-07,
+ "loss": 0.0659,
+ "step": 34175
+ },
+ {
+ "epoch": 93.12261580381471,
+ "grad_norm": 3.090144395828247,
+ "learning_rate": 2.4704526027849675e-07,
+ "loss": 0.0466,
+ "step": 34176
+ },
+ {
+ "epoch": 93.12534059945504,
+ "grad_norm": 1.9743715524673462,
+ "learning_rate": 2.4685035133953926e-07,
+ "loss": 0.1164,
+ "step": 34177
+ },
+ {
+ "epoch": 93.12806539509536,
+ "grad_norm": 2.8321149349212646,
+ "learning_rate": 2.466555183577968e-07,
+ "loss": 0.0461,
+ "step": 34178
+ },
+ {
+ "epoch": 93.1307901907357,
+ "grad_norm": 3.1648738384246826,
+ "learning_rate": 2.4646076133478803e-07,
+ "loss": 0.0556,
+ "step": 34179
+ },
+ {
+ "epoch": 93.13351498637603,
+ "grad_norm": 1.6319115161895752,
+ "learning_rate": 2.4626608027202735e-07,
+ "loss": 0.0174,
+ "step": 34180
+ },
+ {
+ "epoch": 93.13623978201635,
+ "grad_norm": 2.7480781078338623,
+ "learning_rate": 2.4607147517103356e-07,
+ "loss": 0.0356,
+ "step": 34181
+ },
+ {
+ "epoch": 93.13896457765668,
+ "grad_norm": 3.361598014831543,
+ "learning_rate": 2.45876946033321e-07,
+ "loss": 0.1172,
+ "step": 34182
+ },
+ {
+ "epoch": 93.141689373297,
+ "grad_norm": 2.1728339195251465,
+ "learning_rate": 2.456824928604051e-07,
+ "loss": 0.1057,
+ "step": 34183
+ },
+ {
+ "epoch": 93.14441416893733,
+ "grad_norm": 2.9169201850891113,
+ "learning_rate": 2.454881156538003e-07,
+ "loss": 0.073,
+ "step": 34184
+ },
+ {
+ "epoch": 93.14713896457765,
+ "grad_norm": 1.6619789600372314,
+ "learning_rate": 2.4529381441501963e-07,
+ "loss": 0.0222,
+ "step": 34185
+ },
+ {
+ "epoch": 93.14986376021798,
+ "grad_norm": 3.128669500350952,
+ "learning_rate": 2.450995891455765e-07,
+ "loss": 0.0412,
+ "step": 34186
+ },
+ {
+ "epoch": 93.15258855585832,
+ "grad_norm": 3.3330488204956055,
+ "learning_rate": 2.449054398469852e-07,
+ "loss": 0.0367,
+ "step": 34187
+ },
+ {
+ "epoch": 93.15531335149863,
+ "grad_norm": 2.5604634284973145,
+ "learning_rate": 2.4471136652075454e-07,
+ "loss": 0.0289,
+ "step": 34188
+ },
+ {
+ "epoch": 93.15803814713897,
+ "grad_norm": 3.2581260204315186,
+ "learning_rate": 2.4451736916839884e-07,
+ "loss": 0.028,
+ "step": 34189
+ },
+ {
+ "epoch": 93.16076294277929,
+ "grad_norm": 2.336686134338379,
+ "learning_rate": 2.44323447791428e-07,
+ "loss": 0.052,
+ "step": 34190
+ },
+ {
+ "epoch": 93.16348773841962,
+ "grad_norm": 11.666519165039062,
+ "learning_rate": 2.44129602391352e-07,
+ "loss": 0.0311,
+ "step": 34191
+ },
+ {
+ "epoch": 93.16621253405995,
+ "grad_norm": 4.859091758728027,
+ "learning_rate": 2.439358329696795e-07,
+ "loss": 0.0224,
+ "step": 34192
+ },
+ {
+ "epoch": 93.16893732970027,
+ "grad_norm": 3.556523561477661,
+ "learning_rate": 2.437421395279216e-07,
+ "loss": 0.0548,
+ "step": 34193
+ },
+ {
+ "epoch": 93.1716621253406,
+ "grad_norm": 2.490582227706909,
+ "learning_rate": 2.4354852206758705e-07,
+ "loss": 0.1204,
+ "step": 34194
+ },
+ {
+ "epoch": 93.17438692098092,
+ "grad_norm": 3.8178818225860596,
+ "learning_rate": 2.4335498059018135e-07,
+ "loss": 0.0335,
+ "step": 34195
+ },
+ {
+ "epoch": 93.17711171662125,
+ "grad_norm": 2.508756637573242,
+ "learning_rate": 2.431615150972133e-07,
+ "loss": 0.0202,
+ "step": 34196
+ },
+ {
+ "epoch": 93.17983651226157,
+ "grad_norm": 2.6220171451568604,
+ "learning_rate": 2.4296812559018835e-07,
+ "loss": 0.0391,
+ "step": 34197
+ },
+ {
+ "epoch": 93.1825613079019,
+ "grad_norm": 6.727607727050781,
+ "learning_rate": 2.4277481207061527e-07,
+ "loss": 0.0764,
+ "step": 34198
+ },
+ {
+ "epoch": 93.18528610354224,
+ "grad_norm": 2.875270366668701,
+ "learning_rate": 2.425815745399973e-07,
+ "loss": 0.0705,
+ "step": 34199
+ },
+ {
+ "epoch": 93.18801089918256,
+ "grad_norm": 3.164824962615967,
+ "learning_rate": 2.4238841299983997e-07,
+ "loss": 0.1021,
+ "step": 34200
+ },
+ {
+ "epoch": 93.19073569482289,
+ "grad_norm": 2.8297324180603027,
+ "learning_rate": 2.421953274516464e-07,
+ "loss": 0.0582,
+ "step": 34201
+ },
+ {
+ "epoch": 93.19346049046321,
+ "grad_norm": 2.2060811519622803,
+ "learning_rate": 2.420023178969233e-07,
+ "loss": 0.0214,
+ "step": 34202
+ },
+ {
+ "epoch": 93.19618528610354,
+ "grad_norm": 1.5179919004440308,
+ "learning_rate": 2.418093843371716e-07,
+ "loss": 0.0166,
+ "step": 34203
+ },
+ {
+ "epoch": 93.19891008174388,
+ "grad_norm": 2.476790189743042,
+ "learning_rate": 2.416165267738946e-07,
+ "loss": 0.0463,
+ "step": 34204
+ },
+ {
+ "epoch": 93.2016348773842,
+ "grad_norm": 3.1280102729797363,
+ "learning_rate": 2.414237452085932e-07,
+ "loss": 0.2226,
+ "step": 34205
+ },
+ {
+ "epoch": 93.20435967302453,
+ "grad_norm": 2.301055431365967,
+ "learning_rate": 2.4123103964277085e-07,
+ "loss": 0.0308,
+ "step": 34206
+ },
+ {
+ "epoch": 93.20708446866485,
+ "grad_norm": 2.773564338684082,
+ "learning_rate": 2.410384100779262e-07,
+ "loss": 0.0365,
+ "step": 34207
+ },
+ {
+ "epoch": 93.20980926430518,
+ "grad_norm": 2.866030693054199,
+ "learning_rate": 2.4084585651556025e-07,
+ "loss": 0.1479,
+ "step": 34208
+ },
+ {
+ "epoch": 93.2125340599455,
+ "grad_norm": 1.6615641117095947,
+ "learning_rate": 2.40653378957173e-07,
+ "loss": 0.0245,
+ "step": 34209
+ },
+ {
+ "epoch": 93.21525885558583,
+ "grad_norm": 2.9816291332244873,
+ "learning_rate": 2.404609774042632e-07,
+ "loss": 0.0344,
+ "step": 34210
+ },
+ {
+ "epoch": 93.21798365122616,
+ "grad_norm": 2.267970561981201,
+ "learning_rate": 2.402686518583297e-07,
+ "loss": 0.0972,
+ "step": 34211
+ },
+ {
+ "epoch": 93.22070844686648,
+ "grad_norm": 2.694411516189575,
+ "learning_rate": 2.4007640232086793e-07,
+ "loss": 0.0242,
+ "step": 34212
+ },
+ {
+ "epoch": 93.22343324250681,
+ "grad_norm": 1.6629489660263062,
+ "learning_rate": 2.398842287933789e-07,
+ "loss": 0.0738,
+ "step": 34213
+ },
+ {
+ "epoch": 93.22615803814713,
+ "grad_norm": 2.829502582550049,
+ "learning_rate": 2.396921312773559e-07,
+ "loss": 0.0413,
+ "step": 34214
+ },
+ {
+ "epoch": 93.22888283378747,
+ "grad_norm": 1.7646427154541016,
+ "learning_rate": 2.395001097742977e-07,
+ "loss": 0.0263,
+ "step": 34215
+ },
+ {
+ "epoch": 93.2316076294278,
+ "grad_norm": 3.0148816108703613,
+ "learning_rate": 2.393081642856976e-07,
+ "loss": 0.0272,
+ "step": 34216
+ },
+ {
+ "epoch": 93.23433242506812,
+ "grad_norm": 2.923034191131592,
+ "learning_rate": 2.39116294813051e-07,
+ "loss": 0.0519,
+ "step": 34217
+ },
+ {
+ "epoch": 93.23705722070845,
+ "grad_norm": 3.248408794403076,
+ "learning_rate": 2.3892450135785447e-07,
+ "loss": 0.1798,
+ "step": 34218
+ },
+ {
+ "epoch": 93.23978201634877,
+ "grad_norm": 3.2799253463745117,
+ "learning_rate": 2.3873278392159806e-07,
+ "loss": 0.0405,
+ "step": 34219
+ },
+ {
+ "epoch": 93.2425068119891,
+ "grad_norm": 3.820754289627075,
+ "learning_rate": 2.385411425057782e-07,
+ "loss": 0.0569,
+ "step": 34220
+ },
+ {
+ "epoch": 93.24523160762942,
+ "grad_norm": 2.1387405395507812,
+ "learning_rate": 2.3834957711188378e-07,
+ "loss": 0.0413,
+ "step": 34221
+ },
+ {
+ "epoch": 93.24795640326975,
+ "grad_norm": 2.9989240169525146,
+ "learning_rate": 2.3815808774141025e-07,
+ "loss": 0.0516,
+ "step": 34222
+ },
+ {
+ "epoch": 93.25068119891009,
+ "grad_norm": 2.485605001449585,
+ "learning_rate": 2.379666743958464e-07,
+ "loss": 0.0338,
+ "step": 34223
+ },
+ {
+ "epoch": 93.2534059945504,
+ "grad_norm": 3.5497841835021973,
+ "learning_rate": 2.3777533707668444e-07,
+ "loss": 0.1429,
+ "step": 34224
+ },
+ {
+ "epoch": 93.25613079019074,
+ "grad_norm": 4.257180690765381,
+ "learning_rate": 2.375840757854131e-07,
+ "loss": 0.0999,
+ "step": 34225
+ },
+ {
+ "epoch": 93.25885558583106,
+ "grad_norm": 2.6541223526000977,
+ "learning_rate": 2.3739289052352344e-07,
+ "loss": 0.0505,
+ "step": 34226
+ },
+ {
+ "epoch": 93.26158038147139,
+ "grad_norm": 2.5403902530670166,
+ "learning_rate": 2.3720178129250425e-07,
+ "loss": 0.1491,
+ "step": 34227
+ },
+ {
+ "epoch": 93.26430517711172,
+ "grad_norm": 1.8508092164993286,
+ "learning_rate": 2.3701074809384327e-07,
+ "loss": 0.0757,
+ "step": 34228
+ },
+ {
+ "epoch": 93.26702997275204,
+ "grad_norm": 4.365070819854736,
+ "learning_rate": 2.3681979092902706e-07,
+ "loss": 0.0883,
+ "step": 34229
+ },
+ {
+ "epoch": 93.26975476839237,
+ "grad_norm": 2.5791027545928955,
+ "learning_rate": 2.3662890979954556e-07,
+ "loss": 0.0205,
+ "step": 34230
+ },
+ {
+ "epoch": 93.2724795640327,
+ "grad_norm": 2.260385036468506,
+ "learning_rate": 2.36438104706882e-07,
+ "loss": 0.031,
+ "step": 34231
+ },
+ {
+ "epoch": 93.27520435967303,
+ "grad_norm": 3.0480616092681885,
+ "learning_rate": 2.362473756525263e-07,
+ "loss": 0.0362,
+ "step": 34232
+ },
+ {
+ "epoch": 93.27792915531334,
+ "grad_norm": 2.6555707454681396,
+ "learning_rate": 2.3605672263796066e-07,
+ "loss": 0.0336,
+ "step": 34233
+ },
+ {
+ "epoch": 93.28065395095368,
+ "grad_norm": 5.330408573150635,
+ "learning_rate": 2.358661456646716e-07,
+ "loss": 0.0981,
+ "step": 34234
+ },
+ {
+ "epoch": 93.28337874659401,
+ "grad_norm": 1.8813849687576294,
+ "learning_rate": 2.3567564473414239e-07,
+ "loss": 0.0253,
+ "step": 34235
+ },
+ {
+ "epoch": 93.28610354223433,
+ "grad_norm": 3.5582058429718018,
+ "learning_rate": 2.3548521984785745e-07,
+ "loss": 0.0325,
+ "step": 34236
+ },
+ {
+ "epoch": 93.28882833787466,
+ "grad_norm": 2.186025857925415,
+ "learning_rate": 2.3529487100729774e-07,
+ "loss": 0.1027,
+ "step": 34237
+ },
+ {
+ "epoch": 93.29155313351498,
+ "grad_norm": 1.7551841735839844,
+ "learning_rate": 2.3510459821394883e-07,
+ "loss": 0.0227,
+ "step": 34238
+ },
+ {
+ "epoch": 93.29427792915531,
+ "grad_norm": 5.63027286529541,
+ "learning_rate": 2.3491440146929168e-07,
+ "loss": 0.1174,
+ "step": 34239
+ },
+ {
+ "epoch": 93.29700272479565,
+ "grad_norm": 3.5584611892700195,
+ "learning_rate": 2.3472428077480625e-07,
+ "loss": 0.0759,
+ "step": 34240
+ },
+ {
+ "epoch": 93.29972752043597,
+ "grad_norm": 1.5529555082321167,
+ "learning_rate": 2.3453423613197245e-07,
+ "loss": 0.0208,
+ "step": 34241
+ },
+ {
+ "epoch": 93.3024523160763,
+ "grad_norm": 2.823137044906616,
+ "learning_rate": 2.3434426754227358e-07,
+ "loss": 0.0649,
+ "step": 34242
+ },
+ {
+ "epoch": 93.30517711171662,
+ "grad_norm": 2.305696964263916,
+ "learning_rate": 2.3415437500718618e-07,
+ "loss": 0.0302,
+ "step": 34243
+ },
+ {
+ "epoch": 93.30790190735695,
+ "grad_norm": 2.765134811401367,
+ "learning_rate": 2.3396455852819133e-07,
+ "loss": 0.0973,
+ "step": 34244
+ },
+ {
+ "epoch": 93.31062670299727,
+ "grad_norm": 2.4256081581115723,
+ "learning_rate": 2.337748181067645e-07,
+ "loss": 0.0542,
+ "step": 34245
+ },
+ {
+ "epoch": 93.3133514986376,
+ "grad_norm": 3.1596426963806152,
+ "learning_rate": 2.335851537443856e-07,
+ "loss": 0.1633,
+ "step": 34246
+ },
+ {
+ "epoch": 93.31607629427793,
+ "grad_norm": 2.5621795654296875,
+ "learning_rate": 2.3339556544253238e-07,
+ "loss": 0.0685,
+ "step": 34247
+ },
+ {
+ "epoch": 93.31880108991825,
+ "grad_norm": 2.953115701675415,
+ "learning_rate": 2.332060532026792e-07,
+ "loss": 0.0967,
+ "step": 34248
+ },
+ {
+ "epoch": 93.32152588555859,
+ "grad_norm": 1.5390170812606812,
+ "learning_rate": 2.3301661702630153e-07,
+ "loss": 0.023,
+ "step": 34249
+ },
+ {
+ "epoch": 93.3242506811989,
+ "grad_norm": 3.682244300842285,
+ "learning_rate": 2.3282725691487817e-07,
+ "loss": 0.0305,
+ "step": 34250
+ },
+ {
+ "epoch": 93.32697547683924,
+ "grad_norm": 2.5427091121673584,
+ "learning_rate": 2.3263797286988132e-07,
+ "loss": 0.042,
+ "step": 34251
+ },
+ {
+ "epoch": 93.32970027247957,
+ "grad_norm": 1.9223684072494507,
+ "learning_rate": 2.3244876489278534e-07,
+ "loss": 0.0358,
+ "step": 34252
+ },
+ {
+ "epoch": 93.33242506811989,
+ "grad_norm": 1.8607436418533325,
+ "learning_rate": 2.3225963298506348e-07,
+ "loss": 0.0421,
+ "step": 34253
+ },
+ {
+ "epoch": 93.33514986376022,
+ "grad_norm": 3.368166446685791,
+ "learning_rate": 2.3207057714819015e-07,
+ "loss": 0.031,
+ "step": 34254
+ },
+ {
+ "epoch": 93.33787465940054,
+ "grad_norm": 2.6873717308044434,
+ "learning_rate": 2.3188159738363637e-07,
+ "loss": 0.0496,
+ "step": 34255
+ },
+ {
+ "epoch": 93.34059945504087,
+ "grad_norm": 1.9688893556594849,
+ "learning_rate": 2.316926936928754e-07,
+ "loss": 0.0509,
+ "step": 34256
+ },
+ {
+ "epoch": 93.34332425068119,
+ "grad_norm": 2.0882997512817383,
+ "learning_rate": 2.3150386607737497e-07,
+ "loss": 0.0204,
+ "step": 34257
+ },
+ {
+ "epoch": 93.34604904632153,
+ "grad_norm": 1.618839144706726,
+ "learning_rate": 2.3131511453861056e-07,
+ "loss": 0.0216,
+ "step": 34258
+ },
+ {
+ "epoch": 93.34877384196186,
+ "grad_norm": 2.171215534210205,
+ "learning_rate": 2.3112643907804877e-07,
+ "loss": 0.0214,
+ "step": 34259
+ },
+ {
+ "epoch": 93.35149863760218,
+ "grad_norm": 2.2503678798675537,
+ "learning_rate": 2.3093783969715954e-07,
+ "loss": 0.0209,
+ "step": 34260
+ },
+ {
+ "epoch": 93.35422343324251,
+ "grad_norm": 3.4730801582336426,
+ "learning_rate": 2.3074931639741172e-07,
+ "loss": 0.0775,
+ "step": 34261
+ },
+ {
+ "epoch": 93.35694822888283,
+ "grad_norm": 1.5985684394836426,
+ "learning_rate": 2.305608691802741e-07,
+ "loss": 0.018,
+ "step": 34262
+ },
+ {
+ "epoch": 93.35967302452316,
+ "grad_norm": 2.013010025024414,
+ "learning_rate": 2.303724980472144e-07,
+ "loss": 0.0174,
+ "step": 34263
+ },
+ {
+ "epoch": 93.3623978201635,
+ "grad_norm": 2.307169198989868,
+ "learning_rate": 2.3018420299969924e-07,
+ "loss": 0.0526,
+ "step": 34264
+ },
+ {
+ "epoch": 93.36512261580381,
+ "grad_norm": 3.5073304176330566,
+ "learning_rate": 2.299959840391941e-07,
+ "loss": 0.0499,
+ "step": 34265
+ },
+ {
+ "epoch": 93.36784741144415,
+ "grad_norm": 2.8495914936065674,
+ "learning_rate": 2.298078411671656e-07,
+ "loss": 0.0715,
+ "step": 34266
+ },
+ {
+ "epoch": 93.37057220708446,
+ "grad_norm": 3.1446921825408936,
+ "learning_rate": 2.2961977438508033e-07,
+ "loss": 0.0734,
+ "step": 34267
+ },
+ {
+ "epoch": 93.3732970027248,
+ "grad_norm": 2.7543461322784424,
+ "learning_rate": 2.2943178369440155e-07,
+ "loss": 0.1745,
+ "step": 34268
+ },
+ {
+ "epoch": 93.37602179836512,
+ "grad_norm": 2.799346923828125,
+ "learning_rate": 2.292438690965937e-07,
+ "loss": 0.0898,
+ "step": 34269
+ },
+ {
+ "epoch": 93.37874659400545,
+ "grad_norm": 3.420541524887085,
+ "learning_rate": 2.2905603059311998e-07,
+ "loss": 0.0635,
+ "step": 34270
+ },
+ {
+ "epoch": 93.38147138964578,
+ "grad_norm": 2.3576390743255615,
+ "learning_rate": 2.2886826818544262e-07,
+ "loss": 0.0312,
+ "step": 34271
+ },
+ {
+ "epoch": 93.3841961852861,
+ "grad_norm": 1.5556529760360718,
+ "learning_rate": 2.2868058187502595e-07,
+ "loss": 0.0141,
+ "step": 34272
+ },
+ {
+ "epoch": 93.38692098092643,
+ "grad_norm": 1.5678285360336304,
+ "learning_rate": 2.2849297166332996e-07,
+ "loss": 0.0245,
+ "step": 34273
+ },
+ {
+ "epoch": 93.38964577656675,
+ "grad_norm": 2.376685857772827,
+ "learning_rate": 2.2830543755181566e-07,
+ "loss": 0.1673,
+ "step": 34274
+ },
+ {
+ "epoch": 93.39237057220708,
+ "grad_norm": 2.1394050121307373,
+ "learning_rate": 2.2811797954194527e-07,
+ "loss": 0.0282,
+ "step": 34275
+ },
+ {
+ "epoch": 93.39509536784742,
+ "grad_norm": 2.103039264678955,
+ "learning_rate": 2.2793059763517756e-07,
+ "loss": 0.0496,
+ "step": 34276
+ },
+ {
+ "epoch": 93.39782016348774,
+ "grad_norm": 1.8962243795394897,
+ "learning_rate": 2.277432918329703e-07,
+ "loss": 0.0658,
+ "step": 34277
+ },
+ {
+ "epoch": 93.40054495912807,
+ "grad_norm": 2.451472759246826,
+ "learning_rate": 2.2755606213678448e-07,
+ "loss": 0.0565,
+ "step": 34278
+ },
+ {
+ "epoch": 93.40326975476839,
+ "grad_norm": 2.0736703872680664,
+ "learning_rate": 2.2736890854807792e-07,
+ "loss": 0.0239,
+ "step": 34279
+ },
+ {
+ "epoch": 93.40599455040872,
+ "grad_norm": 3.8964591026306152,
+ "learning_rate": 2.2718183106830826e-07,
+ "loss": 0.0884,
+ "step": 34280
+ },
+ {
+ "epoch": 93.40871934604904,
+ "grad_norm": 3.147368907928467,
+ "learning_rate": 2.2699482969892994e-07,
+ "loss": 0.0358,
+ "step": 34281
+ },
+ {
+ "epoch": 93.41144414168937,
+ "grad_norm": 3.8105955123901367,
+ "learning_rate": 2.2680790444140287e-07,
+ "loss": 0.0969,
+ "step": 34282
+ },
+ {
+ "epoch": 93.4141689373297,
+ "grad_norm": 3.1020357608795166,
+ "learning_rate": 2.2662105529718036e-07,
+ "loss": 0.0388,
+ "step": 34283
+ },
+ {
+ "epoch": 93.41689373297002,
+ "grad_norm": 2.4139652252197266,
+ "learning_rate": 2.2643428226772013e-07,
+ "loss": 0.0501,
+ "step": 34284
+ },
+ {
+ "epoch": 93.41961852861036,
+ "grad_norm": 2.5008866786956787,
+ "learning_rate": 2.2624758535447432e-07,
+ "loss": 0.0276,
+ "step": 34285
+ },
+ {
+ "epoch": 93.42234332425068,
+ "grad_norm": 3.279120683670044,
+ "learning_rate": 2.2606096455889736e-07,
+ "loss": 0.1095,
+ "step": 34286
+ },
+ {
+ "epoch": 93.42506811989101,
+ "grad_norm": 3.0299057960510254,
+ "learning_rate": 2.2587441988244362e-07,
+ "loss": 0.0421,
+ "step": 34287
+ },
+ {
+ "epoch": 93.42779291553134,
+ "grad_norm": 2.426337718963623,
+ "learning_rate": 2.256879513265653e-07,
+ "loss": 0.028,
+ "step": 34288
+ },
+ {
+ "epoch": 93.43051771117166,
+ "grad_norm": 3.697620391845703,
+ "learning_rate": 2.2550155889271453e-07,
+ "loss": 0.0427,
+ "step": 34289
+ },
+ {
+ "epoch": 93.433242506812,
+ "grad_norm": 2.769820213317871,
+ "learning_rate": 2.2531524258234238e-07,
+ "loss": 0.0496,
+ "step": 34290
+ },
+ {
+ "epoch": 93.43596730245231,
+ "grad_norm": 1.7424660921096802,
+ "learning_rate": 2.2512900239690104e-07,
+ "loss": 0.1147,
+ "step": 34291
+ },
+ {
+ "epoch": 93.43869209809264,
+ "grad_norm": 1.9787771701812744,
+ "learning_rate": 2.2494283833784047e-07,
+ "loss": 0.0147,
+ "step": 34292
+ },
+ {
+ "epoch": 93.44141689373296,
+ "grad_norm": 2.9561150074005127,
+ "learning_rate": 2.247567504066106e-07,
+ "loss": 0.1082,
+ "step": 34293
+ },
+ {
+ "epoch": 93.4441416893733,
+ "grad_norm": 3.1463584899902344,
+ "learning_rate": 2.2457073860466028e-07,
+ "loss": 0.0487,
+ "step": 34294
+ },
+ {
+ "epoch": 93.44686648501363,
+ "grad_norm": 1.4194004535675049,
+ "learning_rate": 2.2438480293343833e-07,
+ "loss": 0.0172,
+ "step": 34295
+ },
+ {
+ "epoch": 93.44959128065395,
+ "grad_norm": 3.0458099842071533,
+ "learning_rate": 2.2419894339439364e-07,
+ "loss": 0.0996,
+ "step": 34296
+ },
+ {
+ "epoch": 93.45231607629428,
+ "grad_norm": 2.9101486206054688,
+ "learning_rate": 2.2401315998897166e-07,
+ "loss": 0.0496,
+ "step": 34297
+ },
+ {
+ "epoch": 93.4550408719346,
+ "grad_norm": 1.791276216506958,
+ "learning_rate": 2.2382745271862128e-07,
+ "loss": 0.0283,
+ "step": 34298
+ },
+ {
+ "epoch": 93.45776566757493,
+ "grad_norm": 2.2020905017852783,
+ "learning_rate": 2.2364182158478797e-07,
+ "loss": 0.0927,
+ "step": 34299
+ },
+ {
+ "epoch": 93.46049046321527,
+ "grad_norm": 3.559235095977783,
+ "learning_rate": 2.2345626658891728e-07,
+ "loss": 0.0484,
+ "step": 34300
+ },
+ {
+ "epoch": 93.46321525885558,
+ "grad_norm": 2.6800601482391357,
+ "learning_rate": 2.232707877324547e-07,
+ "loss": 0.1808,
+ "step": 34301
+ },
+ {
+ "epoch": 93.46594005449592,
+ "grad_norm": 2.735093832015991,
+ "learning_rate": 2.2308538501684464e-07,
+ "loss": 0.0293,
+ "step": 34302
+ },
+ {
+ "epoch": 93.46866485013624,
+ "grad_norm": 1.8304994106292725,
+ "learning_rate": 2.2290005844353145e-07,
+ "loss": 0.0239,
+ "step": 34303
+ },
+ {
+ "epoch": 93.47138964577657,
+ "grad_norm": 1.9497863054275513,
+ "learning_rate": 2.227148080139574e-07,
+ "loss": 0.0234,
+ "step": 34304
+ },
+ {
+ "epoch": 93.47411444141689,
+ "grad_norm": 2.7205569744110107,
+ "learning_rate": 2.2252963372956572e-07,
+ "loss": 0.0502,
+ "step": 34305
+ },
+ {
+ "epoch": 93.47683923705722,
+ "grad_norm": 3.152188301086426,
+ "learning_rate": 2.2234453559179858e-07,
+ "loss": 0.056,
+ "step": 34306
+ },
+ {
+ "epoch": 93.47956403269755,
+ "grad_norm": 3.2019495964050293,
+ "learning_rate": 2.221595136020971e-07,
+ "loss": 0.0511,
+ "step": 34307
+ },
+ {
+ "epoch": 93.48228882833787,
+ "grad_norm": 2.1643855571746826,
+ "learning_rate": 2.219745677619034e-07,
+ "loss": 0.0601,
+ "step": 34308
+ },
+ {
+ "epoch": 93.4850136239782,
+ "grad_norm": 3.378383159637451,
+ "learning_rate": 2.217896980726575e-07,
+ "loss": 0.0843,
+ "step": 34309
+ },
+ {
+ "epoch": 93.48773841961852,
+ "grad_norm": 1.9036085605621338,
+ "learning_rate": 2.2160490453579707e-07,
+ "loss": 0.0252,
+ "step": 34310
+ },
+ {
+ "epoch": 93.49046321525886,
+ "grad_norm": 2.122843027114868,
+ "learning_rate": 2.2142018715276437e-07,
+ "loss": 0.0597,
+ "step": 34311
+ },
+ {
+ "epoch": 93.49318801089919,
+ "grad_norm": 2.473475694656372,
+ "learning_rate": 2.2123554592499598e-07,
+ "loss": 0.0629,
+ "step": 34312
+ },
+ {
+ "epoch": 93.49591280653951,
+ "grad_norm": 2.287557363510132,
+ "learning_rate": 2.2105098085393073e-07,
+ "loss": 0.0385,
+ "step": 34313
+ },
+ {
+ "epoch": 93.49863760217984,
+ "grad_norm": 3.523827075958252,
+ "learning_rate": 2.208664919410053e-07,
+ "loss": 0.0415,
+ "step": 34314
+ },
+ {
+ "epoch": 93.50136239782016,
+ "grad_norm": 1.7135145664215088,
+ "learning_rate": 2.2068207918765738e-07,
+ "loss": 0.0199,
+ "step": 34315
+ },
+ {
+ "epoch": 93.50408719346049,
+ "grad_norm": 2.7096970081329346,
+ "learning_rate": 2.2049774259532253e-07,
+ "loss": 0.1068,
+ "step": 34316
+ },
+ {
+ "epoch": 93.50681198910081,
+ "grad_norm": 2.7034780979156494,
+ "learning_rate": 2.2031348216543514e-07,
+ "loss": 0.0798,
+ "step": 34317
+ },
+ {
+ "epoch": 93.50953678474114,
+ "grad_norm": 2.822631359100342,
+ "learning_rate": 2.2012929789943183e-07,
+ "loss": 0.0187,
+ "step": 34318
+ },
+ {
+ "epoch": 93.51226158038148,
+ "grad_norm": 1.7559870481491089,
+ "learning_rate": 2.1994518979874812e-07,
+ "loss": 0.0385,
+ "step": 34319
+ },
+ {
+ "epoch": 93.5149863760218,
+ "grad_norm": 3.9192328453063965,
+ "learning_rate": 2.197611578648162e-07,
+ "loss": 0.0231,
+ "step": 34320
+ },
+ {
+ "epoch": 93.51771117166213,
+ "grad_norm": 2.06367826461792,
+ "learning_rate": 2.195772020990705e-07,
+ "loss": 0.0432,
+ "step": 34321
+ },
+ {
+ "epoch": 93.52043596730245,
+ "grad_norm": 2.2036385536193848,
+ "learning_rate": 2.19393322502941e-07,
+ "loss": 0.0238,
+ "step": 34322
+ },
+ {
+ "epoch": 93.52316076294278,
+ "grad_norm": 2.166105270385742,
+ "learning_rate": 2.1920951907786204e-07,
+ "loss": 0.1484,
+ "step": 34323
+ },
+ {
+ "epoch": 93.52588555858311,
+ "grad_norm": 2.125516653060913,
+ "learning_rate": 2.1902579182526584e-07,
+ "loss": 0.0339,
+ "step": 34324
+ },
+ {
+ "epoch": 93.52861035422343,
+ "grad_norm": 2.5359044075012207,
+ "learning_rate": 2.1884214074658127e-07,
+ "loss": 0.061,
+ "step": 34325
+ },
+ {
+ "epoch": 93.53133514986376,
+ "grad_norm": 4.177691459655762,
+ "learning_rate": 2.186585658432383e-07,
+ "loss": 0.1618,
+ "step": 34326
+ },
+ {
+ "epoch": 93.53405994550408,
+ "grad_norm": 4.603385925292969,
+ "learning_rate": 2.18475067116668e-07,
+ "loss": 0.0564,
+ "step": 34327
+ },
+ {
+ "epoch": 93.53678474114442,
+ "grad_norm": 3.4245223999023438,
+ "learning_rate": 2.1829164456829922e-07,
+ "loss": 0.0345,
+ "step": 34328
+ },
+ {
+ "epoch": 93.53950953678473,
+ "grad_norm": 4.157337665557861,
+ "learning_rate": 2.181082981995608e-07,
+ "loss": 0.0201,
+ "step": 34329
+ },
+ {
+ "epoch": 93.54223433242507,
+ "grad_norm": 2.2463536262512207,
+ "learning_rate": 2.1792502801187944e-07,
+ "loss": 0.0282,
+ "step": 34330
+ },
+ {
+ "epoch": 93.5449591280654,
+ "grad_norm": 3.085951805114746,
+ "learning_rate": 2.177418340066839e-07,
+ "loss": 0.0392,
+ "step": 34331
+ },
+ {
+ "epoch": 93.54768392370572,
+ "grad_norm": 2.7970926761627197,
+ "learning_rate": 2.1755871618539981e-07,
+ "loss": 0.0347,
+ "step": 34332
+ },
+ {
+ "epoch": 93.55040871934605,
+ "grad_norm": 3.0887789726257324,
+ "learning_rate": 2.1737567454945374e-07,
+ "loss": 0.0295,
+ "step": 34333
+ },
+ {
+ "epoch": 93.55313351498637,
+ "grad_norm": 2.192136526107788,
+ "learning_rate": 2.1719270910027013e-07,
+ "loss": 0.0428,
+ "step": 34334
+ },
+ {
+ "epoch": 93.5558583106267,
+ "grad_norm": 1.9388835430145264,
+ "learning_rate": 2.1700981983927448e-07,
+ "loss": 0.0249,
+ "step": 34335
+ },
+ {
+ "epoch": 93.55858310626704,
+ "grad_norm": 2.0230979919433594,
+ "learning_rate": 2.1682700676789236e-07,
+ "loss": 0.0259,
+ "step": 34336
+ },
+ {
+ "epoch": 93.56130790190736,
+ "grad_norm": 2.2906877994537354,
+ "learning_rate": 2.1664426988754705e-07,
+ "loss": 0.0628,
+ "step": 34337
+ },
+ {
+ "epoch": 93.56403269754769,
+ "grad_norm": 3.3800113201141357,
+ "learning_rate": 2.1646160919966076e-07,
+ "loss": 0.1021,
+ "step": 34338
+ },
+ {
+ "epoch": 93.566757493188,
+ "grad_norm": 1.5669342279434204,
+ "learning_rate": 2.1627902470565675e-07,
+ "loss": 0.1427,
+ "step": 34339
+ },
+ {
+ "epoch": 93.56948228882834,
+ "grad_norm": 3.2367019653320312,
+ "learning_rate": 2.1609651640695727e-07,
+ "loss": 0.0375,
+ "step": 34340
+ },
+ {
+ "epoch": 93.57220708446866,
+ "grad_norm": 2.5182316303253174,
+ "learning_rate": 2.159140843049834e-07,
+ "loss": 0.0315,
+ "step": 34341
+ },
+ {
+ "epoch": 93.57493188010899,
+ "grad_norm": 3.962669610977173,
+ "learning_rate": 2.1573172840115397e-07,
+ "loss": 0.0244,
+ "step": 34342
+ },
+ {
+ "epoch": 93.57765667574932,
+ "grad_norm": 2.234757423400879,
+ "learning_rate": 2.155494486968923e-07,
+ "loss": 0.0802,
+ "step": 34343
+ },
+ {
+ "epoch": 93.58038147138964,
+ "grad_norm": 4.146871566772461,
+ "learning_rate": 2.153672451936173e-07,
+ "loss": 0.188,
+ "step": 34344
+ },
+ {
+ "epoch": 93.58310626702998,
+ "grad_norm": 3.737558603286743,
+ "learning_rate": 2.1518511789274666e-07,
+ "loss": 0.0419,
+ "step": 34345
+ },
+ {
+ "epoch": 93.5858310626703,
+ "grad_norm": 2.5635979175567627,
+ "learning_rate": 2.1500306679569816e-07,
+ "loss": 0.0322,
+ "step": 34346
+ },
+ {
+ "epoch": 93.58855585831063,
+ "grad_norm": 2.7324888706207275,
+ "learning_rate": 2.1482109190389178e-07,
+ "loss": 0.0655,
+ "step": 34347
+ },
+ {
+ "epoch": 93.59128065395096,
+ "grad_norm": 2.9860117435455322,
+ "learning_rate": 2.1463919321874415e-07,
+ "loss": 0.1257,
+ "step": 34348
+ },
+ {
+ "epoch": 93.59400544959128,
+ "grad_norm": 6.02388334274292,
+ "learning_rate": 2.1445737074167194e-07,
+ "loss": 0.1173,
+ "step": 34349
+ },
+ {
+ "epoch": 93.59673024523161,
+ "grad_norm": 2.5729589462280273,
+ "learning_rate": 2.1427562447408957e-07,
+ "loss": 0.095,
+ "step": 34350
+ },
+ {
+ "epoch": 93.59945504087193,
+ "grad_norm": 6.943117141723633,
+ "learning_rate": 2.1409395441741477e-07,
+ "loss": 0.0283,
+ "step": 34351
+ },
+ {
+ "epoch": 93.60217983651226,
+ "grad_norm": 3.964367151260376,
+ "learning_rate": 2.1391236057305974e-07,
+ "loss": 0.072,
+ "step": 34352
+ },
+ {
+ "epoch": 93.60490463215258,
+ "grad_norm": 2.762946605682373,
+ "learning_rate": 2.1373084294244118e-07,
+ "loss": 0.0445,
+ "step": 34353
+ },
+ {
+ "epoch": 93.60762942779292,
+ "grad_norm": 2.5655124187469482,
+ "learning_rate": 2.1354940152697234e-07,
+ "loss": 0.0266,
+ "step": 34354
+ },
+ {
+ "epoch": 93.61035422343325,
+ "grad_norm": 1.9681520462036133,
+ "learning_rate": 2.1336803632806436e-07,
+ "loss": 0.0277,
+ "step": 34355
+ },
+ {
+ "epoch": 93.61307901907357,
+ "grad_norm": 2.3756961822509766,
+ "learning_rate": 2.1318674734713273e-07,
+ "loss": 0.093,
+ "step": 34356
+ },
+ {
+ "epoch": 93.6158038147139,
+ "grad_norm": 4.2671918869018555,
+ "learning_rate": 2.130055345855875e-07,
+ "loss": 0.107,
+ "step": 34357
+ },
+ {
+ "epoch": 93.61852861035422,
+ "grad_norm": 4.12216854095459,
+ "learning_rate": 2.1282439804483966e-07,
+ "loss": 0.0344,
+ "step": 34358
+ },
+ {
+ "epoch": 93.62125340599455,
+ "grad_norm": 2.038247585296631,
+ "learning_rate": 2.126433377263004e-07,
+ "loss": 0.1056,
+ "step": 34359
+ },
+ {
+ "epoch": 93.62397820163488,
+ "grad_norm": 2.291226863861084,
+ "learning_rate": 2.1246235363137968e-07,
+ "loss": 0.0285,
+ "step": 34360
+ },
+ {
+ "epoch": 93.6267029972752,
+ "grad_norm": 4.159404277801514,
+ "learning_rate": 2.1228144576148857e-07,
+ "loss": 0.055,
+ "step": 34361
+ },
+ {
+ "epoch": 93.62942779291554,
+ "grad_norm": 2.844003438949585,
+ "learning_rate": 2.1210061411803262e-07,
+ "loss": 0.0615,
+ "step": 34362
+ },
+ {
+ "epoch": 93.63215258855585,
+ "grad_norm": 2.2398364543914795,
+ "learning_rate": 2.1191985870242293e-07,
+ "loss": 0.0427,
+ "step": 34363
+ },
+ {
+ "epoch": 93.63487738419619,
+ "grad_norm": 3.2485857009887695,
+ "learning_rate": 2.1173917951606615e-07,
+ "loss": 0.019,
+ "step": 34364
+ },
+ {
+ "epoch": 93.6376021798365,
+ "grad_norm": 2.3822646141052246,
+ "learning_rate": 2.1155857656037004e-07,
+ "loss": 0.029,
+ "step": 34365
+ },
+ {
+ "epoch": 93.64032697547684,
+ "grad_norm": 1.5049999952316284,
+ "learning_rate": 2.1137804983674014e-07,
+ "loss": 0.0185,
+ "step": 34366
+ },
+ {
+ "epoch": 93.64305177111717,
+ "grad_norm": 2.549562692642212,
+ "learning_rate": 2.1119759934658313e-07,
+ "loss": 0.0777,
+ "step": 34367
+ },
+ {
+ "epoch": 93.64577656675749,
+ "grad_norm": 1.8893696069717407,
+ "learning_rate": 2.110172250913045e-07,
+ "loss": 0.0235,
+ "step": 34368
+ },
+ {
+ "epoch": 93.64850136239782,
+ "grad_norm": 6.346429824829102,
+ "learning_rate": 2.1083692707230763e-07,
+ "loss": 0.0666,
+ "step": 34369
+ },
+ {
+ "epoch": 93.65122615803814,
+ "grad_norm": 2.1284542083740234,
+ "learning_rate": 2.1065670529099914e-07,
+ "loss": 0.0283,
+ "step": 34370
+ },
+ {
+ "epoch": 93.65395095367847,
+ "grad_norm": 3.1872403621673584,
+ "learning_rate": 2.1047655974878012e-07,
+ "loss": 0.0365,
+ "step": 34371
+ },
+ {
+ "epoch": 93.65667574931881,
+ "grad_norm": 4.941776752471924,
+ "learning_rate": 2.10296490447055e-07,
+ "loss": 0.1092,
+ "step": 34372
+ },
+ {
+ "epoch": 93.65940054495913,
+ "grad_norm": 2.912961959838867,
+ "learning_rate": 2.1011649738722606e-07,
+ "loss": 0.0403,
+ "step": 34373
+ },
+ {
+ "epoch": 93.66212534059946,
+ "grad_norm": 2.130218267440796,
+ "learning_rate": 2.0993658057069432e-07,
+ "loss": 0.0346,
+ "step": 34374
+ },
+ {
+ "epoch": 93.66485013623978,
+ "grad_norm": 2.6625425815582275,
+ "learning_rate": 2.0975673999886093e-07,
+ "loss": 0.0248,
+ "step": 34375
+ },
+ {
+ "epoch": 93.66757493188011,
+ "grad_norm": 1.9598931074142456,
+ "learning_rate": 2.0957697567312807e-07,
+ "loss": 0.0479,
+ "step": 34376
+ },
+ {
+ "epoch": 93.67029972752043,
+ "grad_norm": 5.38246488571167,
+ "learning_rate": 2.0939728759489463e-07,
+ "loss": 0.0697,
+ "step": 34377
+ },
+ {
+ "epoch": 93.67302452316076,
+ "grad_norm": 1.8101924657821655,
+ "learning_rate": 2.0921767576555952e-07,
+ "loss": 0.113,
+ "step": 34378
+ },
+ {
+ "epoch": 93.6757493188011,
+ "grad_norm": 2.1005547046661377,
+ "learning_rate": 2.0903814018652047e-07,
+ "loss": 0.0214,
+ "step": 34379
+ },
+ {
+ "epoch": 93.67847411444141,
+ "grad_norm": 4.3197855949401855,
+ "learning_rate": 2.088586808591797e-07,
+ "loss": 0.1892,
+ "step": 34380
+ },
+ {
+ "epoch": 93.68119891008175,
+ "grad_norm": 2.731203556060791,
+ "learning_rate": 2.0867929778493167e-07,
+ "loss": 0.038,
+ "step": 34381
+ },
+ {
+ "epoch": 93.68392370572207,
+ "grad_norm": 2.2792117595672607,
+ "learning_rate": 2.0849999096517304e-07,
+ "loss": 0.0729,
+ "step": 34382
+ },
+ {
+ "epoch": 93.6866485013624,
+ "grad_norm": 3.9346883296966553,
+ "learning_rate": 2.0832076040130267e-07,
+ "loss": 0.0845,
+ "step": 34383
+ },
+ {
+ "epoch": 93.68937329700273,
+ "grad_norm": 2.5368058681488037,
+ "learning_rate": 2.08141606094715e-07,
+ "loss": 0.0493,
+ "step": 34384
+ },
+ {
+ "epoch": 93.69209809264305,
+ "grad_norm": 2.3298025131225586,
+ "learning_rate": 2.079625280468045e-07,
+ "loss": 0.0607,
+ "step": 34385
+ },
+ {
+ "epoch": 93.69482288828338,
+ "grad_norm": 2.9570140838623047,
+ "learning_rate": 2.077835262589667e-07,
+ "loss": 0.0229,
+ "step": 34386
+ },
+ {
+ "epoch": 93.6975476839237,
+ "grad_norm": 2.169262170791626,
+ "learning_rate": 2.0760460073259603e-07,
+ "loss": 0.0641,
+ "step": 34387
+ },
+ {
+ "epoch": 93.70027247956403,
+ "grad_norm": 2.960768938064575,
+ "learning_rate": 2.0742575146908583e-07,
+ "loss": 0.0899,
+ "step": 34388
+ },
+ {
+ "epoch": 93.70299727520435,
+ "grad_norm": 3.048086404800415,
+ "learning_rate": 2.0724697846982832e-07,
+ "loss": 0.2102,
+ "step": 34389
+ },
+ {
+ "epoch": 93.70572207084469,
+ "grad_norm": 5.074772357940674,
+ "learning_rate": 2.0706828173621684e-07,
+ "loss": 0.1722,
+ "step": 34390
+ },
+ {
+ "epoch": 93.70844686648502,
+ "grad_norm": 3.0789027214050293,
+ "learning_rate": 2.0688966126964138e-07,
+ "loss": 0.0328,
+ "step": 34391
+ },
+ {
+ "epoch": 93.71117166212534,
+ "grad_norm": 2.1476850509643555,
+ "learning_rate": 2.0671111707149416e-07,
+ "loss": 0.0343,
+ "step": 34392
+ },
+ {
+ "epoch": 93.71389645776567,
+ "grad_norm": 2.010178804397583,
+ "learning_rate": 2.065326491431663e-07,
+ "loss": 0.1128,
+ "step": 34393
+ },
+ {
+ "epoch": 93.71662125340599,
+ "grad_norm": 2.3575823307037354,
+ "learning_rate": 2.0635425748604664e-07,
+ "loss": 0.0239,
+ "step": 34394
+ },
+ {
+ "epoch": 93.71934604904632,
+ "grad_norm": 2.0335638523101807,
+ "learning_rate": 2.0617594210152413e-07,
+ "loss": 0.0266,
+ "step": 34395
+ },
+ {
+ "epoch": 93.72207084468666,
+ "grad_norm": 3.2877469062805176,
+ "learning_rate": 2.0599770299098987e-07,
+ "loss": 0.146,
+ "step": 34396
+ },
+ {
+ "epoch": 93.72479564032697,
+ "grad_norm": 2.5627589225769043,
+ "learning_rate": 2.058195401558294e-07,
+ "loss": 0.0241,
+ "step": 34397
+ },
+ {
+ "epoch": 93.7275204359673,
+ "grad_norm": 2.51062273979187,
+ "learning_rate": 2.0564145359743048e-07,
+ "loss": 0.0372,
+ "step": 34398
+ },
+ {
+ "epoch": 93.73024523160763,
+ "grad_norm": 2.7507593631744385,
+ "learning_rate": 2.0546344331718092e-07,
+ "loss": 0.0503,
+ "step": 34399
+ },
+ {
+ "epoch": 93.73297002724796,
+ "grad_norm": 2.953214645385742,
+ "learning_rate": 2.052855093164674e-07,
+ "loss": 0.0551,
+ "step": 34400
+ },
+ {
+ "epoch": 93.73569482288828,
+ "grad_norm": 3.533792734146118,
+ "learning_rate": 2.0510765159667546e-07,
+ "loss": 0.1486,
+ "step": 34401
+ },
+ {
+ "epoch": 93.73841961852861,
+ "grad_norm": 2.928157091140747,
+ "learning_rate": 2.049298701591884e-07,
+ "loss": 0.0521,
+ "step": 34402
+ },
+ {
+ "epoch": 93.74114441416894,
+ "grad_norm": 5.785929203033447,
+ "learning_rate": 2.0475216500539298e-07,
+ "loss": 0.033,
+ "step": 34403
+ },
+ {
+ "epoch": 93.74386920980926,
+ "grad_norm": 2.49468731880188,
+ "learning_rate": 2.0457453613667134e-07,
+ "loss": 0.0869,
+ "step": 34404
+ },
+ {
+ "epoch": 93.7465940054496,
+ "grad_norm": 1.9557398557662964,
+ "learning_rate": 2.043969835544102e-07,
+ "loss": 0.0263,
+ "step": 34405
+ },
+ {
+ "epoch": 93.74931880108991,
+ "grad_norm": 1.865979552268982,
+ "learning_rate": 2.042195072599884e-07,
+ "loss": 0.0207,
+ "step": 34406
+ },
+ {
+ "epoch": 93.75204359673025,
+ "grad_norm": 10.877952575683594,
+ "learning_rate": 2.0404210725479046e-07,
+ "loss": 0.0242,
+ "step": 34407
+ },
+ {
+ "epoch": 93.75476839237058,
+ "grad_norm": 2.2763140201568604,
+ "learning_rate": 2.0386478354019745e-07,
+ "loss": 0.0702,
+ "step": 34408
+ },
+ {
+ "epoch": 93.7574931880109,
+ "grad_norm": 2.745971202850342,
+ "learning_rate": 2.0368753611759052e-07,
+ "loss": 0.065,
+ "step": 34409
+ },
+ {
+ "epoch": 93.76021798365123,
+ "grad_norm": 2.8336164951324463,
+ "learning_rate": 2.0351036498834965e-07,
+ "loss": 0.1588,
+ "step": 34410
+ },
+ {
+ "epoch": 93.76294277929155,
+ "grad_norm": 2.2845332622528076,
+ "learning_rate": 2.0333327015385373e-07,
+ "loss": 0.0428,
+ "step": 34411
+ },
+ {
+ "epoch": 93.76566757493188,
+ "grad_norm": 1.7977302074432373,
+ "learning_rate": 2.0315625161548392e-07,
+ "loss": 0.0799,
+ "step": 34412
+ },
+ {
+ "epoch": 93.7683923705722,
+ "grad_norm": 2.4740443229675293,
+ "learning_rate": 2.0297930937461685e-07,
+ "loss": 0.0457,
+ "step": 34413
+ },
+ {
+ "epoch": 93.77111716621253,
+ "grad_norm": 2.2012076377868652,
+ "learning_rate": 2.0280244343263366e-07,
+ "loss": 0.034,
+ "step": 34414
+ },
+ {
+ "epoch": 93.77384196185287,
+ "grad_norm": 1.926122784614563,
+ "learning_rate": 2.026256537909077e-07,
+ "loss": 0.034,
+ "step": 34415
+ },
+ {
+ "epoch": 93.77656675749319,
+ "grad_norm": 1.7271753549575806,
+ "learning_rate": 2.0244894045081898e-07,
+ "loss": 0.0214,
+ "step": 34416
+ },
+ {
+ "epoch": 93.77929155313352,
+ "grad_norm": 2.1036386489868164,
+ "learning_rate": 2.0227230341374194e-07,
+ "loss": 0.0583,
+ "step": 34417
+ },
+ {
+ "epoch": 93.78201634877384,
+ "grad_norm": 2.506817102432251,
+ "learning_rate": 2.0209574268105324e-07,
+ "loss": 0.0401,
+ "step": 34418
+ },
+ {
+ "epoch": 93.78474114441417,
+ "grad_norm": 2.632697820663452,
+ "learning_rate": 2.0191925825412739e-07,
+ "loss": 0.0306,
+ "step": 34419
+ },
+ {
+ "epoch": 93.7874659400545,
+ "grad_norm": 2.7037792205810547,
+ "learning_rate": 2.017428501343388e-07,
+ "loss": 0.0372,
+ "step": 34420
+ },
+ {
+ "epoch": 93.79019073569482,
+ "grad_norm": 2.159956216812134,
+ "learning_rate": 2.0156651832306085e-07,
+ "loss": 0.0497,
+ "step": 34421
+ },
+ {
+ "epoch": 93.79291553133515,
+ "grad_norm": 2.0200798511505127,
+ "learning_rate": 2.0139026282166908e-07,
+ "loss": 0.0236,
+ "step": 34422
+ },
+ {
+ "epoch": 93.79564032697547,
+ "grad_norm": 1.5987173318862915,
+ "learning_rate": 2.012140836315335e-07,
+ "loss": 0.0349,
+ "step": 34423
+ },
+ {
+ "epoch": 93.7983651226158,
+ "grad_norm": 4.3370680809021,
+ "learning_rate": 2.0103798075402747e-07,
+ "loss": 0.1231,
+ "step": 34424
+ },
+ {
+ "epoch": 93.80108991825612,
+ "grad_norm": 1.7332193851470947,
+ "learning_rate": 2.0086195419052323e-07,
+ "loss": 0.0479,
+ "step": 34425
+ },
+ {
+ "epoch": 93.80381471389646,
+ "grad_norm": 2.297229766845703,
+ "learning_rate": 2.0068600394238968e-07,
+ "loss": 0.0286,
+ "step": 34426
+ },
+ {
+ "epoch": 93.80653950953679,
+ "grad_norm": 1.7435134649276733,
+ "learning_rate": 2.0051013001099794e-07,
+ "loss": 0.078,
+ "step": 34427
+ },
+ {
+ "epoch": 93.80926430517711,
+ "grad_norm": 2.4305944442749023,
+ "learning_rate": 2.0033433239771803e-07,
+ "loss": 0.0347,
+ "step": 34428
+ },
+ {
+ "epoch": 93.81198910081744,
+ "grad_norm": 2.4918837547302246,
+ "learning_rate": 2.0015861110392e-07,
+ "loss": 0.0374,
+ "step": 34429
+ },
+ {
+ "epoch": 93.81471389645776,
+ "grad_norm": 2.407262086868286,
+ "learning_rate": 1.9998296613097046e-07,
+ "loss": 0.027,
+ "step": 34430
+ },
+ {
+ "epoch": 93.8174386920981,
+ "grad_norm": 2.703068256378174,
+ "learning_rate": 1.9980739748023837e-07,
+ "loss": 0.0343,
+ "step": 34431
+ },
+ {
+ "epoch": 93.82016348773843,
+ "grad_norm": 3.4068539142608643,
+ "learning_rate": 1.9963190515309038e-07,
+ "loss": 0.0329,
+ "step": 34432
+ },
+ {
+ "epoch": 93.82288828337875,
+ "grad_norm": 2.6142091751098633,
+ "learning_rate": 1.9945648915089432e-07,
+ "loss": 0.0707,
+ "step": 34433
+ },
+ {
+ "epoch": 93.82561307901908,
+ "grad_norm": 1.7220866680145264,
+ "learning_rate": 1.9928114947501577e-07,
+ "loss": 0.0222,
+ "step": 34434
+ },
+ {
+ "epoch": 93.8283378746594,
+ "grad_norm": 2.0930206775665283,
+ "learning_rate": 1.9910588612681914e-07,
+ "loss": 0.0268,
+ "step": 34435
+ },
+ {
+ "epoch": 93.83106267029973,
+ "grad_norm": 1.6667646169662476,
+ "learning_rate": 1.9893069910767117e-07,
+ "loss": 0.0158,
+ "step": 34436
+ },
+ {
+ "epoch": 93.83378746594005,
+ "grad_norm": 3.9746711254119873,
+ "learning_rate": 1.9875558841893627e-07,
+ "loss": 0.046,
+ "step": 34437
+ },
+ {
+ "epoch": 93.83651226158038,
+ "grad_norm": 2.515366554260254,
+ "learning_rate": 1.9858055406197562e-07,
+ "loss": 0.1202,
+ "step": 34438
+ },
+ {
+ "epoch": 93.83923705722071,
+ "grad_norm": 3.2645912170410156,
+ "learning_rate": 1.984055960381559e-07,
+ "loss": 0.0312,
+ "step": 34439
+ },
+ {
+ "epoch": 93.84196185286103,
+ "grad_norm": 2.400242328643799,
+ "learning_rate": 1.98230714348836e-07,
+ "loss": 0.0531,
+ "step": 34440
+ },
+ {
+ "epoch": 93.84468664850137,
+ "grad_norm": 2.1673269271850586,
+ "learning_rate": 1.9805590899538152e-07,
+ "loss": 0.0214,
+ "step": 34441
+ },
+ {
+ "epoch": 93.84741144414168,
+ "grad_norm": 3.565842628479004,
+ "learning_rate": 1.9788117997915136e-07,
+ "loss": 0.122,
+ "step": 34442
+ },
+ {
+ "epoch": 93.85013623978202,
+ "grad_norm": 1.8552443981170654,
+ "learning_rate": 1.9770652730150775e-07,
+ "loss": 0.0175,
+ "step": 34443
+ },
+ {
+ "epoch": 93.85286103542235,
+ "grad_norm": 3.700861692428589,
+ "learning_rate": 1.9753195096380962e-07,
+ "loss": 0.1114,
+ "step": 34444
+ },
+ {
+ "epoch": 93.85558583106267,
+ "grad_norm": 3.854320764541626,
+ "learning_rate": 1.973574509674181e-07,
+ "loss": 0.0952,
+ "step": 34445
+ },
+ {
+ "epoch": 93.858310626703,
+ "grad_norm": 3.0832605361938477,
+ "learning_rate": 1.9718302731368988e-07,
+ "loss": 0.0577,
+ "step": 34446
+ },
+ {
+ "epoch": 93.86103542234332,
+ "grad_norm": 3.7628276348114014,
+ "learning_rate": 1.97008680003985e-07,
+ "loss": 0.0654,
+ "step": 34447
+ },
+ {
+ "epoch": 93.86376021798365,
+ "grad_norm": 2.3134407997131348,
+ "learning_rate": 1.9683440903966123e-07,
+ "loss": 0.0609,
+ "step": 34448
+ },
+ {
+ "epoch": 93.86648501362397,
+ "grad_norm": 3.2816579341888428,
+ "learning_rate": 1.9666021442207638e-07,
+ "loss": 0.0334,
+ "step": 34449
+ },
+ {
+ "epoch": 93.8692098092643,
+ "grad_norm": 3.8966357707977295,
+ "learning_rate": 1.9648609615258606e-07,
+ "loss": 0.1089,
+ "step": 34450
+ },
+ {
+ "epoch": 93.87193460490464,
+ "grad_norm": 2.2153778076171875,
+ "learning_rate": 1.9631205423254586e-07,
+ "loss": 0.0731,
+ "step": 34451
+ },
+ {
+ "epoch": 93.87465940054496,
+ "grad_norm": 2.281461000442505,
+ "learning_rate": 1.961380886633113e-07,
+ "loss": 0.0522,
+ "step": 34452
+ },
+ {
+ "epoch": 93.87738419618529,
+ "grad_norm": 2.045767307281494,
+ "learning_rate": 1.959641994462391e-07,
+ "loss": 0.0919,
+ "step": 34453
+ },
+ {
+ "epoch": 93.88010899182561,
+ "grad_norm": 3.1510367393493652,
+ "learning_rate": 1.9579038658268157e-07,
+ "loss": 0.0767,
+ "step": 34454
+ },
+ {
+ "epoch": 93.88283378746594,
+ "grad_norm": 2.3584213256835938,
+ "learning_rate": 1.9561665007399312e-07,
+ "loss": 0.0968,
+ "step": 34455
+ },
+ {
+ "epoch": 93.88555858310627,
+ "grad_norm": 2.3251776695251465,
+ "learning_rate": 1.95442989921526e-07,
+ "loss": 0.0256,
+ "step": 34456
+ },
+ {
+ "epoch": 93.88828337874659,
+ "grad_norm": 1.996802806854248,
+ "learning_rate": 1.9526940612663359e-07,
+ "loss": 0.054,
+ "step": 34457
+ },
+ {
+ "epoch": 93.89100817438693,
+ "grad_norm": 2.232168436050415,
+ "learning_rate": 1.9509589869066814e-07,
+ "loss": 0.0228,
+ "step": 34458
+ },
+ {
+ "epoch": 93.89373297002724,
+ "grad_norm": 4.788763046264648,
+ "learning_rate": 1.9492246761497967e-07,
+ "loss": 0.0692,
+ "step": 34459
+ },
+ {
+ "epoch": 93.89645776566758,
+ "grad_norm": 2.8546571731567383,
+ "learning_rate": 1.9474911290091936e-07,
+ "loss": 0.0291,
+ "step": 34460
+ },
+ {
+ "epoch": 93.8991825613079,
+ "grad_norm": 2.0369200706481934,
+ "learning_rate": 1.9457583454983719e-07,
+ "loss": 0.0261,
+ "step": 34461
+ },
+ {
+ "epoch": 93.90190735694823,
+ "grad_norm": 3.6039161682128906,
+ "learning_rate": 1.9440263256308433e-07,
+ "loss": 0.0405,
+ "step": 34462
+ },
+ {
+ "epoch": 93.90463215258856,
+ "grad_norm": 2.0535991191864014,
+ "learning_rate": 1.942295069420075e-07,
+ "loss": 0.0367,
+ "step": 34463
+ },
+ {
+ "epoch": 93.90735694822888,
+ "grad_norm": 1.9097617864608765,
+ "learning_rate": 1.9405645768795446e-07,
+ "loss": 0.0474,
+ "step": 34464
+ },
+ {
+ "epoch": 93.91008174386921,
+ "grad_norm": 1.9148390293121338,
+ "learning_rate": 1.9388348480227525e-07,
+ "loss": 0.0228,
+ "step": 34465
+ },
+ {
+ "epoch": 93.91280653950953,
+ "grad_norm": 3.3699679374694824,
+ "learning_rate": 1.937105882863155e-07,
+ "loss": 0.2528,
+ "step": 34466
+ },
+ {
+ "epoch": 93.91553133514986,
+ "grad_norm": 2.8437659740448,
+ "learning_rate": 1.935377681414219e-07,
+ "loss": 0.0644,
+ "step": 34467
+ },
+ {
+ "epoch": 93.9182561307902,
+ "grad_norm": 1.9749023914337158,
+ "learning_rate": 1.933650243689411e-07,
+ "loss": 0.0271,
+ "step": 34468
+ },
+ {
+ "epoch": 93.92098092643052,
+ "grad_norm": 2.847459316253662,
+ "learning_rate": 1.9319235697021766e-07,
+ "loss": 0.0997,
+ "step": 34469
+ },
+ {
+ "epoch": 93.92370572207085,
+ "grad_norm": 2.587817907333374,
+ "learning_rate": 1.93019765946596e-07,
+ "loss": 0.0269,
+ "step": 34470
+ },
+ {
+ "epoch": 93.92643051771117,
+ "grad_norm": 1.9004254341125488,
+ "learning_rate": 1.928472512994206e-07,
+ "loss": 0.1499,
+ "step": 34471
+ },
+ {
+ "epoch": 93.9291553133515,
+ "grad_norm": 2.5846543312072754,
+ "learning_rate": 1.9267481303003487e-07,
+ "loss": 0.0754,
+ "step": 34472
+ },
+ {
+ "epoch": 93.93188010899182,
+ "grad_norm": 2.302259922027588,
+ "learning_rate": 1.9250245113978329e-07,
+ "loss": 0.0876,
+ "step": 34473
+ },
+ {
+ "epoch": 93.93460490463215,
+ "grad_norm": 1.8402637243270874,
+ "learning_rate": 1.9233016563000695e-07,
+ "loss": 0.1349,
+ "step": 34474
+ },
+ {
+ "epoch": 93.93732970027249,
+ "grad_norm": 3.4466936588287354,
+ "learning_rate": 1.9215795650204817e-07,
+ "loss": 0.072,
+ "step": 34475
+ },
+ {
+ "epoch": 93.9400544959128,
+ "grad_norm": 2.3628551959991455,
+ "learning_rate": 1.9198582375724584e-07,
+ "loss": 0.0607,
+ "step": 34476
+ },
+ {
+ "epoch": 93.94277929155314,
+ "grad_norm": 2.3989202976226807,
+ "learning_rate": 1.9181376739694336e-07,
+ "loss": 0.1096,
+ "step": 34477
+ },
+ {
+ "epoch": 93.94550408719346,
+ "grad_norm": 1.715238094329834,
+ "learning_rate": 1.9164178742247964e-07,
+ "loss": 0.0213,
+ "step": 34478
+ },
+ {
+ "epoch": 93.94822888283379,
+ "grad_norm": 2.344977855682373,
+ "learning_rate": 1.914698838351936e-07,
+ "loss": 0.1036,
+ "step": 34479
+ },
+ {
+ "epoch": 93.95095367847412,
+ "grad_norm": 2.1506311893463135,
+ "learning_rate": 1.912980566364231e-07,
+ "loss": 0.073,
+ "step": 34480
+ },
+ {
+ "epoch": 93.95367847411444,
+ "grad_norm": 2.3233208656311035,
+ "learning_rate": 1.9112630582750924e-07,
+ "loss": 0.0492,
+ "step": 34481
+ },
+ {
+ "epoch": 93.95640326975477,
+ "grad_norm": 2.677304267883301,
+ "learning_rate": 1.9095463140978876e-07,
+ "loss": 0.1065,
+ "step": 34482
+ },
+ {
+ "epoch": 93.95912806539509,
+ "grad_norm": 3.472522735595703,
+ "learning_rate": 1.9078303338459725e-07,
+ "loss": 0.0603,
+ "step": 34483
+ },
+ {
+ "epoch": 93.96185286103542,
+ "grad_norm": 2.663081169128418,
+ "learning_rate": 1.906115117532703e-07,
+ "loss": 0.068,
+ "step": 34484
+ },
+ {
+ "epoch": 93.96457765667574,
+ "grad_norm": 2.479199171066284,
+ "learning_rate": 1.9044006651714686e-07,
+ "loss": 0.1596,
+ "step": 34485
+ },
+ {
+ "epoch": 93.96730245231608,
+ "grad_norm": 2.600506544113159,
+ "learning_rate": 1.902686976775603e-07,
+ "loss": 0.0496,
+ "step": 34486
+ },
+ {
+ "epoch": 93.97002724795641,
+ "grad_norm": 3.1799991130828857,
+ "learning_rate": 1.9009740523584507e-07,
+ "loss": 0.0471,
+ "step": 34487
+ },
+ {
+ "epoch": 93.97275204359673,
+ "grad_norm": 2.479637861251831,
+ "learning_rate": 1.899261891933346e-07,
+ "loss": 0.097,
+ "step": 34488
+ },
+ {
+ "epoch": 93.97547683923706,
+ "grad_norm": 2.694652795791626,
+ "learning_rate": 1.897550495513645e-07,
+ "loss": 0.1886,
+ "step": 34489
+ },
+ {
+ "epoch": 93.97820163487738,
+ "grad_norm": 3.3574304580688477,
+ "learning_rate": 1.8958398631126586e-07,
+ "loss": 0.0381,
+ "step": 34490
+ },
+ {
+ "epoch": 93.98092643051771,
+ "grad_norm": 2.4085183143615723,
+ "learning_rate": 1.8941299947437098e-07,
+ "loss": 0.0169,
+ "step": 34491
+ },
+ {
+ "epoch": 93.98365122615803,
+ "grad_norm": 2.778902292251587,
+ "learning_rate": 1.8924208904201215e-07,
+ "loss": 0.1611,
+ "step": 34492
+ },
+ {
+ "epoch": 93.98637602179836,
+ "grad_norm": 2.933116912841797,
+ "learning_rate": 1.890712550155205e-07,
+ "loss": 0.0443,
+ "step": 34493
+ },
+ {
+ "epoch": 93.9891008174387,
+ "grad_norm": 2.296523094177246,
+ "learning_rate": 1.8890049739622606e-07,
+ "loss": 0.0734,
+ "step": 34494
+ },
+ {
+ "epoch": 93.99182561307902,
+ "grad_norm": 1.8806663751602173,
+ "learning_rate": 1.8872981618545894e-07,
+ "loss": 0.0219,
+ "step": 34495
+ },
+ {
+ "epoch": 93.99455040871935,
+ "grad_norm": 3.0775694847106934,
+ "learning_rate": 1.8855921138454802e-07,
+ "loss": 0.0251,
+ "step": 34496
+ },
+ {
+ "epoch": 93.99727520435967,
+ "grad_norm": 3.0466701984405518,
+ "learning_rate": 1.8838868299482227e-07,
+ "loss": 0.0656,
+ "step": 34497
+ },
+ {
+ "epoch": 94.0,
+ "grad_norm": 2.0074522495269775,
+ "learning_rate": 1.8821823101760949e-07,
+ "loss": 0.024,
+ "step": 34498
+ },
+ {
+ "epoch": 94.00272479564033,
+ "grad_norm": 2.8768908977508545,
+ "learning_rate": 1.8804785545423753e-07,
+ "loss": 0.0665,
+ "step": 34499
+ },
+ {
+ "epoch": 94.00544959128065,
+ "grad_norm": 3.1508963108062744,
+ "learning_rate": 1.878775563060331e-07,
+ "loss": 0.0528,
+ "step": 34500
+ },
+ {
+ "epoch": 94.00817438692098,
+ "grad_norm": 2.9554028511047363,
+ "learning_rate": 1.8770733357432293e-07,
+ "loss": 0.0806,
+ "step": 34501
+ },
+ {
+ "epoch": 94.0108991825613,
+ "grad_norm": 2.331803560256958,
+ "learning_rate": 1.8753718726043146e-07,
+ "loss": 0.0652,
+ "step": 34502
+ },
+ {
+ "epoch": 94.01362397820164,
+ "grad_norm": 2.272080898284912,
+ "learning_rate": 1.8736711736568547e-07,
+ "loss": 0.0625,
+ "step": 34503
+ },
+ {
+ "epoch": 94.01634877384195,
+ "grad_norm": 3.1528565883636475,
+ "learning_rate": 1.871971238914072e-07,
+ "loss": 0.0565,
+ "step": 34504
+ },
+ {
+ "epoch": 94.01907356948229,
+ "grad_norm": 1.681414246559143,
+ "learning_rate": 1.870272068389223e-07,
+ "loss": 0.1208,
+ "step": 34505
+ },
+ {
+ "epoch": 94.02179836512262,
+ "grad_norm": 3.2219901084899902,
+ "learning_rate": 1.868573662095541e-07,
+ "loss": 0.069,
+ "step": 34506
+ },
+ {
+ "epoch": 94.02452316076294,
+ "grad_norm": 3.2177181243896484,
+ "learning_rate": 1.8668760200462488e-07,
+ "loss": 0.1558,
+ "step": 34507
+ },
+ {
+ "epoch": 94.02724795640327,
+ "grad_norm": 1.7715153694152832,
+ "learning_rate": 1.8651791422545697e-07,
+ "loss": 0.0177,
+ "step": 34508
+ },
+ {
+ "epoch": 94.02997275204359,
+ "grad_norm": 2.3313074111938477,
+ "learning_rate": 1.8634830287337036e-07,
+ "loss": 0.034,
+ "step": 34509
+ },
+ {
+ "epoch": 94.03269754768392,
+ "grad_norm": 1.9339600801467896,
+ "learning_rate": 1.861787679496885e-07,
+ "loss": 0.0208,
+ "step": 34510
+ },
+ {
+ "epoch": 94.03542234332426,
+ "grad_norm": 2.1006815433502197,
+ "learning_rate": 1.8600930945573027e-07,
+ "loss": 0.1225,
+ "step": 34511
+ },
+ {
+ "epoch": 94.03814713896458,
+ "grad_norm": 1.6775445938110352,
+ "learning_rate": 1.8583992739281577e-07,
+ "loss": 0.0198,
+ "step": 34512
+ },
+ {
+ "epoch": 94.04087193460491,
+ "grad_norm": 2.6415295600891113,
+ "learning_rate": 1.8567062176226393e-07,
+ "loss": 0.0387,
+ "step": 34513
+ },
+ {
+ "epoch": 94.04359673024523,
+ "grad_norm": 1.607471227645874,
+ "learning_rate": 1.8550139256539368e-07,
+ "loss": 0.0159,
+ "step": 34514
+ },
+ {
+ "epoch": 94.04632152588556,
+ "grad_norm": 2.5552589893341064,
+ "learning_rate": 1.8533223980352288e-07,
+ "loss": 0.1056,
+ "step": 34515
+ },
+ {
+ "epoch": 94.04904632152588,
+ "grad_norm": 2.36251163482666,
+ "learning_rate": 1.8516316347796826e-07,
+ "loss": 0.1004,
+ "step": 34516
+ },
+ {
+ "epoch": 94.05177111716621,
+ "grad_norm": 2.898721218109131,
+ "learning_rate": 1.8499416359004763e-07,
+ "loss": 0.1699,
+ "step": 34517
+ },
+ {
+ "epoch": 94.05449591280654,
+ "grad_norm": 9.90404224395752,
+ "learning_rate": 1.848252401410755e-07,
+ "loss": 0.185,
+ "step": 34518
+ },
+ {
+ "epoch": 94.05722070844686,
+ "grad_norm": 2.253108024597168,
+ "learning_rate": 1.846563931323697e-07,
+ "loss": 0.0209,
+ "step": 34519
+ },
+ {
+ "epoch": 94.0599455040872,
+ "grad_norm": 2.2060775756835938,
+ "learning_rate": 1.8448762256524256e-07,
+ "loss": 0.047,
+ "step": 34520
+ },
+ {
+ "epoch": 94.06267029972751,
+ "grad_norm": 2.2302207946777344,
+ "learning_rate": 1.8431892844101183e-07,
+ "loss": 0.0645,
+ "step": 34521
+ },
+ {
+ "epoch": 94.06539509536785,
+ "grad_norm": 1.3667473793029785,
+ "learning_rate": 1.8415031076098767e-07,
+ "loss": 0.0154,
+ "step": 34522
+ },
+ {
+ "epoch": 94.06811989100818,
+ "grad_norm": 1.537326693534851,
+ "learning_rate": 1.8398176952648672e-07,
+ "loss": 0.0214,
+ "step": 34523
+ },
+ {
+ "epoch": 94.0708446866485,
+ "grad_norm": 2.7625930309295654,
+ "learning_rate": 1.8381330473881797e-07,
+ "loss": 0.0634,
+ "step": 34524
+ },
+ {
+ "epoch": 94.07356948228883,
+ "grad_norm": 2.4522831439971924,
+ "learning_rate": 1.836449163992948e-07,
+ "loss": 0.0379,
+ "step": 34525
+ },
+ {
+ "epoch": 94.07629427792915,
+ "grad_norm": 5.569437026977539,
+ "learning_rate": 1.8347660450923066e-07,
+ "loss": 0.046,
+ "step": 34526
+ },
+ {
+ "epoch": 94.07901907356948,
+ "grad_norm": 3.3365516662597656,
+ "learning_rate": 1.8330836906993443e-07,
+ "loss": 0.0771,
+ "step": 34527
+ },
+ {
+ "epoch": 94.0817438692098,
+ "grad_norm": 5.334017753601074,
+ "learning_rate": 1.8314021008271732e-07,
+ "loss": 0.1219,
+ "step": 34528
+ },
+ {
+ "epoch": 94.08446866485014,
+ "grad_norm": 1.5066051483154297,
+ "learning_rate": 1.8297212754888716e-07,
+ "loss": 0.0149,
+ "step": 34529
+ },
+ {
+ "epoch": 94.08719346049047,
+ "grad_norm": 2.745513916015625,
+ "learning_rate": 1.8280412146975512e-07,
+ "loss": 0.0592,
+ "step": 34530
+ },
+ {
+ "epoch": 94.08991825613079,
+ "grad_norm": 3.194516897201538,
+ "learning_rate": 1.8263619184662796e-07,
+ "loss": 0.0473,
+ "step": 34531
+ },
+ {
+ "epoch": 94.09264305177112,
+ "grad_norm": 2.812309503555298,
+ "learning_rate": 1.8246833868081348e-07,
+ "loss": 0.0649,
+ "step": 34532
+ },
+ {
+ "epoch": 94.09536784741144,
+ "grad_norm": 3.361938714981079,
+ "learning_rate": 1.8230056197362068e-07,
+ "loss": 0.0297,
+ "step": 34533
+ },
+ {
+ "epoch": 94.09809264305177,
+ "grad_norm": 2.9348504543304443,
+ "learning_rate": 1.8213286172635514e-07,
+ "loss": 0.0749,
+ "step": 34534
+ },
+ {
+ "epoch": 94.1008174386921,
+ "grad_norm": 2.29144024848938,
+ "learning_rate": 1.819652379403225e-07,
+ "loss": 0.0453,
+ "step": 34535
+ },
+ {
+ "epoch": 94.10354223433242,
+ "grad_norm": 2.3790197372436523,
+ "learning_rate": 1.8179769061682838e-07,
+ "loss": 0.0277,
+ "step": 34536
+ },
+ {
+ "epoch": 94.10626702997276,
+ "grad_norm": 3.2483694553375244,
+ "learning_rate": 1.8163021975717841e-07,
+ "loss": 0.0656,
+ "step": 34537
+ },
+ {
+ "epoch": 94.10899182561307,
+ "grad_norm": 2.4094700813293457,
+ "learning_rate": 1.8146282536267602e-07,
+ "loss": 0.0263,
+ "step": 34538
+ },
+ {
+ "epoch": 94.11171662125341,
+ "grad_norm": 2.520822525024414,
+ "learning_rate": 1.8129550743462565e-07,
+ "loss": 0.032,
+ "step": 34539
+ },
+ {
+ "epoch": 94.11444141689373,
+ "grad_norm": 1.7595480680465698,
+ "learning_rate": 1.8112826597432854e-07,
+ "loss": 0.0228,
+ "step": 34540
+ },
+ {
+ "epoch": 94.11716621253406,
+ "grad_norm": 2.2441720962524414,
+ "learning_rate": 1.8096110098308917e-07,
+ "loss": 0.0673,
+ "step": 34541
+ },
+ {
+ "epoch": 94.11989100817439,
+ "grad_norm": 2.098578929901123,
+ "learning_rate": 1.8079401246220874e-07,
+ "loss": 0.0374,
+ "step": 34542
+ },
+ {
+ "epoch": 94.12261580381471,
+ "grad_norm": 2.2614755630493164,
+ "learning_rate": 1.8062700041298952e-07,
+ "loss": 0.1671,
+ "step": 34543
+ },
+ {
+ "epoch": 94.12534059945504,
+ "grad_norm": 3.3669607639312744,
+ "learning_rate": 1.8046006483673052e-07,
+ "loss": 0.0585,
+ "step": 34544
+ },
+ {
+ "epoch": 94.12806539509536,
+ "grad_norm": 2.245502233505249,
+ "learning_rate": 1.8029320573473063e-07,
+ "loss": 0.1347,
+ "step": 34545
+ },
+ {
+ "epoch": 94.1307901907357,
+ "grad_norm": 3.2562201023101807,
+ "learning_rate": 1.801264231082933e-07,
+ "loss": 0.022,
+ "step": 34546
+ },
+ {
+ "epoch": 94.13351498637603,
+ "grad_norm": 4.390142917633057,
+ "learning_rate": 1.7995971695871528e-07,
+ "loss": 0.0534,
+ "step": 34547
+ },
+ {
+ "epoch": 94.13623978201635,
+ "grad_norm": 3.1623430252075195,
+ "learning_rate": 1.7979308728729438e-07,
+ "loss": 0.0414,
+ "step": 34548
+ },
+ {
+ "epoch": 94.13896457765668,
+ "grad_norm": 3.983569622039795,
+ "learning_rate": 1.7962653409532848e-07,
+ "loss": 0.0453,
+ "step": 34549
+ },
+ {
+ "epoch": 94.141689373297,
+ "grad_norm": 1.9424781799316406,
+ "learning_rate": 1.7946005738411654e-07,
+ "loss": 0.0469,
+ "step": 34550
+ },
+ {
+ "epoch": 94.14441416893733,
+ "grad_norm": 2.724827527999878,
+ "learning_rate": 1.7929365715495305e-07,
+ "loss": 0.1282,
+ "step": 34551
+ },
+ {
+ "epoch": 94.14713896457765,
+ "grad_norm": 1.7867093086242676,
+ "learning_rate": 1.791273334091337e-07,
+ "loss": 0.0156,
+ "step": 34552
+ },
+ {
+ "epoch": 94.14986376021798,
+ "grad_norm": 2.4984583854675293,
+ "learning_rate": 1.7896108614795406e-07,
+ "loss": 0.0294,
+ "step": 34553
+ },
+ {
+ "epoch": 94.15258855585832,
+ "grad_norm": 2.506727695465088,
+ "learning_rate": 1.7879491537271087e-07,
+ "loss": 0.0465,
+ "step": 34554
+ },
+ {
+ "epoch": 94.15531335149863,
+ "grad_norm": 2.2438740730285645,
+ "learning_rate": 1.7862882108469648e-07,
+ "loss": 0.0544,
+ "step": 34555
+ },
+ {
+ "epoch": 94.15803814713897,
+ "grad_norm": 4.8143086433410645,
+ "learning_rate": 1.7846280328520428e-07,
+ "loss": 0.0566,
+ "step": 34556
+ },
+ {
+ "epoch": 94.16076294277929,
+ "grad_norm": 2.9258768558502197,
+ "learning_rate": 1.7829686197552766e-07,
+ "loss": 0.0673,
+ "step": 34557
+ },
+ {
+ "epoch": 94.16348773841962,
+ "grad_norm": 2.362107515335083,
+ "learning_rate": 1.7813099715695892e-07,
+ "loss": 0.1055,
+ "step": 34558
+ },
+ {
+ "epoch": 94.16621253405995,
+ "grad_norm": 2.643925905227661,
+ "learning_rate": 1.7796520883079038e-07,
+ "loss": 0.03,
+ "step": 34559
+ },
+ {
+ "epoch": 94.16893732970027,
+ "grad_norm": 3.002138137817383,
+ "learning_rate": 1.7779949699831212e-07,
+ "loss": 0.0386,
+ "step": 34560
+ },
+ {
+ "epoch": 94.1716621253406,
+ "grad_norm": 2.3722450733184814,
+ "learning_rate": 1.776338616608153e-07,
+ "loss": 0.04,
+ "step": 34561
+ },
+ {
+ "epoch": 94.17438692098092,
+ "grad_norm": 2.956449270248413,
+ "learning_rate": 1.7746830281959005e-07,
+ "loss": 0.0302,
+ "step": 34562
+ },
+ {
+ "epoch": 94.17711171662125,
+ "grad_norm": 2.5882420539855957,
+ "learning_rate": 1.7730282047592528e-07,
+ "loss": 0.0322,
+ "step": 34563
+ },
+ {
+ "epoch": 94.17983651226157,
+ "grad_norm": 2.4424173831939697,
+ "learning_rate": 1.7713741463111112e-07,
+ "loss": 0.0422,
+ "step": 34564
+ },
+ {
+ "epoch": 94.1825613079019,
+ "grad_norm": 2.284702777862549,
+ "learning_rate": 1.7697208528643316e-07,
+ "loss": 0.0971,
+ "step": 34565
+ },
+ {
+ "epoch": 94.18528610354224,
+ "grad_norm": 1.9086081981658936,
+ "learning_rate": 1.7680683244318154e-07,
+ "loss": 0.0183,
+ "step": 34566
+ },
+ {
+ "epoch": 94.18801089918256,
+ "grad_norm": 4.8580403327941895,
+ "learning_rate": 1.7664165610264184e-07,
+ "loss": 0.0258,
+ "step": 34567
+ },
+ {
+ "epoch": 94.19073569482289,
+ "grad_norm": 1.9023826122283936,
+ "learning_rate": 1.7647655626610083e-07,
+ "loss": 0.0848,
+ "step": 34568
+ },
+ {
+ "epoch": 94.19346049046321,
+ "grad_norm": 2.0843896865844727,
+ "learning_rate": 1.7631153293484305e-07,
+ "loss": 0.1473,
+ "step": 34569
+ },
+ {
+ "epoch": 94.19618528610354,
+ "grad_norm": 0.9969910979270935,
+ "learning_rate": 1.7614658611015635e-07,
+ "loss": 0.0124,
+ "step": 34570
+ },
+ {
+ "epoch": 94.19891008174388,
+ "grad_norm": 1.8536566495895386,
+ "learning_rate": 1.75981715793323e-07,
+ "loss": 0.0433,
+ "step": 34571
+ },
+ {
+ "epoch": 94.2016348773842,
+ "grad_norm": 2.623291015625,
+ "learning_rate": 1.758169219856287e-07,
+ "loss": 0.0685,
+ "step": 34572
+ },
+ {
+ "epoch": 94.20435967302453,
+ "grad_norm": 3.871629238128662,
+ "learning_rate": 1.7565220468835465e-07,
+ "loss": 0.0569,
+ "step": 34573
+ },
+ {
+ "epoch": 94.20708446866485,
+ "grad_norm": 1.906101107597351,
+ "learning_rate": 1.7548756390278642e-07,
+ "loss": 0.0122,
+ "step": 34574
+ },
+ {
+ "epoch": 94.20980926430518,
+ "grad_norm": 2.549010992050171,
+ "learning_rate": 1.7532299963020417e-07,
+ "loss": 0.0999,
+ "step": 34575
+ },
+ {
+ "epoch": 94.2125340599455,
+ "grad_norm": 3.426013469696045,
+ "learning_rate": 1.7515851187189015e-07,
+ "loss": 0.0925,
+ "step": 34576
+ },
+ {
+ "epoch": 94.21525885558583,
+ "grad_norm": 1.9996252059936523,
+ "learning_rate": 1.749941006291245e-07,
+ "loss": 0.0175,
+ "step": 34577
+ },
+ {
+ "epoch": 94.21798365122616,
+ "grad_norm": 5.493715763092041,
+ "learning_rate": 1.7482976590319058e-07,
+ "loss": 0.0508,
+ "step": 34578
+ },
+ {
+ "epoch": 94.22070844686648,
+ "grad_norm": 3.023439645767212,
+ "learning_rate": 1.7466550769536516e-07,
+ "loss": 0.0948,
+ "step": 34579
+ },
+ {
+ "epoch": 94.22343324250681,
+ "grad_norm": 3.408459424972534,
+ "learning_rate": 1.7450132600692947e-07,
+ "loss": 0.1383,
+ "step": 34580
+ },
+ {
+ "epoch": 94.22615803814713,
+ "grad_norm": 1.7766079902648926,
+ "learning_rate": 1.7433722083915915e-07,
+ "loss": 0.0212,
+ "step": 34581
+ },
+ {
+ "epoch": 94.22888283378747,
+ "grad_norm": 2.550326108932495,
+ "learning_rate": 1.741731921933365e-07,
+ "loss": 0.0548,
+ "step": 34582
+ },
+ {
+ "epoch": 94.2316076294278,
+ "grad_norm": 1.5890072584152222,
+ "learning_rate": 1.7400924007073604e-07,
+ "loss": 0.0243,
+ "step": 34583
+ },
+ {
+ "epoch": 94.23433242506812,
+ "grad_norm": 1.7090826034545898,
+ "learning_rate": 1.7384536447263457e-07,
+ "loss": 0.0283,
+ "step": 34584
+ },
+ {
+ "epoch": 94.23705722070845,
+ "grad_norm": 2.8559112548828125,
+ "learning_rate": 1.736815654003099e-07,
+ "loss": 0.0353,
+ "step": 34585
+ },
+ {
+ "epoch": 94.23978201634877,
+ "grad_norm": 3.16033673286438,
+ "learning_rate": 1.7351784285503658e-07,
+ "loss": 0.0755,
+ "step": 34586
+ },
+ {
+ "epoch": 94.2425068119891,
+ "grad_norm": 2.2204842567443848,
+ "learning_rate": 1.733541968380914e-07,
+ "loss": 0.0777,
+ "step": 34587
+ },
+ {
+ "epoch": 94.24523160762942,
+ "grad_norm": 3.550560235977173,
+ "learning_rate": 1.7319062735074666e-07,
+ "loss": 0.0356,
+ "step": 34588
+ },
+ {
+ "epoch": 94.24795640326975,
+ "grad_norm": 2.5729455947875977,
+ "learning_rate": 1.7302713439427577e-07,
+ "loss": 0.0206,
+ "step": 34589
+ },
+ {
+ "epoch": 94.25068119891009,
+ "grad_norm": 2.397031784057617,
+ "learning_rate": 1.7286371796995438e-07,
+ "loss": 0.0401,
+ "step": 34590
+ },
+ {
+ "epoch": 94.2534059945504,
+ "grad_norm": 2.22430419921875,
+ "learning_rate": 1.7270037807905372e-07,
+ "loss": 0.0473,
+ "step": 34591
+ },
+ {
+ "epoch": 94.25613079019074,
+ "grad_norm": 2.6075212955474854,
+ "learning_rate": 1.7253711472284717e-07,
+ "loss": 0.0376,
+ "step": 34592
+ },
+ {
+ "epoch": 94.25885558583106,
+ "grad_norm": 2.732367992401123,
+ "learning_rate": 1.7237392790260377e-07,
+ "loss": 0.0377,
+ "step": 34593
+ },
+ {
+ "epoch": 94.26158038147139,
+ "grad_norm": 2.5315537452697754,
+ "learning_rate": 1.722108176195958e-07,
+ "loss": 0.053,
+ "step": 34594
+ },
+ {
+ "epoch": 94.26430517711172,
+ "grad_norm": 2.3362369537353516,
+ "learning_rate": 1.7204778387509559e-07,
+ "loss": 0.1016,
+ "step": 34595
+ },
+ {
+ "epoch": 94.26702997275204,
+ "grad_norm": 2.551574230194092,
+ "learning_rate": 1.7188482667036986e-07,
+ "loss": 0.0376,
+ "step": 34596
+ },
+ {
+ "epoch": 94.26975476839237,
+ "grad_norm": 1.8957818746566772,
+ "learning_rate": 1.7172194600668767e-07,
+ "loss": 0.0707,
+ "step": 34597
+ },
+ {
+ "epoch": 94.2724795640327,
+ "grad_norm": 1.700167179107666,
+ "learning_rate": 1.715591418853202e-07,
+ "loss": 0.0179,
+ "step": 34598
+ },
+ {
+ "epoch": 94.27520435967303,
+ "grad_norm": 1.6797950267791748,
+ "learning_rate": 1.7139641430753419e-07,
+ "loss": 0.0238,
+ "step": 34599
+ },
+ {
+ "epoch": 94.27792915531334,
+ "grad_norm": 2.126771926879883,
+ "learning_rate": 1.712337632745964e-07,
+ "loss": 0.0237,
+ "step": 34600
+ },
+ {
+ "epoch": 94.28065395095368,
+ "grad_norm": 1.526766061782837,
+ "learning_rate": 1.7107118878777251e-07,
+ "loss": 0.0227,
+ "step": 34601
+ },
+ {
+ "epoch": 94.28337874659401,
+ "grad_norm": 2.9766311645507812,
+ "learning_rate": 1.709086908483304e-07,
+ "loss": 0.1157,
+ "step": 34602
+ },
+ {
+ "epoch": 94.28610354223433,
+ "grad_norm": 2.0408859252929688,
+ "learning_rate": 1.707462694575357e-07,
+ "loss": 0.0818,
+ "step": 34603
+ },
+ {
+ "epoch": 94.28882833787466,
+ "grad_norm": 2.0950992107391357,
+ "learning_rate": 1.7058392461665185e-07,
+ "loss": 0.0423,
+ "step": 34604
+ },
+ {
+ "epoch": 94.29155313351498,
+ "grad_norm": 2.3778860569000244,
+ "learning_rate": 1.704216563269434e-07,
+ "loss": 0.0412,
+ "step": 34605
+ },
+ {
+ "epoch": 94.29427792915531,
+ "grad_norm": 2.916978597640991,
+ "learning_rate": 1.7025946458967602e-07,
+ "loss": 0.0325,
+ "step": 34606
+ },
+ {
+ "epoch": 94.29700272479565,
+ "grad_norm": 3.0695154666900635,
+ "learning_rate": 1.70097349406112e-07,
+ "loss": 0.0301,
+ "step": 34607
+ },
+ {
+ "epoch": 94.29972752043597,
+ "grad_norm": 2.0341145992279053,
+ "learning_rate": 1.6993531077751256e-07,
+ "loss": 0.0266,
+ "step": 34608
+ },
+ {
+ "epoch": 94.3024523160763,
+ "grad_norm": 3.028540849685669,
+ "learning_rate": 1.6977334870514007e-07,
+ "loss": 0.0536,
+ "step": 34609
+ },
+ {
+ "epoch": 94.30517711171662,
+ "grad_norm": 2.2184524536132812,
+ "learning_rate": 1.696114631902568e-07,
+ "loss": 0.0932,
+ "step": 34610
+ },
+ {
+ "epoch": 94.30790190735695,
+ "grad_norm": 3.4266767501831055,
+ "learning_rate": 1.6944965423412286e-07,
+ "loss": 0.1048,
+ "step": 34611
+ },
+ {
+ "epoch": 94.31062670299727,
+ "grad_norm": 2.3393688201904297,
+ "learning_rate": 1.6928792183799948e-07,
+ "loss": 0.0234,
+ "step": 34612
+ },
+ {
+ "epoch": 94.3133514986376,
+ "grad_norm": 1.8931456804275513,
+ "learning_rate": 1.6912626600314452e-07,
+ "loss": 0.0588,
+ "step": 34613
+ },
+ {
+ "epoch": 94.31607629427793,
+ "grad_norm": 2.8492913246154785,
+ "learning_rate": 1.6896468673081812e-07,
+ "loss": 0.0502,
+ "step": 34614
+ },
+ {
+ "epoch": 94.31880108991825,
+ "grad_norm": 3.497866153717041,
+ "learning_rate": 1.6880318402227814e-07,
+ "loss": 0.0441,
+ "step": 34615
+ },
+ {
+ "epoch": 94.32152588555859,
+ "grad_norm": 2.6030144691467285,
+ "learning_rate": 1.6864175787878244e-07,
+ "loss": 0.0354,
+ "step": 34616
+ },
+ {
+ "epoch": 94.3242506811989,
+ "grad_norm": 1.3896472454071045,
+ "learning_rate": 1.6848040830158895e-07,
+ "loss": 0.0108,
+ "step": 34617
+ },
+ {
+ "epoch": 94.32697547683924,
+ "grad_norm": 2.356647253036499,
+ "learning_rate": 1.683191352919533e-07,
+ "loss": 0.049,
+ "step": 34618
+ },
+ {
+ "epoch": 94.32970027247957,
+ "grad_norm": 2.475054979324341,
+ "learning_rate": 1.681579388511323e-07,
+ "loss": 0.0868,
+ "step": 34619
+ },
+ {
+ "epoch": 94.33242506811989,
+ "grad_norm": 4.608496189117432,
+ "learning_rate": 1.6799681898038044e-07,
+ "loss": 0.0525,
+ "step": 34620
+ },
+ {
+ "epoch": 94.33514986376022,
+ "grad_norm": 2.7545180320739746,
+ "learning_rate": 1.6783577568095123e-07,
+ "loss": 0.1164,
+ "step": 34621
+ },
+ {
+ "epoch": 94.33787465940054,
+ "grad_norm": 5.152946472167969,
+ "learning_rate": 1.6767480895410248e-07,
+ "loss": 0.0321,
+ "step": 34622
+ },
+ {
+ "epoch": 94.34059945504087,
+ "grad_norm": 2.800403356552124,
+ "learning_rate": 1.6751391880108548e-07,
+ "loss": 0.0271,
+ "step": 34623
+ },
+ {
+ "epoch": 94.34332425068119,
+ "grad_norm": 4.446054458618164,
+ "learning_rate": 1.6735310522315473e-07,
+ "loss": 0.0853,
+ "step": 34624
+ },
+ {
+ "epoch": 94.34604904632153,
+ "grad_norm": 3.2290141582489014,
+ "learning_rate": 1.6719236822155927e-07,
+ "loss": 0.0699,
+ "step": 34625
+ },
+ {
+ "epoch": 94.34877384196186,
+ "grad_norm": 2.38934588432312,
+ "learning_rate": 1.6703170779755474e-07,
+ "loss": 0.0337,
+ "step": 34626
+ },
+ {
+ "epoch": 94.35149863760218,
+ "grad_norm": 2.058783531188965,
+ "learning_rate": 1.6687112395239014e-07,
+ "loss": 0.0264,
+ "step": 34627
+ },
+ {
+ "epoch": 94.35422343324251,
+ "grad_norm": 2.4210948944091797,
+ "learning_rate": 1.667106166873167e-07,
+ "loss": 0.0656,
+ "step": 34628
+ },
+ {
+ "epoch": 94.35694822888283,
+ "grad_norm": 2.59696626663208,
+ "learning_rate": 1.6655018600358452e-07,
+ "loss": 0.0207,
+ "step": 34629
+ },
+ {
+ "epoch": 94.35967302452316,
+ "grad_norm": 2.635974407196045,
+ "learning_rate": 1.6638983190244374e-07,
+ "loss": 0.0218,
+ "step": 34630
+ },
+ {
+ "epoch": 94.3623978201635,
+ "grad_norm": 2.3381271362304688,
+ "learning_rate": 1.6622955438514111e-07,
+ "loss": 0.068,
+ "step": 34631
+ },
+ {
+ "epoch": 94.36512261580381,
+ "grad_norm": 2.0427045822143555,
+ "learning_rate": 1.6606935345292785e-07,
+ "loss": 0.041,
+ "step": 34632
+ },
+ {
+ "epoch": 94.36784741144415,
+ "grad_norm": 1.729866623878479,
+ "learning_rate": 1.6590922910704966e-07,
+ "loss": 0.0193,
+ "step": 34633
+ },
+ {
+ "epoch": 94.37057220708446,
+ "grad_norm": 1.777673602104187,
+ "learning_rate": 1.6574918134875216e-07,
+ "loss": 0.0764,
+ "step": 34634
+ },
+ {
+ "epoch": 94.3732970027248,
+ "grad_norm": 2.5636448860168457,
+ "learning_rate": 1.6558921017928554e-07,
+ "loss": 0.0331,
+ "step": 34635
+ },
+ {
+ "epoch": 94.37602179836512,
+ "grad_norm": 3.057037830352783,
+ "learning_rate": 1.6542931559989316e-07,
+ "loss": 0.0802,
+ "step": 34636
+ },
+ {
+ "epoch": 94.37874659400545,
+ "grad_norm": 1.9381567239761353,
+ "learning_rate": 1.6526949761182076e-07,
+ "loss": 0.0238,
+ "step": 34637
+ },
+ {
+ "epoch": 94.38147138964578,
+ "grad_norm": 2.2974367141723633,
+ "learning_rate": 1.6510975621631177e-07,
+ "loss": 0.028,
+ "step": 34638
+ },
+ {
+ "epoch": 94.3841961852861,
+ "grad_norm": 2.2948877811431885,
+ "learning_rate": 1.6495009141461293e-07,
+ "loss": 0.0575,
+ "step": 34639
+ },
+ {
+ "epoch": 94.38692098092643,
+ "grad_norm": 2.0891711711883545,
+ "learning_rate": 1.6479050320796552e-07,
+ "loss": 0.0268,
+ "step": 34640
+ },
+ {
+ "epoch": 94.38964577656675,
+ "grad_norm": 2.469036340713501,
+ "learning_rate": 1.646309915976141e-07,
+ "loss": 0.0417,
+ "step": 34641
+ },
+ {
+ "epoch": 94.39237057220708,
+ "grad_norm": 2.298543930053711,
+ "learning_rate": 1.6447155658479763e-07,
+ "loss": 0.0302,
+ "step": 34642
+ },
+ {
+ "epoch": 94.39509536784742,
+ "grad_norm": 2.1329193115234375,
+ "learning_rate": 1.6431219817076182e-07,
+ "loss": 0.0637,
+ "step": 34643
+ },
+ {
+ "epoch": 94.39782016348774,
+ "grad_norm": 1.99644136428833,
+ "learning_rate": 1.6415291635674567e-07,
+ "loss": 0.016,
+ "step": 34644
+ },
+ {
+ "epoch": 94.40054495912807,
+ "grad_norm": 3.191816806793213,
+ "learning_rate": 1.6399371114399043e-07,
+ "loss": 0.0399,
+ "step": 34645
+ },
+ {
+ "epoch": 94.40326975476839,
+ "grad_norm": 2.9646823406219482,
+ "learning_rate": 1.6383458253373508e-07,
+ "loss": 0.1386,
+ "step": 34646
+ },
+ {
+ "epoch": 94.40599455040872,
+ "grad_norm": 2.5656116008758545,
+ "learning_rate": 1.6367553052721973e-07,
+ "loss": 0.0417,
+ "step": 34647
+ },
+ {
+ "epoch": 94.40871934604904,
+ "grad_norm": 2.7245559692382812,
+ "learning_rate": 1.6351655512568343e-07,
+ "loss": 0.0449,
+ "step": 34648
+ },
+ {
+ "epoch": 94.41144414168937,
+ "grad_norm": 3.228842258453369,
+ "learning_rate": 1.6335765633036294e-07,
+ "loss": 0.0432,
+ "step": 34649
+ },
+ {
+ "epoch": 94.4141689373297,
+ "grad_norm": 3.2125754356384277,
+ "learning_rate": 1.6319883414249615e-07,
+ "loss": 0.0931,
+ "step": 34650
+ },
+ {
+ "epoch": 94.41689373297002,
+ "grad_norm": 7.564841270446777,
+ "learning_rate": 1.63040088563321e-07,
+ "loss": 0.0781,
+ "step": 34651
+ },
+ {
+ "epoch": 94.41961852861036,
+ "grad_norm": 1.8873380422592163,
+ "learning_rate": 1.62881419594072e-07,
+ "loss": 0.1736,
+ "step": 34652
+ },
+ {
+ "epoch": 94.42234332425068,
+ "grad_norm": 2.9355266094207764,
+ "learning_rate": 1.6272282723598709e-07,
+ "loss": 0.0941,
+ "step": 34653
+ },
+ {
+ "epoch": 94.42506811989101,
+ "grad_norm": 1.7448080778121948,
+ "learning_rate": 1.625643114902986e-07,
+ "loss": 0.0231,
+ "step": 34654
+ },
+ {
+ "epoch": 94.42779291553134,
+ "grad_norm": 2.837740182876587,
+ "learning_rate": 1.6240587235824445e-07,
+ "loss": 0.1172,
+ "step": 34655
+ },
+ {
+ "epoch": 94.43051771117166,
+ "grad_norm": 2.8005638122558594,
+ "learning_rate": 1.6224750984105586e-07,
+ "loss": 0.0266,
+ "step": 34656
+ },
+ {
+ "epoch": 94.433242506812,
+ "grad_norm": 2.181720733642578,
+ "learning_rate": 1.620892239399674e-07,
+ "loss": 0.0925,
+ "step": 34657
+ },
+ {
+ "epoch": 94.43596730245231,
+ "grad_norm": 1.8403340578079224,
+ "learning_rate": 1.6193101465621031e-07,
+ "loss": 0.0208,
+ "step": 34658
+ },
+ {
+ "epoch": 94.43869209809264,
+ "grad_norm": 1.3620636463165283,
+ "learning_rate": 1.6177288199101915e-07,
+ "loss": 0.014,
+ "step": 34659
+ },
+ {
+ "epoch": 94.44141689373296,
+ "grad_norm": 2.899869918823242,
+ "learning_rate": 1.6161482594562404e-07,
+ "loss": 0.0623,
+ "step": 34660
+ },
+ {
+ "epoch": 94.4441416893733,
+ "grad_norm": 3.126708745956421,
+ "learning_rate": 1.6145684652125625e-07,
+ "loss": 0.0266,
+ "step": 34661
+ },
+ {
+ "epoch": 94.44686648501363,
+ "grad_norm": 2.637641668319702,
+ "learning_rate": 1.6129894371914368e-07,
+ "loss": 0.1349,
+ "step": 34662
+ },
+ {
+ "epoch": 94.44959128065395,
+ "grad_norm": 1.7988773584365845,
+ "learning_rate": 1.6114111754051976e-07,
+ "loss": 0.0491,
+ "step": 34663
+ },
+ {
+ "epoch": 94.45231607629428,
+ "grad_norm": 2.367905616760254,
+ "learning_rate": 1.609833679866124e-07,
+ "loss": 0.0518,
+ "step": 34664
+ },
+ {
+ "epoch": 94.4550408719346,
+ "grad_norm": 2.809880018234253,
+ "learning_rate": 1.6082569505865064e-07,
+ "loss": 0.0969,
+ "step": 34665
+ },
+ {
+ "epoch": 94.45776566757493,
+ "grad_norm": 1.9134714603424072,
+ "learning_rate": 1.6066809875786016e-07,
+ "loss": 0.0241,
+ "step": 34666
+ },
+ {
+ "epoch": 94.46049046321527,
+ "grad_norm": 5.269023418426514,
+ "learning_rate": 1.6051057908546997e-07,
+ "loss": 0.0367,
+ "step": 34667
+ },
+ {
+ "epoch": 94.46321525885558,
+ "grad_norm": 1.4486260414123535,
+ "learning_rate": 1.6035313604270798e-07,
+ "loss": 0.026,
+ "step": 34668
+ },
+ {
+ "epoch": 94.46594005449592,
+ "grad_norm": 2.5442888736724854,
+ "learning_rate": 1.6019576963079875e-07,
+ "loss": 0.1106,
+ "step": 34669
+ },
+ {
+ "epoch": 94.46866485013624,
+ "grad_norm": 1.3832812309265137,
+ "learning_rate": 1.6003847985096687e-07,
+ "loss": 0.1066,
+ "step": 34670
+ },
+ {
+ "epoch": 94.47138964577657,
+ "grad_norm": 2.9172377586364746,
+ "learning_rate": 1.5988126670444026e-07,
+ "loss": 0.0438,
+ "step": 34671
+ },
+ {
+ "epoch": 94.47411444141689,
+ "grad_norm": 1.9467462301254272,
+ "learning_rate": 1.5972413019244014e-07,
+ "loss": 0.0671,
+ "step": 34672
+ },
+ {
+ "epoch": 94.47683923705722,
+ "grad_norm": 2.916339159011841,
+ "learning_rate": 1.5956707031619333e-07,
+ "loss": 0.1237,
+ "step": 34673
+ },
+ {
+ "epoch": 94.47956403269755,
+ "grad_norm": 2.2039833068847656,
+ "learning_rate": 1.5941008707691996e-07,
+ "loss": 0.0389,
+ "step": 34674
+ },
+ {
+ "epoch": 94.48228882833787,
+ "grad_norm": 3.202559232711792,
+ "learning_rate": 1.592531804758446e-07,
+ "loss": 0.0786,
+ "step": 34675
+ },
+ {
+ "epoch": 94.4850136239782,
+ "grad_norm": 1.8219290971755981,
+ "learning_rate": 1.590963505141896e-07,
+ "loss": 0.0706,
+ "step": 34676
+ },
+ {
+ "epoch": 94.48773841961852,
+ "grad_norm": 3.4272594451904297,
+ "learning_rate": 1.589395971931751e-07,
+ "loss": 0.1694,
+ "step": 34677
+ },
+ {
+ "epoch": 94.49046321525886,
+ "grad_norm": 3.208918333053589,
+ "learning_rate": 1.5878292051402123e-07,
+ "loss": 0.159,
+ "step": 34678
+ },
+ {
+ "epoch": 94.49318801089919,
+ "grad_norm": 2.3203773498535156,
+ "learning_rate": 1.5862632047795033e-07,
+ "loss": 0.0333,
+ "step": 34679
+ },
+ {
+ "epoch": 94.49591280653951,
+ "grad_norm": 2.039985418319702,
+ "learning_rate": 1.5846979708618038e-07,
+ "loss": 0.089,
+ "step": 34680
+ },
+ {
+ "epoch": 94.49863760217984,
+ "grad_norm": 4.308788299560547,
+ "learning_rate": 1.5831335033993144e-07,
+ "loss": 0.0241,
+ "step": 34681
+ },
+ {
+ "epoch": 94.50136239782016,
+ "grad_norm": 2.6852211952209473,
+ "learning_rate": 1.5815698024042147e-07,
+ "loss": 0.0672,
+ "step": 34682
+ },
+ {
+ "epoch": 94.50408719346049,
+ "grad_norm": 3.191239833831787,
+ "learning_rate": 1.5800068678886726e-07,
+ "loss": 0.0601,
+ "step": 34683
+ },
+ {
+ "epoch": 94.50681198910081,
+ "grad_norm": 2.4062161445617676,
+ "learning_rate": 1.5784446998648784e-07,
+ "loss": 0.0248,
+ "step": 34684
+ },
+ {
+ "epoch": 94.50953678474114,
+ "grad_norm": 2.261762857437134,
+ "learning_rate": 1.5768832983449888e-07,
+ "loss": 0.0362,
+ "step": 34685
+ },
+ {
+ "epoch": 94.51226158038148,
+ "grad_norm": 2.3534913063049316,
+ "learning_rate": 1.57532266334115e-07,
+ "loss": 0.1233,
+ "step": 34686
+ },
+ {
+ "epoch": 94.5149863760218,
+ "grad_norm": 4.368196964263916,
+ "learning_rate": 1.573762794865541e-07,
+ "loss": 0.3018,
+ "step": 34687
+ },
+ {
+ "epoch": 94.51771117166213,
+ "grad_norm": 2.6892006397247314,
+ "learning_rate": 1.5722036929303075e-07,
+ "loss": 0.0598,
+ "step": 34688
+ },
+ {
+ "epoch": 94.52043596730245,
+ "grad_norm": 2.1162848472595215,
+ "learning_rate": 1.5706453575475733e-07,
+ "loss": 0.0225,
+ "step": 34689
+ },
+ {
+ "epoch": 94.52316076294278,
+ "grad_norm": 3.426241874694824,
+ "learning_rate": 1.5690877887294843e-07,
+ "loss": 0.0446,
+ "step": 34690
+ },
+ {
+ "epoch": 94.52588555858311,
+ "grad_norm": 5.542628288269043,
+ "learning_rate": 1.567530986488186e-07,
+ "loss": 0.0381,
+ "step": 34691
+ },
+ {
+ "epoch": 94.52861035422343,
+ "grad_norm": 1.7282050848007202,
+ "learning_rate": 1.5659749508357802e-07,
+ "loss": 0.028,
+ "step": 34692
+ },
+ {
+ "epoch": 94.53133514986376,
+ "grad_norm": 3.235380172729492,
+ "learning_rate": 1.5644196817843904e-07,
+ "loss": 0.0677,
+ "step": 34693
+ },
+ {
+ "epoch": 94.53405994550408,
+ "grad_norm": 2.2509677410125732,
+ "learning_rate": 1.5628651793461292e-07,
+ "loss": 0.0837,
+ "step": 34694
+ },
+ {
+ "epoch": 94.53678474114442,
+ "grad_norm": 2.4903781414031982,
+ "learning_rate": 1.561311443533109e-07,
+ "loss": 0.0388,
+ "step": 34695
+ },
+ {
+ "epoch": 94.53950953678473,
+ "grad_norm": 2.4005839824676514,
+ "learning_rate": 1.55975847435742e-07,
+ "loss": 0.1346,
+ "step": 34696
+ },
+ {
+ "epoch": 94.54223433242507,
+ "grad_norm": 2.1250245571136475,
+ "learning_rate": 1.558206271831175e-07,
+ "loss": 0.1697,
+ "step": 34697
+ },
+ {
+ "epoch": 94.5449591280654,
+ "grad_norm": 2.4313042163848877,
+ "learning_rate": 1.5566548359664423e-07,
+ "loss": 0.0278,
+ "step": 34698
+ },
+ {
+ "epoch": 94.54768392370572,
+ "grad_norm": 2.4750702381134033,
+ "learning_rate": 1.555104166775323e-07,
+ "loss": 0.1176,
+ "step": 34699
+ },
+ {
+ "epoch": 94.55040871934605,
+ "grad_norm": 2.4606995582580566,
+ "learning_rate": 1.5535542642698742e-07,
+ "loss": 0.0412,
+ "step": 34700
+ },
+ {
+ "epoch": 94.55313351498637,
+ "grad_norm": 2.120288848876953,
+ "learning_rate": 1.5520051284621862e-07,
+ "loss": 0.0402,
+ "step": 34701
+ },
+ {
+ "epoch": 94.5558583106267,
+ "grad_norm": 2.3898894786834717,
+ "learning_rate": 1.550456759364316e-07,
+ "loss": 0.0478,
+ "step": 34702
+ },
+ {
+ "epoch": 94.55858310626704,
+ "grad_norm": 1.8887131214141846,
+ "learning_rate": 1.5489091569882986e-07,
+ "loss": 0.0418,
+ "step": 34703
+ },
+ {
+ "epoch": 94.56130790190736,
+ "grad_norm": 2.0389652252197266,
+ "learning_rate": 1.547362321346224e-07,
+ "loss": 0.0515,
+ "step": 34704
+ },
+ {
+ "epoch": 94.56403269754769,
+ "grad_norm": 1.8987900018692017,
+ "learning_rate": 1.5458162524501274e-07,
+ "loss": 0.0426,
+ "step": 34705
+ },
+ {
+ "epoch": 94.566757493188,
+ "grad_norm": 2.3834776878356934,
+ "learning_rate": 1.5442709503120322e-07,
+ "loss": 0.0643,
+ "step": 34706
+ },
+ {
+ "epoch": 94.56948228882834,
+ "grad_norm": 2.5971760749816895,
+ "learning_rate": 1.5427264149439957e-07,
+ "loss": 0.0614,
+ "step": 34707
+ },
+ {
+ "epoch": 94.57220708446866,
+ "grad_norm": 3.2082934379577637,
+ "learning_rate": 1.5411826463580414e-07,
+ "loss": 0.0374,
+ "step": 34708
+ },
+ {
+ "epoch": 94.57493188010899,
+ "grad_norm": 1.9501131772994995,
+ "learning_rate": 1.5396396445661822e-07,
+ "loss": 0.0257,
+ "step": 34709
+ },
+ {
+ "epoch": 94.57765667574932,
+ "grad_norm": 2.9001870155334473,
+ "learning_rate": 1.5380974095804303e-07,
+ "loss": 0.0464,
+ "step": 34710
+ },
+ {
+ "epoch": 94.58038147138964,
+ "grad_norm": 4.064499855041504,
+ "learning_rate": 1.5365559414128207e-07,
+ "loss": 0.0391,
+ "step": 34711
+ },
+ {
+ "epoch": 94.58310626702998,
+ "grad_norm": 3.1410655975341797,
+ "learning_rate": 1.5350152400753326e-07,
+ "loss": 0.0931,
+ "step": 34712
+ },
+ {
+ "epoch": 94.5858310626703,
+ "grad_norm": 3.293938636779785,
+ "learning_rate": 1.533475305579979e-07,
+ "loss": 0.189,
+ "step": 34713
+ },
+ {
+ "epoch": 94.58855585831063,
+ "grad_norm": 3.631631851196289,
+ "learning_rate": 1.5319361379387609e-07,
+ "loss": 0.0344,
+ "step": 34714
+ },
+ {
+ "epoch": 94.59128065395096,
+ "grad_norm": 2.9691922664642334,
+ "learning_rate": 1.530397737163647e-07,
+ "loss": 0.1473,
+ "step": 34715
+ },
+ {
+ "epoch": 94.59400544959128,
+ "grad_norm": 2.1044015884399414,
+ "learning_rate": 1.5288601032666272e-07,
+ "loss": 0.0305,
+ "step": 34716
+ },
+ {
+ "epoch": 94.59673024523161,
+ "grad_norm": 2.1065657138824463,
+ "learning_rate": 1.5273232362596812e-07,
+ "loss": 0.0323,
+ "step": 34717
+ },
+ {
+ "epoch": 94.59945504087193,
+ "grad_norm": 4.500377655029297,
+ "learning_rate": 1.525787136154766e-07,
+ "loss": 0.0367,
+ "step": 34718
+ },
+ {
+ "epoch": 94.60217983651226,
+ "grad_norm": 2.984140157699585,
+ "learning_rate": 1.52425180296385e-07,
+ "loss": 0.0672,
+ "step": 34719
+ },
+ {
+ "epoch": 94.60490463215258,
+ "grad_norm": 1.8051056861877441,
+ "learning_rate": 1.5227172366989006e-07,
+ "loss": 0.0218,
+ "step": 34720
+ },
+ {
+ "epoch": 94.60762942779292,
+ "grad_norm": 2.263307571411133,
+ "learning_rate": 1.5211834373718536e-07,
+ "loss": 0.0372,
+ "step": 34721
+ },
+ {
+ "epoch": 94.61035422343325,
+ "grad_norm": 2.80877423286438,
+ "learning_rate": 1.519650404994666e-07,
+ "loss": 0.0327,
+ "step": 34722
+ },
+ {
+ "epoch": 94.61307901907357,
+ "grad_norm": 2.9288394451141357,
+ "learning_rate": 1.518118139579261e-07,
+ "loss": 0.0445,
+ "step": 34723
+ },
+ {
+ "epoch": 94.6158038147139,
+ "grad_norm": 2.3656704425811768,
+ "learning_rate": 1.516586641137585e-07,
+ "loss": 0.064,
+ "step": 34724
+ },
+ {
+ "epoch": 94.61852861035422,
+ "grad_norm": 2.8486154079437256,
+ "learning_rate": 1.515055909681562e-07,
+ "loss": 0.0574,
+ "step": 34725
+ },
+ {
+ "epoch": 94.62125340599455,
+ "grad_norm": 3.6664655208587646,
+ "learning_rate": 1.5135259452231265e-07,
+ "loss": 0.0231,
+ "step": 34726
+ },
+ {
+ "epoch": 94.62397820163488,
+ "grad_norm": 2.1733145713806152,
+ "learning_rate": 1.5119967477741694e-07,
+ "loss": 0.0218,
+ "step": 34727
+ },
+ {
+ "epoch": 94.6267029972752,
+ "grad_norm": 2.5935847759246826,
+ "learning_rate": 1.5104683173466139e-07,
+ "loss": 0.1029,
+ "step": 34728
+ },
+ {
+ "epoch": 94.62942779291554,
+ "grad_norm": 2.7075705528259277,
+ "learning_rate": 1.508940653952362e-07,
+ "loss": 0.0567,
+ "step": 34729
+ },
+ {
+ "epoch": 94.63215258855585,
+ "grad_norm": 3.5815441608428955,
+ "learning_rate": 1.5074137576033044e-07,
+ "loss": 0.0384,
+ "step": 34730
+ },
+ {
+ "epoch": 94.63487738419619,
+ "grad_norm": 1.7786641120910645,
+ "learning_rate": 1.5058876283113423e-07,
+ "loss": 0.047,
+ "step": 34731
+ },
+ {
+ "epoch": 94.6376021798365,
+ "grad_norm": 2.469461441040039,
+ "learning_rate": 1.504362266088355e-07,
+ "loss": 0.0628,
+ "step": 34732
+ },
+ {
+ "epoch": 94.64032697547684,
+ "grad_norm": 2.8403401374816895,
+ "learning_rate": 1.5028376709462335e-07,
+ "loss": 0.1161,
+ "step": 34733
+ },
+ {
+ "epoch": 94.64305177111717,
+ "grad_norm": 2.908555746078491,
+ "learning_rate": 1.5013138428968344e-07,
+ "loss": 0.0575,
+ "step": 34734
+ },
+ {
+ "epoch": 94.64577656675749,
+ "grad_norm": 2.3483283519744873,
+ "learning_rate": 1.4997907819520373e-07,
+ "loss": 0.0565,
+ "step": 34735
+ },
+ {
+ "epoch": 94.64850136239782,
+ "grad_norm": 6.889547824859619,
+ "learning_rate": 1.4982684881236996e-07,
+ "loss": 0.081,
+ "step": 34736
+ },
+ {
+ "epoch": 94.65122615803814,
+ "grad_norm": 2.152317762374878,
+ "learning_rate": 1.4967469614236673e-07,
+ "loss": 0.0224,
+ "step": 34737
+ },
+ {
+ "epoch": 94.65395095367847,
+ "grad_norm": 1.7832682132720947,
+ "learning_rate": 1.4952262018638087e-07,
+ "loss": 0.0297,
+ "step": 34738
+ },
+ {
+ "epoch": 94.65667574931881,
+ "grad_norm": 2.1328957080841064,
+ "learning_rate": 1.4937062094559584e-07,
+ "loss": 0.0452,
+ "step": 34739
+ },
+ {
+ "epoch": 94.65940054495913,
+ "grad_norm": 4.166618824005127,
+ "learning_rate": 1.4921869842119518e-07,
+ "loss": 0.0283,
+ "step": 34740
+ },
+ {
+ "epoch": 94.66212534059946,
+ "grad_norm": 2.2828242778778076,
+ "learning_rate": 1.4906685261436238e-07,
+ "loss": 0.1821,
+ "step": 34741
+ },
+ {
+ "epoch": 94.66485013623978,
+ "grad_norm": 5.564267158508301,
+ "learning_rate": 1.4891508352627982e-07,
+ "loss": 0.0812,
+ "step": 34742
+ },
+ {
+ "epoch": 94.66757493188011,
+ "grad_norm": 2.802478551864624,
+ "learning_rate": 1.4876339115812878e-07,
+ "loss": 0.0782,
+ "step": 34743
+ },
+ {
+ "epoch": 94.67029972752043,
+ "grad_norm": 2.5819175243377686,
+ "learning_rate": 1.4861177551109273e-07,
+ "loss": 0.0679,
+ "step": 34744
+ },
+ {
+ "epoch": 94.67302452316076,
+ "grad_norm": 2.0222177505493164,
+ "learning_rate": 1.4846023658634967e-07,
+ "loss": 0.0399,
+ "step": 34745
+ },
+ {
+ "epoch": 94.6757493188011,
+ "grad_norm": 3.721381187438965,
+ "learning_rate": 1.4830877438508308e-07,
+ "loss": 0.096,
+ "step": 34746
+ },
+ {
+ "epoch": 94.67847411444141,
+ "grad_norm": 2.32200026512146,
+ "learning_rate": 1.4815738890846864e-07,
+ "loss": 0.0876,
+ "step": 34747
+ },
+ {
+ "epoch": 94.68119891008175,
+ "grad_norm": 2.822448492050171,
+ "learning_rate": 1.4800608015768768e-07,
+ "loss": 0.1562,
+ "step": 34748
+ },
+ {
+ "epoch": 94.68392370572207,
+ "grad_norm": 2.120591640472412,
+ "learning_rate": 1.4785484813391927e-07,
+ "loss": 0.0304,
+ "step": 34749
+ },
+ {
+ "epoch": 94.6866485013624,
+ "grad_norm": 2.949368476867676,
+ "learning_rate": 1.477036928383402e-07,
+ "loss": 0.0335,
+ "step": 34750
+ },
+ {
+ "epoch": 94.68937329700273,
+ "grad_norm": 2.3968918323516846,
+ "learning_rate": 1.475526142721262e-07,
+ "loss": 0.0876,
+ "step": 34751
+ },
+ {
+ "epoch": 94.69209809264305,
+ "grad_norm": 2.2223854064941406,
+ "learning_rate": 1.4740161243645634e-07,
+ "loss": 0.1126,
+ "step": 34752
+ },
+ {
+ "epoch": 94.69482288828338,
+ "grad_norm": 2.491565465927124,
+ "learning_rate": 1.4725068733250636e-07,
+ "loss": 0.0706,
+ "step": 34753
+ },
+ {
+ "epoch": 94.6975476839237,
+ "grad_norm": 2.282160758972168,
+ "learning_rate": 1.4709983896145085e-07,
+ "loss": 0.0501,
+ "step": 34754
+ },
+ {
+ "epoch": 94.70027247956403,
+ "grad_norm": 2.711899757385254,
+ "learning_rate": 1.4694906732446334e-07,
+ "loss": 0.0634,
+ "step": 34755
+ },
+ {
+ "epoch": 94.70299727520435,
+ "grad_norm": 2.785217523574829,
+ "learning_rate": 1.4679837242272065e-07,
+ "loss": 0.0427,
+ "step": 34756
+ },
+ {
+ "epoch": 94.70572207084469,
+ "grad_norm": 2.9921822547912598,
+ "learning_rate": 1.4664775425739408e-07,
+ "loss": 0.1068,
+ "step": 34757
+ },
+ {
+ "epoch": 94.70844686648502,
+ "grad_norm": 3.676082134246826,
+ "learning_rate": 1.4649721282965934e-07,
+ "loss": 0.0345,
+ "step": 34758
+ },
+ {
+ "epoch": 94.71117166212534,
+ "grad_norm": 2.53202486038208,
+ "learning_rate": 1.463467481406855e-07,
+ "loss": 0.0923,
+ "step": 34759
+ },
+ {
+ "epoch": 94.71389645776567,
+ "grad_norm": 2.301422357559204,
+ "learning_rate": 1.4619636019164608e-07,
+ "loss": 0.0299,
+ "step": 34760
+ },
+ {
+ "epoch": 94.71662125340599,
+ "grad_norm": 3.420034170150757,
+ "learning_rate": 1.4604604898371344e-07,
+ "loss": 0.12,
+ "step": 34761
+ },
+ {
+ "epoch": 94.71934604904632,
+ "grad_norm": 3.044668436050415,
+ "learning_rate": 1.4589581451805666e-07,
+ "loss": 0.0365,
+ "step": 34762
+ },
+ {
+ "epoch": 94.72207084468666,
+ "grad_norm": 2.417459726333618,
+ "learning_rate": 1.4574565679584485e-07,
+ "loss": 0.0298,
+ "step": 34763
+ },
+ {
+ "epoch": 94.72479564032697,
+ "grad_norm": 3.5302438735961914,
+ "learning_rate": 1.4559557581825034e-07,
+ "loss": 0.0893,
+ "step": 34764
+ },
+ {
+ "epoch": 94.7275204359673,
+ "grad_norm": 3.776052951812744,
+ "learning_rate": 1.4544557158643892e-07,
+ "loss": 0.1533,
+ "step": 34765
+ },
+ {
+ "epoch": 94.73024523160763,
+ "grad_norm": 2.5752294063568115,
+ "learning_rate": 1.452956441015807e-07,
+ "loss": 0.0309,
+ "step": 34766
+ },
+ {
+ "epoch": 94.73297002724796,
+ "grad_norm": 2.660784959793091,
+ "learning_rate": 1.4514579336484368e-07,
+ "loss": 0.0954,
+ "step": 34767
+ },
+ {
+ "epoch": 94.73569482288828,
+ "grad_norm": 2.7385683059692383,
+ "learning_rate": 1.4499601937739249e-07,
+ "loss": 0.0214,
+ "step": 34768
+ },
+ {
+ "epoch": 94.73841961852861,
+ "grad_norm": 4.5096354484558105,
+ "learning_rate": 1.448463221403962e-07,
+ "loss": 0.0708,
+ "step": 34769
+ },
+ {
+ "epoch": 94.74114441416894,
+ "grad_norm": 3.276843786239624,
+ "learning_rate": 1.4469670165502047e-07,
+ "loss": 0.1191,
+ "step": 34770
+ },
+ {
+ "epoch": 94.74386920980926,
+ "grad_norm": 1.9798550605773926,
+ "learning_rate": 1.445471579224278e-07,
+ "loss": 0.0333,
+ "step": 34771
+ },
+ {
+ "epoch": 94.7465940054496,
+ "grad_norm": 13.764991760253906,
+ "learning_rate": 1.4439769094378498e-07,
+ "loss": 0.1301,
+ "step": 34772
+ },
+ {
+ "epoch": 94.74931880108991,
+ "grad_norm": 2.390716791152954,
+ "learning_rate": 1.4424830072025664e-07,
+ "loss": 0.0536,
+ "step": 34773
+ },
+ {
+ "epoch": 94.75204359673025,
+ "grad_norm": 1.7884615659713745,
+ "learning_rate": 1.440989872530052e-07,
+ "loss": 0.023,
+ "step": 34774
+ },
+ {
+ "epoch": 94.75476839237058,
+ "grad_norm": 2.6902616024017334,
+ "learning_rate": 1.4394975054319305e-07,
+ "loss": 0.0813,
+ "step": 34775
+ },
+ {
+ "epoch": 94.7574931880109,
+ "grad_norm": 3.49226450920105,
+ "learning_rate": 1.438005905919837e-07,
+ "loss": 0.1183,
+ "step": 34776
+ },
+ {
+ "epoch": 94.76021798365123,
+ "grad_norm": 3.289321184158325,
+ "learning_rate": 1.4365150740053735e-07,
+ "loss": 0.0721,
+ "step": 34777
+ },
+ {
+ "epoch": 94.76294277929155,
+ "grad_norm": 2.1775777339935303,
+ "learning_rate": 1.435025009700175e-07,
+ "loss": 0.0245,
+ "step": 34778
+ },
+ {
+ "epoch": 94.76566757493188,
+ "grad_norm": 2.1738474369049072,
+ "learning_rate": 1.43353571301581e-07,
+ "loss": 0.0346,
+ "step": 34779
+ },
+ {
+ "epoch": 94.7683923705722,
+ "grad_norm": 2.144057273864746,
+ "learning_rate": 1.4320471839639027e-07,
+ "loss": 0.1144,
+ "step": 34780
+ },
+ {
+ "epoch": 94.77111716621253,
+ "grad_norm": 2.4447195529937744,
+ "learning_rate": 1.4305594225560438e-07,
+ "loss": 0.0375,
+ "step": 34781
+ },
+ {
+ "epoch": 94.77384196185287,
+ "grad_norm": 2.6953911781311035,
+ "learning_rate": 1.4290724288038016e-07,
+ "loss": 0.0446,
+ "step": 34782
+ },
+ {
+ "epoch": 94.77656675749319,
+ "grad_norm": 2.8725662231445312,
+ "learning_rate": 1.4275862027187893e-07,
+ "loss": 0.0365,
+ "step": 34783
+ },
+ {
+ "epoch": 94.77929155313352,
+ "grad_norm": 2.246803045272827,
+ "learning_rate": 1.4261007443125418e-07,
+ "loss": 0.0665,
+ "step": 34784
+ },
+ {
+ "epoch": 94.78201634877384,
+ "grad_norm": 3.250502586364746,
+ "learning_rate": 1.4246160535966725e-07,
+ "loss": 0.0291,
+ "step": 34785
+ },
+ {
+ "epoch": 94.78474114441417,
+ "grad_norm": 2.5454702377319336,
+ "learning_rate": 1.423132130582705e-07,
+ "loss": 0.0901,
+ "step": 34786
+ },
+ {
+ "epoch": 94.7874659400545,
+ "grad_norm": 4.991804122924805,
+ "learning_rate": 1.4216489752822192e-07,
+ "loss": 0.1351,
+ "step": 34787
+ },
+ {
+ "epoch": 94.79019073569482,
+ "grad_norm": 2.541097640991211,
+ "learning_rate": 1.4201665877067615e-07,
+ "loss": 0.0225,
+ "step": 34788
+ },
+ {
+ "epoch": 94.79291553133515,
+ "grad_norm": 2.268462896347046,
+ "learning_rate": 1.418684967867867e-07,
+ "loss": 0.0845,
+ "step": 34789
+ },
+ {
+ "epoch": 94.79564032697547,
+ "grad_norm": 3.6317033767700195,
+ "learning_rate": 1.4172041157770822e-07,
+ "loss": 0.1054,
+ "step": 34790
+ },
+ {
+ "epoch": 94.7983651226158,
+ "grad_norm": 3.203853130340576,
+ "learning_rate": 1.415724031445942e-07,
+ "loss": 0.0231,
+ "step": 34791
+ },
+ {
+ "epoch": 94.80108991825612,
+ "grad_norm": 1.9054230451583862,
+ "learning_rate": 1.4142447148859706e-07,
+ "loss": 0.0158,
+ "step": 34792
+ },
+ {
+ "epoch": 94.80381471389646,
+ "grad_norm": 2.7306485176086426,
+ "learning_rate": 1.412766166108681e-07,
+ "loss": 0.0643,
+ "step": 34793
+ },
+ {
+ "epoch": 94.80653950953679,
+ "grad_norm": 2.510159730911255,
+ "learning_rate": 1.4112883851256088e-07,
+ "loss": 0.0526,
+ "step": 34794
+ },
+ {
+ "epoch": 94.80926430517711,
+ "grad_norm": 2.6023669242858887,
+ "learning_rate": 1.4098113719482333e-07,
+ "loss": 0.0602,
+ "step": 34795
+ },
+ {
+ "epoch": 94.81198910081744,
+ "grad_norm": 2.7218353748321533,
+ "learning_rate": 1.4083351265880786e-07,
+ "loss": 0.0315,
+ "step": 34796
+ },
+ {
+ "epoch": 94.81471389645776,
+ "grad_norm": 2.2368712425231934,
+ "learning_rate": 1.4068596490566467e-07,
+ "loss": 0.0282,
+ "step": 34797
+ },
+ {
+ "epoch": 94.8174386920981,
+ "grad_norm": 2.698629379272461,
+ "learning_rate": 1.405384939365406e-07,
+ "loss": 0.1544,
+ "step": 34798
+ },
+ {
+ "epoch": 94.82016348773843,
+ "grad_norm": 2.3174290657043457,
+ "learning_rate": 1.403910997525859e-07,
+ "loss": 0.0643,
+ "step": 34799
+ },
+ {
+ "epoch": 94.82288828337875,
+ "grad_norm": 2.633542537689209,
+ "learning_rate": 1.402437823549474e-07,
+ "loss": 0.106,
+ "step": 34800
+ },
+ {
+ "epoch": 94.82561307901908,
+ "grad_norm": 3.1691648960113525,
+ "learning_rate": 1.4009654174477417e-07,
+ "loss": 0.0706,
+ "step": 34801
+ },
+ {
+ "epoch": 94.8283378746594,
+ "grad_norm": 2.363712787628174,
+ "learning_rate": 1.3994937792321085e-07,
+ "loss": 0.0458,
+ "step": 34802
+ },
+ {
+ "epoch": 94.83106267029973,
+ "grad_norm": 2.7807717323303223,
+ "learning_rate": 1.398022908914054e-07,
+ "loss": 0.0264,
+ "step": 34803
+ },
+ {
+ "epoch": 94.83378746594005,
+ "grad_norm": 1.9537835121154785,
+ "learning_rate": 1.3965528065050137e-07,
+ "loss": 0.0303,
+ "step": 34804
+ },
+ {
+ "epoch": 94.83651226158038,
+ "grad_norm": 3.4546995162963867,
+ "learning_rate": 1.3950834720164453e-07,
+ "loss": 0.0301,
+ "step": 34805
+ },
+ {
+ "epoch": 94.83923705722071,
+ "grad_norm": 1.9009343385696411,
+ "learning_rate": 1.3936149054598058e-07,
+ "loss": 0.2329,
+ "step": 34806
+ },
+ {
+ "epoch": 94.84196185286103,
+ "grad_norm": 7.271117210388184,
+ "learning_rate": 1.3921471068465085e-07,
+ "loss": 0.0348,
+ "step": 34807
+ },
+ {
+ "epoch": 94.84468664850137,
+ "grad_norm": 1.2325505018234253,
+ "learning_rate": 1.390680076188e-07,
+ "loss": 0.014,
+ "step": 34808
+ },
+ {
+ "epoch": 94.84741144414168,
+ "grad_norm": 3.228151798248291,
+ "learning_rate": 1.3892138134957045e-07,
+ "loss": 0.0402,
+ "step": 34809
+ },
+ {
+ "epoch": 94.85013623978202,
+ "grad_norm": 2.0668442249298096,
+ "learning_rate": 1.3877483187810348e-07,
+ "loss": 0.0264,
+ "step": 34810
+ },
+ {
+ "epoch": 94.85286103542235,
+ "grad_norm": 2.6093668937683105,
+ "learning_rate": 1.386283592055404e-07,
+ "loss": 0.0447,
+ "step": 34811
+ },
+ {
+ "epoch": 94.85558583106267,
+ "grad_norm": 2.0860109329223633,
+ "learning_rate": 1.3848196333302255e-07,
+ "loss": 0.0235,
+ "step": 34812
+ },
+ {
+ "epoch": 94.858310626703,
+ "grad_norm": 2.5715420246124268,
+ "learning_rate": 1.383356442616901e-07,
+ "loss": 0.0397,
+ "step": 34813
+ },
+ {
+ "epoch": 94.86103542234332,
+ "grad_norm": 2.8539466857910156,
+ "learning_rate": 1.3818940199268216e-07,
+ "loss": 0.0655,
+ "step": 34814
+ },
+ {
+ "epoch": 94.86376021798365,
+ "grad_norm": 2.208131790161133,
+ "learning_rate": 1.380432365271378e-07,
+ "loss": 0.0873,
+ "step": 34815
+ },
+ {
+ "epoch": 94.86648501362397,
+ "grad_norm": 3.4260189533233643,
+ "learning_rate": 1.378971478661939e-07,
+ "loss": 0.0779,
+ "step": 34816
+ },
+ {
+ "epoch": 94.8692098092643,
+ "grad_norm": 2.421434164047241,
+ "learning_rate": 1.3775113601099067e-07,
+ "loss": 0.1207,
+ "step": 34817
+ },
+ {
+ "epoch": 94.87193460490464,
+ "grad_norm": 2.585602283477783,
+ "learning_rate": 1.3760520096266494e-07,
+ "loss": 0.0743,
+ "step": 34818
+ },
+ {
+ "epoch": 94.87465940054496,
+ "grad_norm": 2.9377658367156982,
+ "learning_rate": 1.374593427223514e-07,
+ "loss": 0.1534,
+ "step": 34819
+ },
+ {
+ "epoch": 94.87738419618529,
+ "grad_norm": 2.74346661567688,
+ "learning_rate": 1.373135612911869e-07,
+ "loss": 0.041,
+ "step": 34820
+ },
+ {
+ "epoch": 94.88010899182561,
+ "grad_norm": 2.9906270503997803,
+ "learning_rate": 1.371678566703083e-07,
+ "loss": 0.0464,
+ "step": 34821
+ },
+ {
+ "epoch": 94.88283378746594,
+ "grad_norm": 1.8314659595489502,
+ "learning_rate": 1.3702222886084803e-07,
+ "loss": 0.155,
+ "step": 34822
+ },
+ {
+ "epoch": 94.88555858310627,
+ "grad_norm": 1.394993782043457,
+ "learning_rate": 1.3687667786394188e-07,
+ "loss": 0.0141,
+ "step": 34823
+ },
+ {
+ "epoch": 94.88828337874659,
+ "grad_norm": 3.0631768703460693,
+ "learning_rate": 1.3673120368072224e-07,
+ "loss": 0.0293,
+ "step": 34824
+ },
+ {
+ "epoch": 94.89100817438693,
+ "grad_norm": 3.240985870361328,
+ "learning_rate": 1.3658580631232266e-07,
+ "loss": 0.0798,
+ "step": 34825
+ },
+ {
+ "epoch": 94.89373297002724,
+ "grad_norm": 1.8917561769485474,
+ "learning_rate": 1.3644048575987557e-07,
+ "loss": 0.0424,
+ "step": 34826
+ },
+ {
+ "epoch": 94.89645776566758,
+ "grad_norm": 2.289652109146118,
+ "learning_rate": 1.3629524202451228e-07,
+ "loss": 0.0411,
+ "step": 34827
+ },
+ {
+ "epoch": 94.8991825613079,
+ "grad_norm": 2.186800003051758,
+ "learning_rate": 1.36150075107363e-07,
+ "loss": 0.0278,
+ "step": 34828
+ },
+ {
+ "epoch": 94.90190735694823,
+ "grad_norm": 3.771892547607422,
+ "learning_rate": 1.3600498500956129e-07,
+ "loss": 0.0681,
+ "step": 34829
+ },
+ {
+ "epoch": 94.90463215258856,
+ "grad_norm": 2.043431282043457,
+ "learning_rate": 1.3585997173223396e-07,
+ "loss": 0.0308,
+ "step": 34830
+ },
+ {
+ "epoch": 94.90735694822888,
+ "grad_norm": 2.3939459323883057,
+ "learning_rate": 1.3571503527651352e-07,
+ "loss": 0.0374,
+ "step": 34831
+ },
+ {
+ "epoch": 94.91008174386921,
+ "grad_norm": 3.482168197631836,
+ "learning_rate": 1.355701756435246e-07,
+ "loss": 0.1204,
+ "step": 34832
+ },
+ {
+ "epoch": 94.91280653950953,
+ "grad_norm": 1.9421875476837158,
+ "learning_rate": 1.3542539283439959e-07,
+ "loss": 0.0264,
+ "step": 34833
+ },
+ {
+ "epoch": 94.91553133514986,
+ "grad_norm": 2.034855842590332,
+ "learning_rate": 1.3528068685026208e-07,
+ "loss": 0.0312,
+ "step": 34834
+ },
+ {
+ "epoch": 94.9182561307902,
+ "grad_norm": 3.001547336578369,
+ "learning_rate": 1.3513605769224225e-07,
+ "loss": 0.0714,
+ "step": 34835
+ },
+ {
+ "epoch": 94.92098092643052,
+ "grad_norm": 4.648657321929932,
+ "learning_rate": 1.3499150536146588e-07,
+ "loss": 0.1142,
+ "step": 34836
+ },
+ {
+ "epoch": 94.92370572207085,
+ "grad_norm": 1.7883365154266357,
+ "learning_rate": 1.3484702985905763e-07,
+ "loss": 0.0209,
+ "step": 34837
+ },
+ {
+ "epoch": 94.92643051771117,
+ "grad_norm": 2.4563634395599365,
+ "learning_rate": 1.3470263118614324e-07,
+ "loss": 0.0313,
+ "step": 34838
+ },
+ {
+ "epoch": 94.9291553133515,
+ "grad_norm": 3.1272811889648438,
+ "learning_rate": 1.345583093438474e-07,
+ "loss": 0.0541,
+ "step": 34839
+ },
+ {
+ "epoch": 94.93188010899182,
+ "grad_norm": 2.5367186069488525,
+ "learning_rate": 1.3441406433329362e-07,
+ "loss": 0.0364,
+ "step": 34840
+ },
+ {
+ "epoch": 94.93460490463215,
+ "grad_norm": 2.2692346572875977,
+ "learning_rate": 1.3426989615560548e-07,
+ "loss": 0.0676,
+ "step": 34841
+ },
+ {
+ "epoch": 94.93732970027249,
+ "grad_norm": 1.523105263710022,
+ "learning_rate": 1.3412580481190651e-07,
+ "loss": 0.0242,
+ "step": 34842
+ },
+ {
+ "epoch": 94.9400544959128,
+ "grad_norm": 2.6941287517547607,
+ "learning_rate": 1.3398179030331805e-07,
+ "loss": 0.1296,
+ "step": 34843
+ },
+ {
+ "epoch": 94.94277929155314,
+ "grad_norm": 3.5964252948760986,
+ "learning_rate": 1.3383785263096138e-07,
+ "loss": 0.0895,
+ "step": 34844
+ },
+ {
+ "epoch": 94.94550408719346,
+ "grad_norm": 2.8641791343688965,
+ "learning_rate": 1.3369399179595787e-07,
+ "loss": 0.0594,
+ "step": 34845
+ },
+ {
+ "epoch": 94.94822888283379,
+ "grad_norm": 3.23000168800354,
+ "learning_rate": 1.3355020779942883e-07,
+ "loss": 0.0459,
+ "step": 34846
+ },
+ {
+ "epoch": 94.95095367847412,
+ "grad_norm": 2.3119685649871826,
+ "learning_rate": 1.3340650064249337e-07,
+ "loss": 0.0358,
+ "step": 34847
+ },
+ {
+ "epoch": 94.95367847411444,
+ "grad_norm": 2.7140254974365234,
+ "learning_rate": 1.3326287032626838e-07,
+ "loss": 0.2672,
+ "step": 34848
+ },
+ {
+ "epoch": 94.95640326975477,
+ "grad_norm": 1.8845314979553223,
+ "learning_rate": 1.331193168518774e-07,
+ "loss": 0.0227,
+ "step": 34849
+ },
+ {
+ "epoch": 94.95912806539509,
+ "grad_norm": 3.730475664138794,
+ "learning_rate": 1.3297584022043396e-07,
+ "loss": 0.0285,
+ "step": 34850
+ },
+ {
+ "epoch": 94.96185286103542,
+ "grad_norm": 1.4961528778076172,
+ "learning_rate": 1.328324404330572e-07,
+ "loss": 0.0202,
+ "step": 34851
+ },
+ {
+ "epoch": 94.96457765667574,
+ "grad_norm": 2.212015151977539,
+ "learning_rate": 1.32689117490864e-07,
+ "loss": 0.0771,
+ "step": 34852
+ },
+ {
+ "epoch": 94.96730245231608,
+ "grad_norm": 2.486266851425171,
+ "learning_rate": 1.325458713949701e-07,
+ "loss": 0.0441,
+ "step": 34853
+ },
+ {
+ "epoch": 94.97002724795641,
+ "grad_norm": 2.460434675216675,
+ "learning_rate": 1.3240270214649242e-07,
+ "loss": 0.0419,
+ "step": 34854
+ },
+ {
+ "epoch": 94.97275204359673,
+ "grad_norm": 3.0918476581573486,
+ "learning_rate": 1.322596097465445e-07,
+ "loss": 0.1347,
+ "step": 34855
+ },
+ {
+ "epoch": 94.97547683923706,
+ "grad_norm": 3.1286609172821045,
+ "learning_rate": 1.3211659419624102e-07,
+ "loss": 0.0341,
+ "step": 34856
+ },
+ {
+ "epoch": 94.97820163487738,
+ "grad_norm": 2.5470151901245117,
+ "learning_rate": 1.319736554966955e-07,
+ "loss": 0.0253,
+ "step": 34857
+ },
+ {
+ "epoch": 94.98092643051771,
+ "grad_norm": 1.877874493598938,
+ "learning_rate": 1.3183079364902153e-07,
+ "loss": 0.0297,
+ "step": 34858
+ },
+ {
+ "epoch": 94.98365122615803,
+ "grad_norm": 2.961230516433716,
+ "learning_rate": 1.3168800865433262e-07,
+ "loss": 0.0691,
+ "step": 34859
+ },
+ {
+ "epoch": 94.98637602179836,
+ "grad_norm": 2.6252262592315674,
+ "learning_rate": 1.3154530051373904e-07,
+ "loss": 0.0482,
+ "step": 34860
+ },
+ {
+ "epoch": 94.9891008174387,
+ "grad_norm": 3.1088922023773193,
+ "learning_rate": 1.3140266922835322e-07,
+ "loss": 0.1247,
+ "step": 34861
+ },
+ {
+ "epoch": 94.99182561307902,
+ "grad_norm": 2.101668119430542,
+ "learning_rate": 1.3126011479928646e-07,
+ "loss": 0.0299,
+ "step": 34862
+ },
+ {
+ "epoch": 94.99455040871935,
+ "grad_norm": 2.313483476638794,
+ "learning_rate": 1.3111763722764792e-07,
+ "loss": 0.0253,
+ "step": 34863
+ },
+ {
+ "epoch": 94.99727520435967,
+ "grad_norm": 2.9240059852600098,
+ "learning_rate": 1.3097523651454668e-07,
+ "loss": 0.0541,
+ "step": 34864
+ },
+ {
+ "epoch": 95.0,
+ "grad_norm": 3.7429819107055664,
+ "learning_rate": 1.30832912661093e-07,
+ "loss": 0.0527,
+ "step": 34865
+ },
+ {
+ "epoch": 95.00272479564033,
+ "grad_norm": 2.7895829677581787,
+ "learning_rate": 1.3069066566839594e-07,
+ "loss": 0.1409,
+ "step": 34866
+ },
+ {
+ "epoch": 95.00544959128065,
+ "grad_norm": 2.324601888656616,
+ "learning_rate": 1.3054849553756243e-07,
+ "loss": 0.03,
+ "step": 34867
+ },
+ {
+ "epoch": 95.00817438692098,
+ "grad_norm": 2.12203049659729,
+ "learning_rate": 1.3040640226969824e-07,
+ "loss": 0.0517,
+ "step": 34868
+ },
+ {
+ "epoch": 95.0108991825613,
+ "grad_norm": 3.364262104034424,
+ "learning_rate": 1.3026438586591138e-07,
+ "loss": 0.0823,
+ "step": 34869
+ },
+ {
+ "epoch": 95.01362397820164,
+ "grad_norm": 2.6119232177734375,
+ "learning_rate": 1.3012244632730876e-07,
+ "loss": 0.0527,
+ "step": 34870
+ },
+ {
+ "epoch": 95.01634877384195,
+ "grad_norm": 2.1571426391601562,
+ "learning_rate": 1.29980583654995e-07,
+ "loss": 0.0944,
+ "step": 34871
+ },
+ {
+ "epoch": 95.01907356948229,
+ "grad_norm": 1.6402757167816162,
+ "learning_rate": 1.298387978500737e-07,
+ "loss": 0.0158,
+ "step": 34872
+ },
+ {
+ "epoch": 95.02179836512262,
+ "grad_norm": 2.856287956237793,
+ "learning_rate": 1.2969708891365063e-07,
+ "loss": 0.0481,
+ "step": 34873
+ },
+ {
+ "epoch": 95.02452316076294,
+ "grad_norm": 3.9047768115997314,
+ "learning_rate": 1.2955545684682935e-07,
+ "loss": 0.0425,
+ "step": 34874
+ },
+ {
+ "epoch": 95.02724795640327,
+ "grad_norm": 2.873523473739624,
+ "learning_rate": 1.2941390165071232e-07,
+ "loss": 0.0315,
+ "step": 34875
+ },
+ {
+ "epoch": 95.02997275204359,
+ "grad_norm": 2.794736862182617,
+ "learning_rate": 1.292724233264031e-07,
+ "loss": 0.04,
+ "step": 34876
+ },
+ {
+ "epoch": 95.03269754768392,
+ "grad_norm": 1.4680901765823364,
+ "learning_rate": 1.2913102187500083e-07,
+ "loss": 0.0192,
+ "step": 34877
+ },
+ {
+ "epoch": 95.03542234332426,
+ "grad_norm": 2.1529393196105957,
+ "learning_rate": 1.2898969729760903e-07,
+ "loss": 0.2289,
+ "step": 34878
+ },
+ {
+ "epoch": 95.03814713896458,
+ "grad_norm": 3.5629093647003174,
+ "learning_rate": 1.2884844959532795e-07,
+ "loss": 0.0351,
+ "step": 34879
+ },
+ {
+ "epoch": 95.04087193460491,
+ "grad_norm": 4.032271862030029,
+ "learning_rate": 1.287072787692567e-07,
+ "loss": 0.1118,
+ "step": 34880
+ },
+ {
+ "epoch": 95.04359673024523,
+ "grad_norm": 2.075810670852661,
+ "learning_rate": 1.2856618482049664e-07,
+ "loss": 0.1547,
+ "step": 34881
+ },
+ {
+ "epoch": 95.04632152588556,
+ "grad_norm": 1.9002879858016968,
+ "learning_rate": 1.284251677501458e-07,
+ "loss": 0.0226,
+ "step": 34882
+ },
+ {
+ "epoch": 95.04904632152588,
+ "grad_norm": 3.5459165573120117,
+ "learning_rate": 1.2828422755930103e-07,
+ "loss": 0.0554,
+ "step": 34883
+ },
+ {
+ "epoch": 95.05177111716621,
+ "grad_norm": 2.863830089569092,
+ "learning_rate": 1.2814336424906038e-07,
+ "loss": 0.0791,
+ "step": 34884
+ },
+ {
+ "epoch": 95.05449591280654,
+ "grad_norm": 3.0242042541503906,
+ "learning_rate": 1.2800257782052183e-07,
+ "loss": 0.0974,
+ "step": 34885
+ },
+ {
+ "epoch": 95.05722070844686,
+ "grad_norm": 1.5003838539123535,
+ "learning_rate": 1.2786186827478231e-07,
+ "loss": 0.0198,
+ "step": 34886
+ },
+ {
+ "epoch": 95.0599455040872,
+ "grad_norm": 2.3934693336486816,
+ "learning_rate": 1.2772123561293648e-07,
+ "loss": 0.0198,
+ "step": 34887
+ },
+ {
+ "epoch": 95.06267029972751,
+ "grad_norm": 2.5218911170959473,
+ "learning_rate": 1.2758067983608013e-07,
+ "loss": 0.0914,
+ "step": 34888
+ },
+ {
+ "epoch": 95.06539509536785,
+ "grad_norm": 3.184844493865967,
+ "learning_rate": 1.2744020094530684e-07,
+ "loss": 0.1183,
+ "step": 34889
+ },
+ {
+ "epoch": 95.06811989100818,
+ "grad_norm": 4.118417739868164,
+ "learning_rate": 1.272997989417124e-07,
+ "loss": 0.124,
+ "step": 34890
+ },
+ {
+ "epoch": 95.0708446866485,
+ "grad_norm": 4.425246238708496,
+ "learning_rate": 1.2715947382638927e-07,
+ "loss": 0.0249,
+ "step": 34891
+ },
+ {
+ "epoch": 95.07356948228883,
+ "grad_norm": 2.5153684616088867,
+ "learning_rate": 1.27019225600431e-07,
+ "loss": 0.089,
+ "step": 34892
+ },
+ {
+ "epoch": 95.07629427792915,
+ "grad_norm": 2.478933572769165,
+ "learning_rate": 1.2687905426492786e-07,
+ "loss": 0.1829,
+ "step": 34893
+ },
+ {
+ "epoch": 95.07901907356948,
+ "grad_norm": 3.415781259536743,
+ "learning_rate": 1.267389598209734e-07,
+ "loss": 0.0884,
+ "step": 34894
+ },
+ {
+ "epoch": 95.0817438692098,
+ "grad_norm": 2.6993184089660645,
+ "learning_rate": 1.2659894226965896e-07,
+ "loss": 0.0449,
+ "step": 34895
+ },
+ {
+ "epoch": 95.08446866485014,
+ "grad_norm": 3.928115129470825,
+ "learning_rate": 1.264590016120737e-07,
+ "loss": 0.1692,
+ "step": 34896
+ },
+ {
+ "epoch": 95.08719346049047,
+ "grad_norm": 2.283688545227051,
+ "learning_rate": 1.2631913784930673e-07,
+ "loss": 0.0338,
+ "step": 34897
+ },
+ {
+ "epoch": 95.08991825613079,
+ "grad_norm": 2.976043939590454,
+ "learning_rate": 1.261793509824505e-07,
+ "loss": 0.0985,
+ "step": 34898
+ },
+ {
+ "epoch": 95.09264305177112,
+ "grad_norm": 3.0505940914154053,
+ "learning_rate": 1.260396410125908e-07,
+ "loss": 0.0369,
+ "step": 34899
+ },
+ {
+ "epoch": 95.09536784741144,
+ "grad_norm": 2.1225483417510986,
+ "learning_rate": 1.2590000794081681e-07,
+ "loss": 0.0746,
+ "step": 34900
+ },
+ {
+ "epoch": 95.09809264305177,
+ "grad_norm": 2.9096975326538086,
+ "learning_rate": 1.2576045176821429e-07,
+ "loss": 0.1006,
+ "step": 34901
+ },
+ {
+ "epoch": 95.1008174386921,
+ "grad_norm": 3.1333768367767334,
+ "learning_rate": 1.2562097249587235e-07,
+ "loss": 0.0552,
+ "step": 34902
+ },
+ {
+ "epoch": 95.10354223433242,
+ "grad_norm": 2.8274359703063965,
+ "learning_rate": 1.2548157012487684e-07,
+ "loss": 0.0454,
+ "step": 34903
+ },
+ {
+ "epoch": 95.10626702997276,
+ "grad_norm": 2.766693353652954,
+ "learning_rate": 1.253422446563135e-07,
+ "loss": 0.1045,
+ "step": 34904
+ },
+ {
+ "epoch": 95.10899182561307,
+ "grad_norm": 2.684654474258423,
+ "learning_rate": 1.2520299609126597e-07,
+ "loss": 0.1276,
+ "step": 34905
+ },
+ {
+ "epoch": 95.11171662125341,
+ "grad_norm": 2.9204459190368652,
+ "learning_rate": 1.250638244308211e-07,
+ "loss": 0.0339,
+ "step": 34906
+ },
+ {
+ "epoch": 95.11444141689373,
+ "grad_norm": 2.671907901763916,
+ "learning_rate": 1.2492472967606028e-07,
+ "loss": 0.0387,
+ "step": 34907
+ },
+ {
+ "epoch": 95.11716621253406,
+ "grad_norm": 2.584839105606079,
+ "learning_rate": 1.247857118280682e-07,
+ "loss": 0.0333,
+ "step": 34908
+ },
+ {
+ "epoch": 95.11989100817439,
+ "grad_norm": 1.9556174278259277,
+ "learning_rate": 1.246467708879262e-07,
+ "loss": 0.0238,
+ "step": 34909
+ },
+ {
+ "epoch": 95.12261580381471,
+ "grad_norm": 2.7594969272613525,
+ "learning_rate": 1.2450790685671898e-07,
+ "loss": 0.0455,
+ "step": 34910
+ },
+ {
+ "epoch": 95.12534059945504,
+ "grad_norm": 2.3766114711761475,
+ "learning_rate": 1.2436911973552567e-07,
+ "loss": 0.0196,
+ "step": 34911
+ },
+ {
+ "epoch": 95.12806539509536,
+ "grad_norm": 2.2204349040985107,
+ "learning_rate": 1.2423040952542764e-07,
+ "loss": 0.0708,
+ "step": 34912
+ },
+ {
+ "epoch": 95.1307901907357,
+ "grad_norm": 1.9182202816009521,
+ "learning_rate": 1.2409177622750511e-07,
+ "loss": 0.0375,
+ "step": 34913
+ },
+ {
+ "epoch": 95.13351498637603,
+ "grad_norm": 1.9348313808441162,
+ "learning_rate": 1.2395321984283836e-07,
+ "loss": 0.0236,
+ "step": 34914
+ },
+ {
+ "epoch": 95.13623978201635,
+ "grad_norm": 2.7442848682403564,
+ "learning_rate": 1.238147403725054e-07,
+ "loss": 0.0482,
+ "step": 34915
+ },
+ {
+ "epoch": 95.13896457765668,
+ "grad_norm": 2.229963779449463,
+ "learning_rate": 1.236763378175865e-07,
+ "loss": 0.0523,
+ "step": 34916
+ },
+ {
+ "epoch": 95.141689373297,
+ "grad_norm": 2.6778433322906494,
+ "learning_rate": 1.235380121791574e-07,
+ "loss": 0.0208,
+ "step": 34917
+ },
+ {
+ "epoch": 95.14441416893733,
+ "grad_norm": 2.4531588554382324,
+ "learning_rate": 1.233997634582973e-07,
+ "loss": 0.0577,
+ "step": 34918
+ },
+ {
+ "epoch": 95.14713896457765,
+ "grad_norm": 2.508636474609375,
+ "learning_rate": 1.2326159165608086e-07,
+ "loss": 0.0738,
+ "step": 34919
+ },
+ {
+ "epoch": 95.14986376021798,
+ "grad_norm": 2.7733452320098877,
+ "learning_rate": 1.2312349677358615e-07,
+ "loss": 0.0658,
+ "step": 34920
+ },
+ {
+ "epoch": 95.15258855585832,
+ "grad_norm": 2.0371108055114746,
+ "learning_rate": 1.2298547881188672e-07,
+ "loss": 0.0215,
+ "step": 34921
+ },
+ {
+ "epoch": 95.15531335149863,
+ "grad_norm": 2.1744349002838135,
+ "learning_rate": 1.228475377720595e-07,
+ "loss": 0.0386,
+ "step": 34922
+ },
+ {
+ "epoch": 95.15803814713897,
+ "grad_norm": 2.2133798599243164,
+ "learning_rate": 1.2270967365517694e-07,
+ "loss": 0.0324,
+ "step": 34923
+ },
+ {
+ "epoch": 95.16076294277929,
+ "grad_norm": 2.2831597328186035,
+ "learning_rate": 1.2257188646231487e-07,
+ "loss": 0.0644,
+ "step": 34924
+ },
+ {
+ "epoch": 95.16348773841962,
+ "grad_norm": 2.0685505867004395,
+ "learning_rate": 1.2243417619454356e-07,
+ "loss": 0.0373,
+ "step": 34925
+ },
+ {
+ "epoch": 95.16621253405995,
+ "grad_norm": 2.232891321182251,
+ "learning_rate": 1.2229654285293767e-07,
+ "loss": 0.0218,
+ "step": 34926
+ },
+ {
+ "epoch": 95.16893732970027,
+ "grad_norm": 2.931797981262207,
+ "learning_rate": 1.221589864385686e-07,
+ "loss": 0.0796,
+ "step": 34927
+ },
+ {
+ "epoch": 95.1716621253406,
+ "grad_norm": 1.7469284534454346,
+ "learning_rate": 1.220215069525077e-07,
+ "loss": 0.021,
+ "step": 34928
+ },
+ {
+ "epoch": 95.17438692098092,
+ "grad_norm": 1.9482605457305908,
+ "learning_rate": 1.218841043958241e-07,
+ "loss": 0.0509,
+ "step": 34929
+ },
+ {
+ "epoch": 95.17711171662125,
+ "grad_norm": 1.85743248462677,
+ "learning_rate": 1.217467787695903e-07,
+ "loss": 0.0395,
+ "step": 34930
+ },
+ {
+ "epoch": 95.17983651226157,
+ "grad_norm": 3.2541394233703613,
+ "learning_rate": 1.216095300748743e-07,
+ "loss": 0.1675,
+ "step": 34931
+ },
+ {
+ "epoch": 95.1825613079019,
+ "grad_norm": 4.0061421394348145,
+ "learning_rate": 1.214723583127464e-07,
+ "loss": 0.0344,
+ "step": 34932
+ },
+ {
+ "epoch": 95.18528610354224,
+ "grad_norm": 1.9873977899551392,
+ "learning_rate": 1.2133526348427237e-07,
+ "loss": 0.147,
+ "step": 34933
+ },
+ {
+ "epoch": 95.18801089918256,
+ "grad_norm": 3.1552674770355225,
+ "learning_rate": 1.211982455905214e-07,
+ "loss": 0.0817,
+ "step": 34934
+ },
+ {
+ "epoch": 95.19073569482289,
+ "grad_norm": 3.555838108062744,
+ "learning_rate": 1.210613046325615e-07,
+ "loss": 0.0433,
+ "step": 34935
+ },
+ {
+ "epoch": 95.19346049046321,
+ "grad_norm": 5.451581954956055,
+ "learning_rate": 1.2092444061145737e-07,
+ "loss": 0.0562,
+ "step": 34936
+ },
+ {
+ "epoch": 95.19618528610354,
+ "grad_norm": 2.656935453414917,
+ "learning_rate": 1.2078765352827591e-07,
+ "loss": 0.0331,
+ "step": 34937
+ },
+ {
+ "epoch": 95.19891008174388,
+ "grad_norm": 1.7232446670532227,
+ "learning_rate": 1.206509433840819e-07,
+ "loss": 0.0239,
+ "step": 34938
+ },
+ {
+ "epoch": 95.2016348773842,
+ "grad_norm": 2.219930410385132,
+ "learning_rate": 1.205143101799411e-07,
+ "loss": 0.0266,
+ "step": 34939
+ },
+ {
+ "epoch": 95.20435967302453,
+ "grad_norm": 2.011101722717285,
+ "learning_rate": 1.2037775391691708e-07,
+ "loss": 0.0352,
+ "step": 34940
+ },
+ {
+ "epoch": 95.20708446866485,
+ "grad_norm": 3.57807993888855,
+ "learning_rate": 1.2024127459607237e-07,
+ "loss": 0.0253,
+ "step": 34941
+ },
+ {
+ "epoch": 95.20980926430518,
+ "grad_norm": 4.179675102233887,
+ "learning_rate": 1.2010487221847056e-07,
+ "loss": 0.0483,
+ "step": 34942
+ },
+ {
+ "epoch": 95.2125340599455,
+ "grad_norm": 2.4080264568328857,
+ "learning_rate": 1.199685467851741e-07,
+ "loss": 0.0838,
+ "step": 34943
+ },
+ {
+ "epoch": 95.21525885558583,
+ "grad_norm": 4.186582088470459,
+ "learning_rate": 1.1983229829724552e-07,
+ "loss": 0.1244,
+ "step": 34944
+ },
+ {
+ "epoch": 95.21798365122616,
+ "grad_norm": 2.866173267364502,
+ "learning_rate": 1.1969612675574394e-07,
+ "loss": 0.0232,
+ "step": 34945
+ },
+ {
+ "epoch": 95.22070844686648,
+ "grad_norm": 3.340458869934082,
+ "learning_rate": 1.1956003216173184e-07,
+ "loss": 0.0741,
+ "step": 34946
+ },
+ {
+ "epoch": 95.22343324250681,
+ "grad_norm": 1.252720832824707,
+ "learning_rate": 1.194240145162673e-07,
+ "loss": 0.0143,
+ "step": 34947
+ },
+ {
+ "epoch": 95.22615803814713,
+ "grad_norm": 2.7562851905822754,
+ "learning_rate": 1.1928807382041163e-07,
+ "loss": 0.0262,
+ "step": 34948
+ },
+ {
+ "epoch": 95.22888283378747,
+ "grad_norm": 2.7015018463134766,
+ "learning_rate": 1.1915221007522182e-07,
+ "loss": 0.0258,
+ "step": 34949
+ },
+ {
+ "epoch": 95.2316076294278,
+ "grad_norm": 3.2789742946624756,
+ "learning_rate": 1.1901642328175589e-07,
+ "loss": 0.1718,
+ "step": 34950
+ },
+ {
+ "epoch": 95.23433242506812,
+ "grad_norm": 2.6375033855438232,
+ "learning_rate": 1.1888071344107299e-07,
+ "loss": 0.0342,
+ "step": 34951
+ },
+ {
+ "epoch": 95.23705722070845,
+ "grad_norm": 1.6955173015594482,
+ "learning_rate": 1.1874508055422895e-07,
+ "loss": 0.0219,
+ "step": 34952
+ },
+ {
+ "epoch": 95.23978201634877,
+ "grad_norm": 2.1850240230560303,
+ "learning_rate": 1.1860952462227959e-07,
+ "loss": 0.2059,
+ "step": 34953
+ },
+ {
+ "epoch": 95.2425068119891,
+ "grad_norm": 3.0885190963745117,
+ "learning_rate": 1.1847404564628185e-07,
+ "loss": 0.2006,
+ "step": 34954
+ },
+ {
+ "epoch": 95.24523160762942,
+ "grad_norm": 5.636951923370361,
+ "learning_rate": 1.1833864362729042e-07,
+ "loss": 0.1476,
+ "step": 34955
+ },
+ {
+ "epoch": 95.24795640326975,
+ "grad_norm": 2.7337357997894287,
+ "learning_rate": 1.1820331856635891e-07,
+ "loss": 0.0357,
+ "step": 34956
+ },
+ {
+ "epoch": 95.25068119891009,
+ "grad_norm": 2.0418336391448975,
+ "learning_rate": 1.1806807046454205e-07,
+ "loss": 0.0322,
+ "step": 34957
+ },
+ {
+ "epoch": 95.2534059945504,
+ "grad_norm": 4.560342311859131,
+ "learning_rate": 1.1793289932289343e-07,
+ "loss": 0.0235,
+ "step": 34958
+ },
+ {
+ "epoch": 95.25613079019074,
+ "grad_norm": 2.69103741645813,
+ "learning_rate": 1.1779780514246442e-07,
+ "loss": 0.0459,
+ "step": 34959
+ },
+ {
+ "epoch": 95.25885558583106,
+ "grad_norm": 4.488551139831543,
+ "learning_rate": 1.1766278792430974e-07,
+ "loss": 0.0322,
+ "step": 34960
+ },
+ {
+ "epoch": 95.26158038147139,
+ "grad_norm": 2.9406447410583496,
+ "learning_rate": 1.1752784766947744e-07,
+ "loss": 0.071,
+ "step": 34961
+ },
+ {
+ "epoch": 95.26430517711172,
+ "grad_norm": 3.2513558864593506,
+ "learning_rate": 1.1739298437902114e-07,
+ "loss": 0.0599,
+ "step": 34962
+ },
+ {
+ "epoch": 95.26702997275204,
+ "grad_norm": 1.8449701070785522,
+ "learning_rate": 1.1725819805398997e-07,
+ "loss": 0.0858,
+ "step": 34963
+ },
+ {
+ "epoch": 95.26975476839237,
+ "grad_norm": 2.264432668685913,
+ "learning_rate": 1.1712348869543421e-07,
+ "loss": 0.0307,
+ "step": 34964
+ },
+ {
+ "epoch": 95.2724795640327,
+ "grad_norm": 3.0598464012145996,
+ "learning_rate": 1.1698885630440193e-07,
+ "loss": 0.127,
+ "step": 34965
+ },
+ {
+ "epoch": 95.27520435967303,
+ "grad_norm": 5.287500858306885,
+ "learning_rate": 1.1685430088194227e-07,
+ "loss": 0.0581,
+ "step": 34966
+ },
+ {
+ "epoch": 95.27792915531334,
+ "grad_norm": 2.593297004699707,
+ "learning_rate": 1.167198224291044e-07,
+ "loss": 0.0199,
+ "step": 34967
+ },
+ {
+ "epoch": 95.28065395095368,
+ "grad_norm": 3.269404411315918,
+ "learning_rate": 1.1658542094693415e-07,
+ "loss": 0.159,
+ "step": 34968
+ },
+ {
+ "epoch": 95.28337874659401,
+ "grad_norm": 2.7901294231414795,
+ "learning_rate": 1.1645109643647734e-07,
+ "loss": 0.0303,
+ "step": 34969
+ },
+ {
+ "epoch": 95.28610354223433,
+ "grad_norm": 1.7133756875991821,
+ "learning_rate": 1.1631684889878203e-07,
+ "loss": 0.157,
+ "step": 34970
+ },
+ {
+ "epoch": 95.28882833787466,
+ "grad_norm": 2.4325482845306396,
+ "learning_rate": 1.1618267833489294e-07,
+ "loss": 0.0488,
+ "step": 34971
+ },
+ {
+ "epoch": 95.29155313351498,
+ "grad_norm": 2.3382508754730225,
+ "learning_rate": 1.160485847458559e-07,
+ "loss": 0.0534,
+ "step": 34972
+ },
+ {
+ "epoch": 95.29427792915531,
+ "grad_norm": 1.6980870962142944,
+ "learning_rate": 1.159145681327134e-07,
+ "loss": 0.025,
+ "step": 34973
+ },
+ {
+ "epoch": 95.29700272479565,
+ "grad_norm": 3.9710137844085693,
+ "learning_rate": 1.1578062849651017e-07,
+ "loss": 0.0851,
+ "step": 34974
+ },
+ {
+ "epoch": 95.29972752043597,
+ "grad_norm": 2.86478328704834,
+ "learning_rate": 1.1564676583828982e-07,
+ "loss": 0.0642,
+ "step": 34975
+ },
+ {
+ "epoch": 95.3024523160763,
+ "grad_norm": 3.3024609088897705,
+ "learning_rate": 1.1551298015909373e-07,
+ "loss": 0.0735,
+ "step": 34976
+ },
+ {
+ "epoch": 95.30517711171662,
+ "grad_norm": 2.7386791706085205,
+ "learning_rate": 1.1537927145996441e-07,
+ "loss": 0.0259,
+ "step": 34977
+ },
+ {
+ "epoch": 95.30790190735695,
+ "grad_norm": 2.7702622413635254,
+ "learning_rate": 1.1524563974194325e-07,
+ "loss": 0.0774,
+ "step": 34978
+ },
+ {
+ "epoch": 95.31062670299727,
+ "grad_norm": 2.326133966445923,
+ "learning_rate": 1.1511208500607163e-07,
+ "loss": 0.0227,
+ "step": 34979
+ },
+ {
+ "epoch": 95.3133514986376,
+ "grad_norm": 6.5108723640441895,
+ "learning_rate": 1.1497860725338872e-07,
+ "loss": 0.0345,
+ "step": 34980
+ },
+ {
+ "epoch": 95.31607629427793,
+ "grad_norm": 3.1286725997924805,
+ "learning_rate": 1.148452064849337e-07,
+ "loss": 0.0433,
+ "step": 34981
+ },
+ {
+ "epoch": 95.31880108991825,
+ "grad_norm": 1.9681954383850098,
+ "learning_rate": 1.1471188270174571e-07,
+ "loss": 0.0226,
+ "step": 34982
+ },
+ {
+ "epoch": 95.32152588555859,
+ "grad_norm": 2.716500997543335,
+ "learning_rate": 1.1457863590486507e-07,
+ "loss": 0.0421,
+ "step": 34983
+ },
+ {
+ "epoch": 95.3242506811989,
+ "grad_norm": 2.188465118408203,
+ "learning_rate": 1.1444546609532648e-07,
+ "loss": 0.0491,
+ "step": 34984
+ },
+ {
+ "epoch": 95.32697547683924,
+ "grad_norm": 2.2012417316436768,
+ "learning_rate": 1.1431237327416911e-07,
+ "loss": 0.054,
+ "step": 34985
+ },
+ {
+ "epoch": 95.32970027247957,
+ "grad_norm": 2.2194905281066895,
+ "learning_rate": 1.1417935744242769e-07,
+ "loss": 0.1597,
+ "step": 34986
+ },
+ {
+ "epoch": 95.33242506811989,
+ "grad_norm": 2.5500473976135254,
+ "learning_rate": 1.140464186011403e-07,
+ "loss": 0.0604,
+ "step": 34987
+ },
+ {
+ "epoch": 95.33514986376022,
+ "grad_norm": 2.875729560852051,
+ "learning_rate": 1.1391355675134164e-07,
+ "loss": 0.0867,
+ "step": 34988
+ },
+ {
+ "epoch": 95.33787465940054,
+ "grad_norm": 2.884606122970581,
+ "learning_rate": 1.1378077189406422e-07,
+ "loss": 0.0252,
+ "step": 34989
+ },
+ {
+ "epoch": 95.34059945504087,
+ "grad_norm": 2.349778890609741,
+ "learning_rate": 1.13648064030345e-07,
+ "loss": 0.0254,
+ "step": 34990
+ },
+ {
+ "epoch": 95.34332425068119,
+ "grad_norm": 2.657801628112793,
+ "learning_rate": 1.135154331612165e-07,
+ "loss": 0.0343,
+ "step": 34991
+ },
+ {
+ "epoch": 95.34604904632153,
+ "grad_norm": 3.0789895057678223,
+ "learning_rate": 1.133828792877123e-07,
+ "loss": 0.1523,
+ "step": 34992
+ },
+ {
+ "epoch": 95.34877384196186,
+ "grad_norm": 2.754234790802002,
+ "learning_rate": 1.1325040241086383e-07,
+ "loss": 0.0944,
+ "step": 34993
+ },
+ {
+ "epoch": 95.35149863760218,
+ "grad_norm": 1.4009101390838623,
+ "learning_rate": 1.1311800253170246e-07,
+ "loss": 0.017,
+ "step": 34994
+ },
+ {
+ "epoch": 95.35422343324251,
+ "grad_norm": 2.27170467376709,
+ "learning_rate": 1.1298567965125962e-07,
+ "loss": 0.0333,
+ "step": 34995
+ },
+ {
+ "epoch": 95.35694822888283,
+ "grad_norm": 2.2349345684051514,
+ "learning_rate": 1.1285343377056668e-07,
+ "loss": 0.0234,
+ "step": 34996
+ },
+ {
+ "epoch": 95.35967302452316,
+ "grad_norm": 2.849677562713623,
+ "learning_rate": 1.1272126489065283e-07,
+ "loss": 0.0922,
+ "step": 34997
+ },
+ {
+ "epoch": 95.3623978201635,
+ "grad_norm": 3.9061155319213867,
+ "learning_rate": 1.1258917301254724e-07,
+ "loss": 0.0728,
+ "step": 34998
+ },
+ {
+ "epoch": 95.36512261580381,
+ "grad_norm": 2.703514575958252,
+ "learning_rate": 1.1245715813727908e-07,
+ "loss": 0.0204,
+ "step": 34999
+ },
+ {
+ "epoch": 95.36784741144415,
+ "grad_norm": 4.365962505340576,
+ "learning_rate": 1.1232522026587755e-07,
+ "loss": 0.1399,
+ "step": 35000
+ },
+ {
+ "epoch": 95.37057220708446,
+ "grad_norm": 3.200329065322876,
+ "learning_rate": 1.1219335939936738e-07,
+ "loss": 0.1848,
+ "step": 35001
+ },
+ {
+ "epoch": 95.3732970027248,
+ "grad_norm": 2.2563517093658447,
+ "learning_rate": 1.1206157553877772e-07,
+ "loss": 0.0317,
+ "step": 35002
+ },
+ {
+ "epoch": 95.37602179836512,
+ "grad_norm": 2.1221606731414795,
+ "learning_rate": 1.1192986868513445e-07,
+ "loss": 0.0275,
+ "step": 35003
+ },
+ {
+ "epoch": 95.37874659400545,
+ "grad_norm": 4.090084075927734,
+ "learning_rate": 1.1179823883946228e-07,
+ "loss": 0.0462,
+ "step": 35004
+ },
+ {
+ "epoch": 95.38147138964578,
+ "grad_norm": 3.4763824939727783,
+ "learning_rate": 1.1166668600278818e-07,
+ "loss": 0.1238,
+ "step": 35005
+ },
+ {
+ "epoch": 95.3841961852861,
+ "grad_norm": 1.9323807954788208,
+ "learning_rate": 1.1153521017613467e-07,
+ "loss": 0.0498,
+ "step": 35006
+ },
+ {
+ "epoch": 95.38692098092643,
+ "grad_norm": 3.275866985321045,
+ "learning_rate": 1.1140381136052758e-07,
+ "loss": 0.0597,
+ "step": 35007
+ },
+ {
+ "epoch": 95.38964577656675,
+ "grad_norm": 2.1088693141937256,
+ "learning_rate": 1.1127248955698833e-07,
+ "loss": 0.0225,
+ "step": 35008
+ },
+ {
+ "epoch": 95.39237057220708,
+ "grad_norm": 3.1419129371643066,
+ "learning_rate": 1.1114124476654164e-07,
+ "loss": 0.0229,
+ "step": 35009
+ },
+ {
+ "epoch": 95.39509536784742,
+ "grad_norm": 2.0916402339935303,
+ "learning_rate": 1.1101007699020782e-07,
+ "loss": 0.0295,
+ "step": 35010
+ },
+ {
+ "epoch": 95.39782016348774,
+ "grad_norm": 2.159738779067993,
+ "learning_rate": 1.108789862290105e-07,
+ "loss": 0.0459,
+ "step": 35011
+ },
+ {
+ "epoch": 95.40054495912807,
+ "grad_norm": 1.6449337005615234,
+ "learning_rate": 1.1074797248396884e-07,
+ "loss": 0.0187,
+ "step": 35012
+ },
+ {
+ "epoch": 95.40326975476839,
+ "grad_norm": 2.5766232013702393,
+ "learning_rate": 1.1061703575610316e-07,
+ "loss": 0.0264,
+ "step": 35013
+ },
+ {
+ "epoch": 95.40599455040872,
+ "grad_norm": 2.9680097103118896,
+ "learning_rate": 1.1048617604643374e-07,
+ "loss": 0.0848,
+ "step": 35014
+ },
+ {
+ "epoch": 95.40871934604904,
+ "grad_norm": 2.2628979682922363,
+ "learning_rate": 1.1035539335598089e-07,
+ "loss": 0.0191,
+ "step": 35015
+ },
+ {
+ "epoch": 95.41144414168937,
+ "grad_norm": 2.8828155994415283,
+ "learning_rate": 1.1022468768576044e-07,
+ "loss": 0.0382,
+ "step": 35016
+ },
+ {
+ "epoch": 95.4141689373297,
+ "grad_norm": 3.371868133544922,
+ "learning_rate": 1.1009405903679271e-07,
+ "loss": 0.0622,
+ "step": 35017
+ },
+ {
+ "epoch": 95.41689373297002,
+ "grad_norm": 2.551166296005249,
+ "learning_rate": 1.0996350741009355e-07,
+ "loss": 0.0514,
+ "step": 35018
+ },
+ {
+ "epoch": 95.41961852861036,
+ "grad_norm": 2.7263717651367188,
+ "learning_rate": 1.0983303280668101e-07,
+ "loss": 0.0601,
+ "step": 35019
+ },
+ {
+ "epoch": 95.42234332425068,
+ "grad_norm": 3.4563968181610107,
+ "learning_rate": 1.0970263522756985e-07,
+ "loss": 0.0473,
+ "step": 35020
+ },
+ {
+ "epoch": 95.42506811989101,
+ "grad_norm": 2.899994373321533,
+ "learning_rate": 1.0957231467377704e-07,
+ "loss": 0.0742,
+ "step": 35021
+ },
+ {
+ "epoch": 95.42779291553134,
+ "grad_norm": 2.167938709259033,
+ "learning_rate": 1.0944207114631622e-07,
+ "loss": 0.0417,
+ "step": 35022
+ },
+ {
+ "epoch": 95.43051771117166,
+ "grad_norm": 1.9148547649383545,
+ "learning_rate": 1.09311904646201e-07,
+ "loss": 0.0265,
+ "step": 35023
+ },
+ {
+ "epoch": 95.433242506812,
+ "grad_norm": 2.099299669265747,
+ "learning_rate": 1.0918181517444836e-07,
+ "loss": 0.0368,
+ "step": 35024
+ },
+ {
+ "epoch": 95.43596730245231,
+ "grad_norm": 2.237480401992798,
+ "learning_rate": 1.0905180273206862e-07,
+ "loss": 0.0728,
+ "step": 35025
+ },
+ {
+ "epoch": 95.43869209809264,
+ "grad_norm": 10.043222427368164,
+ "learning_rate": 1.0892186732007538e-07,
+ "loss": 0.2052,
+ "step": 35026
+ },
+ {
+ "epoch": 95.44141689373296,
+ "grad_norm": 2.3342204093933105,
+ "learning_rate": 1.0879200893947895e-07,
+ "loss": 0.0426,
+ "step": 35027
+ },
+ {
+ "epoch": 95.4441416893733,
+ "grad_norm": 2.1813864707946777,
+ "learning_rate": 1.0866222759129296e-07,
+ "loss": 0.0953,
+ "step": 35028
+ },
+ {
+ "epoch": 95.44686648501363,
+ "grad_norm": 2.487837553024292,
+ "learning_rate": 1.0853252327652775e-07,
+ "loss": 0.0555,
+ "step": 35029
+ },
+ {
+ "epoch": 95.44959128065395,
+ "grad_norm": 2.4842350482940674,
+ "learning_rate": 1.0840289599619247e-07,
+ "loss": 0.0201,
+ "step": 35030
+ },
+ {
+ "epoch": 95.45231607629428,
+ "grad_norm": 7.030800819396973,
+ "learning_rate": 1.0827334575129633e-07,
+ "loss": 0.0904,
+ "step": 35031
+ },
+ {
+ "epoch": 95.4550408719346,
+ "grad_norm": 3.4436264038085938,
+ "learning_rate": 1.0814387254284964e-07,
+ "loss": 0.0826,
+ "step": 35032
+ },
+ {
+ "epoch": 95.45776566757493,
+ "grad_norm": 4.5369086265563965,
+ "learning_rate": 1.0801447637186047e-07,
+ "loss": 0.033,
+ "step": 35033
+ },
+ {
+ "epoch": 95.46049046321527,
+ "grad_norm": 2.9388928413391113,
+ "learning_rate": 1.0788515723933579e-07,
+ "loss": 0.0466,
+ "step": 35034
+ },
+ {
+ "epoch": 95.46321525885558,
+ "grad_norm": 9.000701904296875,
+ "learning_rate": 1.077559151462837e-07,
+ "loss": 0.1025,
+ "step": 35035
+ },
+ {
+ "epoch": 95.46594005449592,
+ "grad_norm": 1.9095757007598877,
+ "learning_rate": 1.0762675009370893e-07,
+ "loss": 0.0186,
+ "step": 35036
+ },
+ {
+ "epoch": 95.46866485013624,
+ "grad_norm": 2.6702628135681152,
+ "learning_rate": 1.0749766208261959e-07,
+ "loss": 0.0462,
+ "step": 35037
+ },
+ {
+ "epoch": 95.47138964577657,
+ "grad_norm": 2.052314519882202,
+ "learning_rate": 1.073686511140204e-07,
+ "loss": 0.0338,
+ "step": 35038
+ },
+ {
+ "epoch": 95.47411444141689,
+ "grad_norm": 3.0173497200012207,
+ "learning_rate": 1.0723971718891502e-07,
+ "loss": 0.0507,
+ "step": 35039
+ },
+ {
+ "epoch": 95.47683923705722,
+ "grad_norm": 2.7834537029266357,
+ "learning_rate": 1.071108603083082e-07,
+ "loss": 0.0232,
+ "step": 35040
+ },
+ {
+ "epoch": 95.47956403269755,
+ "grad_norm": 3.012296199798584,
+ "learning_rate": 1.0698208047320358e-07,
+ "loss": 0.0333,
+ "step": 35041
+ },
+ {
+ "epoch": 95.48228882833787,
+ "grad_norm": 2.0441133975982666,
+ "learning_rate": 1.068533776846048e-07,
+ "loss": 0.1981,
+ "step": 35042
+ },
+ {
+ "epoch": 95.4850136239782,
+ "grad_norm": 2.503466844558716,
+ "learning_rate": 1.0672475194351328e-07,
+ "loss": 0.1128,
+ "step": 35043
+ },
+ {
+ "epoch": 95.48773841961852,
+ "grad_norm": 3.115562915802002,
+ "learning_rate": 1.0659620325093045e-07,
+ "loss": 0.1557,
+ "step": 35044
+ },
+ {
+ "epoch": 95.49046321525886,
+ "grad_norm": 3.1295604705810547,
+ "learning_rate": 1.0646773160785884e-07,
+ "loss": 0.1138,
+ "step": 35045
+ },
+ {
+ "epoch": 95.49318801089919,
+ "grad_norm": 1.9670004844665527,
+ "learning_rate": 1.0633933701529764e-07,
+ "loss": 0.0264,
+ "step": 35046
+ },
+ {
+ "epoch": 95.49591280653951,
+ "grad_norm": 2.5413930416107178,
+ "learning_rate": 1.0621101947424717e-07,
+ "loss": 0.0849,
+ "step": 35047
+ },
+ {
+ "epoch": 95.49863760217984,
+ "grad_norm": 4.066226482391357,
+ "learning_rate": 1.0608277898570663e-07,
+ "loss": 0.1332,
+ "step": 35048
+ },
+ {
+ "epoch": 95.50136239782016,
+ "grad_norm": 2.419011354446411,
+ "learning_rate": 1.0595461555067521e-07,
+ "loss": 0.0991,
+ "step": 35049
+ },
+ {
+ "epoch": 95.50408719346049,
+ "grad_norm": 2.352062702178955,
+ "learning_rate": 1.0582652917015101e-07,
+ "loss": 0.02,
+ "step": 35050
+ },
+ {
+ "epoch": 95.50681198910081,
+ "grad_norm": 4.402019023895264,
+ "learning_rate": 1.0569851984513102e-07,
+ "loss": 0.0727,
+ "step": 35051
+ },
+ {
+ "epoch": 95.50953678474114,
+ "grad_norm": 2.710862398147583,
+ "learning_rate": 1.0557058757661331e-07,
+ "loss": 0.0717,
+ "step": 35052
+ },
+ {
+ "epoch": 95.51226158038148,
+ "grad_norm": 3.1294167041778564,
+ "learning_rate": 1.0544273236559266e-07,
+ "loss": 0.0402,
+ "step": 35053
+ },
+ {
+ "epoch": 95.5149863760218,
+ "grad_norm": 2.3434746265411377,
+ "learning_rate": 1.0531495421306492e-07,
+ "loss": 0.0988,
+ "step": 35054
+ },
+ {
+ "epoch": 95.51771117166213,
+ "grad_norm": 7.592291831970215,
+ "learning_rate": 1.0518725312002709e-07,
+ "loss": 0.0843,
+ "step": 35055
+ },
+ {
+ "epoch": 95.52043596730245,
+ "grad_norm": 3.7560784816741943,
+ "learning_rate": 1.0505962908747281e-07,
+ "loss": 0.051,
+ "step": 35056
+ },
+ {
+ "epoch": 95.52316076294278,
+ "grad_norm": 2.4683263301849365,
+ "learning_rate": 1.0493208211639349e-07,
+ "loss": 0.0423,
+ "step": 35057
+ },
+ {
+ "epoch": 95.52588555858311,
+ "grad_norm": 2.3147597312927246,
+ "learning_rate": 1.0480461220778725e-07,
+ "loss": 0.0788,
+ "step": 35058
+ },
+ {
+ "epoch": 95.52861035422343,
+ "grad_norm": 1.7609657049179077,
+ "learning_rate": 1.0467721936264219e-07,
+ "loss": 0.0219,
+ "step": 35059
+ },
+ {
+ "epoch": 95.53133514986376,
+ "grad_norm": 1.9314008951187134,
+ "learning_rate": 1.0454990358195305e-07,
+ "loss": 0.0304,
+ "step": 35060
+ },
+ {
+ "epoch": 95.53405994550408,
+ "grad_norm": 2.434859037399292,
+ "learning_rate": 1.0442266486671126e-07,
+ "loss": 0.0556,
+ "step": 35061
+ },
+ {
+ "epoch": 95.53678474114442,
+ "grad_norm": 2.1970648765563965,
+ "learning_rate": 1.0429550321790716e-07,
+ "loss": 0.0566,
+ "step": 35062
+ },
+ {
+ "epoch": 95.53950953678473,
+ "grad_norm": 3.4781670570373535,
+ "learning_rate": 1.0416841863653105e-07,
+ "loss": 0.04,
+ "step": 35063
+ },
+ {
+ "epoch": 95.54223433242507,
+ "grad_norm": 2.1384620666503906,
+ "learning_rate": 1.0404141112357325e-07,
+ "loss": 0.0196,
+ "step": 35064
+ },
+ {
+ "epoch": 95.5449591280654,
+ "grad_norm": 1.8867310285568237,
+ "learning_rate": 1.0391448068002185e-07,
+ "loss": 0.0286,
+ "step": 35065
+ },
+ {
+ "epoch": 95.54768392370572,
+ "grad_norm": 2.1695098876953125,
+ "learning_rate": 1.0378762730686609e-07,
+ "loss": 0.0344,
+ "step": 35066
+ },
+ {
+ "epoch": 95.55040871934605,
+ "grad_norm": 2.2543327808380127,
+ "learning_rate": 1.0366085100509405e-07,
+ "loss": 0.0485,
+ "step": 35067
+ },
+ {
+ "epoch": 95.55313351498637,
+ "grad_norm": 2.3990397453308105,
+ "learning_rate": 1.0353415177569271e-07,
+ "loss": 0.024,
+ "step": 35068
+ },
+ {
+ "epoch": 95.5558583106267,
+ "grad_norm": 4.668440818786621,
+ "learning_rate": 1.0340752961964795e-07,
+ "loss": 0.1383,
+ "step": 35069
+ },
+ {
+ "epoch": 95.55858310626704,
+ "grad_norm": 3.2616732120513916,
+ "learning_rate": 1.0328098453794788e-07,
+ "loss": 0.1184,
+ "step": 35070
+ },
+ {
+ "epoch": 95.56130790190736,
+ "grad_norm": 2.650279998779297,
+ "learning_rate": 1.0315451653157615e-07,
+ "loss": 0.0627,
+ "step": 35071
+ },
+ {
+ "epoch": 95.56403269754769,
+ "grad_norm": 3.5118069648742676,
+ "learning_rate": 1.0302812560151976e-07,
+ "loss": 0.084,
+ "step": 35072
+ },
+ {
+ "epoch": 95.566757493188,
+ "grad_norm": 2.4976346492767334,
+ "learning_rate": 1.0290181174876124e-07,
+ "loss": 0.1904,
+ "step": 35073
+ },
+ {
+ "epoch": 95.56948228882834,
+ "grad_norm": 2.72570538520813,
+ "learning_rate": 1.0277557497428536e-07,
+ "loss": 0.0304,
+ "step": 35074
+ },
+ {
+ "epoch": 95.57220708446866,
+ "grad_norm": 4.170415878295898,
+ "learning_rate": 1.0264941527907247e-07,
+ "loss": 0.1321,
+ "step": 35075
+ },
+ {
+ "epoch": 95.57493188010899,
+ "grad_norm": 4.140685081481934,
+ "learning_rate": 1.0252333266410952e-07,
+ "loss": 0.0586,
+ "step": 35076
+ },
+ {
+ "epoch": 95.57765667574932,
+ "grad_norm": 2.057738780975342,
+ "learning_rate": 1.0239732713037576e-07,
+ "loss": 0.0273,
+ "step": 35077
+ },
+ {
+ "epoch": 95.58038147138964,
+ "grad_norm": 1.8662406206130981,
+ "learning_rate": 1.0227139867885371e-07,
+ "loss": 0.059,
+ "step": 35078
+ },
+ {
+ "epoch": 95.58310626702998,
+ "grad_norm": 2.9774651527404785,
+ "learning_rate": 1.0214554731052261e-07,
+ "loss": 0.0301,
+ "step": 35079
+ },
+ {
+ "epoch": 95.5858310626703,
+ "grad_norm": 1.653913974761963,
+ "learning_rate": 1.020197730263639e-07,
+ "loss": 0.0138,
+ "step": 35080
+ },
+ {
+ "epoch": 95.58855585831063,
+ "grad_norm": 1.8388270139694214,
+ "learning_rate": 1.0189407582735566e-07,
+ "loss": 0.0581,
+ "step": 35081
+ },
+ {
+ "epoch": 95.59128065395096,
+ "grad_norm": 3.453791379928589,
+ "learning_rate": 1.0176845571447936e-07,
+ "loss": 0.0999,
+ "step": 35082
+ },
+ {
+ "epoch": 95.59400544959128,
+ "grad_norm": 3.2059035301208496,
+ "learning_rate": 1.0164291268870974e-07,
+ "loss": 0.0825,
+ "step": 35083
+ },
+ {
+ "epoch": 95.59673024523161,
+ "grad_norm": 1.9955600500106812,
+ "learning_rate": 1.0151744675102826e-07,
+ "loss": 0.0237,
+ "step": 35084
+ },
+ {
+ "epoch": 95.59945504087193,
+ "grad_norm": 2.2362756729125977,
+ "learning_rate": 1.0139205790240969e-07,
+ "loss": 0.0336,
+ "step": 35085
+ },
+ {
+ "epoch": 95.60217983651226,
+ "grad_norm": 2.192676067352295,
+ "learning_rate": 1.0126674614383214e-07,
+ "loss": 0.1018,
+ "step": 35086
+ },
+ {
+ "epoch": 95.60490463215258,
+ "grad_norm": 3.1578562259674072,
+ "learning_rate": 1.0114151147626927e-07,
+ "loss": 0.1314,
+ "step": 35087
+ },
+ {
+ "epoch": 95.60762942779292,
+ "grad_norm": 2.281991958618164,
+ "learning_rate": 1.0101635390069809e-07,
+ "loss": 0.032,
+ "step": 35088
+ },
+ {
+ "epoch": 95.61035422343325,
+ "grad_norm": 1.8152971267700195,
+ "learning_rate": 1.0089127341809336e-07,
+ "loss": 0.0204,
+ "step": 35089
+ },
+ {
+ "epoch": 95.61307901907357,
+ "grad_norm": 2.4973959922790527,
+ "learning_rate": 1.0076627002942873e-07,
+ "loss": 0.0382,
+ "step": 35090
+ },
+ {
+ "epoch": 95.6158038147139,
+ "grad_norm": 2.242245674133301,
+ "learning_rate": 1.006413437356768e-07,
+ "loss": 0.0788,
+ "step": 35091
+ },
+ {
+ "epoch": 95.61852861035422,
+ "grad_norm": 3.0806093215942383,
+ "learning_rate": 1.0051649453781231e-07,
+ "loss": 0.0406,
+ "step": 35092
+ },
+ {
+ "epoch": 95.62125340599455,
+ "grad_norm": 2.292752265930176,
+ "learning_rate": 1.0039172243680673e-07,
+ "loss": 0.0349,
+ "step": 35093
+ },
+ {
+ "epoch": 95.62397820163488,
+ "grad_norm": 3.0341873168945312,
+ "learning_rate": 1.0026702743363148e-07,
+ "loss": 0.0481,
+ "step": 35094
+ },
+ {
+ "epoch": 95.6267029972752,
+ "grad_norm": 2.9238197803497314,
+ "learning_rate": 1.0014240952925803e-07,
+ "loss": 0.0355,
+ "step": 35095
+ },
+ {
+ "epoch": 95.62942779291554,
+ "grad_norm": 3.0007381439208984,
+ "learning_rate": 1.000178687246578e-07,
+ "loss": 0.1112,
+ "step": 35096
+ },
+ {
+ "epoch": 95.63215258855585,
+ "grad_norm": 2.056663990020752,
+ "learning_rate": 9.989340502079891e-08,
+ "loss": 0.0726,
+ "step": 35097
+ },
+ {
+ "epoch": 95.63487738419619,
+ "grad_norm": 2.571248769760132,
+ "learning_rate": 9.976901841865172e-08,
+ "loss": 0.0842,
+ "step": 35098
+ },
+ {
+ "epoch": 95.6376021798365,
+ "grad_norm": 3.0214622020721436,
+ "learning_rate": 9.964470891918431e-08,
+ "loss": 0.1119,
+ "step": 35099
+ },
+ {
+ "epoch": 95.64032697547684,
+ "grad_norm": 2.4208412170410156,
+ "learning_rate": 9.952047652336594e-08,
+ "loss": 0.0899,
+ "step": 35100
+ },
+ {
+ "epoch": 95.64305177111717,
+ "grad_norm": 4.0630974769592285,
+ "learning_rate": 9.939632123216359e-08,
+ "loss": 0.1332,
+ "step": 35101
+ },
+ {
+ "epoch": 95.64577656675749,
+ "grad_norm": 2.8814077377319336,
+ "learning_rate": 9.927224304654315e-08,
+ "loss": 0.1247,
+ "step": 35102
+ },
+ {
+ "epoch": 95.64850136239782,
+ "grad_norm": 1.5603978633880615,
+ "learning_rate": 9.914824196747274e-08,
+ "loss": 0.0197,
+ "step": 35103
+ },
+ {
+ "epoch": 95.65122615803814,
+ "grad_norm": 3.7697665691375732,
+ "learning_rate": 9.902431799591605e-08,
+ "loss": 0.0686,
+ "step": 35104
+ },
+ {
+ "epoch": 95.65395095367847,
+ "grad_norm": 1.7513145208358765,
+ "learning_rate": 9.890047113284118e-08,
+ "loss": 0.0263,
+ "step": 35105
+ },
+ {
+ "epoch": 95.65667574931881,
+ "grad_norm": 2.5381932258605957,
+ "learning_rate": 9.877670137920958e-08,
+ "loss": 0.1025,
+ "step": 35106
+ },
+ {
+ "epoch": 95.65940054495913,
+ "grad_norm": 2.0419929027557373,
+ "learning_rate": 9.865300873598605e-08,
+ "loss": 0.0169,
+ "step": 35107
+ },
+ {
+ "epoch": 95.66212534059946,
+ "grad_norm": 2.7394063472747803,
+ "learning_rate": 9.852939320413424e-08,
+ "loss": 0.0265,
+ "step": 35108
+ },
+ {
+ "epoch": 95.66485013623978,
+ "grad_norm": 2.241105079650879,
+ "learning_rate": 9.840585478461673e-08,
+ "loss": 0.0373,
+ "step": 35109
+ },
+ {
+ "epoch": 95.66757493188011,
+ "grad_norm": 3.284921646118164,
+ "learning_rate": 9.828239347839607e-08,
+ "loss": 0.0297,
+ "step": 35110
+ },
+ {
+ "epoch": 95.67029972752043,
+ "grad_norm": 2.441310167312622,
+ "learning_rate": 9.815900928643374e-08,
+ "loss": 0.055,
+ "step": 35111
+ },
+ {
+ "epoch": 95.67302452316076,
+ "grad_norm": 2.2745747566223145,
+ "learning_rate": 9.803570220969006e-08,
+ "loss": 0.0336,
+ "step": 35112
+ },
+ {
+ "epoch": 95.6757493188011,
+ "grad_norm": 2.1112680435180664,
+ "learning_rate": 9.791247224912647e-08,
+ "loss": 0.0533,
+ "step": 35113
+ },
+ {
+ "epoch": 95.67847411444141,
+ "grad_norm": 2.212068796157837,
+ "learning_rate": 9.778931940570113e-08,
+ "loss": 0.0273,
+ "step": 35114
+ },
+ {
+ "epoch": 95.68119891008175,
+ "grad_norm": 1.7880301475524902,
+ "learning_rate": 9.766624368037436e-08,
+ "loss": 0.0239,
+ "step": 35115
+ },
+ {
+ "epoch": 95.68392370572207,
+ "grad_norm": 2.708158254623413,
+ "learning_rate": 9.754324507410317e-08,
+ "loss": 0.0559,
+ "step": 35116
+ },
+ {
+ "epoch": 95.6866485013624,
+ "grad_norm": 2.7598323822021484,
+ "learning_rate": 9.742032358784681e-08,
+ "loss": 0.0802,
+ "step": 35117
+ },
+ {
+ "epoch": 95.68937329700273,
+ "grad_norm": 1.3291863203048706,
+ "learning_rate": 9.729747922256228e-08,
+ "loss": 0.1452,
+ "step": 35118
+ },
+ {
+ "epoch": 95.69209809264305,
+ "grad_norm": 2.062356472015381,
+ "learning_rate": 9.717471197920658e-08,
+ "loss": 0.0476,
+ "step": 35119
+ },
+ {
+ "epoch": 95.69482288828338,
+ "grad_norm": 3.2122371196746826,
+ "learning_rate": 9.705202185873563e-08,
+ "loss": 0.0231,
+ "step": 35120
+ },
+ {
+ "epoch": 95.6975476839237,
+ "grad_norm": 1.874733328819275,
+ "learning_rate": 9.692940886210422e-08,
+ "loss": 0.0655,
+ "step": 35121
+ },
+ {
+ "epoch": 95.70027247956403,
+ "grad_norm": 2.1043713092803955,
+ "learning_rate": 9.680687299026826e-08,
+ "loss": 0.0402,
+ "step": 35122
+ },
+ {
+ "epoch": 95.70299727520435,
+ "grad_norm": 2.0644664764404297,
+ "learning_rate": 9.66844142441814e-08,
+ "loss": 0.0464,
+ "step": 35123
+ },
+ {
+ "epoch": 95.70572207084469,
+ "grad_norm": 2.392665147781372,
+ "learning_rate": 9.656203262479735e-08,
+ "loss": 0.031,
+ "step": 35124
+ },
+ {
+ "epoch": 95.70844686648502,
+ "grad_norm": 2.3267199993133545,
+ "learning_rate": 9.64397281330709e-08,
+ "loss": 0.0273,
+ "step": 35125
+ },
+ {
+ "epoch": 95.71117166212534,
+ "grad_norm": 2.2901506423950195,
+ "learning_rate": 9.631750076995128e-08,
+ "loss": 0.0514,
+ "step": 35126
+ },
+ {
+ "epoch": 95.71389645776567,
+ "grad_norm": 1.840728521347046,
+ "learning_rate": 9.619535053639328e-08,
+ "loss": 0.0261,
+ "step": 35127
+ },
+ {
+ "epoch": 95.71662125340599,
+ "grad_norm": 2.655202627182007,
+ "learning_rate": 9.607327743334616e-08,
+ "loss": 0.0269,
+ "step": 35128
+ },
+ {
+ "epoch": 95.71934604904632,
+ "grad_norm": 2.934680223464966,
+ "learning_rate": 9.595128146176247e-08,
+ "loss": 0.1405,
+ "step": 35129
+ },
+ {
+ "epoch": 95.72207084468666,
+ "grad_norm": 1.86601722240448,
+ "learning_rate": 9.582936262259146e-08,
+ "loss": 0.0825,
+ "step": 35130
+ },
+ {
+ "epoch": 95.72479564032697,
+ "grad_norm": 3.856334686279297,
+ "learning_rate": 9.570752091678237e-08,
+ "loss": 0.1767,
+ "step": 35131
+ },
+ {
+ "epoch": 95.7275204359673,
+ "grad_norm": 1.8248963356018066,
+ "learning_rate": 9.558575634528444e-08,
+ "loss": 0.0625,
+ "step": 35132
+ },
+ {
+ "epoch": 95.73024523160763,
+ "grad_norm": 2.632397174835205,
+ "learning_rate": 9.54640689090458e-08,
+ "loss": 0.0634,
+ "step": 35133
+ },
+ {
+ "epoch": 95.73297002724796,
+ "grad_norm": 2.9107959270477295,
+ "learning_rate": 9.534245860901347e-08,
+ "loss": 0.0526,
+ "step": 35134
+ },
+ {
+ "epoch": 95.73569482288828,
+ "grad_norm": 2.6701486110687256,
+ "learning_rate": 9.522092544613671e-08,
+ "loss": 0.0803,
+ "step": 35135
+ },
+ {
+ "epoch": 95.73841961852861,
+ "grad_norm": 2.162994623184204,
+ "learning_rate": 9.509946942135916e-08,
+ "loss": 0.0482,
+ "step": 35136
+ },
+ {
+ "epoch": 95.74114441416894,
+ "grad_norm": 3.5007174015045166,
+ "learning_rate": 9.497809053562901e-08,
+ "loss": 0.219,
+ "step": 35137
+ },
+ {
+ "epoch": 95.74386920980926,
+ "grad_norm": 2.6569952964782715,
+ "learning_rate": 9.485678878989102e-08,
+ "loss": 0.0795,
+ "step": 35138
+ },
+ {
+ "epoch": 95.7465940054496,
+ "grad_norm": 2.499392032623291,
+ "learning_rate": 9.473556418508889e-08,
+ "loss": 0.0744,
+ "step": 35139
+ },
+ {
+ "epoch": 95.74931880108991,
+ "grad_norm": 2.9137237071990967,
+ "learning_rate": 9.461441672216743e-08,
+ "loss": 0.0993,
+ "step": 35140
+ },
+ {
+ "epoch": 95.75204359673025,
+ "grad_norm": 1.7527599334716797,
+ "learning_rate": 9.449334640207031e-08,
+ "loss": 0.018,
+ "step": 35141
+ },
+ {
+ "epoch": 95.75476839237058,
+ "grad_norm": 2.412987470626831,
+ "learning_rate": 9.437235322574123e-08,
+ "loss": 0.0639,
+ "step": 35142
+ },
+ {
+ "epoch": 95.7574931880109,
+ "grad_norm": 2.5925357341766357,
+ "learning_rate": 9.425143719411945e-08,
+ "loss": 0.034,
+ "step": 35143
+ },
+ {
+ "epoch": 95.76021798365123,
+ "grad_norm": 2.732663154602051,
+ "learning_rate": 9.413059830814975e-08,
+ "loss": 0.0427,
+ "step": 35144
+ },
+ {
+ "epoch": 95.76294277929155,
+ "grad_norm": 3.209555149078369,
+ "learning_rate": 9.400983656877138e-08,
+ "loss": 0.0641,
+ "step": 35145
+ },
+ {
+ "epoch": 95.76566757493188,
+ "grad_norm": 1.7188575267791748,
+ "learning_rate": 9.388915197692694e-08,
+ "loss": 0.0236,
+ "step": 35146
+ },
+ {
+ "epoch": 95.7683923705722,
+ "grad_norm": 2.841384172439575,
+ "learning_rate": 9.376854453355455e-08,
+ "loss": 0.0549,
+ "step": 35147
+ },
+ {
+ "epoch": 95.77111716621253,
+ "grad_norm": 3.503021717071533,
+ "learning_rate": 9.364801423959235e-08,
+ "loss": 0.0352,
+ "step": 35148
+ },
+ {
+ "epoch": 95.77384196185287,
+ "grad_norm": 2.6008212566375732,
+ "learning_rate": 9.352756109598183e-08,
+ "loss": 0.0562,
+ "step": 35149
+ },
+ {
+ "epoch": 95.77656675749319,
+ "grad_norm": 2.5199153423309326,
+ "learning_rate": 9.340718510365998e-08,
+ "loss": 0.0309,
+ "step": 35150
+ },
+ {
+ "epoch": 95.77929155313352,
+ "grad_norm": 1.8979390859603882,
+ "learning_rate": 9.328688626356497e-08,
+ "loss": 0.0221,
+ "step": 35151
+ },
+ {
+ "epoch": 95.78201634877384,
+ "grad_norm": 6.1602983474731445,
+ "learning_rate": 9.316666457663048e-08,
+ "loss": 0.1581,
+ "step": 35152
+ },
+ {
+ "epoch": 95.78474114441417,
+ "grad_norm": 2.225799083709717,
+ "learning_rate": 9.304652004379689e-08,
+ "loss": 0.1517,
+ "step": 35153
+ },
+ {
+ "epoch": 95.7874659400545,
+ "grad_norm": 1.7097855806350708,
+ "learning_rate": 9.292645266599787e-08,
+ "loss": 0.0147,
+ "step": 35154
+ },
+ {
+ "epoch": 95.79019073569482,
+ "grad_norm": 2.0193722248077393,
+ "learning_rate": 9.280646244416936e-08,
+ "loss": 0.0239,
+ "step": 35155
+ },
+ {
+ "epoch": 95.79291553133515,
+ "grad_norm": 1.4210405349731445,
+ "learning_rate": 9.268654937924393e-08,
+ "loss": 0.0171,
+ "step": 35156
+ },
+ {
+ "epoch": 95.79564032697547,
+ "grad_norm": 1.6739972829818726,
+ "learning_rate": 9.256671347215751e-08,
+ "loss": 0.0285,
+ "step": 35157
+ },
+ {
+ "epoch": 95.7983651226158,
+ "grad_norm": 3.580216884613037,
+ "learning_rate": 9.244695472384268e-08,
+ "loss": 0.1765,
+ "step": 35158
+ },
+ {
+ "epoch": 95.80108991825612,
+ "grad_norm": 3.1134626865386963,
+ "learning_rate": 9.232727313523204e-08,
+ "loss": 0.0541,
+ "step": 35159
+ },
+ {
+ "epoch": 95.80381471389646,
+ "grad_norm": 2.7235796451568604,
+ "learning_rate": 9.220766870725705e-08,
+ "loss": 0.0528,
+ "step": 35160
+ },
+ {
+ "epoch": 95.80653950953679,
+ "grad_norm": 2.136178970336914,
+ "learning_rate": 9.208814144085032e-08,
+ "loss": 0.0256,
+ "step": 35161
+ },
+ {
+ "epoch": 95.80926430517711,
+ "grad_norm": 2.6942789554595947,
+ "learning_rate": 9.19686913369422e-08,
+ "loss": 0.0469,
+ "step": 35162
+ },
+ {
+ "epoch": 95.81198910081744,
+ "grad_norm": 2.219843626022339,
+ "learning_rate": 9.184931839646417e-08,
+ "loss": 0.1022,
+ "step": 35163
+ },
+ {
+ "epoch": 95.81471389645776,
+ "grad_norm": 2.1608901023864746,
+ "learning_rate": 9.173002262034326e-08,
+ "loss": 0.0179,
+ "step": 35164
+ },
+ {
+ "epoch": 95.8174386920981,
+ "grad_norm": 1.7062442302703857,
+ "learning_rate": 9.161080400951095e-08,
+ "loss": 0.0196,
+ "step": 35165
+ },
+ {
+ "epoch": 95.82016348773843,
+ "grad_norm": 2.1895999908447266,
+ "learning_rate": 9.149166256489428e-08,
+ "loss": 0.0239,
+ "step": 35166
+ },
+ {
+ "epoch": 95.82288828337875,
+ "grad_norm": 2.4063527584075928,
+ "learning_rate": 9.13725982874214e-08,
+ "loss": 0.0263,
+ "step": 35167
+ },
+ {
+ "epoch": 95.82561307901908,
+ "grad_norm": 2.45184326171875,
+ "learning_rate": 9.125361117802045e-08,
+ "loss": 0.0287,
+ "step": 35168
+ },
+ {
+ "epoch": 95.8283378746594,
+ "grad_norm": 2.480238437652588,
+ "learning_rate": 9.113470123761736e-08,
+ "loss": 0.1217,
+ "step": 35169
+ },
+ {
+ "epoch": 95.83106267029973,
+ "grad_norm": 1.7759056091308594,
+ "learning_rate": 9.101586846713806e-08,
+ "loss": 0.0375,
+ "step": 35170
+ },
+ {
+ "epoch": 95.83378746594005,
+ "grad_norm": 3.341256856918335,
+ "learning_rate": 9.089711286750847e-08,
+ "loss": 0.0796,
+ "step": 35171
+ },
+ {
+ "epoch": 95.83651226158038,
+ "grad_norm": 2.291745185852051,
+ "learning_rate": 9.077843443965229e-08,
+ "loss": 0.0355,
+ "step": 35172
+ },
+ {
+ "epoch": 95.83923705722071,
+ "grad_norm": 2.4249584674835205,
+ "learning_rate": 9.065983318449656e-08,
+ "loss": 0.0615,
+ "step": 35173
+ },
+ {
+ "epoch": 95.84196185286103,
+ "grad_norm": 1.8145699501037598,
+ "learning_rate": 9.054130910296166e-08,
+ "loss": 0.043,
+ "step": 35174
+ },
+ {
+ "epoch": 95.84468664850137,
+ "grad_norm": 3.3663463592529297,
+ "learning_rate": 9.042286219597352e-08,
+ "loss": 0.0606,
+ "step": 35175
+ },
+ {
+ "epoch": 95.84741144414168,
+ "grad_norm": 2.636873722076416,
+ "learning_rate": 9.030449246445139e-08,
+ "loss": 0.0606,
+ "step": 35176
+ },
+ {
+ "epoch": 95.85013623978202,
+ "grad_norm": 4.4239959716796875,
+ "learning_rate": 9.018619990932009e-08,
+ "loss": 0.0872,
+ "step": 35177
+ },
+ {
+ "epoch": 95.85286103542235,
+ "grad_norm": 3.954174757003784,
+ "learning_rate": 9.00679845314989e-08,
+ "loss": 0.0411,
+ "step": 35178
+ },
+ {
+ "epoch": 95.85558583106267,
+ "grad_norm": 2.208061933517456,
+ "learning_rate": 8.99498463319104e-08,
+ "loss": 0.0258,
+ "step": 35179
+ },
+ {
+ "epoch": 95.858310626703,
+ "grad_norm": 2.1602532863616943,
+ "learning_rate": 8.983178531147274e-08,
+ "loss": 0.0322,
+ "step": 35180
+ },
+ {
+ "epoch": 95.86103542234332,
+ "grad_norm": 2.9143776893615723,
+ "learning_rate": 8.971380147110632e-08,
+ "loss": 0.0405,
+ "step": 35181
+ },
+ {
+ "epoch": 95.86376021798365,
+ "grad_norm": 1.969183325767517,
+ "learning_rate": 8.959589481172925e-08,
+ "loss": 0.0227,
+ "step": 35182
+ },
+ {
+ "epoch": 95.86648501362397,
+ "grad_norm": 3.16774320602417,
+ "learning_rate": 8.947806533426195e-08,
+ "loss": 0.0354,
+ "step": 35183
+ },
+ {
+ "epoch": 95.8692098092643,
+ "grad_norm": 1.8806781768798828,
+ "learning_rate": 8.936031303961922e-08,
+ "loss": 0.0323,
+ "step": 35184
+ },
+ {
+ "epoch": 95.87193460490464,
+ "grad_norm": 3.9964778423309326,
+ "learning_rate": 8.924263792872035e-08,
+ "loss": 0.066,
+ "step": 35185
+ },
+ {
+ "epoch": 95.87465940054496,
+ "grad_norm": 1.8949394226074219,
+ "learning_rate": 8.912504000248012e-08,
+ "loss": 0.0278,
+ "step": 35186
+ },
+ {
+ "epoch": 95.87738419618529,
+ "grad_norm": 2.26131010055542,
+ "learning_rate": 8.900751926181561e-08,
+ "loss": 0.0507,
+ "step": 35187
+ },
+ {
+ "epoch": 95.88010899182561,
+ "grad_norm": 3.028347969055176,
+ "learning_rate": 8.889007570764052e-08,
+ "loss": 0.0646,
+ "step": 35188
+ },
+ {
+ "epoch": 95.88283378746594,
+ "grad_norm": 2.306881904602051,
+ "learning_rate": 8.87727093408708e-08,
+ "loss": 0.0378,
+ "step": 35189
+ },
+ {
+ "epoch": 95.88555858310627,
+ "grad_norm": 1.7207473516464233,
+ "learning_rate": 8.865542016242124e-08,
+ "loss": 0.0357,
+ "step": 35190
+ },
+ {
+ "epoch": 95.88828337874659,
+ "grad_norm": 2.7475287914276123,
+ "learning_rate": 8.853820817320447e-08,
+ "loss": 0.13,
+ "step": 35191
+ },
+ {
+ "epoch": 95.89100817438693,
+ "grad_norm": 1.9305124282836914,
+ "learning_rate": 8.842107337413197e-08,
+ "loss": 0.0186,
+ "step": 35192
+ },
+ {
+ "epoch": 95.89373297002724,
+ "grad_norm": 3.2990758419036865,
+ "learning_rate": 8.830401576611747e-08,
+ "loss": 0.0805,
+ "step": 35193
+ },
+ {
+ "epoch": 95.89645776566758,
+ "grad_norm": 2.719024658203125,
+ "learning_rate": 8.818703535007245e-08,
+ "loss": 0.029,
+ "step": 35194
+ },
+ {
+ "epoch": 95.8991825613079,
+ "grad_norm": 2.380613327026367,
+ "learning_rate": 8.807013212690729e-08,
+ "loss": 0.0452,
+ "step": 35195
+ },
+ {
+ "epoch": 95.90190735694823,
+ "grad_norm": 2.605151653289795,
+ "learning_rate": 8.795330609753349e-08,
+ "loss": 0.088,
+ "step": 35196
+ },
+ {
+ "epoch": 95.90463215258856,
+ "grad_norm": 2.2973361015319824,
+ "learning_rate": 8.783655726285922e-08,
+ "loss": 0.0336,
+ "step": 35197
+ },
+ {
+ "epoch": 95.90735694822888,
+ "grad_norm": 1.9996578693389893,
+ "learning_rate": 8.771988562379596e-08,
+ "loss": 0.0179,
+ "step": 35198
+ },
+ {
+ "epoch": 95.91008174386921,
+ "grad_norm": 3.072854518890381,
+ "learning_rate": 8.760329118125189e-08,
+ "loss": 0.0742,
+ "step": 35199
+ },
+ {
+ "epoch": 95.91280653950953,
+ "grad_norm": 2.327976703643799,
+ "learning_rate": 8.748677393613292e-08,
+ "loss": 0.0356,
+ "step": 35200
+ },
+ {
+ "epoch": 95.91553133514986,
+ "grad_norm": 2.217430591583252,
+ "learning_rate": 8.737033388934834e-08,
+ "loss": 0.0746,
+ "step": 35201
+ },
+ {
+ "epoch": 95.9182561307902,
+ "grad_norm": 2.879448413848877,
+ "learning_rate": 8.725397104180521e-08,
+ "loss": 0.0832,
+ "step": 35202
+ },
+ {
+ "epoch": 95.92098092643052,
+ "grad_norm": 1.991579294204712,
+ "learning_rate": 8.713768539440836e-08,
+ "loss": 0.0212,
+ "step": 35203
+ },
+ {
+ "epoch": 95.92370572207085,
+ "grad_norm": 3.104318380355835,
+ "learning_rate": 8.702147694806484e-08,
+ "loss": 0.0521,
+ "step": 35204
+ },
+ {
+ "epoch": 95.92643051771117,
+ "grad_norm": 6.036311149597168,
+ "learning_rate": 8.690534570367837e-08,
+ "loss": 0.0264,
+ "step": 35205
+ },
+ {
+ "epoch": 95.9291553133515,
+ "grad_norm": 2.8335986137390137,
+ "learning_rate": 8.678929166215377e-08,
+ "loss": 0.03,
+ "step": 35206
+ },
+ {
+ "epoch": 95.93188010899182,
+ "grad_norm": 2.896843910217285,
+ "learning_rate": 8.66733148243959e-08,
+ "loss": 0.0449,
+ "step": 35207
+ },
+ {
+ "epoch": 95.93460490463215,
+ "grad_norm": 2.7111401557922363,
+ "learning_rate": 8.655741519130622e-08,
+ "loss": 0.0224,
+ "step": 35208
+ },
+ {
+ "epoch": 95.93732970027249,
+ "grad_norm": 2.886784315109253,
+ "learning_rate": 8.644159276378961e-08,
+ "loss": 0.0323,
+ "step": 35209
+ },
+ {
+ "epoch": 95.9400544959128,
+ "grad_norm": 2.641713857650757,
+ "learning_rate": 8.632584754274642e-08,
+ "loss": 0.0948,
+ "step": 35210
+ },
+ {
+ "epoch": 95.94277929155314,
+ "grad_norm": 9.331111907958984,
+ "learning_rate": 8.621017952907817e-08,
+ "loss": 0.112,
+ "step": 35211
+ },
+ {
+ "epoch": 95.94550408719346,
+ "grad_norm": 2.2131526470184326,
+ "learning_rate": 8.609458872368526e-08,
+ "loss": 0.0623,
+ "step": 35212
+ },
+ {
+ "epoch": 95.94822888283379,
+ "grad_norm": 13.232500076293945,
+ "learning_rate": 8.597907512746917e-08,
+ "loss": 0.0298,
+ "step": 35213
+ },
+ {
+ "epoch": 95.95095367847412,
+ "grad_norm": 2.437865734100342,
+ "learning_rate": 8.58636387413292e-08,
+ "loss": 0.0221,
+ "step": 35214
+ },
+ {
+ "epoch": 95.95367847411444,
+ "grad_norm": 2.714003324508667,
+ "learning_rate": 8.57482795661646e-08,
+ "loss": 0.0283,
+ "step": 35215
+ },
+ {
+ "epoch": 95.95640326975477,
+ "grad_norm": 2.802816867828369,
+ "learning_rate": 8.563299760287358e-08,
+ "loss": 0.2306,
+ "step": 35216
+ },
+ {
+ "epoch": 95.95912806539509,
+ "grad_norm": 2.068948268890381,
+ "learning_rate": 8.551779285235206e-08,
+ "loss": 0.0736,
+ "step": 35217
+ },
+ {
+ "epoch": 95.96185286103542,
+ "grad_norm": 2.125474452972412,
+ "learning_rate": 8.540266531549934e-08,
+ "loss": 0.0278,
+ "step": 35218
+ },
+ {
+ "epoch": 95.96457765667574,
+ "grad_norm": 2.1596126556396484,
+ "learning_rate": 8.528761499321247e-08,
+ "loss": 0.1153,
+ "step": 35219
+ },
+ {
+ "epoch": 95.96730245231608,
+ "grad_norm": 3.537027597427368,
+ "learning_rate": 8.51726418863863e-08,
+ "loss": 0.0246,
+ "step": 35220
+ },
+ {
+ "epoch": 95.97002724795641,
+ "grad_norm": 2.5084664821624756,
+ "learning_rate": 8.505774599591566e-08,
+ "loss": 0.0961,
+ "step": 35221
+ },
+ {
+ "epoch": 95.97275204359673,
+ "grad_norm": 3.3551576137542725,
+ "learning_rate": 8.49429273226976e-08,
+ "loss": 0.0367,
+ "step": 35222
+ },
+ {
+ "epoch": 95.97547683923706,
+ "grad_norm": 1.8011064529418945,
+ "learning_rate": 8.482818586762365e-08,
+ "loss": 0.085,
+ "step": 35223
+ },
+ {
+ "epoch": 95.97820163487738,
+ "grad_norm": 3.4674816131591797,
+ "learning_rate": 8.471352163158974e-08,
+ "loss": 0.0311,
+ "step": 35224
+ },
+ {
+ "epoch": 95.98092643051771,
+ "grad_norm": 4.035762310028076,
+ "learning_rate": 8.45989346154863e-08,
+ "loss": 0.0504,
+ "step": 35225
+ },
+ {
+ "epoch": 95.98365122615803,
+ "grad_norm": 2.319643020629883,
+ "learning_rate": 8.448442482020814e-08,
+ "loss": 0.0291,
+ "step": 35226
+ },
+ {
+ "epoch": 95.98637602179836,
+ "grad_norm": 2.304887533187866,
+ "learning_rate": 8.436999224664677e-08,
+ "loss": 0.1227,
+ "step": 35227
+ },
+ {
+ "epoch": 95.9891008174387,
+ "grad_norm": 3.8282926082611084,
+ "learning_rate": 8.42556368956915e-08,
+ "loss": 0.03,
+ "step": 35228
+ },
+ {
+ "epoch": 95.99182561307902,
+ "grad_norm": 1.3371766805648804,
+ "learning_rate": 8.414135876823382e-08,
+ "loss": 0.0232,
+ "step": 35229
+ },
+ {
+ "epoch": 95.99455040871935,
+ "grad_norm": 2.040874719619751,
+ "learning_rate": 8.402715786516524e-08,
+ "loss": 0.0617,
+ "step": 35230
+ },
+ {
+ "epoch": 95.99727520435967,
+ "grad_norm": 3.1709978580474854,
+ "learning_rate": 8.391303418737395e-08,
+ "loss": 0.1659,
+ "step": 35231
+ },
+ {
+ "epoch": 96.0,
+ "grad_norm": 2.1919538974761963,
+ "learning_rate": 8.379898773574924e-08,
+ "loss": 0.0646,
+ "step": 35232
+ },
+ {
+ "epoch": 96.00272479564033,
+ "grad_norm": 2.3267288208007812,
+ "learning_rate": 8.368501851117816e-08,
+ "loss": 0.0264,
+ "step": 35233
+ },
+ {
+ "epoch": 96.00544959128065,
+ "grad_norm": 2.963054656982422,
+ "learning_rate": 8.357112651454891e-08,
+ "loss": 0.0735,
+ "step": 35234
+ },
+ {
+ "epoch": 96.00817438692098,
+ "grad_norm": 2.328134298324585,
+ "learning_rate": 8.345731174674854e-08,
+ "loss": 0.06,
+ "step": 35235
+ },
+ {
+ "epoch": 96.0108991825613,
+ "grad_norm": 2.6362593173980713,
+ "learning_rate": 8.334357420866413e-08,
+ "loss": 0.0876,
+ "step": 35236
+ },
+ {
+ "epoch": 96.01362397820164,
+ "grad_norm": 2.74820876121521,
+ "learning_rate": 8.322991390117941e-08,
+ "loss": 0.072,
+ "step": 35237
+ },
+ {
+ "epoch": 96.01634877384195,
+ "grad_norm": 3.324258804321289,
+ "learning_rate": 8.311633082518256e-08,
+ "loss": 0.0661,
+ "step": 35238
+ },
+ {
+ "epoch": 96.01907356948229,
+ "grad_norm": 1.7469960451126099,
+ "learning_rate": 8.300282498155621e-08,
+ "loss": 0.0268,
+ "step": 35239
+ },
+ {
+ "epoch": 96.02179836512262,
+ "grad_norm": 3.1011860370635986,
+ "learning_rate": 8.28893963711841e-08,
+ "loss": 0.0396,
+ "step": 35240
+ },
+ {
+ "epoch": 96.02452316076294,
+ "grad_norm": 4.629014492034912,
+ "learning_rate": 8.277604499494995e-08,
+ "loss": 0.0416,
+ "step": 35241
+ },
+ {
+ "epoch": 96.02724795640327,
+ "grad_norm": 4.329613208770752,
+ "learning_rate": 8.266277085373753e-08,
+ "loss": 0.0248,
+ "step": 35242
+ },
+ {
+ "epoch": 96.02997275204359,
+ "grad_norm": 1.7718288898468018,
+ "learning_rate": 8.254957394842833e-08,
+ "loss": 0.0278,
+ "step": 35243
+ },
+ {
+ "epoch": 96.03269754768392,
+ "grad_norm": 3.014353036880493,
+ "learning_rate": 8.243645427990388e-08,
+ "loss": 0.0374,
+ "step": 35244
+ },
+ {
+ "epoch": 96.03542234332426,
+ "grad_norm": 2.291088104248047,
+ "learning_rate": 8.232341184904458e-08,
+ "loss": 0.0224,
+ "step": 35245
+ },
+ {
+ "epoch": 96.03814713896458,
+ "grad_norm": 3.4260973930358887,
+ "learning_rate": 8.221044665673194e-08,
+ "loss": 0.0697,
+ "step": 35246
+ },
+ {
+ "epoch": 96.04087193460491,
+ "grad_norm": 4.077487468719482,
+ "learning_rate": 8.209755870384417e-08,
+ "loss": 0.2125,
+ "step": 35247
+ },
+ {
+ "epoch": 96.04359673024523,
+ "grad_norm": 2.3869411945343018,
+ "learning_rate": 8.198474799126167e-08,
+ "loss": 0.0244,
+ "step": 35248
+ },
+ {
+ "epoch": 96.04632152588556,
+ "grad_norm": 4.090585231781006,
+ "learning_rate": 8.18720145198626e-08,
+ "loss": 0.0387,
+ "step": 35249
+ },
+ {
+ "epoch": 96.04904632152588,
+ "grad_norm": 2.4099318981170654,
+ "learning_rate": 8.175935829052628e-08,
+ "loss": 0.0259,
+ "step": 35250
+ },
+ {
+ "epoch": 96.05177111716621,
+ "grad_norm": 4.118835926055908,
+ "learning_rate": 8.164677930412867e-08,
+ "loss": 0.058,
+ "step": 35251
+ },
+ {
+ "epoch": 96.05449591280654,
+ "grad_norm": 3.0008699893951416,
+ "learning_rate": 8.153427756154575e-08,
+ "loss": 0.0624,
+ "step": 35252
+ },
+ {
+ "epoch": 96.05722070844686,
+ "grad_norm": 3.927640914916992,
+ "learning_rate": 8.142185306365457e-08,
+ "loss": 0.1975,
+ "step": 35253
+ },
+ {
+ "epoch": 96.0599455040872,
+ "grad_norm": 3.217844247817993,
+ "learning_rate": 8.130950581133113e-08,
+ "loss": 0.0537,
+ "step": 35254
+ },
+ {
+ "epoch": 96.06267029972751,
+ "grad_norm": 2.599726915359497,
+ "learning_rate": 8.119723580545136e-08,
+ "loss": 0.0254,
+ "step": 35255
+ },
+ {
+ "epoch": 96.06539509536785,
+ "grad_norm": 2.5743327140808105,
+ "learning_rate": 8.10850430468868e-08,
+ "loss": 0.1085,
+ "step": 35256
+ },
+ {
+ "epoch": 96.06811989100818,
+ "grad_norm": 1.2380759716033936,
+ "learning_rate": 8.097292753651232e-08,
+ "loss": 0.0119,
+ "step": 35257
+ },
+ {
+ "epoch": 96.0708446866485,
+ "grad_norm": 1.8359806537628174,
+ "learning_rate": 8.086088927520274e-08,
+ "loss": 0.0208,
+ "step": 35258
+ },
+ {
+ "epoch": 96.07356948228883,
+ "grad_norm": 2.276522159576416,
+ "learning_rate": 8.074892826382852e-08,
+ "loss": 0.1583,
+ "step": 35259
+ },
+ {
+ "epoch": 96.07629427792915,
+ "grad_norm": 2.629805564880371,
+ "learning_rate": 8.063704450326227e-08,
+ "loss": 0.044,
+ "step": 35260
+ },
+ {
+ "epoch": 96.07901907356948,
+ "grad_norm": 2.550387144088745,
+ "learning_rate": 8.052523799437551e-08,
+ "loss": 0.0405,
+ "step": 35261
+ },
+ {
+ "epoch": 96.0817438692098,
+ "grad_norm": 2.132642984390259,
+ "learning_rate": 8.041350873803978e-08,
+ "loss": 0.1068,
+ "step": 35262
+ },
+ {
+ "epoch": 96.08446866485014,
+ "grad_norm": 2.0799076557159424,
+ "learning_rate": 8.030185673512325e-08,
+ "loss": 0.036,
+ "step": 35263
+ },
+ {
+ "epoch": 96.08719346049047,
+ "grad_norm": 2.644192934036255,
+ "learning_rate": 8.019028198649747e-08,
+ "loss": 0.0634,
+ "step": 35264
+ },
+ {
+ "epoch": 96.08991825613079,
+ "grad_norm": 1.6757255792617798,
+ "learning_rate": 8.007878449303064e-08,
+ "loss": 0.021,
+ "step": 35265
+ },
+ {
+ "epoch": 96.09264305177112,
+ "grad_norm": 2.489243745803833,
+ "learning_rate": 7.996736425558982e-08,
+ "loss": 0.0435,
+ "step": 35266
+ },
+ {
+ "epoch": 96.09536784741144,
+ "grad_norm": 2.456620216369629,
+ "learning_rate": 7.985602127504432e-08,
+ "loss": 0.0319,
+ "step": 35267
+ },
+ {
+ "epoch": 96.09809264305177,
+ "grad_norm": 2.1677346229553223,
+ "learning_rate": 7.974475555226125e-08,
+ "loss": 0.0727,
+ "step": 35268
+ },
+ {
+ "epoch": 96.1008174386921,
+ "grad_norm": 2.95621395111084,
+ "learning_rate": 7.963356708810654e-08,
+ "loss": 0.0398,
+ "step": 35269
+ },
+ {
+ "epoch": 96.10354223433242,
+ "grad_norm": 2.322218894958496,
+ "learning_rate": 7.95224558834462e-08,
+ "loss": 0.0707,
+ "step": 35270
+ },
+ {
+ "epoch": 96.10626702997276,
+ "grad_norm": 2.460341215133667,
+ "learning_rate": 7.941142193914619e-08,
+ "loss": 0.079,
+ "step": 35271
+ },
+ {
+ "epoch": 96.10899182561307,
+ "grad_norm": 2.0585649013519287,
+ "learning_rate": 7.930046525607027e-08,
+ "loss": 0.0339,
+ "step": 35272
+ },
+ {
+ "epoch": 96.11171662125341,
+ "grad_norm": 3.2247707843780518,
+ "learning_rate": 7.91895858350833e-08,
+ "loss": 0.0878,
+ "step": 35273
+ },
+ {
+ "epoch": 96.11444141689373,
+ "grad_norm": 4.812054634094238,
+ "learning_rate": 7.907878367704791e-08,
+ "loss": 0.0203,
+ "step": 35274
+ },
+ {
+ "epoch": 96.11716621253406,
+ "grad_norm": 2.8286547660827637,
+ "learning_rate": 7.896805878282898e-08,
+ "loss": 0.1109,
+ "step": 35275
+ },
+ {
+ "epoch": 96.11989100817439,
+ "grad_norm": 2.2864203453063965,
+ "learning_rate": 7.885741115328583e-08,
+ "loss": 0.1572,
+ "step": 35276
+ },
+ {
+ "epoch": 96.12261580381471,
+ "grad_norm": 2.099889039993286,
+ "learning_rate": 7.87468407892833e-08,
+ "loss": 0.0327,
+ "step": 35277
+ },
+ {
+ "epoch": 96.12534059945504,
+ "grad_norm": 4.798058986663818,
+ "learning_rate": 7.86363476916796e-08,
+ "loss": 0.0607,
+ "step": 35278
+ },
+ {
+ "epoch": 96.12806539509536,
+ "grad_norm": 2.89988374710083,
+ "learning_rate": 7.85259318613385e-08,
+ "loss": 0.0352,
+ "step": 35279
+ },
+ {
+ "epoch": 96.1307901907357,
+ "grad_norm": 2.715339422225952,
+ "learning_rate": 7.841559329911707e-08,
+ "loss": 0.1212,
+ "step": 35280
+ },
+ {
+ "epoch": 96.13351498637603,
+ "grad_norm": 4.634676456451416,
+ "learning_rate": 7.830533200587576e-08,
+ "loss": 0.0354,
+ "step": 35281
+ },
+ {
+ "epoch": 96.13623978201635,
+ "grad_norm": 4.271185874938965,
+ "learning_rate": 7.819514798247274e-08,
+ "loss": 0.2337,
+ "step": 35282
+ },
+ {
+ "epoch": 96.13896457765668,
+ "grad_norm": 1.6097041368484497,
+ "learning_rate": 7.808504122976624e-08,
+ "loss": 0.0233,
+ "step": 35283
+ },
+ {
+ "epoch": 96.141689373297,
+ "grad_norm": 4.050378799438477,
+ "learning_rate": 7.797501174861555e-08,
+ "loss": 0.1224,
+ "step": 35284
+ },
+ {
+ "epoch": 96.14441416893733,
+ "grad_norm": 2.521028518676758,
+ "learning_rate": 7.786505953987555e-08,
+ "loss": 0.056,
+ "step": 35285
+ },
+ {
+ "epoch": 96.14713896457765,
+ "grad_norm": 25.072004318237305,
+ "learning_rate": 7.775518460440223e-08,
+ "loss": 0.0674,
+ "step": 35286
+ },
+ {
+ "epoch": 96.14986376021798,
+ "grad_norm": 2.9250643253326416,
+ "learning_rate": 7.76453869430538e-08,
+ "loss": 0.0462,
+ "step": 35287
+ },
+ {
+ "epoch": 96.15258855585832,
+ "grad_norm": 2.3465731143951416,
+ "learning_rate": 7.753566655668287e-08,
+ "loss": 0.0944,
+ "step": 35288
+ },
+ {
+ "epoch": 96.15531335149863,
+ "grad_norm": 1.7991676330566406,
+ "learning_rate": 7.742602344614547e-08,
+ "loss": 0.0267,
+ "step": 35289
+ },
+ {
+ "epoch": 96.15803814713897,
+ "grad_norm": 3.252142906188965,
+ "learning_rate": 7.731645761229311e-08,
+ "loss": 0.0387,
+ "step": 35290
+ },
+ {
+ "epoch": 96.16076294277929,
+ "grad_norm": 2.0888664722442627,
+ "learning_rate": 7.72069690559829e-08,
+ "loss": 0.0694,
+ "step": 35291
+ },
+ {
+ "epoch": 96.16348773841962,
+ "grad_norm": 2.0460405349731445,
+ "learning_rate": 7.709755777806416e-08,
+ "loss": 0.0224,
+ "step": 35292
+ },
+ {
+ "epoch": 96.16621253405995,
+ "grad_norm": 3.1798970699310303,
+ "learning_rate": 7.698822377939063e-08,
+ "loss": 0.0712,
+ "step": 35293
+ },
+ {
+ "epoch": 96.16893732970027,
+ "grad_norm": 1.9900087118148804,
+ "learning_rate": 7.687896706081388e-08,
+ "loss": 0.0159,
+ "step": 35294
+ },
+ {
+ "epoch": 96.1716621253406,
+ "grad_norm": 1.9430514574050903,
+ "learning_rate": 7.676978762318321e-08,
+ "loss": 0.0301,
+ "step": 35295
+ },
+ {
+ "epoch": 96.17438692098092,
+ "grad_norm": 2.5412027835845947,
+ "learning_rate": 7.666068546735129e-08,
+ "loss": 0.0431,
+ "step": 35296
+ },
+ {
+ "epoch": 96.17711171662125,
+ "grad_norm": 2.8897788524627686,
+ "learning_rate": 7.655166059416519e-08,
+ "loss": 0.065,
+ "step": 35297
+ },
+ {
+ "epoch": 96.17983651226157,
+ "grad_norm": 2.243454694747925,
+ "learning_rate": 7.644271300447647e-08,
+ "loss": 0.0358,
+ "step": 35298
+ },
+ {
+ "epoch": 96.1825613079019,
+ "grad_norm": 2.231678009033203,
+ "learning_rate": 7.633384269913224e-08,
+ "loss": 0.034,
+ "step": 35299
+ },
+ {
+ "epoch": 96.18528610354224,
+ "grad_norm": 3.5967888832092285,
+ "learning_rate": 7.62250496789807e-08,
+ "loss": 0.1114,
+ "step": 35300
+ },
+ {
+ "epoch": 96.18801089918256,
+ "grad_norm": 2.564082384109497,
+ "learning_rate": 7.611633394487005e-08,
+ "loss": 0.1345,
+ "step": 35301
+ },
+ {
+ "epoch": 96.19073569482289,
+ "grad_norm": 2.419724941253662,
+ "learning_rate": 7.600769549764408e-08,
+ "loss": 0.0257,
+ "step": 35302
+ },
+ {
+ "epoch": 96.19346049046321,
+ "grad_norm": 2.611628770828247,
+ "learning_rate": 7.58991343381521e-08,
+ "loss": 0.028,
+ "step": 35303
+ },
+ {
+ "epoch": 96.19618528610354,
+ "grad_norm": 2.4860422611236572,
+ "learning_rate": 7.579065046723789e-08,
+ "loss": 0.0453,
+ "step": 35304
+ },
+ {
+ "epoch": 96.19891008174388,
+ "grad_norm": 2.565809965133667,
+ "learning_rate": 7.56822438857463e-08,
+ "loss": 0.102,
+ "step": 35305
+ },
+ {
+ "epoch": 96.2016348773842,
+ "grad_norm": 1.5890276432037354,
+ "learning_rate": 7.557391459452224e-08,
+ "loss": 0.0161,
+ "step": 35306
+ },
+ {
+ "epoch": 96.20435967302453,
+ "grad_norm": 4.1379923820495605,
+ "learning_rate": 7.546566259440946e-08,
+ "loss": 0.0432,
+ "step": 35307
+ },
+ {
+ "epoch": 96.20708446866485,
+ "grad_norm": 4.850417137145996,
+ "learning_rate": 7.535748788625064e-08,
+ "loss": 0.0348,
+ "step": 35308
+ },
+ {
+ "epoch": 96.20980926430518,
+ "grad_norm": 2.616990327835083,
+ "learning_rate": 7.524939047088842e-08,
+ "loss": 0.0663,
+ "step": 35309
+ },
+ {
+ "epoch": 96.2125340599455,
+ "grad_norm": 2.0257766246795654,
+ "learning_rate": 7.514137034916325e-08,
+ "loss": 0.1266,
+ "step": 35310
+ },
+ {
+ "epoch": 96.21525885558583,
+ "grad_norm": 2.8868000507354736,
+ "learning_rate": 7.503342752191889e-08,
+ "loss": 0.0744,
+ "step": 35311
+ },
+ {
+ "epoch": 96.21798365122616,
+ "grad_norm": 2.598789691925049,
+ "learning_rate": 7.492556198999468e-08,
+ "loss": 0.0324,
+ "step": 35312
+ },
+ {
+ "epoch": 96.22070844686648,
+ "grad_norm": 2.572842836380005,
+ "learning_rate": 7.481777375423105e-08,
+ "loss": 0.0398,
+ "step": 35313
+ },
+ {
+ "epoch": 96.22343324250681,
+ "grad_norm": 1.9657859802246094,
+ "learning_rate": 7.471006281546622e-08,
+ "loss": 0.0192,
+ "step": 35314
+ },
+ {
+ "epoch": 96.22615803814713,
+ "grad_norm": 2.165194034576416,
+ "learning_rate": 7.460242917453952e-08,
+ "loss": 0.0241,
+ "step": 35315
+ },
+ {
+ "epoch": 96.22888283378747,
+ "grad_norm": 3.8123340606689453,
+ "learning_rate": 7.44948728322914e-08,
+ "loss": 0.0253,
+ "step": 35316
+ },
+ {
+ "epoch": 96.2316076294278,
+ "grad_norm": 1.8331133127212524,
+ "learning_rate": 7.438739378955673e-08,
+ "loss": 0.0222,
+ "step": 35317
+ },
+ {
+ "epoch": 96.23433242506812,
+ "grad_norm": 3.504307508468628,
+ "learning_rate": 7.427999204717374e-08,
+ "loss": 0.1221,
+ "step": 35318
+ },
+ {
+ "epoch": 96.23705722070845,
+ "grad_norm": 4.067674160003662,
+ "learning_rate": 7.417266760597842e-08,
+ "loss": 0.0374,
+ "step": 35319
+ },
+ {
+ "epoch": 96.23978201634877,
+ "grad_norm": 2.9613125324249268,
+ "learning_rate": 7.406542046680787e-08,
+ "loss": 0.0277,
+ "step": 35320
+ },
+ {
+ "epoch": 96.2425068119891,
+ "grad_norm": 2.0485403537750244,
+ "learning_rate": 7.395825063049588e-08,
+ "loss": 0.0232,
+ "step": 35321
+ },
+ {
+ "epoch": 96.24523160762942,
+ "grad_norm": 2.219895124435425,
+ "learning_rate": 7.385115809787624e-08,
+ "loss": 0.0524,
+ "step": 35322
+ },
+ {
+ "epoch": 96.24795640326975,
+ "grad_norm": 4.913880825042725,
+ "learning_rate": 7.374414286978604e-08,
+ "loss": 0.0499,
+ "step": 35323
+ },
+ {
+ "epoch": 96.25068119891009,
+ "grad_norm": 3.1046810150146484,
+ "learning_rate": 7.363720494705684e-08,
+ "loss": 0.1162,
+ "step": 35324
+ },
+ {
+ "epoch": 96.2534059945504,
+ "grad_norm": 5.151793003082275,
+ "learning_rate": 7.353034433052131e-08,
+ "loss": 0.0428,
+ "step": 35325
+ },
+ {
+ "epoch": 96.25613079019074,
+ "grad_norm": 2.6411540508270264,
+ "learning_rate": 7.3423561021011e-08,
+ "loss": 0.1316,
+ "step": 35326
+ },
+ {
+ "epoch": 96.25885558583106,
+ "grad_norm": 3.530471086502075,
+ "learning_rate": 7.33168550193597e-08,
+ "loss": 0.0793,
+ "step": 35327
+ },
+ {
+ "epoch": 96.26158038147139,
+ "grad_norm": 2.105945110321045,
+ "learning_rate": 7.321022632639674e-08,
+ "loss": 0.0338,
+ "step": 35328
+ },
+ {
+ "epoch": 96.26430517711172,
+ "grad_norm": 2.030118465423584,
+ "learning_rate": 7.310367494295367e-08,
+ "loss": 0.037,
+ "step": 35329
+ },
+ {
+ "epoch": 96.26702997275204,
+ "grad_norm": 2.513051748275757,
+ "learning_rate": 7.299720086985872e-08,
+ "loss": 0.0529,
+ "step": 35330
+ },
+ {
+ "epoch": 96.26975476839237,
+ "grad_norm": 3.9353020191192627,
+ "learning_rate": 7.289080410794236e-08,
+ "loss": 0.0363,
+ "step": 35331
+ },
+ {
+ "epoch": 96.2724795640327,
+ "grad_norm": 2.9553170204162598,
+ "learning_rate": 7.27844846580339e-08,
+ "loss": 0.0526,
+ "step": 35332
+ },
+ {
+ "epoch": 96.27520435967303,
+ "grad_norm": 2.5372941493988037,
+ "learning_rate": 7.267824252095823e-08,
+ "loss": 0.0749,
+ "step": 35333
+ },
+ {
+ "epoch": 96.27792915531334,
+ "grad_norm": 3.0864951610565186,
+ "learning_rate": 7.257207769754693e-08,
+ "loss": 0.058,
+ "step": 35334
+ },
+ {
+ "epoch": 96.28065395095368,
+ "grad_norm": 2.306518077850342,
+ "learning_rate": 7.246599018862377e-08,
+ "loss": 0.1582,
+ "step": 35335
+ },
+ {
+ "epoch": 96.28337874659401,
+ "grad_norm": 2.6885318756103516,
+ "learning_rate": 7.235997999501587e-08,
+ "loss": 0.0749,
+ "step": 35336
+ },
+ {
+ "epoch": 96.28610354223433,
+ "grad_norm": 1.9896204471588135,
+ "learning_rate": 7.225404711755035e-08,
+ "loss": 0.0355,
+ "step": 35337
+ },
+ {
+ "epoch": 96.28882833787466,
+ "grad_norm": 2.0738072395324707,
+ "learning_rate": 7.214819155704878e-08,
+ "loss": 0.1249,
+ "step": 35338
+ },
+ {
+ "epoch": 96.29155313351498,
+ "grad_norm": 2.042652130126953,
+ "learning_rate": 7.204241331433936e-08,
+ "loss": 0.0216,
+ "step": 35339
+ },
+ {
+ "epoch": 96.29427792915531,
+ "grad_norm": 2.8200011253356934,
+ "learning_rate": 7.193671239024258e-08,
+ "loss": 0.0403,
+ "step": 35340
+ },
+ {
+ "epoch": 96.29700272479565,
+ "grad_norm": 1.7782176733016968,
+ "learning_rate": 7.183108878558443e-08,
+ "loss": 0.0862,
+ "step": 35341
+ },
+ {
+ "epoch": 96.29972752043597,
+ "grad_norm": 4.042399883270264,
+ "learning_rate": 7.172554250118535e-08,
+ "loss": 0.0868,
+ "step": 35342
+ },
+ {
+ "epoch": 96.3024523160763,
+ "grad_norm": 2.733473300933838,
+ "learning_rate": 7.162007353786915e-08,
+ "loss": 0.0798,
+ "step": 35343
+ },
+ {
+ "epoch": 96.30517711171662,
+ "grad_norm": 1.9620474576950073,
+ "learning_rate": 7.151468189645516e-08,
+ "loss": 0.0238,
+ "step": 35344
+ },
+ {
+ "epoch": 96.30790190735695,
+ "grad_norm": 3.0320639610290527,
+ "learning_rate": 7.140936757776607e-08,
+ "loss": 0.0498,
+ "step": 35345
+ },
+ {
+ "epoch": 96.31062670299727,
+ "grad_norm": 2.256063938140869,
+ "learning_rate": 7.13041305826201e-08,
+ "loss": 0.0794,
+ "step": 35346
+ },
+ {
+ "epoch": 96.3133514986376,
+ "grad_norm": 1.9673376083374023,
+ "learning_rate": 7.119897091183991e-08,
+ "loss": 0.0254,
+ "step": 35347
+ },
+ {
+ "epoch": 96.31607629427793,
+ "grad_norm": 3.04085373878479,
+ "learning_rate": 7.109388856624156e-08,
+ "loss": 0.0749,
+ "step": 35348
+ },
+ {
+ "epoch": 96.31880108991825,
+ "grad_norm": 2.1095919609069824,
+ "learning_rate": 7.098888354664435e-08,
+ "loss": 0.0812,
+ "step": 35349
+ },
+ {
+ "epoch": 96.32152588555859,
+ "grad_norm": 1.6618585586547852,
+ "learning_rate": 7.088395585386543e-08,
+ "loss": 0.0288,
+ "step": 35350
+ },
+ {
+ "epoch": 96.3242506811989,
+ "grad_norm": 3.0538253784179688,
+ "learning_rate": 7.077910548872303e-08,
+ "loss": 0.1133,
+ "step": 35351
+ },
+ {
+ "epoch": 96.32697547683924,
+ "grad_norm": 3.3978896141052246,
+ "learning_rate": 7.067433245203426e-08,
+ "loss": 0.0589,
+ "step": 35352
+ },
+ {
+ "epoch": 96.32970027247957,
+ "grad_norm": 4.375565528869629,
+ "learning_rate": 7.056963674461403e-08,
+ "loss": 0.0765,
+ "step": 35353
+ },
+ {
+ "epoch": 96.33242506811989,
+ "grad_norm": 5.209430694580078,
+ "learning_rate": 7.046501836727837e-08,
+ "loss": 0.0795,
+ "step": 35354
+ },
+ {
+ "epoch": 96.33514986376022,
+ "grad_norm": 2.466344118118286,
+ "learning_rate": 7.036047732083995e-08,
+ "loss": 0.0344,
+ "step": 35355
+ },
+ {
+ "epoch": 96.33787465940054,
+ "grad_norm": 2.28086519241333,
+ "learning_rate": 7.025601360611589e-08,
+ "loss": 0.0393,
+ "step": 35356
+ },
+ {
+ "epoch": 96.34059945504087,
+ "grad_norm": 1.84520423412323,
+ "learning_rate": 7.015162722391777e-08,
+ "loss": 0.0205,
+ "step": 35357
+ },
+ {
+ "epoch": 96.34332425068119,
+ "grad_norm": 2.9149668216705322,
+ "learning_rate": 7.004731817505939e-08,
+ "loss": 0.0349,
+ "step": 35358
+ },
+ {
+ "epoch": 96.34604904632153,
+ "grad_norm": 2.657827854156494,
+ "learning_rate": 6.994308646035342e-08,
+ "loss": 0.0487,
+ "step": 35359
+ },
+ {
+ "epoch": 96.34877384196186,
+ "grad_norm": 2.733856678009033,
+ "learning_rate": 6.983893208061032e-08,
+ "loss": 0.0278,
+ "step": 35360
+ },
+ {
+ "epoch": 96.35149863760218,
+ "grad_norm": 4.0479631423950195,
+ "learning_rate": 6.973485503664279e-08,
+ "loss": 0.1143,
+ "step": 35361
+ },
+ {
+ "epoch": 96.35422343324251,
+ "grad_norm": 1.9658021926879883,
+ "learning_rate": 6.963085532925906e-08,
+ "loss": 0.0263,
+ "step": 35362
+ },
+ {
+ "epoch": 96.35694822888283,
+ "grad_norm": 3.4346835613250732,
+ "learning_rate": 6.952693295927182e-08,
+ "loss": 0.0487,
+ "step": 35363
+ },
+ {
+ "epoch": 96.35967302452316,
+ "grad_norm": 2.051133394241333,
+ "learning_rate": 6.942308792748931e-08,
+ "loss": 0.0518,
+ "step": 35364
+ },
+ {
+ "epoch": 96.3623978201635,
+ "grad_norm": 2.170633316040039,
+ "learning_rate": 6.931932023471976e-08,
+ "loss": 0.0521,
+ "step": 35365
+ },
+ {
+ "epoch": 96.36512261580381,
+ "grad_norm": 2.4649534225463867,
+ "learning_rate": 6.921562988177144e-08,
+ "loss": 0.183,
+ "step": 35366
+ },
+ {
+ "epoch": 96.36784741144415,
+ "grad_norm": 2.149437427520752,
+ "learning_rate": 6.911201686945257e-08,
+ "loss": 0.0513,
+ "step": 35367
+ },
+ {
+ "epoch": 96.37057220708446,
+ "grad_norm": 2.6818723678588867,
+ "learning_rate": 6.90084811985703e-08,
+ "loss": 0.1554,
+ "step": 35368
+ },
+ {
+ "epoch": 96.3732970027248,
+ "grad_norm": 3.1670899391174316,
+ "learning_rate": 6.89050228699295e-08,
+ "loss": 0.0385,
+ "step": 35369
+ },
+ {
+ "epoch": 96.37602179836512,
+ "grad_norm": 2.5463054180145264,
+ "learning_rate": 6.880164188433735e-08,
+ "loss": 0.0399,
+ "step": 35370
+ },
+ {
+ "epoch": 96.37874659400545,
+ "grad_norm": 2.164754867553711,
+ "learning_rate": 6.869833824259764e-08,
+ "loss": 0.0319,
+ "step": 35371
+ },
+ {
+ "epoch": 96.38147138964578,
+ "grad_norm": 5.0746073722839355,
+ "learning_rate": 6.859511194551637e-08,
+ "loss": 0.2198,
+ "step": 35372
+ },
+ {
+ "epoch": 96.3841961852861,
+ "grad_norm": 3.267862319946289,
+ "learning_rate": 6.849196299389627e-08,
+ "loss": 0.024,
+ "step": 35373
+ },
+ {
+ "epoch": 96.38692098092643,
+ "grad_norm": 6.8015265464782715,
+ "learning_rate": 6.838889138854221e-08,
+ "loss": 0.0558,
+ "step": 35374
+ },
+ {
+ "epoch": 96.38964577656675,
+ "grad_norm": 2.5740325450897217,
+ "learning_rate": 6.828589713025358e-08,
+ "loss": 0.0218,
+ "step": 35375
+ },
+ {
+ "epoch": 96.39237057220708,
+ "grad_norm": 1.7000741958618164,
+ "learning_rate": 6.818298021983638e-08,
+ "loss": 0.0205,
+ "step": 35376
+ },
+ {
+ "epoch": 96.39509536784742,
+ "grad_norm": 2.4573564529418945,
+ "learning_rate": 6.808014065808998e-08,
+ "loss": 0.0443,
+ "step": 35377
+ },
+ {
+ "epoch": 96.39782016348774,
+ "grad_norm": 2.234182834625244,
+ "learning_rate": 6.797737844581709e-08,
+ "loss": 0.0831,
+ "step": 35378
+ },
+ {
+ "epoch": 96.40054495912807,
+ "grad_norm": 4.208703994750977,
+ "learning_rate": 6.787469358381483e-08,
+ "loss": 0.0444,
+ "step": 35379
+ },
+ {
+ "epoch": 96.40326975476839,
+ "grad_norm": 2.4536097049713135,
+ "learning_rate": 6.777208607288588e-08,
+ "loss": 0.0255,
+ "step": 35380
+ },
+ {
+ "epoch": 96.40599455040872,
+ "grad_norm": 2.6513986587524414,
+ "learning_rate": 6.76695559138274e-08,
+ "loss": 0.0863,
+ "step": 35381
+ },
+ {
+ "epoch": 96.40871934604904,
+ "grad_norm": 2.6731977462768555,
+ "learning_rate": 6.756710310743875e-08,
+ "loss": 0.0499,
+ "step": 35382
+ },
+ {
+ "epoch": 96.41144414168937,
+ "grad_norm": 2.5571868419647217,
+ "learning_rate": 6.746472765451928e-08,
+ "loss": 0.0251,
+ "step": 35383
+ },
+ {
+ "epoch": 96.4141689373297,
+ "grad_norm": 3.7371065616607666,
+ "learning_rate": 6.73624295558628e-08,
+ "loss": 0.0735,
+ "step": 35384
+ },
+ {
+ "epoch": 96.41689373297002,
+ "grad_norm": 1.3535984754562378,
+ "learning_rate": 6.72602088122698e-08,
+ "loss": 0.0155,
+ "step": 35385
+ },
+ {
+ "epoch": 96.41961852861036,
+ "grad_norm": 2.044111490249634,
+ "learning_rate": 6.715806542453407e-08,
+ "loss": 0.1439,
+ "step": 35386
+ },
+ {
+ "epoch": 96.42234332425068,
+ "grad_norm": 3.4099745750427246,
+ "learning_rate": 6.705599939345053e-08,
+ "loss": 0.0619,
+ "step": 35387
+ },
+ {
+ "epoch": 96.42506811989101,
+ "grad_norm": 2.2722225189208984,
+ "learning_rate": 6.695401071981633e-08,
+ "loss": 0.0918,
+ "step": 35388
+ },
+ {
+ "epoch": 96.42779291553134,
+ "grad_norm": 2.1422479152679443,
+ "learning_rate": 6.685209940442527e-08,
+ "loss": 0.0219,
+ "step": 35389
+ },
+ {
+ "epoch": 96.43051771117166,
+ "grad_norm": 2.9350244998931885,
+ "learning_rate": 6.675026544806895e-08,
+ "loss": 0.0816,
+ "step": 35390
+ },
+ {
+ "epoch": 96.433242506812,
+ "grad_norm": 2.466939926147461,
+ "learning_rate": 6.664850885154228e-08,
+ "loss": 0.0415,
+ "step": 35391
+ },
+ {
+ "epoch": 96.43596730245231,
+ "grad_norm": 3.0898635387420654,
+ "learning_rate": 6.654682961563797e-08,
+ "loss": 0.0723,
+ "step": 35392
+ },
+ {
+ "epoch": 96.43869209809264,
+ "grad_norm": 3.9820556640625,
+ "learning_rate": 6.644522774114648e-08,
+ "loss": 0.0964,
+ "step": 35393
+ },
+ {
+ "epoch": 96.44141689373296,
+ "grad_norm": 2.8883168697357178,
+ "learning_rate": 6.634370322886052e-08,
+ "loss": 0.04,
+ "step": 35394
+ },
+ {
+ "epoch": 96.4441416893733,
+ "grad_norm": 1.9567556381225586,
+ "learning_rate": 6.624225607956946e-08,
+ "loss": 0.0275,
+ "step": 35395
+ },
+ {
+ "epoch": 96.44686648501363,
+ "grad_norm": 1.7626467943191528,
+ "learning_rate": 6.614088629406379e-08,
+ "loss": 0.057,
+ "step": 35396
+ },
+ {
+ "epoch": 96.44959128065395,
+ "grad_norm": 1.9004507064819336,
+ "learning_rate": 6.603959387313397e-08,
+ "loss": 0.019,
+ "step": 35397
+ },
+ {
+ "epoch": 96.45231607629428,
+ "grad_norm": 2.021732807159424,
+ "learning_rate": 6.593837881756826e-08,
+ "loss": 0.0312,
+ "step": 35398
+ },
+ {
+ "epoch": 96.4550408719346,
+ "grad_norm": 2.7149088382720947,
+ "learning_rate": 6.583724112815382e-08,
+ "loss": 0.0346,
+ "step": 35399
+ },
+ {
+ "epoch": 96.45776566757493,
+ "grad_norm": 2.1930859088897705,
+ "learning_rate": 6.57361808056789e-08,
+ "loss": 0.034,
+ "step": 35400
+ },
+ {
+ "epoch": 96.46049046321527,
+ "grad_norm": 2.3776214122772217,
+ "learning_rate": 6.563519785093175e-08,
+ "loss": 0.0262,
+ "step": 35401
+ },
+ {
+ "epoch": 96.46321525885558,
+ "grad_norm": 3.6150803565979004,
+ "learning_rate": 6.553429226469732e-08,
+ "loss": 0.1215,
+ "step": 35402
+ },
+ {
+ "epoch": 96.46594005449592,
+ "grad_norm": 2.461015462875366,
+ "learning_rate": 6.543346404776274e-08,
+ "loss": 0.113,
+ "step": 35403
+ },
+ {
+ "epoch": 96.46866485013624,
+ "grad_norm": 2.3507983684539795,
+ "learning_rate": 6.533271320091183e-08,
+ "loss": 0.1221,
+ "step": 35404
+ },
+ {
+ "epoch": 96.47138964577657,
+ "grad_norm": 1.8498133420944214,
+ "learning_rate": 6.523203972493064e-08,
+ "loss": 0.0516,
+ "step": 35405
+ },
+ {
+ "epoch": 96.47411444141689,
+ "grad_norm": 5.818890571594238,
+ "learning_rate": 6.513144362060297e-08,
+ "loss": 0.0639,
+ "step": 35406
+ },
+ {
+ "epoch": 96.47683923705722,
+ "grad_norm": 1.764113426208496,
+ "learning_rate": 6.503092488871043e-08,
+ "loss": 0.0298,
+ "step": 35407
+ },
+ {
+ "epoch": 96.47956403269755,
+ "grad_norm": 3.480236053466797,
+ "learning_rate": 6.493048353003905e-08,
+ "loss": 0.0312,
+ "step": 35408
+ },
+ {
+ "epoch": 96.48228882833787,
+ "grad_norm": 3.6187903881073,
+ "learning_rate": 6.483011954536823e-08,
+ "loss": 0.0556,
+ "step": 35409
+ },
+ {
+ "epoch": 96.4850136239782,
+ "grad_norm": 2.8983848094940186,
+ "learning_rate": 6.472983293548063e-08,
+ "loss": 0.1239,
+ "step": 35410
+ },
+ {
+ "epoch": 96.48773841961852,
+ "grad_norm": 3.3406033515930176,
+ "learning_rate": 6.462962370115789e-08,
+ "loss": 0.0551,
+ "step": 35411
+ },
+ {
+ "epoch": 96.49046321525886,
+ "grad_norm": 2.954235315322876,
+ "learning_rate": 6.452949184317936e-08,
+ "loss": 0.0333,
+ "step": 35412
+ },
+ {
+ "epoch": 96.49318801089919,
+ "grad_norm": 3.331435203552246,
+ "learning_rate": 6.442943736232554e-08,
+ "loss": 0.0497,
+ "step": 35413
+ },
+ {
+ "epoch": 96.49591280653951,
+ "grad_norm": 2.757610559463501,
+ "learning_rate": 6.43294602593758e-08,
+ "loss": 0.0432,
+ "step": 35414
+ },
+ {
+ "epoch": 96.49863760217984,
+ "grad_norm": 1.955291748046875,
+ "learning_rate": 6.422956053510842e-08,
+ "loss": 0.0197,
+ "step": 35415
+ },
+ {
+ "epoch": 96.50136239782016,
+ "grad_norm": 2.445478916168213,
+ "learning_rate": 6.412973819030054e-08,
+ "loss": 0.0226,
+ "step": 35416
+ },
+ {
+ "epoch": 96.50408719346049,
+ "grad_norm": 1.7992150783538818,
+ "learning_rate": 6.402999322573155e-08,
+ "loss": 0.0188,
+ "step": 35417
+ },
+ {
+ "epoch": 96.50681198910081,
+ "grad_norm": 3.279829978942871,
+ "learning_rate": 6.393032564217749e-08,
+ "loss": 0.1837,
+ "step": 35418
+ },
+ {
+ "epoch": 96.50953678474114,
+ "grad_norm": 2.0962960720062256,
+ "learning_rate": 6.383073544041329e-08,
+ "loss": 0.0301,
+ "step": 35419
+ },
+ {
+ "epoch": 96.51226158038148,
+ "grad_norm": 3.2004408836364746,
+ "learning_rate": 6.373122262121501e-08,
+ "loss": 0.0788,
+ "step": 35420
+ },
+ {
+ "epoch": 96.5149863760218,
+ "grad_norm": 2.7900593280792236,
+ "learning_rate": 6.363178718535867e-08,
+ "loss": 0.0304,
+ "step": 35421
+ },
+ {
+ "epoch": 96.51771117166213,
+ "grad_norm": 2.743136405944824,
+ "learning_rate": 6.353242913361923e-08,
+ "loss": 0.0356,
+ "step": 35422
+ },
+ {
+ "epoch": 96.52043596730245,
+ "grad_norm": 2.221099376678467,
+ "learning_rate": 6.34331484667683e-08,
+ "loss": 0.0544,
+ "step": 35423
+ },
+ {
+ "epoch": 96.52316076294278,
+ "grad_norm": 2.3044931888580322,
+ "learning_rate": 6.333394518558078e-08,
+ "loss": 0.0294,
+ "step": 35424
+ },
+ {
+ "epoch": 96.52588555858311,
+ "grad_norm": 1.9390853643417358,
+ "learning_rate": 6.323481929082831e-08,
+ "loss": 0.0161,
+ "step": 35425
+ },
+ {
+ "epoch": 96.52861035422343,
+ "grad_norm": 2.6898579597473145,
+ "learning_rate": 6.313577078328358e-08,
+ "loss": 0.0737,
+ "step": 35426
+ },
+ {
+ "epoch": 96.53133514986376,
+ "grad_norm": 2.4154839515686035,
+ "learning_rate": 6.303679966371712e-08,
+ "loss": 0.0497,
+ "step": 35427
+ },
+ {
+ "epoch": 96.53405994550408,
+ "grad_norm": 2.372375249862671,
+ "learning_rate": 6.29379059329005e-08,
+ "loss": 0.0916,
+ "step": 35428
+ },
+ {
+ "epoch": 96.53678474114442,
+ "grad_norm": 1.3991450071334839,
+ "learning_rate": 6.283908959160424e-08,
+ "loss": 0.1319,
+ "step": 35429
+ },
+ {
+ "epoch": 96.53950953678473,
+ "grad_norm": 2.4112188816070557,
+ "learning_rate": 6.274035064059658e-08,
+ "loss": 0.0329,
+ "step": 35430
+ },
+ {
+ "epoch": 96.54223433242507,
+ "grad_norm": 2.5971317291259766,
+ "learning_rate": 6.264168908064694e-08,
+ "loss": 0.1263,
+ "step": 35431
+ },
+ {
+ "epoch": 96.5449591280654,
+ "grad_norm": 2.3224124908447266,
+ "learning_rate": 6.254310491252469e-08,
+ "loss": 0.0701,
+ "step": 35432
+ },
+ {
+ "epoch": 96.54768392370572,
+ "grad_norm": 1.5080344676971436,
+ "learning_rate": 6.244459813699699e-08,
+ "loss": 0.0801,
+ "step": 35433
+ },
+ {
+ "epoch": 96.55040871934605,
+ "grad_norm": 2.822840452194214,
+ "learning_rate": 6.234616875483101e-08,
+ "loss": 0.0414,
+ "step": 35434
+ },
+ {
+ "epoch": 96.55313351498637,
+ "grad_norm": 3.74899959564209,
+ "learning_rate": 6.224781676679281e-08,
+ "loss": 0.0468,
+ "step": 35435
+ },
+ {
+ "epoch": 96.5558583106267,
+ "grad_norm": 3.728947162628174,
+ "learning_rate": 6.214954217364844e-08,
+ "loss": 0.1173,
+ "step": 35436
+ },
+ {
+ "epoch": 96.55858310626704,
+ "grad_norm": 2.3255670070648193,
+ "learning_rate": 6.205134497616394e-08,
+ "loss": 0.0326,
+ "step": 35437
+ },
+ {
+ "epoch": 96.56130790190736,
+ "grad_norm": 3.693643808364868,
+ "learning_rate": 6.195322517510427e-08,
+ "loss": 0.0522,
+ "step": 35438
+ },
+ {
+ "epoch": 96.56403269754769,
+ "grad_norm": 2.8127853870391846,
+ "learning_rate": 6.185518277123215e-08,
+ "loss": 0.0293,
+ "step": 35439
+ },
+ {
+ "epoch": 96.566757493188,
+ "grad_norm": 2.7797751426696777,
+ "learning_rate": 6.175721776531251e-08,
+ "loss": 0.0236,
+ "step": 35440
+ },
+ {
+ "epoch": 96.56948228882834,
+ "grad_norm": 2.783245325088501,
+ "learning_rate": 6.16593301581081e-08,
+ "loss": 0.1711,
+ "step": 35441
+ },
+ {
+ "epoch": 96.57220708446866,
+ "grad_norm": 3.790992021560669,
+ "learning_rate": 6.156151995038052e-08,
+ "loss": 0.0772,
+ "step": 35442
+ },
+ {
+ "epoch": 96.57493188010899,
+ "grad_norm": 2.600486993789673,
+ "learning_rate": 6.146378714289136e-08,
+ "loss": 0.2184,
+ "step": 35443
+ },
+ {
+ "epoch": 96.57765667574932,
+ "grad_norm": 3.12739634513855,
+ "learning_rate": 6.136613173640338e-08,
+ "loss": 0.0754,
+ "step": 35444
+ },
+ {
+ "epoch": 96.58038147138964,
+ "grad_norm": 2.153390645980835,
+ "learning_rate": 6.126855373167595e-08,
+ "loss": 0.0289,
+ "step": 35445
+ },
+ {
+ "epoch": 96.58310626702998,
+ "grad_norm": 3.036858320236206,
+ "learning_rate": 6.117105312946848e-08,
+ "loss": 0.0783,
+ "step": 35446
+ },
+ {
+ "epoch": 96.5858310626703,
+ "grad_norm": 2.371133804321289,
+ "learning_rate": 6.107362993054145e-08,
+ "loss": 0.0245,
+ "step": 35447
+ },
+ {
+ "epoch": 96.58855585831063,
+ "grad_norm": 3.0209193229675293,
+ "learning_rate": 6.097628413565315e-08,
+ "loss": 0.1349,
+ "step": 35448
+ },
+ {
+ "epoch": 96.59128065395096,
+ "grad_norm": 2.7885658740997314,
+ "learning_rate": 6.087901574556188e-08,
+ "loss": 0.022,
+ "step": 35449
+ },
+ {
+ "epoch": 96.59400544959128,
+ "grad_norm": 2.07749342918396,
+ "learning_rate": 6.078182476102479e-08,
+ "loss": 0.0191,
+ "step": 35450
+ },
+ {
+ "epoch": 96.59673024523161,
+ "grad_norm": 2.2811388969421387,
+ "learning_rate": 6.068471118279796e-08,
+ "loss": 0.0646,
+ "step": 35451
+ },
+ {
+ "epoch": 96.59945504087193,
+ "grad_norm": 2.1365513801574707,
+ "learning_rate": 6.058767501163965e-08,
+ "loss": 0.0244,
+ "step": 35452
+ },
+ {
+ "epoch": 96.60217983651226,
+ "grad_norm": 2.067659616470337,
+ "learning_rate": 6.049071624830371e-08,
+ "loss": 0.1074,
+ "step": 35453
+ },
+ {
+ "epoch": 96.60490463215258,
+ "grad_norm": 2.351426601409912,
+ "learning_rate": 6.039383489354734e-08,
+ "loss": 0.0185,
+ "step": 35454
+ },
+ {
+ "epoch": 96.60762942779292,
+ "grad_norm": 2.4213521480560303,
+ "learning_rate": 6.029703094812433e-08,
+ "loss": 0.0826,
+ "step": 35455
+ },
+ {
+ "epoch": 96.61035422343325,
+ "grad_norm": 2.7885429859161377,
+ "learning_rate": 6.020030441278635e-08,
+ "loss": 0.1608,
+ "step": 35456
+ },
+ {
+ "epoch": 96.61307901907357,
+ "grad_norm": 2.439114570617676,
+ "learning_rate": 6.010365528828944e-08,
+ "loss": 0.0383,
+ "step": 35457
+ },
+ {
+ "epoch": 96.6158038147139,
+ "grad_norm": 2.6008098125457764,
+ "learning_rate": 6.00070835753852e-08,
+ "loss": 0.0593,
+ "step": 35458
+ },
+ {
+ "epoch": 96.61852861035422,
+ "grad_norm": 1.9538836479187012,
+ "learning_rate": 5.991058927482641e-08,
+ "loss": 0.0721,
+ "step": 35459
+ },
+ {
+ "epoch": 96.62125340599455,
+ "grad_norm": 2.3058667182922363,
+ "learning_rate": 5.981417238736353e-08,
+ "loss": 0.0708,
+ "step": 35460
+ },
+ {
+ "epoch": 96.62397820163488,
+ "grad_norm": 3.0144667625427246,
+ "learning_rate": 5.971783291374822e-08,
+ "loss": 0.0875,
+ "step": 35461
+ },
+ {
+ "epoch": 96.6267029972752,
+ "grad_norm": 1.9830503463745117,
+ "learning_rate": 5.962157085473097e-08,
+ "loss": 0.0986,
+ "step": 35462
+ },
+ {
+ "epoch": 96.62942779291554,
+ "grad_norm": 4.235957622528076,
+ "learning_rate": 5.952538621106008e-08,
+ "loss": 0.1544,
+ "step": 35463
+ },
+ {
+ "epoch": 96.63215258855585,
+ "grad_norm": 2.2204272747039795,
+ "learning_rate": 5.942927898348494e-08,
+ "loss": 0.0731,
+ "step": 35464
+ },
+ {
+ "epoch": 96.63487738419619,
+ "grad_norm": 2.223872184753418,
+ "learning_rate": 5.933324917275607e-08,
+ "loss": 0.0343,
+ "step": 35465
+ },
+ {
+ "epoch": 96.6376021798365,
+ "grad_norm": 2.088108539581299,
+ "learning_rate": 5.923729677961954e-08,
+ "loss": 0.0281,
+ "step": 35466
+ },
+ {
+ "epoch": 96.64032697547684,
+ "grad_norm": 2.085111141204834,
+ "learning_rate": 5.914142180482252e-08,
+ "loss": 0.0408,
+ "step": 35467
+ },
+ {
+ "epoch": 96.64305177111717,
+ "grad_norm": 3.047095775604248,
+ "learning_rate": 5.90456242491122e-08,
+ "loss": 0.0477,
+ "step": 35468
+ },
+ {
+ "epoch": 96.64577656675749,
+ "grad_norm": 2.2496964931488037,
+ "learning_rate": 5.8949904113235756e-08,
+ "loss": 0.0954,
+ "step": 35469
+ },
+ {
+ "epoch": 96.64850136239782,
+ "grad_norm": 3.0736424922943115,
+ "learning_rate": 5.885426139793593e-08,
+ "loss": 0.1502,
+ "step": 35470
+ },
+ {
+ "epoch": 96.65122615803814,
+ "grad_norm": 8.928645133972168,
+ "learning_rate": 5.87586961039599e-08,
+ "loss": 0.1033,
+ "step": 35471
+ },
+ {
+ "epoch": 96.65395095367847,
+ "grad_norm": 1.8662821054458618,
+ "learning_rate": 5.866320823205152e-08,
+ "loss": 0.0277,
+ "step": 35472
+ },
+ {
+ "epoch": 96.65667574931881,
+ "grad_norm": 3.231903553009033,
+ "learning_rate": 5.856779778295352e-08,
+ "loss": 0.0707,
+ "step": 35473
+ },
+ {
+ "epoch": 96.65940054495913,
+ "grad_norm": 2.469789505004883,
+ "learning_rate": 5.847246475740975e-08,
+ "loss": 0.0566,
+ "step": 35474
+ },
+ {
+ "epoch": 96.66212534059946,
+ "grad_norm": 2.4956843852996826,
+ "learning_rate": 5.837720915616296e-08,
+ "loss": 0.0863,
+ "step": 35475
+ },
+ {
+ "epoch": 96.66485013623978,
+ "grad_norm": 3.3892629146575928,
+ "learning_rate": 5.828203097995366e-08,
+ "loss": 0.1029,
+ "step": 35476
+ },
+ {
+ "epoch": 96.66757493188011,
+ "grad_norm": 3.15836501121521,
+ "learning_rate": 5.8186930229524595e-08,
+ "loss": 0.1668,
+ "step": 35477
+ },
+ {
+ "epoch": 96.67029972752043,
+ "grad_norm": 4.306105136871338,
+ "learning_rate": 5.809190690561517e-08,
+ "loss": 0.0819,
+ "step": 35478
+ },
+ {
+ "epoch": 96.67302452316076,
+ "grad_norm": 2.091834306716919,
+ "learning_rate": 5.799696100896701e-08,
+ "loss": 0.0386,
+ "step": 35479
+ },
+ {
+ "epoch": 96.6757493188011,
+ "grad_norm": 1.1044886112213135,
+ "learning_rate": 5.790209254031731e-08,
+ "loss": 0.0143,
+ "step": 35480
+ },
+ {
+ "epoch": 96.67847411444141,
+ "grad_norm": 2.554041862487793,
+ "learning_rate": 5.780730150040659e-08,
+ "loss": 0.1086,
+ "step": 35481
+ },
+ {
+ "epoch": 96.68119891008175,
+ "grad_norm": 6.993478298187256,
+ "learning_rate": 5.7712587889973136e-08,
+ "loss": 0.1051,
+ "step": 35482
+ },
+ {
+ "epoch": 96.68392370572207,
+ "grad_norm": 2.266606569290161,
+ "learning_rate": 5.761795170975304e-08,
+ "loss": 0.0423,
+ "step": 35483
+ },
+ {
+ "epoch": 96.6866485013624,
+ "grad_norm": 2.4315783977508545,
+ "learning_rate": 5.752339296048459e-08,
+ "loss": 0.0336,
+ "step": 35484
+ },
+ {
+ "epoch": 96.68937329700273,
+ "grad_norm": 1.8120712041854858,
+ "learning_rate": 5.742891164290498e-08,
+ "loss": 0.0333,
+ "step": 35485
+ },
+ {
+ "epoch": 96.69209809264305,
+ "grad_norm": 1.5353174209594727,
+ "learning_rate": 5.733450775774807e-08,
+ "loss": 0.0256,
+ "step": 35486
+ },
+ {
+ "epoch": 96.69482288828338,
+ "grad_norm": 2.4484543800354004,
+ "learning_rate": 5.724018130574993e-08,
+ "loss": 0.0365,
+ "step": 35487
+ },
+ {
+ "epoch": 96.6975476839237,
+ "grad_norm": 4.073673725128174,
+ "learning_rate": 5.714593228764553e-08,
+ "loss": 0.0515,
+ "step": 35488
+ },
+ {
+ "epoch": 96.70027247956403,
+ "grad_norm": 2.161654472351074,
+ "learning_rate": 5.7051760704168734e-08,
+ "loss": 0.0338,
+ "step": 35489
+ },
+ {
+ "epoch": 96.70299727520435,
+ "grad_norm": 2.069058895111084,
+ "learning_rate": 5.695766655605228e-08,
+ "loss": 0.0229,
+ "step": 35490
+ },
+ {
+ "epoch": 96.70572207084469,
+ "grad_norm": 4.5033769607543945,
+ "learning_rate": 5.686364984403003e-08,
+ "loss": 0.0317,
+ "step": 35491
+ },
+ {
+ "epoch": 96.70844686648502,
+ "grad_norm": 1.8857495784759521,
+ "learning_rate": 5.676971056883362e-08,
+ "loss": 0.1158,
+ "step": 35492
+ },
+ {
+ "epoch": 96.71117166212534,
+ "grad_norm": 2.522603988647461,
+ "learning_rate": 5.6675848731194695e-08,
+ "loss": 0.0276,
+ "step": 35493
+ },
+ {
+ "epoch": 96.71389645776567,
+ "grad_norm": 3.187896251678467,
+ "learning_rate": 5.658206433184377e-08,
+ "loss": 0.03,
+ "step": 35494
+ },
+ {
+ "epoch": 96.71662125340599,
+ "grad_norm": 2.375319242477417,
+ "learning_rate": 5.648835737151248e-08,
+ "loss": 0.0637,
+ "step": 35495
+ },
+ {
+ "epoch": 96.71934604904632,
+ "grad_norm": 2.4035370349884033,
+ "learning_rate": 5.6394727850929145e-08,
+ "loss": 0.0502,
+ "step": 35496
+ },
+ {
+ "epoch": 96.72207084468666,
+ "grad_norm": 2.127671957015991,
+ "learning_rate": 5.6301175770824277e-08,
+ "loss": 0.0391,
+ "step": 35497
+ },
+ {
+ "epoch": 96.72479564032697,
+ "grad_norm": 2.6739914417266846,
+ "learning_rate": 5.620770113192509e-08,
+ "loss": 0.0335,
+ "step": 35498
+ },
+ {
+ "epoch": 96.7275204359673,
+ "grad_norm": 2.37778902053833,
+ "learning_rate": 5.611430393496098e-08,
+ "loss": 0.0531,
+ "step": 35499
+ },
+ {
+ "epoch": 96.73024523160763,
+ "grad_norm": 2.3967061042785645,
+ "learning_rate": 5.602098418065804e-08,
+ "loss": 0.0332,
+ "step": 35500
+ },
+ {
+ "epoch": 96.73297002724796,
+ "grad_norm": 2.5274176597595215,
+ "learning_rate": 5.592774186974348e-08,
+ "loss": 0.0214,
+ "step": 35501
+ },
+ {
+ "epoch": 96.73569482288828,
+ "grad_norm": 2.33677077293396,
+ "learning_rate": 5.5834577002944476e-08,
+ "loss": 0.0479,
+ "step": 35502
+ },
+ {
+ "epoch": 96.73841961852861,
+ "grad_norm": 1.8418856859207153,
+ "learning_rate": 5.574148958098491e-08,
+ "loss": 0.1129,
+ "step": 35503
+ },
+ {
+ "epoch": 96.74114441416894,
+ "grad_norm": 2.4903202056884766,
+ "learning_rate": 5.5648479604590856e-08,
+ "loss": 0.0392,
+ "step": 35504
+ },
+ {
+ "epoch": 96.74386920980926,
+ "grad_norm": 1.9814727306365967,
+ "learning_rate": 5.555554707448618e-08,
+ "loss": 0.0682,
+ "step": 35505
+ },
+ {
+ "epoch": 96.7465940054496,
+ "grad_norm": 1.7760999202728271,
+ "learning_rate": 5.5462691991395865e-08,
+ "loss": 0.0482,
+ "step": 35506
+ },
+ {
+ "epoch": 96.74931880108991,
+ "grad_norm": 2.503962516784668,
+ "learning_rate": 5.5369914356041556e-08,
+ "loss": 0.0947,
+ "step": 35507
+ },
+ {
+ "epoch": 96.75204359673025,
+ "grad_norm": 5.7593674659729,
+ "learning_rate": 5.527721416914489e-08,
+ "loss": 0.0524,
+ "step": 35508
+ },
+ {
+ "epoch": 96.75476839237058,
+ "grad_norm": 2.3444464206695557,
+ "learning_rate": 5.5184591431430845e-08,
+ "loss": 0.0279,
+ "step": 35509
+ },
+ {
+ "epoch": 96.7574931880109,
+ "grad_norm": 4.473971366882324,
+ "learning_rate": 5.5092046143618846e-08,
+ "loss": 0.1204,
+ "step": 35510
+ },
+ {
+ "epoch": 96.76021798365123,
+ "grad_norm": 2.6154189109802246,
+ "learning_rate": 5.4999578306429436e-08,
+ "loss": 0.0326,
+ "step": 35511
+ },
+ {
+ "epoch": 96.76294277929155,
+ "grad_norm": 2.3137433528900146,
+ "learning_rate": 5.490718792058314e-08,
+ "loss": 0.1018,
+ "step": 35512
+ },
+ {
+ "epoch": 96.76566757493188,
+ "grad_norm": 1.6487475633621216,
+ "learning_rate": 5.4814874986800495e-08,
+ "loss": 0.0256,
+ "step": 35513
+ },
+ {
+ "epoch": 96.7683923705722,
+ "grad_norm": 2.6181390285491943,
+ "learning_rate": 5.4722639505798704e-08,
+ "loss": 0.0454,
+ "step": 35514
+ },
+ {
+ "epoch": 96.77111716621253,
+ "grad_norm": 2.4293861389160156,
+ "learning_rate": 5.4630481478297196e-08,
+ "loss": 0.0397,
+ "step": 35515
+ },
+ {
+ "epoch": 96.77384196185287,
+ "grad_norm": 2.441007375717163,
+ "learning_rate": 5.453840090501317e-08,
+ "loss": 0.0512,
+ "step": 35516
+ },
+ {
+ "epoch": 96.77656675749319,
+ "grad_norm": 1.941656470298767,
+ "learning_rate": 5.4446397786664936e-08,
+ "loss": 0.1108,
+ "step": 35517
+ },
+ {
+ "epoch": 96.77929155313352,
+ "grad_norm": 3.0584681034088135,
+ "learning_rate": 5.43544721239675e-08,
+ "loss": 0.111,
+ "step": 35518
+ },
+ {
+ "epoch": 96.78201634877384,
+ "grad_norm": 2.185162305831909,
+ "learning_rate": 5.4262623917636925e-08,
+ "loss": 0.0354,
+ "step": 35519
+ },
+ {
+ "epoch": 96.78474114441417,
+ "grad_norm": 2.0862855911254883,
+ "learning_rate": 5.417085316838933e-08,
+ "loss": 0.0433,
+ "step": 35520
+ },
+ {
+ "epoch": 96.7874659400545,
+ "grad_norm": 2.384084463119507,
+ "learning_rate": 5.407915987693857e-08,
+ "loss": 0.0238,
+ "step": 35521
+ },
+ {
+ "epoch": 96.79019073569482,
+ "grad_norm": 2.707002639770508,
+ "learning_rate": 5.398754404399964e-08,
+ "loss": 0.0484,
+ "step": 35522
+ },
+ {
+ "epoch": 96.79291553133515,
+ "grad_norm": 2.577698230743408,
+ "learning_rate": 5.38960056702853e-08,
+ "loss": 0.101,
+ "step": 35523
+ },
+ {
+ "epoch": 96.79564032697547,
+ "grad_norm": 2.1527206897735596,
+ "learning_rate": 5.380454475650942e-08,
+ "loss": 0.0341,
+ "step": 35524
+ },
+ {
+ "epoch": 96.7983651226158,
+ "grad_norm": 2.3384931087493896,
+ "learning_rate": 5.371316130338255e-08,
+ "loss": 0.0854,
+ "step": 35525
+ },
+ {
+ "epoch": 96.80108991825612,
+ "grad_norm": 1.8126362562179565,
+ "learning_rate": 5.362185531161746e-08,
+ "loss": 0.0747,
+ "step": 35526
+ },
+ {
+ "epoch": 96.80381471389646,
+ "grad_norm": 2.0274250507354736,
+ "learning_rate": 5.353062678192689e-08,
+ "loss": 0.0655,
+ "step": 35527
+ },
+ {
+ "epoch": 96.80653950953679,
+ "grad_norm": 2.397373914718628,
+ "learning_rate": 5.343947571501806e-08,
+ "loss": 0.0363,
+ "step": 35528
+ },
+ {
+ "epoch": 96.80926430517711,
+ "grad_norm": 7.551501274108887,
+ "learning_rate": 5.334840211160264e-08,
+ "loss": 0.0401,
+ "step": 35529
+ },
+ {
+ "epoch": 96.81198910081744,
+ "grad_norm": 1.9004566669464111,
+ "learning_rate": 5.3257405972390043e-08,
+ "loss": 0.0318,
+ "step": 35530
+ },
+ {
+ "epoch": 96.81471389645776,
+ "grad_norm": 2.246920108795166,
+ "learning_rate": 5.316648729808971e-08,
+ "loss": 0.0643,
+ "step": 35531
+ },
+ {
+ "epoch": 96.8174386920981,
+ "grad_norm": 2.6450071334838867,
+ "learning_rate": 5.307564608940663e-08,
+ "loss": 0.0537,
+ "step": 35532
+ },
+ {
+ "epoch": 96.82016348773843,
+ "grad_norm": 1.4076768159866333,
+ "learning_rate": 5.2984882347051345e-08,
+ "loss": 0.0177,
+ "step": 35533
+ },
+ {
+ "epoch": 96.82288828337875,
+ "grad_norm": 2.5664820671081543,
+ "learning_rate": 5.2894196071729966e-08,
+ "loss": 0.0418,
+ "step": 35534
+ },
+ {
+ "epoch": 96.82561307901908,
+ "grad_norm": 2.4444258213043213,
+ "learning_rate": 5.280358726414858e-08,
+ "loss": 0.0339,
+ "step": 35535
+ },
+ {
+ "epoch": 96.8283378746594,
+ "grad_norm": 2.2147350311279297,
+ "learning_rate": 5.271305592501108e-08,
+ "loss": 0.0499,
+ "step": 35536
+ },
+ {
+ "epoch": 96.83106267029973,
+ "grad_norm": 2.550987958908081,
+ "learning_rate": 5.262260205502578e-08,
+ "loss": 0.0985,
+ "step": 35537
+ },
+ {
+ "epoch": 96.83378746594005,
+ "grad_norm": 2.4605648517608643,
+ "learning_rate": 5.253222565489546e-08,
+ "loss": 0.0767,
+ "step": 35538
+ },
+ {
+ "epoch": 96.83651226158038,
+ "grad_norm": 4.611190319061279,
+ "learning_rate": 5.244192672532289e-08,
+ "loss": 0.2291,
+ "step": 35539
+ },
+ {
+ "epoch": 96.83923705722071,
+ "grad_norm": 1.9465532302856445,
+ "learning_rate": 5.2351705267013055e-08,
+ "loss": 0.0579,
+ "step": 35540
+ },
+ {
+ "epoch": 96.84196185286103,
+ "grad_norm": 4.9753594398498535,
+ "learning_rate": 5.2261561280667614e-08,
+ "loss": 0.1049,
+ "step": 35541
+ },
+ {
+ "epoch": 96.84468664850137,
+ "grad_norm": 2.467731475830078,
+ "learning_rate": 5.217149476698935e-08,
+ "loss": 0.0849,
+ "step": 35542
+ },
+ {
+ "epoch": 96.84741144414168,
+ "grad_norm": 2.3039093017578125,
+ "learning_rate": 5.2081505726679916e-08,
+ "loss": 0.0316,
+ "step": 35543
+ },
+ {
+ "epoch": 96.85013623978202,
+ "grad_norm": 3.5640945434570312,
+ "learning_rate": 5.199159416043875e-08,
+ "loss": 0.0335,
+ "step": 35544
+ },
+ {
+ "epoch": 96.85286103542235,
+ "grad_norm": 2.324336290359497,
+ "learning_rate": 5.190176006896641e-08,
+ "loss": 0.0506,
+ "step": 35545
+ },
+ {
+ "epoch": 96.85558583106267,
+ "grad_norm": 2.183614492416382,
+ "learning_rate": 5.181200345296455e-08,
+ "loss": 0.0506,
+ "step": 35546
+ },
+ {
+ "epoch": 96.858310626703,
+ "grad_norm": 3.2237741947174072,
+ "learning_rate": 5.172232431312929e-08,
+ "loss": 0.03,
+ "step": 35547
+ },
+ {
+ "epoch": 96.86103542234332,
+ "grad_norm": 2.060969591140747,
+ "learning_rate": 5.163272265016117e-08,
+ "loss": 0.0541,
+ "step": 35548
+ },
+ {
+ "epoch": 96.86376021798365,
+ "grad_norm": 2.4621293544769287,
+ "learning_rate": 5.154319846475631e-08,
+ "loss": 0.023,
+ "step": 35549
+ },
+ {
+ "epoch": 96.86648501362397,
+ "grad_norm": 2.451321840286255,
+ "learning_rate": 5.1453751757614136e-08,
+ "loss": 0.0316,
+ "step": 35550
+ },
+ {
+ "epoch": 96.8692098092643,
+ "grad_norm": 1.8460115194320679,
+ "learning_rate": 5.1364382529428545e-08,
+ "loss": 0.0167,
+ "step": 35551
+ },
+ {
+ "epoch": 96.87193460490464,
+ "grad_norm": 3.7541723251342773,
+ "learning_rate": 5.1275090780897875e-08,
+ "loss": 0.0663,
+ "step": 35552
+ },
+ {
+ "epoch": 96.87465940054496,
+ "grad_norm": 2.6491284370422363,
+ "learning_rate": 5.1185876512716004e-08,
+ "loss": 0.0263,
+ "step": 35553
+ },
+ {
+ "epoch": 96.87738419618529,
+ "grad_norm": 2.2321131229400635,
+ "learning_rate": 5.109673972557905e-08,
+ "loss": 0.0197,
+ "step": 35554
+ },
+ {
+ "epoch": 96.88010899182561,
+ "grad_norm": 7.176581382751465,
+ "learning_rate": 5.1007680420179786e-08,
+ "loss": 0.0547,
+ "step": 35555
+ },
+ {
+ "epoch": 96.88283378746594,
+ "grad_norm": 2.114020586013794,
+ "learning_rate": 5.0918698597212104e-08,
+ "loss": 0.1361,
+ "step": 35556
+ },
+ {
+ "epoch": 96.88555858310627,
+ "grad_norm": 1.994983434677124,
+ "learning_rate": 5.082979425736989e-08,
+ "loss": 0.0905,
+ "step": 35557
+ },
+ {
+ "epoch": 96.88828337874659,
+ "grad_norm": 1.936752438545227,
+ "learning_rate": 5.074096740134593e-08,
+ "loss": 0.0306,
+ "step": 35558
+ },
+ {
+ "epoch": 96.89100817438693,
+ "grad_norm": 2.5228633880615234,
+ "learning_rate": 5.065221802983078e-08,
+ "loss": 0.0741,
+ "step": 35559
+ },
+ {
+ "epoch": 96.89373297002724,
+ "grad_norm": 1.7915103435516357,
+ "learning_rate": 5.0563546143515e-08,
+ "loss": 0.1433,
+ "step": 35560
+ },
+ {
+ "epoch": 96.89645776566758,
+ "grad_norm": 2.609074115753174,
+ "learning_rate": 5.047495174309025e-08,
+ "loss": 0.0458,
+ "step": 35561
+ },
+ {
+ "epoch": 96.8991825613079,
+ "grad_norm": 2.0458016395568848,
+ "learning_rate": 5.03864348292471e-08,
+ "loss": 0.022,
+ "step": 35562
+ },
+ {
+ "epoch": 96.90190735694823,
+ "grad_norm": 2.0826382637023926,
+ "learning_rate": 5.0297995402673884e-08,
+ "loss": 0.0388,
+ "step": 35563
+ },
+ {
+ "epoch": 96.90463215258856,
+ "grad_norm": 1.929991364479065,
+ "learning_rate": 5.0209633464060046e-08,
+ "loss": 0.0183,
+ "step": 35564
+ },
+ {
+ "epoch": 96.90735694822888,
+ "grad_norm": 2.0320088863372803,
+ "learning_rate": 5.0121349014091715e-08,
+ "loss": 0.1049,
+ "step": 35565
+ },
+ {
+ "epoch": 96.91008174386921,
+ "grad_norm": 16.922584533691406,
+ "learning_rate": 5.003314205345944e-08,
+ "loss": 0.0905,
+ "step": 35566
+ },
+ {
+ "epoch": 96.91280653950953,
+ "grad_norm": 2.336092710494995,
+ "learning_rate": 4.994501258284934e-08,
+ "loss": 0.1259,
+ "step": 35567
+ },
+ {
+ "epoch": 96.91553133514986,
+ "grad_norm": 1.9293670654296875,
+ "learning_rate": 4.985696060294642e-08,
+ "loss": 0.0248,
+ "step": 35568
+ },
+ {
+ "epoch": 96.9182561307902,
+ "grad_norm": 4.455367088317871,
+ "learning_rate": 4.9768986114436814e-08,
+ "loss": 0.1014,
+ "step": 35569
+ },
+ {
+ "epoch": 96.92098092643052,
+ "grad_norm": 3.27518630027771,
+ "learning_rate": 4.968108911800662e-08,
+ "loss": 0.0501,
+ "step": 35570
+ },
+ {
+ "epoch": 96.92370572207085,
+ "grad_norm": 3.5886731147766113,
+ "learning_rate": 4.9593269614339744e-08,
+ "loss": 0.0365,
+ "step": 35571
+ },
+ {
+ "epoch": 96.92643051771117,
+ "grad_norm": 2.05401611328125,
+ "learning_rate": 4.9505527604121194e-08,
+ "loss": 0.0264,
+ "step": 35572
+ },
+ {
+ "epoch": 96.9291553133515,
+ "grad_norm": 2.369694948196411,
+ "learning_rate": 4.941786308803154e-08,
+ "loss": 0.1041,
+ "step": 35573
+ },
+ {
+ "epoch": 96.93188010899182,
+ "grad_norm": 2.589430093765259,
+ "learning_rate": 4.933027606675689e-08,
+ "loss": 0.0654,
+ "step": 35574
+ },
+ {
+ "epoch": 96.93460490463215,
+ "grad_norm": 3.099961757659912,
+ "learning_rate": 4.924276654097671e-08,
+ "loss": 0.0288,
+ "step": 35575
+ },
+ {
+ "epoch": 96.93732970027249,
+ "grad_norm": 2.487401008605957,
+ "learning_rate": 4.9155334511373775e-08,
+ "loss": 0.1365,
+ "step": 35576
+ },
+ {
+ "epoch": 96.9400544959128,
+ "grad_norm": 3.020406723022461,
+ "learning_rate": 4.9067979978629776e-08,
+ "loss": 0.1856,
+ "step": 35577
+ },
+ {
+ "epoch": 96.94277929155314,
+ "grad_norm": 2.2442588806152344,
+ "learning_rate": 4.898070294342305e-08,
+ "loss": 0.0309,
+ "step": 35578
+ },
+ {
+ "epoch": 96.94550408719346,
+ "grad_norm": 3.3606913089752197,
+ "learning_rate": 4.8893503406435285e-08,
+ "loss": 0.046,
+ "step": 35579
+ },
+ {
+ "epoch": 96.94822888283379,
+ "grad_norm": 2.7061917781829834,
+ "learning_rate": 4.8806381368343705e-08,
+ "loss": 0.0324,
+ "step": 35580
+ },
+ {
+ "epoch": 96.95095367847412,
+ "grad_norm": 2.671208620071411,
+ "learning_rate": 4.8719336829827765e-08,
+ "loss": 0.0912,
+ "step": 35581
+ },
+ {
+ "epoch": 96.95367847411444,
+ "grad_norm": 2.5573370456695557,
+ "learning_rate": 4.8632369791565825e-08,
+ "loss": 0.0715,
+ "step": 35582
+ },
+ {
+ "epoch": 96.95640326975477,
+ "grad_norm": 2.2591705322265625,
+ "learning_rate": 4.854548025423511e-08,
+ "loss": 0.0418,
+ "step": 35583
+ },
+ {
+ "epoch": 96.95912806539509,
+ "grad_norm": 2.5224218368530273,
+ "learning_rate": 4.845866821851064e-08,
+ "loss": 0.0834,
+ "step": 35584
+ },
+ {
+ "epoch": 96.96185286103542,
+ "grad_norm": 3.1266067028045654,
+ "learning_rate": 4.837193368507076e-08,
+ "loss": 0.0334,
+ "step": 35585
+ },
+ {
+ "epoch": 96.96457765667574,
+ "grad_norm": 2.3245010375976562,
+ "learning_rate": 4.828527665458937e-08,
+ "loss": 0.0253,
+ "step": 35586
+ },
+ {
+ "epoch": 96.96730245231608,
+ "grad_norm": 23.660011291503906,
+ "learning_rate": 4.8198697127742613e-08,
+ "loss": 0.0601,
+ "step": 35587
+ },
+ {
+ "epoch": 96.97002724795641,
+ "grad_norm": 4.185683250427246,
+ "learning_rate": 4.811219510520437e-08,
+ "loss": 0.0262,
+ "step": 35588
+ },
+ {
+ "epoch": 96.97275204359673,
+ "grad_norm": 2.4813575744628906,
+ "learning_rate": 4.802577058764635e-08,
+ "loss": 0.0236,
+ "step": 35589
+ },
+ {
+ "epoch": 96.97547683923706,
+ "grad_norm": 2.5231006145477295,
+ "learning_rate": 4.793942357574466e-08,
+ "loss": 0.0427,
+ "step": 35590
+ },
+ {
+ "epoch": 96.97820163487738,
+ "grad_norm": 2.479731559753418,
+ "learning_rate": 4.7853154070169885e-08,
+ "loss": 0.0423,
+ "step": 35591
+ },
+ {
+ "epoch": 96.98092643051771,
+ "grad_norm": 2.662405014038086,
+ "learning_rate": 4.776696207159481e-08,
+ "loss": 0.0286,
+ "step": 35592
+ },
+ {
+ "epoch": 96.98365122615803,
+ "grad_norm": 2.94612979888916,
+ "learning_rate": 4.7680847580691136e-08,
+ "loss": 0.1132,
+ "step": 35593
+ },
+ {
+ "epoch": 96.98637602179836,
+ "grad_norm": 2.1367650032043457,
+ "learning_rate": 4.75948105981272e-08,
+ "loss": 0.0974,
+ "step": 35594
+ },
+ {
+ "epoch": 96.9891008174387,
+ "grad_norm": 4.904690742492676,
+ "learning_rate": 4.7508851124574705e-08,
+ "loss": 0.0674,
+ "step": 35595
+ },
+ {
+ "epoch": 96.99182561307902,
+ "grad_norm": 1.8304905891418457,
+ "learning_rate": 4.742296916070421e-08,
+ "loss": 0.0768,
+ "step": 35596
+ },
+ {
+ "epoch": 96.99455040871935,
+ "grad_norm": 2.413317918777466,
+ "learning_rate": 4.733716470718186e-08,
+ "loss": 0.0181,
+ "step": 35597
+ },
+ {
+ "epoch": 96.99727520435967,
+ "grad_norm": 2.6462340354919434,
+ "learning_rate": 4.725143776467822e-08,
+ "loss": 0.0844,
+ "step": 35598
+ },
+ {
+ "epoch": 97.0,
+ "grad_norm": 1.5588715076446533,
+ "learning_rate": 4.716578833386054e-08,
+ "loss": 0.0205,
+ "step": 35599
+ },
+ {
+ "epoch": 97.00272479564033,
+ "grad_norm": 2.9802091121673584,
+ "learning_rate": 4.7080216415394954e-08,
+ "loss": 0.063,
+ "step": 35600
+ },
+ {
+ "epoch": 97.00544959128065,
+ "grad_norm": 2.9426045417785645,
+ "learning_rate": 4.699472200994759e-08,
+ "loss": 0.0283,
+ "step": 35601
+ },
+ {
+ "epoch": 97.00817438692098,
+ "grad_norm": 1.8756449222564697,
+ "learning_rate": 4.69093051181857e-08,
+ "loss": 0.0593,
+ "step": 35602
+ },
+ {
+ "epoch": 97.0108991825613,
+ "grad_norm": 3.53544545173645,
+ "learning_rate": 4.682396574077319e-08,
+ "loss": 0.0279,
+ "step": 35603
+ },
+ {
+ "epoch": 97.01362397820164,
+ "grad_norm": 2.3807857036590576,
+ "learning_rate": 4.6738703878376204e-08,
+ "loss": 0.0459,
+ "step": 35604
+ },
+ {
+ "epoch": 97.01634877384195,
+ "grad_norm": 2.192631721496582,
+ "learning_rate": 4.665351953165642e-08,
+ "loss": 0.0422,
+ "step": 35605
+ },
+ {
+ "epoch": 97.01907356948229,
+ "grad_norm": 3.610191822052002,
+ "learning_rate": 4.656841270127999e-08,
+ "loss": 0.1389,
+ "step": 35606
+ },
+ {
+ "epoch": 97.02179836512262,
+ "grad_norm": 2.798900604248047,
+ "learning_rate": 4.6483383387908585e-08,
+ "loss": 0.0817,
+ "step": 35607
+ },
+ {
+ "epoch": 97.02452316076294,
+ "grad_norm": 4.655253887176514,
+ "learning_rate": 4.6398431592202805e-08,
+ "loss": 0.0451,
+ "step": 35608
+ },
+ {
+ "epoch": 97.02724795640327,
+ "grad_norm": 2.315178155899048,
+ "learning_rate": 4.6313557314826564e-08,
+ "loss": 0.0496,
+ "step": 35609
+ },
+ {
+ "epoch": 97.02997275204359,
+ "grad_norm": 1.9423848390579224,
+ "learning_rate": 4.622876055643932e-08,
+ "loss": 0.0274,
+ "step": 35610
+ },
+ {
+ "epoch": 97.03269754768392,
+ "grad_norm": 2.0493133068084717,
+ "learning_rate": 4.614404131770389e-08,
+ "loss": 0.0243,
+ "step": 35611
+ },
+ {
+ "epoch": 97.03542234332426,
+ "grad_norm": 3.3066389560699463,
+ "learning_rate": 4.605939959927641e-08,
+ "loss": 0.0523,
+ "step": 35612
+ },
+ {
+ "epoch": 97.03814713896458,
+ "grad_norm": 4.777273654937744,
+ "learning_rate": 4.597483540181968e-08,
+ "loss": 0.0293,
+ "step": 35613
+ },
+ {
+ "epoch": 97.04087193460491,
+ "grad_norm": 2.330043315887451,
+ "learning_rate": 4.5890348725988744e-08,
+ "loss": 0.0261,
+ "step": 35614
+ },
+ {
+ "epoch": 97.04359673024523,
+ "grad_norm": 3.9469618797302246,
+ "learning_rate": 4.5805939572444166e-08,
+ "loss": 0.0224,
+ "step": 35615
+ },
+ {
+ "epoch": 97.04632152588556,
+ "grad_norm": 2.940596342086792,
+ "learning_rate": 4.572160794184322e-08,
+ "loss": 0.0392,
+ "step": 35616
+ },
+ {
+ "epoch": 97.04904632152588,
+ "grad_norm": 2.8023288249969482,
+ "learning_rate": 4.563735383484091e-08,
+ "loss": 0.0338,
+ "step": 35617
+ },
+ {
+ "epoch": 97.05177111716621,
+ "grad_norm": 2.739731788635254,
+ "learning_rate": 4.5553177252095624e-08,
+ "loss": 0.0534,
+ "step": 35618
+ },
+ {
+ "epoch": 97.05449591280654,
+ "grad_norm": 2.1139893531799316,
+ "learning_rate": 4.5469078194261276e-08,
+ "loss": 0.0328,
+ "step": 35619
+ },
+ {
+ "epoch": 97.05722070844686,
+ "grad_norm": 2.6700010299682617,
+ "learning_rate": 4.5385056661992886e-08,
+ "loss": 0.0255,
+ "step": 35620
+ },
+ {
+ "epoch": 97.0599455040872,
+ "grad_norm": 2.1723580360412598,
+ "learning_rate": 4.53011126559455e-08,
+ "loss": 0.0158,
+ "step": 35621
+ },
+ {
+ "epoch": 97.06267029972751,
+ "grad_norm": 1.5713322162628174,
+ "learning_rate": 4.5217246176773036e-08,
+ "loss": 0.0194,
+ "step": 35622
+ },
+ {
+ "epoch": 97.06539509536785,
+ "grad_norm": 2.799923896789551,
+ "learning_rate": 4.5133457225128296e-08,
+ "loss": 0.0423,
+ "step": 35623
+ },
+ {
+ "epoch": 97.06811989100818,
+ "grad_norm": 2.719472646713257,
+ "learning_rate": 4.50497458016641e-08,
+ "loss": 0.0711,
+ "step": 35624
+ },
+ {
+ "epoch": 97.0708446866485,
+ "grad_norm": 17.930240631103516,
+ "learning_rate": 4.496611190703104e-08,
+ "loss": 0.0529,
+ "step": 35625
+ },
+ {
+ "epoch": 97.07356948228883,
+ "grad_norm": 1.8039621114730835,
+ "learning_rate": 4.488255554188192e-08,
+ "loss": 0.1001,
+ "step": 35626
+ },
+ {
+ "epoch": 97.07629427792915,
+ "grad_norm": 1.8604620695114136,
+ "learning_rate": 4.479907670686734e-08,
+ "loss": 0.0262,
+ "step": 35627
+ },
+ {
+ "epoch": 97.07901907356948,
+ "grad_norm": 2.324397087097168,
+ "learning_rate": 4.4715675402636774e-08,
+ "loss": 0.0389,
+ "step": 35628
+ },
+ {
+ "epoch": 97.0817438692098,
+ "grad_norm": 3.6882824897766113,
+ "learning_rate": 4.463235162984081e-08,
+ "loss": 0.0382,
+ "step": 35629
+ },
+ {
+ "epoch": 97.08446866485014,
+ "grad_norm": 2.095919370651245,
+ "learning_rate": 4.454910538912671e-08,
+ "loss": 0.0237,
+ "step": 35630
+ },
+ {
+ "epoch": 97.08719346049047,
+ "grad_norm": 3.908423900604248,
+ "learning_rate": 4.446593668114396e-08,
+ "loss": 0.08,
+ "step": 35631
+ },
+ {
+ "epoch": 97.08991825613079,
+ "grad_norm": 2.1432840824127197,
+ "learning_rate": 4.438284550654093e-08,
+ "loss": 0.0335,
+ "step": 35632
+ },
+ {
+ "epoch": 97.09264305177112,
+ "grad_norm": 2.915332794189453,
+ "learning_rate": 4.4299831865962653e-08,
+ "loss": 0.1137,
+ "step": 35633
+ },
+ {
+ "epoch": 97.09536784741144,
+ "grad_norm": 3.781524658203125,
+ "learning_rate": 4.42168957600575e-08,
+ "loss": 0.1042,
+ "step": 35634
+ },
+ {
+ "epoch": 97.09809264305177,
+ "grad_norm": 2.3162896633148193,
+ "learning_rate": 4.413403718947162e-08,
+ "loss": 0.051,
+ "step": 35635
+ },
+ {
+ "epoch": 97.1008174386921,
+ "grad_norm": 2.087754011154175,
+ "learning_rate": 4.4051256154847844e-08,
+ "loss": 0.022,
+ "step": 35636
+ },
+ {
+ "epoch": 97.10354223433242,
+ "grad_norm": 2.776384115219116,
+ "learning_rate": 4.396855265683342e-08,
+ "loss": 0.0267,
+ "step": 35637
+ },
+ {
+ "epoch": 97.10626702997276,
+ "grad_norm": 2.3792355060577393,
+ "learning_rate": 4.388592669607117e-08,
+ "loss": 0.0267,
+ "step": 35638
+ },
+ {
+ "epoch": 97.10899182561307,
+ "grad_norm": 1.4954745769500732,
+ "learning_rate": 4.3803378273205024e-08,
+ "loss": 0.0215,
+ "step": 35639
+ },
+ {
+ "epoch": 97.11171662125341,
+ "grad_norm": 3.321103096008301,
+ "learning_rate": 4.37209073888778e-08,
+ "loss": 0.1687,
+ "step": 35640
+ },
+ {
+ "epoch": 97.11444141689373,
+ "grad_norm": 2.249972343444824,
+ "learning_rate": 4.363851404373121e-08,
+ "loss": 0.0383,
+ "step": 35641
+ },
+ {
+ "epoch": 97.11716621253406,
+ "grad_norm": 2.076660394668579,
+ "learning_rate": 4.3556198238408064e-08,
+ "loss": 0.0691,
+ "step": 35642
+ },
+ {
+ "epoch": 97.11989100817439,
+ "grad_norm": 3.3433871269226074,
+ "learning_rate": 4.3473959973547866e-08,
+ "loss": 0.0686,
+ "step": 35643
+ },
+ {
+ "epoch": 97.12261580381471,
+ "grad_norm": 3.1689705848693848,
+ "learning_rate": 4.339179924979342e-08,
+ "loss": 0.1157,
+ "step": 35644
+ },
+ {
+ "epoch": 97.12534059945504,
+ "grad_norm": 2.73633074760437,
+ "learning_rate": 4.3309716067782e-08,
+ "loss": 0.1455,
+ "step": 35645
+ },
+ {
+ "epoch": 97.12806539509536,
+ "grad_norm": 2.4419350624084473,
+ "learning_rate": 4.322771042815421e-08,
+ "loss": 0.0266,
+ "step": 35646
+ },
+ {
+ "epoch": 97.1307901907357,
+ "grad_norm": 2.533695697784424,
+ "learning_rate": 4.314578233154953e-08,
+ "loss": 0.0257,
+ "step": 35647
+ },
+ {
+ "epoch": 97.13351498637603,
+ "grad_norm": 3.47039532661438,
+ "learning_rate": 4.306393177860413e-08,
+ "loss": 0.0442,
+ "step": 35648
+ },
+ {
+ "epoch": 97.13623978201635,
+ "grad_norm": 7.448739051818848,
+ "learning_rate": 4.2982158769956375e-08,
+ "loss": 0.1653,
+ "step": 35649
+ },
+ {
+ "epoch": 97.13896457765668,
+ "grad_norm": 3.205759286880493,
+ "learning_rate": 4.290046330624354e-08,
+ "loss": 0.0518,
+ "step": 35650
+ },
+ {
+ "epoch": 97.141689373297,
+ "grad_norm": 2.101719617843628,
+ "learning_rate": 4.281884538810066e-08,
+ "loss": 0.0657,
+ "step": 35651
+ },
+ {
+ "epoch": 97.14441416893733,
+ "grad_norm": 1.5737000703811646,
+ "learning_rate": 4.2737305016165024e-08,
+ "loss": 0.0178,
+ "step": 35652
+ },
+ {
+ "epoch": 97.14713896457765,
+ "grad_norm": 2.535308599472046,
+ "learning_rate": 4.265584219107055e-08,
+ "loss": 0.0216,
+ "step": 35653
+ },
+ {
+ "epoch": 97.14986376021798,
+ "grad_norm": 1.0927975177764893,
+ "learning_rate": 4.25744569134523e-08,
+ "loss": 0.0164,
+ "step": 35654
+ },
+ {
+ "epoch": 97.15258855585832,
+ "grad_norm": 1.8163610696792603,
+ "learning_rate": 4.24931491839431e-08,
+ "loss": 0.0257,
+ "step": 35655
+ },
+ {
+ "epoch": 97.15531335149863,
+ "grad_norm": 2.726227283477783,
+ "learning_rate": 4.241191900317687e-08,
+ "loss": 0.0664,
+ "step": 35656
+ },
+ {
+ "epoch": 97.15803814713897,
+ "grad_norm": 5.813877105712891,
+ "learning_rate": 4.233076637178646e-08,
+ "loss": 0.0466,
+ "step": 35657
+ },
+ {
+ "epoch": 97.16076294277929,
+ "grad_norm": 2.5090365409851074,
+ "learning_rate": 4.224969129040246e-08,
+ "loss": 0.0704,
+ "step": 35658
+ },
+ {
+ "epoch": 97.16348773841962,
+ "grad_norm": 1.8353524208068848,
+ "learning_rate": 4.2168693759658815e-08,
+ "loss": 0.0668,
+ "step": 35659
+ },
+ {
+ "epoch": 97.16621253405995,
+ "grad_norm": 4.932413578033447,
+ "learning_rate": 4.208777378018392e-08,
+ "loss": 0.0461,
+ "step": 35660
+ },
+ {
+ "epoch": 97.16893732970027,
+ "grad_norm": 3.0826075077056885,
+ "learning_rate": 4.200693135260836e-08,
+ "loss": 0.0729,
+ "step": 35661
+ },
+ {
+ "epoch": 97.1716621253406,
+ "grad_norm": 2.846266269683838,
+ "learning_rate": 4.192616647756387e-08,
+ "loss": 0.06,
+ "step": 35662
+ },
+ {
+ "epoch": 97.17438692098092,
+ "grad_norm": 1.3967534303665161,
+ "learning_rate": 4.184547915567661e-08,
+ "loss": 0.0163,
+ "step": 35663
+ },
+ {
+ "epoch": 97.17711171662125,
+ "grad_norm": 2.4666824340820312,
+ "learning_rate": 4.1764869387577175e-08,
+ "loss": 0.0367,
+ "step": 35664
+ },
+ {
+ "epoch": 97.17983651226157,
+ "grad_norm": 2.026526927947998,
+ "learning_rate": 4.168433717389286e-08,
+ "loss": 0.0255,
+ "step": 35665
+ },
+ {
+ "epoch": 97.1825613079019,
+ "grad_norm": 4.576807498931885,
+ "learning_rate": 4.1603882515248714e-08,
+ "loss": 0.0392,
+ "step": 35666
+ },
+ {
+ "epoch": 97.18528610354224,
+ "grad_norm": 5.354944229125977,
+ "learning_rate": 4.1523505412274235e-08,
+ "loss": 0.0359,
+ "step": 35667
+ },
+ {
+ "epoch": 97.18801089918256,
+ "grad_norm": 4.240804195404053,
+ "learning_rate": 4.144320586559447e-08,
+ "loss": 0.0708,
+ "step": 35668
+ },
+ {
+ "epoch": 97.19073569482289,
+ "grad_norm": 1.174184799194336,
+ "learning_rate": 4.1362983875833373e-08,
+ "loss": 0.0165,
+ "step": 35669
+ },
+ {
+ "epoch": 97.19346049046321,
+ "grad_norm": 2.881422758102417,
+ "learning_rate": 4.1282839443617106e-08,
+ "loss": 0.1455,
+ "step": 35670
+ },
+ {
+ "epoch": 97.19618528610354,
+ "grad_norm": 2.0956594944000244,
+ "learning_rate": 4.1202772569570724e-08,
+ "loss": 0.0755,
+ "step": 35671
+ },
+ {
+ "epoch": 97.19891008174388,
+ "grad_norm": 5.350720405578613,
+ "learning_rate": 4.1122783254315955e-08,
+ "loss": 0.0434,
+ "step": 35672
+ },
+ {
+ "epoch": 97.2016348773842,
+ "grad_norm": 2.869659185409546,
+ "learning_rate": 4.1042871498476746e-08,
+ "loss": 0.0341,
+ "step": 35673
+ },
+ {
+ "epoch": 97.20435967302453,
+ "grad_norm": 2.8423678874969482,
+ "learning_rate": 4.09630373026737e-08,
+ "loss": 0.0985,
+ "step": 35674
+ },
+ {
+ "epoch": 97.20708446866485,
+ "grad_norm": 1.7651212215423584,
+ "learning_rate": 4.088328066753078e-08,
+ "loss": 0.1022,
+ "step": 35675
+ },
+ {
+ "epoch": 97.20980926430518,
+ "grad_norm": 2.8172552585601807,
+ "learning_rate": 4.0803601593668586e-08,
+ "loss": 0.0491,
+ "step": 35676
+ },
+ {
+ "epoch": 97.2125340599455,
+ "grad_norm": 2.1117210388183594,
+ "learning_rate": 4.072400008170774e-08,
+ "loss": 0.0731,
+ "step": 35677
+ },
+ {
+ "epoch": 97.21525885558583,
+ "grad_norm": 5.589637756347656,
+ "learning_rate": 4.064447613226774e-08,
+ "loss": 0.0485,
+ "step": 35678
+ },
+ {
+ "epoch": 97.21798365122616,
+ "grad_norm": 1.5005141496658325,
+ "learning_rate": 4.0565029745966987e-08,
+ "loss": 0.0166,
+ "step": 35679
+ },
+ {
+ "epoch": 97.22070844686648,
+ "grad_norm": 1.5149348974227905,
+ "learning_rate": 4.0485660923426095e-08,
+ "loss": 0.0207,
+ "step": 35680
+ },
+ {
+ "epoch": 97.22343324250681,
+ "grad_norm": 2.9435641765594482,
+ "learning_rate": 4.0406369665262343e-08,
+ "loss": 0.0499,
+ "step": 35681
+ },
+ {
+ "epoch": 97.22615803814713,
+ "grad_norm": 2.9011828899383545,
+ "learning_rate": 4.032715597209302e-08,
+ "loss": 0.0581,
+ "step": 35682
+ },
+ {
+ "epoch": 97.22888283378747,
+ "grad_norm": 3.445481300354004,
+ "learning_rate": 4.024801984453541e-08,
+ "loss": 0.0699,
+ "step": 35683
+ },
+ {
+ "epoch": 97.2316076294278,
+ "grad_norm": 1.88826584815979,
+ "learning_rate": 4.016896128320569e-08,
+ "loss": 0.0194,
+ "step": 35684
+ },
+ {
+ "epoch": 97.23433242506812,
+ "grad_norm": 2.2753238677978516,
+ "learning_rate": 4.008998028872002e-08,
+ "loss": 0.0678,
+ "step": 35685
+ },
+ {
+ "epoch": 97.23705722070845,
+ "grad_norm": 2.4716103076934814,
+ "learning_rate": 4.0011076861691254e-08,
+ "loss": 0.0948,
+ "step": 35686
+ },
+ {
+ "epoch": 97.23978201634877,
+ "grad_norm": 4.816853046417236,
+ "learning_rate": 3.993225100273779e-08,
+ "loss": 0.1862,
+ "step": 35687
+ },
+ {
+ "epoch": 97.2425068119891,
+ "grad_norm": 2.6293253898620605,
+ "learning_rate": 3.985350271247024e-08,
+ "loss": 0.0963,
+ "step": 35688
+ },
+ {
+ "epoch": 97.24523160762942,
+ "grad_norm": 2.2298426628112793,
+ "learning_rate": 3.9774831991503674e-08,
+ "loss": 0.0421,
+ "step": 35689
+ },
+ {
+ "epoch": 97.24795640326975,
+ "grad_norm": 2.217453956604004,
+ "learning_rate": 3.9696238840448705e-08,
+ "loss": 0.0459,
+ "step": 35690
+ },
+ {
+ "epoch": 97.25068119891009,
+ "grad_norm": 2.6928329467773438,
+ "learning_rate": 3.9617723259920417e-08,
+ "loss": 0.0229,
+ "step": 35691
+ },
+ {
+ "epoch": 97.2534059945504,
+ "grad_norm": 2.535069704055786,
+ "learning_rate": 3.95392852505283e-08,
+ "loss": 0.0789,
+ "step": 35692
+ },
+ {
+ "epoch": 97.25613079019074,
+ "grad_norm": 3.881356716156006,
+ "learning_rate": 3.9460924812884107e-08,
+ "loss": 0.0964,
+ "step": 35693
+ },
+ {
+ "epoch": 97.25885558583106,
+ "grad_norm": 2.926912307739258,
+ "learning_rate": 3.938264194759622e-08,
+ "loss": 0.1163,
+ "step": 35694
+ },
+ {
+ "epoch": 97.26158038147139,
+ "grad_norm": 3.2584853172302246,
+ "learning_rate": 3.9304436655276393e-08,
+ "loss": 0.0648,
+ "step": 35695
+ },
+ {
+ "epoch": 97.26430517711172,
+ "grad_norm": 1.52204430103302,
+ "learning_rate": 3.922630893653301e-08,
+ "loss": 0.0248,
+ "step": 35696
+ },
+ {
+ "epoch": 97.26702997275204,
+ "grad_norm": 2.9916036128997803,
+ "learning_rate": 3.914825879197559e-08,
+ "loss": 0.1678,
+ "step": 35697
+ },
+ {
+ "epoch": 97.26975476839237,
+ "grad_norm": 2.6528549194335938,
+ "learning_rate": 3.9070286222210316e-08,
+ "loss": 0.068,
+ "step": 35698
+ },
+ {
+ "epoch": 97.2724795640327,
+ "grad_norm": 2.157846689224243,
+ "learning_rate": 3.899239122784448e-08,
+ "loss": 0.0598,
+ "step": 35699
+ },
+ {
+ "epoch": 97.27520435967303,
+ "grad_norm": 2.51202654838562,
+ "learning_rate": 3.891457380948538e-08,
+ "loss": 0.0414,
+ "step": 35700
+ },
+ {
+ "epoch": 97.27792915531334,
+ "grad_norm": 2.394866943359375,
+ "learning_rate": 3.883683396773919e-08,
+ "loss": 0.0283,
+ "step": 35701
+ },
+ {
+ "epoch": 97.28065395095368,
+ "grad_norm": 3.044130325317383,
+ "learning_rate": 3.875917170321208e-08,
+ "loss": 0.1344,
+ "step": 35702
+ },
+ {
+ "epoch": 97.28337874659401,
+ "grad_norm": 3.3202123641967773,
+ "learning_rate": 3.8681587016506924e-08,
+ "loss": 0.0472,
+ "step": 35703
+ },
+ {
+ "epoch": 97.28610354223433,
+ "grad_norm": 2.31563401222229,
+ "learning_rate": 3.860407990822879e-08,
+ "loss": 0.0421,
+ "step": 35704
+ },
+ {
+ "epoch": 97.28882833787466,
+ "grad_norm": 2.1818692684173584,
+ "learning_rate": 3.8526650378982736e-08,
+ "loss": 0.0593,
+ "step": 35705
+ },
+ {
+ "epoch": 97.29155313351498,
+ "grad_norm": 5.058921813964844,
+ "learning_rate": 3.8449298429369397e-08,
+ "loss": 0.0681,
+ "step": 35706
+ },
+ {
+ "epoch": 97.29427792915531,
+ "grad_norm": 1.8164100646972656,
+ "learning_rate": 3.8372024059991633e-08,
+ "loss": 0.0241,
+ "step": 35707
+ },
+ {
+ "epoch": 97.29700272479565,
+ "grad_norm": 2.463520050048828,
+ "learning_rate": 3.8294827271453394e-08,
+ "loss": 0.0571,
+ "step": 35708
+ },
+ {
+ "epoch": 97.29972752043597,
+ "grad_norm": 3.147904634475708,
+ "learning_rate": 3.8217708064354206e-08,
+ "loss": 0.0868,
+ "step": 35709
+ },
+ {
+ "epoch": 97.3024523160763,
+ "grad_norm": 3.002943515777588,
+ "learning_rate": 3.81406664392936e-08,
+ "loss": 0.0569,
+ "step": 35710
+ },
+ {
+ "epoch": 97.30517711171662,
+ "grad_norm": 1.6419553756713867,
+ "learning_rate": 3.80637023968744e-08,
+ "loss": 0.0228,
+ "step": 35711
+ },
+ {
+ "epoch": 97.30790190735695,
+ "grad_norm": 2.226773738861084,
+ "learning_rate": 3.798681593769393e-08,
+ "loss": 0.0746,
+ "step": 35712
+ },
+ {
+ "epoch": 97.31062670299727,
+ "grad_norm": 4.040128707885742,
+ "learning_rate": 3.791000706235171e-08,
+ "loss": 0.0671,
+ "step": 35713
+ },
+ {
+ "epoch": 97.3133514986376,
+ "grad_norm": 2.2122244834899902,
+ "learning_rate": 3.783327577144502e-08,
+ "loss": 0.0241,
+ "step": 35714
+ },
+ {
+ "epoch": 97.31607629427793,
+ "grad_norm": 1.792174220085144,
+ "learning_rate": 3.775662206557229e-08,
+ "loss": 0.0505,
+ "step": 35715
+ },
+ {
+ "epoch": 97.31880108991825,
+ "grad_norm": 2.6207172870635986,
+ "learning_rate": 3.768004594533081e-08,
+ "loss": 0.027,
+ "step": 35716
+ },
+ {
+ "epoch": 97.32152588555859,
+ "grad_norm": 2.3851215839385986,
+ "learning_rate": 3.760354741131678e-08,
+ "loss": 0.0258,
+ "step": 35717
+ },
+ {
+ "epoch": 97.3242506811989,
+ "grad_norm": 2.7815468311309814,
+ "learning_rate": 3.752712646412526e-08,
+ "loss": 0.1268,
+ "step": 35718
+ },
+ {
+ "epoch": 97.32697547683924,
+ "grad_norm": 2.303602933883667,
+ "learning_rate": 3.745078310435135e-08,
+ "loss": 0.0569,
+ "step": 35719
+ },
+ {
+ "epoch": 97.32970027247957,
+ "grad_norm": 2.026928663253784,
+ "learning_rate": 3.737451733259123e-08,
+ "loss": 0.0544,
+ "step": 35720
+ },
+ {
+ "epoch": 97.33242506811989,
+ "grad_norm": 2.396444797515869,
+ "learning_rate": 3.729832914943665e-08,
+ "loss": 0.1104,
+ "step": 35721
+ },
+ {
+ "epoch": 97.33514986376022,
+ "grad_norm": 2.3454558849334717,
+ "learning_rate": 3.722221855548269e-08,
+ "loss": 0.0254,
+ "step": 35722
+ },
+ {
+ "epoch": 97.33787465940054,
+ "grad_norm": 2.012298822402954,
+ "learning_rate": 3.71461855513211e-08,
+ "loss": 0.0865,
+ "step": 35723
+ },
+ {
+ "epoch": 97.34059945504087,
+ "grad_norm": 2.7653141021728516,
+ "learning_rate": 3.707023013754474e-08,
+ "loss": 0.0291,
+ "step": 35724
+ },
+ {
+ "epoch": 97.34332425068119,
+ "grad_norm": 2.1480188369750977,
+ "learning_rate": 3.699435231474424e-08,
+ "loss": 0.0236,
+ "step": 35725
+ },
+ {
+ "epoch": 97.34604904632153,
+ "grad_norm": 2.642390251159668,
+ "learning_rate": 3.691855208351136e-08,
+ "loss": 0.135,
+ "step": 35726
+ },
+ {
+ "epoch": 97.34877384196186,
+ "grad_norm": 2.243866205215454,
+ "learning_rate": 3.6842829444436734e-08,
+ "loss": 0.0227,
+ "step": 35727
+ },
+ {
+ "epoch": 97.35149863760218,
+ "grad_norm": 2.7783806324005127,
+ "learning_rate": 3.676718439810767e-08,
+ "loss": 0.0499,
+ "step": 35728
+ },
+ {
+ "epoch": 97.35422343324251,
+ "grad_norm": 2.030147075653076,
+ "learning_rate": 3.6691616945117025e-08,
+ "loss": 0.0541,
+ "step": 35729
+ },
+ {
+ "epoch": 97.35694822888283,
+ "grad_norm": 2.5146689414978027,
+ "learning_rate": 3.6616127086051e-08,
+ "loss": 0.0337,
+ "step": 35730
+ },
+ {
+ "epoch": 97.35967302452316,
+ "grad_norm": 4.058608055114746,
+ "learning_rate": 3.65407148214969e-08,
+ "loss": 0.0359,
+ "step": 35731
+ },
+ {
+ "epoch": 97.3623978201635,
+ "grad_norm": 2.2269248962402344,
+ "learning_rate": 3.646538015204426e-08,
+ "loss": 0.0251,
+ "step": 35732
+ },
+ {
+ "epoch": 97.36512261580381,
+ "grad_norm": 3.1376373767852783,
+ "learning_rate": 3.639012307827816e-08,
+ "loss": 0.1518,
+ "step": 35733
+ },
+ {
+ "epoch": 97.36784741144415,
+ "grad_norm": 2.2508909702301025,
+ "learning_rate": 3.63149436007848e-08,
+ "loss": 0.1153,
+ "step": 35734
+ },
+ {
+ "epoch": 97.37057220708446,
+ "grad_norm": 3.2898099422454834,
+ "learning_rate": 3.623984172015038e-08,
+ "loss": 0.0883,
+ "step": 35735
+ },
+ {
+ "epoch": 97.3732970027248,
+ "grad_norm": 2.400824546813965,
+ "learning_rate": 3.616481743695888e-08,
+ "loss": 0.0312,
+ "step": 35736
+ },
+ {
+ "epoch": 97.37602179836512,
+ "grad_norm": 6.968176364898682,
+ "learning_rate": 3.6089870751795374e-08,
+ "loss": 0.0395,
+ "step": 35737
+ },
+ {
+ "epoch": 97.37874659400545,
+ "grad_norm": 3.3455638885498047,
+ "learning_rate": 3.6015001665243853e-08,
+ "loss": 0.1089,
+ "step": 35738
+ },
+ {
+ "epoch": 97.38147138964578,
+ "grad_norm": 1.6406556367874146,
+ "learning_rate": 3.594021017788607e-08,
+ "loss": 0.0189,
+ "step": 35739
+ },
+ {
+ "epoch": 97.3841961852861,
+ "grad_norm": 1.971541404724121,
+ "learning_rate": 3.586549629030489e-08,
+ "loss": 0.0838,
+ "step": 35740
+ },
+ {
+ "epoch": 97.38692098092643,
+ "grad_norm": 2.65551495552063,
+ "learning_rate": 3.579086000308318e-08,
+ "loss": 0.0356,
+ "step": 35741
+ },
+ {
+ "epoch": 97.38964577656675,
+ "grad_norm": 4.395047664642334,
+ "learning_rate": 3.571630131680159e-08,
+ "loss": 0.0538,
+ "step": 35742
+ },
+ {
+ "epoch": 97.39237057220708,
+ "grad_norm": 2.4963653087615967,
+ "learning_rate": 3.564182023204077e-08,
+ "loss": 0.0576,
+ "step": 35743
+ },
+ {
+ "epoch": 97.39509536784742,
+ "grad_norm": 2.5708718299865723,
+ "learning_rate": 3.556741674938024e-08,
+ "loss": 0.0657,
+ "step": 35744
+ },
+ {
+ "epoch": 97.39782016348774,
+ "grad_norm": 1.9411816596984863,
+ "learning_rate": 3.549309086940067e-08,
+ "loss": 0.0205,
+ "step": 35745
+ },
+ {
+ "epoch": 97.40054495912807,
+ "grad_norm": 1.9105851650238037,
+ "learning_rate": 3.541884259267936e-08,
+ "loss": 0.0222,
+ "step": 35746
+ },
+ {
+ "epoch": 97.40326975476839,
+ "grad_norm": 2.73858380317688,
+ "learning_rate": 3.5344671919795844e-08,
+ "loss": 0.0624,
+ "step": 35747
+ },
+ {
+ "epoch": 97.40599455040872,
+ "grad_norm": 2.018718957901001,
+ "learning_rate": 3.5270578851327454e-08,
+ "loss": 0.0198,
+ "step": 35748
+ },
+ {
+ "epoch": 97.40871934604904,
+ "grad_norm": 1.703837275505066,
+ "learning_rate": 3.519656338785038e-08,
+ "loss": 0.0571,
+ "step": 35749
+ },
+ {
+ "epoch": 97.41144414168937,
+ "grad_norm": 2.6347010135650635,
+ "learning_rate": 3.512262552994305e-08,
+ "loss": 0.0382,
+ "step": 35750
+ },
+ {
+ "epoch": 97.4141689373297,
+ "grad_norm": 1.892220377922058,
+ "learning_rate": 3.504876527817946e-08,
+ "loss": 0.0325,
+ "step": 35751
+ },
+ {
+ "epoch": 97.41689373297002,
+ "grad_norm": 2.6764485836029053,
+ "learning_rate": 3.49749826331347e-08,
+ "loss": 0.1365,
+ "step": 35752
+ },
+ {
+ "epoch": 97.41961852861036,
+ "grad_norm": 2.0000882148742676,
+ "learning_rate": 3.490127759538497e-08,
+ "loss": 0.0597,
+ "step": 35753
+ },
+ {
+ "epoch": 97.42234332425068,
+ "grad_norm": 4.685260772705078,
+ "learning_rate": 3.482765016550316e-08,
+ "loss": 0.083,
+ "step": 35754
+ },
+ {
+ "epoch": 97.42506811989101,
+ "grad_norm": 1.8418105840682983,
+ "learning_rate": 3.475410034406212e-08,
+ "loss": 0.023,
+ "step": 35755
+ },
+ {
+ "epoch": 97.42779291553134,
+ "grad_norm": 1.4824579954147339,
+ "learning_rate": 3.468062813163586e-08,
+ "loss": 0.0142,
+ "step": 35756
+ },
+ {
+ "epoch": 97.43051771117166,
+ "grad_norm": 2.7751262187957764,
+ "learning_rate": 3.4607233528796136e-08,
+ "loss": 0.0158,
+ "step": 35757
+ },
+ {
+ "epoch": 97.433242506812,
+ "grad_norm": 4.138879776000977,
+ "learning_rate": 3.453391653611471e-08,
+ "loss": 0.1413,
+ "step": 35758
+ },
+ {
+ "epoch": 97.43596730245231,
+ "grad_norm": 2.429327964782715,
+ "learning_rate": 3.446067715416224e-08,
+ "loss": 0.0659,
+ "step": 35759
+ },
+ {
+ "epoch": 97.43869209809264,
+ "grad_norm": 2.288085699081421,
+ "learning_rate": 3.438751538350937e-08,
+ "loss": 0.0298,
+ "step": 35760
+ },
+ {
+ "epoch": 97.44141689373296,
+ "grad_norm": 3.082080602645874,
+ "learning_rate": 3.431443122472566e-08,
+ "loss": 0.0767,
+ "step": 35761
+ },
+ {
+ "epoch": 97.4441416893733,
+ "grad_norm": 1.9701496362686157,
+ "learning_rate": 3.424142467838065e-08,
+ "loss": 0.1448,
+ "step": 35762
+ },
+ {
+ "epoch": 97.44686648501363,
+ "grad_norm": 2.3054821491241455,
+ "learning_rate": 3.4168495745042776e-08,
+ "loss": 0.0486,
+ "step": 35763
+ },
+ {
+ "epoch": 97.44959128065395,
+ "grad_norm": 2.489908456802368,
+ "learning_rate": 3.409564442527935e-08,
+ "loss": 0.0973,
+ "step": 35764
+ },
+ {
+ "epoch": 97.45231607629428,
+ "grad_norm": 2.0973353385925293,
+ "learning_rate": 3.402287071965882e-08,
+ "loss": 0.0333,
+ "step": 35765
+ },
+ {
+ "epoch": 97.4550408719346,
+ "grad_norm": 2.7435762882232666,
+ "learning_rate": 3.395017462874739e-08,
+ "loss": 0.0508,
+ "step": 35766
+ },
+ {
+ "epoch": 97.45776566757493,
+ "grad_norm": 2.5076231956481934,
+ "learning_rate": 3.387755615311128e-08,
+ "loss": 0.0292,
+ "step": 35767
+ },
+ {
+ "epoch": 97.46049046321527,
+ "grad_norm": 2.5052192211151123,
+ "learning_rate": 3.380501529331559e-08,
+ "loss": 0.0485,
+ "step": 35768
+ },
+ {
+ "epoch": 97.46321525885558,
+ "grad_norm": 7.725629806518555,
+ "learning_rate": 3.3732552049925423e-08,
+ "loss": 0.1641,
+ "step": 35769
+ },
+ {
+ "epoch": 97.46594005449592,
+ "grad_norm": 3.0218212604522705,
+ "learning_rate": 3.366016642350589e-08,
+ "loss": 0.0307,
+ "step": 35770
+ },
+ {
+ "epoch": 97.46866485013624,
+ "grad_norm": 2.0976974964141846,
+ "learning_rate": 3.358785841462098e-08,
+ "loss": 0.0806,
+ "step": 35771
+ },
+ {
+ "epoch": 97.47138964577657,
+ "grad_norm": 7.243982315063477,
+ "learning_rate": 3.3515628023831346e-08,
+ "loss": 0.041,
+ "step": 35772
+ },
+ {
+ "epoch": 97.47411444141689,
+ "grad_norm": 1.8728142976760864,
+ "learning_rate": 3.344347525170322e-08,
+ "loss": 0.1892,
+ "step": 35773
+ },
+ {
+ "epoch": 97.47683923705722,
+ "grad_norm": 2.4406001567840576,
+ "learning_rate": 3.337140009879503e-08,
+ "loss": 0.0193,
+ "step": 35774
+ },
+ {
+ "epoch": 97.47956403269755,
+ "grad_norm": 2.5310189723968506,
+ "learning_rate": 3.329940256566966e-08,
+ "loss": 0.0227,
+ "step": 35775
+ },
+ {
+ "epoch": 97.48228882833787,
+ "grad_norm": 3.100160598754883,
+ "learning_rate": 3.3227482652888885e-08,
+ "loss": 0.0585,
+ "step": 35776
+ },
+ {
+ "epoch": 97.4850136239782,
+ "grad_norm": 2.3535513877868652,
+ "learning_rate": 3.315564036101115e-08,
+ "loss": 0.0286,
+ "step": 35777
+ },
+ {
+ "epoch": 97.48773841961852,
+ "grad_norm": 2.1238162517547607,
+ "learning_rate": 3.308387569059601e-08,
+ "loss": 0.1461,
+ "step": 35778
+ },
+ {
+ "epoch": 97.49046321525886,
+ "grad_norm": 2.19785475730896,
+ "learning_rate": 3.3012188642203015e-08,
+ "loss": 0.031,
+ "step": 35779
+ },
+ {
+ "epoch": 97.49318801089919,
+ "grad_norm": 5.525651454925537,
+ "learning_rate": 3.29405792163906e-08,
+ "loss": 0.0845,
+ "step": 35780
+ },
+ {
+ "epoch": 97.49591280653951,
+ "grad_norm": 3.4149084091186523,
+ "learning_rate": 3.2869047413716104e-08,
+ "loss": 0.0955,
+ "step": 35781
+ },
+ {
+ "epoch": 97.49863760217984,
+ "grad_norm": 3.5434200763702393,
+ "learning_rate": 3.2797593234735745e-08,
+ "loss": 0.035,
+ "step": 35782
+ },
+ {
+ "epoch": 97.50136239782016,
+ "grad_norm": 4.449948310852051,
+ "learning_rate": 3.272621668000797e-08,
+ "loss": 0.0667,
+ "step": 35783
+ },
+ {
+ "epoch": 97.50408719346049,
+ "grad_norm": 2.3025572299957275,
+ "learning_rate": 3.265491775008789e-08,
+ "loss": 0.0849,
+ "step": 35784
+ },
+ {
+ "epoch": 97.50681198910081,
+ "grad_norm": 2.930227041244507,
+ "learning_rate": 3.25836964455295e-08,
+ "loss": 0.1944,
+ "step": 35785
+ },
+ {
+ "epoch": 97.50953678474114,
+ "grad_norm": 2.109895706176758,
+ "learning_rate": 3.251255276688903e-08,
+ "loss": 0.024,
+ "step": 35786
+ },
+ {
+ "epoch": 97.51226158038148,
+ "grad_norm": 2.6566219329833984,
+ "learning_rate": 3.2441486714720474e-08,
+ "loss": 0.2145,
+ "step": 35787
+ },
+ {
+ "epoch": 97.5149863760218,
+ "grad_norm": 4.1831512451171875,
+ "learning_rate": 3.2370498289576727e-08,
+ "loss": 0.0332,
+ "step": 35788
+ },
+ {
+ "epoch": 97.51771117166213,
+ "grad_norm": 1.8247441053390503,
+ "learning_rate": 3.2299587492009565e-08,
+ "loss": 0.0231,
+ "step": 35789
+ },
+ {
+ "epoch": 97.52043596730245,
+ "grad_norm": 2.600660800933838,
+ "learning_rate": 3.2228754322574106e-08,
+ "loss": 0.08,
+ "step": 35790
+ },
+ {
+ "epoch": 97.52316076294278,
+ "grad_norm": 1.1747342348098755,
+ "learning_rate": 3.21579987818188e-08,
+ "loss": 0.0146,
+ "step": 35791
+ },
+ {
+ "epoch": 97.52588555858311,
+ "grad_norm": 1.9240552186965942,
+ "learning_rate": 3.208732087029653e-08,
+ "loss": 0.0535,
+ "step": 35792
+ },
+ {
+ "epoch": 97.52861035422343,
+ "grad_norm": 1.777369737625122,
+ "learning_rate": 3.201672058855798e-08,
+ "loss": 0.0808,
+ "step": 35793
+ },
+ {
+ "epoch": 97.53133514986376,
+ "grad_norm": 1.862227201461792,
+ "learning_rate": 3.19461979371527e-08,
+ "loss": 0.0446,
+ "step": 35794
+ },
+ {
+ "epoch": 97.53405994550408,
+ "grad_norm": 1.7047882080078125,
+ "learning_rate": 3.1875752916628034e-08,
+ "loss": 0.0421,
+ "step": 35795
+ },
+ {
+ "epoch": 97.53678474114442,
+ "grad_norm": 2.558957576751709,
+ "learning_rate": 3.180538552753576e-08,
+ "loss": 0.1248,
+ "step": 35796
+ },
+ {
+ "epoch": 97.53950953678473,
+ "grad_norm": 1.5976080894470215,
+ "learning_rate": 3.1735095770421e-08,
+ "loss": 0.0167,
+ "step": 35797
+ },
+ {
+ "epoch": 97.54223433242507,
+ "grad_norm": 2.2887840270996094,
+ "learning_rate": 3.166488364583331e-08,
+ "loss": 0.055,
+ "step": 35798
+ },
+ {
+ "epoch": 97.5449591280654,
+ "grad_norm": 2.419386863708496,
+ "learning_rate": 3.159474915431893e-08,
+ "loss": 0.0276,
+ "step": 35799
+ },
+ {
+ "epoch": 97.54768392370572,
+ "grad_norm": 2.284625768661499,
+ "learning_rate": 3.1524692296422966e-08,
+ "loss": 0.0894,
+ "step": 35800
+ },
+ {
+ "epoch": 97.55040871934605,
+ "grad_norm": 2.5056934356689453,
+ "learning_rate": 3.145471307269277e-08,
+ "loss": 0.1508,
+ "step": 35801
+ },
+ {
+ "epoch": 97.55313351498637,
+ "grad_norm": 2.7053492069244385,
+ "learning_rate": 3.138481148367123e-08,
+ "loss": 0.0803,
+ "step": 35802
+ },
+ {
+ "epoch": 97.5558583106267,
+ "grad_norm": 2.577946662902832,
+ "learning_rate": 3.1314987529905696e-08,
+ "loss": 0.0287,
+ "step": 35803
+ },
+ {
+ "epoch": 97.55858310626704,
+ "grad_norm": 4.119221210479736,
+ "learning_rate": 3.124524121193684e-08,
+ "loss": 0.1726,
+ "step": 35804
+ },
+ {
+ "epoch": 97.56130790190736,
+ "grad_norm": 2.4762916564941406,
+ "learning_rate": 3.117557253030978e-08,
+ "loss": 0.277,
+ "step": 35805
+ },
+ {
+ "epoch": 97.56403269754769,
+ "grad_norm": 2.0731794834136963,
+ "learning_rate": 3.1105981485566314e-08,
+ "loss": 0.0502,
+ "step": 35806
+ },
+ {
+ "epoch": 97.566757493188,
+ "grad_norm": 5.1868109703063965,
+ "learning_rate": 3.1036468078248226e-08,
+ "loss": 0.0834,
+ "step": 35807
+ },
+ {
+ "epoch": 97.56948228882834,
+ "grad_norm": 10.438080787658691,
+ "learning_rate": 3.0967032308897304e-08,
+ "loss": 0.0165,
+ "step": 35808
+ },
+ {
+ "epoch": 97.57220708446866,
+ "grad_norm": 2.423152446746826,
+ "learning_rate": 3.089767417805534e-08,
+ "loss": 0.0232,
+ "step": 35809
+ },
+ {
+ "epoch": 97.57493188010899,
+ "grad_norm": 2.390340805053711,
+ "learning_rate": 3.082839368626078e-08,
+ "loss": 0.147,
+ "step": 35810
+ },
+ {
+ "epoch": 97.57765667574932,
+ "grad_norm": 2.715242624282837,
+ "learning_rate": 3.075919083405321e-08,
+ "loss": 0.0534,
+ "step": 35811
+ },
+ {
+ "epoch": 97.58038147138964,
+ "grad_norm": 2.4230451583862305,
+ "learning_rate": 3.06900656219733e-08,
+ "loss": 0.0555,
+ "step": 35812
+ },
+ {
+ "epoch": 97.58310626702998,
+ "grad_norm": 2.556752920150757,
+ "learning_rate": 3.0621018050557285e-08,
+ "loss": 0.0471,
+ "step": 35813
+ },
+ {
+ "epoch": 97.5858310626703,
+ "grad_norm": 2.55846905708313,
+ "learning_rate": 3.0552048120343625e-08,
+ "loss": 0.0276,
+ "step": 35814
+ },
+ {
+ "epoch": 97.58855585831063,
+ "grad_norm": 2.751675605773926,
+ "learning_rate": 3.048315583187078e-08,
+ "loss": 0.0822,
+ "step": 35815
+ },
+ {
+ "epoch": 97.59128065395096,
+ "grad_norm": 2.4820244312286377,
+ "learning_rate": 3.041434118567388e-08,
+ "loss": 0.0377,
+ "step": 35816
+ },
+ {
+ "epoch": 97.59400544959128,
+ "grad_norm": 1.261082649230957,
+ "learning_rate": 3.034560418228916e-08,
+ "loss": 0.0173,
+ "step": 35817
+ },
+ {
+ "epoch": 97.59673024523161,
+ "grad_norm": 3.7353408336639404,
+ "learning_rate": 3.027694482225285e-08,
+ "loss": 0.1013,
+ "step": 35818
+ },
+ {
+ "epoch": 97.59945504087193,
+ "grad_norm": 2.633507251739502,
+ "learning_rate": 3.020836310609787e-08,
+ "loss": 0.0305,
+ "step": 35819
+ },
+ {
+ "epoch": 97.60217983651226,
+ "grad_norm": 2.2586116790771484,
+ "learning_rate": 3.0139859034359344e-08,
+ "loss": 0.0249,
+ "step": 35820
+ },
+ {
+ "epoch": 97.60490463215258,
+ "grad_norm": 2.453795909881592,
+ "learning_rate": 3.0071432607571284e-08,
+ "loss": 0.0449,
+ "step": 35821
+ },
+ {
+ "epoch": 97.60762942779292,
+ "grad_norm": 1.8358465433120728,
+ "learning_rate": 3.000308382626549e-08,
+ "loss": 0.0244,
+ "step": 35822
+ },
+ {
+ "epoch": 97.61035422343325,
+ "grad_norm": 2.564528703689575,
+ "learning_rate": 2.9934812690974865e-08,
+ "loss": 0.0816,
+ "step": 35823
+ },
+ {
+ "epoch": 97.61307901907357,
+ "grad_norm": 2.7338919639587402,
+ "learning_rate": 2.986661920223122e-08,
+ "loss": 0.0786,
+ "step": 35824
+ },
+ {
+ "epoch": 97.6158038147139,
+ "grad_norm": 3.4388840198516846,
+ "learning_rate": 2.9798503360565225e-08,
+ "loss": 0.1104,
+ "step": 35825
+ },
+ {
+ "epoch": 97.61852861035422,
+ "grad_norm": 3.998267412185669,
+ "learning_rate": 2.9730465166508683e-08,
+ "loss": 0.1049,
+ "step": 35826
+ },
+ {
+ "epoch": 97.62125340599455,
+ "grad_norm": 2.5960872173309326,
+ "learning_rate": 2.966250462058895e-08,
+ "loss": 0.0555,
+ "step": 35827
+ },
+ {
+ "epoch": 97.62397820163488,
+ "grad_norm": 3.861147880554199,
+ "learning_rate": 2.9594621723336715e-08,
+ "loss": 0.1128,
+ "step": 35828
+ },
+ {
+ "epoch": 97.6267029972752,
+ "grad_norm": 2.300067663192749,
+ "learning_rate": 2.952681647528155e-08,
+ "loss": 0.0264,
+ "step": 35829
+ },
+ {
+ "epoch": 97.62942779291554,
+ "grad_norm": 2.9510819911956787,
+ "learning_rate": 2.9459088876950814e-08,
+ "loss": 0.0454,
+ "step": 35830
+ },
+ {
+ "epoch": 97.63215258855585,
+ "grad_norm": 2.6466665267944336,
+ "learning_rate": 2.939143892887075e-08,
+ "loss": 0.0342,
+ "step": 35831
+ },
+ {
+ "epoch": 97.63487738419619,
+ "grad_norm": 2.8660361766815186,
+ "learning_rate": 2.932386663156983e-08,
+ "loss": 0.0273,
+ "step": 35832
+ },
+ {
+ "epoch": 97.6376021798365,
+ "grad_norm": 2.7252252101898193,
+ "learning_rate": 2.9256371985573183e-08,
+ "loss": 0.0471,
+ "step": 35833
+ },
+ {
+ "epoch": 97.64032697547684,
+ "grad_norm": 1.7736456394195557,
+ "learning_rate": 2.918895499140817e-08,
+ "loss": 0.025,
+ "step": 35834
+ },
+ {
+ "epoch": 97.64305177111717,
+ "grad_norm": 3.138150691986084,
+ "learning_rate": 2.91216156495977e-08,
+ "loss": 0.0954,
+ "step": 35835
+ },
+ {
+ "epoch": 97.64577656675749,
+ "grad_norm": 2.4309849739074707,
+ "learning_rate": 2.9054353960666914e-08,
+ "loss": 0.038,
+ "step": 35836
+ },
+ {
+ "epoch": 97.64850136239782,
+ "grad_norm": 2.0006468296051025,
+ "learning_rate": 2.8987169925140947e-08,
+ "loss": 0.0347,
+ "step": 35837
+ },
+ {
+ "epoch": 97.65122615803814,
+ "grad_norm": 1.5603562593460083,
+ "learning_rate": 2.89200635435416e-08,
+ "loss": 0.0622,
+ "step": 35838
+ },
+ {
+ "epoch": 97.65395095367847,
+ "grad_norm": 2.112581491470337,
+ "learning_rate": 2.885303481639179e-08,
+ "loss": 0.0379,
+ "step": 35839
+ },
+ {
+ "epoch": 97.65667574931881,
+ "grad_norm": 1.983702540397644,
+ "learning_rate": 2.8786083744213322e-08,
+ "loss": 0.0239,
+ "step": 35840
+ },
+ {
+ "epoch": 97.65940054495913,
+ "grad_norm": 2.877119541168213,
+ "learning_rate": 2.8719210327528e-08,
+ "loss": 0.097,
+ "step": 35841
+ },
+ {
+ "epoch": 97.66212534059946,
+ "grad_norm": 1.8336174488067627,
+ "learning_rate": 2.8652414566857633e-08,
+ "loss": 0.0228,
+ "step": 35842
+ },
+ {
+ "epoch": 97.66485013623978,
+ "grad_norm": 1.8584233522415161,
+ "learning_rate": 2.858569646272069e-08,
+ "loss": 0.0318,
+ "step": 35843
+ },
+ {
+ "epoch": 97.66757493188011,
+ "grad_norm": 4.630131721496582,
+ "learning_rate": 2.8519056015636758e-08,
+ "loss": 0.2295,
+ "step": 35844
+ },
+ {
+ "epoch": 97.67029972752043,
+ "grad_norm": 6.461533069610596,
+ "learning_rate": 2.845249322612542e-08,
+ "loss": 0.0283,
+ "step": 35845
+ },
+ {
+ "epoch": 97.67302452316076,
+ "grad_norm": 2.585191488265991,
+ "learning_rate": 2.8386008094706264e-08,
+ "loss": 0.0307,
+ "step": 35846
+ },
+ {
+ "epoch": 97.6757493188011,
+ "grad_norm": 2.753736972808838,
+ "learning_rate": 2.8319600621895537e-08,
+ "loss": 0.0288,
+ "step": 35847
+ },
+ {
+ "epoch": 97.67847411444141,
+ "grad_norm": 1.8776227235794067,
+ "learning_rate": 2.8253270808209498e-08,
+ "loss": 0.0481,
+ "step": 35848
+ },
+ {
+ "epoch": 97.68119891008175,
+ "grad_norm": 2.0777225494384766,
+ "learning_rate": 2.818701865416773e-08,
+ "loss": 0.0196,
+ "step": 35849
+ },
+ {
+ "epoch": 97.68392370572207,
+ "grad_norm": 3.543302059173584,
+ "learning_rate": 2.8120844160283155e-08,
+ "loss": 0.0319,
+ "step": 35850
+ },
+ {
+ "epoch": 97.6866485013624,
+ "grad_norm": 2.379166841506958,
+ "learning_rate": 2.805474732707425e-08,
+ "loss": 0.0935,
+ "step": 35851
+ },
+ {
+ "epoch": 97.68937329700273,
+ "grad_norm": 1.4063812494277954,
+ "learning_rate": 2.7988728155052825e-08,
+ "loss": 0.0199,
+ "step": 35852
+ },
+ {
+ "epoch": 97.69209809264305,
+ "grad_norm": 2.5580313205718994,
+ "learning_rate": 2.7922786644734023e-08,
+ "loss": 0.0546,
+ "step": 35853
+ },
+ {
+ "epoch": 97.69482288828338,
+ "grad_norm": 4.716394424438477,
+ "learning_rate": 2.785692279663188e-08,
+ "loss": 0.0518,
+ "step": 35854
+ },
+ {
+ "epoch": 97.6975476839237,
+ "grad_norm": 12.530521392822266,
+ "learning_rate": 2.779113661125932e-08,
+ "loss": 0.0395,
+ "step": 35855
+ },
+ {
+ "epoch": 97.70027247956403,
+ "grad_norm": 2.3398494720458984,
+ "learning_rate": 2.7725428089128148e-08,
+ "loss": 0.0687,
+ "step": 35856
+ },
+ {
+ "epoch": 97.70299727520435,
+ "grad_norm": 2.703486680984497,
+ "learning_rate": 2.7659797230751295e-08,
+ "loss": 0.1221,
+ "step": 35857
+ },
+ {
+ "epoch": 97.70572207084469,
+ "grad_norm": 2.562216281890869,
+ "learning_rate": 2.759424403663835e-08,
+ "loss": 0.1106,
+ "step": 35858
+ },
+ {
+ "epoch": 97.70844686648502,
+ "grad_norm": 2.428530693054199,
+ "learning_rate": 2.752876850730002e-08,
+ "loss": 0.0369,
+ "step": 35859
+ },
+ {
+ "epoch": 97.71117166212534,
+ "grad_norm": 2.3940417766571045,
+ "learning_rate": 2.7463370643247e-08,
+ "loss": 0.0773,
+ "step": 35860
+ },
+ {
+ "epoch": 97.71389645776567,
+ "grad_norm": 3.7675716876983643,
+ "learning_rate": 2.7398050444987777e-08,
+ "loss": 0.0825,
+ "step": 35861
+ },
+ {
+ "epoch": 97.71662125340599,
+ "grad_norm": 2.7979650497436523,
+ "learning_rate": 2.7332807913033055e-08,
+ "loss": 0.1596,
+ "step": 35862
+ },
+ {
+ "epoch": 97.71934604904632,
+ "grad_norm": 3.132063150405884,
+ "learning_rate": 2.7267643047887982e-08,
+ "loss": 0.06,
+ "step": 35863
+ },
+ {
+ "epoch": 97.72207084468666,
+ "grad_norm": 3.481983184814453,
+ "learning_rate": 2.720255585006215e-08,
+ "loss": 0.0613,
+ "step": 35864
+ },
+ {
+ "epoch": 97.72479564032697,
+ "grad_norm": 2.4922659397125244,
+ "learning_rate": 2.7137546320061824e-08,
+ "loss": 0.0716,
+ "step": 35865
+ },
+ {
+ "epoch": 97.7275204359673,
+ "grad_norm": 4.750972270965576,
+ "learning_rate": 2.7072614458393263e-08,
+ "loss": 0.0408,
+ "step": 35866
+ },
+ {
+ "epoch": 97.73024523160763,
+ "grad_norm": 2.241948127746582,
+ "learning_rate": 2.7007760265561623e-08,
+ "loss": 0.0278,
+ "step": 35867
+ },
+ {
+ "epoch": 97.73297002724796,
+ "grad_norm": 2.3033273220062256,
+ "learning_rate": 2.694298374207316e-08,
+ "loss": 0.0254,
+ "step": 35868
+ },
+ {
+ "epoch": 97.73569482288828,
+ "grad_norm": 3.9879684448242188,
+ "learning_rate": 2.6878284888431916e-08,
+ "loss": 0.0698,
+ "step": 35869
+ },
+ {
+ "epoch": 97.73841961852861,
+ "grad_norm": 2.7510740756988525,
+ "learning_rate": 2.6813663705141935e-08,
+ "loss": 0.109,
+ "step": 35870
+ },
+ {
+ "epoch": 97.74114441416894,
+ "grad_norm": 3.931377410888672,
+ "learning_rate": 2.6749120192705037e-08,
+ "loss": 0.1352,
+ "step": 35871
+ },
+ {
+ "epoch": 97.74386920980926,
+ "grad_norm": 2.564488172531128,
+ "learning_rate": 2.668465435162637e-08,
+ "loss": 0.1061,
+ "step": 35872
+ },
+ {
+ "epoch": 97.7465940054496,
+ "grad_norm": 4.47464656829834,
+ "learning_rate": 2.6620266182405542e-08,
+ "loss": 0.233,
+ "step": 35873
+ },
+ {
+ "epoch": 97.74931880108991,
+ "grad_norm": 1.857589602470398,
+ "learning_rate": 2.6555955685545476e-08,
+ "loss": 0.0255,
+ "step": 35874
+ },
+ {
+ "epoch": 97.75204359673025,
+ "grad_norm": 2.577150583267212,
+ "learning_rate": 2.6491722861546887e-08,
+ "loss": 0.0413,
+ "step": 35875
+ },
+ {
+ "epoch": 97.75476839237058,
+ "grad_norm": 3.132887601852417,
+ "learning_rate": 2.6427567710909374e-08,
+ "loss": 0.0273,
+ "step": 35876
+ },
+ {
+ "epoch": 97.7574931880109,
+ "grad_norm": 1.9996192455291748,
+ "learning_rate": 2.636349023413254e-08,
+ "loss": 0.0997,
+ "step": 35877
+ },
+ {
+ "epoch": 97.76021798365123,
+ "grad_norm": 2.1004786491394043,
+ "learning_rate": 2.629949043171709e-08,
+ "loss": 0.0346,
+ "step": 35878
+ },
+ {
+ "epoch": 97.76294277929155,
+ "grad_norm": 1.7419300079345703,
+ "learning_rate": 2.62355683041593e-08,
+ "loss": 0.0293,
+ "step": 35879
+ },
+ {
+ "epoch": 97.76566757493188,
+ "grad_norm": 2.583218812942505,
+ "learning_rate": 2.6171723851957652e-08,
+ "loss": 0.0338,
+ "step": 35880
+ },
+ {
+ "epoch": 97.7683923705722,
+ "grad_norm": 1.9477218389511108,
+ "learning_rate": 2.6107957075609537e-08,
+ "loss": 0.029,
+ "step": 35881
+ },
+ {
+ "epoch": 97.77111716621253,
+ "grad_norm": 1.9340739250183105,
+ "learning_rate": 2.6044267975612324e-08,
+ "loss": 0.0298,
+ "step": 35882
+ },
+ {
+ "epoch": 97.77384196185287,
+ "grad_norm": 2.064065933227539,
+ "learning_rate": 2.5980656552461182e-08,
+ "loss": 0.1699,
+ "step": 35883
+ },
+ {
+ "epoch": 97.77656675749319,
+ "grad_norm": 2.660323143005371,
+ "learning_rate": 2.5917122806652374e-08,
+ "loss": 0.1159,
+ "step": 35884
+ },
+ {
+ "epoch": 97.77929155313352,
+ "grad_norm": 2.3571033477783203,
+ "learning_rate": 2.585366673867884e-08,
+ "loss": 0.1284,
+ "step": 35885
+ },
+ {
+ "epoch": 97.78201634877384,
+ "grad_norm": 2.6144180297851562,
+ "learning_rate": 2.5790288349035742e-08,
+ "loss": 0.1057,
+ "step": 35886
+ },
+ {
+ "epoch": 97.78474114441417,
+ "grad_norm": 2.8029589653015137,
+ "learning_rate": 2.5726987638218238e-08,
+ "loss": 0.0518,
+ "step": 35887
+ },
+ {
+ "epoch": 97.7874659400545,
+ "grad_norm": 2.6526236534118652,
+ "learning_rate": 2.5663764606717046e-08,
+ "loss": 0.0926,
+ "step": 35888
+ },
+ {
+ "epoch": 97.79019073569482,
+ "grad_norm": 3.7425220012664795,
+ "learning_rate": 2.5600619255025106e-08,
+ "loss": 0.1374,
+ "step": 35889
+ },
+ {
+ "epoch": 97.79291553133515,
+ "grad_norm": 2.5686843395233154,
+ "learning_rate": 2.5537551583635356e-08,
+ "loss": 0.0217,
+ "step": 35890
+ },
+ {
+ "epoch": 97.79564032697547,
+ "grad_norm": 1.8298101425170898,
+ "learning_rate": 2.5474561593037406e-08,
+ "loss": 0.0203,
+ "step": 35891
+ },
+ {
+ "epoch": 97.7983651226158,
+ "grad_norm": 3.1686811447143555,
+ "learning_rate": 2.5411649283723083e-08,
+ "loss": 0.0518,
+ "step": 35892
+ },
+ {
+ "epoch": 97.80108991825612,
+ "grad_norm": 2.802241325378418,
+ "learning_rate": 2.5348814656181996e-08,
+ "loss": 0.0389,
+ "step": 35893
+ },
+ {
+ "epoch": 97.80381471389646,
+ "grad_norm": 2.4015142917633057,
+ "learning_rate": 2.5286057710902647e-08,
+ "loss": 0.134,
+ "step": 35894
+ },
+ {
+ "epoch": 97.80653950953679,
+ "grad_norm": 2.5389842987060547,
+ "learning_rate": 2.5223378448374636e-08,
+ "loss": 0.108,
+ "step": 35895
+ },
+ {
+ "epoch": 97.80926430517711,
+ "grad_norm": 2.8739893436431885,
+ "learning_rate": 2.5160776869086467e-08,
+ "loss": 0.1641,
+ "step": 35896
+ },
+ {
+ "epoch": 97.81198910081744,
+ "grad_norm": 1.6186907291412354,
+ "learning_rate": 2.509825297352442e-08,
+ "loss": 0.0279,
+ "step": 35897
+ },
+ {
+ "epoch": 97.81471389645776,
+ "grad_norm": 2.8059005737304688,
+ "learning_rate": 2.5035806762175874e-08,
+ "loss": 0.0389,
+ "step": 35898
+ },
+ {
+ "epoch": 97.8174386920981,
+ "grad_norm": 2.3546082973480225,
+ "learning_rate": 2.4973438235528223e-08,
+ "loss": 0.0934,
+ "step": 35899
+ },
+ {
+ "epoch": 97.82016348773843,
+ "grad_norm": 1.5940228700637817,
+ "learning_rate": 2.4911147394065526e-08,
+ "loss": 0.0817,
+ "step": 35900
+ },
+ {
+ "epoch": 97.82288828337875,
+ "grad_norm": 2.4367599487304688,
+ "learning_rate": 2.484893423827406e-08,
+ "loss": 0.0494,
+ "step": 35901
+ },
+ {
+ "epoch": 97.82561307901908,
+ "grad_norm": 3.33247447013855,
+ "learning_rate": 2.4786798768638987e-08,
+ "loss": 0.0252,
+ "step": 35902
+ },
+ {
+ "epoch": 97.8283378746594,
+ "grad_norm": 1.9521251916885376,
+ "learning_rate": 2.4724740985642148e-08,
+ "loss": 0.0405,
+ "step": 35903
+ },
+ {
+ "epoch": 97.83106267029973,
+ "grad_norm": 2.5466678142547607,
+ "learning_rate": 2.466276088976871e-08,
+ "loss": 0.0296,
+ "step": 35904
+ },
+ {
+ "epoch": 97.83378746594005,
+ "grad_norm": 1.8345268964767456,
+ "learning_rate": 2.4600858481500512e-08,
+ "loss": 0.0286,
+ "step": 35905
+ },
+ {
+ "epoch": 97.83651226158038,
+ "grad_norm": 1.7329964637756348,
+ "learning_rate": 2.4539033761319387e-08,
+ "loss": 0.0206,
+ "step": 35906
+ },
+ {
+ "epoch": 97.83923705722071,
+ "grad_norm": 4.210390090942383,
+ "learning_rate": 2.447728672970717e-08,
+ "loss": 0.0614,
+ "step": 35907
+ },
+ {
+ "epoch": 97.84196185286103,
+ "grad_norm": 1.8690903186798096,
+ "learning_rate": 2.4415617387145708e-08,
+ "loss": 0.0619,
+ "step": 35908
+ },
+ {
+ "epoch": 97.84468664850137,
+ "grad_norm": 2.3672852516174316,
+ "learning_rate": 2.4354025734113495e-08,
+ "loss": 0.0262,
+ "step": 35909
+ },
+ {
+ "epoch": 97.84741144414168,
+ "grad_norm": 3.118413209915161,
+ "learning_rate": 2.4292511771091266e-08,
+ "loss": 0.0801,
+ "step": 35910
+ },
+ {
+ "epoch": 97.85013623978202,
+ "grad_norm": 1.7585015296936035,
+ "learning_rate": 2.4231075498557522e-08,
+ "loss": 0.0294,
+ "step": 35911
+ },
+ {
+ "epoch": 97.85286103542235,
+ "grad_norm": 1.6392691135406494,
+ "learning_rate": 2.416971691699188e-08,
+ "loss": 0.0683,
+ "step": 35912
+ },
+ {
+ "epoch": 97.85558583106267,
+ "grad_norm": 4.103469371795654,
+ "learning_rate": 2.410843602687063e-08,
+ "loss": 0.0183,
+ "step": 35913
+ },
+ {
+ "epoch": 97.858310626703,
+ "grad_norm": 3.2853872776031494,
+ "learning_rate": 2.4047232828672272e-08,
+ "loss": 0.0936,
+ "step": 35914
+ },
+ {
+ "epoch": 97.86103542234332,
+ "grad_norm": 2.474257469177246,
+ "learning_rate": 2.39861073228731e-08,
+ "loss": 0.0541,
+ "step": 35915
+ },
+ {
+ "epoch": 97.86376021798365,
+ "grad_norm": 2.428039073944092,
+ "learning_rate": 2.392505950994939e-08,
+ "loss": 0.0708,
+ "step": 35916
+ },
+ {
+ "epoch": 97.86648501362397,
+ "grad_norm": 1.4760277271270752,
+ "learning_rate": 2.386408939037521e-08,
+ "loss": 0.0934,
+ "step": 35917
+ },
+ {
+ "epoch": 97.8692098092643,
+ "grad_norm": 3.3375816345214844,
+ "learning_rate": 2.380319696462685e-08,
+ "loss": 0.0295,
+ "step": 35918
+ },
+ {
+ "epoch": 97.87193460490464,
+ "grad_norm": 2.3691625595092773,
+ "learning_rate": 2.3742382233178374e-08,
+ "loss": 0.0826,
+ "step": 35919
+ },
+ {
+ "epoch": 97.87465940054496,
+ "grad_norm": 2.846940517425537,
+ "learning_rate": 2.3681645196502733e-08,
+ "loss": 0.0383,
+ "step": 35920
+ },
+ {
+ "epoch": 97.87738419618529,
+ "grad_norm": 1.978087067604065,
+ "learning_rate": 2.3620985855072887e-08,
+ "loss": 0.0409,
+ "step": 35921
+ },
+ {
+ "epoch": 97.88010899182561,
+ "grad_norm": 2.6109161376953125,
+ "learning_rate": 2.3560404209362897e-08,
+ "loss": 0.1963,
+ "step": 35922
+ },
+ {
+ "epoch": 97.88283378746594,
+ "grad_norm": 2.762831687927246,
+ "learning_rate": 2.349990025984239e-08,
+ "loss": 0.0846,
+ "step": 35923
+ },
+ {
+ "epoch": 97.88555858310627,
+ "grad_norm": 2.228059768676758,
+ "learning_rate": 2.343947400698432e-08,
+ "loss": 0.0227,
+ "step": 35924
+ },
+ {
+ "epoch": 97.88828337874659,
+ "grad_norm": 2.9268105030059814,
+ "learning_rate": 2.3379125451258312e-08,
+ "loss": 0.1677,
+ "step": 35925
+ },
+ {
+ "epoch": 97.89100817438693,
+ "grad_norm": 2.174006938934326,
+ "learning_rate": 2.3318854593135098e-08,
+ "loss": 0.0294,
+ "step": 35926
+ },
+ {
+ "epoch": 97.89373297002724,
+ "grad_norm": 1.953399896621704,
+ "learning_rate": 2.3258661433082087e-08,
+ "loss": 0.0776,
+ "step": 35927
+ },
+ {
+ "epoch": 97.89645776566758,
+ "grad_norm": 3.0561678409576416,
+ "learning_rate": 2.3198545971571118e-08,
+ "loss": 0.0314,
+ "step": 35928
+ },
+ {
+ "epoch": 97.8991825613079,
+ "grad_norm": 2.6855521202087402,
+ "learning_rate": 2.3138508209067377e-08,
+ "loss": 0.0363,
+ "step": 35929
+ },
+ {
+ "epoch": 97.90190735694823,
+ "grad_norm": 2.544351577758789,
+ "learning_rate": 2.307854814604049e-08,
+ "loss": 0.0203,
+ "step": 35930
+ },
+ {
+ "epoch": 97.90463215258856,
+ "grad_norm": 2.0955066680908203,
+ "learning_rate": 2.301866578295675e-08,
+ "loss": 0.0602,
+ "step": 35931
+ },
+ {
+ "epoch": 97.90735694822888,
+ "grad_norm": 2.097294569015503,
+ "learning_rate": 2.2958861120283558e-08,
+ "loss": 0.0217,
+ "step": 35932
+ },
+ {
+ "epoch": 97.91008174386921,
+ "grad_norm": 2.20684814453125,
+ "learning_rate": 2.2899134158483883e-08,
+ "loss": 0.1108,
+ "step": 35933
+ },
+ {
+ "epoch": 97.91280653950953,
+ "grad_norm": 2.080538749694824,
+ "learning_rate": 2.283948489802512e-08,
+ "loss": 0.0271,
+ "step": 35934
+ },
+ {
+ "epoch": 97.91553133514986,
+ "grad_norm": 2.9684462547302246,
+ "learning_rate": 2.2779913339371352e-08,
+ "loss": 0.0647,
+ "step": 35935
+ },
+ {
+ "epoch": 97.9182561307902,
+ "grad_norm": 3.363239049911499,
+ "learning_rate": 2.2720419482987754e-08,
+ "loss": 0.0244,
+ "step": 35936
+ },
+ {
+ "epoch": 97.92098092643052,
+ "grad_norm": 4.937668800354004,
+ "learning_rate": 2.2661003329335073e-08,
+ "loss": 0.0565,
+ "step": 35937
+ },
+ {
+ "epoch": 97.92370572207085,
+ "grad_norm": 2.4344513416290283,
+ "learning_rate": 2.2601664878877384e-08,
+ "loss": 0.0365,
+ "step": 35938
+ },
+ {
+ "epoch": 97.92643051771117,
+ "grad_norm": 2.5451300144195557,
+ "learning_rate": 2.2542404132077643e-08,
+ "loss": 0.1251,
+ "step": 35939
+ },
+ {
+ "epoch": 97.9291553133515,
+ "grad_norm": 1.9203739166259766,
+ "learning_rate": 2.248322108939549e-08,
+ "loss": 0.0661,
+ "step": 35940
+ },
+ {
+ "epoch": 97.93188010899182,
+ "grad_norm": 2.2082369327545166,
+ "learning_rate": 2.2424115751293885e-08,
+ "loss": 0.0472,
+ "step": 35941
+ },
+ {
+ "epoch": 97.93460490463215,
+ "grad_norm": 2.3483364582061768,
+ "learning_rate": 2.2365088118231347e-08,
+ "loss": 0.0504,
+ "step": 35942
+ },
+ {
+ "epoch": 97.93732970027249,
+ "grad_norm": 2.3083558082580566,
+ "learning_rate": 2.2306138190668624e-08,
+ "loss": 0.0269,
+ "step": 35943
+ },
+ {
+ "epoch": 97.9400544959128,
+ "grad_norm": 2.189378261566162,
+ "learning_rate": 2.2247265969065347e-08,
+ "loss": 0.0314,
+ "step": 35944
+ },
+ {
+ "epoch": 97.94277929155314,
+ "grad_norm": 2.719431161880493,
+ "learning_rate": 2.2188471453877815e-08,
+ "loss": 0.0557,
+ "step": 35945
+ },
+ {
+ "epoch": 97.94550408719346,
+ "grad_norm": 2.964179754257202,
+ "learning_rate": 2.212975464556677e-08,
+ "loss": 0.0734,
+ "step": 35946
+ },
+ {
+ "epoch": 97.94822888283379,
+ "grad_norm": 1.7924069166183472,
+ "learning_rate": 2.2071115544587406e-08,
+ "loss": 0.0266,
+ "step": 35947
+ },
+ {
+ "epoch": 97.95095367847412,
+ "grad_norm": 2.598353862762451,
+ "learning_rate": 2.2012554151397137e-08,
+ "loss": 0.0391,
+ "step": 35948
+ },
+ {
+ "epoch": 97.95367847411444,
+ "grad_norm": 1.3391518592834473,
+ "learning_rate": 2.195407046645115e-08,
+ "loss": 0.019,
+ "step": 35949
+ },
+ {
+ "epoch": 97.95640326975477,
+ "grad_norm": 1.5363374948501587,
+ "learning_rate": 2.1895664490206857e-08,
+ "loss": 0.0279,
+ "step": 35950
+ },
+ {
+ "epoch": 97.95912806539509,
+ "grad_norm": 3.2424540519714355,
+ "learning_rate": 2.1837336223117233e-08,
+ "loss": 0.0335,
+ "step": 35951
+ },
+ {
+ "epoch": 97.96185286103542,
+ "grad_norm": 2.925813674926758,
+ "learning_rate": 2.1779085665637467e-08,
+ "loss": 0.0579,
+ "step": 35952
+ },
+ {
+ "epoch": 97.96457765667574,
+ "grad_norm": 2.4966001510620117,
+ "learning_rate": 2.172091281822164e-08,
+ "loss": 0.0526,
+ "step": 35953
+ },
+ {
+ "epoch": 97.96730245231608,
+ "grad_norm": 2.0699377059936523,
+ "learning_rate": 2.1662817681321613e-08,
+ "loss": 0.0637,
+ "step": 35954
+ },
+ {
+ "epoch": 97.97002724795641,
+ "grad_norm": 2.216644525527954,
+ "learning_rate": 2.1604800255390356e-08,
+ "loss": 0.0928,
+ "step": 35955
+ },
+ {
+ "epoch": 97.97275204359673,
+ "grad_norm": 3.448300361633301,
+ "learning_rate": 2.1546860540879734e-08,
+ "loss": 0.0463,
+ "step": 35956
+ },
+ {
+ "epoch": 97.97547683923706,
+ "grad_norm": 3.955340623855591,
+ "learning_rate": 2.14889985382416e-08,
+ "loss": 0.0295,
+ "step": 35957
+ },
+ {
+ "epoch": 97.97820163487738,
+ "grad_norm": 4.31251335144043,
+ "learning_rate": 2.14312142479256e-08,
+ "loss": 0.1193,
+ "step": 35958
+ },
+ {
+ "epoch": 97.98092643051771,
+ "grad_norm": 4.111076354980469,
+ "learning_rate": 2.1373507670381376e-08,
+ "loss": 0.0726,
+ "step": 35959
+ },
+ {
+ "epoch": 97.98365122615803,
+ "grad_norm": 3.263672351837158,
+ "learning_rate": 2.1315878806060787e-08,
+ "loss": 0.0558,
+ "step": 35960
+ },
+ {
+ "epoch": 97.98637602179836,
+ "grad_norm": 2.007985830307007,
+ "learning_rate": 2.125832765541014e-08,
+ "loss": 0.027,
+ "step": 35961
+ },
+ {
+ "epoch": 97.9891008174387,
+ "grad_norm": 2.3174593448638916,
+ "learning_rate": 2.1200854218877964e-08,
+ "loss": 0.0367,
+ "step": 35962
+ },
+ {
+ "epoch": 97.99182561307902,
+ "grad_norm": 1.442603349685669,
+ "learning_rate": 2.1143458496912795e-08,
+ "loss": 0.0162,
+ "step": 35963
+ },
+ {
+ "epoch": 97.99455040871935,
+ "grad_norm": 4.202771186828613,
+ "learning_rate": 2.1086140489960937e-08,
+ "loss": 0.0444,
+ "step": 35964
+ },
+ {
+ "epoch": 97.99727520435967,
+ "grad_norm": 2.63293194770813,
+ "learning_rate": 2.1028900198468704e-08,
+ "loss": 0.0247,
+ "step": 35965
+ },
+ {
+ "epoch": 98.0,
+ "grad_norm": 2.4509873390197754,
+ "learning_rate": 2.0971737622883515e-08,
+ "loss": 0.0524,
+ "step": 35966
+ },
+ {
+ "epoch": 98.00272479564033,
+ "grad_norm": 1.954356074333191,
+ "learning_rate": 2.0914652763648348e-08,
+ "loss": 0.0263,
+ "step": 35967
+ },
+ {
+ "epoch": 98.00544959128065,
+ "grad_norm": 2.8290443420410156,
+ "learning_rate": 2.085764562120951e-08,
+ "loss": 0.0574,
+ "step": 35968
+ },
+ {
+ "epoch": 98.00817438692098,
+ "grad_norm": 2.316638231277466,
+ "learning_rate": 2.0800716196008874e-08,
+ "loss": 0.0668,
+ "step": 35969
+ },
+ {
+ "epoch": 98.0108991825613,
+ "grad_norm": 4.08411979675293,
+ "learning_rate": 2.074386448849164e-08,
+ "loss": 0.0718,
+ "step": 35970
+ },
+ {
+ "epoch": 98.01362397820164,
+ "grad_norm": 2.340932846069336,
+ "learning_rate": 2.068709049910078e-08,
+ "loss": 0.0681,
+ "step": 35971
+ },
+ {
+ "epoch": 98.01634877384195,
+ "grad_norm": 2.5804271697998047,
+ "learning_rate": 2.0630394228277063e-08,
+ "loss": 0.0828,
+ "step": 35972
+ },
+ {
+ "epoch": 98.01907356948229,
+ "grad_norm": 2.2683908939361572,
+ "learning_rate": 2.057377567646235e-08,
+ "loss": 0.0313,
+ "step": 35973
+ },
+ {
+ "epoch": 98.02179836512262,
+ "grad_norm": 2.1464920043945312,
+ "learning_rate": 2.05172348440974e-08,
+ "loss": 0.0302,
+ "step": 35974
+ },
+ {
+ "epoch": 98.02452316076294,
+ "grad_norm": 2.4043939113616943,
+ "learning_rate": 2.0460771731624086e-08,
+ "loss": 0.0261,
+ "step": 35975
+ },
+ {
+ "epoch": 98.02724795640327,
+ "grad_norm": 2.5983052253723145,
+ "learning_rate": 2.040438633948094e-08,
+ "loss": 0.1276,
+ "step": 35976
+ },
+ {
+ "epoch": 98.02997275204359,
+ "grad_norm": 2.8535356521606445,
+ "learning_rate": 2.034807866810762e-08,
+ "loss": 0.1196,
+ "step": 35977
+ },
+ {
+ "epoch": 98.03269754768392,
+ "grad_norm": 2.621011972427368,
+ "learning_rate": 2.029184871794154e-08,
+ "loss": 0.177,
+ "step": 35978
+ },
+ {
+ "epoch": 98.03542234332426,
+ "grad_norm": 3.7379093170166016,
+ "learning_rate": 2.0235696489421254e-08,
+ "loss": 0.2048,
+ "step": 35979
+ },
+ {
+ "epoch": 98.03814713896458,
+ "grad_norm": 2.3887557983398438,
+ "learning_rate": 2.0179621982984178e-08,
+ "loss": 0.1078,
+ "step": 35980
+ },
+ {
+ "epoch": 98.04087193460491,
+ "grad_norm": 7.204305171966553,
+ "learning_rate": 2.0123625199067743e-08,
+ "loss": 0.093,
+ "step": 35981
+ },
+ {
+ "epoch": 98.04359673024523,
+ "grad_norm": 2.4790451526641846,
+ "learning_rate": 2.0067706138107157e-08,
+ "loss": 0.0773,
+ "step": 35982
+ },
+ {
+ "epoch": 98.04632152588556,
+ "grad_norm": 2.852440595626831,
+ "learning_rate": 2.001186480053763e-08,
+ "loss": 0.1036,
+ "step": 35983
+ },
+ {
+ "epoch": 98.04904632152588,
+ "grad_norm": 1.650865077972412,
+ "learning_rate": 1.9956101186794362e-08,
+ "loss": 0.0369,
+ "step": 35984
+ },
+ {
+ "epoch": 98.05177111716621,
+ "grad_norm": 2.4738357067108154,
+ "learning_rate": 1.990041529731257e-08,
+ "loss": 0.0237,
+ "step": 35985
+ },
+ {
+ "epoch": 98.05449591280654,
+ "grad_norm": 2.4581356048583984,
+ "learning_rate": 1.9844807132524123e-08,
+ "loss": 0.0202,
+ "step": 35986
+ },
+ {
+ "epoch": 98.05722070844686,
+ "grad_norm": 2.1589486598968506,
+ "learning_rate": 1.9789276692863125e-08,
+ "loss": 0.0362,
+ "step": 35987
+ },
+ {
+ "epoch": 98.0599455040872,
+ "grad_norm": 3.0614559650421143,
+ "learning_rate": 1.9733823978762555e-08,
+ "loss": 0.0566,
+ "step": 35988
+ },
+ {
+ "epoch": 98.06267029972751,
+ "grad_norm": 1.0813218355178833,
+ "learning_rate": 1.96784489906543e-08,
+ "loss": 0.0123,
+ "step": 35989
+ },
+ {
+ "epoch": 98.06539509536785,
+ "grad_norm": 3.7860329151153564,
+ "learning_rate": 1.9623151728968004e-08,
+ "loss": 0.0522,
+ "step": 35990
+ },
+ {
+ "epoch": 98.06811989100818,
+ "grad_norm": 5.7503204345703125,
+ "learning_rate": 1.9567932194135553e-08,
+ "loss": 0.0411,
+ "step": 35991
+ },
+ {
+ "epoch": 98.0708446866485,
+ "grad_norm": 1.8334646224975586,
+ "learning_rate": 1.951279038658771e-08,
+ "loss": 0.0239,
+ "step": 35992
+ },
+ {
+ "epoch": 98.07356948228883,
+ "grad_norm": 3.1036291122436523,
+ "learning_rate": 1.9457726306751913e-08,
+ "loss": 0.1188,
+ "step": 35993
+ },
+ {
+ "epoch": 98.07629427792915,
+ "grad_norm": 1.93489670753479,
+ "learning_rate": 1.9402739955058925e-08,
+ "loss": 0.028,
+ "step": 35994
+ },
+ {
+ "epoch": 98.07901907356948,
+ "grad_norm": 2.9652209281921387,
+ "learning_rate": 1.9347831331936186e-08,
+ "loss": 0.2568,
+ "step": 35995
+ },
+ {
+ "epoch": 98.0817438692098,
+ "grad_norm": 2.488975763320923,
+ "learning_rate": 1.9293000437811127e-08,
+ "loss": 0.0921,
+ "step": 35996
+ },
+ {
+ "epoch": 98.08446866485014,
+ "grad_norm": 2.527630567550659,
+ "learning_rate": 1.9238247273110077e-08,
+ "loss": 0.0303,
+ "step": 35997
+ },
+ {
+ "epoch": 98.08719346049047,
+ "grad_norm": 1.9312889575958252,
+ "learning_rate": 1.9183571838261584e-08,
+ "loss": 0.0268,
+ "step": 35998
+ },
+ {
+ "epoch": 98.08991825613079,
+ "grad_norm": 2.61395001411438,
+ "learning_rate": 1.9128974133689748e-08,
+ "loss": 0.0212,
+ "step": 35999
+ },
+ {
+ "epoch": 98.09264305177112,
+ "grad_norm": 1.9238824844360352,
+ "learning_rate": 1.907445415981979e-08,
+ "loss": 0.0285,
+ "step": 36000
+ },
+ {
+ "epoch": 98.09536784741144,
+ "grad_norm": 1.5434598922729492,
+ "learning_rate": 1.902001191707803e-08,
+ "loss": 0.0334,
+ "step": 36001
+ },
+ {
+ "epoch": 98.09809264305177,
+ "grad_norm": 1.6021926403045654,
+ "learning_rate": 1.8965647405885247e-08,
+ "loss": 0.0423,
+ "step": 36002
+ },
+ {
+ "epoch": 98.1008174386921,
+ "grad_norm": 2.5341289043426514,
+ "learning_rate": 1.8911360626668874e-08,
+ "loss": 0.0345,
+ "step": 36003
+ },
+ {
+ "epoch": 98.10354223433242,
+ "grad_norm": 1.9662022590637207,
+ "learning_rate": 1.8857151579847465e-08,
+ "loss": 0.1571,
+ "step": 36004
+ },
+ {
+ "epoch": 98.10626702997276,
+ "grad_norm": 1.6988203525543213,
+ "learning_rate": 1.8803020265847348e-08,
+ "loss": 0.023,
+ "step": 36005
+ },
+ {
+ "epoch": 98.10899182561307,
+ "grad_norm": 2.856804609298706,
+ "learning_rate": 1.874896668508597e-08,
+ "loss": 0.2222,
+ "step": 36006
+ },
+ {
+ "epoch": 98.11171662125341,
+ "grad_norm": 2.2739062309265137,
+ "learning_rate": 1.8694990837988534e-08,
+ "loss": 0.0209,
+ "step": 36007
+ },
+ {
+ "epoch": 98.11444141689373,
+ "grad_norm": 2.8482143878936768,
+ "learning_rate": 1.8641092724971388e-08,
+ "loss": 0.2362,
+ "step": 36008
+ },
+ {
+ "epoch": 98.11716621253406,
+ "grad_norm": 2.5867767333984375,
+ "learning_rate": 1.858727234645752e-08,
+ "loss": 0.0294,
+ "step": 36009
+ },
+ {
+ "epoch": 98.11989100817439,
+ "grad_norm": 3.1094701290130615,
+ "learning_rate": 1.8533529702864374e-08,
+ "loss": 0.0288,
+ "step": 36010
+ },
+ {
+ "epoch": 98.12261580381471,
+ "grad_norm": 2.174095869064331,
+ "learning_rate": 1.8479864794610502e-08,
+ "loss": 0.0357,
+ "step": 36011
+ },
+ {
+ "epoch": 98.12534059945504,
+ "grad_norm": 3.00639271736145,
+ "learning_rate": 1.8426277622114463e-08,
+ "loss": 0.0362,
+ "step": 36012
+ },
+ {
+ "epoch": 98.12806539509536,
+ "grad_norm": 1.8950481414794922,
+ "learning_rate": 1.83727681857937e-08,
+ "loss": 0.0212,
+ "step": 36013
+ },
+ {
+ "epoch": 98.1307901907357,
+ "grad_norm": 1.8707834482192993,
+ "learning_rate": 1.8319336486063433e-08,
+ "loss": 0.0267,
+ "step": 36014
+ },
+ {
+ "epoch": 98.13351498637603,
+ "grad_norm": 2.5346744060516357,
+ "learning_rate": 1.826598252334222e-08,
+ "loss": 0.092,
+ "step": 36015
+ },
+ {
+ "epoch": 98.13623978201635,
+ "grad_norm": 1.6178852319717407,
+ "learning_rate": 1.821270629804306e-08,
+ "loss": 0.0297,
+ "step": 36016
+ },
+ {
+ "epoch": 98.13896457765668,
+ "grad_norm": 1.6849186420440674,
+ "learning_rate": 1.81595078105834e-08,
+ "loss": 0.0295,
+ "step": 36017
+ },
+ {
+ "epoch": 98.141689373297,
+ "grad_norm": 2.2350454330444336,
+ "learning_rate": 1.810638706137513e-08,
+ "loss": 0.1013,
+ "step": 36018
+ },
+ {
+ "epoch": 98.14441416893733,
+ "grad_norm": 2.8852832317352295,
+ "learning_rate": 1.8053344050833478e-08,
+ "loss": 0.041,
+ "step": 36019
+ },
+ {
+ "epoch": 98.14713896457765,
+ "grad_norm": 3.075474262237549,
+ "learning_rate": 1.800037877937144e-08,
+ "loss": 0.0758,
+ "step": 36020
+ },
+ {
+ "epoch": 98.14986376021798,
+ "grad_norm": 2.540247917175293,
+ "learning_rate": 1.7947491247399808e-08,
+ "loss": 0.0815,
+ "step": 36021
+ },
+ {
+ "epoch": 98.15258855585832,
+ "grad_norm": 2.0208468437194824,
+ "learning_rate": 1.7894681455333794e-08,
+ "loss": 0.0339,
+ "step": 36022
+ },
+ {
+ "epoch": 98.15531335149863,
+ "grad_norm": 3.4823648929595947,
+ "learning_rate": 1.784194940358086e-08,
+ "loss": 0.0955,
+ "step": 36023
+ },
+ {
+ "epoch": 98.15803814713897,
+ "grad_norm": 2.4442057609558105,
+ "learning_rate": 1.7789295092555114e-08,
+ "loss": 0.054,
+ "step": 36024
+ },
+ {
+ "epoch": 98.16076294277929,
+ "grad_norm": 3.0584557056427,
+ "learning_rate": 1.773671852266401e-08,
+ "loss": 0.0513,
+ "step": 36025
+ },
+ {
+ "epoch": 98.16348773841962,
+ "grad_norm": 2.1580777168273926,
+ "learning_rate": 1.7684219694318328e-08,
+ "loss": 0.0257,
+ "step": 36026
+ },
+ {
+ "epoch": 98.16621253405995,
+ "grad_norm": 2.9333670139312744,
+ "learning_rate": 1.763179860792663e-08,
+ "loss": 0.1014,
+ "step": 36027
+ },
+ {
+ "epoch": 98.16893732970027,
+ "grad_norm": 2.2418465614318848,
+ "learning_rate": 1.7579455263897483e-08,
+ "loss": 0.0561,
+ "step": 36028
+ },
+ {
+ "epoch": 98.1716621253406,
+ "grad_norm": 6.723508358001709,
+ "learning_rate": 1.7527189662638334e-08,
+ "loss": 0.0727,
+ "step": 36029
+ },
+ {
+ "epoch": 98.17438692098092,
+ "grad_norm": 1.9667026996612549,
+ "learning_rate": 1.7475001804555525e-08,
+ "loss": 0.0346,
+ "step": 36030
+ },
+ {
+ "epoch": 98.17711171662125,
+ "grad_norm": 2.2690699100494385,
+ "learning_rate": 1.7422891690056508e-08,
+ "loss": 0.0321,
+ "step": 36031
+ },
+ {
+ "epoch": 98.17983651226157,
+ "grad_norm": 5.59989070892334,
+ "learning_rate": 1.7370859319547628e-08,
+ "loss": 0.0415,
+ "step": 36032
+ },
+ {
+ "epoch": 98.1825613079019,
+ "grad_norm": 2.4863879680633545,
+ "learning_rate": 1.7318904693431894e-08,
+ "loss": 0.0548,
+ "step": 36033
+ },
+ {
+ "epoch": 98.18528610354224,
+ "grad_norm": 3.2599329948425293,
+ "learning_rate": 1.7267027812115646e-08,
+ "loss": 0.1327,
+ "step": 36034
+ },
+ {
+ "epoch": 98.18801089918256,
+ "grad_norm": 2.4539096355438232,
+ "learning_rate": 1.7215228676003005e-08,
+ "loss": 0.176,
+ "step": 36035
+ },
+ {
+ "epoch": 98.19073569482289,
+ "grad_norm": 1.724025845527649,
+ "learning_rate": 1.7163507285495872e-08,
+ "loss": 0.0297,
+ "step": 36036
+ },
+ {
+ "epoch": 98.19346049046321,
+ "grad_norm": 1.5585377216339111,
+ "learning_rate": 1.7111863640999483e-08,
+ "loss": 0.1148,
+ "step": 36037
+ },
+ {
+ "epoch": 98.19618528610354,
+ "grad_norm": 1.6620516777038574,
+ "learning_rate": 1.706029774291351e-08,
+ "loss": 0.0213,
+ "step": 36038
+ },
+ {
+ "epoch": 98.19891008174388,
+ "grad_norm": 2.1538443565368652,
+ "learning_rate": 1.7008809591639863e-08,
+ "loss": 0.0811,
+ "step": 36039
+ },
+ {
+ "epoch": 98.2016348773842,
+ "grad_norm": 2.7999744415283203,
+ "learning_rate": 1.6957399187581547e-08,
+ "loss": 0.1881,
+ "step": 36040
+ },
+ {
+ "epoch": 98.20435967302453,
+ "grad_norm": 3.429708242416382,
+ "learning_rate": 1.6906066531137132e-08,
+ "loss": 0.0264,
+ "step": 36041
+ },
+ {
+ "epoch": 98.20708446866485,
+ "grad_norm": 2.7518060207366943,
+ "learning_rate": 1.6854811622707412e-08,
+ "loss": 0.0634,
+ "step": 36042
+ },
+ {
+ "epoch": 98.20980926430518,
+ "grad_norm": 3.1121954917907715,
+ "learning_rate": 1.6803634462690955e-08,
+ "loss": 0.0921,
+ "step": 36043
+ },
+ {
+ "epoch": 98.2125340599455,
+ "grad_norm": 3.7017569541931152,
+ "learning_rate": 1.675253505148633e-08,
+ "loss": 0.0453,
+ "step": 36044
+ },
+ {
+ "epoch": 98.21525885558583,
+ "grad_norm": 2.11387038230896,
+ "learning_rate": 1.6701513389492106e-08,
+ "loss": 0.0447,
+ "step": 36045
+ },
+ {
+ "epoch": 98.21798365122616,
+ "grad_norm": 1.6125013828277588,
+ "learning_rate": 1.6650569477104638e-08,
+ "loss": 0.0201,
+ "step": 36046
+ },
+ {
+ "epoch": 98.22070844686648,
+ "grad_norm": 2.024996042251587,
+ "learning_rate": 1.6599703314721382e-08,
+ "loss": 0.0343,
+ "step": 36047
+ },
+ {
+ "epoch": 98.22343324250681,
+ "grad_norm": 1.7762742042541504,
+ "learning_rate": 1.6548914902738688e-08,
+ "loss": 0.0184,
+ "step": 36048
+ },
+ {
+ "epoch": 98.22615803814713,
+ "grad_norm": 2.6843836307525635,
+ "learning_rate": 1.6498204241551796e-08,
+ "loss": 0.0272,
+ "step": 36049
+ },
+ {
+ "epoch": 98.22888283378747,
+ "grad_norm": 2.516796112060547,
+ "learning_rate": 1.6447571331554836e-08,
+ "loss": 0.1096,
+ "step": 36050
+ },
+ {
+ "epoch": 98.2316076294278,
+ "grad_norm": 1.8902513980865479,
+ "learning_rate": 1.6397016173143043e-08,
+ "loss": 0.0189,
+ "step": 36051
+ },
+ {
+ "epoch": 98.23433242506812,
+ "grad_norm": 2.1218597888946533,
+ "learning_rate": 1.6346538766710552e-08,
+ "loss": 0.0863,
+ "step": 36052
+ },
+ {
+ "epoch": 98.23705722070845,
+ "grad_norm": 3.2340712547302246,
+ "learning_rate": 1.6296139112649268e-08,
+ "loss": 0.0603,
+ "step": 36053
+ },
+ {
+ "epoch": 98.23978201634877,
+ "grad_norm": 3.202751398086548,
+ "learning_rate": 1.6245817211353322e-08,
+ "loss": 0.099,
+ "step": 36054
+ },
+ {
+ "epoch": 98.2425068119891,
+ "grad_norm": 2.7101292610168457,
+ "learning_rate": 1.61955730632124e-08,
+ "loss": 0.0193,
+ "step": 36055
+ },
+ {
+ "epoch": 98.24523160762942,
+ "grad_norm": 1.6028387546539307,
+ "learning_rate": 1.6145406668619523e-08,
+ "loss": 0.028,
+ "step": 36056
+ },
+ {
+ "epoch": 98.24795640326975,
+ "grad_norm": 3.7268786430358887,
+ "learning_rate": 1.609531802796549e-08,
+ "loss": 0.0414,
+ "step": 36057
+ },
+ {
+ "epoch": 98.25068119891009,
+ "grad_norm": 2.2488632202148438,
+ "learning_rate": 1.604530714163888e-08,
+ "loss": 0.0246,
+ "step": 36058
+ },
+ {
+ "epoch": 98.2534059945504,
+ "grad_norm": 2.7443923950195312,
+ "learning_rate": 1.5995374010030483e-08,
+ "loss": 0.1881,
+ "step": 36059
+ },
+ {
+ "epoch": 98.25613079019074,
+ "grad_norm": 4.7676682472229,
+ "learning_rate": 1.594551863352889e-08,
+ "loss": 0.0768,
+ "step": 36060
+ },
+ {
+ "epoch": 98.25885558583106,
+ "grad_norm": 2.9786148071289062,
+ "learning_rate": 1.5895741012521558e-08,
+ "loss": 0.0934,
+ "step": 36061
+ },
+ {
+ "epoch": 98.26158038147139,
+ "grad_norm": 3.0991547107696533,
+ "learning_rate": 1.5846041147397072e-08,
+ "loss": 0.044,
+ "step": 36062
+ },
+ {
+ "epoch": 98.26430517711172,
+ "grad_norm": 1.976578950881958,
+ "learning_rate": 1.5796419038542897e-08,
+ "loss": 0.0169,
+ "step": 36063
+ },
+ {
+ "epoch": 98.26702997275204,
+ "grad_norm": 2.9477286338806152,
+ "learning_rate": 1.5746874686344284e-08,
+ "loss": 0.0365,
+ "step": 36064
+ },
+ {
+ "epoch": 98.26975476839237,
+ "grad_norm": 1.9412206411361694,
+ "learning_rate": 1.5697408091188694e-08,
+ "loss": 0.0223,
+ "step": 36065
+ },
+ {
+ "epoch": 98.2724795640327,
+ "grad_norm": 2.5030250549316406,
+ "learning_rate": 1.5648019253459156e-08,
+ "loss": 0.096,
+ "step": 36066
+ },
+ {
+ "epoch": 98.27520435967303,
+ "grad_norm": 1.2808163166046143,
+ "learning_rate": 1.5598708173542032e-08,
+ "loss": 0.0171,
+ "step": 36067
+ },
+ {
+ "epoch": 98.27792915531334,
+ "grad_norm": 2.0064923763275146,
+ "learning_rate": 1.5549474851820346e-08,
+ "loss": 0.0263,
+ "step": 36068
+ },
+ {
+ "epoch": 98.28065395095368,
+ "grad_norm": 2.899421215057373,
+ "learning_rate": 1.5500319288678234e-08,
+ "loss": 0.0847,
+ "step": 36069
+ },
+ {
+ "epoch": 98.28337874659401,
+ "grad_norm": 3.2286341190338135,
+ "learning_rate": 1.5451241484498724e-08,
+ "loss": 0.0996,
+ "step": 36070
+ },
+ {
+ "epoch": 98.28610354223433,
+ "grad_norm": 2.4577603340148926,
+ "learning_rate": 1.5402241439663736e-08,
+ "loss": 0.0692,
+ "step": 36071
+ },
+ {
+ "epoch": 98.28882833787466,
+ "grad_norm": 2.7878971099853516,
+ "learning_rate": 1.535331915455407e-08,
+ "loss": 0.0471,
+ "step": 36072
+ },
+ {
+ "epoch": 98.29155313351498,
+ "grad_norm": 2.434969186782837,
+ "learning_rate": 1.5304474629551648e-08,
+ "loss": 0.0244,
+ "step": 36073
+ },
+ {
+ "epoch": 98.29427792915531,
+ "grad_norm": 2.7359986305236816,
+ "learning_rate": 1.5255707865036163e-08,
+ "loss": 0.0523,
+ "step": 36074
+ },
+ {
+ "epoch": 98.29700272479565,
+ "grad_norm": 1.842993140220642,
+ "learning_rate": 1.5207018861388423e-08,
+ "loss": 0.0415,
+ "step": 36075
+ },
+ {
+ "epoch": 98.29972752043597,
+ "grad_norm": 3.4313676357269287,
+ "learning_rate": 1.5158407618987014e-08,
+ "loss": 0.0666,
+ "step": 36076
+ },
+ {
+ "epoch": 98.3024523160763,
+ "grad_norm": 1.4521300792694092,
+ "learning_rate": 1.5109874138210522e-08,
+ "loss": 0.0185,
+ "step": 36077
+ },
+ {
+ "epoch": 98.30517711171662,
+ "grad_norm": 2.410409688949585,
+ "learning_rate": 1.5061418419437536e-08,
+ "loss": 0.0668,
+ "step": 36078
+ },
+ {
+ "epoch": 98.30790190735695,
+ "grad_norm": 1.9829622507095337,
+ "learning_rate": 1.5013040463043305e-08,
+ "loss": 0.0319,
+ "step": 36079
+ },
+ {
+ "epoch": 98.31062670299727,
+ "grad_norm": 2.0669567584991455,
+ "learning_rate": 1.496474026940753e-08,
+ "loss": 0.0344,
+ "step": 36080
+ },
+ {
+ "epoch": 98.3133514986376,
+ "grad_norm": 2.6750333309173584,
+ "learning_rate": 1.4916517838904355e-08,
+ "loss": 0.037,
+ "step": 36081
+ },
+ {
+ "epoch": 98.31607629427793,
+ "grad_norm": 1.5951213836669922,
+ "learning_rate": 1.4868373171910144e-08,
+ "loss": 0.027,
+ "step": 36082
+ },
+ {
+ "epoch": 98.31880108991825,
+ "grad_norm": 1.3873144388198853,
+ "learning_rate": 1.4820306268800155e-08,
+ "loss": 0.0157,
+ "step": 36083
+ },
+ {
+ "epoch": 98.32152588555859,
+ "grad_norm": 1.8574143648147583,
+ "learning_rate": 1.4772317129947422e-08,
+ "loss": 0.0481,
+ "step": 36084
+ },
+ {
+ "epoch": 98.3242506811989,
+ "grad_norm": 3.45485782623291,
+ "learning_rate": 1.47244057557272e-08,
+ "loss": 0.1301,
+ "step": 36085
+ },
+ {
+ "epoch": 98.32697547683924,
+ "grad_norm": 2.714715003967285,
+ "learning_rate": 1.4676572146511414e-08,
+ "loss": 0.1108,
+ "step": 36086
+ },
+ {
+ "epoch": 98.32970027247957,
+ "grad_norm": 2.4655139446258545,
+ "learning_rate": 1.46288163026731e-08,
+ "loss": 0.0625,
+ "step": 36087
+ },
+ {
+ "epoch": 98.33242506811989,
+ "grad_norm": 5.965032577514648,
+ "learning_rate": 1.458113822458529e-08,
+ "loss": 0.0718,
+ "step": 36088
+ },
+ {
+ "epoch": 98.33514986376022,
+ "grad_norm": 1.9181727170944214,
+ "learning_rate": 1.453353791261658e-08,
+ "loss": 0.0481,
+ "step": 36089
+ },
+ {
+ "epoch": 98.33787465940054,
+ "grad_norm": 2.015746593475342,
+ "learning_rate": 1.4486015367140005e-08,
+ "loss": 0.093,
+ "step": 36090
+ },
+ {
+ "epoch": 98.34059945504087,
+ "grad_norm": 2.7315802574157715,
+ "learning_rate": 1.443857058852527e-08,
+ "loss": 0.0274,
+ "step": 36091
+ },
+ {
+ "epoch": 98.34332425068119,
+ "grad_norm": 2.158799171447754,
+ "learning_rate": 1.4391203577140966e-08,
+ "loss": 0.0705,
+ "step": 36092
+ },
+ {
+ "epoch": 98.34604904632153,
+ "grad_norm": 3.0152547359466553,
+ "learning_rate": 1.4343914333356801e-08,
+ "loss": 0.1108,
+ "step": 36093
+ },
+ {
+ "epoch": 98.34877384196186,
+ "grad_norm": 2.108616352081299,
+ "learning_rate": 1.4296702857541367e-08,
+ "loss": 0.0309,
+ "step": 36094
+ },
+ {
+ "epoch": 98.35149863760218,
+ "grad_norm": 2.5189340114593506,
+ "learning_rate": 1.4249569150061037e-08,
+ "loss": 0.0299,
+ "step": 36095
+ },
+ {
+ "epoch": 98.35422343324251,
+ "grad_norm": 2.253386974334717,
+ "learning_rate": 1.4202513211284408e-08,
+ "loss": 0.1952,
+ "step": 36096
+ },
+ {
+ "epoch": 98.35694822888283,
+ "grad_norm": 1.5023448467254639,
+ "learning_rate": 1.415553504157674e-08,
+ "loss": 0.0541,
+ "step": 36097
+ },
+ {
+ "epoch": 98.35967302452316,
+ "grad_norm": 1.9690170288085938,
+ "learning_rate": 1.4108634641304409e-08,
+ "loss": 0.0254,
+ "step": 36098
+ },
+ {
+ "epoch": 98.3623978201635,
+ "grad_norm": 2.67514967918396,
+ "learning_rate": 1.4061812010832676e-08,
+ "loss": 0.0541,
+ "step": 36099
+ },
+ {
+ "epoch": 98.36512261580381,
+ "grad_norm": 2.0228111743927,
+ "learning_rate": 1.4015067150525696e-08,
+ "loss": 0.0244,
+ "step": 36100
+ },
+ {
+ "epoch": 98.36784741144415,
+ "grad_norm": 3.1129562854766846,
+ "learning_rate": 1.3968400060748733e-08,
+ "loss": 0.0341,
+ "step": 36101
+ },
+ {
+ "epoch": 98.37057220708446,
+ "grad_norm": 2.7543745040893555,
+ "learning_rate": 1.3921810741864828e-08,
+ "loss": 0.0343,
+ "step": 36102
+ },
+ {
+ "epoch": 98.3732970027248,
+ "grad_norm": 4.894028186798096,
+ "learning_rate": 1.3875299194235914e-08,
+ "loss": 0.0757,
+ "step": 36103
+ },
+ {
+ "epoch": 98.37602179836512,
+ "grad_norm": 2.0562045574188232,
+ "learning_rate": 1.3828865418223925e-08,
+ "loss": 0.0341,
+ "step": 36104
+ },
+ {
+ "epoch": 98.37874659400545,
+ "grad_norm": 5.251753330230713,
+ "learning_rate": 1.3782509414191902e-08,
+ "loss": 0.0528,
+ "step": 36105
+ },
+ {
+ "epoch": 98.38147138964578,
+ "grad_norm": 4.380325794219971,
+ "learning_rate": 1.373623118250067e-08,
+ "loss": 0.0289,
+ "step": 36106
+ },
+ {
+ "epoch": 98.3841961852861,
+ "grad_norm": 3.9425055980682373,
+ "learning_rate": 1.3690030723509939e-08,
+ "loss": 0.075,
+ "step": 36107
+ },
+ {
+ "epoch": 98.38692098092643,
+ "grad_norm": 3.0681300163269043,
+ "learning_rate": 1.3643908037580533e-08,
+ "loss": 0.184,
+ "step": 36108
+ },
+ {
+ "epoch": 98.38964577656675,
+ "grad_norm": 2.5093634128570557,
+ "learning_rate": 1.3597863125069943e-08,
+ "loss": 0.0444,
+ "step": 36109
+ },
+ {
+ "epoch": 98.39237057220708,
+ "grad_norm": 2.9992306232452393,
+ "learning_rate": 1.3551895986338993e-08,
+ "loss": 0.1239,
+ "step": 36110
+ },
+ {
+ "epoch": 98.39509536784742,
+ "grad_norm": 2.3570594787597656,
+ "learning_rate": 1.3506006621742951e-08,
+ "loss": 0.0403,
+ "step": 36111
+ },
+ {
+ "epoch": 98.39782016348774,
+ "grad_norm": 2.0751588344573975,
+ "learning_rate": 1.3460195031641532e-08,
+ "loss": 0.1548,
+ "step": 36112
+ },
+ {
+ "epoch": 98.40054495912807,
+ "grad_norm": 3.247391939163208,
+ "learning_rate": 1.3414461216391117e-08,
+ "loss": 0.0984,
+ "step": 36113
+ },
+ {
+ "epoch": 98.40326975476839,
+ "grad_norm": 1.9408838748931885,
+ "learning_rate": 1.3368805176346977e-08,
+ "loss": 0.0262,
+ "step": 36114
+ },
+ {
+ "epoch": 98.40599455040872,
+ "grad_norm": 3.2725577354431152,
+ "learning_rate": 1.3323226911864385e-08,
+ "loss": 0.123,
+ "step": 36115
+ },
+ {
+ "epoch": 98.40871934604904,
+ "grad_norm": 2.6939446926116943,
+ "learning_rate": 1.327772642330083e-08,
+ "loss": 0.0371,
+ "step": 36116
+ },
+ {
+ "epoch": 98.41144414168937,
+ "grad_norm": 2.5777392387390137,
+ "learning_rate": 1.3232303711007143e-08,
+ "loss": 0.0715,
+ "step": 36117
+ },
+ {
+ "epoch": 98.4141689373297,
+ "grad_norm": 2.5360629558563232,
+ "learning_rate": 1.3186958775339709e-08,
+ "loss": 0.0458,
+ "step": 36118
+ },
+ {
+ "epoch": 98.41689373297002,
+ "grad_norm": 2.9892444610595703,
+ "learning_rate": 1.3141691616651575e-08,
+ "loss": 0.1276,
+ "step": 36119
+ },
+ {
+ "epoch": 98.41961852861036,
+ "grad_norm": 3.8520965576171875,
+ "learning_rate": 1.3096502235293573e-08,
+ "loss": 0.1467,
+ "step": 36120
+ },
+ {
+ "epoch": 98.42234332425068,
+ "grad_norm": 1.4537595510482788,
+ "learning_rate": 1.3051390631618755e-08,
+ "loss": 0.0925,
+ "step": 36121
+ },
+ {
+ "epoch": 98.42506811989101,
+ "grad_norm": 3.732198715209961,
+ "learning_rate": 1.3006356805977949e-08,
+ "loss": 0.1491,
+ "step": 36122
+ },
+ {
+ "epoch": 98.42779291553134,
+ "grad_norm": 2.4978554248809814,
+ "learning_rate": 1.2961400758721987e-08,
+ "loss": 0.0511,
+ "step": 36123
+ },
+ {
+ "epoch": 98.43051771117166,
+ "grad_norm": 4.112996578216553,
+ "learning_rate": 1.2916522490201699e-08,
+ "loss": 0.0407,
+ "step": 36124
+ },
+ {
+ "epoch": 98.433242506812,
+ "grad_norm": 1.5079231262207031,
+ "learning_rate": 1.2871722000766806e-08,
+ "loss": 0.0155,
+ "step": 36125
+ },
+ {
+ "epoch": 98.43596730245231,
+ "grad_norm": 2.5488126277923584,
+ "learning_rate": 1.2826999290764807e-08,
+ "loss": 0.0576,
+ "step": 36126
+ },
+ {
+ "epoch": 98.43869209809264,
+ "grad_norm": 3.4591064453125,
+ "learning_rate": 1.2782354360544314e-08,
+ "loss": 0.0393,
+ "step": 36127
+ },
+ {
+ "epoch": 98.44141689373296,
+ "grad_norm": 2.671058416366577,
+ "learning_rate": 1.2737787210453933e-08,
+ "loss": 0.0665,
+ "step": 36128
+ },
+ {
+ "epoch": 98.4441416893733,
+ "grad_norm": 3.291278123855591,
+ "learning_rate": 1.2693297840840058e-08,
+ "loss": 0.0498,
+ "step": 36129
+ },
+ {
+ "epoch": 98.44686648501363,
+ "grad_norm": 3.0969431400299072,
+ "learning_rate": 1.2648886252050186e-08,
+ "loss": 0.068,
+ "step": 36130
+ },
+ {
+ "epoch": 98.44959128065395,
+ "grad_norm": 2.8539137840270996,
+ "learning_rate": 1.2604552444428487e-08,
+ "loss": 0.0499,
+ "step": 36131
+ },
+ {
+ "epoch": 98.45231607629428,
+ "grad_norm": 2.5560038089752197,
+ "learning_rate": 1.2560296418320239e-08,
+ "loss": 0.0398,
+ "step": 36132
+ },
+ {
+ "epoch": 98.4550408719346,
+ "grad_norm": 2.3815579414367676,
+ "learning_rate": 1.2516118174071834e-08,
+ "loss": 0.026,
+ "step": 36133
+ },
+ {
+ "epoch": 98.45776566757493,
+ "grad_norm": 1.9051722288131714,
+ "learning_rate": 1.2472017712027439e-08,
+ "loss": 0.0295,
+ "step": 36134
+ },
+ {
+ "epoch": 98.46049046321527,
+ "grad_norm": 2.047534704208374,
+ "learning_rate": 1.2427995032527895e-08,
+ "loss": 0.0307,
+ "step": 36135
+ },
+ {
+ "epoch": 98.46321525885558,
+ "grad_norm": 1.9832487106323242,
+ "learning_rate": 1.238405013591848e-08,
+ "loss": 0.056,
+ "step": 36136
+ },
+ {
+ "epoch": 98.46594005449592,
+ "grad_norm": 2.251464605331421,
+ "learning_rate": 1.2340183022541142e-08,
+ "loss": 0.0343,
+ "step": 36137
+ },
+ {
+ "epoch": 98.46866485013624,
+ "grad_norm": 1.642418622970581,
+ "learning_rate": 1.2296393692735608e-08,
+ "loss": 0.0187,
+ "step": 36138
+ },
+ {
+ "epoch": 98.47138964577657,
+ "grad_norm": 2.1609480381011963,
+ "learning_rate": 1.225268214684494e-08,
+ "loss": 0.0845,
+ "step": 36139
+ },
+ {
+ "epoch": 98.47411444141689,
+ "grad_norm": 2.5468668937683105,
+ "learning_rate": 1.2209048385209977e-08,
+ "loss": 0.1115,
+ "step": 36140
+ },
+ {
+ "epoch": 98.47683923705722,
+ "grad_norm": 3.6908071041107178,
+ "learning_rate": 1.2165492408168223e-08,
+ "loss": 0.046,
+ "step": 36141
+ },
+ {
+ "epoch": 98.47956403269755,
+ "grad_norm": 3.202972173690796,
+ "learning_rate": 1.2122014216060518e-08,
+ "loss": 0.1119,
+ "step": 36142
+ },
+ {
+ "epoch": 98.48228882833787,
+ "grad_norm": 3.602304458618164,
+ "learning_rate": 1.2078613809225482e-08,
+ "loss": 0.0756,
+ "step": 36143
+ },
+ {
+ "epoch": 98.4850136239782,
+ "grad_norm": 3.881646156311035,
+ "learning_rate": 1.2035291187999509e-08,
+ "loss": 0.0448,
+ "step": 36144
+ },
+ {
+ "epoch": 98.48773841961852,
+ "grad_norm": 1.424583911895752,
+ "learning_rate": 1.199204635272233e-08,
+ "loss": 0.013,
+ "step": 36145
+ },
+ {
+ "epoch": 98.49046321525886,
+ "grad_norm": 1.6723031997680664,
+ "learning_rate": 1.1948879303729233e-08,
+ "loss": 0.0118,
+ "step": 36146
+ },
+ {
+ "epoch": 98.49318801089919,
+ "grad_norm": 3.3834898471832275,
+ "learning_rate": 1.1905790041357724e-08,
+ "loss": 0.028,
+ "step": 36147
+ },
+ {
+ "epoch": 98.49591280653951,
+ "grad_norm": 1.136795997619629,
+ "learning_rate": 1.1862778565940869e-08,
+ "loss": 0.0156,
+ "step": 36148
+ },
+ {
+ "epoch": 98.49863760217984,
+ "grad_norm": 2.5485243797302246,
+ "learning_rate": 1.1819844877816178e-08,
+ "loss": 0.0458,
+ "step": 36149
+ },
+ {
+ "epoch": 98.50136239782016,
+ "grad_norm": 2.5030970573425293,
+ "learning_rate": 1.1776988977316717e-08,
+ "loss": 0.061,
+ "step": 36150
+ },
+ {
+ "epoch": 98.50408719346049,
+ "grad_norm": 4.324421405792236,
+ "learning_rate": 1.1734210864777773e-08,
+ "loss": 0.1569,
+ "step": 36151
+ },
+ {
+ "epoch": 98.50681198910081,
+ "grad_norm": 2.1284096240997314,
+ "learning_rate": 1.1691510540530193e-08,
+ "loss": 0.0599,
+ "step": 36152
+ },
+ {
+ "epoch": 98.50953678474114,
+ "grad_norm": 1.4949356317520142,
+ "learning_rate": 1.1648888004907043e-08,
+ "loss": 0.0183,
+ "step": 36153
+ },
+ {
+ "epoch": 98.51226158038148,
+ "grad_norm": 2.3864893913269043,
+ "learning_rate": 1.1606343258242503e-08,
+ "loss": 0.1269,
+ "step": 36154
+ },
+ {
+ "epoch": 98.5149863760218,
+ "grad_norm": 1.6330173015594482,
+ "learning_rate": 1.1563876300865195e-08,
+ "loss": 0.0367,
+ "step": 36155
+ },
+ {
+ "epoch": 98.51771117166213,
+ "grad_norm": 3.575246810913086,
+ "learning_rate": 1.152148713310708e-08,
+ "loss": 0.0872,
+ "step": 36156
+ },
+ {
+ "epoch": 98.52043596730245,
+ "grad_norm": 2.4141902923583984,
+ "learning_rate": 1.1479175755297889e-08,
+ "loss": 0.0862,
+ "step": 36157
+ },
+ {
+ "epoch": 98.52316076294278,
+ "grad_norm": 1.7315680980682373,
+ "learning_rate": 1.1436942167768472e-08,
+ "loss": 0.0661,
+ "step": 36158
+ },
+ {
+ "epoch": 98.52588555858311,
+ "grad_norm": 2.7438507080078125,
+ "learning_rate": 1.1394786370845234e-08,
+ "loss": 0.1063,
+ "step": 36159
+ },
+ {
+ "epoch": 98.52861035422343,
+ "grad_norm": 2.2468864917755127,
+ "learning_rate": 1.1352708364859022e-08,
+ "loss": 0.0189,
+ "step": 36160
+ },
+ {
+ "epoch": 98.53133514986376,
+ "grad_norm": 2.3657684326171875,
+ "learning_rate": 1.131070815013624e-08,
+ "loss": 0.0293,
+ "step": 36161
+ },
+ {
+ "epoch": 98.53405994550408,
+ "grad_norm": 3.182272434234619,
+ "learning_rate": 1.1268785727004406e-08,
+ "loss": 0.1786,
+ "step": 36162
+ },
+ {
+ "epoch": 98.53678474114442,
+ "grad_norm": 3.479954242706299,
+ "learning_rate": 1.1226941095788813e-08,
+ "loss": 0.051,
+ "step": 36163
+ },
+ {
+ "epoch": 98.53950953678473,
+ "grad_norm": 2.0503923892974854,
+ "learning_rate": 1.1185174256816978e-08,
+ "loss": 0.0247,
+ "step": 36164
+ },
+ {
+ "epoch": 98.54223433242507,
+ "grad_norm": 2.055842399597168,
+ "learning_rate": 1.1143485210413086e-08,
+ "loss": 0.0238,
+ "step": 36165
+ },
+ {
+ "epoch": 98.5449591280654,
+ "grad_norm": 3.5154647827148438,
+ "learning_rate": 1.1101873956902431e-08,
+ "loss": 0.0838,
+ "step": 36166
+ },
+ {
+ "epoch": 98.54768392370572,
+ "grad_norm": 9.433673858642578,
+ "learning_rate": 1.10603404966092e-08,
+ "loss": 0.0289,
+ "step": 36167
+ },
+ {
+ "epoch": 98.55040871934605,
+ "grad_norm": 4.547787189483643,
+ "learning_rate": 1.101888482985647e-08,
+ "loss": 0.0366,
+ "step": 36168
+ },
+ {
+ "epoch": 98.55313351498637,
+ "grad_norm": 2.169792652130127,
+ "learning_rate": 1.0977506956967309e-08,
+ "loss": 0.0235,
+ "step": 36169
+ },
+ {
+ "epoch": 98.5558583106267,
+ "grad_norm": 5.074012756347656,
+ "learning_rate": 1.093620687826369e-08,
+ "loss": 0.0531,
+ "step": 36170
+ },
+ {
+ "epoch": 98.55858310626704,
+ "grad_norm": 2.4713664054870605,
+ "learning_rate": 1.0894984594067571e-08,
+ "loss": 0.0533,
+ "step": 36171
+ },
+ {
+ "epoch": 98.56130790190736,
+ "grad_norm": 1.9822112321853638,
+ "learning_rate": 1.0853840104698698e-08,
+ "loss": 0.0322,
+ "step": 36172
+ },
+ {
+ "epoch": 98.56403269754769,
+ "grad_norm": 4.8559136390686035,
+ "learning_rate": 1.0812773410480148e-08,
+ "loss": 0.0784,
+ "step": 36173
+ },
+ {
+ "epoch": 98.566757493188,
+ "grad_norm": 3.35929012298584,
+ "learning_rate": 1.0771784511729444e-08,
+ "loss": 0.11,
+ "step": 36174
+ },
+ {
+ "epoch": 98.56948228882834,
+ "grad_norm": 1.8584080934524536,
+ "learning_rate": 1.0730873408766329e-08,
+ "loss": 0.0279,
+ "step": 36175
+ },
+ {
+ "epoch": 98.57220708446866,
+ "grad_norm": 3.7485361099243164,
+ "learning_rate": 1.0690040101910549e-08,
+ "loss": 0.0979,
+ "step": 36176
+ },
+ {
+ "epoch": 98.57493188010899,
+ "grad_norm": 2.447479248046875,
+ "learning_rate": 1.0649284591478514e-08,
+ "loss": 0.0633,
+ "step": 36177
+ },
+ {
+ "epoch": 98.57765667574932,
+ "grad_norm": 1.4438681602478027,
+ "learning_rate": 1.0608606877788863e-08,
+ "loss": 0.0764,
+ "step": 36178
+ },
+ {
+ "epoch": 98.58038147138964,
+ "grad_norm": 3.983067274093628,
+ "learning_rate": 1.0568006961156895e-08,
+ "loss": 0.0306,
+ "step": 36179
+ },
+ {
+ "epoch": 98.58310626702998,
+ "grad_norm": 1.738135576248169,
+ "learning_rate": 1.0527484841900137e-08,
+ "loss": 0.0292,
+ "step": 36180
+ },
+ {
+ "epoch": 98.5858310626703,
+ "grad_norm": 2.455057382583618,
+ "learning_rate": 1.0487040520335e-08,
+ "loss": 0.0323,
+ "step": 36181
+ },
+ {
+ "epoch": 98.58855585831063,
+ "grad_norm": 1.8972069025039673,
+ "learning_rate": 1.044667399677457e-08,
+ "loss": 0.0241,
+ "step": 36182
+ },
+ {
+ "epoch": 98.59128065395096,
+ "grad_norm": 2.701190710067749,
+ "learning_rate": 1.0406385271533037e-08,
+ "loss": 0.0959,
+ "step": 36183
+ },
+ {
+ "epoch": 98.59400544959128,
+ "grad_norm": 3.047895908355713,
+ "learning_rate": 1.0366174344925705e-08,
+ "loss": 0.0672,
+ "step": 36184
+ },
+ {
+ "epoch": 98.59673024523161,
+ "grad_norm": 2.033413887023926,
+ "learning_rate": 1.0326041217265659e-08,
+ "loss": 0.1726,
+ "step": 36185
+ },
+ {
+ "epoch": 98.59945504087193,
+ "grad_norm": 2.644911527633667,
+ "learning_rate": 1.0285985888863759e-08,
+ "loss": 0.0378,
+ "step": 36186
+ },
+ {
+ "epoch": 98.60217983651226,
+ "grad_norm": 2.7324492931365967,
+ "learning_rate": 1.0246008360034199e-08,
+ "loss": 0.0484,
+ "step": 36187
+ },
+ {
+ "epoch": 98.60490463215258,
+ "grad_norm": 2.0621514320373535,
+ "learning_rate": 1.020610863108673e-08,
+ "loss": 0.0755,
+ "step": 36188
+ },
+ {
+ "epoch": 98.60762942779292,
+ "grad_norm": 2.5982513427734375,
+ "learning_rate": 1.0166286702332218e-08,
+ "loss": 0.0341,
+ "step": 36189
+ },
+ {
+ "epoch": 98.61035422343325,
+ "grad_norm": 2.2652432918548584,
+ "learning_rate": 1.0126542574081521e-08,
+ "loss": 0.0354,
+ "step": 36190
+ },
+ {
+ "epoch": 98.61307901907357,
+ "grad_norm": 2.6030406951904297,
+ "learning_rate": 1.0086876246644395e-08,
+ "loss": 0.0826,
+ "step": 36191
+ },
+ {
+ "epoch": 98.6158038147139,
+ "grad_norm": 2.524291515350342,
+ "learning_rate": 1.0047287720328369e-08,
+ "loss": 0.0447,
+ "step": 36192
+ },
+ {
+ "epoch": 98.61852861035422,
+ "grad_norm": 1.7350260019302368,
+ "learning_rate": 1.0007776995442087e-08,
+ "loss": 0.0363,
+ "step": 36193
+ },
+ {
+ "epoch": 98.62125340599455,
+ "grad_norm": 2.4189505577087402,
+ "learning_rate": 9.96834407229419e-09,
+ "loss": 0.0332,
+ "step": 36194
+ },
+ {
+ "epoch": 98.62397820163488,
+ "grad_norm": 2.639000415802002,
+ "learning_rate": 9.928988951192209e-09,
+ "loss": 0.0343,
+ "step": 36195
+ },
+ {
+ "epoch": 98.6267029972752,
+ "grad_norm": 2.462409019470215,
+ "learning_rate": 9.889711632440346e-09,
+ "loss": 0.0336,
+ "step": 36196
+ },
+ {
+ "epoch": 98.62942779291554,
+ "grad_norm": 2.373863458633423,
+ "learning_rate": 9.850512116347245e-09,
+ "loss": 0.1455,
+ "step": 36197
+ },
+ {
+ "epoch": 98.63215258855585,
+ "grad_norm": 2.109741449356079,
+ "learning_rate": 9.811390403215992e-09,
+ "loss": 0.0429,
+ "step": 36198
+ },
+ {
+ "epoch": 98.63487738419619,
+ "grad_norm": 2.0638701915740967,
+ "learning_rate": 9.772346493351902e-09,
+ "loss": 0.0302,
+ "step": 36199
+ },
+ {
+ "epoch": 98.6376021798365,
+ "grad_norm": 3.05644154548645,
+ "learning_rate": 9.733380387059177e-09,
+ "loss": 0.2133,
+ "step": 36200
+ },
+ {
+ "epoch": 98.64032697547684,
+ "grad_norm": 3.4912054538726807,
+ "learning_rate": 9.694492084642016e-09,
+ "loss": 0.0805,
+ "step": 36201
+ },
+ {
+ "epoch": 98.64305177111717,
+ "grad_norm": 2.714277744293213,
+ "learning_rate": 9.6556815864024e-09,
+ "loss": 0.0427,
+ "step": 36202
+ },
+ {
+ "epoch": 98.64577656675749,
+ "grad_norm": 2.102691411972046,
+ "learning_rate": 9.616948892642307e-09,
+ "loss": 0.1589,
+ "step": 36203
+ },
+ {
+ "epoch": 98.64850136239782,
+ "grad_norm": 2.0056819915771484,
+ "learning_rate": 9.578294003664835e-09,
+ "loss": 0.0388,
+ "step": 36204
+ },
+ {
+ "epoch": 98.65122615803814,
+ "grad_norm": 3.3613219261169434,
+ "learning_rate": 9.539716919768626e-09,
+ "loss": 0.1596,
+ "step": 36205
+ },
+ {
+ "epoch": 98.65395095367847,
+ "grad_norm": 3.162074089050293,
+ "learning_rate": 9.501217641256776e-09,
+ "loss": 0.0988,
+ "step": 36206
+ },
+ {
+ "epoch": 98.65667574931881,
+ "grad_norm": 3.202958822250366,
+ "learning_rate": 9.462796168427935e-09,
+ "loss": 0.0974,
+ "step": 36207
+ },
+ {
+ "epoch": 98.65940054495913,
+ "grad_norm": 1.555505633354187,
+ "learning_rate": 9.42445250158075e-09,
+ "loss": 0.02,
+ "step": 36208
+ },
+ {
+ "epoch": 98.66212534059946,
+ "grad_norm": 5.151355266571045,
+ "learning_rate": 9.386186641013872e-09,
+ "loss": 0.0285,
+ "step": 36209
+ },
+ {
+ "epoch": 98.66485013623978,
+ "grad_norm": 2.0583536624908447,
+ "learning_rate": 9.347998587027063e-09,
+ "loss": 0.024,
+ "step": 36210
+ },
+ {
+ "epoch": 98.66757493188011,
+ "grad_norm": 2.2810378074645996,
+ "learning_rate": 9.30988833991564e-09,
+ "loss": 0.0576,
+ "step": 36211
+ },
+ {
+ "epoch": 98.67029972752043,
+ "grad_norm": 2.646106004714966,
+ "learning_rate": 9.271855899977144e-09,
+ "loss": 0.0264,
+ "step": 36212
+ },
+ {
+ "epoch": 98.67302452316076,
+ "grad_norm": 2.243086338043213,
+ "learning_rate": 9.233901267509115e-09,
+ "loss": 0.0927,
+ "step": 36213
+ },
+ {
+ "epoch": 98.6757493188011,
+ "grad_norm": 1.8522670269012451,
+ "learning_rate": 9.196024442804652e-09,
+ "loss": 0.0445,
+ "step": 36214
+ },
+ {
+ "epoch": 98.67847411444141,
+ "grad_norm": 2.2108867168426514,
+ "learning_rate": 9.158225426160183e-09,
+ "loss": 0.0687,
+ "step": 36215
+ },
+ {
+ "epoch": 98.68119891008175,
+ "grad_norm": 2.378458261489868,
+ "learning_rate": 9.120504217871029e-09,
+ "loss": 0.1945,
+ "step": 36216
+ },
+ {
+ "epoch": 98.68392370572207,
+ "grad_norm": 2.6821839809417725,
+ "learning_rate": 9.082860818228068e-09,
+ "loss": 0.1039,
+ "step": 36217
+ },
+ {
+ "epoch": 98.6866485013624,
+ "grad_norm": 2.8306756019592285,
+ "learning_rate": 9.045295227527728e-09,
+ "loss": 0.0531,
+ "step": 36218
+ },
+ {
+ "epoch": 98.68937329700273,
+ "grad_norm": 2.138756036758423,
+ "learning_rate": 9.007807446059779e-09,
+ "loss": 0.1238,
+ "step": 36219
+ },
+ {
+ "epoch": 98.69209809264305,
+ "grad_norm": 2.8362069129943848,
+ "learning_rate": 8.970397474118431e-09,
+ "loss": 0.0756,
+ "step": 36220
+ },
+ {
+ "epoch": 98.69482288828338,
+ "grad_norm": 1.5811744928359985,
+ "learning_rate": 8.93306531199345e-09,
+ "loss": 0.0255,
+ "step": 36221
+ },
+ {
+ "epoch": 98.6975476839237,
+ "grad_norm": 2.259927988052368,
+ "learning_rate": 8.895810959976825e-09,
+ "loss": 0.0324,
+ "step": 36222
+ },
+ {
+ "epoch": 98.70027247956403,
+ "grad_norm": 2.612879991531372,
+ "learning_rate": 8.858634418358325e-09,
+ "loss": 0.0418,
+ "step": 36223
+ },
+ {
+ "epoch": 98.70299727520435,
+ "grad_norm": 2.5344955921173096,
+ "learning_rate": 8.821535687426609e-09,
+ "loss": 0.029,
+ "step": 36224
+ },
+ {
+ "epoch": 98.70572207084469,
+ "grad_norm": 13.622929573059082,
+ "learning_rate": 8.784514767470331e-09,
+ "loss": 0.0871,
+ "step": 36225
+ },
+ {
+ "epoch": 98.70844686648502,
+ "grad_norm": 1.8633819818496704,
+ "learning_rate": 8.747571658780373e-09,
+ "loss": 0.0222,
+ "step": 36226
+ },
+ {
+ "epoch": 98.71117166212534,
+ "grad_norm": 2.615386486053467,
+ "learning_rate": 8.710706361642063e-09,
+ "loss": 0.0578,
+ "step": 36227
+ },
+ {
+ "epoch": 98.71389645776567,
+ "grad_norm": 2.52996563911438,
+ "learning_rate": 8.673918876342947e-09,
+ "loss": 0.0966,
+ "step": 36228
+ },
+ {
+ "epoch": 98.71662125340599,
+ "grad_norm": 1.7542939186096191,
+ "learning_rate": 8.63720920316946e-09,
+ "loss": 0.0367,
+ "step": 36229
+ },
+ {
+ "epoch": 98.71934604904632,
+ "grad_norm": 2.614475727081299,
+ "learning_rate": 8.600577342408046e-09,
+ "loss": 0.0735,
+ "step": 36230
+ },
+ {
+ "epoch": 98.72207084468666,
+ "grad_norm": 4.2264814376831055,
+ "learning_rate": 8.564023294344026e-09,
+ "loss": 0.0692,
+ "step": 36231
+ },
+ {
+ "epoch": 98.72479564032697,
+ "grad_norm": 1.6859139204025269,
+ "learning_rate": 8.527547059262731e-09,
+ "loss": 0.1277,
+ "step": 36232
+ },
+ {
+ "epoch": 98.7275204359673,
+ "grad_norm": 2.428453207015991,
+ "learning_rate": 8.491148637446156e-09,
+ "loss": 0.0275,
+ "step": 36233
+ },
+ {
+ "epoch": 98.73024523160763,
+ "grad_norm": 4.541210651397705,
+ "learning_rate": 8.454828029178518e-09,
+ "loss": 0.0867,
+ "step": 36234
+ },
+ {
+ "epoch": 98.73297002724796,
+ "grad_norm": 2.7328550815582275,
+ "learning_rate": 8.418585234744037e-09,
+ "loss": 0.1257,
+ "step": 36235
+ },
+ {
+ "epoch": 98.73569482288828,
+ "grad_norm": 1.9844528436660767,
+ "learning_rate": 8.382420254424706e-09,
+ "loss": 0.0273,
+ "step": 36236
+ },
+ {
+ "epoch": 98.73841961852861,
+ "grad_norm": 2.834373950958252,
+ "learning_rate": 8.346333088500303e-09,
+ "loss": 0.0505,
+ "step": 36237
+ },
+ {
+ "epoch": 98.74114441416894,
+ "grad_norm": 2.5058889389038086,
+ "learning_rate": 8.310323737252824e-09,
+ "loss": 0.0267,
+ "step": 36238
+ },
+ {
+ "epoch": 98.74386920980926,
+ "grad_norm": 2.4641990661621094,
+ "learning_rate": 8.274392200964265e-09,
+ "loss": 0.0387,
+ "step": 36239
+ },
+ {
+ "epoch": 98.7465940054496,
+ "grad_norm": 4.683347702026367,
+ "learning_rate": 8.238538479912184e-09,
+ "loss": 0.1611,
+ "step": 36240
+ },
+ {
+ "epoch": 98.74931880108991,
+ "grad_norm": 2.662602186203003,
+ "learning_rate": 8.202762574376355e-09,
+ "loss": 0.0271,
+ "step": 36241
+ },
+ {
+ "epoch": 98.75204359673025,
+ "grad_norm": 2.5227410793304443,
+ "learning_rate": 8.167064484636555e-09,
+ "loss": 0.069,
+ "step": 36242
+ },
+ {
+ "epoch": 98.75476839237058,
+ "grad_norm": 3.3482046127319336,
+ "learning_rate": 8.13144421097034e-09,
+ "loss": 0.0352,
+ "step": 36243
+ },
+ {
+ "epoch": 98.7574931880109,
+ "grad_norm": 2.558753728866577,
+ "learning_rate": 8.095901753654156e-09,
+ "loss": 0.0271,
+ "step": 36244
+ },
+ {
+ "epoch": 98.76021798365123,
+ "grad_norm": 2.3655343055725098,
+ "learning_rate": 8.060437112965558e-09,
+ "loss": 0.0602,
+ "step": 36245
+ },
+ {
+ "epoch": 98.76294277929155,
+ "grad_norm": 2.8100643157958984,
+ "learning_rate": 8.02505028918099e-09,
+ "loss": 0.0667,
+ "step": 36246
+ },
+ {
+ "epoch": 98.76566757493188,
+ "grad_norm": 1.8988646268844604,
+ "learning_rate": 7.989741282575792e-09,
+ "loss": 0.077,
+ "step": 36247
+ },
+ {
+ "epoch": 98.7683923705722,
+ "grad_norm": 2.5409767627716064,
+ "learning_rate": 7.954510093425294e-09,
+ "loss": 0.095,
+ "step": 36248
+ },
+ {
+ "epoch": 98.77111716621253,
+ "grad_norm": 2.4074063301086426,
+ "learning_rate": 7.919356722002613e-09,
+ "loss": 0.0317,
+ "step": 36249
+ },
+ {
+ "epoch": 98.77384196185287,
+ "grad_norm": 1.1986193656921387,
+ "learning_rate": 7.884281168583086e-09,
+ "loss": 0.0141,
+ "step": 36250
+ },
+ {
+ "epoch": 98.77656675749319,
+ "grad_norm": 5.700056552886963,
+ "learning_rate": 7.849283433438714e-09,
+ "loss": 0.0583,
+ "step": 36251
+ },
+ {
+ "epoch": 98.77929155313352,
+ "grad_norm": 3.0358242988586426,
+ "learning_rate": 7.814363516842616e-09,
+ "loss": 0.0546,
+ "step": 36252
+ },
+ {
+ "epoch": 98.78201634877384,
+ "grad_norm": 1.692973256111145,
+ "learning_rate": 7.779521419066793e-09,
+ "loss": 0.0178,
+ "step": 36253
+ },
+ {
+ "epoch": 98.78474114441417,
+ "grad_norm": 4.116315841674805,
+ "learning_rate": 7.744757140382141e-09,
+ "loss": 0.0465,
+ "step": 36254
+ },
+ {
+ "epoch": 98.7874659400545,
+ "grad_norm": 1.8948396444320679,
+ "learning_rate": 7.710070681060666e-09,
+ "loss": 0.0192,
+ "step": 36255
+ },
+ {
+ "epoch": 98.79019073569482,
+ "grad_norm": 1.9507626295089722,
+ "learning_rate": 7.67546204137104e-09,
+ "loss": 0.0448,
+ "step": 36256
+ },
+ {
+ "epoch": 98.79291553133515,
+ "grad_norm": 3.586582660675049,
+ "learning_rate": 7.640931221583048e-09,
+ "loss": 0.0426,
+ "step": 36257
+ },
+ {
+ "epoch": 98.79564032697547,
+ "grad_norm": 3.2128372192382812,
+ "learning_rate": 7.606478221965363e-09,
+ "loss": 0.0405,
+ "step": 36258
+ },
+ {
+ "epoch": 98.7983651226158,
+ "grad_norm": 2.8067307472229004,
+ "learning_rate": 7.572103042787771e-09,
+ "loss": 0.0772,
+ "step": 36259
+ },
+ {
+ "epoch": 98.80108991825612,
+ "grad_norm": 2.903602361679077,
+ "learning_rate": 7.537805684316724e-09,
+ "loss": 0.0514,
+ "step": 36260
+ },
+ {
+ "epoch": 98.80381471389646,
+ "grad_norm": 2.3150784969329834,
+ "learning_rate": 7.503586146819785e-09,
+ "loss": 0.0279,
+ "step": 36261
+ },
+ {
+ "epoch": 98.80653950953679,
+ "grad_norm": 2.790849208831787,
+ "learning_rate": 7.4694444305623e-09,
+ "loss": 0.0524,
+ "step": 36262
+ },
+ {
+ "epoch": 98.80926430517711,
+ "grad_norm": 2.5214614868164062,
+ "learning_rate": 7.4353805358129416e-09,
+ "loss": 0.1017,
+ "step": 36263
+ },
+ {
+ "epoch": 98.81198910081744,
+ "grad_norm": 2.7264602184295654,
+ "learning_rate": 7.401394462833722e-09,
+ "loss": 0.0297,
+ "step": 36264
+ },
+ {
+ "epoch": 98.81471389645776,
+ "grad_norm": 2.5907976627349854,
+ "learning_rate": 7.3674862118922055e-09,
+ "loss": 0.0599,
+ "step": 36265
+ },
+ {
+ "epoch": 98.8174386920981,
+ "grad_norm": 3.868417263031006,
+ "learning_rate": 7.333655783249294e-09,
+ "loss": 0.0575,
+ "step": 36266
+ },
+ {
+ "epoch": 98.82016348773843,
+ "grad_norm": 2.3906784057617188,
+ "learning_rate": 7.299903177171441e-09,
+ "loss": 0.082,
+ "step": 36267
+ },
+ {
+ "epoch": 98.82288828337875,
+ "grad_norm": 7.075655460357666,
+ "learning_rate": 7.2662283939206604e-09,
+ "loss": 0.025,
+ "step": 36268
+ },
+ {
+ "epoch": 98.82561307901908,
+ "grad_norm": 3.075913906097412,
+ "learning_rate": 7.232631433757853e-09,
+ "loss": 0.0504,
+ "step": 36269
+ },
+ {
+ "epoch": 98.8283378746594,
+ "grad_norm": 2.7215065956115723,
+ "learning_rate": 7.1991122969461425e-09,
+ "loss": 0.0616,
+ "step": 36270
+ },
+ {
+ "epoch": 98.83106267029973,
+ "grad_norm": 2.9382898807525635,
+ "learning_rate": 7.165670983746431e-09,
+ "loss": 0.053,
+ "step": 36271
+ },
+ {
+ "epoch": 98.83378746594005,
+ "grad_norm": 3.1600341796875,
+ "learning_rate": 7.132307494418511e-09,
+ "loss": 0.0317,
+ "step": 36272
+ },
+ {
+ "epoch": 98.83651226158038,
+ "grad_norm": 2.2423198223114014,
+ "learning_rate": 7.099021829223285e-09,
+ "loss": 0.0593,
+ "step": 36273
+ },
+ {
+ "epoch": 98.83923705722071,
+ "grad_norm": 2.4246907234191895,
+ "learning_rate": 7.065813988418324e-09,
+ "loss": 0.0484,
+ "step": 36274
+ },
+ {
+ "epoch": 98.84196185286103,
+ "grad_norm": 2.9497811794281006,
+ "learning_rate": 7.032683972263421e-09,
+ "loss": 0.0344,
+ "step": 36275
+ },
+ {
+ "epoch": 98.84468664850137,
+ "grad_norm": 1.5730886459350586,
+ "learning_rate": 6.999631781017258e-09,
+ "loss": 0.0173,
+ "step": 36276
+ },
+ {
+ "epoch": 98.84741144414168,
+ "grad_norm": 2.204084634780884,
+ "learning_rate": 6.966657414935185e-09,
+ "loss": 0.0454,
+ "step": 36277
+ },
+ {
+ "epoch": 98.85013623978202,
+ "grad_norm": 2.1484272480010986,
+ "learning_rate": 6.933760874274775e-09,
+ "loss": 0.0466,
+ "step": 36278
+ },
+ {
+ "epoch": 98.85286103542235,
+ "grad_norm": 2.359956741333008,
+ "learning_rate": 6.9009421592936e-09,
+ "loss": 0.0305,
+ "step": 36279
+ },
+ {
+ "epoch": 98.85558583106267,
+ "grad_norm": 3.301863670349121,
+ "learning_rate": 6.8682012702459e-09,
+ "loss": 0.085,
+ "step": 36280
+ },
+ {
+ "epoch": 98.858310626703,
+ "grad_norm": 1.8629157543182373,
+ "learning_rate": 6.835538207387027e-09,
+ "loss": 0.0227,
+ "step": 36281
+ },
+ {
+ "epoch": 98.86103542234332,
+ "grad_norm": 1.7687841653823853,
+ "learning_rate": 6.802952970971222e-09,
+ "loss": 0.0311,
+ "step": 36282
+ },
+ {
+ "epoch": 98.86376021798365,
+ "grad_norm": 2.2203309535980225,
+ "learning_rate": 6.770445561252725e-09,
+ "loss": 0.0374,
+ "step": 36283
+ },
+ {
+ "epoch": 98.86648501362397,
+ "grad_norm": 3.330214023590088,
+ "learning_rate": 6.738015978484669e-09,
+ "loss": 0.0371,
+ "step": 36284
+ },
+ {
+ "epoch": 98.8692098092643,
+ "grad_norm": 2.2659683227539062,
+ "learning_rate": 6.705664222919072e-09,
+ "loss": 0.0565,
+ "step": 36285
+ },
+ {
+ "epoch": 98.87193460490464,
+ "grad_norm": 2.4965755939483643,
+ "learning_rate": 6.673390294807958e-09,
+ "loss": 0.0605,
+ "step": 36286
+ },
+ {
+ "epoch": 98.87465940054496,
+ "grad_norm": 2.2927823066711426,
+ "learning_rate": 6.641194194402234e-09,
+ "loss": 0.0253,
+ "step": 36287
+ },
+ {
+ "epoch": 98.87738419618529,
+ "grad_norm": 2.6198787689208984,
+ "learning_rate": 6.609075921953923e-09,
+ "loss": 0.0968,
+ "step": 36288
+ },
+ {
+ "epoch": 98.88010899182561,
+ "grad_norm": 2.3675615787506104,
+ "learning_rate": 6.577035477712823e-09,
+ "loss": 0.0383,
+ "step": 36289
+ },
+ {
+ "epoch": 98.88283378746594,
+ "grad_norm": 3.417741298675537,
+ "learning_rate": 6.545072861927626e-09,
+ "loss": 0.097,
+ "step": 36290
+ },
+ {
+ "epoch": 98.88555858310627,
+ "grad_norm": 1.915927529335022,
+ "learning_rate": 6.5131880748481314e-09,
+ "loss": 0.0749,
+ "step": 36291
+ },
+ {
+ "epoch": 98.88828337874659,
+ "grad_norm": 2.6985626220703125,
+ "learning_rate": 6.481381116721919e-09,
+ "loss": 0.0901,
+ "step": 36292
+ },
+ {
+ "epoch": 98.89100817438693,
+ "grad_norm": 3.038095235824585,
+ "learning_rate": 6.449651987797678e-09,
+ "loss": 0.0373,
+ "step": 36293
+ },
+ {
+ "epoch": 98.89373297002724,
+ "grad_norm": 2.512392520904541,
+ "learning_rate": 6.418000688320769e-09,
+ "loss": 0.0248,
+ "step": 36294
+ },
+ {
+ "epoch": 98.89645776566758,
+ "grad_norm": 1.378581166267395,
+ "learning_rate": 6.386427218539881e-09,
+ "loss": 0.0157,
+ "step": 36295
+ },
+ {
+ "epoch": 98.8991825613079,
+ "grad_norm": 1.49094557762146,
+ "learning_rate": 6.354931578699264e-09,
+ "loss": 0.0318,
+ "step": 36296
+ },
+ {
+ "epoch": 98.90190735694823,
+ "grad_norm": 2.465254545211792,
+ "learning_rate": 6.323513769045386e-09,
+ "loss": 0.0295,
+ "step": 36297
+ },
+ {
+ "epoch": 98.90463215258856,
+ "grad_norm": 2.6463098526000977,
+ "learning_rate": 6.292173789821387e-09,
+ "loss": 0.0393,
+ "step": 36298
+ },
+ {
+ "epoch": 98.90735694822888,
+ "grad_norm": 2.901310920715332,
+ "learning_rate": 6.260911641272626e-09,
+ "loss": 0.0693,
+ "step": 36299
+ },
+ {
+ "epoch": 98.91008174386921,
+ "grad_norm": 2.0929248332977295,
+ "learning_rate": 6.229727323643353e-09,
+ "loss": 0.1131,
+ "step": 36300
+ },
+ {
+ "epoch": 98.91280653950953,
+ "grad_norm": 2.5953946113586426,
+ "learning_rate": 6.198620837174485e-09,
+ "loss": 0.0463,
+ "step": 36301
+ },
+ {
+ "epoch": 98.91553133514986,
+ "grad_norm": 2.3402748107910156,
+ "learning_rate": 6.167592182108051e-09,
+ "loss": 0.0297,
+ "step": 36302
+ },
+ {
+ "epoch": 98.9182561307902,
+ "grad_norm": 2.9301769733428955,
+ "learning_rate": 6.1366413586883e-09,
+ "loss": 0.1096,
+ "step": 36303
+ },
+ {
+ "epoch": 98.92098092643052,
+ "grad_norm": 3.1592493057250977,
+ "learning_rate": 6.10576836715393e-09,
+ "loss": 0.0623,
+ "step": 36304
+ },
+ {
+ "epoch": 98.92370572207085,
+ "grad_norm": 2.4974987506866455,
+ "learning_rate": 6.07497320774697e-09,
+ "loss": 0.0535,
+ "step": 36305
+ },
+ {
+ "epoch": 98.92643051771117,
+ "grad_norm": 1.8690325021743774,
+ "learning_rate": 6.044255880705008e-09,
+ "loss": 0.1418,
+ "step": 36306
+ },
+ {
+ "epoch": 98.9291553133515,
+ "grad_norm": 2.1339619159698486,
+ "learning_rate": 6.013616386270071e-09,
+ "loss": 0.018,
+ "step": 36307
+ },
+ {
+ "epoch": 98.93188010899182,
+ "grad_norm": 1.7211685180664062,
+ "learning_rate": 5.983054724679749e-09,
+ "loss": 0.0186,
+ "step": 36308
+ },
+ {
+ "epoch": 98.93460490463215,
+ "grad_norm": 2.7866098880767822,
+ "learning_rate": 5.952570896170518e-09,
+ "loss": 0.0359,
+ "step": 36309
+ },
+ {
+ "epoch": 98.93732970027249,
+ "grad_norm": 3.0363857746124268,
+ "learning_rate": 5.9221649009810756e-09,
+ "loss": 0.0381,
+ "step": 36310
+ },
+ {
+ "epoch": 98.9400544959128,
+ "grad_norm": 6.504725456237793,
+ "learning_rate": 5.891836739349011e-09,
+ "loss": 0.0466,
+ "step": 36311
+ },
+ {
+ "epoch": 98.94277929155314,
+ "grad_norm": 2.009805679321289,
+ "learning_rate": 5.86158641150969e-09,
+ "loss": 0.0238,
+ "step": 36312
+ },
+ {
+ "epoch": 98.94550408719346,
+ "grad_norm": 3.1905014514923096,
+ "learning_rate": 5.83141391769737e-09,
+ "loss": 0.0407,
+ "step": 36313
+ },
+ {
+ "epoch": 98.94822888283379,
+ "grad_norm": 2.685636520385742,
+ "learning_rate": 5.80131925814964e-09,
+ "loss": 0.0229,
+ "step": 36314
+ },
+ {
+ "epoch": 98.95095367847412,
+ "grad_norm": 2.8348448276519775,
+ "learning_rate": 5.771302433098536e-09,
+ "loss": 0.0467,
+ "step": 36315
+ },
+ {
+ "epoch": 98.95367847411444,
+ "grad_norm": 3.036760091781616,
+ "learning_rate": 5.741363442779424e-09,
+ "loss": 0.0544,
+ "step": 36316
+ },
+ {
+ "epoch": 98.95640326975477,
+ "grad_norm": 2.766896963119507,
+ "learning_rate": 5.711502287425452e-09,
+ "loss": 0.0347,
+ "step": 36317
+ },
+ {
+ "epoch": 98.95912806539509,
+ "grad_norm": 1.3856438398361206,
+ "learning_rate": 5.6817189672675464e-09,
+ "loss": 0.0166,
+ "step": 36318
+ },
+ {
+ "epoch": 98.96185286103542,
+ "grad_norm": 2.2274909019470215,
+ "learning_rate": 5.652013482539964e-09,
+ "loss": 0.1188,
+ "step": 36319
+ },
+ {
+ "epoch": 98.96457765667574,
+ "grad_norm": 1.9218724966049194,
+ "learning_rate": 5.6223858334725215e-09,
+ "loss": 0.0305,
+ "step": 36320
+ },
+ {
+ "epoch": 98.96730245231608,
+ "grad_norm": 2.904686689376831,
+ "learning_rate": 5.592836020295034e-09,
+ "loss": 0.0803,
+ "step": 36321
+ },
+ {
+ "epoch": 98.97002724795641,
+ "grad_norm": 1.8116261959075928,
+ "learning_rate": 5.563364043240649e-09,
+ "loss": 0.0276,
+ "step": 36322
+ },
+ {
+ "epoch": 98.97275204359673,
+ "grad_norm": 2.1489503383636475,
+ "learning_rate": 5.533969902535852e-09,
+ "loss": 0.1026,
+ "step": 36323
+ },
+ {
+ "epoch": 98.97547683923706,
+ "grad_norm": 2.3643507957458496,
+ "learning_rate": 5.504653598411569e-09,
+ "loss": 0.0418,
+ "step": 36324
+ },
+ {
+ "epoch": 98.97820163487738,
+ "grad_norm": 1.8588837385177612,
+ "learning_rate": 5.475415131094286e-09,
+ "loss": 0.0258,
+ "step": 36325
+ },
+ {
+ "epoch": 98.98092643051771,
+ "grad_norm": 3.1523587703704834,
+ "learning_rate": 5.446254500813819e-09,
+ "loss": 0.1419,
+ "step": 36326
+ },
+ {
+ "epoch": 98.98365122615803,
+ "grad_norm": 3.467860221862793,
+ "learning_rate": 5.417171707795544e-09,
+ "loss": 0.0603,
+ "step": 36327
+ },
+ {
+ "epoch": 98.98637602179836,
+ "grad_norm": 2.8103842735290527,
+ "learning_rate": 5.388166752267054e-09,
+ "loss": 0.0376,
+ "step": 36328
+ },
+ {
+ "epoch": 98.9891008174387,
+ "grad_norm": 2.1515791416168213,
+ "learning_rate": 5.359239634454838e-09,
+ "loss": 0.0339,
+ "step": 36329
+ },
+ {
+ "epoch": 98.99182561307902,
+ "grad_norm": 3.5862340927124023,
+ "learning_rate": 5.330390354582049e-09,
+ "loss": 0.1131,
+ "step": 36330
+ },
+ {
+ "epoch": 98.99455040871935,
+ "grad_norm": 4.1147685050964355,
+ "learning_rate": 5.301618912874062e-09,
+ "loss": 0.1015,
+ "step": 36331
+ },
+ {
+ "epoch": 98.99727520435967,
+ "grad_norm": 4.5505781173706055,
+ "learning_rate": 5.2729253095562535e-09,
+ "loss": 0.1679,
+ "step": 36332
+ },
+ {
+ "epoch": 99.0,
+ "grad_norm": 2.0763278007507324,
+ "learning_rate": 5.2443095448506674e-09,
+ "loss": 0.039,
+ "step": 36333
+ },
+ {
+ "epoch": 99.00272479564033,
+ "grad_norm": 2.160623073577881,
+ "learning_rate": 5.2157716189815685e-09,
+ "loss": 0.0228,
+ "step": 36334
+ },
+ {
+ "epoch": 99.00544959128065,
+ "grad_norm": 2.648790121078491,
+ "learning_rate": 5.1873115321698916e-09,
+ "loss": 0.0254,
+ "step": 36335
+ },
+ {
+ "epoch": 99.00817438692098,
+ "grad_norm": 1.4263352155685425,
+ "learning_rate": 5.158929284637682e-09,
+ "loss": 0.0121,
+ "step": 36336
+ },
+ {
+ "epoch": 99.0108991825613,
+ "grad_norm": 2.350101947784424,
+ "learning_rate": 5.130624876605872e-09,
+ "loss": 0.083,
+ "step": 36337
+ },
+ {
+ "epoch": 99.01362397820164,
+ "grad_norm": 1.9578046798706055,
+ "learning_rate": 5.102398308295398e-09,
+ "loss": 0.0771,
+ "step": 36338
+ },
+ {
+ "epoch": 99.01634877384195,
+ "grad_norm": 2.8038489818573,
+ "learning_rate": 5.074249579924972e-09,
+ "loss": 0.0727,
+ "step": 36339
+ },
+ {
+ "epoch": 99.01907356948229,
+ "grad_norm": 2.09999418258667,
+ "learning_rate": 5.046178691715531e-09,
+ "loss": 0.0247,
+ "step": 36340
+ },
+ {
+ "epoch": 99.02179836512262,
+ "grad_norm": 2.1430397033691406,
+ "learning_rate": 5.018185643884676e-09,
+ "loss": 0.0304,
+ "step": 36341
+ },
+ {
+ "epoch": 99.02452316076294,
+ "grad_norm": 1.720141053199768,
+ "learning_rate": 4.9902704366500135e-09,
+ "loss": 0.0254,
+ "step": 36342
+ },
+ {
+ "epoch": 99.02724795640327,
+ "grad_norm": 1.895276665687561,
+ "learning_rate": 4.9624330702302544e-09,
+ "loss": 0.0384,
+ "step": 36343
+ },
+ {
+ "epoch": 99.02997275204359,
+ "grad_norm": 3.258413076400757,
+ "learning_rate": 4.9346735448407845e-09,
+ "loss": 0.0641,
+ "step": 36344
+ },
+ {
+ "epoch": 99.03269754768392,
+ "grad_norm": 1.620366096496582,
+ "learning_rate": 4.906991860698096e-09,
+ "loss": 0.0307,
+ "step": 36345
+ },
+ {
+ "epoch": 99.03542234332426,
+ "grad_norm": 2.048008680343628,
+ "learning_rate": 4.879388018018683e-09,
+ "loss": 0.0226,
+ "step": 36346
+ },
+ {
+ "epoch": 99.03814713896458,
+ "grad_norm": 2.050539255142212,
+ "learning_rate": 4.8518620170168175e-09,
+ "loss": 0.0248,
+ "step": 36347
+ },
+ {
+ "epoch": 99.04087193460491,
+ "grad_norm": 3.3020405769348145,
+ "learning_rate": 4.824413857906773e-09,
+ "loss": 0.1052,
+ "step": 36348
+ },
+ {
+ "epoch": 99.04359673024523,
+ "grad_norm": 3.141381025314331,
+ "learning_rate": 4.7970435409017136e-09,
+ "loss": 0.0554,
+ "step": 36349
+ },
+ {
+ "epoch": 99.04632152588556,
+ "grad_norm": 14.986294746398926,
+ "learning_rate": 4.769751066217021e-09,
+ "loss": 0.0382,
+ "step": 36350
+ },
+ {
+ "epoch": 99.04904632152588,
+ "grad_norm": 2.1716835498809814,
+ "learning_rate": 4.742536434062528e-09,
+ "loss": 0.0511,
+ "step": 36351
+ },
+ {
+ "epoch": 99.05177111716621,
+ "grad_norm": 2.3615550994873047,
+ "learning_rate": 4.715399644652508e-09,
+ "loss": 0.0452,
+ "step": 36352
+ },
+ {
+ "epoch": 99.05449591280654,
+ "grad_norm": 2.8376779556274414,
+ "learning_rate": 4.6883406981967915e-09,
+ "loss": 0.0363,
+ "step": 36353
+ },
+ {
+ "epoch": 99.05722070844686,
+ "grad_norm": 1.998656153678894,
+ "learning_rate": 4.661359594906323e-09,
+ "loss": 0.0817,
+ "step": 36354
+ },
+ {
+ "epoch": 99.0599455040872,
+ "grad_norm": 2.0303032398223877,
+ "learning_rate": 4.634456334992044e-09,
+ "loss": 0.0369,
+ "step": 36355
+ },
+ {
+ "epoch": 99.06267029972751,
+ "grad_norm": 1.6783592700958252,
+ "learning_rate": 4.607630918662676e-09,
+ "loss": 0.0582,
+ "step": 36356
+ },
+ {
+ "epoch": 99.06539509536785,
+ "grad_norm": 4.393839359283447,
+ "learning_rate": 4.580883346128051e-09,
+ "loss": 0.0314,
+ "step": 36357
+ },
+ {
+ "epoch": 99.06811989100818,
+ "grad_norm": 2.3626253604888916,
+ "learning_rate": 4.554213617594672e-09,
+ "loss": 0.0389,
+ "step": 36358
+ },
+ {
+ "epoch": 99.0708446866485,
+ "grad_norm": 3.6280767917633057,
+ "learning_rate": 4.527621733271259e-09,
+ "loss": 0.1319,
+ "step": 36359
+ },
+ {
+ "epoch": 99.07356948228883,
+ "grad_norm": 2.038217067718506,
+ "learning_rate": 4.5011076933665356e-09,
+ "loss": 0.0224,
+ "step": 36360
+ },
+ {
+ "epoch": 99.07629427792915,
+ "grad_norm": 3.5371341705322266,
+ "learning_rate": 4.474671498083671e-09,
+ "loss": 0.0534,
+ "step": 36361
+ },
+ {
+ "epoch": 99.07901907356948,
+ "grad_norm": 2.664658546447754,
+ "learning_rate": 4.448313147631389e-09,
+ "loss": 0.0848,
+ "step": 36362
+ },
+ {
+ "epoch": 99.0817438692098,
+ "grad_norm": 3.05959153175354,
+ "learning_rate": 4.422032642213969e-09,
+ "loss": 0.037,
+ "step": 36363
+ },
+ {
+ "epoch": 99.08446866485014,
+ "grad_norm": 1.676727294921875,
+ "learning_rate": 4.395829982035693e-09,
+ "loss": 0.0487,
+ "step": 36364
+ },
+ {
+ "epoch": 99.08719346049047,
+ "grad_norm": 2.3347127437591553,
+ "learning_rate": 4.369705167301952e-09,
+ "loss": 0.1061,
+ "step": 36365
+ },
+ {
+ "epoch": 99.08991825613079,
+ "grad_norm": 2.571681261062622,
+ "learning_rate": 4.343658198213696e-09,
+ "loss": 0.0478,
+ "step": 36366
+ },
+ {
+ "epoch": 99.09264305177112,
+ "grad_norm": 1.9872663021087646,
+ "learning_rate": 4.317689074976317e-09,
+ "loss": 0.0279,
+ "step": 36367
+ },
+ {
+ "epoch": 99.09536784741144,
+ "grad_norm": 4.219489574432373,
+ "learning_rate": 4.291797797790764e-09,
+ "loss": 0.0283,
+ "step": 36368
+ },
+ {
+ "epoch": 99.09809264305177,
+ "grad_norm": 3.7424395084381104,
+ "learning_rate": 4.2659843668591e-09,
+ "loss": 0.1513,
+ "step": 36369
+ },
+ {
+ "epoch": 99.1008174386921,
+ "grad_norm": 3.471322536468506,
+ "learning_rate": 4.240248782382272e-09,
+ "loss": 0.0839,
+ "step": 36370
+ },
+ {
+ "epoch": 99.10354223433242,
+ "grad_norm": 2.9463798999786377,
+ "learning_rate": 4.214591044560123e-09,
+ "loss": 0.041,
+ "step": 36371
+ },
+ {
+ "epoch": 99.10626702997276,
+ "grad_norm": 2.3431172370910645,
+ "learning_rate": 4.189011153593603e-09,
+ "loss": 0.0612,
+ "step": 36372
+ },
+ {
+ "epoch": 99.10899182561307,
+ "grad_norm": 1.8754887580871582,
+ "learning_rate": 4.163509109681441e-09,
+ "loss": 0.0209,
+ "step": 36373
+ },
+ {
+ "epoch": 99.11171662125341,
+ "grad_norm": 4.4420366287231445,
+ "learning_rate": 4.1380849130223666e-09,
+ "loss": 0.0855,
+ "step": 36374
+ },
+ {
+ "epoch": 99.11444141689373,
+ "grad_norm": 2.1189613342285156,
+ "learning_rate": 4.112738563814e-09,
+ "loss": 0.1157,
+ "step": 36375
+ },
+ {
+ "epoch": 99.11716621253406,
+ "grad_norm": 3.5993266105651855,
+ "learning_rate": 4.087470062252852e-09,
+ "loss": 0.0905,
+ "step": 36376
+ },
+ {
+ "epoch": 99.11989100817439,
+ "grad_norm": 3.2593681812286377,
+ "learning_rate": 4.06227940853765e-09,
+ "loss": 0.0729,
+ "step": 36377
+ },
+ {
+ "epoch": 99.12261580381471,
+ "grad_norm": 4.9808454513549805,
+ "learning_rate": 4.0371666028637954e-09,
+ "loss": 0.1191,
+ "step": 36378
+ },
+ {
+ "epoch": 99.12534059945504,
+ "grad_norm": 2.3980395793914795,
+ "learning_rate": 4.012131645426687e-09,
+ "loss": 0.0205,
+ "step": 36379
+ },
+ {
+ "epoch": 99.12806539509536,
+ "grad_norm": 2.978144645690918,
+ "learning_rate": 3.987174536421723e-09,
+ "loss": 0.0345,
+ "step": 36380
+ },
+ {
+ "epoch": 99.1307901907357,
+ "grad_norm": 2.6568796634674072,
+ "learning_rate": 3.962295276042083e-09,
+ "loss": 0.0539,
+ "step": 36381
+ },
+ {
+ "epoch": 99.13351498637603,
+ "grad_norm": 2.537956476211548,
+ "learning_rate": 3.937493864483166e-09,
+ "loss": 0.0359,
+ "step": 36382
+ },
+ {
+ "epoch": 99.13623978201635,
+ "grad_norm": 5.514376640319824,
+ "learning_rate": 3.912770301937041e-09,
+ "loss": 0.0443,
+ "step": 36383
+ },
+ {
+ "epoch": 99.13896457765668,
+ "grad_norm": 1.956241250038147,
+ "learning_rate": 3.8881245885957765e-09,
+ "loss": 0.0261,
+ "step": 36384
+ },
+ {
+ "epoch": 99.141689373297,
+ "grad_norm": 1.6229876279830933,
+ "learning_rate": 3.863556724652551e-09,
+ "loss": 0.0154,
+ "step": 36385
+ },
+ {
+ "epoch": 99.14441416893733,
+ "grad_norm": 2.845139741897583,
+ "learning_rate": 3.839066710298323e-09,
+ "loss": 0.0728,
+ "step": 36386
+ },
+ {
+ "epoch": 99.14713896457765,
+ "grad_norm": 3.711958646774292,
+ "learning_rate": 3.81465454572405e-09,
+ "loss": 0.0603,
+ "step": 36387
+ },
+ {
+ "epoch": 99.14986376021798,
+ "grad_norm": 3.5983099937438965,
+ "learning_rate": 3.790320231119582e-09,
+ "loss": 0.0526,
+ "step": 36388
+ },
+ {
+ "epoch": 99.15258855585832,
+ "grad_norm": 4.311792373657227,
+ "learning_rate": 3.766063766673656e-09,
+ "loss": 0.0487,
+ "step": 36389
+ },
+ {
+ "epoch": 99.15531335149863,
+ "grad_norm": 1.893627405166626,
+ "learning_rate": 3.7418851525772296e-09,
+ "loss": 0.0151,
+ "step": 36390
+ },
+ {
+ "epoch": 99.15803814713897,
+ "grad_norm": 1.9946928024291992,
+ "learning_rate": 3.7177843890157108e-09,
+ "loss": 0.0323,
+ "step": 36391
+ },
+ {
+ "epoch": 99.16076294277929,
+ "grad_norm": 3.0589988231658936,
+ "learning_rate": 3.6937614761789474e-09,
+ "loss": 0.0219,
+ "step": 36392
+ },
+ {
+ "epoch": 99.16348773841962,
+ "grad_norm": 1.6643747091293335,
+ "learning_rate": 3.6698164142534574e-09,
+ "loss": 0.0478,
+ "step": 36393
+ },
+ {
+ "epoch": 99.16621253405995,
+ "grad_norm": 2.7943308353424072,
+ "learning_rate": 3.645949203425758e-09,
+ "loss": 0.0319,
+ "step": 36394
+ },
+ {
+ "epoch": 99.16893732970027,
+ "grad_norm": 2.1140692234039307,
+ "learning_rate": 3.6221598438812567e-09,
+ "loss": 0.017,
+ "step": 36395
+ },
+ {
+ "epoch": 99.1716621253406,
+ "grad_norm": 3.405674457550049,
+ "learning_rate": 3.5984483358064703e-09,
+ "loss": 0.0269,
+ "step": 36396
+ },
+ {
+ "epoch": 99.17438692098092,
+ "grad_norm": 1.7860310077667236,
+ "learning_rate": 3.574814679384586e-09,
+ "loss": 0.0224,
+ "step": 36397
+ },
+ {
+ "epoch": 99.17711171662125,
+ "grad_norm": 3.141554832458496,
+ "learning_rate": 3.5512588748010114e-09,
+ "loss": 0.1446,
+ "step": 36398
+ },
+ {
+ "epoch": 99.17983651226157,
+ "grad_norm": 2.2735395431518555,
+ "learning_rate": 3.527780922237822e-09,
+ "loss": 0.0572,
+ "step": 36399
+ },
+ {
+ "epoch": 99.1825613079019,
+ "grad_norm": 2.2199854850769043,
+ "learning_rate": 3.504380821878206e-09,
+ "loss": 0.0327,
+ "step": 36400
+ },
+ {
+ "epoch": 99.18528610354224,
+ "grad_norm": 3.187570810317993,
+ "learning_rate": 3.4810585739053492e-09,
+ "loss": 0.0714,
+ "step": 36401
+ },
+ {
+ "epoch": 99.18801089918256,
+ "grad_norm": 2.511786460876465,
+ "learning_rate": 3.4578141785002182e-09,
+ "loss": 0.0505,
+ "step": 36402
+ },
+ {
+ "epoch": 99.19073569482289,
+ "grad_norm": 1.9665066003799438,
+ "learning_rate": 3.43464763584378e-09,
+ "loss": 0.0881,
+ "step": 36403
+ },
+ {
+ "epoch": 99.19346049046321,
+ "grad_norm": 5.338626384735107,
+ "learning_rate": 3.4115589461169994e-09,
+ "loss": 0.0701,
+ "step": 36404
+ },
+ {
+ "epoch": 99.19618528610354,
+ "grad_norm": 1.8583027124404907,
+ "learning_rate": 3.388548109498624e-09,
+ "loss": 0.0685,
+ "step": 36405
+ },
+ {
+ "epoch": 99.19891008174388,
+ "grad_norm": 2.840616464614868,
+ "learning_rate": 3.3656151261696192e-09,
+ "loss": 0.2491,
+ "step": 36406
+ },
+ {
+ "epoch": 99.2016348773842,
+ "grad_norm": 2.7709131240844727,
+ "learning_rate": 3.3427599963065105e-09,
+ "loss": 0.0333,
+ "step": 36407
+ },
+ {
+ "epoch": 99.20435967302453,
+ "grad_norm": 3.268580436706543,
+ "learning_rate": 3.319982720088044e-09,
+ "loss": 0.0473,
+ "step": 36408
+ },
+ {
+ "epoch": 99.20708446866485,
+ "grad_norm": 3.149470806121826,
+ "learning_rate": 3.2972832976918557e-09,
+ "loss": 0.0759,
+ "step": 36409
+ },
+ {
+ "epoch": 99.20980926430518,
+ "grad_norm": 2.2788093090057373,
+ "learning_rate": 3.274661729295581e-09,
+ "loss": 0.0873,
+ "step": 36410
+ },
+ {
+ "epoch": 99.2125340599455,
+ "grad_norm": 1.9153056144714355,
+ "learning_rate": 3.2521180150735244e-09,
+ "loss": 0.0249,
+ "step": 36411
+ },
+ {
+ "epoch": 99.21525885558583,
+ "grad_norm": 2.340096950531006,
+ "learning_rate": 3.2296521552033223e-09,
+ "loss": 0.1278,
+ "step": 36412
+ },
+ {
+ "epoch": 99.21798365122616,
+ "grad_norm": 2.90765643119812,
+ "learning_rate": 3.207264149857059e-09,
+ "loss": 0.0468,
+ "step": 36413
+ },
+ {
+ "epoch": 99.22070844686648,
+ "grad_norm": 2.310850143432617,
+ "learning_rate": 3.18495399921237e-09,
+ "loss": 0.0321,
+ "step": 36414
+ },
+ {
+ "epoch": 99.22343324250681,
+ "grad_norm": 3.482832193374634,
+ "learning_rate": 3.1627217034413403e-09,
+ "loss": 0.0328,
+ "step": 36415
+ },
+ {
+ "epoch": 99.22615803814713,
+ "grad_norm": 2.7978789806365967,
+ "learning_rate": 3.1405672627171645e-09,
+ "loss": 0.0276,
+ "step": 36416
+ },
+ {
+ "epoch": 99.22888283378747,
+ "grad_norm": 3.4980978965759277,
+ "learning_rate": 3.118490677211927e-09,
+ "loss": 0.0471,
+ "step": 36417
+ },
+ {
+ "epoch": 99.2316076294278,
+ "grad_norm": 1.6601653099060059,
+ "learning_rate": 3.096491947098823e-09,
+ "loss": 0.0757,
+ "step": 36418
+ },
+ {
+ "epoch": 99.23433242506812,
+ "grad_norm": 6.678323268890381,
+ "learning_rate": 3.0745710725477164e-09,
+ "loss": 0.0646,
+ "step": 36419
+ },
+ {
+ "epoch": 99.23705722070845,
+ "grad_norm": 1.7206647396087646,
+ "learning_rate": 3.0527280537306915e-09,
+ "loss": 0.0308,
+ "step": 36420
+ },
+ {
+ "epoch": 99.23978201634877,
+ "grad_norm": 1.7365213632583618,
+ "learning_rate": 3.0309628908176125e-09,
+ "loss": 0.0235,
+ "step": 36421
+ },
+ {
+ "epoch": 99.2425068119891,
+ "grad_norm": 1.6074193716049194,
+ "learning_rate": 3.0092755839772336e-09,
+ "loss": 0.0174,
+ "step": 36422
+ },
+ {
+ "epoch": 99.24523160762942,
+ "grad_norm": 2.532968282699585,
+ "learning_rate": 2.9876661333783084e-09,
+ "loss": 0.0624,
+ "step": 36423
+ },
+ {
+ "epoch": 99.24795640326975,
+ "grad_norm": 2.9972033500671387,
+ "learning_rate": 2.9661345391907013e-09,
+ "loss": 0.2823,
+ "step": 36424
+ },
+ {
+ "epoch": 99.25068119891009,
+ "grad_norm": 2.2182281017303467,
+ "learning_rate": 2.9446808015809457e-09,
+ "loss": 0.0871,
+ "step": 36425
+ },
+ {
+ "epoch": 99.2534059945504,
+ "grad_norm": 2.8645570278167725,
+ "learning_rate": 2.923304920715575e-09,
+ "loss": 0.0635,
+ "step": 36426
+ },
+ {
+ "epoch": 99.25613079019074,
+ "grad_norm": 2.3982489109039307,
+ "learning_rate": 2.902006896762233e-09,
+ "loss": 0.0265,
+ "step": 36427
+ },
+ {
+ "epoch": 99.25885558583106,
+ "grad_norm": 4.365675926208496,
+ "learning_rate": 2.8807867298863425e-09,
+ "loss": 0.0273,
+ "step": 36428
+ },
+ {
+ "epoch": 99.26158038147139,
+ "grad_norm": 2.683900833129883,
+ "learning_rate": 2.8596444202522166e-09,
+ "loss": 0.1043,
+ "step": 36429
+ },
+ {
+ "epoch": 99.26430517711172,
+ "grad_norm": 2.0241880416870117,
+ "learning_rate": 2.8385799680263892e-09,
+ "loss": 0.1868,
+ "step": 36430
+ },
+ {
+ "epoch": 99.26702997275204,
+ "grad_norm": 1.9473216533660889,
+ "learning_rate": 2.817593373372063e-09,
+ "loss": 0.0326,
+ "step": 36431
+ },
+ {
+ "epoch": 99.26975476839237,
+ "grad_norm": 3.1982765197753906,
+ "learning_rate": 2.79668463645244e-09,
+ "loss": 0.0731,
+ "step": 36432
+ },
+ {
+ "epoch": 99.2724795640327,
+ "grad_norm": 1.6564440727233887,
+ "learning_rate": 2.775853757429614e-09,
+ "loss": 0.0189,
+ "step": 36433
+ },
+ {
+ "epoch": 99.27520435967303,
+ "grad_norm": 2.0607547760009766,
+ "learning_rate": 2.755100736467897e-09,
+ "loss": 0.0985,
+ "step": 36434
+ },
+ {
+ "epoch": 99.27792915531334,
+ "grad_norm": 2.2081785202026367,
+ "learning_rate": 2.734425573727162e-09,
+ "loss": 0.023,
+ "step": 36435
+ },
+ {
+ "epoch": 99.28065395095368,
+ "grad_norm": 2.806126594543457,
+ "learning_rate": 2.7138282693683904e-09,
+ "loss": 0.0649,
+ "step": 36436
+ },
+ {
+ "epoch": 99.28337874659401,
+ "grad_norm": 3.082141876220703,
+ "learning_rate": 2.6933088235536752e-09,
+ "loss": 0.0543,
+ "step": 36437
+ },
+ {
+ "epoch": 99.28610354223433,
+ "grad_norm": 2.207090139389038,
+ "learning_rate": 2.672867236440668e-09,
+ "loss": 0.0247,
+ "step": 36438
+ },
+ {
+ "epoch": 99.28882833787466,
+ "grad_norm": 1.978706955909729,
+ "learning_rate": 2.6525035081903516e-09,
+ "loss": 0.0297,
+ "step": 36439
+ },
+ {
+ "epoch": 99.29155313351498,
+ "grad_norm": 2.7729930877685547,
+ "learning_rate": 2.632217638960377e-09,
+ "loss": 0.0251,
+ "step": 36440
+ },
+ {
+ "epoch": 99.29427792915531,
+ "grad_norm": 2.5666956901550293,
+ "learning_rate": 2.6120096289083964e-09,
+ "loss": 0.0736,
+ "step": 36441
+ },
+ {
+ "epoch": 99.29700272479565,
+ "grad_norm": 2.3435373306274414,
+ "learning_rate": 2.5918794781931713e-09,
+ "loss": 0.1035,
+ "step": 36442
+ },
+ {
+ "epoch": 99.29972752043597,
+ "grad_norm": 2.143259286880493,
+ "learning_rate": 2.571827186970133e-09,
+ "loss": 0.0686,
+ "step": 36443
+ },
+ {
+ "epoch": 99.3024523160763,
+ "grad_norm": 3.842270612716675,
+ "learning_rate": 2.551852755395823e-09,
+ "loss": 0.0896,
+ "step": 36444
+ },
+ {
+ "epoch": 99.30517711171662,
+ "grad_norm": 1.5671322345733643,
+ "learning_rate": 2.5319561836267824e-09,
+ "loss": 0.0204,
+ "step": 36445
+ },
+ {
+ "epoch": 99.30790190735695,
+ "grad_norm": 2.957319974899292,
+ "learning_rate": 2.5121374718162228e-09,
+ "loss": 0.0291,
+ "step": 36446
+ },
+ {
+ "epoch": 99.31062670299727,
+ "grad_norm": 1.752927541732788,
+ "learning_rate": 2.4923966201195748e-09,
+ "loss": 0.0245,
+ "step": 36447
+ },
+ {
+ "epoch": 99.3133514986376,
+ "grad_norm": 1.822049856185913,
+ "learning_rate": 2.4727336286900493e-09,
+ "loss": 0.1189,
+ "step": 36448
+ },
+ {
+ "epoch": 99.31607629427793,
+ "grad_norm": 1.785093903541565,
+ "learning_rate": 2.4531484976819677e-09,
+ "loss": 0.0389,
+ "step": 36449
+ },
+ {
+ "epoch": 99.31880108991825,
+ "grad_norm": 1.935732364654541,
+ "learning_rate": 2.4336412272463197e-09,
+ "loss": 0.0252,
+ "step": 36450
+ },
+ {
+ "epoch": 99.32152588555859,
+ "grad_norm": 2.195263147354126,
+ "learning_rate": 2.414211817535206e-09,
+ "loss": 0.0441,
+ "step": 36451
+ },
+ {
+ "epoch": 99.3242506811989,
+ "grad_norm": 1.9610813856124878,
+ "learning_rate": 2.3948602687018375e-09,
+ "loss": 0.0222,
+ "step": 36452
+ },
+ {
+ "epoch": 99.32697547683924,
+ "grad_norm": 2.1458311080932617,
+ "learning_rate": 2.375586580893874e-09,
+ "loss": 0.0311,
+ "step": 36453
+ },
+ {
+ "epoch": 99.32970027247957,
+ "grad_norm": 1.9295579195022583,
+ "learning_rate": 2.3563907542645257e-09,
+ "loss": 0.1235,
+ "step": 36454
+ },
+ {
+ "epoch": 99.33242506811989,
+ "grad_norm": 2.887185573577881,
+ "learning_rate": 2.337272788961453e-09,
+ "loss": 0.0348,
+ "step": 36455
+ },
+ {
+ "epoch": 99.33514986376022,
+ "grad_norm": 1.5260833501815796,
+ "learning_rate": 2.318232685133426e-09,
+ "loss": 0.0667,
+ "step": 36456
+ },
+ {
+ "epoch": 99.33787465940054,
+ "grad_norm": 1.5578218698501587,
+ "learning_rate": 2.2992704429292136e-09,
+ "loss": 0.024,
+ "step": 36457
+ },
+ {
+ "epoch": 99.34059945504087,
+ "grad_norm": 1.683821439743042,
+ "learning_rate": 2.280386062497586e-09,
+ "loss": 0.0202,
+ "step": 36458
+ },
+ {
+ "epoch": 99.34332425068119,
+ "grad_norm": 3.2472360134124756,
+ "learning_rate": 2.2615795439839826e-09,
+ "loss": 0.0341,
+ "step": 36459
+ },
+ {
+ "epoch": 99.34604904632153,
+ "grad_norm": 4.313271522521973,
+ "learning_rate": 2.242850887534953e-09,
+ "loss": 0.1013,
+ "step": 36460
+ },
+ {
+ "epoch": 99.34877384196186,
+ "grad_norm": 3.0428760051727295,
+ "learning_rate": 2.2242000932970464e-09,
+ "loss": 0.0309,
+ "step": 36461
+ },
+ {
+ "epoch": 99.35149863760218,
+ "grad_norm": 2.2389774322509766,
+ "learning_rate": 2.205627161415702e-09,
+ "loss": 0.0399,
+ "step": 36462
+ },
+ {
+ "epoch": 99.35422343324251,
+ "grad_norm": 1.8114615678787231,
+ "learning_rate": 2.187132092034139e-09,
+ "loss": 0.0216,
+ "step": 36463
+ },
+ {
+ "epoch": 99.35694822888283,
+ "grad_norm": 3.40175461769104,
+ "learning_rate": 2.168714885298906e-09,
+ "loss": 0.0247,
+ "step": 36464
+ },
+ {
+ "epoch": 99.35967302452316,
+ "grad_norm": 2.9031620025634766,
+ "learning_rate": 2.150375541351002e-09,
+ "loss": 0.0329,
+ "step": 36465
+ },
+ {
+ "epoch": 99.3623978201635,
+ "grad_norm": 3.3373162746429443,
+ "learning_rate": 2.1321140603336452e-09,
+ "loss": 0.0241,
+ "step": 36466
+ },
+ {
+ "epoch": 99.36512261580381,
+ "grad_norm": 1.999098539352417,
+ "learning_rate": 2.113930442390055e-09,
+ "loss": 0.021,
+ "step": 36467
+ },
+ {
+ "epoch": 99.36784741144415,
+ "grad_norm": 2.326115608215332,
+ "learning_rate": 2.09582468766234e-09,
+ "loss": 0.0679,
+ "step": 36468
+ },
+ {
+ "epoch": 99.37057220708446,
+ "grad_norm": 11.089275360107422,
+ "learning_rate": 2.0777967962892775e-09,
+ "loss": 0.1068,
+ "step": 36469
+ },
+ {
+ "epoch": 99.3732970027248,
+ "grad_norm": 3.55578351020813,
+ "learning_rate": 2.059846768412976e-09,
+ "loss": 0.0205,
+ "step": 36470
+ },
+ {
+ "epoch": 99.37602179836512,
+ "grad_norm": 1.9651052951812744,
+ "learning_rate": 2.0419746041733247e-09,
+ "loss": 0.0592,
+ "step": 36471
+ },
+ {
+ "epoch": 99.37874659400545,
+ "grad_norm": 2.7975447177886963,
+ "learning_rate": 2.0241803037091002e-09,
+ "loss": 0.0518,
+ "step": 36472
+ },
+ {
+ "epoch": 99.38147138964578,
+ "grad_norm": 6.04313325881958,
+ "learning_rate": 2.0064638671579706e-09,
+ "loss": 0.1152,
+ "step": 36473
+ },
+ {
+ "epoch": 99.3841961852861,
+ "grad_norm": 2.5856568813323975,
+ "learning_rate": 1.988825294658714e-09,
+ "loss": 0.1662,
+ "step": 36474
+ },
+ {
+ "epoch": 99.38692098092643,
+ "grad_norm": 2.250094175338745,
+ "learning_rate": 1.9712645863489977e-09,
+ "loss": 0.07,
+ "step": 36475
+ },
+ {
+ "epoch": 99.38964577656675,
+ "grad_norm": 2.380284309387207,
+ "learning_rate": 1.9537817423653794e-09,
+ "loss": 0.0531,
+ "step": 36476
+ },
+ {
+ "epoch": 99.39237057220708,
+ "grad_norm": 2.2417728900909424,
+ "learning_rate": 1.9363767628444164e-09,
+ "loss": 0.0748,
+ "step": 36477
+ },
+ {
+ "epoch": 99.39509536784742,
+ "grad_norm": 2.6770682334899902,
+ "learning_rate": 1.919049647920446e-09,
+ "loss": 0.05,
+ "step": 36478
+ },
+ {
+ "epoch": 99.39782016348774,
+ "grad_norm": 3.7568910121917725,
+ "learning_rate": 1.9018003977289147e-09,
+ "loss": 0.0294,
+ "step": 36479
+ },
+ {
+ "epoch": 99.40054495912807,
+ "grad_norm": 2.4807164669036865,
+ "learning_rate": 1.8846290124052703e-09,
+ "loss": 0.0256,
+ "step": 36480
+ },
+ {
+ "epoch": 99.40326975476839,
+ "grad_norm": 4.318384170532227,
+ "learning_rate": 1.8675354920816293e-09,
+ "loss": 0.1189,
+ "step": 36481
+ },
+ {
+ "epoch": 99.40599455040872,
+ "grad_norm": 2.2268853187561035,
+ "learning_rate": 1.8505198368923282e-09,
+ "loss": 0.0317,
+ "step": 36482
+ },
+ {
+ "epoch": 99.40871934604904,
+ "grad_norm": 2.5289037227630615,
+ "learning_rate": 1.833582046968374e-09,
+ "loss": 0.0271,
+ "step": 36483
+ },
+ {
+ "epoch": 99.41144414168937,
+ "grad_norm": 2.2588653564453125,
+ "learning_rate": 1.8167221224441035e-09,
+ "loss": 0.0973,
+ "step": 36484
+ },
+ {
+ "epoch": 99.4141689373297,
+ "grad_norm": 2.657165288925171,
+ "learning_rate": 1.799940063448302e-09,
+ "loss": 0.0832,
+ "step": 36485
+ },
+ {
+ "epoch": 99.41689373297002,
+ "grad_norm": 2.0009355545043945,
+ "learning_rate": 1.783235870113087e-09,
+ "loss": 0.0297,
+ "step": 36486
+ },
+ {
+ "epoch": 99.41961852861036,
+ "grad_norm": 2.1202259063720703,
+ "learning_rate": 1.7666095425683538e-09,
+ "loss": 0.0381,
+ "step": 36487
+ },
+ {
+ "epoch": 99.42234332425068,
+ "grad_norm": 2.0005722045898438,
+ "learning_rate": 1.7500610809439989e-09,
+ "loss": 0.0269,
+ "step": 36488
+ },
+ {
+ "epoch": 99.42506811989101,
+ "grad_norm": 1.8287826776504517,
+ "learning_rate": 1.7335904853676977e-09,
+ "loss": 0.023,
+ "step": 36489
+ },
+ {
+ "epoch": 99.42779291553134,
+ "grad_norm": 2.116440534591675,
+ "learning_rate": 1.7171977559682363e-09,
+ "loss": 0.0485,
+ "step": 36490
+ },
+ {
+ "epoch": 99.43051771117166,
+ "grad_norm": 2.248250722885132,
+ "learning_rate": 1.70088289287329e-09,
+ "loss": 0.0537,
+ "step": 36491
+ },
+ {
+ "epoch": 99.433242506812,
+ "grad_norm": 3.7882604598999023,
+ "learning_rate": 1.684645896210535e-09,
+ "loss": 0.0244,
+ "step": 36492
+ },
+ {
+ "epoch": 99.43596730245231,
+ "grad_norm": 2.1944730281829834,
+ "learning_rate": 1.6684867661065363e-09,
+ "loss": 0.0898,
+ "step": 36493
+ },
+ {
+ "epoch": 99.43869209809264,
+ "grad_norm": 2.940349817276001,
+ "learning_rate": 1.6524055026856388e-09,
+ "loss": 0.0978,
+ "step": 36494
+ },
+ {
+ "epoch": 99.44141689373296,
+ "grad_norm": 2.730057716369629,
+ "learning_rate": 1.6364021060744084e-09,
+ "loss": 0.0567,
+ "step": 36495
+ },
+ {
+ "epoch": 99.4441416893733,
+ "grad_norm": 2.3615787029266357,
+ "learning_rate": 1.6204765763971897e-09,
+ "loss": 0.0447,
+ "step": 36496
+ },
+ {
+ "epoch": 99.44686648501363,
+ "grad_norm": 2.5666565895080566,
+ "learning_rate": 1.6046289137783277e-09,
+ "loss": 0.0623,
+ "step": 36497
+ },
+ {
+ "epoch": 99.44959128065395,
+ "grad_norm": 4.310489654541016,
+ "learning_rate": 1.5888591183399472e-09,
+ "loss": 0.1389,
+ "step": 36498
+ },
+ {
+ "epoch": 99.45231607629428,
+ "grad_norm": 2.57661771774292,
+ "learning_rate": 1.5731671902063927e-09,
+ "loss": 0.0811,
+ "step": 36499
+ },
+ {
+ "epoch": 99.4550408719346,
+ "grad_norm": 2.558673620223999,
+ "learning_rate": 1.557553129498679e-09,
+ "loss": 0.0345,
+ "step": 36500
+ },
+ {
+ "epoch": 99.45776566757493,
+ "grad_norm": 3.643984317779541,
+ "learning_rate": 1.5420169363389303e-09,
+ "loss": 0.0345,
+ "step": 36501
+ },
+ {
+ "epoch": 99.46049046321527,
+ "grad_norm": 2.4214136600494385,
+ "learning_rate": 1.5265586108481612e-09,
+ "loss": 0.1484,
+ "step": 36502
+ },
+ {
+ "epoch": 99.46321525885558,
+ "grad_norm": 2.4700000286102295,
+ "learning_rate": 1.5111781531473856e-09,
+ "loss": 0.0313,
+ "step": 36503
+ },
+ {
+ "epoch": 99.46594005449592,
+ "grad_norm": 2.7732627391815186,
+ "learning_rate": 1.4958755633542876e-09,
+ "loss": 0.0269,
+ "step": 36504
+ },
+ {
+ "epoch": 99.46866485013624,
+ "grad_norm": 2.753965139389038,
+ "learning_rate": 1.4806508415909914e-09,
+ "loss": 0.0943,
+ "step": 36505
+ },
+ {
+ "epoch": 99.47138964577657,
+ "grad_norm": 2.1247220039367676,
+ "learning_rate": 1.4655039879740706e-09,
+ "loss": 0.2098,
+ "step": 36506
+ },
+ {
+ "epoch": 99.47411444141689,
+ "grad_norm": 2.5269577503204346,
+ "learning_rate": 1.4504350026223192e-09,
+ "loss": 0.0488,
+ "step": 36507
+ },
+ {
+ "epoch": 99.47683923705722,
+ "grad_norm": 1.9422529935836792,
+ "learning_rate": 1.43544388565231e-09,
+ "loss": 0.0172,
+ "step": 36508
+ },
+ {
+ "epoch": 99.47956403269755,
+ "grad_norm": 3.2932417392730713,
+ "learning_rate": 1.4205306371817274e-09,
+ "loss": 0.0342,
+ "step": 36509
+ },
+ {
+ "epoch": 99.48228882833787,
+ "grad_norm": 4.437108039855957,
+ "learning_rate": 1.405695257326034e-09,
+ "loss": 0.148,
+ "step": 36510
+ },
+ {
+ "epoch": 99.4850136239782,
+ "grad_norm": 1.8429901599884033,
+ "learning_rate": 1.3909377462006933e-09,
+ "loss": 0.145,
+ "step": 36511
+ },
+ {
+ "epoch": 99.48773841961852,
+ "grad_norm": 2.8696699142456055,
+ "learning_rate": 1.3762581039211686e-09,
+ "loss": 0.0878,
+ "step": 36512
+ },
+ {
+ "epoch": 99.49046321525886,
+ "grad_norm": 3.777517557144165,
+ "learning_rate": 1.3616563306018126e-09,
+ "loss": 0.0543,
+ "step": 36513
+ },
+ {
+ "epoch": 99.49318801089919,
+ "grad_norm": 2.00805401802063,
+ "learning_rate": 1.3471324263558684e-09,
+ "loss": 0.0207,
+ "step": 36514
+ },
+ {
+ "epoch": 99.49591280653951,
+ "grad_norm": 2.38852596282959,
+ "learning_rate": 1.3326863912965782e-09,
+ "loss": 0.0959,
+ "step": 36515
+ },
+ {
+ "epoch": 99.49863760217984,
+ "grad_norm": 2.6656932830810547,
+ "learning_rate": 1.318318225536075e-09,
+ "loss": 0.0883,
+ "step": 36516
+ },
+ {
+ "epoch": 99.50136239782016,
+ "grad_norm": 4.719111919403076,
+ "learning_rate": 1.3040279291876013e-09,
+ "loss": 0.071,
+ "step": 36517
+ },
+ {
+ "epoch": 99.50408719346049,
+ "grad_norm": 2.596975803375244,
+ "learning_rate": 1.2898155023610692e-09,
+ "loss": 0.1507,
+ "step": 36518
+ },
+ {
+ "epoch": 99.50681198910081,
+ "grad_norm": 4.292980194091797,
+ "learning_rate": 1.2756809451675012e-09,
+ "loss": 0.0935,
+ "step": 36519
+ },
+ {
+ "epoch": 99.50953678474114,
+ "grad_norm": 2.4347875118255615,
+ "learning_rate": 1.2616242577168092e-09,
+ "loss": 0.0316,
+ "step": 36520
+ },
+ {
+ "epoch": 99.51226158038148,
+ "grad_norm": 2.349003791809082,
+ "learning_rate": 1.2476454401200155e-09,
+ "loss": 0.0832,
+ "step": 36521
+ },
+ {
+ "epoch": 99.5149863760218,
+ "grad_norm": 1.5870577096939087,
+ "learning_rate": 1.2337444924837017e-09,
+ "loss": 0.0706,
+ "step": 36522
+ },
+ {
+ "epoch": 99.51771117166213,
+ "grad_norm": 2.5609068870544434,
+ "learning_rate": 1.2199214149177795e-09,
+ "loss": 0.092,
+ "step": 36523
+ },
+ {
+ "epoch": 99.52043596730245,
+ "grad_norm": 2.1779537200927734,
+ "learning_rate": 1.2061762075288307e-09,
+ "loss": 0.0374,
+ "step": 36524
+ },
+ {
+ "epoch": 99.52316076294278,
+ "grad_norm": 1.9448508024215698,
+ "learning_rate": 1.192508870424547e-09,
+ "loss": 0.0225,
+ "step": 36525
+ },
+ {
+ "epoch": 99.52588555858311,
+ "grad_norm": 3.0391459465026855,
+ "learning_rate": 1.1789194037115093e-09,
+ "loss": 0.1417,
+ "step": 36526
+ },
+ {
+ "epoch": 99.52861035422343,
+ "grad_norm": 2.4883079528808594,
+ "learning_rate": 1.1654078074940788e-09,
+ "loss": 0.0598,
+ "step": 36527
+ },
+ {
+ "epoch": 99.53133514986376,
+ "grad_norm": 3.8180992603302,
+ "learning_rate": 1.1519740818799473e-09,
+ "loss": 0.0397,
+ "step": 36528
+ },
+ {
+ "epoch": 99.53405994550408,
+ "grad_norm": 2.5799219608306885,
+ "learning_rate": 1.1386182269723656e-09,
+ "loss": 0.0308,
+ "step": 36529
+ },
+ {
+ "epoch": 99.53678474114442,
+ "grad_norm": 2.159740924835205,
+ "learning_rate": 1.1253402428745841e-09,
+ "loss": 0.0273,
+ "step": 36530
+ },
+ {
+ "epoch": 99.53950953678473,
+ "grad_norm": 1.376673698425293,
+ "learning_rate": 1.1121401296909639e-09,
+ "loss": 0.0872,
+ "step": 36531
+ },
+ {
+ "epoch": 99.54223433242507,
+ "grad_norm": 3.0177886486053467,
+ "learning_rate": 1.099017887524756e-09,
+ "loss": 0.0326,
+ "step": 36532
+ },
+ {
+ "epoch": 99.5449591280654,
+ "grad_norm": 2.472672462463379,
+ "learning_rate": 1.0859735164769903e-09,
+ "loss": 0.0297,
+ "step": 36533
+ },
+ {
+ "epoch": 99.54768392370572,
+ "grad_norm": 2.5569729804992676,
+ "learning_rate": 1.0730070166509177e-09,
+ "loss": 0.1165,
+ "step": 36534
+ },
+ {
+ "epoch": 99.55040871934605,
+ "grad_norm": 2.6483771800994873,
+ "learning_rate": 1.060118388145348e-09,
+ "loss": 0.0229,
+ "step": 36535
+ },
+ {
+ "epoch": 99.55313351498637,
+ "grad_norm": 2.695887804031372,
+ "learning_rate": 1.0473076310624218e-09,
+ "loss": 0.0465,
+ "step": 36536
+ },
+ {
+ "epoch": 99.5558583106267,
+ "grad_norm": 2.4064455032348633,
+ "learning_rate": 1.034574745500949e-09,
+ "loss": 0.0948,
+ "step": 36537
+ },
+ {
+ "epoch": 99.55858310626704,
+ "grad_norm": 1.4350569248199463,
+ "learning_rate": 1.0219197315597396e-09,
+ "loss": 0.0175,
+ "step": 36538
+ },
+ {
+ "epoch": 99.56130790190736,
+ "grad_norm": 2.4260857105255127,
+ "learning_rate": 1.0093425893387133e-09,
+ "loss": 0.1,
+ "step": 36539
+ },
+ {
+ "epoch": 99.56403269754769,
+ "grad_norm": 2.115938663482666,
+ "learning_rate": 9.968433189355697e-10,
+ "loss": 0.3049,
+ "step": 36540
+ },
+ {
+ "epoch": 99.566757493188,
+ "grad_norm": 2.5792899131774902,
+ "learning_rate": 9.844219204468985e-10,
+ "loss": 0.0392,
+ "step": 36541
+ },
+ {
+ "epoch": 99.56948228882834,
+ "grad_norm": 2.8147940635681152,
+ "learning_rate": 9.720783939692891e-10,
+ "loss": 0.0434,
+ "step": 36542
+ },
+ {
+ "epoch": 99.57220708446866,
+ "grad_norm": 2.99324107170105,
+ "learning_rate": 9.598127395993307e-10,
+ "loss": 0.0319,
+ "step": 36543
+ },
+ {
+ "epoch": 99.57493188010899,
+ "grad_norm": 2.7439558506011963,
+ "learning_rate": 9.476249574325026e-10,
+ "loss": 0.0557,
+ "step": 36544
+ },
+ {
+ "epoch": 99.57765667574932,
+ "grad_norm": 3.165449857711792,
+ "learning_rate": 9.355150475642837e-10,
+ "loss": 0.0294,
+ "step": 36545
+ },
+ {
+ "epoch": 99.58038147138964,
+ "grad_norm": 2.2052972316741943,
+ "learning_rate": 9.234830100879333e-10,
+ "loss": 0.1125,
+ "step": 36546
+ },
+ {
+ "epoch": 99.58310626702998,
+ "grad_norm": 2.7302558422088623,
+ "learning_rate": 9.115288450978199e-10,
+ "loss": 0.1363,
+ "step": 36547
+ },
+ {
+ "epoch": 99.5858310626703,
+ "grad_norm": 1.9348679780960083,
+ "learning_rate": 8.996525526872024e-10,
+ "loss": 0.0199,
+ "step": 36548
+ },
+ {
+ "epoch": 99.58855585831063,
+ "grad_norm": 3.44775390625,
+ "learning_rate": 8.878541329482293e-10,
+ "loss": 0.0242,
+ "step": 36549
+ },
+ {
+ "epoch": 99.59128065395096,
+ "grad_norm": 2.0738258361816406,
+ "learning_rate": 8.761335859730491e-10,
+ "loss": 0.032,
+ "step": 36550
+ },
+ {
+ "epoch": 99.59400544959128,
+ "grad_norm": 2.6990418434143066,
+ "learning_rate": 8.644909118515898e-10,
+ "loss": 0.0329,
+ "step": 36551
+ },
+ {
+ "epoch": 99.59673024523161,
+ "grad_norm": 2.516026258468628,
+ "learning_rate": 8.529261106771103e-10,
+ "loss": 0.0537,
+ "step": 36552
+ },
+ {
+ "epoch": 99.59945504087193,
+ "grad_norm": 2.832350730895996,
+ "learning_rate": 8.41439182537318e-10,
+ "loss": 0.023,
+ "step": 36553
+ },
+ {
+ "epoch": 99.60217983651226,
+ "grad_norm": 2.176815986633301,
+ "learning_rate": 8.300301275221412e-10,
+ "loss": 0.0325,
+ "step": 36554
+ },
+ {
+ "epoch": 99.60490463215258,
+ "grad_norm": 2.719883918762207,
+ "learning_rate": 8.186989457215078e-10,
+ "loss": 0.0668,
+ "step": 36555
+ },
+ {
+ "epoch": 99.60762942779292,
+ "grad_norm": 2.2102978229522705,
+ "learning_rate": 8.074456372231254e-10,
+ "loss": 0.0756,
+ "step": 36556
+ },
+ {
+ "epoch": 99.61035422343325,
+ "grad_norm": 1.9211902618408203,
+ "learning_rate": 7.962702021147018e-10,
+ "loss": 0.0159,
+ "step": 36557
+ },
+ {
+ "epoch": 99.61307901907357,
+ "grad_norm": 2.3778374195098877,
+ "learning_rate": 7.851726404828342e-10,
+ "loss": 0.0706,
+ "step": 36558
+ },
+ {
+ "epoch": 99.6158038147139,
+ "grad_norm": 2.125946521759033,
+ "learning_rate": 7.741529524141201e-10,
+ "loss": 0.037,
+ "step": 36559
+ },
+ {
+ "epoch": 99.61852861035422,
+ "grad_norm": 7.415036201477051,
+ "learning_rate": 7.632111379951568e-10,
+ "loss": 0.0206,
+ "step": 36560
+ },
+ {
+ "epoch": 99.62125340599455,
+ "grad_norm": 1.5431028604507446,
+ "learning_rate": 7.523471973092112e-10,
+ "loss": 0.0199,
+ "step": 36561
+ },
+ {
+ "epoch": 99.62397820163488,
+ "grad_norm": 2.3266077041625977,
+ "learning_rate": 7.415611304428805e-10,
+ "loss": 0.1038,
+ "step": 36562
+ },
+ {
+ "epoch": 99.6267029972752,
+ "grad_norm": 2.8579304218292236,
+ "learning_rate": 7.308529374794316e-10,
+ "loss": 0.0793,
+ "step": 36563
+ },
+ {
+ "epoch": 99.62942779291554,
+ "grad_norm": 2.9477689266204834,
+ "learning_rate": 7.20222618502131e-10,
+ "loss": 0.1182,
+ "step": 36564
+ },
+ {
+ "epoch": 99.63215258855585,
+ "grad_norm": 1.4284054040908813,
+ "learning_rate": 7.096701735942457e-10,
+ "loss": 0.024,
+ "step": 36565
+ },
+ {
+ "epoch": 99.63487738419619,
+ "grad_norm": 2.898362159729004,
+ "learning_rate": 6.991956028379321e-10,
+ "loss": 0.0802,
+ "step": 36566
+ },
+ {
+ "epoch": 99.6376021798365,
+ "grad_norm": 1.9462116956710815,
+ "learning_rate": 6.887989063131262e-10,
+ "loss": 0.0298,
+ "step": 36567
+ },
+ {
+ "epoch": 99.64032697547684,
+ "grad_norm": 1.887109398841858,
+ "learning_rate": 6.784800841030948e-10,
+ "loss": 0.0897,
+ "step": 36568
+ },
+ {
+ "epoch": 99.64305177111717,
+ "grad_norm": 2.0863425731658936,
+ "learning_rate": 6.682391362877738e-10,
+ "loss": 0.0273,
+ "step": 36569
+ },
+ {
+ "epoch": 99.64577656675749,
+ "grad_norm": 2.1058130264282227,
+ "learning_rate": 6.58076062944879e-10,
+ "loss": 0.0211,
+ "step": 36570
+ },
+ {
+ "epoch": 99.64850136239782,
+ "grad_norm": 2.643380880355835,
+ "learning_rate": 6.479908641565668e-10,
+ "loss": 0.0388,
+ "step": 36571
+ },
+ {
+ "epoch": 99.65122615803814,
+ "grad_norm": 2.3741872310638428,
+ "learning_rate": 6.379835399983326e-10,
+ "loss": 0.0278,
+ "step": 36572
+ },
+ {
+ "epoch": 99.65395095367847,
+ "grad_norm": 2.371957540512085,
+ "learning_rate": 6.280540905512222e-10,
+ "loss": 0.0256,
+ "step": 36573
+ },
+ {
+ "epoch": 99.65667574931881,
+ "grad_norm": 2.2500576972961426,
+ "learning_rate": 6.18202515889621e-10,
+ "loss": 0.0271,
+ "step": 36574
+ },
+ {
+ "epoch": 99.65940054495913,
+ "grad_norm": 1.956206202507019,
+ "learning_rate": 6.084288160923546e-10,
+ "loss": 0.0302,
+ "step": 36575
+ },
+ {
+ "epoch": 99.66212534059946,
+ "grad_norm": 1.9971297979354858,
+ "learning_rate": 5.987329912349182e-10,
+ "loss": 0.0211,
+ "step": 36576
+ },
+ {
+ "epoch": 99.66485013623978,
+ "grad_norm": 2.158386707305908,
+ "learning_rate": 5.891150413928071e-10,
+ "loss": 0.0291,
+ "step": 36577
+ },
+ {
+ "epoch": 99.66757493188011,
+ "grad_norm": 2.6648027896881104,
+ "learning_rate": 5.795749666404061e-10,
+ "loss": 0.0976,
+ "step": 36578
+ },
+ {
+ "epoch": 99.67029972752043,
+ "grad_norm": 2.7986602783203125,
+ "learning_rate": 5.701127670532103e-10,
+ "loss": 0.0389,
+ "step": 36579
+ },
+ {
+ "epoch": 99.67302452316076,
+ "grad_norm": 1.5865932703018188,
+ "learning_rate": 5.607284427033843e-10,
+ "loss": 0.0223,
+ "step": 36580
+ },
+ {
+ "epoch": 99.6757493188011,
+ "grad_norm": 2.294034242630005,
+ "learning_rate": 5.514219936642029e-10,
+ "loss": 0.1224,
+ "step": 36581
+ },
+ {
+ "epoch": 99.67847411444141,
+ "grad_norm": 2.7299232482910156,
+ "learning_rate": 5.42193420010051e-10,
+ "loss": 0.1174,
+ "step": 36582
+ },
+ {
+ "epoch": 99.68119891008175,
+ "grad_norm": 1.9245857000350952,
+ "learning_rate": 5.330427218108725e-10,
+ "loss": 0.0274,
+ "step": 36583
+ },
+ {
+ "epoch": 99.68392370572207,
+ "grad_norm": 1.757200837135315,
+ "learning_rate": 5.239698991388321e-10,
+ "loss": 0.0196,
+ "step": 36584
+ },
+ {
+ "epoch": 99.6866485013624,
+ "grad_norm": 1.994696855545044,
+ "learning_rate": 5.149749520638736e-10,
+ "loss": 0.0334,
+ "step": 36585
+ },
+ {
+ "epoch": 99.68937329700273,
+ "grad_norm": 2.803117036819458,
+ "learning_rate": 5.060578806559413e-10,
+ "loss": 0.0774,
+ "step": 36586
+ },
+ {
+ "epoch": 99.69209809264305,
+ "grad_norm": 4.198057174682617,
+ "learning_rate": 4.972186849860894e-10,
+ "loss": 0.0306,
+ "step": 36587
+ },
+ {
+ "epoch": 99.69482288828338,
+ "grad_norm": 2.314763069152832,
+ "learning_rate": 4.884573651209313e-10,
+ "loss": 0.0291,
+ "step": 36588
+ },
+ {
+ "epoch": 99.6975476839237,
+ "grad_norm": 1.7226258516311646,
+ "learning_rate": 4.797739211304108e-10,
+ "loss": 0.0362,
+ "step": 36589
+ },
+ {
+ "epoch": 99.70027247956403,
+ "grad_norm": 13.523866653442383,
+ "learning_rate": 4.711683530822519e-10,
+ "loss": 0.147,
+ "step": 36590
+ },
+ {
+ "epoch": 99.70299727520435,
+ "grad_norm": 5.580814838409424,
+ "learning_rate": 4.626406610419576e-10,
+ "loss": 0.0941,
+ "step": 36591
+ },
+ {
+ "epoch": 99.70572207084469,
+ "grad_norm": 2.962643623352051,
+ "learning_rate": 4.5419084507725143e-10,
+ "loss": 0.1124,
+ "step": 36592
+ },
+ {
+ "epoch": 99.70844686648502,
+ "grad_norm": 1.9783023595809937,
+ "learning_rate": 4.458189052536366e-10,
+ "loss": 0.0363,
+ "step": 36593
+ },
+ {
+ "epoch": 99.71117166212534,
+ "grad_norm": 1.824733018875122,
+ "learning_rate": 4.37524841635506e-10,
+ "loss": 0.0294,
+ "step": 36594
+ },
+ {
+ "epoch": 99.71389645776567,
+ "grad_norm": 2.0353915691375732,
+ "learning_rate": 4.2930865428836286e-10,
+ "loss": 0.0541,
+ "step": 36595
+ },
+ {
+ "epoch": 99.71662125340599,
+ "grad_norm": 2.389317512512207,
+ "learning_rate": 4.2117034327548987e-10,
+ "loss": 0.0439,
+ "step": 36596
+ },
+ {
+ "epoch": 99.71934604904632,
+ "grad_norm": 2.519260883331299,
+ "learning_rate": 4.1310990866128e-10,
+ "loss": 0.0341,
+ "step": 36597
+ },
+ {
+ "epoch": 99.72207084468666,
+ "grad_norm": 3.8815038204193115,
+ "learning_rate": 4.0512735050790566e-10,
+ "loss": 0.0543,
+ "step": 36598
+ },
+ {
+ "epoch": 99.72479564032697,
+ "grad_norm": 2.7397398948669434,
+ "learning_rate": 3.9722266887753933e-10,
+ "loss": 0.1035,
+ "step": 36599
+ },
+ {
+ "epoch": 99.7275204359673,
+ "grad_norm": 2.6178321838378906,
+ "learning_rate": 3.893958638312434e-10,
+ "loss": 0.1109,
+ "step": 36600
+ },
+ {
+ "epoch": 99.73024523160763,
+ "grad_norm": 2.7417891025543213,
+ "learning_rate": 3.8164693543119024e-10,
+ "loss": 0.0287,
+ "step": 36601
+ },
+ {
+ "epoch": 99.73297002724796,
+ "grad_norm": 2.6343674659729004,
+ "learning_rate": 3.7397588373733196e-10,
+ "loss": 0.0488,
+ "step": 36602
+ },
+ {
+ "epoch": 99.73569482288828,
+ "grad_norm": 6.195209503173828,
+ "learning_rate": 3.6638270880851034e-10,
+ "loss": 0.2053,
+ "step": 36603
+ },
+ {
+ "epoch": 99.73841961852861,
+ "grad_norm": 2.066901922225952,
+ "learning_rate": 3.588674107035672e-10,
+ "loss": 0.0271,
+ "step": 36604
+ },
+ {
+ "epoch": 99.74114441416894,
+ "grad_norm": 2.7348265647888184,
+ "learning_rate": 3.514299894835649e-10,
+ "loss": 0.0271,
+ "step": 36605
+ },
+ {
+ "epoch": 99.74386920980926,
+ "grad_norm": 2.0644443035125732,
+ "learning_rate": 3.4407044520401443e-10,
+ "loss": 0.0213,
+ "step": 36606
+ },
+ {
+ "epoch": 99.7465940054496,
+ "grad_norm": 5.294316291809082,
+ "learning_rate": 3.3678877792264754e-10,
+ "loss": 0.0633,
+ "step": 36607
+ },
+ {
+ "epoch": 99.74931880108991,
+ "grad_norm": 2.1260714530944824,
+ "learning_rate": 3.295849876971957e-10,
+ "loss": 0.1096,
+ "step": 36608
+ },
+ {
+ "epoch": 99.75204359673025,
+ "grad_norm": 2.419437885284424,
+ "learning_rate": 3.2245907458317015e-10,
+ "loss": 0.0466,
+ "step": 36609
+ },
+ {
+ "epoch": 99.75476839237058,
+ "grad_norm": 2.7944250106811523,
+ "learning_rate": 3.154110386349718e-10,
+ "loss": 0.0624,
+ "step": 36610
+ },
+ {
+ "epoch": 99.7574931880109,
+ "grad_norm": 1.9427090883255005,
+ "learning_rate": 3.08440879909222e-10,
+ "loss": 0.0261,
+ "step": 36611
+ },
+ {
+ "epoch": 99.76021798365123,
+ "grad_norm": 2.4367549419403076,
+ "learning_rate": 3.015485984603217e-10,
+ "loss": 0.0258,
+ "step": 36612
+ },
+ {
+ "epoch": 99.76294277929155,
+ "grad_norm": 2.3611412048339844,
+ "learning_rate": 2.9473419434045136e-10,
+ "loss": 0.2156,
+ "step": 36613
+ },
+ {
+ "epoch": 99.76566757493188,
+ "grad_norm": 3.508145809173584,
+ "learning_rate": 2.879976676029017e-10,
+ "loss": 0.2697,
+ "step": 36614
+ },
+ {
+ "epoch": 99.7683923705722,
+ "grad_norm": 1.7755341529846191,
+ "learning_rate": 2.8133901830096343e-10,
+ "loss": 0.025,
+ "step": 36615
+ },
+ {
+ "epoch": 99.77111716621253,
+ "grad_norm": 1.9118646383285522,
+ "learning_rate": 2.7475824648570683e-10,
+ "loss": 0.0337,
+ "step": 36616
+ },
+ {
+ "epoch": 99.77384196185287,
+ "grad_norm": 2.203730821609497,
+ "learning_rate": 2.6825535220931233e-10,
+ "loss": 0.034,
+ "step": 36617
+ },
+ {
+ "epoch": 99.77656675749319,
+ "grad_norm": 4.123830318450928,
+ "learning_rate": 2.6183033552174e-10,
+ "loss": 0.0829,
+ "step": 36618
+ },
+ {
+ "epoch": 99.77929155313352,
+ "grad_norm": 2.0598483085632324,
+ "learning_rate": 2.554831964729498e-10,
+ "loss": 0.0234,
+ "step": 36619
+ },
+ {
+ "epoch": 99.78201634877384,
+ "grad_norm": 2.5967087745666504,
+ "learning_rate": 2.4921393511290195e-10,
+ "loss": 0.0279,
+ "step": 36620
+ },
+ {
+ "epoch": 99.78474114441417,
+ "grad_norm": 2.9723432064056396,
+ "learning_rate": 2.4302255149044607e-10,
+ "loss": 0.1216,
+ "step": 36621
+ },
+ {
+ "epoch": 99.7874659400545,
+ "grad_norm": 2.351841688156128,
+ "learning_rate": 2.369090456533218e-10,
+ "loss": 0.0514,
+ "step": 36622
+ },
+ {
+ "epoch": 99.79019073569482,
+ "grad_norm": 3.7699193954467773,
+ "learning_rate": 2.3087341764926885e-10,
+ "loss": 0.071,
+ "step": 36623
+ },
+ {
+ "epoch": 99.79291553133515,
+ "grad_norm": 3.212890625,
+ "learning_rate": 2.2491566752491646e-10,
+ "loss": 0.1577,
+ "step": 36624
+ },
+ {
+ "epoch": 99.79564032697547,
+ "grad_norm": 1.6444101333618164,
+ "learning_rate": 2.19035795326894e-10,
+ "loss": 0.0292,
+ "step": 36625
+ },
+ {
+ "epoch": 99.7983651226158,
+ "grad_norm": 3.579833984375,
+ "learning_rate": 2.1323380110183088e-10,
+ "loss": 0.0244,
+ "step": 36626
+ },
+ {
+ "epoch": 99.80108991825612,
+ "grad_norm": 3.0298268795013428,
+ "learning_rate": 2.0750968489413604e-10,
+ "loss": 0.09,
+ "step": 36627
+ },
+ {
+ "epoch": 99.80381471389646,
+ "grad_norm": 3.3600499629974365,
+ "learning_rate": 2.0186344674821834e-10,
+ "loss": 0.0834,
+ "step": 36628
+ },
+ {
+ "epoch": 99.80653950953679,
+ "grad_norm": 2.7193455696105957,
+ "learning_rate": 1.9629508670848674e-10,
+ "loss": 0.0782,
+ "step": 36629
+ },
+ {
+ "epoch": 99.80926430517711,
+ "grad_norm": 2.516709566116333,
+ "learning_rate": 1.9080460481823993e-10,
+ "loss": 0.0957,
+ "step": 36630
+ },
+ {
+ "epoch": 99.81198910081744,
+ "grad_norm": 2.8346807956695557,
+ "learning_rate": 1.853920011207766e-10,
+ "loss": 0.0436,
+ "step": 36631
+ },
+ {
+ "epoch": 99.81471389645776,
+ "grad_norm": 5.574287414550781,
+ "learning_rate": 1.8005727565717502e-10,
+ "loss": 0.0314,
+ "step": 36632
+ },
+ {
+ "epoch": 99.8174386920981,
+ "grad_norm": 2.6337056159973145,
+ "learning_rate": 1.7480042846851341e-10,
+ "loss": 0.1221,
+ "step": 36633
+ },
+ {
+ "epoch": 99.82016348773843,
+ "grad_norm": 2.943788766860962,
+ "learning_rate": 1.696214595980905e-10,
+ "loss": 0.064,
+ "step": 36634
+ },
+ {
+ "epoch": 99.82288828337875,
+ "grad_norm": 2.968533754348755,
+ "learning_rate": 1.6452036908365388e-10,
+ "loss": 0.106,
+ "step": 36635
+ },
+ {
+ "epoch": 99.82561307901908,
+ "grad_norm": 2.553696393966675,
+ "learning_rate": 1.59497156967392e-10,
+ "loss": 0.0431,
+ "step": 36636
+ },
+ {
+ "epoch": 99.8283378746594,
+ "grad_norm": 2.3409392833709717,
+ "learning_rate": 1.545518232859422e-10,
+ "loss": 0.0949,
+ "step": 36637
+ },
+ {
+ "epoch": 99.83106267029973,
+ "grad_norm": 2.7663166522979736,
+ "learning_rate": 1.4968436807927255e-10,
+ "loss": 0.0405,
+ "step": 36638
+ },
+ {
+ "epoch": 99.83378746594005,
+ "grad_norm": 2.4775993824005127,
+ "learning_rate": 1.4489479138513062e-10,
+ "loss": 0.0363,
+ "step": 36639
+ },
+ {
+ "epoch": 99.83651226158038,
+ "grad_norm": 3.056490421295166,
+ "learning_rate": 1.40183093241264e-10,
+ "loss": 0.1586,
+ "step": 36640
+ },
+ {
+ "epoch": 99.83923705722071,
+ "grad_norm": 2.3072080612182617,
+ "learning_rate": 1.3554927368319982e-10,
+ "loss": 0.0879,
+ "step": 36641
+ },
+ {
+ "epoch": 99.84196185286103,
+ "grad_norm": 3.618222236633301,
+ "learning_rate": 1.3099333274757543e-10,
+ "loss": 0.1427,
+ "step": 36642
+ },
+ {
+ "epoch": 99.84468664850137,
+ "grad_norm": 3.623671770095825,
+ "learning_rate": 1.2651527046991796e-10,
+ "loss": 0.0563,
+ "step": 36643
+ },
+ {
+ "epoch": 99.84741144414168,
+ "grad_norm": 2.6766088008880615,
+ "learning_rate": 1.2211508688464434e-10,
+ "loss": 0.0362,
+ "step": 36644
+ },
+ {
+ "epoch": 99.85013623978202,
+ "grad_norm": 2.361475944519043,
+ "learning_rate": 1.1779278202728174e-10,
+ "loss": 0.0578,
+ "step": 36645
+ },
+ {
+ "epoch": 99.85286103542235,
+ "grad_norm": 2.4094767570495605,
+ "learning_rate": 1.1354835593113678e-10,
+ "loss": 0.0536,
+ "step": 36646
+ },
+ {
+ "epoch": 99.85558583106267,
+ "grad_norm": 2.4418084621429443,
+ "learning_rate": 1.0938180862729575e-10,
+ "loss": 0.0879,
+ "step": 36647
+ },
+ {
+ "epoch": 99.858310626703,
+ "grad_norm": 2.1416845321655273,
+ "learning_rate": 1.0529314015128577e-10,
+ "loss": 0.0344,
+ "step": 36648
+ },
+ {
+ "epoch": 99.86103542234332,
+ "grad_norm": 1.8528544902801514,
+ "learning_rate": 1.0128235053308289e-10,
+ "loss": 0.0177,
+ "step": 36649
+ },
+ {
+ "epoch": 99.86376021798365,
+ "grad_norm": 3.770249128341675,
+ "learning_rate": 9.734943980377331e-11,
+ "loss": 0.0281,
+ "step": 36650
+ },
+ {
+ "epoch": 99.86648501362397,
+ "grad_norm": 2.6298139095306396,
+ "learning_rate": 9.349440799444331e-11,
+ "loss": 0.033,
+ "step": 36651
+ },
+ {
+ "epoch": 99.8692098092643,
+ "grad_norm": 2.071444034576416,
+ "learning_rate": 8.97172551350689e-11,
+ "loss": 0.1597,
+ "step": 36652
+ },
+ {
+ "epoch": 99.87193460490464,
+ "grad_norm": 1.9126759767532349,
+ "learning_rate": 8.60179812556261e-11,
+ "loss": 0.0237,
+ "step": 36653
+ },
+ {
+ "epoch": 99.87465940054496,
+ "grad_norm": 6.645708084106445,
+ "learning_rate": 8.23965863838705e-11,
+ "loss": 0.1461,
+ "step": 36654
+ },
+ {
+ "epoch": 99.87738419618529,
+ "grad_norm": 8.344696998596191,
+ "learning_rate": 7.885307054866786e-11,
+ "loss": 0.0445,
+ "step": 36655
+ },
+ {
+ "epoch": 99.88010899182561,
+ "grad_norm": 3.1809380054473877,
+ "learning_rate": 7.53874337777738e-11,
+ "loss": 0.0333,
+ "step": 36656
+ },
+ {
+ "epoch": 99.88283378746594,
+ "grad_norm": 2.368344783782959,
+ "learning_rate": 7.199967609783365e-11,
+ "loss": 0.0761,
+ "step": 36657
+ },
+ {
+ "epoch": 99.88555858310627,
+ "grad_norm": 1.8367606401443481,
+ "learning_rate": 6.868979753549277e-11,
+ "loss": 0.037,
+ "step": 36658
+ },
+ {
+ "epoch": 99.88828337874659,
+ "grad_norm": 4.02899694442749,
+ "learning_rate": 6.545779811628627e-11,
+ "loss": 0.0289,
+ "step": 36659
+ },
+ {
+ "epoch": 99.89100817438693,
+ "grad_norm": 2.255337953567505,
+ "learning_rate": 6.230367786574931e-11,
+ "loss": 0.0424,
+ "step": 36660
+ },
+ {
+ "epoch": 99.89373297002724,
+ "grad_norm": 2.3002030849456787,
+ "learning_rate": 5.922743680719655e-11,
+ "loss": 0.0206,
+ "step": 36661
+ },
+ {
+ "epoch": 99.89645776566758,
+ "grad_norm": 1.7847018241882324,
+ "learning_rate": 5.622907496616314e-11,
+ "loss": 0.021,
+ "step": 36662
+ },
+ {
+ "epoch": 99.8991825613079,
+ "grad_norm": 1.4975664615631104,
+ "learning_rate": 5.330859236596375e-11,
+ "loss": 0.0918,
+ "step": 36663
+ },
+ {
+ "epoch": 99.90190735694823,
+ "grad_norm": 2.6824984550476074,
+ "learning_rate": 5.046598902769262e-11,
+ "loss": 0.1954,
+ "step": 36664
+ },
+ {
+ "epoch": 99.90463215258856,
+ "grad_norm": 1.4897246360778809,
+ "learning_rate": 4.770126497466443e-11,
+ "loss": 0.0189,
+ "step": 36665
+ },
+ {
+ "epoch": 99.90735694822888,
+ "grad_norm": 2.1342153549194336,
+ "learning_rate": 4.5014420229083645e-11,
+ "loss": 0.0352,
+ "step": 36666
+ },
+ {
+ "epoch": 99.91008174386921,
+ "grad_norm": 3.451512336730957,
+ "learning_rate": 4.240545481093428e-11,
+ "loss": 0.0523,
+ "step": 36667
+ },
+ {
+ "epoch": 99.91280653950953,
+ "grad_norm": 2.690477132797241,
+ "learning_rate": 3.987436874020034e-11,
+ "loss": 0.081,
+ "step": 36668
+ },
+ {
+ "epoch": 99.91553133514986,
+ "grad_norm": 8.813395500183105,
+ "learning_rate": 3.7421162036865854e-11,
+ "loss": 0.1562,
+ "step": 36669
+ },
+ {
+ "epoch": 99.9182561307902,
+ "grad_norm": 3.088932991027832,
+ "learning_rate": 3.504583472091483e-11,
+ "loss": 0.0624,
+ "step": 36670
+ },
+ {
+ "epoch": 99.92098092643052,
+ "grad_norm": 1.8969745635986328,
+ "learning_rate": 3.274838681011083e-11,
+ "loss": 0.1035,
+ "step": 36671
+ },
+ {
+ "epoch": 99.92370572207085,
+ "grad_norm": 2.33920955657959,
+ "learning_rate": 3.0528818322217435e-11,
+ "loss": 0.0569,
+ "step": 36672
+ },
+ {
+ "epoch": 99.92643051771117,
+ "grad_norm": 2.0795698165893555,
+ "learning_rate": 2.838712927388798e-11,
+ "loss": 0.0306,
+ "step": 36673
+ },
+ {
+ "epoch": 99.9291553133515,
+ "grad_norm": 2.172757625579834,
+ "learning_rate": 2.6323319683996262e-11,
+ "loss": 0.0358,
+ "step": 36674
+ },
+ {
+ "epoch": 99.93188010899182,
+ "grad_norm": 1.9380152225494385,
+ "learning_rate": 2.4337389565864956e-11,
+ "loss": 0.1664,
+ "step": 36675
+ },
+ {
+ "epoch": 99.93460490463215,
+ "grad_norm": 3.505955219268799,
+ "learning_rate": 2.2429338937257627e-11,
+ "loss": 0.0264,
+ "step": 36676
+ },
+ {
+ "epoch": 99.93732970027249,
+ "grad_norm": 2.7528839111328125,
+ "learning_rate": 2.059916781260718e-11,
+ "loss": 0.0389,
+ "step": 36677
+ },
+ {
+ "epoch": 99.9400544959128,
+ "grad_norm": 3.1094865798950195,
+ "learning_rate": 1.8846876205236287e-11,
+ "loss": 0.0626,
+ "step": 36678
+ },
+ {
+ "epoch": 99.94277929155314,
+ "grad_norm": 3.0980677604675293,
+ "learning_rate": 1.7172464128467626e-11,
+ "loss": 0.1261,
+ "step": 36679
+ },
+ {
+ "epoch": 99.94550408719346,
+ "grad_norm": 3.14235520362854,
+ "learning_rate": 1.5575931596734094e-11,
+ "loss": 0.0241,
+ "step": 36680
+ },
+ {
+ "epoch": 99.94822888283379,
+ "grad_norm": 2.5746209621429443,
+ "learning_rate": 1.4057278622248149e-11,
+ "loss": 0.0307,
+ "step": 36681
+ },
+ {
+ "epoch": 99.95095367847412,
+ "grad_norm": 2.559318780899048,
+ "learning_rate": 1.2616505216112019e-11,
+ "loss": 0.0321,
+ "step": 36682
+ },
+ {
+ "epoch": 99.95367847411444,
+ "grad_norm": 3.2531163692474365,
+ "learning_rate": 1.1253611389427931e-11,
+ "loss": 0.0735,
+ "step": 36683
+ },
+ {
+ "epoch": 99.95640326975477,
+ "grad_norm": 3.2968556880950928,
+ "learning_rate": 9.968597153298121e-12,
+ "loss": 0.0254,
+ "step": 36684
+ },
+ {
+ "epoch": 99.95912806539509,
+ "grad_norm": 3.3459370136260986,
+ "learning_rate": 8.761462518824815e-12,
+ "loss": 0.1363,
+ "step": 36685
+ },
+ {
+ "epoch": 99.96185286103542,
+ "grad_norm": 1.863379955291748,
+ "learning_rate": 7.632207492669353e-12,
+ "loss": 0.0264,
+ "step": 36686
+ },
+ {
+ "epoch": 99.96457765667574,
+ "grad_norm": 2.086629629135132,
+ "learning_rate": 6.580832085933964e-12,
+ "loss": 0.0252,
+ "step": 36687
+ },
+ {
+ "epoch": 99.96730245231608,
+ "grad_norm": 3.285036563873291,
+ "learning_rate": 5.6073363063902094e-12,
+ "loss": 0.0684,
+ "step": 36688
+ },
+ {
+ "epoch": 99.97002724795641,
+ "grad_norm": 1.7984572649002075,
+ "learning_rate": 4.711720160699429e-12,
+ "loss": 0.0199,
+ "step": 36689
+ },
+ {
+ "epoch": 99.97275204359673,
+ "grad_norm": 2.189822196960449,
+ "learning_rate": 3.893983657743405e-12,
+ "loss": 0.0326,
+ "step": 36690
+ },
+ {
+ "epoch": 99.97547683923706,
+ "grad_norm": 3.3216190338134766,
+ "learning_rate": 3.154126800852808e-12,
+ "loss": 0.0279,
+ "step": 36691
+ },
+ {
+ "epoch": 99.97820163487738,
+ "grad_norm": 4.278548717498779,
+ "learning_rate": 2.492149598909421e-12,
+ "loss": 0.0627,
+ "step": 36692
+ },
+ {
+ "epoch": 99.98092643051771,
+ "grad_norm": 2.0453996658325195,
+ "learning_rate": 1.908052055243914e-12,
+ "loss": 0.0833,
+ "step": 36693
+ },
+ {
+ "epoch": 99.98365122615803,
+ "grad_norm": 3.478553295135498,
+ "learning_rate": 1.4018341754074017e-12,
+ "loss": 0.1105,
+ "step": 36694
+ },
+ {
+ "epoch": 99.98637602179836,
+ "grad_norm": 2.225618362426758,
+ "learning_rate": 9.7349596162033e-13,
+ "loss": 0.0275,
+ "step": 36695
+ },
+ {
+ "epoch": 99.9891008174387,
+ "grad_norm": 2.206514596939087,
+ "learning_rate": 6.23037419433814e-13,
+ "loss": 0.0327,
+ "step": 36696
+ },
+ {
+ "epoch": 99.99182561307902,
+ "grad_norm": 3.2508068084716797,
+ "learning_rate": 3.5045854995807705e-13,
+ "loss": 0.0998,
+ "step": 36697
+ },
+ {
+ "epoch": 99.99455040871935,
+ "grad_norm": 2.5737099647521973,
+ "learning_rate": 1.5575935652378804e-13,
+ "loss": 0.0228,
+ "step": 36698
+ },
+ {
+ "epoch": 99.99727520435967,
+ "grad_norm": 2.334688663482666,
+ "learning_rate": 3.893983913094701e-14,
+ "loss": 0.0414,
+ "step": 36699
+ },
+ {
+ "epoch": 100.0,
+ "grad_norm": 1.9821799993515015,
+ "learning_rate": 0.0,
+ "loss": 0.022,
+ "step": 36700
+ },
+ {
+ "epoch": 100.0,
+ "step": 36700,
+ "total_flos": 2.2807420731392e+16,
+ "train_loss": 0.47043383053927723,
+ "train_runtime": 11044.2585,
+ "train_samples_per_second": 106.164,
+ "train_steps_per_second": 3.323
+ }
+ ],
+ "logging_steps": 1.0,
+ "max_steps": 36700,
+ "num_input_tokens_seen": 0,
+ "num_train_epochs": 100,
+ "save_steps": 50000,
+ "stateful_callbacks": {
+ "TrainerControl": {
+ "args": {
+ "should_epoch_stop": false,
+ "should_evaluate": false,
+ "should_log": false,
+ "should_save": true,
+ "should_training_stop": true
+ },
+ "attributes": {}
+ }
+ },
+ "total_flos": 2.2807420731392e+16,
+ "train_batch_size": 2,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/vocab.json b/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/vocab.json
new file mode 100644
index 0000000000000000000000000000000000000000..4ebe4bb3f3114daf2e4cc349f24873a1175a35d7
--- /dev/null
+++ b/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/vocab.json
@@ -0,0 +1 @@
+{"":0,"":1,"":2,"":3,".":4,"Ġthe":5,",":6,"Ġto":7,"Ġand":8,"Ġof":9,"Ġa":10,"Ġin":11,"-":12,"Ġfor":13,"Ġthat":14,"Ġon":15,"Ġis":16,"âĢ":17,"'s":18,"Ġwith":19,"ĠThe":20,"Ġwas":21,"Ġ\"":22,"Ġat":23,"Ġit":24,"Ġas":25,"Ġsaid":26,"Ļ":27,"Ġbe":28,"s":29,"Ġby":30,"Ġfrom":31,"Ġare":32,"Ġhave":33,"Ġhas":34,":":35,"Ġ(":36,"Ġhe":37,"ĠI":38,"Ġhis":39,"Ġwill":40,"Ġan":41,"Ġthis":42,")":43,"ĠâĢ":44,"Ġnot":45,"Ŀ":46,"Ġyou":47,"ľ":48,"Ġtheir":49,"Ġor":50,"Ġthey":51,"Ġwe":52,"Ġbut":53,"Ġwho":54,"Ġmore":55,"Ġhad":56,"Ġbeen":57,"Ġwere":58,"Ġabout":59,",\"":60,"Ġwhich":61,"Ġup":62,"Ġits":63,"Ġcan":64,"Ġone":65,"Ġout":66,"Ġalso":67,"Ġ$":68,"Ġher":69,"Ġall":70,"Ġafter":71,".\"":72,"/":73,"Ġwould":74,"'t":75,"Ġyear":76,"Ġwhen":77,"Ġfirst":78,"Ġshe":79,"Ġtwo":80,"Ġover":81,"Ġpeople":82,"ĠA":83,"Ġour":84,"ĠIt":85,"Ġtime":86,"Ġthan":87,"Ġinto":88,"Ġthere":89,"t":90,"ĠHe":91,"Ġnew":92,"ĠâĢĶ":93,"Ġlast":94,"Ġjust":95,"ĠIn":96,"Ġother":97,"Ġso":98,"Ġwhat":99,"I":100,"Ġlike":101,"a":102,"Ġsome":103,"S":104,"ë":105,"Ġthem":106,"Ġyears":107,"'":108,"Ġdo":109,"Ġyour":110,"Ġ-":111,"Ġ1":112,"\"":113,"Ġif":114,"Ġcould":115,"?":116,"Ġno":117,"i":118,"m":119,"Ġget":120,"ĠU":121,"Ġnow":122,"Ġhim":123,"Ġback":124,"ĠBut":125,"ĠâĢĵ":126,"Ġmy":127,"Ġ'":128,"Ġonly":129,"Ġthree":130,";":131,"Ġ2":132,"The":133,"1":134,"Ġpercent":135,"Ġagainst":136,"Ġbefore":137,"Ġcompany":138,"o":139,"ĠTrump":140,"Ġhow":141,"Ġbecause":142,"Ġany":143,"Ġmost":144,"Ġbeing":145,"Ġmake":146,"Ġwhere":147,"Ġduring":148,"Ġthrough":149,"Ġwhile":150,"000":151,"ĠThis":152,"Ġmillion":153,"ing":154,"Ġ3":155,"Ġmade":156,"Ġwell":157,"Ġ10":158,"Ġdown":159,"Ġoff":160,"Ġsays":161,"Ġme":162,"ĠB":163,"Ġgoing":164,"Ġteam":165,"ĠWe":166,"Ġthose":167,"Ġgovernment":168,"Ġway":169,"We":170,"Ġmany":171,"Ġthen":172,"Ġwork":173,"Ġtold":174,"com":175,"2":176,"Ġgame":177,"ĠAnd":178,"in":179,"year":180,"Ġp":181,"Ġvery":182,"Ġday":183,"Ġhome":184,"Ġtake":185,"Ġweek":186,"Ġsince":187,"ĠNew":188,"Ġmay":189,"Ġeven":190,"Ġseason":191,"Ġsee":192,"Ġ2017":193,"Ġstate":194,"Ġ5":195,"ed":196,"Ġshould":197,"Ġaround":198,"Ġ2018":199,"Ġsecond":200,"Ġus":201,"Ġstill":202,"Ġmuch":203,"Ġ4":204,"Ġgood":205,"Ġthink":206,"%":207,"ĠS":208,"Ġthese":209,"Ġmarket":210,"ĠD":211,"th":212,"Ġgo":213,"'re":214,"Ġsuch":215,"Ġknow":216,"Ġincluding":217,"Ġdon":218,"y":219,"Ġnext":220,"ĠP":221,"Ġdid":222,"Ġunder":223,"Ġsay":224,"en":225,"ĠL":226,"Ġbetween":227,"Ġper":228,"ĠK":229,"ĠC":230,"Ġ6":231,"Ġworld":232,"Ġpart":233,"ĠN":234,"Ġright":235,"Ġwant":236,"Ġfour":237,"),":238,"Ġhigh":239,"Ġneed":240,"re":241,"e":242,"It":243,"Ġhelp":244,"5":245,"3":246,"Ġcountry":247,"ĠR":248,"Ġpolice":249,"A":250,"Ġlong":251,"ĠThey":252,"Ġend":253,"er":254,"ĠT":255,"ĠM":256,"u":257,"Ġboth":258,"Ġhere":259,"an":260,"on":261,"Ġ7":262,"Ġde":263,"ĠShe":264,"Ġbusiness":265,"Ġreport":266,"j":267,"ers":268,"Ġreally":269,"ĠPresident":270,"ar":271,"ĠG":272,"ĠFriday":273,"ĠF":274,"Ġbest":275,"Ġsame":276,"Ġanother":277,"Ġset":278,"old":279,"ĠThat":280,"as":281,"n":282,"Ġcome":283,"Ġfamily":284,"Ġpublic":285,"ĠFor":286,"ĠAs":287,"0":288,"ĠH":289,"Ġ8":290,"Ġ20":291,"Ġfive":292,"es":293,"ĠTuesday":294,"Ġn":295,"ĠThursday":296,"Ġquarter":297,"h":298,"Ġtop":299,"Ġgot":300,"Ġlife":301,"ĠMonday":302,"Ġfound":303,"Ġuse":304,"ĠW":305,"4":306,"ĠWednesday":307,"Ġown":308,"Ġaccording":309,"Ġplay":310,"Ġshow":311,"ĠSt":312,"Ġman":313,"Ġleft":314,"ĠUnited":315,"Ġ12":316,"Ġplace":317,"ĠIf":318,"Ġlot":319,"Ġformer":320,"Ġ0":321,").":322,"Ġsupport":323,"ie":324,"Ġbillion":325,"Ġt":326,"Ġshares":327,"!":328,"z":329,"k":330,"ĠState":331,"Ġpoints":332,"Ġgroup":333,"Ġschool":334,"Ġinformation":335,"Ġ2016":336,"al":337,"r":338,"Ġwin":339,"Ġnews":340,"Ġused":341,"Ġput":342,"Ġcity":343,"ĠJ":344,"ĠThere":345,"Ġnumber":346,"C":347,"'ve":348,"Ġeach":349,"Ġtoo":350,"Ġwon":351,"ly":352,"Ġmonth":353,"is":354,"Ġadded":355,"Ġlook":356,"Ġbetter":357,"Ġevery":358,"Ġ&":359,"Ġdays":360,"Ġ9":361,"Ġtook":362,"Ġnight":363,"Ġe":364,"Ġ11":365,"os":366,"Ġfew":367,"or":368,"ĠNorth":369,"ĠYou":370,"Ġthird":371,"Ġgreat":372,"Ġcalled":373,"ĠOn":374,"Ġpast":375,"Ġcame":376,"Ġmonths":377,"ĠSaturday":378,"Ġ15":379,"Ġbig":380,"ĠE":381,"ĠUS":382,"Ġthings":383,"ĠO":384,"Ġd":385,"Ġstart":386,"B":387,"Ġstock":388,"Ġ30":389,"Ġwomen":390,"ĠSouth":391,"ĠMay":392,"Ġnever":393,"Ġpresident":394,"ĠSunday":395,"Ġwithout":396,"man":397,"8":398,"Ġdidn":399,"Ġlocal":400,"6":401,"Ġsomething":402,"Ġcase":403,"ĠAll":404,"it":405,"7":406,"ĠSo":407,"Ġchildren":408,"Ġaway":409,"Ġlittle":410,"Ġsix":411,"ĠCity":412,"ĠCounty":413,"Ġdata":414,"at":415,"Ġalready":416,"d":417,"Ġmoney":418,"Ġearly":419,"Ġacross":420,"Ġexpected":421,"Ġrun":422,"Ġlater":423,"am":424,"Ġprice":425,"Ġgames":426,"ĠMr":427,"b":428,"Ġmight":429,"Ġdifferent":430,"Ġreported":431,"Ġdeal":432,"Ġmedia":433,"Ġgrowth":434,"Ġcommunity":435,"ĠChina":436,"'m":437,"c":438,"Ġwent":439,"ĠNo":440,"Ġable":441,"Ġmaking":442,"Ġarea":443,"Ġfar":444,"Ġstatement":445,"ĠHouse":446,"Ġworking":447,"M":448,"Ġk":449,"Ġseen":450,"Ġcompanies":451,"Ġtoday":452,"Ġmembers":453,"Ġuntil":454,"Ġfull":455,"Ġagain":456,"Ġhalf":457,"Ġshare":458,"le":459,"Ġalways":460,"Ġcourt":461,"l":462,"and":463,"Ġchange":464,"Ġfind":465,"9":466,"Ġsystem":467,"ĠV":468,"ĠYork":469,"ĠAmerican":470,"Ġhead":471,"Ġplayers":472,"Ġdoes":473,"Ġhealth":474,"Ġm":475,"Ġpower":476,"Ġpoint":477,"Ġhit":478,"Ġ.":479,"Ġ--":480,"Ġfree":481,".,":482,"Ġlead":483,"Ġseveral":484,"Ġrecent":485,"Ġcall":486,"N":487,"Ġlaw":488,"Ġkeep":489,"Ġopen":490,"ĠNews":491,"Ġgive":492,"ia":493,"ĠMarch":494,"D":495,"ĠNational":496,"ĠAt":497,"Ġtimes":498,"Ġfuture":499,"R":500,"Ġ14":501,"ĠJune":502,"Ġofficials":503,"Ġ18":504,"Ġimportant":505,"f":506,"Ġfinal":507,"Ġ13":508,"ĠOne":509,"P":510,"Ġfollowing":511,"Ġcar":512,"Ġleast":513,"Ġwater":514,"Ġevent":515,"Ġline":516,"Ġmove":517,"Ġservices":518,"Ġhaving":519,"ĠWhen":520,"Ġstudents":521,"ĠPolice":522,"el":523,"Ġam":524,"ĠZ":525,"Ġside":526,"Ġstory":527,"Ġdue":528,"Ġmeeting":529,"K":530,"Ġmust":531,"ĠStates":532,"Ġlikely":533,"G":534,"Ġcontinue":535,"Ġago":536,"Ġparty":537,"Ġmajor":538,"Ġindustry":539,"Ġless":540,"30":541,"Ġun":542,"Ġhard":543,"Ġservice":544,"Ġ16":545,"Ġlooking":546,"Ġheld":547,"ve":548,"Ġwhether":549,"ĠJuly":550,"Ġtaken":551,"Ġalong":552,"Ġasked":553,"Ġstarted":554,"Ġbecome":555,"Ġforward":556,"Ġresearch":557,"Ġoffice":558,"Ġpolitical":559,"to":560,"Ġtogether":561,"Ġgetting":562,"Ġplan":563,"Ġ25":564,"T":565,"Ġamong":566,"Ġcoming":567,"Ġdecision":568,"Ġvideo":569,"Ġ2015":570,"g":571,"ĠAfter":572,"Ġsecurity":573,"L":574,"Ġcare":575,"Ġgiven":576,"Ġavailable":577,"âĢĶ":578,"Ġs":579,"ĠWest":580,"'ll":581,"Ġpay":582,"Ġnear":583,"Ġsaying":584,"Ġannounced":585,"Ġprogram":586,"ĠApril":587,"Ġreal":588,"ĠUniversity":589,"ĠWith":590,"AP":591,"Ġsocial":592,"Ġclose":593,"et":594,"Ġcurrent":595,"Ġwhy":596,"F":597,"ĠTo":598,"ĠTwitter":599,"Ġthough":600,"Ġ17":601,"Ġtaking":602,"ĠInc":603,"Ġmen":604,"w":605,"Ġcomes":606,"ley":607,"Ġdoing":608,"Ġprocess":609,"ĠJohn":610,"ch":611,"00":612,"Ġfinancial":613,"Ġlow":614,"Ġenough":615,"ĠWhile":616,"Ġfurther":617,"Ġpost":618,"Ġfeel":619,"st":620,"Ġperson":621,"ĠFacebook":622,"ĠWorld":623,"Ġwithin":624,"ad":625,"Ġdone":626,"the":627,"Ġlate":628,"Ġtax":629,"Ġdoesn":630,"Ġthing":631,"Ġnational":632,"Ġjob":633,"Ġusing":634,"ĠHowever":635,"ic":636,"Ġcampaign":637,"Ġrecord":638,"Ġbehind":639,"://":640,"ĠDepartment":641,"p":642,"Ġothers":643,"ĠJanuary":644,"Ġorder":645,"Ġ[":646,"Ġsales":647,"Ġyet":648,"Ä":649,"Ġsmall":650,"Ġseries":651,"Ġface":652,"ĠWhat":653,"Ġ50":654,"Ġever":655,"Ġearlier":656,"Ġlove":657,"up":658,"Ġrights":659,"ĠAn":660,"ist":661,"Ġmorning":662,"ĠWashington":663,"Ġyoung":664,"Ġlatest":665,"ĠIndia":666,"Ġtrying":667,"Ġfire":668,"Ġled":669,"Ġstrong":670,"Ġreturn":671,"Ġlevel":672,"O":673,"Ġaverage":674,"Ġperiod":675,"Ġexperience":676,"ak":677,"Ġpossible":678,"Ġbelieve":679,"Ġinclude":680,"Ġoil":681,"Ġrecently":682,"Ġonce":683,"Ġknown":684,"Ġlost":685,"Ġsure":686,"us":687,"Ġweeks":688,"Ġfood":689,"Ġreports":690,"Ġrating":691,"ĠMinister":692,"Ġwoman":693,"Ġprovide":694,"Ġproject":695,"Ġissue":696,"Ġlive":697,"10":698,"Ġclear":699,"he":700,"Ġcost":701,"Ġplayed":702,"Ġreleased":703,"Ġcoach":704,"v":705,"Ġ24":706,"Ġseven":707,"Ġplans":708,"Ġdevelopment":709,"ur":710,"ĺ":711,"Ġincrease":712,"This":713,"Ġpolicy":714,"Ġcent":715,"Ġbased":716,"E":717,"il":718,"ĠDecember":719,"Ġglobal":720,"Ġtrade":721,"Ġhours":722,"Ġhigher":723,"Ġgoal":724,"H":725,"ĠAl":726,"Ġ100":727,"Ġminutes":728,"Ġelection":729,"ĠAmerica":730,"Ġrate":731,"ĠCh":732,"Ġ21":733,"...":734,"ĠWhite":735,"Ġdirector":736,"Ġposition":737,"Ġshot":738,"Ġlarge":739,"Ġc":740,"Ġb":741,"]":742,"Ġissues":743,"Ġdeath":744,"Ġbuilding":745,"Ġtotal":746,"Ġoften":747,"Ġv":748,"Ġcountries":749,"Ġhistory":750,"Ġoutside":751,"Ġfederal":752,"Ġ19":753,"Ġfact":754,"ĠHigh":755,"Ġcareer":756,"im":757,"Ġinternational":758,"ĠNovember":759,"Ġfront":760,"Ġkind":761,"Ġkey":762,"ra":763,"ĠSan":764,"Ġshort":765,"Ġname":766,"ĠAccording":767,"Ġcourse":768,"Ġre":769,"Ġwanted":770,"W":771,"ĠSeptember":772,"Ġinterest":773,"Ġrole":774,"Ġresults":775,"Ġeconomic":776,"Ġ2014":777,"Ġchance":778,"ĠOctober":779,"Ġspecial":780,"Ġofficial":781,"Ġneeds":782,"um":783,"Ġl":784,"Ġproducts":785,"Ġnon":786,"Ġ@":787,"ĠBank":788,"Ġahead":789,"Ġhouse":790,"U":791,"Ġboard":792,"Ġold":793,"Ġsaw":794,"Ġlower":795,"ĠEuropean":796,"Ġcontrol":797,"ĠRussia":798,"Ġeight":799,"Ġrelease":800,"Ġpotential":801,"Ġthought":802,"Ġinvestigation":803,"Ġonline":804,"based":805,"Ġtechnology":806,"ĠDonald":807,"id":808,"Ġbody":809,"Ġrisk":810,"ian":811,"Ġcapital":812,"Ġstaff":813,"Ġaction":814,"ĠLeague":815,"Ġplaying":816,"Ġmakes":817,"Ġalmost":818,"Ġperformance":819,"Ġ22":820,"Ġg":821,"Ġfilm":822,"Ġnearly":823,"ĠCenter":824,"Ġvisit":825,"ĠGroup":826,"Ġbank":827,"Ġbit":828,"Ġreceived":829,"ĠAugust":830,"Ġmilitary":831,"ĠHis":832,"ine":833,"Ġchief":834,"ĠSchool":835,"Ġbring":836,"ĠCourt":837,"Ġ(@":838,"Ġmeans":839,"ĠSh":840,"Ġfans":841,"Ġse":842,"Ġ40":843,"20":844,"\".":845,"V":846,"Ġcut":847,"Ġkilled":848,"Ġ#":849,"Ġprices":850,"Ġgave":851,"ĠStreet":852,"ir":853,"ĠY":854,"Ġcurrently":855,"Ġf":856,"ay":857,"ne":858,"te":859,"Ġtry":860,"ĠPark":861,"ĥ":862,"J":863,"Ġquestion":864,"Ġhand":865,"Ġeconomy":866,"Ġinvestors":867,"able":868,"Ġplayer":869,"ĠBy":870,"ĠDavid":871,"Ġloss":872,"ab":873,"Ġbelow":874,"Ġwrote":875,"co":876,"ate":877,"Ġrunning":878,"un":879,"Ġbegan":880,"Ġsingle":881,"Ġfield":882,"Ġ23":883,"Ġleader":884,"Ġw":885,"ĠCalifornia":886,"Ġfourth":887,"Ġactually":888,"Ġlist":889,"ll":890,"Ġcouple":891,"Ġstudy":892,"Ġteams":893,"He":894,"ah":895,"ĠCanada":896,"Ġla":897,"Ġresult":898,"Ġaccess":899,"Ġvote":900,"ĠMore":901,"ĠFebruary":902,"Ġrevenue":903,"Ġoffer":904,"Ġlet":905,"ier":906,"Ġbuy":907,"Ġattack":908,"Ġblack":909,"Ġr":910,"Ġareas":911,"Ġstop":912,"Ġimpact":913,"Ġmatch":914,"Ġinvestment":915,"Ġcustomers":916,"Ġleaders":917,"ies":918,"Ġmember":919,"Ġchild":920,"Ġroad":921,"ul":922,"Ġvalue":923,"Ġshows":924,"ĠDr":925,"ĠDe":926,"ant":927,"ĠLondon":928,"Ġroom":929,"Ġmusic":930,"Ġproduction":931,"Ġanything":932,"Ġfirm":933,"Ġbiggest":934,"Ġair":935,"Ġproblem":936,"Ġgeneral":937,"Ġwasn":938,"Ġi":939,"Ġprivate":940,"Ġespecially":941,"Ġadministration":942,"Ġadditional":943,"ĠCo":944,"Ġopportunity":945,"Ġhold":946,"&":947,"Ġmatter":948,"Ġsenior":949,"Ġclub":950,"Ġsomeone":951,"ĠÃ":952,"ĠEast":953,"Ġ2019":954,".'":955,"Ġneeded":956,"ĠJames":957,"time":958,"Ġhowever":959,"Ġeverything":960,"Ġeveryone":961,"Ġdied":962,"Ġinvolved":963,"Ġfriends":964,"Ġisn":965,"Ġworth":966,"ik":967,"ĠCup":968,"Ġshowed":969,"There":970,"Ġ28":971,"Ġmeet":972,"Ġ26":973,"Ġ27":974,"Y":975,"Ġregion":976,"ĠPress":977,"ĠNow":978,"Ġson":979,"Ġspace":980,"Ġleading":981,"Ġstates":982,"Ġweekend":983,"Ġ£":984,"Ġmother":985,"Ġprevious":986,"ĠUK":987,"ĠMichael":988,"Ġleave":989,"est":990,"em":991,"Ġz":992,"ĠSome":993,"ors":994,"out":995,"15":996,"Ġwar":997,"Ġwebsite":998,"Ġstar":999,"X":1000,"ro":1001,"Ġtarget":1002,"Ġhimself":1003,"Ġturn":1004,"ĠEurope":1005,"Ġworked":1006,"Ġenergy":1007,"Ġscored":1008,"Ġ*":1009,"Ġsoon":1010,"Ġball":1011,"ĠTV":1012,"Ġannual":1013,"Ġ2013":1014,"Ġrace":1015,"ĠInternational":1016,"'d":1017,"ĠMarket":1018,"Ġconference":1019,"io":1020,"Ġo":1021,"Ġchanges":1022,"ig":1023,"Ġofficers":1024,"Ġinside":1025,"Ġform":1026,"Ġpublished":1027,"Ġphone":1028,"Ġco":1029,"Ġlegal":1030,"Ġexecutive":1031,"Ġfight":1032,"ings":1033,"Ġhope":1034,"Ġsummer":1035,"Ġofficer":1036,"Ġfootball":1037,"Ġproperty":1038,"@":1039,"Ġbook":1040,"Ġparents":1041,"Ġcosts":1042,"ac":1043,"Ġmanager":1044,"Ġcreate":1045,"Ġage":1046,"Ġemail":1047,"Ġmarkets":1048,"Ġmain":1049,"Ġhuman":1050,"Ġsent":1051,"Ġmanagement":1052,"ĠDay":1053,"ton":1054,"Ġcash":1055,"Ġfocus":1056,"Ġexpect":1057,"Ġtraining":1058,"Ġbecame":1059,"Ġwhose":1060,"Ġevents":1061,"Ġround":1062,"ĠLe":1063,"Ġfell":1064,"Ġabove":1065,"Ġanalysts":1066,"Ġtalk":1067,"Ġsituation":1068,"ri":1069,"ated":1070,"ke":1071,"Ġwants":1072,"ag":1073,"Ġlives":1074,"om":1075,"Ġal":1076,"Ġdemand":1077,"Ġsafety":1078,"Ġrest":1079,"ĠCouncil":1080,"Ġpersonal":1081,"Ġsite":1082,"ĠRussian":1083,"Ġmid":1084,"Ġnothing":1085,"Ġwhole":1086,"Ġbill":1087,"Ġsold":1088,"ĠBritish":1089,"se":1090,"Ġremain":1091,"12":1092,"Ġforeign":1093,"Ġshooting":1094,"Ġstay":1095,"50":1096,"ang":1097,"Ġhospital":1098,"Ġbad":1099,"Ġaddress":1100,"ĠKorea":1101,"Ġhappened":1102,"Ġcharges":1103,"Ġwhite":1104,"Ġ31":1105,"If":1106,"Ġearnings":1107,"Ġbreak":1108,"Ġlight":1109,"Ġterms":1110,"ĠChinese":1111,"ĠSenate":1112,"ana":1113,"Ġidea":1114,"ap":1115,"of":1116,"Ġnine":1117,"Ġcompared":1118,"Ġbuild":1119,"ard":1120,"In":1121,"Ġsimilar":1122,"Ġgas":1123,"Ġvictory":1124,"Ġ2012":1125,"Ġdebt":1126,"ĠMar":1127,"Ġarrested":1128,"Ġcomment":1129,"Ġincreased":1130,"Ġmedical":1131,"Ġ29":1132,"ĠJan":1133,"Ġgroups":1134,"Ġdespite":1135,"Ġfall":1136,"Ġtell":1137,"Ġworkers":1138,"Ġtown":1139,"é":1140,"Ġwife":1141,"Ġquestions":1142,"Ġcontinued":1143,"Ġheart":1144,"Ġmet":1145,"Ġbrought":1146,"Ġhelped":1147,"ĠCongress":1148,"Ġstep":1149,"Ġfather":1150,"Ġmoment":1151,"Ġproduct":1152,"Ġprobably":1153,"Ġlargest":1154,"Ġvehicle":1155,"ĠEngland":1156,"Ġallow":1157,"Ġstarting":1158,"Ġkids":1159,"Ġincident":1160,"Ġnet":1161,"Ġrates":1162,"ĠRead":1163,"Ġpressure":1164,"Ġincluded":1165,"Ġread":1166,"Ġissued":1167,"ol":1168,"Ġeither":1169,"Ġefforts":1170,"Ġincludes":1171,"ĠRepublican":1172,"ish":1173,"â̦":1174,"Ġgoals":1175,"aj":1176,"Ġen":1177,"x":1178,"Ġraised":1179,"au":1180,"Ġlonger":1181,"ut":1182,"Ġwatch":1183,"ĠTexas":1184,"You":1185,"Ġrange":1186,"nd":1187,"Ġfunds":1188,"Ġremains":1189,"ĠMark":1190,"Ġ60":1191,"Ġque":1192,"sh":1193,"Ġinterview":1194,"Ġrather":1195,"Ġresidents":1196,"Ġgrowing":1197,"Ġpre":1198,"Ġpaid":1199,"Ġcases":1200,"ĠReuters":1201,"Ġdifficult":1202,"Ġsign":1203,"ĠGoogle":1204,"Ġhttps":1205,"ĠPaul":1206,"Ġliving":1207,"day":1208,"ĠQ":1209,"iz":1210,"ĠRed":1211,"Ġland":1212,"They":1213,"ĠRoad":1214,"_":1215,"ĠThese":1216,"Ġview":1217,"Ġagency":1218,"Ġreason":1219,"Ġallowed":1220,"ĠAustralia":1221,"az":1222,"ĠRe":1223,"Ġturned":1224,"11":1225,"Ġnation":1226,"Ġready":1227,"Ġpress":1228,"Ġbudget":1229,"Ġdaily":1230,"ĠChief":1231,"Ġfamilies":1232,"Ġsignificant":1233,"ĠFirst":1234,"Ġthemselves":1235,"Ġj":1236,"Ġruns":1237,"Ġaccused":1238,"Ġtakes":1239,"Ġspent":1240,"Ġvia":1241,"ot":1242,"ina":1243,"25":1244,"land":1245,"Ġexample":1246,"Ġauthorities":1247,"Ġdate":1248,"Ġended":1249,"all":1250,"Reuters":1251,"Ġbusinesses":1252,"ans":1253,"Ġdetails":1254,"Ġground":1255,"Ġpretty":1256,"ĠApple":1257,"ation":1258,"ĠSmith":1259,"ĠCompany":1260,"ĠFlorida":1261,"Ġdrug":1262,"Ġresponse":1263,"one":1264,"Ġeducation":1265,"Ġmean":1266,"Ġleague":1267,"Ġanyone":1268,"Ġminister":1269,"Ġtitle":1270,"Ġadding":1271,"Ġproblems":1272,"Ġopening":1273,"Ġconditions":1274,"Ġred":1275,"Ġdecided":1276,"Å":1277,"Ġposted":1278,"term":1279,"Ġamount":1280,"ĠEU":1281,"Ġsuccess":1282,"Ġevidence":1283,"ĠObama":1284,"Ġaddition":1285,"Ġprovided":1286,"ĠLos":1287,"Ġagreement":1288,"Ġstage":1289,"ens":1290,"Ġrelationship":1291,"ĠGeneral":1292,"Ġsector":1293,"Ġstudent":1294,"ating":1295,"Ġtest":1296,"\",":1297,"Ġwinning":1298,"Ġfelt":1299,"Ġsource":1300,"Z":1301,"Ġseems":1302,"Ġcause":1303,"Ġschools":1304,"Ġdrive":1305,"Ġensure":1306,"Ġhuge":1307,"ĠMy":1308,"ĠHealth":1309,"Ġscene":1310,"Ġgiving":1311,"Ġcenter":1312,"Ġpositive":1313,"Ġyards":1314,"Ġjobs":1315,"Ġaccount":1316,"Ġheard":1317,"Ġquality":1318,"Ġways":1319,"Ġimmediately":1320,"Ġemployees":1321,"are":1322,"Ġpass":1323,"ĠCEO":1324,"Ġreceive":1325,"Ġlooks":1326,"ĠAfrica":1327,"Ġthroughout":1328,"led":1329,"Ġrelated":1330,"Ġsell":1331,"ĠUnion":1332,"ĠPhoto":1333,"ter":1334,"Ġquickly":1335,"ĠHow":1336,"Ġvarious":1337,"Ġreach":1338,"Ġpick":1339,"Ġcharged":1340,"Ġquite":1341,"ent":1342,"q":1343,"ins":1344,"Ġphoto":1345,"Ġunderstand":1346,"ĠâĢ¢":1347,"Ġreached":1348,"Ġtrack":1349,"uk":1350,"Ġeffort":1351,"ville":1352,"Ġcentral":1353,"Ġdaughter":1354,"Ġcontract":1355,"Ġinjury":1356,"Ġopened":1357,"Ġ($":1358,"Ġstraight":1359,"17":1360,"Ġcredit":1361,"ĠIndian":1362,"Ġsexual":1363,"Ġworks":1364,"Ġeasy":1365,"18":1366,"Ġclosed":1367,"Ġh":1368,"Ġhappen":1369,"Ġforce":1370,"ler":1371,"Ġhappy":1372,"Ġshared":1373,"Ġoverall":1374,"Ġmoving":1375,"á":1376,"Ġprojects":1377,"ĠBlack":1378,"Ġconcerns":1379,"Ġclass":1380,"Ġtried":1381,"Ġappeared":1382,"Ġcontent":1383,"ĠDistrict":1384,"Ġterm":1385,"Ġinstead":1386,"ĠOffice":1387,"Ġcontinues":1388,"Ġlevels":1389,"Ġafternoon":1390,"Ġfund":1391,"Ġsale":1392,"Ġdriver":1393,"Ġask":1394,"Ġcannot":1395,"ner":1396,"end":1397,"ĠHere":1398,"field":1399,"Ġstore":1400,"www":1401,"Ġcertain":1402,"Ġself":1403,"Ġdollar":1404,"ĠHer":1405,"Ġpopular":1406,"Ġfollow":1407,"Ġspending":1408,"by":1409,"Ġmoved":1410,"Ġgoes":1411,"Ġcreated":1412,"Ġstand":1413,"Ġoperations":1414,"Ġlooked":1415,"Ġtreatment":1416,"ov":1417,"Ġdistrict":1418,"Ġsigned":1419,"Ġhands":1420,"Ġmodel":1421,"ĠAngeles":1422,"Ġy":1423,"Ġborder":1424,"Ġincome":1425,"ĠLast":1426,"Ġcharge":1427,"Ġdriving":1428,"ĠJapan":1429,"Ġrise":1430,"Ġtalks":1431,"Ġfollowed":1432,"Ġpreviously":1433,"Ġusers":1434,"Ġfunding":1435,"ĠJohnson":1436,"Ġ":1437,"ou":1438,"ai":1439,"Ġnamed":1440,"Ġfriend":1441,"ĠNov":1442,"Ġdefense":1443,"ĠBritain":1444,"Ġentire":1445,"Ġtrading":1446,"Ġfailed":1447,"ĠEl":1448,"Ġclaims":1449,"Ġcomments":1450,"Ġbeat":1451,"ib":1452,"Ġbasis":1453,"ĠJones":1454,"Ġpresent":1455,"ĠBe":1456,"Ġdouble":1457,"Ġrose":1458,"ite":1459,"Ġability":1460,"Ġoriginal":1461,"Ġdead":1462,"ĠCommission":1463,"ĠMe":1464,"Ġcompetition":1465,"Ġ2011":1466,"Ġknew":1467,"Ġmaterial":1468,"av":1469,"ĠFrance":1470,"Ġscore":1471,"Ġsense":1472,"Ġserious":1473,"Ġconfirmed":1474,"Ġanti":1475,"Ġviolence":1476,"Ġimprove":1477,"son":1478,"ó":1479,"ĠAP":1480,"Ġsh":1481,"Ġhost":1482,"ĠMike":1483,"Ġpatients":1484,"ĠNFL":1485,"Ġcrisis":1486,"Ġrevealed":1487,"ach":1488,"ĠPrime":1489,"Ġbuilt":1490,"ĠNot":1491,"Ġrules":1492,"Ġelse":1493,"Ġdepartment":1494,"Ġitself":1495,"ise":1496,"500":1497,"Ġcomplete":1498,"ion":1499,"Ġtrial":1500,"ĠBay":1501,"ĠDec":1502,"Ġattention":1503,"Ġtravel":1504,"ĠCentral":1505,"ry":1506,"Ġagreed":1507,"Ġmind":1508,"ĠMc":1509,"Ġ70":1510,"Ġcontact":1511,"ari":1512,"ĠTimes":1513,"Ġspot":1514,"ĠFrench":1515,"Ġgets":1516,"op":1517,"Ġbrand":1518,"Ġcalls":1519,"Ġbanks":1520,"Ġdesign":1521,"Ġsafe":1522,"Ġoffers":1523,"Ġpractice":1524,"ĠOf":1525,"á":1526,"ling":1527,"Ġtrue":1528,"off":1529,"Ġnumbers":1530,"Ġfun":1531,"Ġlearn":1532,"Ġmultiple":1533,"ĠIs":1534,"res":1535,"als":1536,"Ġcommon":1537,"ized":1538,"Ġchallenge":1539,"Ġcommittee":1540,"ĠOur":1541,"Ġbase":1542,"ani":1543,"ĠAssociation":1544,"ung":1545,"Ġnetwork":1546,"ĠBrown":1547,"Ġapproach":1548,"16":1549,"Ġfinished":1550,"Ġreview":1551,"Ġrequired":1552,"Ġapp":1553,"ĠMan":1554,"Ġâ̦":1555,"twitter":1556,"ĠDemocratic":1557,"13":1558,"Ġevening":1559,"ĠTom":1560,"ä":1561,"ĠAssociated":1562,"ĠCanadian":1563,"Ġcollege":1564,"Ġspokesman":1565,"Ġarticle":1566,"Ġtowards":1567,"ĠChicago":1568,"Ġmovie":1569,"14":1570,"ity":1571,"Ġforces":1572,"ĠChris":1573,"ĠDemocrats":1574,"Ġfeatures":1575,"Ġhearing":1576,"ĠX":1577,"ĠAlso":1578,"Ġmessage":1579,"age":1580,"Ġnoted":1581,"ĠSuper":1582,"Ġthousands":1583,"aw":1584,"ĠBill":1585,"ĠAr":1586,"ĠLa":1587,"ip":1588,"Ġ/":1589,"ĠDuring":1590,"Ġnote":1591,".)":1592,"Ġwrong":1593,"if":1594,"Ġpassed":1595,"ĠTwo":1596,"Ġdie":1597,",'":1598,"ĠDon":1599,"ĠGermany":1600,"Ġletter":1601,"Ġdescribed":1602,"ĠIran":1603,"ĠWilliams":1604,"Ġparticularly":1605,"Ġadd":1606,"Ġconversation":1607,"ĠSe":1608,"Ġhighest":1609,"be":1610,"Ġhomes":1611,"Ġsports":1612,"Ġgone":1613,"ĠAd":1614,"Ġel":1615,"Ġopportunities":1616,"Ġwords":1617,"Ġleaving":1618,"ĠChristmas":1619,"As":1620,"ĠGovernment":1621,"Ġsimply":1622,"Ġhusband":1623,"ĠResearch":1624,"ĠMexico":1625,"ates":1626,"ale":1627,"ĠGreen":1628,"$":1629,"od":1630,"ĠHall":1631,"Ġnatural":1632,"Ġoperating":1633,"les":1634,"ations":1635,"ĠKim":1636,"Ġgold":1637,"ok":1638,"Ġprovides":1639,"(":1640,"ell":1641,"Ġbegin":1642,"ĠParty":1643,"back":1644,"ĠAmazon":1645,"19":1646,"Ġmajority":1647,"ĠEven":1648,"Ġcheck":1649,"Ġweather":1650,"Ġorganization":1651,"Ġstories":1652,"ĠCar":1653,"Ġforced":1654,"ĠGeorge":1655,"Ġwalk":1656,"ong":1657,"Ġfiled":1658,"ĠJustice":1659,"Ġlaunched":1660,"Ġoffered":1661,"Ġwww":1662,"Ġconstruction":1663,"ĠBen":1664,"Ġserved":1665,"Ġ...":1666,"Ġparts":1667,"Ġcancer":1668,"Ġguys":1669,"Reporting":1670,"ash":1671,"less":1672,"Ġleadership":1673,"ĠCommittee":1674,"Ġregular":1675,"Ġcouncil":1676,"Ġcars":1677,"ĠDirector":1678,"Ġjudge":1679,"Ġvictims":1680,"ĠDaily":1681,"Ġkept":1682,"Ġeffect":1683,"Ġbeyond":1684,"pm":1685,"Ġtalking":1686,"Ġconsidered":1687,"ore":1688,"ĠAdvertisement":1689,"Ġst":1690,"ED":1691,"Ġmiddle":1692,"Ġraise":1693,"we":1694,"Ġclaimed":1695,"ino":1696,"Ġalleged":1697,"ĠPro":1698,"ĠScott":1699,"ĠOct":1700,"Ġconsider":1701,"ĠShare":1702,"Ġtraffic":1703,"ĠAfrican":1704,"Ġcouldn":1705,"Ġtoward":1706,"Ġsearch":1707,"But":1708,"Ġlaunch":1709,"Ġinjured":1710,"That":1711,"Ġalthough":1712,"Ġactivities":1713,"Ġchanged":1714,"Ġsources":1715,"Ġmissing":1716,"Ġu":1717,"Ġ35":1718,"Ġcover":1719,"ised":1720,"Ġ|":1721,"ow":1722,"ES":1723,"Ġdecades":1724,"ich":1725,"Ġcaused":1726,"Ġelections":1727,"ane":1728,"IS":1729,"Ġfeet":1730,"ĠBar":1731,"Ġversion":1732,"Ġgrow":1733,"Ġvehicles":1734,"Ġoptions":1735,"Ġindividual":1736,"Ġenvironment":1737,"ĠRobert":1738,"ĠValley":1739,"ĠFrom":1740,"per":1741,"ara":1742,"Ġsystems":1743,"Ġprotect":1744,"ĠKing":1745,"Ġinjuries":1746,"Ġfinally":1747,"Ġnuclear":1748,"40":1749,"Ġratio":1750,"Ġgun":1751,"ĠPakistan":1752,"ĠManagement":1753,"ĠAir":1754,"ce":1755,"Ġopposition":1756,"ment":1757,"ick":1758,"Ġpro":1759,"Ġact":1760,"Ġplatform":1761,"Ġlack":1762,"Ġpair":1763,"Ġ500":1764,"Ġcalling":1765,"ary":1766,"Ġprograms":1767,"Ġscheduled":1768,"Ġfast":1769,"Ġjoined":1770,"ĠWar":1771,"ĠEditing":1772,"ĠSince":1773,"ĠRyan":1774,"ĠMac":1775,"ĠBig":1776,"ĠLake":1777,"Ġdigital":1778,"When":1779,"ue":1780,"Ġassets":1781,"Ġseeing":1782,"ĠAct":1783,"Ġpartner":1784,"ĠBoard":1785,"Ġbeginning":1786,"Ġsupply":1787,"Ġmiles":1788,"Ġprison":1789,"ons":1790,"ĠAmericans":1791,"ub":1792,"ĠOr":1793,"me":1794,"Ġbenefits":1795,"Ġbenefit":1796,"Ġmeasures":1797,"Ġhear":1798,"Ġparties":1799,"Ġsuccessful":1800,"ĠJust":1801,"Ġvictim":1802,"Ġblock":1803,"Ġlimited":1804,"Ġtrip":1805,"ĠPeople":1806,"Ġserve":1807,"Ġart":1808,"ism":1809,"Ġwide":1810,"ĠSch":1811,"Ġ80":1812,"ĠThomas":1813,"Ġ90":1814,"Ġstocks":1815,"Ġgirl":1816,"ĠAsia":1817,"Ġseeking":1818,"Ġcertainly":1819,"ĠServices":1820,"ĠCollege":1821,"Ġcommunities":1822,"Ġextra":1823,"Ġ2010":1824,"ness":1825,"Ġholding":1826,"ous":1827,"Ġtough":1828,"ade":1829,"Ġmobile":1830,"Ġowns":1831,"ĠDo":1832,"ĠFire":1833,"Ġspoke":1834,"Ġreturned":1835,"Ġsize":1836,"Ġcriminal":1837,"ĠInstagram":1838,"Ġoffering":1839,"ĠGod":1840,"ĠService":1841,"Ġpage":1842,"her":1843,"Ġdeep":1844,"wood":1845,"Ġcrime":1846,"ĠSports":1847,"ile":1848,"ĠGlobal":1849,"Ġproposed":1850,"ain":1851,"Ġsession":1852,"ĠFederal":1853,"ĠSyria":1854,"Ġch":1855,"Ġthreat":1856,"Ġallegations":1857,"ĠRepublicans":1858,"ĠGerman":1859,"Ġstrategy":1860,"Ġcommercial":1861,"ING":1862,"ĠSecretary":1863,"Q":1864,"Ġreporters":1865,"100":1866,"ĠCapital":1867,"ĠBoth":1868,"ĠPost":1869,"ĠIsrael":1870,"Ġsave":1871,"ts":1872,"ill":1873,"Ġdrop":1874,"Ġreserved":1875,"ĠMany":1876,"Ġavoid":1877,"Ġ200":1878,"iv":1879,"Ġdamage":1880,"Ġcondition":1881,"Ġdropped":1882,"Ġdoor":1883,"Ġplanning":1884,"ire":1885,"Ġcard":1886,"Ġdesigned":1887,"Ġreduce":1888,"AN":1889,"ĠUn":1890,"ford":1891,"ĠThen":1892,"Ġpic":1893,"ĠCopyright":1894,"Ġrain":1895,"ĠMartin":1896,"Ġdomestic":1897,"45":1898,"ge":1899,"Ġmurder":1900,"Ġspeech":1901,"line":1902,"Ġhelping":1903,"Ġplanned":1904,"Ġfeature":1905,"ud":1906,"Ġtype":1907,"ham":1908,"ĠPublic":1909,"ja":1910,"Ġinsurance":1911,"Ġattacks":1912,"ĠCorp":1913,"Ġforecast":1914,"Ġresources":1915,"ma":1916,"?\"":1917,"ĠAm":1918,"ĠSept":1919,"Ġpush":1920,"Ġattorney":1921,"23":1922,"Ġemergency":1923,"Ġwinner":1924,"Ġblood":1925,"Ġnorth":1926,"ĠFeb":1927,"Ġbaby":1928,"Ġfloor":1929,"Ġspend":1930,"Ġex":1931,"Ġdollars":1932,"Ġunit":1933,"ĠHill":1934,"Ġder":1935,"ĠAbout":1936,"Ġalone":1937,"ization":1938,"Ġpresidential":1939,"Ġactivity":1940,"ĠTHE":1941,"ee":1942,"ber":1943,"ĠOther":1944,"Ġowner":1945,"Ġhour":1946,"Ġcities":1947,"Ġanswer":1948,"ide":1949,"Ġfully":1950,"ek":1951,"ists":1952,"Ġcoverage":1953,"Ġvs":1954,"Ġfigure":1955,"Ġpopulation":1956,"org":1957,"Ġsnow":1958,"Ġbecoming":1959,"ĠSam":1960,"ĠCarolina":1961,"Ġjoin":1962,"Ġprofit":1963,"Ġitems":1964,"Ġindex":1965,"Ġanalysis":1966,"Ġtournament":1967,"Ġstake":1968,"Ġperfect":1969,"way":1970,"Ġband":1971,"Ġgirls":1972,"Ġoption":1973,"Ġplays":1974,"oc":1975,"Ġproviding":1976,"ÃŃ":1977,"24":1978,"Ġwouldn":1979,"Ġones":1980,"Ġdeclined":1981,"Ġwritten":1982,"Ġvoters":1983,"Ġcandidate":1984,"Ġsuspect":1985,"Ġpolicies":1986,"Ġpeace":1987,"ast":1988,"Ġparticular":1989,"for":1990,"Ġhopes":1991,"Ġstation":1992,"ĠMost":1993,"Ġspeak":1994,"ĠRiver":1995,"Ġasking":1996,"Ġstatements":1997,"Ġfifth":1998,"ha":1999,"ĠNigeria":2000,"af":2001,"Ġexplained":2002,"Ġbar":2003,"Ġhousing":2004,"ĠSanta":2005,"Ġidentified":2006,"Ġsimple":2007,"Ġcritical":2008,"ĠClub":2009,"ĠSecurity":2010,"ĠLike":2011,"Ġstarts":2012,"art":2013,"Ġstreet":2014,"Ġreality":2015,"Ġheavy":2016,"Ġprogress":2017,"Ġshowing":2018,"Ġchallenges":2019,"Ġban":2020,"Ġcommitted":2021,"35":2022,"»":2023,"Ġdirectly":2024,"Ġaren":2025,"Ġclaim":2026,"ĠWestern":2027,"ind":2028,"Ġgives":2029,"ĠSaudi":2030,"Ġchoice":2031,"ĠTh":2032,"Ġapproved":2033,"Ġlocated":2034,"Ġarrived":2035,"22":2036,"Ġcaught":2037,"Ġprofessional":2038,"Ġmissed":2039,"Ġculture":2040,"ĠYear":2041,"ĠOhio":2042,"ĠLtd":2043,"ĠAnother":2044,"Ġseem":2045,"Ġbelieves":2046,"Ġbelieved":2047,"Ġcharacter":2048,"ĠAug":2049,"red":2050,"Ġfine":2051,"Ġprior":2052,"Ġthinking":2053,"Ġhttp":2054,"Ġ+":2055,"Ġzone":2056,"Ġputting":2057,"Ġcrash":2058,"ĠAustralian":2059,"ĠAb":2060,"Ġfocused":2061,"ĠREUTERS":2062,"ĠFox":2063,"ĠSp":2064,"Ġtraditional":2065,"Ġanalyst":2066,"Ġwait":2067,"IT":2068,"Ġrequest":2069,"ru":2070,"ians":2071,"ize":2072,"Ġfinish":2073,"Ġlaws":2074,"Ġran":2075,"ER":2076,"Ġsouth":2077,"Ġspeed":2078,"Ġmovement":2079,"Ġassault":2080,"Ġexchange":2081,"Ġappear":2082,"ĠSun":2083,"Ġle":2084,"Ġmaybe":2085,"Ġlosing":2086,"Ġsubject":2087,"ive":2088,"mer":2089,"ĠBusiness":2090,"ĠBl":2091,"Ġappears":2092,"Ġadvantage":2093,"ĠLee":2094,"ada":2095,"ĠUnder":2096,"Ġprevent":2097,"Ġrespect":2098,"Ġsex":2099,"Ġcentre":2100,"ĠJoe":2101,"ado":2102,"Ġtable":2103,"Ġequipment":2104,"Ġfair":2105,"Ġtour":2106,"Ġ32":2107,"ĠFinancial":2108,"Ġcounty":2109,"Ġdevices":2110,"Ġcustomer":2111,"Ġinfrastructure":2112,"Ġexpectations":2113,"Ġfacing":2114,"Ġupon":2115,"Ġcross":2116,"ĠOpen":2117,"AL":2118,"Ġquick":2119,"Ġattempt":2120,"Ġcompleted":2121,"Ġfacility":2122,"Ġconfidence":2123,"ĠSupreme":2124,"Ġpiece":2125,"our":2126,"Ġplaces":2127,"Ġsometimes":2128,"Ġpoor":2129,"Ġstorm":2130,"Ġhot":2131,"Ġaffected":2132,"na":2133,"Ġabuse":2134,"ĠMs":2135,"Ġword":2136,"over":2137,"Ġbrother":2138,"Ġnecessary":2139,"Ġeventually":2140,"ĠStar":2141,"Ġsend":2142,"Ġboy":2143,"ĠRs":2144,"Ġremember":2145,"21":2146,"Ġclimate":2147,"Ġcapacity":2148,"Ġresponsible":2149,"ĠMatt":2150,"month":2151,"Ġsuffered":2152,"%.":2153,"og":2154,"ĠPeter":2155,"Ġ,":2156,"Ġfeeling":2157,"ze":2158,"Ġbuying":2159,"oy":2160,"ij":2161,"Ġbought":2162,"Ġactions":2163,"Ġowned":2164,"Ġ___":2165,"Ġphysical":2166,"Ġspecific":2167,"Ġbattle":2168,"ĠEnergy":2169,"Ġpicture":2170,"Ġactive":2171,"Ġindividuals":2172,"Ġguy":2173,"Ġregional":2174,"Ġbond":2175,"ows":2176,"ĠToronto":2177,"Ġrule":2178,"Ġdevelop":2179,"Ġcrowd":2180,"Ġguilty":2181,"Ġfemale":2182,"Ġselling":2183,"ĠFollow":2184,"Ġmyself":2185,"ata":2186,"Ġdevice":2187,"Ġreasons":2188,"Ġrecords":2189,"Ġfighting":2190,"ON":2191,"ities":2192,"ĠHome":2193,"Ġstatus":2194,"Ġplant":2195,"Ġdrugs":2196,"ĠChurch":2197,"Ġcompletely":2198,"Ġdisease":2199,"Ġhighly":2200,"ĠParis":2201,"Ġdecade":2202,"Ġowners":2203,"Ġwall":2204,"Ġcamp":2205,"ĠSteve":2206,"Ġreporting":2207,"Ġearned":2208,"ĠImages":2209,"Ġexisting":2210,"ĠSen":2211,"Ġconcern":2212,"Ġhundreds":2213,"Ġsong":2214,"Ġknows":2215,"Ġunique":2216,"Ġlose":2217,"ĠKh":2218,"Ġapproximately":2219,"Ġhaven":2220,"Ġpark":2221,"Ġindependent":2222,"ĠAlthough":2223,"ĠAndrew":2224,"Ġpaper":2225,"Ġdeveloped":2226,"Ġrising":2227,"Ġdirect":2228,"Ġpurchase":2229,"Ġexactly":2230,"Ġq":2231,"Ġmassive":2232,"Ġbox":2233,"Ġchampion":2234,"ĠClinton":2235,"Ġvoice":2236,"Ġarrest":2237,"ĠKorean":2238,"Ġlearning":2239,"ĠVirginia":2240,"Ġsa":2241,"Ġpar":2242,"Ġchairman":2243,"Ġagencies":2244,"Ġhealthy":2245,"ĠThose":2246,"Ġpowerful":2247,"Ġ45":2248,"Ġdifference":2249,"ĠJackson":2250,"Ġenforcement":2251,"Ġdividend":2252,"qu":2253,"Ġenjoy":2254,"Ġruling":2255,"Ġongoing":2256,"Ġsoftware":2257,"ks":2258,"Ġlocation":2259,"Ġmostly":2260,"Ġcandidates":2261,"men":2262,"Ġbroke":2263,"What":2264,"ĠBr":2265,"Ġ2008":2266,"Ġconsumer":2267,"Ġdiscuss":2268,"Ġdi":2269,"Ġprimary":2270,"ĠEn":2271,"Ġgreen":2272,"Ġconcerned":2273,"Ġimage":2274,"ĠPremier":2275,"ĠMeanwhile":2276,"Ġfired":2277,"ĠBoston":2278,"ann":2279,"Ġcamera":2280,"Ġtraded":2281,"Ġhasn":2282,"Ġexcited":2283,"Ġincreasing":2284,"ĠDespite":2285,"Ġcitizens":2286,"Ġeuro":2287,"Ġreportedly":2288,"Ġminute":2289,"ĠWill":2290,"ĠLLC":2291,"Ġsp":2292,"ĠMichigan":2293,"Ġstopped":2294,"Ġeye":2295,"Ġdenied":2296,"Ġmodern":2297,"ĠWall":2298,"Ġdefinitely":2299,"point":2300,"Ġlines":2301,"Ġpolitics":2302,"Ġhotel":2303,"Ġretail":2304,"Ġstated":2305,"ĠOver":2306,"Ġgrew":2307,"Ġbroadcast":2308,"Ġlegislation":2309,"Ġfresh":2310,"Ġbid":2311,"Ġmanaged":2312,"Ġsociety":2313,"Ġscoring":2314,"ĠGet":2315,"Ġintelligence":2316,"Ġholiday":2317,"Ġgovernor":2318,"Ġestimated":2319,"Ġexperts":2320,"ĠJeff":2321,"Ġstruck":2322,"Ġhits":2323,"Ġcarry":2324,"Ġplaced":2325,"Ġstores":2326,"Ġexpressed":2327,"Ġvalued":2328,"Ġad":2329,"Ġtwice":2330,"ala":2331,"Ġdisplay":2332,"Ġusually":2333,"Ġresponded":2334,"Ġdog":2335,"AS":2336,"ĠFed":2337,"Ġ2009":2338,"Ġdocuments":2339,"Ġnormal":2340,"Ġtrain":2341,"Ġfl":2342,"Ġshown":2343,"ĠEd":2344,"Ġsort":2345,"Ġallegedly":2346,"Ġshots":2347,"ka":2348,"Ġaccounts":2349,"Ġyesterday":2350,"Ġcreating":2351,"Ġchurch":2352,"Ġbus":2353,"Ġaward":2354,"Ġequity":2355,"Ġphotos":2356,"Ġ33":2357,"Ġfiscal":2358,"je":2359,"Ġconsumers":2360,"ĠManchester":2361,"no":2362,"ĠKevin":2363,"Ġgain":2364,"Ġcorporate":2365,"Ġcivil":2366,"ĠMiddle":2367,"ally":2368,"Ġsound":2369,"ĠEnglish":2370,"IC":2371,"Ġwinds":2372,"Ġworst":2373,"ĠGrand":2374,"Ġeffective":2375,"ĠIsland":2376,"Ġdrivers":2377,"Ġfan":2378,"pe":2379,"Ġsides":2380,"ĠGo":2381,"Ġclean":2382,"âĢĵ":2383,"Ġtelevision":2384,"ĠJr":2385,"Ġallows":2386,"My":2387,"Ġgreater":2388,"ance":2389,"Ġdecisions":2390,"Ġrestaurant":2391,"ĠHospital":2392,"ĠTr":2393,"Ġbalance":2394,"Ġmph":2395,"Ġkeeping":2396,"Ġseconds":2397,"Ġweapons":2398,"ert":2399,"Ġpain":2400,"ass":2401,"Ġsteps":2402,"ger":2403,"ĠBrexit":2404,"Ġremaining":2405,"Ġbringing":2406,"ure":2407,"Ġweight":2408,"And":2409,"Ġwriting":2410,"Photo":2411,"ĠChristian":2412,"ob":2413,"Ġsport":2414,"Ġfigures":2415,"Ġtrust":2416,"Ġskills":2417,"Ġseat":2418,"Ġfaces":2419,"ck":2420,"Ġborn":2421,"Ġsuper":2422,"Ġfuel":2423,"Ġdel":2424,"Ġmeant":2425,"ica":2426,"Ġjustice":2427,"Ġspring":2428,"Ġkilling":2429,"Ġnegative":2430,"ĠRichard":2431,"Ġund":2432,"Ġfactors":2433,"Ġsigns":2434,"Ġlearned":2435,"ĠGame":2436,"Ġaudience":2437,"Ġdeliver":2438,"Ġillegal":2439,"Ġblue":2440,"Ġscreen":2441,"Ġremained":2442,"Ġannouncement":2443,"IN":2444,"Ġwaiting":2445,"Ġthanks":2446,"Ġimmigration":2447,"ĠFBI":2448,"Ġwarned":2449,"Ġmeasure":2450,"Ġdraw":2451,"Ġpositions":2452,"Ġdebut":2453,"ĠMedia":2454,"Ġallowing":2455,"air":2456,"hen":2457,"Ġmark":2458,"ys":2459,"Ġprepared":2460,"ĠVegas":2461,"ep":2462,"ice":2463,"2018":2464,"Ġdefensive":2465,"60":2466,"ĠBeach":2467,"Ġpulled":2468,"£":2469,"Ġlawyer":2470,"Ġcast":2471,"Ġsolution":2472,"Ġeyes":2473,"Ġmarketing":2474,"ĠFoundation":2475,"Ġrisks":2476,"ĠToday":2477,"za":2478,"Ġdraft":2479,"Ġice":2480,"26":2481,"ĠHar":2482,"ĠExecutive":2483,"Ġtruck":2484,"ions":2485,"ĠYour":2486,"ĠIreland":2487,"ĠJim":2488,"Ġha":2489,"Ġfear":2490,"Ġ36":2491,"UR":2492,"ĠFord":2493,"Ġwatching":2494,"ien":2495,"Ġstyle":2496,"ĠGood":2497,"Ġwearing":2498,"ĠHouston":2499,"Ġonto":2500,"Ġboost":2501,"Ġapplication":2502,"ĠDan":2503,"Ġspread":2504,"ĠDavis":2505,"Ġstrike":2506,"els":2507,"Ġwind":2508,"Ġinterested":2509,"Ġguard":2510,"Ġmission":2511,"Ġyourself":2512,"Ġoperation":2513,"Ġlarger":2514,"She":2515,"Ġseasons":2516,"28":2517,"27":2518,"Ġrespond":2519,"ci":2520,"ĠCentre":2521,"Our":2522,"Ġnames":2523,"Ġflight":2524,"Ġquarterback":2525,"Ġstandard":2526,"so":2527,"Ġsuggested":2528,"ĠMal":2529,"Ġolder":2530,"ini":2531,"Ġperhaps":2532,"ont":2533,"ĠInstitute":2534,"Ġmillions":2535,"Ġmental":2536,"ÃĤ":2537,"ga":2538,"Ġclients":2539,"Ġplease":2540,"Ġloan":2541,"Ġaware":2542,"ft":2543,"int":2544,"75":2545,"05":2546,"AY":2547,"ĠOut":2548,"Ġhair":2549,"ied":2550,"Ġseemed":2551,"ene":2552,"ty":2553,"NYSE":2554,"Ġoffensive":2555,"Ġtaxes":2556,"Ġinitial":2557,"ren":2558,"Ġseparate":2559,"la":2560,"ĠMiami":2561,"AC":2562,"Ġclearly":2563,"Ġfit":2564,"ĠCoast":2565,"Ġfirms":2566,"Ġpartners":2567,"Ġupcoming":2568,"Ġcold":2569,"Ġproposal":2570,"AT":2571,"Ġshut":2572,"ĠCommunity":2573,"Ġnature":2574,"ĠSal":2575,"Ġbottom":2576,"ting":2577,"ĠClick":2578,"Ġnice":2579,"ets":2580,"Ġhurt":2581,"itt":2582,"ama":2583,"Ġcarried":2584,"ĠCon":2585,"rd":2586,"Ġestate":2587,"ĠLas":2588,"ĠLaw":2589,"ng":2590,"Ġprotection":2591,"Ġproduce":2592,"Ġcurrency":2593,"Ġhappens":2594,"ĠPer":2595,"ney":2596,"ĠLong":2597,"Ġfellow":2598,"Ġcuts":2599,"Ġreading":2600,"ano":2601,"Ġproud":2602,"ost":2603,"ĠUN":2604,"ĠArizona":2605,"AD":2606,"Ġhelps":2607,"Ġwinter":2608,"Ġfinding":2609,"ĠGold":2610,"att":2611,"ĠWhy":2612,"Ġbasketball":2613,"lin":2614,"ĠCan":2615,"ĠBowl":2616,"ial":2617,"ĠAlex":2618,"200":2619,"AM":2620,"Ġpresence":2621,"Ġproduced":2622,"Ġdeveloping":2623,"Ġregarding":2624,"Ġdebate":2625,"Ġvice":2626,"ĠItaly":2627,"Ġsu":2628,"its":2629,"ator":2630,"Ġ34":2631,"Ġcomplex":2632,"Ġpresented":2633,"Ġresearchers":2634,"Ġslow":2635,"ya":2636,"Ġsanctions":2637,"Ġloved":2638,"Ġseek":2639,"Ġresponsibility":2640,"Ġadmitted":2641,"Ġalbum":2642,"Ġsolutions":2643,"Ġfacilities":2644,"ett":2645,"ĠGu":2646,"ĠWell":2647,"Ġlawmakers":2648,"Ġmiss":2649,"ful":2650,"ĠNick":2651,"'.":2652,"Ġfeels":2653,"Ġprime":2654,"Ġknowledge":2655,"Ġdeals":2656,"ĠTaylor":2657,"Ġsurvey":2658,"ĠFrancisco":2659,"Ġjoint":2660,"Ġwhom":2661,"Ġsit":2662,"01":2663,"Ġtr":2664,"Ġorganizations":2665,"ĠAvenue":2666,"ĠTheir":2667,"ĠTim":2668,"Ġrally":2669,"game":2670,"Ġbigger":2671,"Ġlawsuit":2672,"Ġrecorded":2673,"Ġfavorite":2674,"yard":2675,"Ġtransaction":2676,"Ġqu":2677,"oh":2678,"Ġinteresting":2679,"Ġinflation":2680,"ath":2681,"Ġstuff":2682,"Ġindustrial":2683,"ico":2684,"TS":2685,"Ġspeaking":2686,"Ġlosses":2687,"ID":2688,"ĠStadium":2689,"Ġstars":2690,"ĠWomen":2691,"ĠBlue":2692,"Ġwins":2693,"Ġdes":2694,"Ġcompetitive":2695,"ters":2696,"Ġpounds":2697,"Ġdirection":2698,"Ġinnings":2699,"ĠBest":2700,"Ġactor":2701,"Ġdangerous":2702,"Ġrequire":2703,"Ġplus":2704,"Ġsolid":2705,"Ġgeneration":2706,"Ġstrength":2707,"ĠMary":2708,"For":2709,"Ġplenty":2710,"ĠTeam":2711,"Ġinfluence":2712,"Ġfaced":2713,"Ġes":2714,"ĠIslamic":2715,"let":2716,"ĠDevelopment":2717,"Ġpath":2718,"Ġyouth":2719,"Ġcommitment":2720,"Ġbeautiful":2721,"ĠJack":2722,"ort":2723,"Ġten":2724,"Ġattend":2725,"ars":2726,"ón":2727,"Ġviews":2728,"Ġeuros":2729,"Ġauthor":2730,"Ġcore":2731,"Ġsupporters":2732,"ĠiPhone":2733,"Ġfashion":2734,"Ġsmaller":2735,"Ġelected":2736,"Ġuniversity":2737,"Ġpicked":2738,"wa":2739,"Ġordered":2740,"ĠSc":2741,"ĠÅ":2742,"Ġlargely":2743,"+":2744,"ĠAttorney":2745,"Ġpaying":2746,"AR":2747,"Ġconnection":2748,"Ġsetting":2749,"Ġna":2750,"ĠRock":2751,"Ġrecovery":2752,"ew":2753,"Ġserving":2754,"Ġsurprise":2755,"Ġoccurred":2756,"Ġdivision":2757,"Ġtelling":2758,"Ġmargin":2759,"Ġ2020":2760,"Ġsister":2761,"ĠNBA":2762,"Ġvoted":2763,"Ġcon":2764,"By":2765,"Ġ49":2766,"Ġfoot":2767,"ü":2768,"ĠTurkey":2769,"Ġamazing":2770,"Ġcombined":2771,"Ġappearance":2772,"Ġeasily":2773,"DAY":2774,"Ġnotes":2775,"ĠStart":2776,"Ġlanguage":2777,"Ġextremely":2778,"Ġcloudy":2779,"ĠLet":2780,"Ġdelivered":2781,"Ġimproved":2782,"Ġcollection":2783,"ĠPM":2784,"Ġestimates":2785,"Ġboys":2786,"izing":2787,"Ġtext":2788,"Ġcloser":2789,"Ġprotest":2790,"Ġprovince":2791,"Ġshop":2792,"Ġsmart":2793,"de":2794,"ĠSheriff":2795,"EN":2796,"Ġcorner":2797,"Ġpanel":2798,"Ġbooks":2799,"Ġsupported":2800,"Ġmentioned":2801,"ver":2802,"ĠMinistry":2803,"ĠPrince":2804,"ĠUSA":2805,"Ġreceiving":2806,"Ġchoose":2807,"ĠIN":2808,"ĠSpain":2809,"Ġsection":2810,"Ġconsidering":2811,"ĠCor":2812,"Ġwish":2813,"Ġwelcome":2814,"ĠConference":2815,"ere":2816,"ĠOfficer":2817,"Ġhoping":2818,"Ġportfolio":2819,"Ġstandards":2820,"Ġgrand":2821,"ĠReal":2822,"Ġsecure":2823,"ĠCorporation":2824,"ĠRep":2825,"ĠKelly":2826,"Ġstreets":2827,"Ġsitting":2828,"Ġslightly":2829,"ĠInvestment":2830,"99":2831,"ond":2832,"Ġunits":2833,"Ġvotes":2834,"Ġsegment":2835,"Ġchampionship":2836,"Ġsquad":2837,"iting":2838,"ron":2839,"®":2840,"Ġem":2841,"Ġtouch":2842,"Ġ38":2843,"Ġceremony":2844,"Ġdecide":2845,"Ġapproval":2846,"So":2847,"ĠPort":2848,"Ġsub":2849,"Ġsc":2850,"Ġrep":2851,"ĠWeek":2852,"Ġupper":2853,"Ġagree":2854,"ny":2855,"Ġmatches":2856,"ics":2857,"Ġtweeted":2858,"Ġheat":2859,"ĠGreat":2860,"Ġpenalty":2861,"Ġmass":2862,"Ġalongside":2863,"Ġherself":2864,"berg":2865,"Ġscience":2866,"Ġentered":2867,"Ġappeal":2868,"ĠPr":2869,"Ġfile":2870,"che":2871,"ĠReport":2872,"ĠThree":2873,"ĠNorthern":2874,"ĠJordan":2875,"Ġamid":2876,"Ġpace":2877,"Ġjail":2878,"Ġfinance":2879,"ĠYoung":2880,"32":2881,"Ġwilling":2882,"Ġconduct":2883,"ĠPar":2884,"Ġestablished":2885,"Ġreturns":2886,"Ġaid":2887,"Ġinternet":2888,"IA":2889,"29":2890,"Ġmeetings":2891,"Ġwarning":2892,"ĠCl":2893,"Ġcampus":2894,"Most":2895,"ĠFund":2896,"ĠWilliam":2897,"ĠJapanese":2898,"Ġconsensus":2899,"Ġbrain":2900,"!\"":2901,"Ġpoll":2902,"Ġtech":2903,"Ġtrend":2904,"Ġpotentially":2905,"Ġreduced":2906,"ĠShow":2907,"Ġ37":2908,"Ġhappening":2909,"ĠBrazil":2910,"pl":2911,"ĠCal":2912,"Ġcovered":2913,"Ġenter":2914,"TV":2915,"Ġcatch":2916,"foot":2917,"Ġunion":2918,"Ġexpansion":2919,"ĠSingapore":2920,"ĠDetroit":2921,"Ġattended":2922,"ats":2923,"Ġnewspaper":2924,"ĠDivision":2925,"news":2926,"Ġcap":2927,"Ġremoved":2928,"Ġ48":2929,"ĠRoyal":2930,"Ġwindow":2931,"Ġparking":2932,"Ġdark":2933,"Ġstanding":2934,"Ġupdate":2935,"Ġagent":2936,"Ġtransfer":2937,"ĠArmy":2938,"Ġuses":2939,"80":2940,"ĠTe":2941,"Ġintroduced":2942,"Ġmale":2943,"ĠSouthern":2944,"Ġratings":2945,"Ġisland":2946,"ĠMiller":2947,"Ġteachers":2948,"Ġadvice":2949,"Ġfamiliar":2950,"uf":2951,"Ġsought":2952,"Ġpor":2953,"ĠEric":2954,"Ġda":2955,"Ġideas":2956,"uh":2957,"Ġsixth":2958,"Ġtalent":2959,"ĠImage":2960,"ering":2961,"run":2962,"ments":2963,"Ġconducted":2964,"300":2965,"Ġurged":2966,"Ġdiscovered":2967,"Ġpl":2968,"Ġunderstanding":2969,"Ġoffense":2970,"Ġsecretary":2971,"Ġsk":2972,"Ġloans":2973,"ĠGr":2974,"Ġapplications":2975,"Ġcrude":2976,"go":2977,"ĠInstead":2978,"Ġopinion":2979,"Ġdoubt":2980,"ey":2981,"Ġdis":2982,"31":2983,"Ġexperienced":2984,"Ġleg":2985,"ĠCleveland":2986,"ven":2987,"Ġfailure":2988,"market":2989,"ack":2990,"Ġdecline":2991,"Ġchanging":2992,"Ġ300":2993,"Ġdefence":2994,"ĠBrian":2995,"Ġdelivery":2996,"Ġmarried":2997,"Ġdeclared":2998,"Ġpull":2999,"Ġlimit":3000,"ĠMORE":3001,"Ġdefeat":3002,"Ġexpand":3003,"ĠColorado":3004,"ĠRob":3005,"iss":3006,"Ġworse":3007,"Ġperform":3008,"ising":3009,"Ġ2007":3010,"ĠDel":3011,"Ġsurgery":3012,"Ġeasier":3013,"Ġmaintain":3014,"ĠEx":3015,"Ġtied":3016,"Ġeast":3017,"Ġuser":3018,"ola":3019,"Ġprogramme":3020,"Ġmanufacturing":3021,"Ġhitting":3022,"Ġx":3023,"Ġskin":3024,"Ġartist":3025,"Ġtells":3026,"Ġnearby":3027,"ĠDaniel":3028,"ĠPower":3029,"Ġdetermined":3030,"Ġactual":3031,"Ġtreated":3032,"Ġlived":3033,"Ġcomputer":3034,"Ġcool":3035,"oo":3036,"ĠPl":3037,"Ġeffects":3038,"Ġenvironmental":3039,"ĠMorgan":3040,"Ġflow":3041,"Ġachieve":3042,"ĠBell":3043,"Ġtesting":3044,"ĠBob":3045,"Ġwhatever":3046,"ĠBecause":3047,"US":3048,"ĠHollywood":3049,"Ġconflict":3050,"Ġwalking":3051,"ĠJudge":3052,"ĠAlabama":3053,"Ġaircraft":3054,"Ġte":3055,"well":3056,"Ġgoods":3057,"Ġidentify":3058,"Ġassociated":3059,"ĠVer":3060,"ĠEducation":3061,"Ġairport":3062,"IL":3063,"Ġfalling":3064,"Ġgiant":3065,"ĠMa":3066,"ĠMedical":3067,"Ġride":3068,"Ġden":3069,"º":3070,"ĠJose":3071,"Ġwest":3072,"ĠPacific":3073,"Ġvisitors":3074,"ĠWatch":3075,"ĠNations":3076,"Ġgains":3077,"Ġschedule":3078,"34":3079,"ĠExchange":3080,"Ġpayments":3081,"ĠII":3082,"70":3083,"No":3084,"ĠSyrian":3085,"ĠAdam":3086,"Ġne":3087,"Ġpartnership":3088,"Ġbl":3089,"ĠGeorgia":3090,"Ġsites":3091,"Ġmodels":3092,"Ġdegree":3093,"Ġdetermine":3094,"ĠWilson":3095,"Ġcontest":3096,"Ġprofessor":3097,"ĠChelsea":3098,"Ġmeaning":3099,"ĠGames":3100,"ĠTrust":3101,"ĠAsian":3102,"33":3103,"Ġlink":3104,"ĠUp":3105,"Ġholds":3106,"ĠTop":3107,"ĠItalian":3108,"ord":3109,"ĠKansas":3110,"Ġfarmers":3111,"Ġextended":3112,"Ġbirth":3113,"Ġreform":3114,"Ġrelations":3115,"Ġwrite":3116,"Ġsupporting":3117,"55":3118,"ita":3119,"Ġnotice":3120,"ster":3121,"Ġanimals":3122,"ĠJersey":3123,"Ġarm":3124,"ĠForeign":3125,"ĠLife":3126,"Ġtruly":3127,"ĠOnce":3128,"ĠMayor":3129,"ĠFree":3130,"ĠAgency":3131,"ĠWood":3132,"Ġpassing":3133,"DA":3134,"Ġ52":3135,"Ġmoves":3136,"Ġcom":3137,"house":3138,"ĠIts":3139,"Ġmarijuana":3140,"ines":3141,"Ġveteran":3142,"Ġvariety":3143,"ki":3144,"ff":3145,"amb":3146,"Ġlisted":3147,"Ġpushed":3148,"Ġvolume":3149,"Ġincreasingly":3150,"Ġkick":3151,"Ġrock":3152,"ank":3153,"Ġfees":3154,"Ġenable":3155,"Ġimages":3156,"Ġtruth":3157,"Ġministry":3158,"Ġrare":3159,"ĠDallas":3160,"ĠMinnesota":3161,"Ġcontributed":3162,"ĠCharles":3163,"Ġpercentage":3164,"Ġtechnical":3165,"ĠApp":3166,"Ġassistant":3167,"Ġinterests":3168,"Ġimmediate":3169,"38":3170,"ĠTown":3171,"Ġclosing":3172,"ĠAnthony":3173,"Ġsouthern":3174,"ase":3175,"ĠPutin":3176,"ĠForce":3177,"ba":3178,"Ġrefused":3179,"ĠStill":3180,"ix":3181,"ĠCol":3182,"Ġmaterials":3183,"Ġstructure":3184,"Ġdriven":3185,"Ġpatient":3186,"Ġbroken":3187,"Ġradio":3188,"Ġscale":3189,"Ġreplace":3190,"Ġ39":3191,"ĠLand":3192,"Ġdeputy":3193,"und":3194,"Ġcolor":3195,"OS":3196,"Ġroads":3197,"Ġcorruption":3198,"ĠRose":3199,"Ġemployee":3200,"ĠWater":3201,"Ġseats":3202,"Ġwalked":3203,"ec":3204,"Ġcents":3205,"Ġchain":3206,"Ġpayment":3207,"ĠAndroid":3208,"eb":3209,"Ġcommission":3210,"Ġthrow":3211,"Ġcount":3212,"Ġaccident":3213,"Ġexpensive":3214,"ered":3215,"ĠYes":3216,"ĠLouis":3217,"Ġstudies":3218,"Ġinvestigating":3219,"Ġcentury":3220,"Ġdiscussion":3221,"Ġinter":3222,"DAQ":3223,"ĠBefore":3224,"Ġinitially":3225,"*":3226,"Ġinvestments":3227,"Ġmulti":3228,"Ġtight":3229,"Ġconfident":3230,"Ġcounter":3231,"ĠQu":3232,"Ġgovernments":3233,"Ġarmed":3234,"Ġsuit":3235,"Ġrow":3236,"Ġlocations":3237,"Ġepisode":3238,"itch":3239,"Ġyounger":3240,"Ġfestival":3241,"Ġpitch":3242,"ĠOF":3243,"Ġtalked":3244,"ca":3245,"Ġprotests":3246,"Ġtargets":3247,"90":3248,"Ġoriginally":3249,"Ġsinger":3250,"Ġjourney":3251,"ug":3252,"Ġapply":3253,"Ġteacher":3254,"Ġchances":3255,"):":3256,"Ġdeaths":3257,"isation":3258,"ĠStephen":3259,"Ġcode":3260,"ĠChampionship":3261,"ĠJason":3262,"ĠAT":3263,"Ġaccept":3264,"ĠSeries":3265,"Ġvalues":3266,"Ġbed":3267,"ĠHarry":3268,"Ġflat":3269,"Ġtools":3270,"Ġpublicly":3271,"37":3272,"Ġpointed":3273,"ĠGolden":3274,"ps":3275,"Ġunable":3276,"ants":3277,"Ġestimate":3278,"Ġwarm":3279,"Ġbasic":3280,"ern":3281,"Ġraising":3282,"ĠRelated":3283,"Ġultimately":3284,"Ġnorthern":3285,"Ġplane":3286,"ĠVice":3287,"ĠRaj":3288,"ĠJustin":3289,"anc":3290,"Ġbrings":3291,"ĠArt":3292,"OT":3293,"Ġshift":3294,"ĠBBC":3295,"ĠSu":3296,"BS":3297,"Ġbag":3298,"Ġdoctor":3299,"Ġfill":3300,"Ġdowntown":3301,"Ġpossibility":3302,"ĠAg":3303,"Ġest":3304,"44":3305,"Ġstruggling":3306,"Ġlinked":3307,"Ġtickets":3308,"ĠJay":3309,"ĠCall":3310,"Ġstands":3311,"Ġwedding":3312,"Ġresident":3313,"eng":3314,"Ġleads":3315,"Ġadvance":3316,"ĠAtlanta":3317,"Ġtie":3318,"Ġadvanced":3319,"pt":3320,"burg":3321,"ĠEarlier":3322,"ĠSw":3323,"ĠZealand":3324,"Ġexercise":3325,"ĠAM":3326,"Ġaffect":3327,"Ġpossession":3328,"Ġinvolving":3329,"Ġ42":3330,"Ġwriter":3331,"ĠBeijing":3332,"Ġdoctors":3333,"Ġobviously":3334,"Ġer":3335,"ĠOlympic":3336,"Ġ75":3337,"ĠKhan":3338,"ĠFort":3339,"app":3340,"like":3341,"Ġsea":3342,"ock":3343,"Ġmix":3344,"ĠIraq":3345,"ĠMuslim":3346,"ĠFinally":3347,"Ġcontinuing":3348,"Ġpr":3349,"ĠKe":3350,"ĠJoseph":3351,"Ġexpects":3352,"Ġinstitutions":3353,"Ġconservative":3354,"own":3355,"ĠChairman":3356,"Ġreturning":3357,".-":3358,"Ġstood":3359,"Ġvision":3360,"ess":3361,"Ġadults":3362,"Ġyield":3363,"Ġprove":3364,"Ġorders":3365,"Ġdream":3366,"36":3367,"related":3368,"Ġsl":3369,"Ġeverybody":3370,"ui":3371,"Ġrepresents":3372,"Ġdiscussed":3373,"Ġbecomes":3374,"Ġvillage":3375,"CC":3376,"Ġnegotiations":3377,"ĠPhiladelphia":3378,"Ġcelebrate":3379,"Ġfarm":3380,"ç":3381,"Ġregistered":3382,"ĠGovernor":3383,"OL":3384,"ĠMon":3385,"Ġfiling":3386,"04":3387,"SE":3388,"ĠAssembly":3389,"Ġactress":3390,"Ġsi":3391,"Ġthank":3392,"Ġheading":3393,"ĠWho":3394,"Ġfamous":3395,"Ġconsecutive":3396,"Ġmarriage":3397,"ette":3398,"NAS":3399,"acks":3400,"ĠPlease":3401,"ĠDiego":3402,"Ġbaseball":3403,"ĠMoore":3404,"Ġties":3405,"Ġcarrying":3406,"que":3407,"Ġturning":3408,"ĠMcC":3409,"ĠKen":3410,"OR":3411,"ĠStock":3412,"Ġbuildings":3413,"49":3414,"ĠVan":3415,"39":3416,"ĠSeattle":3417,"Ġwild":3418,"Ġcrew":3419,"Ġroute":3420,"ĠTime":3421,"Ġtonight":3422,"Ġmoments":3423,"Ġvideos":3424,"Ġinternal":3425,"ĠLiverpool":3426,"port":3427,"Ġchair":3428,"Ġrival":3429,"ĠScotland":3430,"round":3431,"ith":3432,"Ġbreaking":3433,"Ġvoting":3434,"ically":3435,"Ġproducer":3436,"ĠLove":3437,"Ġremove":3438,"PA":3439,"Ġasset":3440,"Ġrequires":3441,"Ġsigning":3442,"ages":3443,"Ġimpressive":3444,"ĠIrish":3445,"Ġauthority":3446,"Ġruled":3447,"Ġaimed":3448,"Ġcaptain":3449,"AG":3450,"Ġplants":3451,"ĠAnderson":3452,"ĠSpanish":3453,"Ġbanking":3454,"Ġthreats":3455,"Ġsuspended":3456,"Ġtests":3457,"Ġreligious":3458,"Ġelectric":3459,"ĠREAD":3460,"Ġstrategic":3461,"Ġsplit":3462,"ex":3463,"Ġpractices":3464,"ĠIsraeli":3465,"ĠArabia":3466,"ĠMoscow":3467,"Ġfranchise":3468,"Ġcustody":3469,"ĠOld":3470,"Ġrequirements":3471,"Ġquarterly":3472,"Ġcomfortable":3473,"Ġcrimes":3474,"Ġheaded":3475,"Ġnewsletter":3476,"Ġanimal":3477,"Ġregulations":3478,"long":3479,"ĠCNN":3480,"Ġassists":3481,"Ġshopping":3482,"ĠGov":3483,"ĠSecurities":3484,"Ġassistance":3485,"Ġnor":3486,"Ġrelatively":3487,"Ġincreases":3488,"Ġgenerally":3489,"Ġ55":3490,"Ġgained":3491,"Ġ41":3492,"Ġpictures":3493,"gan":3494,"Ġpop":3495,"Ġupdates":3496,"ĠRepublic":3497,"Ġrebounds":3498,"ĠPatrick":3499,"Ġrelief":3500,"Ġacting":3501,"ĠFestival":3502,"Ġ2006":3503,"Ġboss":3504,"Ġtypes":3505,"65":3506,"ĠYet":3507,"Ġpurpose":3508,"ning":3509,"Ġmatters":3510,"Ġcompete":3511,"ball":3512,"ĠRam":3513,"Ġsw":3514,"ĠFollowing":3515,"ĠBush":3516,"Ġtroops":3517,"Ġsupposed":3518,"Ġfreedom":3519,"Ġfeatured":3520,"Ġstorage":3521,"ĠInformation":3522,"ĠHong":3523,"Ġgolf":3524,"Ġagents":3525,"Ġfraud":3526,"Ġminimum":3527,"Ġartists":3528,"Ġeat":3529,"high":3530,"ĠFormer":3531,"ĠKong":3532,"ĠJosh":3533,"ĠDelhi":3534,"Ġshowers":3535,"ĠAcademy":3536,"Ġapartment":3537,"Ġvan":3538,"Ġfish":3539,"oe":3540,"Ġfilms":3541,"ĠBo":3542,"Ġedge":3543,"Ġpossibly":3544,"Ġtweet":3545,"09":3546,"Ġresolution":3547,"jo":3548,"Ġkill":3549,"Ġ44":3550,"Ġcell":3551,"Ġscheme":3552,"Ġth":3553,"Ġbonds":3554,"Ġentry":3555,"Ġsecret":3556,"Ġ43":3557,"Ġending":3558,"Ġweren":3559,"ĠCredit":3560,"ĠLive":3561,"Ġretired":3562,"Ġmachine":3563,"Ġsummit":3564,"Ġsharing":3565,"Ġacquired":3566,"Ġera":3567,"Ġwear":3568,"ical":3569,"07":3570,"Ġexciting":3571,"li":3572,"BC":3573,"ĠSocial":3574,"Ġhistoric":3575,"ĠChe":3576,"ĠLewis":3577,"ira":3578,"Ġstolen":3579,"ĠSpeaking":3580,"Ġsleep":3581,"Ġspokeswoman":3582,"week":3583,"Ġpurchased":3584,"Ġimportance":3585,"EC":3586,"Ġends":3587,"Ġdress":3588,"Ġparliament":3589,"ĠCruz":3590,"Ġcards":3591,"hi":3592,"ĠEmail":3593,"Ġrepresent":3594,"Ġbrands":3595,"ĠSenior":3596,"Ġparticipants":3597,"Ġfly":3598,"Ġidentity":3599,"ĠHam":3600,"ĠSky":3601,"ij":3602,"SA":3603,"Ġpromised":3604,"Ġtrouble":3605,"Ġsuffering":3606,"Ġleaves":3607,"Ġsuggest":3608,"Sh":3609,"Ġbusy":3610,"Ġproperties":3611,"Ġworldwide":3612,"Ġcloud":3613,"ĠSEC":3614,"Ġclosely":3615,"Ġmanage":3616,"Ġnumerous":3617,"Ġbackground":3618,"ĠExpress":3619,"Ġ65":3620,"ĠTony":3621,"ĠMadrid":3622,"ev":3623,"der":3624,"Ġsignificantly":3625,"Ġalternative":3626,"Ġship":3627,"head":3628,"ators":3629,"Ġdinner":3630,"ax":3631,"SC":3632,"Ġcriticism":3633,"ĠMah":3634,"ĠMin":3635,"rie":3636,"ĠTour":3637,"Ġbench":3638,"Ġadds":3639,"Ġseriously":3640,"star":3641,"ĠJournal":3642,"ĠDi":3643,"ali":3644,"Ġsentence":3645,"ĠSeveral":3646,"Ġmayor":3647,"ati":3648,"Ġsuggests":3649,"Ġbehavior":3650,"Ġstronger":3651,"ĠFood":3652,"Ġclient":3653,"not":3654,"ĠPrice":3655,"Ġtargeted":3656,"ĠSingh":3657,"ĠNetwork":3658,"Ġprosecutors":3659,"Ġdirected":3660,"ĠDemocrat":3661,"bl":3662,"ues":3663,"ĠFamily":3664,"Ġconnected":3665,"ĠChampions":3666,"Ġroughly":3667,"Ġabsolutely":3668,"08":3669,"Ġpassengers":3670,"ö":3671,"ĠSpecial":3672,"Ġcoast":3673,"Ġcomplaint":3674,"Ġ400":3675,"ĠEm":3676,"ves":3677,"Ġdogs":3678,"Ġhandle":3679,"Ġotherwise":3680,"Ġsees":3681,"Ġticket":3682,"ĠAward":3683,"All":3684,"Ġtask":3685,"Ġsongs":3686,"ĠAmong":3687,"Ġdedicated":3688,"Ġsteel":3689,"looking":3690,"Ġshortly":3691,"Ġtackle":3692,"ative":3693,"Ġminor":3694,"â":3695,"Ġprovider":3696,"vers":3697,"use":3698,"ives":3699,"Ġtypically":3700,"Ġarms":3701,"ĠAnt":3702,"ĠIS":3703,"Ġjump":3704,"Ġ©":3705,"47":3706,"aff":3707,"Ġmonthly":3708,"ĠMicrosoft":3709,"ĠCBS":3710,"Ġthreatened":3711,"Ġhonor":3712,"ĠMo":3713,"42":3714,"Ġinning":3715,"Ġpool":3716,"Ġhealthcare":3717,"ĠStory":3718,"ĠTennessee":3719,"Ġpromote":3720,"EL":3721,"Ġemotional":3722,"Ġpe":3723,"Ġfactor":3724,"Ġinvestigators":3725,"Ľ":3726,"ĠBack":3727,"ĠProject":3728,"Ġcu":3729,"side":3730,"Ġmessages":3731,"TH":3732,"eg":3733,"Ġexperiences":3734,"Ġcausing":3735,"Ġjoining":3736,"Ġpackage":3737,"Ġbodies":3738,"Ġlots":3739,"ĠHarris":3740,"Ġcl":3741,"ĠInternet":3742,"free":3743,"Ġperformed":3744,"Ġpieces":3745,"buy":3746,"Ġcaption":3747,"Ġweb":3748,"Ġcontracts":3749,"At":3750,"Ġattempted":3751,"Ġunlikely":3752,"Ġclick":3753,"Ġinvest":3754,"IM":3755,"ĠView":3756,"Ġneighborhood":3757,"Ġring":3758,"ĠFour":3759,"ail":3760,"46":3761,"One":3762,"Ġnative":3763,"CH":3764,"OM":3765,"Ġalcohol":3766,"ĠVal":3767,"Ġcharacters":3768,"ĠPat":3769,"Ġpoliticians":3770,"ĠMag":3771,"Ġbegins":3772,"ĠAk":3773,"Ġlos":3774,"Ġpersonnel":3775,"Ġenjoyed":3776,"ĠTechnology":3777,"Ġsun":3778,"ĠIT":3779,"Ġdocument":3780,"Ġdeficit":3781,"Ġcoalition":3782,"Ġmemory":3783,"Ġpushing":3784,"any":3785,"ified":3786,"Ġfounder":3787,"Ġ2000":3788,"2017":3789,"Ġvisited":3790,"ĠThough":3791,"ph":3792,"Ġsoft":3793,"Ġflag":3794,"Ġmom":3795,"inch":3796,"ĠSamsung":3797,"Ġapps":3798,"Ġtouchdown":3799,"ĠCare":3800,"ĠMrs":3801,"Ġredistributed":3802,"Ġencourage":3803,"ched":3804,"Ġtend":3805,"Ġregions":3806,"pp":3807,"IP":3808,"br":3809,"ush":3810,"Ġargued":3811,"Ġjunior":3812,"BA":3813,"Ġsevere":3814,"ĠNIGHT":3815,"Ġdef":3816,"Ġsurrounding":3817,"48":3818,"Ġengine":3819,"Ġfilled":3820,"Ġseventh":3821,"Ġbattery":3822,"ĠAllen":3823,"Ġguidance":3824,"Ġroll":3825,"Ġrural":3826,"Ġexpert":3827,"Ġconvicted":3828,"Ġlikes":3829,"ĠRo":3830,"Ġgrown":3831,"Ġretirement":3832,"Ġintended":3833,"Ġmis":3834,"Ġarmy":3835,"Ġdance":3836,"ĠThank":3837,"Ġent":3838,"Ġoutlook":3839,"Ġpara":3840,"Ġdry":3841,"ĠTO":3842,"era":3843,"Ġwaste":3844,"Ġfaster":3845,"ĠEagles":3846,"TA":3847,"ĠFrank":3848,"Ã":3849,"LE":3850,"ura":3851,"ko":3852,"ao":3853,"Ġdistribution":3854,"Ġimprovement":3855,"Ġplayoff":3856,"Ġacquisition":3857,"ĠCH":3858,"Ġtomorrow":3859,"Ġstruggle":3860,"ĠHuman":3861,"Ġnewly":3862,"oon":3863,"ĠNe":3864,"con":3865,"sc":3866,"Ġunless":3867,"Ġtransition":3868,"ten":3869,"ĠInter":3870,"Ġequal":3871,"Ġrec":3872,"Ġappointed":3873,"Ġwake":3874,"ĠEarth":3875,"ose":3876,"ĠEastern":3877,"Ġsoldiers":3878,"ĠParliament":3879,"Ġsets":3880,"Ġattempts":3881,"ĠIllinois":3882,"Ġrevenues":3883,"ĠWil":3884,"Ġheads":3885,"Ġprepare":3886,"Ġpriority":3887,"PS":3888,"ĠJo":3889,"ĠNBC":3890,"Ġtherefore":3891,"yn":3892,"Ġinitiative":3893,"ct":3894,"Ġcoffee":3895,"ĠFair":3896,"43":3897,"den":3898,"form":3899,"ova":3900,"Ġappropriate":3901,"ĠPlay":3902,"Ġaccepted":3903,"Ġcreative":3904,"Ġfollows":3905,"Ġrescue":3906,"Ġtree":3907,"With":3908,"ĠNetflix":3909,"ĠFootball":3910,"Ġsurprised":3911,"Ġlowest":3912,"800":3913,"amp":3914,"Ġworried":3915,"mar":3916,"ran":3917,"Ġvisiting":3918,"Ġselected":3919,"ĠMusic":3920,"ĠAnn":3921,"Ġexplain":3922,"ging":3923,"Ġwidely":3924,"Ġsquare":3925,"Ġtrends":3926,"Ġimproving":3927,"ĠHead":3928,"ĠQueen":3929,"ĠSociety":3930,"Ġcutting":3931,"ĠGOP":3932,"03":3933,"',":3934,"ET":3935,"ĠDrive":3936,"oll":3937,"ato":3938,"ĠSea":3939,"Ġjury":3940,"ĠRights":3941,"Ġinvestor":3942,"ĠABC":3943,"Ġtool":3944,"ĠAre":3945,"Ġrejected":3946,"Ġemerging":3947,"Ġcounts":3948,"Ġnations":3949,"Ġfalse":3950,"Ġtreat":3951,"va":3952,"Ġweak":3953,"ĠHighway":3954,"down":3955,"Ġstruggled":3956,"ĠMP":3957,"Ġguests":3958,"Ġgender":3959,"Ġhouses":3960,"rit":3961,"ĠWild":3962,"Ġstreak":3963,"uc":3964,"ĠReserve":3965,"ĠRatings":3966,"alt":3967,"Ġgreatest":3968,"Ġlawyers":3969,"Ġreaching":3970,"Ġtemperatures":3971,"To":3972,"Ġoutstanding":3973,"Ġpasses":3974,"Ġfaith":3975,"inc":3976,"Ġcr":3977,"Ġinformed":3978,"oz":3979,"Ġtrees":3980,"Ġsending":3981,"Ġ150":3982,"bo":3983,"Ġwine":3984,"ros":3985,"Ġsuspected":3986,"Ġrepeatedly":3987,"Ġhat":3988,"Ġshape":3989,"ĠWh":3990,"Ġassist":3991,"Ġstress":3992,"Ġfeed":3993,"ark":3994,"ored":3995,"Ġwatched":3996,"Ġincredible":3997,"cl":3998,"nt":3999,"Ġentertainment":4000,"ih":4001,"Ġbeauty":4002,"Ġbi":4003,"ĠLocal":4004,"Ġsat":4005,"41":4006,"Ġbroad":4007,"Ġheavily":4008,"Ġengaged":4009,"Ġspecifically":4010,"ĠMen":4011,"ĠRoss":4012,"Ġ2005":4013,"ST":4014,"95":4015,"Ġdownload":4016,"400":4017,"Ġsentenced":4018,"ĠCatholic":4019,"ĠOklahoma":4020,"Ġthrew":4021,"Ġworry":4022,"Ġimp":4023,"Ġdrove":4024,"Ġcolleagues":4025,"Ġagenda":4026,"64":4027,"ĠEach":4028,"Ġfee":4029,"New":4030,"ium":4031,"Ġspokesperson":4032,"Ġbills":4033,"Ġ47":4034,"ĠAfghanistan":4035,"Ġinvited":4036,"ĠYouTube":4037,"Ġanniversary":4038,"Ġdozen":4039,"ram":4040,"ĠOnly":4041,"Ġemployment":4042,"Getty":4043,"Ġgap":4044,"Ġsweet":4045,"ĠLittle":4046,"Ġinf":4047,"ying":4048,"Ġglass":4049,"Ġclasses":4050,"Ġcoal":4051,"ĠSub":4052,"Ġduty":4053,"CA":4054,"Ġcoaches":4055,"Â":4056,"anna":4057,"ĠSk":4058,"Ġ46":4059,"ison":4060,"ille":4061,"ĠST":4062,"ric":4063,"Ġparticipate":4064,"Ġequ":4065,"Ġrich":4066,"Ġrespectively":4067,"Ġexpenses":4068,"Ġcombination":4069,"right":4070,"Ġshareholders":4071,"Ġturns":4072,"Ġearn":4073,"Ġ51":4074,"ured":4075,"Ġdrink":4076,"ĠKar":4077,"ĠShares":4078,"ĠMid":4079,"ĠGetty":4080,"Ġbridge":4081,"lo":4082,"Ġinspired":4083,"Ġsurface":4084,"Ġgift":4085,"ence":4086,"Ġchallenging":4087,"Ġoffices":4088,"Ġsuspects":4089,"ĠFinance":4090,"Ġab":4091,"bound":4092,"Ġmomentum":4093,"Ġbacked":4094,"Ġparent":4095,"Ġcrucial":4096,"ave":4097,"Ġdealing":4098,"Ġregulatory":4099,"Ġapparently":4100,"ĠMat":4101,"Ġapart":4102,"Ġport":4103,"ole":4104,"Ġbeach":4105,"Ġcultural":4106,"Ġinstitutional":4107,"Ġbeating":4108,"ĠIowa":4109,"ĠAli":4110,"67":4111,"Ġje":4112,"ays":4113,"Ġweekly":4114,"Ġbirthday":4115,"Ġpipeline":4116,"Ġknee":4117,"Ġsolar":4118,"ĠPe":4119,"Ġcategory":4120,"ĠArea":4121,"ky":4122,"ures":4123,"06":4124,"ĠBall":4125,"Ġsemi":4126,"ĠHamilton":4127,"hip":4128,"ĠPh":4129,"ĠNext":4130,"Ġathletes":4131,"ii":4132,"Ġmovies":4133,"han":4134,"net":4135,"Ġplastic":4136,"Ġbehalf":4137,"gen":4138,"Ġfindings":4139,"Ġstretch":4140,"ĠSa":4141,"Ġofficially":4142,"ĠSarah":4143,"Ġprivacy":4144,"ĠMad":4145,"Ġnone":4146,"gh":4147,"On":4148,"Ġdrama":4149,"ĠFl":4150,"ika":4151,"ĠArsenal":4152,"Ġviolent":4153,"UN":4154,"called":4155,"59":4156,"Ġhate":4157,"Ġrelationships":4158,"Ġgranted":4159,"ĠJon":4160,"Ġlisten":4161,"season":4162,"Ġfewer":4163,"GA":4164,"ĠLabour":4165,"Ġremarks":4166,"ĠJonathan":4167,"ĠRos":4168,"sey":4169,"ĠOntario":4170,"ĠThompson":4171,"ĠNight":4172,"Ġranked":4173,"ĠUkraine":4174,"Ġimmigrants":4175,"Ġdegrees":4176,"ĠGe":4177,"Ġlabor":4178,"umb":4179,"ĠYORK":4180,"Ġallies":4181,"sp":4182,"hed":4183,"sw":4184,"Ġtariffs":4185,"SP":4186,"Ġclassic":4187,"Ġawards":4188,"ents":4189,"Ġfix":4190,"Ġsoccer":4191,"Ġconcert":4192,"ust":4193,"Ġadult":4194,"Ġoutput":4195,"Ġmanaging":4196,"02":4197,"Ġpromise":4198,"Ġawareness":4199,"Ġgross":4200,"Ġentering":4201,"Ġpo":4202,"oj":4203,"Ġmetal":4204,"Ġexit":4205,"Ġexcellent":4206,"Ġclubs":4207,"hold":4208,"Ġreplaced":4209,"ĠClass":4210,"Ġscientists":4211,"Ġprimarily":4212,"ĠMer":4213,"ão":4214,"Ġcircumstances":4215,"ades":4216,"Ġsupplies":4217,"aker":4218,"ĠSand":4219,"Ġscandal":4220,"Ġsettlement":4221,"ĠWisconsin":4222,"ĠWarriors":4223,"ĠAustin":4224,"Ġjournalists":4225,"ening":4226,"Ġreflect":4227,"ĠBuy":4228,"ĠAwards":4229,"Ġselection":4230,"ĠBel":4231,"bury":4232,"Ġtechnologies":4233,"%,":4234,"ime":4235,"ĠÄ":4236,"ĠAdministration":4237,"Ġchannel":4238,"Star":4239,"Ġtransport":4240,"Ġawarded":4241,"ena":4242,"Ġmotor":4243,"orn":4244,"kin":4245,"Ġfeaturing":4246,"Ġphones":4247,"ĠAND":4248,"Ġrelevant":4249,"ĠSee":4250,"Ġwinners":4251,"Ġdad":4252,"ĠSource":4253,"ĠCheck":4254,"aut":4255,"ĠFar":4256,"Ġopponents":4257,"Ġoutcome":4258,"Ġdoors":4259,"Ġsuicide":4260,"ima":4261,"Ġjumped":4262,"Ġperspective":4263,"Ġtransportation":4264,"Ġthinks":4265,"ĠMor":4266,"Ġdeadline":4267,"Ġ53":4268,"ĠDeputy":4269,"ery":4270,"Ġdetailed":4271,"uch":4272,"ĠBur":4273,"Ġtrades":4274,"ĠGreg":4275,"Ġzero":4276,"erson":4277,"ĠChildren":4278,"Ġdu":4279,"66":4280,"Ġmixed":4281,"ĠBarack":4282,"54":4283,"Ġterritory":4284,"Ġac":4285,"Ġconcept":4286,"ĠAdd":4287,"Ġourselves":4288,"Ġreaction":4289,"ĠSydney":4290,"ink":4291,"Ġconsistent":4292,"Ġboat":4293,"room":4294,"Ġdozens":4295,"Ġeffectively":4296,"but":4297,"Ġmotion":4298,"Ġalive":4299,"ĠKey":4300,"weight":4301,"Ġexports":4302,"Ġoperate":4303,"Ġregime":4304,"ĠAuthority":4305,"och":4306,"ĠCR":4307,"leg":4308,"Ġforget":4309,"American":4310,"bs":4311,"Ġthoughts":4312,"ĠSign":4313,"ĠPatriots":4314,"Ġbrief":4315,"ĠOregon":4316,"ĠBal":4317,"Ġmine":4318,"Ġciting":4319,"Ġmagazine":4320,"more":4321,"ERS":4322,"ĠBer":4323,"ua":4324,"ox":4325,"ĠMain":4326,"Ġinstance":4327,"tr":4328,"Ġrestaurants":4329,"ora":4330,"Ġharassment":4331,"\",\"":4332,"Ł":4333,"Ġsilver":4334,"ĠMueller":4335,"ĠSenator":4336,"ĠEvery":4337,"Ġfootage":4338,"ms":4339,"Ġopposed":4340,"ĠLink":4341,"Ġver":4342,"Ġpleased":4343,"ame":4344,"ending":4345,"Ġrivals":4346,"ida":4347,"ike":4348,"ta":4349,"ĠCook":4350,"Ġheadquarters":4351,"ear":4352,"Ġaggressive":4353,"Ġcourts":4354,"ĠMuseum":4355,"Ġim":4356,"ĠHoldings":4357,"Ġcommunication":4358,"Ġphase":4359,"yl":4360,"Ġpowers":4361,"Ġproved":4362,"Ġcarbon":4363,"Ġaside":4364,"ĠOlympics":4365,"Ġgathered":4366,"ĠPennsylvania":4367,"Ġsmartphone":4368,"ĠMet":4369,"ĠHurricane":4370,"Ġprotected":4371,"Ġcommunications":4372,"Ġemerged":4373,"Ġaim":4374,"Ġstable":4375,"ides":4376,"GB":4377,"Ġentirely":4378,"Ġmissile":4379,"ĠGen":4380,"Ġunclear":4381,"Ġelectricity":4382,"ology":4383,"away":4384,"Ġlicense":4385,"ĠPittsburgh":4386,"Ġcameras":4387,"Ġmusical":4388,"Ġmanagers":4389,"57":4390,"Ġscores":4391,"Ġprofile":4392,"hel":4393,"¼":4394,"Ġshouldn":4395,"RA":4396,");":4397,"Ġpermanent":4398,"ome":4399,"Ġet":4400,"Ġmar":4401,"Ġfavor":4402,"Ġmaker":4403,"Ġdiscussions":4404,"ory":4405,"Ġsharp":4406,"Ġpleaded":4407,"Ġpassenger":4408,"quarter":4409,"Ġdem":4410,"Ġversus":4411,"Ġmainly":4412,"Ġeighth":4413,"ĠAirport":4414,"ĠCross":4415,"million":4416,"ĠNas":4417,"Ġcited":4418,"56":4419,"Ġyes":4420,"ĠBelow":4421,"arn":4422,"ĠTurkish":4423,"ĠSl":4424,"Ġstepped":4425,"Ġproducers":4426,"Ġovernight":4427,"Ġsounds":4428,"52":4429,"Ġ64":4430,"Ġ54":4431,"58":4432,"ĠClark":4433,"ĠRick":4434,"Ġgr":4435,"ĠMont":4436,"Ġbeer":4437,"une":4438,"Ġreporter":4439,"Ġcharity":4440,"Ġeating":4441,"Ġextend":4442,"Ġguess":4443,"NA":4444,"Ġhedge":4445,"Ġencouraged":4446,"owned":4447,"ĠMel":4448,"ĠKentucky":4449,"ace":4450,"Ġlineup":4451,"Ġhosts":4452,"Ġcapable":4453,"PR":4454,"ĠArts":4455,"Ġcontroversial":4456,"Ġhosted":4457,"ries":4458,"Ġroster":4459,"Ġfixed":4460,"ĠWalker":4461,"ged":4462,"Ġdisaster":4463,"Ġdispute":4464,"ĠDenver":4465,"ĠTrade":4466,"ute":4467,"ese":4468,"cy":4469,"Ġgrant":4470,"ĠMax":4471,"Ġdistance":4472,"isc":4473,"Ġeditor":4474,"ĠDave":4475,"Ġperformances":4476,"Ġlay":4477,"Ġvulnerable":4478,"ĠMurray":4479,"ĠâĤ¬":4480,"Ġmining":4481,"Ġ2004":4482,"level":4483,"ability":4484,"Ġauto":4485,"Ġfake":4486,"Ġattacked":4487,"ona":4488,"ups":4489,"ened":4490,"Ġfallen":4491,"Ġstations":4492,"ĠContact":4493,"itz":4494,"Ġincidents":4495,"Ġcomplaints":4496,"Ġoperates":4497,"Ġrefugees":4498,"Ġessential":4499,"ĠTest":4500,"Ġdemands":4501,"Ġroles":4502,"yr":4503,"Ġacts":4504,"Ġusual":4505,"ring":4506,"Ġhanded":4507,"ĠMatthew":4508,"hour":4509,"Ġindustries":4510,"Ġshoot":4511,"ĠAuthorities":4512,"Ġprobe":4513,"ĠUtah":4514,"ĠRBI":4515,"ĠAD":4516,"Ġprospect":4517,"outs":4518,"ĠUber":4519,"Ġbright":4520,"Ġmention":4521,"Ġsavings":4522,"ĠMiss":4523,"ONDON":4524,"Ġ1990":4525,"arm":4526,"ĠTen":4527,"These":4528,"Ġexplains":4529,"minute":4530,"85":4531,"Ġmaximum":4532,"Ġro":4533,"Ġrookie":4534,"Ġstudio":4535,"ĠCam":4536,"ĠGal":4537,"Ġdefend":4538,"hand":4539,"53":4540,"ĠOil":4541,"Ġserves":4542,"Ġsn":4543,"ios":4544,"ĠDefense":4545,"AB":4546,"Ġhired":4547,"Ġsupports":4548,"Ġpremium":4549,"ef":4550,"Ġfailing":4551,"ĠIndiana":4552,"Ġexp":4553,"Ġobjective":4554,"Ġaffordable":4555,"ĠCom":4556,"ĠThanks":4557,"Ġanywhere":4558,"Ġconfirm":4559,"ited":4560,"Ġrepresenting":4561,"Ġwitness":4562,"69":4563,"Ġclaiming":4564,"Ġviolation":4565,"Ġhistorical":4566,"med":4567,"Ġpreparing":4568,"ĠTech":4569,"Ġposts":4570,"OC":4571,"ĠGraham":4572,"ĠGl":4573,"ĠLions":4574,"ales":4575,"ĠID":4576,"Ġcorrect":4577,"ĠAntonio":4578,"Ġadvertising":4579,"Ġeastern":4580,"OW":4581,"Ġholdings":4582,"Ġpolls":4583,"ĠSH":4584,"Ġexecutives":4585,"ĠJewish":4586,"ĠGary":4587,"Ġprize":4588,"ĠCommissioner":4589,"Ġcells":4590,"ify":4591,"Ġlunch":4592,"Ġdemocracy":4593,"ĠEr":4594,"Ġregularly":4595,"Ġresulted":4596,"ĠAve":4597,"ĠPartners":4598,"Ġrewritten":4599,"Ġlo":4600,"Ġcooperation":4601,"ĠGulf":4602,"Ġsmoke":4603,"ĠMemorial":4604,"Ġwave":4605,"Ġfears":4606,"Ġkid":4607,"ĠGiants":4608,"Ġrecovered":4609,"row":4610,"ĠRadio":4611,"ĠBarcelona":4612,"Ġwonderful":4613,"ĠDow":4614,"Ġstream":4615,"ĠSimon":4616,"Ġdetail":4617,"Ġvolunteers":4618,"ĠInd":4619,"Ġforms":4620,"mann":4621,"ĠRay":4622,"oor":4623,"ĠTake":4624,"Ġrepresented":4625,"het":4626,"Ġblow":4627,"aged":4628,"RE":4629,"ĠMissouri":4630,"Ġcovering":4631,"Ġprofits":4632,"Ġconcluded":4633,"Ġthus":4634,"ĠColumbia":4635,"ode":4636,"ĠZimbabwe":4637,"Ġdisclosed":4638,"Ġlifted":4639,"ĠSean":4640,"ĠHarvey":4641,"ĠPlus":4642,"ces":4643,"ĠGreece":4644,"ĠLady":4645,"Ġdelay":4646,"Ġkitchen":4647,"ĠIndex":4648,"Ġbear":4649,"Ġputs":4650,"new":4651,"88":4652,"ĠAsh":4653,"Å¡":4654,"Ġperforming":4655,"law":4656,"ĠPart":4657,"Ġindicated":4658,"Ġannounce":4659,"Ġcompensation":4660,"Ġka":4661,"ĠScience":4662,"ris":4663,"Ġrecommendations":4664,"ĠSecond":4665,"Ġlights":4666,"Ġtemporary":4667,"urs":4668,"Ġwestern":4669,"stone":4670,"68":4671,"ĠDisney":4672,"Ġplayoffs":4673,"Ġjudges":4674,"Ġengineering":4675,"ĠPen":4676,"ĠPal":4677,"Ġobvious":4678,"ĠBridge":4679,"ĠEnd":4680,"ĠArab":4681,"Ġexcept":4682,"Ġhole":4683,"class":4684,"Ġcauses":4685,"Ġconnect":4686,"ĠAI":4687,"An":4688,"Ġchose":4689,"ĠElizabeth":4690,"min":4691,"Ġproper":4692,"ĠNHL":4693,"Ġraces":4694,"Ġinnovation":4695,"Ġsugar":4696,"600":4697,"ĠModi":4698,"illa":4699,"Ġtrillion":4700,"ĠSar":4701,"ĠAffairs":4702,"Ġimpossible":4703,"Ġguide":4704,"Ġcaptured":4705,"ĠSales":4706,"Ġspecies":4707,"51":4708,"Ġar":4709,"Ġmaster":4710,"Ġstayed":4711,"iro":4712,"ĠEconomic":4713,"Ġvast":4714,"ili":4715,"Ġpet":4716,"ye":4717,"77":4718,"Ġkeeps":4719,"ĠPhil":4720,"ĠEPS":4721,"ĠRegional":4722,"Ġsectors":4723,"Ġdesire":4724,"ĠStanley":4725,"¾":4726,"Ġunknown":4727,"Ġpot":4728,"ĠPR":4729,"Ġknowing":4730,"Ġflying":4731,"ĠTreasury":4732,"iers":4733,"enn":4734,"ably":4735,"Ġsick":4736,"Ġmanner":4737,"Ġmanufacturers":4738,"Ġchampions":4739,"gy":4740,"Part":4741,"ister":4742,"ĠMountain":4743,"Ġimagine":4744,"Ġportion":4745,"ĠCamp":4746,"Ġchemical":4747,"ible":4748,"ĠAnaly":4749,"ĠBureau":4750,"Ġpm":4751,"Ġupdated":4752,"Ġetc":4753,"ĠField":4754,"iles":4755,"Ġobtained":4756,"Ġstick":4757,"Ġcat":4758,"har":4759,"Ġmarked":4760,"Ġmedium":4761,"ĠDes":4762,"People":4763,"Ġwealth":4764,"ores":4765,"ĠBaltimore":4766,"Ġtip":4767,"Ġdismissed":4768,"ĠVictoria":4769,"ĠBrad":4770,"Ch":4771,"Ġ56":4772,"Ġstadium":4773,"eth":4774,"Ġthunder":4775,"Ġtested":4776,"Ġdrawn":4777,"Ġcounsel":4778,"ld":4779,"Ġspirit":4780,"uss":4781,"Ġtheme":4782,"my":4783,"Ġnecessarily":4784,"Ġelements":4785,"Ġcollected":4786,"ĠRes":4787,"ĠMaryland":4788,"ĠEnter":4789,"Ġfounded":4790,"ae":4791,"Ġpilot":4792,"Ġshoulder":4793,"PC":4794,"Ġargument":4795,"Ġyen":4796,"Ġreceiver":4797,"Ġharm":4798,"ĠET":4799,"Ġprotesters":4800,"Ġ72":4801,"ĠAaron":4802,"Ġed":4803,"Ġexpecting":4804,"\":\"":4805,"Ġbike":4806,"Äĩ":4807,"Ġluxury":4808,"half":4809,"ĠBarbara":4810,"Ġfoundation":4811,"Ġill":4812,"Ġsubmitted":4813,"Ġdeeply":4814,"Ġhospitals":4815,"ĠBJP":4816,"Ġshock":4817,"Ġplatforms":4818,"Ġsummary":4819,"ĠWhere":4820,"Ġcelebration":4821,"iff":4822,"Ġveterans":4823,"Ġachieved":4824,"fl":4825,"Ġactivists":4826,"ĠManager":4827,"Ġformal":4828,"Ġformed":4829,"Ġinvestigate":4830,"ĠKyle":4831,"Ġ:":4832,"ĠRa":4833,"ovic":4834,"Ġdrinking":4835,"Ġnetworks":4836,"ĠAlexander":4837,"ĠOs":4838,"Ġ)":4839,"Ġbomb":4840,"Ġrecalled":4841,"ito":4842,"ient":4843,"Ġrepresentatives":4844,"ĠChrist":4845,"ĠWay":4846,"Ġdeadly":4847,"Ġinvesting":4848,"ĠRussell":4849,"Ġconsumption":4850,"Ġharder":4851,"Ġbail":4852,"Ġcritics":4853,"Ġdanger":4854,"Ġdrew":4855,"ĠSol":4856,"Ġcopyright":4857,"ĠHenry":4858,"Ġbuyers":4859,"Ġresidential":4860,"Ġmaintenance":4861,"pr":4862,"Ġmarks":4863,"Ġages":4864,"Ġcovers":4865,"Ġton":4866,"Ġtitles":4867,"ĠPS":4868,"ĠEvans":4869,"Ġmigrants":4870,"Ġflights":4871,"Ġmonitoring":4872,"Ġaddressed":4873,"Ġvital":4874,"Ġcontrolled":4875,"Ġweapon":4876,"Ġinches":4877,"Ġreduction":4878,"Ġurban":4879,"Ġcoaching":4880,"Ġreducing":4881,"ila":4882,"Ġrealize":4883,"Ġmeat":4884,"Ġref":4885,"Ġoverseas":4886,"Ġblame":4887,"Ġterrorist":4888,"Ġstuck":4889,"ĠUs":4890,"esh":4891,"pro":4892,"Ġ58":4893,"ough":4894,"Ġexposure":4895,"ĠAbu":4896,"state":4897,"Ġproviders":4898,"Ġfore":4899,"Ġjet":4900,"bar":4901,"Ġownership":4902,"ret":4903,"Ġupset":4904,"Ġfacts":4905,"Ġpurchasing":4906,"Ġreforms":4907,"Ġriver":4908,"Ġsomebody":4909,"Ġguest":4910,"iy":4911,"Ġauction":4912,"ĠReading":4913,"Ġconsequences":4914,"Ġrepresentative":4915,"Ġappointment":4916,"add":4917,"Ġcollaboration":4918,"ĠTesla":4919,"ĠCohen":4920,"Ġengagement":4921,"Ġspeaks":4922,"EST":4923,"Ġexposed":4924,"Ġmaintained":4925,"rs":4926,"Ġdating":4927,"ĠProgram":4928,"board":4929,"Ġracing":4930,"Ġpension":4931,"ign":4932,"iti":4933,"ĠFive":4934,"Ġextensive":4935,"ĠHa":4936,"ĠPoint":4937,"ĠMexican":4938,"Ġexpanded":4939,"Ġtotally":4940,"Ġinvestigations":4941,"ĠOrleans":4942,"Ġcycle":4943,"ĠESPN":4944,"ifying":4945,"Ġcup":4946,"ĠAz":4947,"ĠInvestors":4948,"Ġengage":4949,"reg":4950,"Ġfought":4951,"Ġterrorism":4952,"Ġblocked":4953,"ĠOK":4954,"Äį":4955,"72":4956,"Ġdestroyed":4957,"«":4958,"Ġstaying":4959,"Ġafford":4960,"Ġappearances":4961,"ĠHills":4962,"Ġcrore":4963,"Ġstrategies":4964,"Ġtips":4965,"ĠSm":4966,"ĠFr":4967,"Ġbanned":4968,"ĠSon":4969,"ask":4970,"Ġlimits":4971,"Ġrecognition":4972,"Ġeligible":4973,"ĠGar":4974,"Ġvolatility":4975,"Ġlaid":4976,"nes":4977,"Ġgrade":4978,"ĠRE":4979,"ĠHart":4980,"Ġ57":4981,"oma":4982,"Ġuncertainty":4983,"Ġrecognized":4984,"ĠPC":4985,"Ġchosen":4986,"uz":4987,"Ġadviser":4988,"una":4989,"Ġassessment":4990,"Ġreveal":4991,"mo":4992,"After":4993,"ĠBro":4994,"ĠOff":4995,"Ġpeak":4996,"Ġreferred":4997,"ĠSC":4998,"Ġ2003":4999,"ification":5000,"Ġshutdown":5001,"ĠOfficials":5002,"ias":5003,"Ġextreme":5004,"Ġflood":5005,"Ġhockey":5006,"Ġwage":5007,"ĠNet":5008,"Ġdamaged":5009,"Ġreplacement":5010,"ĠMaria":5011,"Ġcreation":5012,"Ġguns":5013,"aci":5014,"Ġworker":5015,"do":5016,"Ġviewers":5017,"Ġseed":5018,"sts":5019,"Ġtouchdowns":5020,"Ġmistake":5021,"ray":5022,"ull":5023,"Ġpricing":5024,"Ġstrongly":5025,"Ġaims":5026,"ĠNavy":5027,"ĠEgypt":5028,"ker":5029,"Ġve":5030,"ĠSteven":5031,"Ġres":5032,"ational":5033,"Ġrequests":5034,"Ġemissions":5035,"ĠArena":5036,"uma":5037,"ĠAtlantic":5038,"hr":5039,"ĠAFP":5040,"ĠSquare":5041,"Ġcontribute":5042,"Ġfunction":5043,"Ġdec":5044,"ĠNelson":5045,"89":5046,"Ġreferendum":5047,"ĠPre":5048,"Ġapplied":5049,"ĠGMT":5050,"ĠIranian":5051,"ĠNigerian":5052,"ĠAny":5053,"NG":5054,"Ġacknowledged":5055,"Ġreferring":5056,"Ġventure":5057,"Ġimports":5058,"Ġblog":5059,"Ġfutures":5060,"OU":5061,"ĠUFC":5062,"Ġneither":5063,"Ġextension":5064,"hes":5065,"ĠMed":5066,"76":5067,"Ġsustainable":5068,"ains":5069,"Ġreputation":5070,"ĠVancouver":5071,"Ġbasically":5072,"acy":5073,"Ġsad":5074,"ĠFrancis":5075,"ĠKennedy":5076,"ĠNevada":5077,"ĠLu":5078,"ras":5079,"ĠAv":5080,"Ġrear":5081,"ĠHo":5082,"Ġproperly":5083,"abe":5084,"ĠHotel":5085,"Ġopinions":5086,"under":5087,"ĠStation":5088,"ĠFOR":5089,"ops":5090,"Ġadopted":5091,"ĠSwiss":5092,"ĠCountry":5093,"ĠTer":5094,"ĠAndy":5095,"Me":5096,"ĠCooper":5097,"ĠTigers":5098,"ĠCreek":5099,"Ġgay":5100,"iner":5101,"ĠAN":5102,"Ġbird":5103,"lla":5104,"ĠKate":5105,"ĠPet":5106,"ni":5107,"Ġprospects":5108,"ater":5109,"ites":5110,"Ġescape":5111,"lam":5112,"ake":5113,"Ġ1980":5114,"ĠLag":5115,"Ġsuccessfully":5116,"Ġdistricts":5117,"Ġministers":5118,"aries":5119,"Ġframe":5120,"ĠON":5121,"ĠEuro":5122,"ĠMarkets":5123,"Ġregister":5124,"Ġdefeated":5125,"Ġdevelopments":5126,"Ġninth":5127,"Ġquiet":5128,"Ġgenerated":5129,"Ġvaluable":5130,"Ġrecommended":5131,"ĠTheatre":5132,"ĠCap":5133,"bed":5134,"Ġreference":5135,"Ġease":5136,"oring":5137,"Ġ66":5138,"Ġimprovements":5139,"Ġelsewhere":5140,"ĠHillary":5141,"Ġdefender":5142,"ĠRight":5143,"zy":5144,"Ġcomprehensive":5145,"Ġspotted":5146,"ĠOakland":5147,"ĠOk":5148,"ĠSystem":5149,"ique":5150,"Ġpersons":5151,"Ġexist":5152,"Ġbroader":5153,"Ġclinical":5154,"Ġ2001":5155,"oul":5156,"Ġsecurities":5157,"ghan":5158,"Ġshelter":5159,"ero":5160,"ATED":5161,"Ġhosting":5162,"Ġselect":5163,"ĠKavanaugh":5164,"Ġrestrictions":5165,"osa":5166,"Ġyields":5167,"ĠLA":5168,"Ġ59":5169,"Ġwonder":5170,"Ġabsence":5171,"ür":5172,"ÅĤ":5173,"DP":5174,"Ġelectronic":5175,"Ġillegally":5176,"Ġmicro":5177,"ĠNEW":5178,"Ġhall":5179,"Ġaged":5180,"Ġtemperature":5181,"cast":5182,"atic":5183,"Ġlegacy":5184,"Ġaffairs":5185,"ji":5186,"ĠResources":5187,"Ġgang":5188,"winning":5189,"Ġattending":5190,"aro":5191,"Ġfriendly":5192,"aine":5193,"Ġcannabis":5194,"Ġairline":5195,"Ġnoting":5196,"Ġprofessionals":5197,"ĠFREE":5198,"RC":5199,"Ġfinancing":5200,"Ġindependence":5201,"ved":5202,"Ġresulting":5203,"Ġsteady":5204,"ĠWinter":5205,"uring":5206,"Ġhoped":5207,"98":5208,"Ġpresentation":5209,"aya":5210,"Ġrated":5211,"osh":5212,"ĠAnalysis":5213,"=":5214,"Ġdonations":5215,"IR":5216,"Ġcombat":5217,"ĠHoward":5218,"anda":5219,"79":5220,"Ġinvested":5221,"Ġexpanding":5222,"omb":5223,"ress":5224,"ble":5225,"Ġjournalist":5226,"ĠWoods":5227,"Ġcenters":5228,"ott":5229,"Ġstreaming":5230,"Ġterror":5231,"Ġsustained":5232,"ĠWWE":5233,"pre":5234,"ÅŁ":5235,"ait":5236,"Ġarrival":5237,"Ġresidence":5238,"Ġextent":5239,"Ġarrive":5240,"Ġ2002":5241,"Ġestablish":5242,"74":5243,"ĠArgentina":5244,"ĠDem":5245,"inn":5246,"aud":5247,"ĠNCAA":5248,"Ġquestioned":5249,"Ġballot":5250,"Ġmin":5251,"Ġlandscape":5252,"Ġhorse":5253,"Ġopponent":5254,"iel":5255,"Ġprompted":5256,"atory":5257,"Ġlift":5258,"Ġassociation":5259,"cher":5260,"Ġdefending":5261,"Ġtiny":5262,"Ġpoverty":5263,"ĠSafety":5264,"Ġpetition":5265,"ĠLimited":5266,"ĠCA":5267,"FC":5268,"Ãł":5269,"oni":5270,"Ġmonitor":5271,"ÃŃa":5272,"MA":5273,"Ġanswers":5274,"ĠMitchell":5275,"Ġbo":5276,"ĠShah":5277,"Ġsm":5278,"Ġmedal":5279,"ĠCivil":5280,"Ġrecognize":5281,"key":5282,"Ġpregnant":5283,"Ġspots":5284,"ante":5285,"Ġacademic":5286,"Ġinitiatives":5287,"Ġsecured":5288,"ĠCL":5289,"ils":5290,"Ġanticipated":5291,"Ġinvolvement":5292,"ĠMake":5293,"Ġinsisted":5294,"ĠWales":5295,"Ġclothing":5296,"Ġtracks":5297,"Ġsymptoms":5298,"Ġplate":5299,"ĠNY":5300,"Ġretailers":5301,"ĠPan":5302,"Ġfled":5303,"Ġquoted":5304,"Ġsaved":5305,"ĠCarter":5306,"Ġteaching":5307,"ĠTokyo":5308,"ĠCr":5309,"ĠSix":5310,"ĠPicture":5311,"Ġrecover":5312,"Ġcomedy":5313,"ree":5314,"Ġstrikes":5315,"ĠSanders":5316,"sel":5317,"Ġgraduate":5318,"Ġpending":5319,"St":5320,"Ġwarrant":5321,"Ġhonest":5322,"ĠGM":5323,"Ġnoticed":5324,"ĠGalaxy":5325,"ider":5326,"Ġproposals":5327,"Ġwore":5328,"Ġindeed":5329,"EM":5330,"ĠChannel":5331,"ances":5332,"ĠBrady":5333,"86":5334,"Ġgotten":5335,"Ġthrowing":5336,"ĠLeader":5337,"ĠVideo":5338,"71":5339,"Ġwelcomed":5340,"NEW":5341,"Ġfairly":5342,"Ġpromises":5343,"ĠSilver":5344,"Ġrape":5345,"Ġopener":5346,"ares":5347,"ĠSir":5348,"making":5349,"Ġcur":5350,"Ġrooms":5351,"73":5352,"Ġamounts":5353,"ĠIndustry":5354,"ĠDar":5355,"Ġ62":5356,"ted":5357,"Ġabroad":5358,"ĠMaybe":5359,"Ġreaders":5360,"oke":5361,"Ġpublication":5362,"ĠJean":5363,"Ġoperator":5364,"ĠHaving":5365,"ĠMil":5366,"life":5367,"Ġgenerate":5368,"ĠCraig":5369,"ĠMass":5370,"ĠBh":5371,"Ġrequested":5372,"Ġcrazy":5373,"ĠSpace":5374,"Ġcopy":5375,"Ġexport":5376,"Ġcontext":5377,"Ġbr":5378,"62":5379,"ĠRobinson":5380,"Ġcyber":5381,"ENT":5382,"BI":5383,"arg":5384,"Ġspeaker":5385,"Ġdramatic":5386,"ĠOl":5387,"ĠMill":5388,"Ġtrained":5389,"Ġediting":5390,"Ġsalary":5391,"Ġdirectors":5392,"Ġexplore":5393,"Ġlucky":5394,"Ġprominent":5395,"Ġbrothers":5396,"Ġneck":5397,"icht":5398,"ĠWatson":5399,"born":5400,"Ġproven":5401,"Ġprincipal":5402,"Ġedition":5403,"Ed":5404,"Ġswitch":5405,"maker":5406,"Ġrelative":5407,"mi":5408,"ĠBruce":5409,"ho":5410,"ĠScottish":5411,"water":5412,"ĠSport":5413,"ĠKings":5414,"ĠCollins":5415,"adi":5416,"Ġcelebrated":5417,"Ġclothes":5418,"Ġsunny":5419,"ĠCharlotte":5420,"ees":5421,"Ġscenes":5422,"ĠData":5423,"Ġwounded":5424,"Ġunusual":5425,"Ġrealized":5426,"ĠPlan":5427,"ĠTrans":5428,"ĠFC":5429,"Ġletters":5430,"Ġalerts":5431,"ĠWarren":5432,"DS":5433,"oss":5434,"pping":5435,"Ġsuspension":5436,"Ġbenchmark":5437,"ĠAcc":5438,"Ġalert":5439,"Ġpassion":5440,"ĠEst":5441,"Ġlatter":5442,"Ġstability":5443,"Ġarts":5444,"Ġpursue":5445,"ĠSeason":5446,"Ġfields":5447,"Ġmethod":5448,"63":5449,"Ġfolks":5450,"Ġexclusive":5451,"Ġcrews":5452,"Ġsessions":5453,"ĠMajor":5454,"ĠMount":5455,"Ġmap":5456,"Ġ=":5457,"Ġsituations":5458,"ĠBerlin":5459,"rey":5460,"Ġdates":5461,"Ġsheet":5462,"ĠLo":5463,"Ġfighters":5464,"ĠMart":5465,"Ġatmosphere":5466,"Ġillness":5467,"Ġcompeting":5468,"ĠChristopher":5469,"ĠRoy":5470,"mm":5471,"iano":5472,"Ġge":5473,"ĠRams":5474,"Ġconversations":5475,"ĠPa":5476,"ĠTel":5477,"Ġappreciate":5478,"78":5479,"ĠTotal":5480,"low":5481,"ĠStone":5482,"Ġopposite":5483,"Ġbarrel":5484,"Ġdevelopers":5485,"Ġexpress":5486,"Ġhighs":5487,"which":5488,"par":5489,"ĠVietnam":5490,"Ġblocks":5491,"Ġrecording":5492,"Ġadjusted":5493,"Ġret":5494,"ĠAR":5495,"Ġmilitants":5496,"Ġinnovative":5497,"ĠGhana":5498,"FR":5499,"Ġfantastic":5500,"Ġmortgage":5501,"ando":5502,"ĠLane":5503,"ises":5504,"ĠÂ":5505,"Ġhomeless":5506,"ĠKal":5507,"Ġapproached":5508,"Ġrounds":5509,"Ġmargins":5510,"ament":5511,"ĠMotor":5512,"Ġencouraging":5513,"ÂŃ":5514,"uru":5515,"Ġhandling":5516,"ĠMassachusetts":5517,"Ġplanet":5518,"ĠSpring":5519,"ĠBon":5520,"gu":5521,"Beat":5522,"Ġdrawing":5523,"ĠPhoenix":5524,"very":5525,"aid":5526,"ĠSte":5527,"ĠEntertainment":5528,"ĠRon":5529,"Ġassigned":5530,"ĠSA":5531,"News":5532,"Ġinterviews":5533,"ĠOh":5534,"media":5535,"vel":5536,"Ġpermission":5537,"Ġtransactions":5538,"Ġtraders":5539,"Ġsolo":5540,"Ġprovincial":5541,"Ġsuggesting":5542,"¡":5543,"Ġdiverse":5544,"Ġ67":5545,"Ġranks":5546,"ĠFre":5547,"Ġfavourite":5548,"Ġ63":5549,"Ġdifferences":5550,"Ġtargeting":5551,"Ġactors":5552,"Ġ76":5553,"icated":5554,"Ġcollect":5555,"akes":5556,"war":5557,"Ġcontained":5558,"ches":5559,"Ġlibrary":5560,"Ġsegments":5561,"ĠLine":5562,"ê":5563,"ual":5564,"Ġbags":5565,"Ġfactory":5566,"Ġear":5567,"Ġsomewhat":5568,"Ġrail":5569,"ĠUP":5570,"ula":5571,"ĠNiger":5572,"Ġlas":5573,"Ġimplementation":5574,"Ġemails":5575,"kel":5576,"wing":5577,"Ġadvised":5578,"--":5579,"istic":5580,"Ġdepth":5581,"Ġshoes":5582,"ĠJennifer":5583,"Ġvenue":5584,"Ġcontain":5585,"Ġhighlights":5586,"Ġcapabilities":5587,"Ġprocesses":5588,"Ġtradition":5589,"Ġcontacted":5590,"Ġproducing":5591,"Ġtrail":5592,"rem":5593,"Ġ600":5594,"Ġ68":5595,"AA":5596,"ĠBa":5597,"ĠSuch":5598,"ĠTyler":5599,"ipp":5600,"Ġsurvived":5601,"ami":5602,"ĠContinue":5603,"Ġcapture":5604,"bi":5605,"61":5606,"96":5607,"Ġthreatening":5608,"Ġkeen":5609,"dale":5610,"Ġtrailer":5611,"Ġstages":5612,"ĠGordon":5613,"Ġfinishing":5614,"Ġlegislative":5615,"Ġuseful":5616,"ĠGreek":5617,"ald":5618,"Ġgrounds":5619,"ĠDu":5620,"storms":5621,"ills":5622,"Ġexpense":5623,"Ġdetained":5624,"Today":5625,"Ġdiet":5626,"Ġwood":5627,"ĠCameron":5628,"Ġthrown":5629,"Ġcricket":5630,"Ġideal":5631,"with":5632,"Ġteammates":5633,"ours":5634,"Ġprojected":5635,"Ġpersonally":5636,"ĠBoy":5637,"rom":5638,"ĠPhilippines":5639,"win":5640,"ges":5641,"Ġcounties":5642,"ĠBaker":5643,"Ġprosecutor":5644,"Ġroof":5645,"met":5646,"Ġpartly":5647,"ĠMoon":5648,"eman":5649,"Ġfocusing":5650,"Ġfishing":5651,"than":5652,"ĠJeremy":5653,"ĠBad":5654,"ais":5655,"Ġcontrols":5656,"Ġtonnes":5657,"Ġshall":5658,"Ġ61":5659,"Ġgathering":5660,"ĠERA":5661,"Ġpresidency":5662,"Ġ85":5663,"ĠGas":5664,"Ġscenario":5665,"Ġquarters":5666,"Ġang":5667,"Ġsettled":5668,"ĠCommerce":5669,"Ġanybody":5670,"Ġgarden":5671,"ĠLibrary":5672,"Ġbet":5673,"Ġtopic":5674,"olo":5675,"Ġintense":5676,"87":5677,"Ġlinks":5678,"Ġmed":5679,"ĠAG":5680,"Ġflooding":5681,"ĠMurphy":5682,"PM":5683,"Ġfinds":5684,"Ġsensitive":5685,"pped":5686,"Ġcompletion":5687,"Ġminority":5688,"Ġvon":5689,"Ġstriking":5690,"rich":5691,"Ġbars":5692,"Ġefficient":5693,"Ġcontributions":5694,"Ġvisits":5695,"Ġattract":5696,"ĠMalaysia":5697,"ĠREL":5698,"Ġopens":5699,"Ġessentially":5700,"Ġreasonable":5701,"Ġsentiment":5702,"ĠMelbourne":5703,"Ġfitness":5704,"Ġfrequently":5705,"ĠRangers":5706,"Ġmuseum":5707,"ĠDNA":5708,"Ġcontrast":5709,"ĠAdams":5710,"ĠWin":5711,"Ġfalls":5712,"Ġimposed":5713,"250":5714,"ood":5715,"ĠRio":5716,"Ġchoices":5717,"Ġyellow":5718,"rin":5719,"ben":5720,"ĠStaff":5721,"ĠIndonesia":5722,"Ġcarries":5723,"Ġtourism":5724,"UM":5725,"ĠOrange":5726,"sell":5727,"Ġresolve":5728,"ĠMumbai":5729,"Ġpan":5730,"Ġimplement":5731,"Ġmidfielder":5732,"OP":5733,"Ġtensions":5734,"Ġ800":5735,"ĠLord":5736,"ĠLight":5737,"Ġlies":5738,"és":5739,"Ġparticipation":5740,"Ġtries":5741,"Ġsheriff":5742,"degree":5743,"Ġcongressional":5744,"Ġmode":5745,"Ġregulation":5746,"ĠJacob":5747,"ĠCrown":5748,"Ġbowl":5749,"ĠMississippi":5750,"Ġtheft":5751,"ĠKingdom":5752,"Ġresort":5753,"Ġroyal":5754,"Ġunemployment":5755,"PP":5756,"Ġnomination":5757,"ĠTR":5758,"Ġbehaviour":5759,"bank":5760,"ĠForest":5761,"WASHINGTON":5762,"ĠOthers":5763,"Ġslowly":5764,"Ġmenu":5765,"vo":5766,"ĠSy":5767,"ĠMetro":5768,"ĠLisa":5769,"Ġregistration":5770,"While":5771,"ĠJesus":5772,"Ġ250":5773,"Ġprocessing":5774,"Ġmonetary":5775,"ape":5776,"ener":5777,"ĠSystems":5778,"Ġdisappointed":5779,"Ġprint":5780,"uy":5781,"ħ":5782,"Ġdemanding":5783,"Ġincredibly":5784,"play":5785,"Ġsurveillance":5786,"ĠStandard":5787,"Ġperiods":5788,"Ġwrites":5789,"ĠLuke":5790,"ĠPalestinian":5791,"Ġwalks":5792,"Ġriding":5793,"Ġwaters":5794,"ĠSox":5795,"Ġtraveling":5796,"Ġtap":5797,"Ġorganized":5798,"Ġresource":5799,"Ġangry":5800,"Ġtiming":5801,"Ġempty":5802,"Ġmilk":5803,"Ġtherapy":5804,"ĠBrandon":5805,"mon":5806,"Ġnationwide":5807,"Ġnovel":5808,"ĠStorm":5809,"iet":5810,"ĠBre":5811,"Ġbegun":5812,"Ġdiplomatic":5813,"Ġads":5814,"ĠDC":5815,"ĠOb":5816,"ĠMontreal":5817,"ĠDown":5818,"ĠMilwaukee":5819,"Ġmeal":5820,"ĠPuerto":5821,"ĠMas":5822,"Ġjoy":5823,"Ġdeparture":5824,"ĠWright":5825,"Ġspoken":5826,"style":5827,"ĠAction":5828,"ĠComey":5829,"Ġdelivering":5830,"Ġtoll":5831,"Ġmidnight":5832,"ĠRevenue":5833,"Ġfiring":5834,"Ġstunning":5835,"Ġkicked":5836,"ĠOttawa":5837,"Ġefficiency":5838,"ĠLincoln":5839,"Ġtaste":5840,"ez":5841,"ĠWeather":5842,"ĠMorning":5843,"Ġhadn":5844,"Ġdiversity":5845,"ily":5846,"ĠAy":5847,"Ġargue":5848,"Ġerror":5849,"Ġtaught":5850,"Ġche":5851,"Ġoccasion":5852,"Ġinc":5853,"ĠOrlando":5854,"ĠOnline":5855,"Ġlegs":5856,"ĠNation":5857,"uck":5858,"Ġwidespread":5859,"ĠOcean":5860,"Ġconstantly":5861,"ĠLatin":5862,"Ġcomfort":5863,"Ġrely":5864,"uff":5865,"ĠCard":5866,"aring":5867,"Ġhumans":5868,"ĠThomson":5869,"aka":5870,"BIT":5871,"ĠReview":5872,"po":5873,"ú":5874,"Ġtrucks":5875,"Ġforecasts":5876,"view":5877,"Ġlongtime":5878,"ĠConstitution":5879,"Ġreserves":5880,"bit":5881,"Ġstressed":5882,"Ġcontribution":5883,"Ġchicken":5884,"ĠDE":5885,"Ġfat":5886,"ĠOscar":5887,"Ġcriticized":5888,"Ġtestimony":5889,"Ġapparent":5890,"Ġconstant":5891,"Ġcabinet":5892,"ĠDuke":5893,"Ġaspects":5894,"lic":5895,"ĠVol":5896,"Ġwing":5897,"Ġreb":5898,"ĠSessions":5899,"ĠSmart":5900,"car":5901,"ĠIm":5902,"Ġoperational":5903,"Ġregulators":5904,"ĠJimmy":5905,"eter":5906,"Ġnobody":5907,"ĠMarc":5908,"Ġliterally":5909,"Ġresistance":5910,"ĠKam":5911,"Ġsexually":5912,"Ġ69":5913,"uth":5914,"Ġviewed":5915,"Ġpicks":5916,"Ġdin":5917,"Ġtalented":5918,"Ġtennis":5919,"Ġstrengthen":5920,"Ġgl":5921,"ĠProtection":5922,"Ġinstalled":5923,"ways":5924,"ĠCampbell":5925,"ĠPortland":5926,"Ġintent":5927,"ĠPalace":5928,"Ġsecondary":5929,"Ġlocked":5930,"ĠPA":5931,"Ġlanded":5932,"Ġlength":5933,"Ġboosted":5934,"Ġpurchases":5935,"Ġcommand":5936,"ĠAsked":5937,"Ġspaces":5938,"Ġiconic":5939,"Ġrecommend":5940,"Ġduties":5941,"Ġseized":5942,"Ġdelayed":5943,"FA":5944,"AND":5945,"daq":5946,"Ġhiring":5947,"Ġoccur":5948,"DC":5949,"ĠMus":5950,"Ġag":5951,"Ġhopefully":5952,"ĠPenn":5953,"ards":5954,"Ġstriker":5955,"Ġrent":5956,"ĠTy":5957,"ĠBuffalo":5958,"ĠKy":5959,"Ġhike":5960,"pper":5961,"Ġ120":5962,"Ġop":5963,"Ġwheel":5964,"ĠIan":5965,"Ġchart":5966,"tt":5967,"Ġvolunteer":5968,"IG":5969,"person":5970,"ight":5971,"ĠBook":5972,"unt":5973,"ĠTechnologies":5974,"Now":5975,"Ġfavour":5976,"ĠGh":5977,"ĠQatar":5978,"ĠDutch":5979,"ĠGrant":5980,"ĠBan":5981,"rel":5982,"Ġagreements":5983,"Ġeducational":5984,"worth":5985,"ĠWard":5986,"700":5987,"Ġanymore":5988,"Ġrepair":5989,"Ġoperators":5990,"ĠLi":5991,"ots":5992,"ĠLouisiana":5993,"ĠWhether":5994,"Ġodds":5995,"Ġnoon":5996,"ĠStr":5997,"Ġfail":5998,"iser":5999,"Ġforever":6000,"Ġrecall":6001,"ĠPo":6002,"ĠHot":6003,"Ġdesigner":6004,"ido":6005,"LL":6006,"ĠControl":6007,"Ġsurvive":6008,"iam":6009,"Ġorganisation":6010,"ĠWork":6011,"Ġwider":6012,"Ġtank":6013,"work":6014,"ĠAS":6015,"Ġposting":6016,"Ġsuddenly":6017,"MC":6018,"ĠAL":6019,"ĠProfessor":6020,"ĠCoach":6021,"Ġrushed":6022,"Ġafraid":6023,"Ġactivist":6024,"that":6025,"ĠFilm":6026,"Ġbacking":6027,"Ġhousehold":6028,"Ġsignal":6029,"Ġaccurate":6030,"str":6031,"ĠThread":6032,"ĠBears":6033,"ATION":6034,"ĠAlliance":6035,"ĠMcDonald":6036,"ĠVenezuela":6037,"ogg":6038,"ĠWindows":6039,"makers":6040,"Ġutility":6041,"Ġrapidly":6042,"Ġattractive":6043,"Ġpa":6044,"ĠLarry":6045,"Ġmisconduct":6046,"Ġfreshman":6047,"Ġqualified":6048,"Ġcleared":6049,"Ġcrashed":6050,"Ġparticipating":6051,"Ġpages":6052,"Ġhighlight":6053,"Ġdialogue":6054,"ĠAlberta":6055,"Ġca":6056,"Ġwitnesses":6057,"ables":6058,"Ġfollowers":6059,"Ġensuring":6060,"Ġpromoting":6061,"Ġsearching":6062,"Ġremote":6063,"Ġclash":6064,"Ġfirefighters":6065,"Ġteen":6066,"ĠPlace":6067,"ĠNote":6068,"Ġregardless":6069,"ult":6070,"oney":6071,"ander":6072,"ional":6073,"ining":6074,"Ġdemanded":6075,"ĠCommunications":6076,"Ġconsideration":6077,"TC":6078,"ĠSoutheast":6079,"aga":6080,"ĠGarden":6081,"inger":6082,"ht":6083,"Ġbranch":6084,"Ġmouth":6085,"Ġaudio":6086,"Ġraw":6087,"Ġcoordinator":6088,"Ġexact":6089,"ĠHan":6090,"Ġdelays":6091,"ĠWal":6092,"ĠWells":6093,"Ġng":6094,"Ġhandful":6095,"Ġgirlfriend":6096,"Ġtypical":6097,"ĠWayne":6098,"ĠFranklin":6099,"Ġconstitutional":6100,"ĠChance":6101,"Ġblamed":6102,"rim":6103,"Ġpreliminary":6104,"Ġlie":6105,"da":6106,"ĠCapitol":6107,"Ġroutine":6108,"ĠNASA":6109,"Ġtre":6110,"ĠGolf":6111,"Ġsight":6112,"ĠDer":6113,"Ġreserve":6114,"150":6115,"Ġspeculation":6116,"Ġcompetitors":6117,"ĠMacron":6118,"ony":6119,"Ġovertime":6120,"Ġ71":6121,"Ġdepending":6122,"ĠWarner":6123,"Ġaccusations":6124,"ius":6125,"Ġpredicted":6126,"ĠCharlie":6127,"Ġeverywhere":6128,"Ġcable":6129,"ĠSaint":6130,"ĠRegion":6131,"Ġhero":6132,"ĠEmb":6133,"Ġkinds":6134,"Ġstarter":6135,"Ġsolve":6136,"ĠGuard":6137,"Ġloves":6138,"ĠDouglas":6139,"Ġfunded":6140,"ĠBrent":6141,"ĠAnyone":6142,"Ġsubstantial":6143,"ĠMarine":6144,"ĠMichelle":6145,"Ġcelebrating":6146,"Ġoffset":6147,"Ġbutton":6148,"gg":6149,"Ġmedicine":6150,"uri":6151,"Ġsomewhere":6152,"PD":6153,"Ġmon":6154,"Ġfires":6155,"final":6156,"oth":6157,"ined":6158,"Ġunderway":6159,"Ġmistakes":6160,"Ġgrateful":6161,"Ġcheap":6162,"È":6163,"Ġ95":6164,"Ġviolations":6165,"arr":6166,"Ġsurprising":6167,"Ġob":6168,"ĠNATO":6169,"Ġcontroversy":6170,"ĠSweden":6171,"Ġfuneral":6172,"Ġreviews":6173,"Ġpromotion":6174,"TY":6175,"Ġliberal":6176,"Ġpromising":6177,"ĠSP":6178,"How":6179,"Ġmemories":6180,"Ġbreast":6181,"zi":6182,"ights":6183,"Ġpattern":6184,"Ġoutdoor":6185,"ĠMu":6186,"Ġrush":6187,"ĠTheresa":6188,"ĠPol":6189,"Ġdescribe":6190,"ĠBand":6191,"ĠStewart":6192,"Ġ1999":6193,"ĠRaiders":6194,"mp":6195,"Ġprocedures":6196,"Ġplot":6197,"Ġhire":6198,"used":6199,"Ġ1970":6200,"Ġpicking":6201,"ĠSim":6202,"Ġregard":6203,"inal":6204,"backs":6205,"ĠHard":6206,"ĠLow":6207,"ĠAc":6208,"Is":6209,"Ġguarantee":6210,"ĠGiven":6211,"Ġbeta":6212,"ĠTre":6213,"Ġtrans":6214,"Ġretailer":6215,"Ġpurposes":6216,"ĠHol":6217,"Ġenjoying":6218,"Ġbrown":6219,"ĠPerry":6220,"Ġplea":6221,"MS":6222,"ĠDakota":6223,"ĠParker":6224,"Ġcommit":6225,"ĠLawrence":6226,"ĠMorris":6227,"ended":6228,"Ġvirtual":6229,"ÃĹ":6230,"Ġfruit":6231,"84":6232,"ĠHas":6233,"ishing":6234,"Ġdominated":6235,"ĠFA":6236,"Ġchannels":6237,"Ġunderstood":6238,"Ġcitizen":6239,"Ġchecks":6240,"ĠKenya":6241,"Ġdisabled":6242,"SD":6243,"Ġprotecting":6244,"Ġtweets":6245,"Ġsparked":6246,"ĠCO":6247,"§":6248,"ori":6249,"ĠGDP":6250,"ĠSer":6251,"ĠVisit":6252,"ĠMS":6253,"Ġbarely":6254,"Ġsand":6255,"Ġap":6256,"aging":6257,"Ġrel":6258,"ĠPerhaps":6259,"ĠMourinho":6260,"ĠJets":6261,"Ġdisclosure":6262,"Ġhighlighted":6263,"Ġimplemented":6264,"Ġcompliance":6265,"ĠAB":6266,"ĠAssistant":6267,"ĠCape":6268,"Ġfunny":6269,"Ġleverage":6270,"Ġmachines":6271,"Ġranging":6272,"Ġfastest":6273,"ĠRoberts":6274,"ĠPolicy":6275,"gar":6276,"Ġcollapse":6277,"ĠThrough":6278,"Ġrobbery":6279,"ĠHay":6280,"Ġelite":6281,"ĠDigital":6282,"ĠFun":6283,"ĠAlan":6284,"ement":6285,"Ġmit":6286,"Ġspin":6287,"Ġlistening":6288,"ĠDoug":6289,"ĠSaints":6290,"Ġinterior":6291,"Ġenhance":6292,"ĠCardinals":6293,"ever":6294,"Ġrobust":6295,"Ġinform":6296,"Ġsuffer":6297,"book":6298,"ĠMuslims":6299,"Ġagriculture":6300,"Ġkm":6301,"Ġdivers":6302,"ñ":6303,"ĠReg":6304,"Ġequivalent":6305,"Ġcraft":6306,"Ġsettle":6307,"Ġcontains":6308,"ĠMack":6309,"ĠDis":6310,"ĠFore":6311,"ĠSudan":6312,"ĠMail":6313,"ĠBrooklyn":6314,"izer":6315,"bn":6316,"Ġhundred":6317,"Ġexhibition":6318,"ĠHave":6319,"vin":6320,"Ġcivilians":6321,"ĠCincinnati":6322,"Some":6323,"ĠSE":6324,"Ġbat":6325,"ĠIns":6326,"Ġcalm":6327,"Ġtone":6328,"Ġnormally":6329,"Ġseeks":6330,"ĠAss":6331,"Ġmembership":6332,"Ġannually":6333,"Ġemployers":6334,"CO":6335,"Ġcomplicated":6336,"Ġheadlines":6337,"ĠLabor":6338,"Ġlifestyle":6339,"ĠRen":6340,"ĠRich":6341,"cent":6342,"ude":6343,"Ġawesome":6344,"Ġpaint":6345,"Ġrolling":6346,"Ġwalls":6347,"Ġlab":6348,"Ġtourists":6349,"care":6350,"Ġgear":6351,"izz":6352,"Ġcream":6353,"ĠTro":6354,"ices":6355,"Ġpack":6356,"Ġdiseases":6357,"ĠSpeaker":6358,"ĠOfficers":6359,"Ġsky":6360,"83":6361,"ĠBE":6362,"Ġcategories":6363,"Ġindicate":6364,"Ġru":6365,"ĠSony":6366,"ĠDun":6367,"ocks":6368,"Ġconcrete":6369,"ĠMadison":6370,"ĠSab":6371,"IV":6372,"Ġobserved":6373,"ria":6374,"Ġinterim":6375,"Ġencounter":6376,"ista":6377,"Ġanger":6378,"Ġrapid":6379,"mail":6380,"Ġdestination":6381,"ĩ":6382,"Ġbreaks":6383,"rell":6384,"ĠChase":6385,"Ġattorneys":6386,"Ġrolled":6387,"ĠSprings":6388,"ĠVillage":6389,"TO":6390,"HS":6391,"Ġcampaigns":6392,"ologist":6393,"ĠTax":6394,"ĠIII":6395,"Ġteach":6396,"Ġprovision":6397,"Ġrem":6398,"Ġshirt":6399,"Ġdeployed":6400,"Ġguidelines":6401,"Ġav":6402,"zer":6403,"Ġrushing":6404,"94":6405,"place":6406,"Man":6407,"Ġdivided":6408,"ĠGun":6409,"Ġwindows":6410,"Ġcomponents":6411,"aba":6412,"ĠSwitzerland":6413,"election":6414,"ĠTampa":6415,"ĠAri":6416,"ás":6417,"Ġhighway":6418,"Ġacres":6419,"Ġcrown":6420,"known":6421,"Ġinquiry":6422,"url":6423,"Ġexpertise":6424,"Ġpraised":6425,"yer":6426,"Ġconclusion":6427,"Ġabortion":6428,"Ġlady":6429,"Ġtribute":6430,"Ġunveiled":6431,"Ġbeaten":6432,"TE":6433,"ĠMot":6434,"unk":6435,"Ġtriple":6436,"Ġforcing":6437,"ĠTickets":6438,"uit":6439,"Ġiron":6440,"Ġscientific":6441,"ĠIP":6442,"Ġdiagnosed":6443,"Ġocean":6444,"wide":6445,"ĠCowboys":6446,"LC":6447,"Ġmethods":6448,"ĠFind":6449,"ĠDean":6450,"Ġfundamental":6451,"ĠGill":6452,"Ġfeelings":6453,"IO":6454,"hu":6455,"Ġfeedback":6456,"ote":6457,"Ġduo":6458,"fully":6459,"get":6460,"Ġproof":6461,"story":6462,"Ġlongest":6463,"Ġshops":6464,"ĠJong":6465,"ĠCro":6466,"ĠHawaii":6467,"91":6468,"ĠJake":6469,"ĠSusan":6470,"Ġsubmit":6471,"rav":6472,"Ġmodest":6473,"Ġlit":6474,"Ġattempting":6475,"Ġsits":6476,"Ġaddressing":6477,"93":6478,"ĠBi":6479,"Ġlying":6480,"ĠOrganization":6481,"ĠOak":6482,"oli":6483,"Ġfatal":6484,"Ġmountain":6485,"val":6486,"lu":6487,"ĠMaine":6488,"Ġcharging":6489,"Ġresigned":6490,"illo":6491,"Ġrecommendation":6492,"party":6493,"ĠWeb":6494,"ĠPanthers":6495,"Ġnoise":6496,"ĠBrussels":6497,"awa":6498,"Ġambassador":6499,"Ġaccessible":6500,"ĠCalgary":6501,"idd":6502,"ĠAirlines":6503,"gr":6504,"Ġnu":6505,"roy":6506,"ĠMars":6507,"ĠPoland":6508,"ĠJerry":6509,"ados":6510,"ĠRico":6511,"ĠMir":6512,"ĠFin":6513,"ious":6514,"Ġpacked":6515,"Ġinsider":6516,"President":6517,"ĠBull":6518,"ĠYemen":6519,"ĠConnecticut":6520,"Ġ73":6521,"Ġdepartments":6522,"Ġorganic":6523,"ĠSummer":6524,"ĠBet":6525,"ste":6526,"zo":6527,"rat":6528,"Ġalliance":6529,"Ġintervention":6530,"wan":6531,"ĠOR":6532,"Ġdefined":6533,"ĠÃł":6534,"ĠChiefs":6535,"Ġknocked":6536,"ared":6537,"Ġholes":6538,"Ġpulling":6539,"ĠTodd":6540,"ĠJamie":6541,"ĠSher":6542,"Ġsignature":6543,"ĠSur":6544,"Ġgym":6545,"ĠVladimir":6546,"ĠThailand":6547,"Ġgaming":6548,"Ġsaving":6549,"ceive":6550,"82":6551,"ĠBern":6552,"ĠDid":6553,"Ġhardware":6554,"ished":6555,"Ġconspiracy":6556,"ANS":6557,"ĠIntelligence":6558,"Ġassembly":6559,"Ġ101":6560,"Ġconcise":6561,"ĠManhattan":6562,"Ġbelief":6563,"Ġsurge":6564,"Ġdeserve":6565,"Ġconsistently":6566,"ĠNor":6567,"okes":6568,"ðŁ":6569,"ME":6570,"ĠAsset":6571,"Ġsubstance":6572,"Ġprefer":6573,"Ġburning":6574,"ĠNik":6575,"ook":6576,"ĠPinterest":6577,"Ġboyfriend":6578,"ĠHal":6579,"ĠMerkel":6580,"Ġintroduce":6581,"ĠLinkedIn":6582,"ĠFull":6583,"ĠFarm":6584,"Ġchildhood":6585,"ĠTransportation":6586,"Ġterrible":6587,"du":6588,"Ġintention":6589,"Ġseemingly":6590,"elle":6591,"Ġfoods":6592,"Ġtitled":6593,"Ġdual":6594,"Ġimport":6595,"Ġdeveloper":6596,"UL":6597,"ington":6598,"ĠDelta":6599,"?'":6600,"iness":6601,"Ġquit":6602,"ĠGarcia":6603,"ĠSri":6604,"Ġhip":6605,"ĠBrazilian":6606,"elt":6607,"ively":6608,"Ġstructures":6609,"Ġlabour":6610,"Ġneighbors":6611,"Ġtill":6612,"Ġsoil":6613,"Ġdropping":6614,"Ġnominee":6615,"Ġmeets":6616,"92":6617,"rant":6618,"isa":6619,"Ġluck":6620,"aa":6621,"jet":6622,"ĠTor":6623,"ĠCrime":6624,"Ġlane":6625,"Ġflu":6626,"Ġlaunching":6627,"ĠAutom":6628,"aks":6629,"Ġuniversities":6630,"Ġpollution":6631,"ĠAdvis":6632,"ĠMall":6633,"ls":6634,"Ġdeeper":6635,"Ġrepeated":6636,"Ġmeanwhile":6637,"Ġchip":6638,"Ġoutlets":6639,"Ġliked":6640,"Ġsal":6641,"Ġwelfare":6642,"ago":6643,"Ġmakers":6644,"ving":6645,"fer":6646,"Ġovercome":6647,"mb":6648,"Ġshocked":6649,"akers":6650,"Ġnonprofit":6651,"Ġdonated":6652,"eral":6653,"Ġresume":6654,"Ġlogo":6655,"Ġsubscription":6656,"Ġ74":6657,"ela":6658,"Ġaspect":6659,"html":6660,"Ġsorry":6661,"Ġupgrade":6662,"Ġstance":6663,"Ġfr":6664,"Ġpapers":6665,"Ġattacking":6666,"Ġmeaningful":6667,"81":6668,"ĠWeinstein":6669,"Ġcreates":6670,"Ġhonour":6671,"ĠReply":6672,"oph":6673,"Ġmarch":6674,"Ġsmile":6675,"Ġcomparison":6676,"will":6677,"ĠSanchez":6678,"Ġvoter":6679,"Ġtheory":6680,"Ġequally":6681,"ĠRoger":6682,"Ġperfectly":6683,"Ġlanding":6684,"Ġbillions":6685,"ĠBloomberg":6686,"Ġpermit":6687,"Ġfinals":6688,"Ġracial":6689,"Ġpregnancy":6690,"iled":6691,"ĠFederation":6692,"Ġforest":6693,"Ġtag":6694,"aul":6695,"Ġdrinks":6696,"Ġ(\"":6697,"ĠMobile":6698,"Ġtouched":6699,"Ġclock":6700,"Ġreg":6701,"Ġasylum":6702,"igan":6703,"Ġsenator":6704,"Ġ99":6705,"ĠKumar":6706,"Ġskill":6707,"Ġ1998":6708,"pa":6709,"ĠAf":6710,"Ġmood":6711,"ston":6712,"Ġhang":6713,"ĠMPs":6714,"Please":6715,"ĠEve":6716,"Ġdocumentary":6717,"Ġpersonality":6718,"ĠCast":6719,"Ġdiscount":6720,"bing":6721,"ĠBoeing":6722,"Ġdepend":6723,"Ġcrossing":6724,"EX":6725,"Ġsucceed":6726,"Ġhumanitarian":6727,"ĠMuhammad":6728,"Ġwages":6729,"Ġcolumn":6730,"Ġexternal":6731,"Ġstatistics":6732,"ĠTODAY":6733,"Ġtrips":6734,"Ġta":6735,"Ġpenalties":6736,"Ġwriters":6737,"Ġshipping":6738,"ĠIndians":6739,"Ġsalt":6740,"ĠIndustrial":6741,"ĠYankees":6742,"ĠDen":6743,"Ġrough":6744,"Ġbarrels":6745,"ĠHor":6746,"bert":6747,"ĠDep":6748,"Ġresign":6749,"97":6750,"Ġballs":6751,"ĠJun":6752,"ĠBab":6753,"Ġassociate":6754,"Ġstring":6755,"Ġhub":6756,"Ġorgan":6757,"ĠMarshall":6758,"ĠFIFA":6759,"ĠMun":6760,"ency":6761,"research":6762,"Ġpeers":6763,"Ġtall":6764,"ĠGoldman":6765,"Don":6766,"Ġparade":6767,"Ġparks":6768,"Ġdet":6769,"Ġdisappointing":6770,"Ġreflects":6771,"ĠLakers":6772,"Ġfiles":6773,"Ġrelatives":6774,"ĠUSD":6775,"ĠArticle":6776,"Ġcustom":6777,"ĠCarlos":6778,"Ġtracking":6779,"Ġmaintaining":6780,"ĠCur":6781,"ardo":6782,"ĠSkip":6783,"Ġattitude":6784,"Just":6785,"Ġinstitution":6786,"Ġnarrow":6787,"Ġsnap":6788,"Ġenterprise":6789,"Ġdrives":6790,"Ġ77":6791,"Ġcrop":6792,"Ġvirus":6793,"Ġcelebrity":6794,"Ġeconomies":6795,"ued":6796,"Ġsum":6797,"ĠDubai":6798,"ĠInsurance":6799,"Ĺ":6800,"ury":6801,"ĠUnfortunately":6802,"Ġclosure":6803,"ota":6804,"ĠPhilip":6805,"oms":6806,"Ġinvestigated":6807,"Ġgenerations":6808,"ĠETF":6809,"ĠKeith":6810,"ĠLater":6811,"isk":6812,"Ġpreferred":6813,"Ġdefault":6814,"Ġtowns":6815,"ĠRod":6816,"ĠDie":6817,"Ġintegrated":6818,"Ġacquiring":6819,"Ġvoices":6820,"Ġser":6821,"Ġpresents":6822,"ĠBR":6823,"ĠEmergency":6824,"Ġreligion":6825,"HA":6826,"Ġresponding":6827,"ĠThings":6828,"Ġbeef":6829,"ĠWithout":6830,"urd":6831,"ĠCarl":6832,"Ġadministrative":6833,"ĠWhich":6834,"Ġchallenged":6835,"Ġcooking":6836,"ivid":6837,"ĠFer":6838,"Ġtremendous":6839,"ĠTerry":6840,"iri":6841,"CS":6842,"ĠJunior":6843,"ĠReddit":6844,"Ġtea":6845,"Ġaccounting":6846,"lan":6847,"Ġdetention":6848,"Ġreplied":6849,"SI":6850,"ĠHel":6851,"ns":6852,"ĠProf":6853,"Ġramp":6854,"ĠConservative":6855,"Ġattendance":6856,"Ġspecialist":6857,"ĠFinal":6858,"Ġadvertisement":6859,"Ġacquire":6860,"ĠWhatsApp":6861,"Ġworkforce":6862,"ĠCalif":6863,"Ġspeakers":6864,"ĠEPA":6865,"Ġconviction":6866,"hire":6867,"ĠFisher":6868,"ĠIntel":6869,"Ġbin":6870,"ĠWas":6871,"Ġearth":6872,"vi":6873,"Ġhurricane":6874,"Ġholidays":6875,"Ġassume":6876,"Ġinvolve":6877,"Ġdynamic":6878,"ĠGre":6879,"Ġitem":6880,"Ġpound":6881,"Ġanxiety":6882,"ĠPrint":6883,"rop":6884,"Ġautomatically":6885,"Ġdiscrimination":6886,"ĠLam":6887,"ĠColl":6888,"Ġimpressed":6889,"Ġinvolves":6890,"ĠLes":6891,"ĠTri":6892,"ĠLook":6893,"ĠiOS":6894,"Ġgrab":6895,"ĠAngel":6896,"Ġstops":6897,"ĠPay":6898,"ĠECB":6899,"Ġbunch":6900,"Ġletting":6901,"ele":6902,"ĠAdditionally":6903,"Ġboards":6904,"NC":6905,"Ġtragedy":6906,"Ġpink":6907,"Ġgonna":6908,"ones":6909,"Ġrev":6910,"ĠIndependent":6911,"ĠCambridge":6912,"ĠPence":6913,"Ġprosecution":6914,"Ġdeputies":6915,"ĠAhmed":6916,"Ġlows":6917,"ĠAmy":6918,"ĠBuilding":6919,"mark":6920,"Ġsmooth":6921,"Ġsole":6922,"Ġwanting":6923,"ĠHeart":6924,"Ġobtain":6925,"ĠBus":6926,"Ġexchanges":6927,"friendly":6928,"Ġlabel":6929,"elect":6930,"ĠCompanies":6931,"owing":6932,"ĠCB":6933,"RI":6934,"ĠMaster":6935,"Ġliquid":6936,"ĠDanny":6937,"Ġproceeds":6938,"ĠLaura":6939,"card":6940,"Ġtears":6941,"Ġexploration":6942,"Ġdepression":6943,"ken":6944,"ĠFe":6945,"Ġlending":6946,"ĠYouth":6947,"ality":6948,"NS":6949,"Ġmoon":6950,"ĠTaiwan":6951,"Ġstruggles":6952,"Ġdiscovery":6953,"Ġqualify":6954,"Ġwireless":6955,"alia":6956,"Ġwitnessed":6957,"Ġheight":6958,"ĠGuy":6959,"left":6960,"KE":6961,"Ġfoul":6962,"ĠMohammed":6963,"Ġgrass":6964,"ĠNon":6965,"Ġswim":6966,"Ġbrilliant":6967,"you":6968,"ĠFlynn":6969,"Ġsinging":6970,"eria":6971,"UT":6972,"ĠMcCain":6973,"ĠSep":6974,"ĠWars":6975,"Ġburden":6976,"Ġpas":6977,"Ġabandoned":6978,"Ġint":6979,"ĠTurner":6980,"Ġcollective":6981,"ĠEnvironmental":6982,"ĠStudents":6983,"Ġofferings":6984,"Ġresignation":6985,"Ġexplosion":6986,"ĠKoh":6987,"ager":6988,"Ġthrows":6989,"Ġasks":6990,"light":6991,"Ġanyway":6992,"Ġyard":6993,"Ġcarrier":6994,"Ġwaves":6995,"backed":6996,"TR":6997,"oud":6998,"Ġbreach":6999,"Ġdated":7000,"Ġdressed":7001,"ĠDodgers":7002,"oles":7003,"Ġ78":7004,"Ġreads":7005,"Ġpredict":7006,"ĠJerusalem":7007,"ĠPT":7008,"Ġcrack":7009,"yan":7010,"Ġnights":7011,"eline":7012,"Ġconvinced":7013,"Ġlock":7014,"Ġcarefully":7015,"ĠMercedes":7016,"Ġultimate":7017,"Ġdist":7018,"Ġslight":7019,"ĠEdwards":7020,"Ġswing":7021,"iling":7022,"Ġknife":7023,"ĠNashville":7024,"IF":7025,"inder":7026,"udd":7027,"Ġsenators":7028,"ĠFurther":7029,"ĠXi":7030,"Ġstr":7031,"ĠOd":7032,"days":7033,"Ġcomm":7034,"Ġverdict":7035,"Ġconfirmation":7036,"king":7037,"ĠCS":7038,"Ġadvocates":7039,"Ġpride":7040,"Ġmemorial":7041,"ams":7042,"erman":7043,"Ġteenager":7044,"ĠNeil":7045,"uts":7046,"Ġsoul":7047,"see":7048,"post":7049,"Ġchest":7050,"fire":7051,"ĠLynch":7052,"Ġpeaceful":7053,"OND":7054,"ĠIndustries":7055,"ĠJuan":7056,"Ġrestore":7057,"Ġreliable":7058,"ming":7059,"agan":7060,"Source":7061,"ĠCabinet":7062,"Ġremarkable":7063,"ĠTrudeau":7064,"ĠEs":7065,"Ġintegrity":7066,"ove":7067,"fe":7068,"Ġproceedings":7069,"Ġconnections":7070,"Ġunprecedented":7071,"ĠGlen":7072,"ux":7073,"Ġearning":7074,"Ġingredients":7075,"Ġnominated":7076,"ĠBangladesh":7077,"made":7078,"Ġlessons":7079,"Ġbreakfast":7080,"ĠRelations":7081,"Ġloose":7082,"Al":7083,"Ġupgraded":7084,"ral":7085,"ĠPage":7086,"oto":7087,"ĠQueensland":7088,"Ġprocedure":7089,"ĠSmall":7090,"Ġrespective":7091,"Ġpictured":7092,"ĠBas":7093,"Ġpreparation":7094,"ĠMyanmar":7095,"Ġdonation":7096,"Ġvisible":7097,"iest":7098,"ĠBroadway":7099,"rick":7100,"ĠSchools":7101,"Ġarrests":7102,"ĠJessica":7103,"ĠBengal":7104,"Ġhell":7105,"Ġannouncing":7106,"Ġmail":7107,"ĠMcG":7108,"two":7109,"rest":7110,"OD":7111,"ĠBradley":7112,"Ġdoubled":7113,"Ġpledged":7114,"Ġcomeback":7115,"Ġextraordinary":7116,"Ġslide":7117,"Ġassess":7118,"Ġagricultural":7119,"ĠKay":7120,"Ġvendors":7121,"Ġnarrative":7122,"Ġreviewed":7123,"ĠPass":7124,"Ġinspiration":7125,"ĠHunter":7126,"Ġcalendar":7127,"ĠDiamond":7128,"Ġremoval":7129,"ners":7130,"ĠKap":7131,"Ġconsent":7132,"Ġvisual":7133,"Ġcheese":7134,"ĠTher":7135,"ĠFR":7136,"ĠShanghai":7137,"iah":7138,"ĠCole":7139,"AK":7140,"Ġranking":7141,"Ġcook":7142,"Ġhalftime":7143,"ĠStars":7144,"Ġroutes":7145,"aim":7146,"Ġestablishment":7147,"ĠMug":7148,"Ġsurvivors":7149,"urg":7150,"ĠBrett":7151,"Ġunexpected":7152,"ained":7153,"Ġrarely":7154,"ĠGall":7155,"Ġadvocate":7156,"ĠNad":7157,"Ġ911":7158,"Ġracist":7159,"erer":7160,"ĠRev":7161,"ĠSection":7162,"Ġhelpful":7163,"CT":7164,"agg":7165,"Ġgovernance":7166,"Ġfelony":7167,"Ġoptimistic":7168,"Ġelectoral":7169,"EG":7170,"town":7171,"Ġdaughters":7172,"Ġanswered":7173,"Ġthin":7174,"ĠClassic":7175,"Ġshareholder":7176,"ĠBlake":7177,"ĠFla":7178,"Ġparliamentary":7179,"dy":7180,"Ġcommented":7181,"Ġtri":7182,"Ġglobe":7183,"Ġmandate":7184,"Ġslipped":7185,"ĠTower":7186,"Ġoperated":7187,"gers":7188,"Ġassured":7189,"ĠMartinez":7190,"Ġdesigns":7191,"ĠModel":7192,"Ġstakeholders":7193,"Ġdefended":7194,"Ġseniors":7195,"Ġvacation":7196,"Ġglobally":7197,"ump":7198,"Not":7199,"Ġclip":7200,"Ġarticles":7201,"BR":7202,"km":7203,"ĠFront":7204,"PL":7205,"Ġadoption":7206,"Ġsudden":7207,"Ġframework":7208,"Ġhanging":7209,"gl":7210,"ĠSel":7211,"Ġmoderate":7212,"Ġreverse":7213,"income":7214,"cor":7215,"ĠGB":7216,"Ġphysically":7217,"Ġtransparency":7218,"ĠElectric":7219,"Ġrefugee":7220,"profile":7221,"iva":7222,"ately":7223,"ĠAC":7224,"Ġtransferred":7225,"Ġaffair":7226,"ĠAlaska":7227,"oria":7228,"ĠChange":7229,"Ġrepeat":7230,"Ġscreening":7231,"ender":7232,"ĠCas":7233,"ĠDav":7234,"Ġfocuses":7235,"Ġcommissioner":7236,"Ġupside":7237,"ĠKeep":7238,"ĠBlues":7239,"ently":7240,"Ġaut":7241,"Ġexperiencing":7242,"aman":7243,"Ġapprove":7244,"Ġmile":7245,"Ġcheaper":7246,"ĠWind":7247,"ĠStore":7248,"Ġgrabbed":7249,"Ġsons":7250,"Ġfighter":7251,"Ġum":7252,"ĠBased":7253,"don":7254,"Ġconstitution":7255,"finals":7256,"act":7257,"¢":7258,"Ġmill":7259,"Ġorganisations":7260,"ĠToyota":7261,"Ġyuan":7262,"Ġterrorists":7263,"Ġforth":7264,"Ġavailability":7265,"Ġentrance":7266,"Ġvolumes":7267,"Ġmult":7268,"plus":7269,"ĠColumbus":7270,"ĠSummit":7271,"Ġbabies":7272,"ĠMur":7273,"ĠGray":7274,"ĠChar":7275,"ĠButler":7276,"Ġpose":7277,"ĠNatural":7278,"ĠAtt":7279,"Ġdecrease":7280,"Ġtens":7281,"kt":7282,"Ġminds":7283,"Ġimpacted":7284,"Ġchapter":7285,"ĠOp":7286,"ĠHarrison":7287,"ĠRodriguez":7288,"Ġethnic":7289,"Ġtravelling":7290,"ĠBond":7291,"ader":7292,"core":7293,"Ġgallery":7294,"founder":7295,"ĠVill":7296,"Ġdecent":7297,"ĠHistory":7298,"ĠInt":7299,"ĠNa":7300,"ĠHad":7301,"Ġmainstream":7302,"ĠTs":7303,"Ġbottle":7304,"sen":7305,"Ġrecession":7306,"Ġsophomore":7307,"Ġsilence":7308,"cc":7309,"Ġqualifying":7310,"Ġcomplained":7311,"ĠRad":7312,"Ġactively":7313,"Ġbacks":7314,"ĠMusk":7315,"Ġcareful":7316,"Ġmeals":7317,"ĠDor":7318,"Ġmess":7319,"ĠBelgium":7320,"Ġke":7321,"ĠLopez":7322,"Ġbow":7323,"Ġhelicopter":7324,"was":7325,"Ġstone":7326,"kins":7327,"Ġunlike":7328,"Ġcollision":7329,"ĠAlt":7330,"HP":7331,"ĠMason":7332,"has":7333,"Ġclimbed":7334,"Ġindication":7335,"Ġhotels":7336,"Ġloud":7337,"ĠMilan":7338,"kes":7339,"Ġbadly":7340,"Ġtrials":7341,"Ġimpacts":7342,"ĠJane":7343,"Ġcrossed":7344,"Ġdiscussing":7345,"ĠSM":7346,"Ġpopularity":7347,"ĠWant":7348,"fall":7349,"Ġartificial":7350,"ĠBu":7351,"akh":7352,"Ġdominant":7353,"gov":7354,"Ġpremier":7355,"Ġexecution":7356,"gate":7357,"Ġswimming":7358,"Ġchat":7359,"Ġdevastating":7360,"acking":7361,"Ġreception":7362,"urt":7363,"Ġtheater":7364,"Ġgather":7365,"Ġtear":7366,"uro":7367,"Ġdemocratic":7368,"Ġrebels":7369,"Ġlifetime":7370,"Ġradical":7371,"uan":7372,"Ġtechniques":7373,"ache":7374,"ior":7375,"Ġcamps":7376,"Ġtelephone":7377,"ĠDublin":7378,"ĠBrand":7379,"ĠMarcus":7380,"aun":7381,"ĠRec":7382,"Ġ82":7383,"ban":7384,"Ġsafely":7385,"aku":7386,"aki":7387,"Ġbankruptcy":7388,"FF":7389,"Ġformat":7390,"Ġattached":7391,"ĠFame":7392,"ĠEdward":7393,"Ġmerger":7394,"ĠRepresentatives":7395,"izes":7396,"Ġhidden":7397,"Ġval":7398,"zz":7399,"Ġexcess":7400,"Ġscope":7401,"Ġdivorce":7402,"Ġburn":7403,"Ġrequirement":7404,"BB":7405,"ĠHand":7406,"Ġcons":7407,"Ġrisen":7408,"Ġtwitter":7409,"Ġoffseason":7410,"ĠSometimes":7411,"ĠInf":7412,"ĠAng":7413,"uer":7414,"report":7415,"Ġdreams":7416,"Ġ700":7417,"ips":7418,"ĠDream":7419,"Ġgifts":7420,"Ġsomehow":7421,"ĠTur":7422,"ĠRachel":7423,"can":7424,"Ġlog":7425,"ĠMedicaid":7426,"Ġles":7427,"Ġtired":7428,"ĠArkansas":7429,"Ġliquidity":7430,"ĠPhillips":7431,"ĠBTC":7432,"Ġhide":7433,"Ġpun":7434,"ĠRun":7435,"lyn":7436,"ĠUC":7437,"ĠDesign":7438,"ĠDev":7439,"Ġvaluation":7440,"Ġreveals":7441,"ĠChild":7442,"other":7443,"Ġposed":7444,"lee":7445,"Ġships":7446,"ĠTrue":7447,"Ġdescribes":7448,"Ġrunner":7449,"bro":7450,"Ġankle":7451,"Ġod":7452,"ĠAnnual":7453,"CL":7454,"Ġoverhaul":7455,"ned":7456,"Ġbold":7457,"Ġmo":7458,"ĠFalls":7459,"Ġemployed":7460,"ĠGro":7461,"Ġflash":7462,"ĠTD":7463,"Ġnervous":7464,"Ġintegration":7465,"Ġsmartphones":7466,"Ġmovements":7467,"nie":7468,"ition":7469,"ĠThird":7470,"Ģ":7471,"Ġmetres":7472,"Ġeconomist":7473,"omp":7474,"Ġteens":7475,"Ġeveryday":7476,"Ġinterviewed":7477,"Ġbriefly":7478,"],":7479,"uke":7480,"ĠFOX":7481,"Ġunderlying":7482,"ĠLuc":7483,"Ġcourses":7484,"ss":7485,"amed":7486,"°":7487,"ju":7488,"ĠBanks":7489,"Ġoutfit":7490,"illing":7491,"Ġtrafficking":7492,"Ġurging":7493,"Ġbelt":7494,"Ġrid":7495,"CP":7496,"Ġelderly":7497,"ĠGrowth":7498,"án":7499,"ĠSn":7500,"Ġsurrounded":7501,"Ġsisters":7502,"ĠIslam":7503,"Ġsynd":7504,"ĠCosta":7505,"di":7506,"ĠKl":7507,"Ġmanufacturer":7508,"holders":7509,"Ġelement":7510,"Ġload":7511,"Ġbooked":7512,"Ġaccompanied":7513,"ĠChamber":7514,"Ġbriefing":7515,"Oh":7516,"imi":7517,"ĠDefence":7518,"ĠCurrently":7519,"aking":7520,"Ġhandled":7521,"ĠCD":7522,"ĠBenjamin":7523,"Ġpocket":7524,"ĠKashmir":7525,"Ġlighting":7526,"aps":7527,"Ġ1997":7528,"ech":7529,"Ġaddiction":7530,"Ġbases":7531,"Ġpriorities":7532,"Ġhardly":7533,"ĠQuebec":7534,"ĠEarn":7535,"IES":7536,"ĠZach":7537,"ĠAlong":7538,"MI":7539,"Ġins":7540,"ĠRogers":7541,"ĠKan":7542,"ĠFuture":7543,"Ġtriggered":7544,"ĠUnit":7545,"Ġweighed":7546,"Ġpointing":7547,"Ġchocolate":7548,"ĠBrowns":7549,"ĠISIS":7550,"Ġgoalkeeper":7551,"Ġsaves":7552,"ĠAndre":7553,"burn":7554,"ĠCont":7555,"ĠNetherlands":7556,"Ġpolitically":7557,"ĠAshley":7558,"ĠWhit":7559,"aded":7560,"PH":7561,"Ġborders":7562,"ORE":7563,"Ġally":7564,"Trump":7565,"istan":7566,"ĠHunt":7567,"ĠCancer":7568,"ĠGrace":7569,"ĠTottenham":7570,"Ġ1960":7571,"ĠMarg":7572,"ĠBryan":7573,"ĠAgain":7574,"acing":7575,"Ġarguments":7576,"ĠSouthwest":7577,"Ġvocal":7578,"Ġjudgment":7579,"Ġengaging":7580,"Ġadopt":7581,"Ġrental":7582,"Ġlinebacker":7583,"ĠKardashian":7584,"Ġepisodes":7585,"..":7586,"Ġunt":7587,"Ġvowed":7588,"Ġ79":7589,"ule":7590,"Ġtransit":7591,"Ġoffshore":7592,"Ġsuppliers":7593,"Ġarguing":7594,"Ġsatellite":7595,"ĠLind":7596,"ĠTaliban":7597,"Buy":7598,"ĠCaribbean":7599,"ĠBarry":7600,"Ġauthors":7601,"ĠWolf":7602,"Ġviewing":7603,"ĠCubs":7604,"From":7605,"Ġ%":7606,"Ġcurrencies":7607,"Why":7608,"ĠBroncos":7609,"Ġtrick":7610,"Ġdiesel":7611,"ĠLiberal":7612,"FL":7613,"Ġtopics":7614,"Ġretain":7615,"ĠLiberty":7616,"Ġacquisitions":7617,"ced":7618,"Ġfre":7619,"Ġfleet":7620,"Ġcopper":7621,"ĠPot":7622,"jen":7623,"ĠElliott":7624,"ĠPyongyang":7625,"Ġobject":7626,"ĠUse":7627,"Ġmutual":7628,"MP":7629,"Ġev":7630,"Ġdeny":7631,"ĠEveryone":7632,"lling":7633,"Ġpays":7634,"Ġdrought":7635,"Ġcorn":7636,"Ġworkplace":7637,"rig":7638,"ĠMn":7639,"Ġadvisory":7640,"ĠCat":7641,"Ġchronic":7642,"ĠSteelers":7643,"Ġboxes":7644,"ĠNap":7645,"Ġdemonstrated":7646,"ĠTournament":7647,"Ġsymbol":7648,"ĠAfghan":7649,"ĠTan":7650,"ired":7651,"ĠEv":7652,"ĠConsumer":7653,"Ġmoral":7654,"ĠAdditional":7655,"Ġwebsites":7656,"Ġoccasions":7657,"Ġfate":7658,"Ġpitcher":7659,"Ġtaxpayers":7660,"Ġdeemed":7661,"ĠLibya":7662,"Ġpriced":7663,"Ġdistributed":7664,"ĠForum":7665,"Ġrice":7666,"Ġbloc":7667,"Ġprovisions":7668,"agh":7669,"Ġpen":7670,"Ġattracted":7671,"ĠEdmonton":7672,"Ġthousand":7673,"Ġpainting":7674,"Ġil":7675,"Ġcourtesy":7676,"Ġeliminate":7677,"Ġacc":7678,"Ġmeters":7679,"Ġreflected":7680,"Ġcomponent":7681,"Every":7682,"Ġsells":7683,"Ġfault":7684,"Ġburned":7685,"ĠKirk":7686,"ĠAnna":7687,"Ġappeals":7688,"Ġeggs":7689,"Ġfrequent":7690,"Ġtrigger":7691,"Ġrevised":7692,"ĠAngela":7693,"Ġ81":7694,"Ġsingles":7695,"Ġviral":7696,"Ġworries":7697,"ĠShould":7698,"profit":7699,"Ġraises":7700,"ĠBryant":7701,"ĠProduct":7702,"Ġtenure":7703,"Ġdiabetes":7704,"Ġcolour":7705,"azz":7706,"ĠGirls":7707,"Ġpractical":7708,"Ġblind":7709,"ancing":7710,"pictured":7711,"Ġfinale":7712,"ĠElection":7713,"Ġathletic":7714,"Ġpromoted":7715,"Ġflowers":7716,"Ġtrains":7717,"ario":7718,"Ġsufficient":7719,"IE":7720,"Ġexamples":7721,"Ġshed":7722,"Ġbirds":7723,"Ġchaos":7724,"Ġwound":7725,"Ġrocket":7726,"Ġwet":7727,"Ġsample":7728,"ĠNag":7729,"ĠOliver":7730,"Ġscrutiny":7731,"ĠSeven":7732,"ĠRoman":7733,"ĠFred":7734,"Ġweird":7735,"ĠTam":7736,"ĠSupport":7737,"ĠNathan":7738,"Ġstudying":7739,"Ġintroduction":7740,"Ġtons":7741,"cer":7742,"aus":7743,"ION":7744,"Ġcritic":7745,"ĠAh":7746,"alo":7747,"pur":7748,"Ġstorms":7749,"ĠMission":7750,"Ġcredits":7751,"Ġgrants":7752,"Ġcomp":7753,"Ġhearts":7754,"part":7755,"Ġpin":7756,"Ġsubsequent":7757,"Ġmad":7758,"ĠSacramento":7759,"woman":7760,"from":7761,"Ġoutcomes":7762,"Ġoldest":7763,"Ġdesperate":7764,"ĠTal":7765,"ĠDJ":7766,"ward":7767,"Ġaudiences":7768,"Ġimportantly":7769,"ĠEmily":7770,"sk":7771,"ĠHeat":7772,"ĠType":7773,"ĠPeace":7774,"Ġsuspicious":7775,"aly":7776,"ĠGET":7777,"ĠCAP":7778,"dis":7779,"ĠIraqi":7780,"ĠReed":7781,"Ġstrange":7782,"ĠParent":7783,"900":7784,"Ġglad":7785,"ĠTroy":7786,"ĠShort":7787,"Ġheritage":7788,"Ġarriving":7789,"ingly":7790,"Ġtransformation":7791,"Ġlease":7792,"Ġcollapsed":7793,"cha":7794,"ĠPatrol":7795,"Ġcomputers":7796,"Ġprinciples":7797,"Ġsporting":7798,"ĠHughes":7799,"mile":7800,"ĠCit":7801,"Ġdrilling":7802,"ĠBox":7803,"ÃŁ":7804,"bre":7805,"ĠOverall":7806,"Ġopioid":7807,"Ġdelighted":7808,"Ġhonored":7809,"ĠCold":7810,"Ġunions":7811,"ĠCou":7812,"ĠCircuit":7813,"Ġblast":7814,"sson":7815,"ĠHernandez":7816,"ĠLooking":7817,"Ġlegally":7818,"ĠWalmart":7819,"bridge":7820,"Ġmat":7821,"rad":7822,"ids":7823,"Ġdining":7824,"Ġrebound":7825,"abad":7826,"ĠRom":7827,"Ġimpose":7828,"ĠAlpha":7829,"ĠWeekly":7830,"TER":7831,"ĠJam":7832,"Ġabsolute":7833,"Ġinventory":7834,"ĠBilly":7835,"ĠKaren":7836,"ĠFriends":7837,"ĠCent":7838,"ĠVikings":7839,"ĠMuch":7840,"cell":7841,"ads":7842,"Ġph":7843,"Ġkiller":7844,"ĠMembers":7845,"Ġshooter":7846,"ĠInvestigators":7847,"ĠJoshua":7848,"Ġparticipated":7849,"Ġinnocent":7850,"ĠRichmond":7851,"itor":7852,"ĠDal":7853,"ĠOperator":7854,"Ġmakeup":7855,"Ġconf":7856,"ĠNEWS":7857,"ĠDef":7858,"Ġchase":7859,"ĠCost":7860,"mont":7861,"\":":7862,"Ġarrangements":7863,"stein":7864,"Ġretire":7865,"ĠLuis":7866,"Ġrenewed":7867,"ĠTownship":7868,"Ġchecked":7869,"arts":7870,"ĠCash":7871,"Ġcentres":7872,"chers":7873,"ĠSolutions":7874,"Ġlegend":7875,"ige":7876,"most":7877,"osed":7878,"ĠPor":7879,"Ġpremiere":7880,"FS":7881,"Ġmissiles":7882,"ĠLang":7883,"Ġsing":7884,"best":7885,"Ġtail":7886,"Ġriders":7887,"Picture":7888,"zen":7889,"ĠKent":7890,"Ġtransform":7891,"Ġwildlife":7892,"Ġsmoking":7893,"Ġpreseason":7894,"ĠLucas":7895,"ĠAnne":7896,"owski":7897,"Ġtape":7898,"Ġdisplayed":7899,"Ġforum":7900,"Ġanonymity":7901,"ĠIndianapolis":7902,"hips":7903,"acc":7904,"ĠMoreover":7905,"lers":7906,"area":7907,"ĠIndeed":7908,"Ġconducting":7909,"Ġinfection":7910,"Ġdealt":7911,"OB":7912,"asing":7913,"ĠGaza":7914,"itter":7915,"ĠKa":7916,"Ġhopeful":7917,"ĠSnow":7918,"Ġentitled":7919,"Ġaffecting":7920,"Ġeager":7921,"Ġcircle":7922,"Ġlaugh":7923,"ĠProsecutors":7924,"ĠDur":7925,"Ġbarriers":7926,"ĠPoll":7927,"oun":7928,"ĠPalm":7929,"chi":7930,"Ġsamples":7931,"Ġcompromise":7932,"atter":7933,"Ġenormous":7934,"Ġé":7935,"coming":7936,"ĠPharmaceutical":7937,"Ġrank":7938,"Let":7939,"Ġtransgender":7940,"ĠCloud":7941,"FO":7942,"ĠBor":7943,"Ġbonus":7944,"Ġordinary":7945,"ĠPres":7946,"ĠHIV":7947,"ires":7948,"OSE":7949,"Ġdancing":7950,"ĠHD":7951,"Ġversions":7952,"Ġ88":7953,"rate":7954,"Ġtackles":7955,"Ġknock":7956,"ĠEmma":7957,"Ġmotivated":7958,"ĠBennett":7959,"ĠBurn":7960,"Ġgrid":7961,"Ġembrace":7962,"ĠSpurs":7963,"Ġflows":7964,"ĠGer":7965,"Ġsponsored":7966,"Ġsurvival":7967,"ching":7968,"Ġ1995":7969,"Ġreward":7970,"Ġdepends":7971,"Ġpostseason":7972,"Ġloaded":7973,"Ġneutral":7974,"ĠPop":7975,"BL":7976,"Ġrevolution":7977,"ĠFreedom":7978,"Ġrecovering":7979,"Ġrequiring":7980,"ALL":7981,"ARE":7982,"Ġmini":7983,"lt":7984,"ĠFDA":7985,"Ġcarpet":7986,"ĠPrior":7987,"Ġadmission":7988,"ĠEver":7989,"ĠTribune":7990,"ĠRonaldo":7991,"Ġthick":7992,"Ġlanes":7993,"Ġ84":7994,"ĠMemphis":7995,"Ġopt":7996,"BO":7997,"Ġfaculty":7998,"ĠChad":7999,"ĠSUV":8000,"ĠHen":8001,"Ġeste":8002,"ĠHu":8003,"ĠAgriculture":8004,"store":8005,"ĠDrug":8006,"inter":8007,"Ġ1996":8008,"ident":8009,"Ġbackup":8010,"ĠHonda":8011,"ĠHope":8012,"oes":8013,"ums":8014,"amer":8015,"Ġbreath":8016,"Ġ110":8017,"Ġjoke":8018,"ĠAld":8019,"Ġwondering":8020,"ĠAssad":8021,"ĠRem":8022,"Ġfundraising":8023,"pot":8024,"è":8025,"Ġquestioning":8026,"Ġpent":8027,"ĠMoney":8028,"ĠMedicine":8029,"wick":8030,"ĠKnights":8031,"Ġbatting":8032,"ĠMos":8033,"Ġdesignated":8034,"isse":8035,"Ġspotlight":8036,"Ġlake":8037,"Ġcaution":8038,"Ġinmates":8039,"Ġlap":8040,"CE":8041,"ĠJavascript":8042,"ĠDeutsche":8043,"ĠFargo":8044,"Ġguaranteed":8045,"borough":8046,"Ġfunctions":8047,"ĠElementary":8048,"ĠChuck":8049,"Ġpitched":8050,"ĠKrist":8051,"Ġsteal":8052,"Ġchips":8053,"Ġalarm":8054,"Ġbeloved":8055,"scale":8056,"Ġassaulted":8057,"ĠPentagon":8058,"Ġtemporarily":8059,"Ġ93":8060,"Ġ>":8061,"ĠPortugal":8062,"ti":8063,"HL":8064,"Ġdecreased":8065,"Ġexistence":8066,"Ġisolated":8067,"Ġdeposit":8068,"Ġstudied":8069,"\")":8070,"Ġtrophy":8071,"ĠBrooks":8072,"Ġbattling":8073,"Ġweaker":8074,"ĠPrivate":8075,"ĠAccess":8076,"Ġvirtually":8077,"Ġshortage":8078,"Ġgaining":8079,"Ġbathroom":8080,"TON":8081,"Ġconcerning":8082,"Ġengineer":8083,"Ġbread":8084,"Ġdemonstrate":8085,"ĠDh":8086,"Ġhorses":8087,"Ġintersection":8088,"Ġcolors":8089,"Ġdelegation":8090,"Ġnotable":8091,"Ġwithdrawal":8092,"ĠDennis":8093,"Ġlocally":8094,"Ġcoastal":8095,"Ġcomply":8096,"ĠMoh":8097,"ĠAlbert":8098,"Ġclosest":8099,"ĠCITY":8100,"Ġ83":8101,"Ġcancelled":8102,"ĠðŁ":8103,"Ġsharply":8104,"RS":8105,"Ġproductivity":8106,"Ġbasket":8107,"SS":8108,"Ġadmit":8109,"ool":8110,"ination":8111,"ĠBB":8112,"Ġsur":8113,"ĠSteel":8114,"ĠTed":8115,"ĠPac":8116,"Ġpatterns":8117,"Ġlisting":8118,"Ġreplacing":8119,"ĠPradesh":8120,"Ġroots":8121,"Ġbroker":8122,"ĠWriting":8123,"Ġsued":8124,"Ġorganised":8125,"ĠThanksgiving":8126,"ĠNOT":8127,"Ġjournalism":8128,"uel":8129,"Ġkilometers":8130,"Ġhunt":8131,"berry":8132,"ĠMother":8133,"Ġlegitimate":8134,"Ġinput":8135,"ĠRel":8136,"ĠGuardian":8137,"Ar":8138,"Ġtransported":8139,"Ġbedroom":8140,"ashing":8141,"Ġbats":8142,"Ġcleaning":8143,"Ġwrapped":8144,"Pacific":8145,"Ġfence":8146,"Ġtestified":8147,"Ġ1994":8148,"Ġinterference":8149,"Ġmatching":8150,"Ġexpression":8151,"eta":8152,"ĠSpencer":8153,"Ġstrategist":8154,"who":8155,"Ġvictories":8156,"Ġ2022":8157,"Ġstakes":8158,"Ġbuses":8159,"ĠHousing":8160,"Ġeditorial":8161,"Ġ86":8162,"ĠBishop":8163,"Ġfrustrated":8164,"Ġappearing":8165,"http":8166,"IGHT":8167,"Ġmemo":8168,"Ġinsiders":8169,"Even":8170,"Ġclassroom":8171,"Ġchef":8172,"aining":8173,"].":8174,"ĠMcD":8175,"Ġ87":8176,"ĠPunjab":8177,"Ġancient":8178,"Ġresolved":8179,"Ġdying":8180,"Ġdestruction":8181,"Ġgoverning":8182,"Ġrestructuring":8183,"ĠPick":8184,"Ġmunicipal":8185,"Ġengines":8186,"ĠHudson":8187,"Æ":8188,"Ġrepeal":8189,"standing":8190,"Ġbound":8191,"ĠOS":8192,"ĠCommonwealth":8193,"Ġdescription":8194,"Ġhouseholds":8195,"Ġmal":8196,"Ġstopping":8197,"equ":8198,"Ġregulator":8199,"Ġcontaining":8200,"Ġremoving":8201,"Ġwithdraw":8202,"Ġburied":8203,"Ġlists":8204,"ĠGil":8205,"Ġlowered":8206,"Ġformally":8207,"ĠRound":8208,"asi":8209,"¥":8210,"lett":8211,"Ġprogressive":8212,"ĠFalcons":8213,"ĠRaw":8214,"gun":8215,"Ġcontributing":8216,"Ġhunting":8217,"Ġvalid":8218,"Ġexception":8219,"ĠPlayers":8220,"ĠTra":8221,"Ġracism":8222,"hing":8223,"chen":8224,"Ġdifferently":8225,"Ġchampionships":8226,"ĠEng":8227,"ĠNO":8228,"ĠAuto":8229,"ĠErdogan":8230,"iding":8231,"Ġwarming":8232,"Ġcivilian":8233,"ĠDam":8234,"Ġfantasy":8235,"ĠNav":8236,"itions":8237,"ĠDrew":8238,"ĠNancy":8239,"Ġtrapped":8240,"ĠRussians":8241,"ĠIC":8242,"Ġflexibility":8243,"ular":8244,"Ġviolated":8245,"ipped":8246,"Ġgarage":8247,"ĠDeep":8248,"Ġpraise":8249,"ĠLab":8250,"ĠPlayer":8251,"Ġjudicial":8252,"Ġdonate":8253,"Ġseparated":8254,"Ġreleases":8255,"nik":8256,"Ġexplanation":8257,"aph":8258,"Ġloyal":8259,"Ġstrongest":8260,"ĠShar":8261,"Ġrescued":8262,"Ġambitious":8263,"Ġclimb":8264,"Ġscared":8265,"Ġignored":8266,"cut":8267,"Ġstole":8268,"Ġweakness":8269,"ĠRidge":8270,"oa":8271,"LA":8272,"Ġdep":8273,"ĠPowell":8274,"Do":8275,"Ġprotein":8276,"Ġreiterated":8277,"ĠCox":8278,"aling":8279,"ĠUnlike":8280,"ĠKane":8281,"ĠMcConnell":8282,"Ġshowcase":8283,"Ġuniform":8284,"ower":8285,"Ġdiscover":8286,"stop":8287,"ipper":8288,"Ġtreatments":8289,"Ġgrocery":8290,"Ġsubscribers":8291,"lock":8292,"ple":8293,"Ġflew":8294,"ania":8295,"Ġstepping":8296,"ĠSoviet":8297,"Ġconsultant":8298,"ags":8299,"ĠLim":8300,"Ġ91":8301,"ĠCode":8302,"ports":8303,"box":8304,"Ġlakh":8305,"Ġreminder":8306,"ym":8307,"ĠTravis":8308,"Ġpure":8309,"now":8310,"ĠVR":8311,"Ġachievement":8312,"ĠEmirates":8313,"ĠThunder":8314,"Ġmerely":8315,"ĠCa":8316,"ĠAverage":8317,"ĠDa":8318,"Ġtopped":8319,"ĠCurry":8320,"Ġchemicals":8321,"Ġamendment":8322,"ĠBorder":8323,"ĠBat":8324,"Ġ130":8325,"Ġprogramming":8326,"Ġtele":8327,"ĠKarl":8328,"Ġaveraged":8329,"ĠSpe":8330,"world":8331,"PG":8332,"Ġfights":8333,"ĠPrincess":8334,"ĠCIA":8335,"ĠAbe":8336,"Ġacted":8337,"only":8338,"Ġinsight":8339,"Ġathlete":8340,"ĠTar":8341,"commerce":8342,"Ġaveraging":8343,"cr":8344,"ĠPalestinians":8345,"Well":8346,"Ġbull":8347,"Ġchoosing":8348,"Ġsurely":8349,"ĠSecret":8350,"Ġteammate":8351,"ĠAmendment":8352,"ĠBirmingham":8353,"Ġexcitement":8354,"strong":8355,"ĠSin":8356,"Ġdamages":8357,"rated":8358,"Ġrankings":8359,"Ġconservation":8360,"home":8361,"erm":8362,"ield":8363,"Ġdisorder":8364,"acher":8365,"Ġnaturally":8366,"atur":8367,"Ġpackages":8368,"Ġapproaches":8369,"icks":8370,"ourn":8371,"Ġodd":8372,"Ġshore":8373,"ĠBeing":8374,"Ġmagic":8375,"Ġtourist":8376,"largest":8377,"Ġwhenever":8378,"Ġlenders":8379,"Ġegg":8380,"ĠChair":8381,"Ġlets":8382,"Ġwarnings":8383,"į":8384,"Ġpol":8385,"Ġdrag":8386,"ĠAmb":8387,"ĠCle":8388,"ĠLouisville":8389,"ĠShaw":8390,"lands":8391,"Ġanthem":8392,"ĠTrail":8393,"Ġaccepting":8394,"anger":8395,"good":8396,"ĠBroad":8397,"ĠLebanon":8398,"ĠMillion":8399,"ĠHenderson":8400,"Ġwh":8401,"Ġdust":8402,"Ġ92":8403,"ĠMend":8404,"Ġchecking":8405,"ĠCow":8406,"sized":8407,"Ġautomatic":8408,"Ġcelebrates":8409,"Ġarena":8410,"Ġfinger":8411,"ĠHarvard":8412,"Ġfrustration":8413,"Ġstrict":8414,"Ġpreserve":8415,"Ġsleeping":8416,"Ġconverted":8417,"Ġinsights":8418,"Ġtra":8419,"Ġjailed":8420,"Ġchamber":8421,"Ġtoxic":8422,"ading":8423,"ĠTriple":8424,"grade":8425,"ĠRest":8426,"ĠHoly":8427,"oper":8428,"Ġdesk":8429,"Ġmatchup":8430,"Ġsteep":8431,"ĠGot":8432,"lay":8433,"ĠCab":8434,"aked":8435,"ĠFoster":8436,"Ġrunners":8437,"ĠNA":8438,"Ġdestroy":8439,"Ġsupportive":8440,"ĠRacing":8441,"Ġtrademark":8442,"Ġjacket":8443,"Ġhorror":8444,"ĠAle":8445,"Ġass":8446,"Ġsch":8447,"abb":8448,"Ġplanes":8449,"Ġimpression":8450,"ĠEarly":8451,"ĠPompe":8452,"Ġking":8453,"Ġsilent":8454,"ĠCuba":8455,"Ġmedication":8456,"ences":8457,"list":8458,"ailing":8459,"WA":8460,"ella":8461,"Ġprop":8462,"Ġhalt":8463,"Ġslowing":8464,"ĠFoods":8465,"Ġanonymous":8466,"kh":8467,"Ġtraveled":8468,"Ġcommunicate":8469,"Ġter":8470,"ĠHockey":8471,"ĠRobin":8472,"Ġswept":8473,"Ġclinic":8474,"ration":8475,"len":8476,"Ġau":8477,"Ġcareers":8478,"ĠSound":8479,"Ġaddresses":8480,"China":8481,"ĠSr":8482,"Ġexhibit":8483,"ĠMotors":8484,"ĠIl":8485,"Ġinstall":8486,"ĠOkay":8487,"Ġ>>":8488,"hood":8489,"stand":8490,"Ġaudit":8491,"Ġcake":8492,"Ġflames":8493,"bel":8494,"ĠMust":8495,"ĠManafort":8496,"Ġcommodity":8497,"night":8498,"ĠRoom":8499,"ĠLanka":8500,"Ġcommander":8501,"ln":8502,"Ġdatabase":8503,"ĠSet":8504,"Ġgraduated":8505,"ĠTarget":8506,"Ġoutbreak":8507,"rou":8508,"ĠPope":8509,"ĠEqu":8510,"Ġpolling":8511,"Ġdig":8512,"Ġbrutal":8513,"ĠBarn":8514,"Ġdefinition":8515,"Ġpit":8516,"Ġpickup":8517,"ĠBitcoin":8518,"ĠReid":8519,"Ġloving":8520,"ĠHerald":8521,"ĠCanadians":8522,"Ġneighbor":8523,"Ġdies":8524,"ione":8525,"ĠRef":8526,"big":8527,"Ġguards":8528,"including":8529,"ente":8530,"Ġpartially":8531,"Image":8532,"Ġbulk":8533,"Ġslot":8534,"ĠNorthwest":8535,"ĠBarclays":8536,"Ġairlines":8537,"iver":8538,"isi":8539,"Ġsubsidiary":8540,"Ġcont":8541,"ĠDaniels":8542,"Ġscript":8543,"Ġunfair":8544,"Ġscreens":8545,"Ġprof":8546,"ĠIrma":8547,"Ġ1992":8548,"Ġmandatory":8549,"ĠSant":8550,"Ġsuspicion":8551,"NES":8552,"ĠLauren":8553,"igen":8554,"Ġprevention":8555,"Ġtension":8556,"ema":8557,"Ġtasks":8558,"Ġshake":8559,"Ġexplosive":8560,"Ġaffects":8561,"Ġmum":8562,"ĠDog":8563,"rer":8564,"Ġopted":8565,"Ġtrio":8566,"Ġlesson":8567,"Ġautomotive":8568,"where":8569,"ĠMontgomery":8570,"Ġcouples":8571,"Ġ89":8572,"AF":8573,"Ġinfo":8574,"ĠForm":8575,"Ġspectrum":8576,"Ġbands":8577,"Ġokay":8578,"Ġstroke":8579,"ĠNetanyahu":8580,"Ġwealthy":8581,"ĠAround":8582,"ĠGlenn":8583,"sec":8584,"there":8585,"ickets":8586,"ĠBudget":8587,"ĠBMW":8588,"Ġflagship":8589,"rier":8590,"Ġpodcast":8591,"Ġpursuing":8592,"Ġpos":8593,"ĠIslands":8594,"ĠUrban":8595,"page":8596,"Ġemotions":8597,"ided":8598,"Ġdividends":8599,"Ġboom":8600,"Ġaccusing":8601,"ird":8602,"ĠNam":8603,"ava":8604,"Ġwishes":8605,"ĠNy":8606,"ĠStanford":8607,"Ġcriteria":8608,"ĠJews":8609,"Ġengineers":8610,"Ġaccuracy":8611,"Ġdisplays":8612,"Ġdeserves":8613,"ridge":8614,"omm":8615,"aur":8616,"Ġdramatically":8617,"Ġunity":8618,"speed":8619,"Ġdeclining":8620,"Ġpermits":8621,"ĠKn":8622,"Ġconsulting":8623,"aux":8624,"ATE":8625,"ĠWat":8626,"ĠEditor":8627,"sy":8628,"urn":8629,"ĠUsing":8630,"asc":8631,"ital":8632,"Ġcre":8633,"quality":8634,"Ġce":8635,"Ġenemy":8636,"Ġoffence":8637,"icket":8638,"ĠDick":8639,"ĠTH":8640,"ĠChampionships":8641,"Ġoverwhelming":8642,"rib":8643,"ku":8644,"rap":8645,"Ġhomer":8646,"acion":8647,"member":8648,"erv":8649,"aney":8650,"MB":8651,"eded":8652,"Ġpunishment":8653,"Ġnegotiate":8654,"ĠFile":8655,"stream":8656,"ĠHur":8657,"Ġnose":8658,"ĠFab":8659,"iter":8660,"Ġpainful":8661,"ITY":8662,"eren":8663,"Ġcollecting":8664,"Additional":8665,"Ġentrepreneurs":8666,"bal":8667,"Ġexploring":8668,"Ġguitar":8669,"Ġpartnerships":8670,"Ġfurniture":8671,"Ġauthorized":8672,"Ġeasing":8673,"shirt":8674,"ĠGross":8675,"Ġpolitician":8676,"ĠSimpson":8677,"Ġdrone":8678,"ĠKatie":8679,"Ġprofitability":8680,"ĠNHS":8681,"ĠSierra":8682,"ĠNorway":8683,"ASHINGTON":8684,"ific":8685,"Ġcondemned":8686,"team":8687,"ĠNebraska":8688,"Ġthrilled":8689,"iller":8690,"Ġpatrol":8691,"ĠWR":8692,"orm":8693,"Ġspectacular":8694,"ĠKnight":8695,"ĠTravel":8696,"nam":8697,"Ġmuscle":8698,"ĠRain":8699,"ĠColombia":8700,"Ġnursing":8701,"Ġmigration":8702,"ĠMitch":8703,"Ġreleasing":8704,"ĠBesides":8705,"ĠMul":8706,"Ġheadline":8707,"Ġcontemporary":8708,"Ġdev":8709,"ĠChan":8710,"Ġindicates":8711,"ĠAp":8712,"ĠLt":8713,"ĠMarvel":8714,"Ġremembered":8715,"®":8716,"ĠForces":8717,"ĠColin":8718,"ĠGabriel":8719,"Ġobjects":8720,"ĠRHP":8721,"kar":8722,"ĠKo":8723,"Ġsignals":8724,"Ġinner":8725,"real":8726,"RO":8727,"Ġromantic":8728,"cat":8729,"ĠKel":8730,"Ġgut":8731,"ĠBoys":8732,"Ġyoungest":8733,"ĠCeltics":8734,"Ġslated":8735,"Ġremind":8736,"Ġproductive":8737,"set":8738,"Co":8739,"ĠBailey":8740,"Ġrenewable":8741,"ĠCarson":8742,"ĠDj":8743,"ĠKos":8744,"Ġurge":8745,"Ġfin":8746,"Ġpursuit":8747,"ĠCON":8748,"ĠChapter":8749,"Ġpal":8750,"Ġgate":8751,"ĠPackers":8752,"ĠReports":8753,"ĠRugby":8754,"ĠMasters":8755,"MO":8756,"Ġ98":8757,"Ġcatches":8758,"ĠAgreement":8759,"ĠTillerson":8760,"ĠIce":8761,"Ġrumors":8762,"ĠLeonard":8763,"ĠDolphins":8764,"ĠLP":8765,"top":8766,"ĠCrist":8767,"ĠHon":8768,"Ġblaze":8769,"Ġrhetoric":8770,"ands":8771,"ady":8772,"David":8773,"igh":8774,"Ġbuzz":8775,"ĠStrong":8776,"Ġshocking":8777,"ĠRh":8778,"Ġnegotiating":8779,"Ġtender":8780,"ĠJohnny":8781,"ĠMario":8782,"Ġ97":8783,"ĠHeritage":8784,"Ġexists":8785,"Ġprayers":8786,"Ġlengthy":8787,"Ġsafer":8788,"ĠHalloween":8789,"ĠJared":8790,"ĠConnect":8791,"Ġbump":8792,"Ġstrain":8793,"Ġfilling":8794,"Ġtrauma":8795,"Ġcompleting":8796,"cht":8797,"Ġkillings":8798,"anne":8799,"GE":8800,"ĠRescue":8801,"Ġdealers":8802,"Ġlocals":8803,"ĠVictor":8804,"Ġtragic":8805,"Ġdelivers":8806,"orts":8807,"Ġrugby":8808,"Ġinstallation":8809,"asa":8810,"ĠBart":8811,"Ġjournal":8812,"school":8813,"ĠCome":8814,"ĠVeterans":8815,"Sun":8816,"Ġcrowds":8817,"Ġtransparent":8818,"Ġimplications":8819,"ĠHuawei":8820,"sex":8821,"Ġrallied":8822,"Ġresponses":8823,"Ġdebris":8824,"Ġconvention":8825,"Ġmothers":8826,"BE":8827,"ĠRoute":8828,"Ġrebel":8829,"ĠEmmanuel":8830,"aster":8831,"Ġunderstands":8832,"pound":8833,"ĠCastle":8834,"Ġ2021":8835,"rik":8836,"ĠGR":8837,"Ġconvince":8838,"ault":8839,"Ġpassionate":8840,"ĠSciences":8841,"Ġarrives":8842,"idad":8843,"Ġcelebrities":8844,"ends":8845,"ĠFans":8846,"Ġdish":8847,"ĠCorps":8848,"hat":8849,"Ġemployer":8850,"ĠHy":8851,"Ġpowered":8852,"Ġgrandmother":8853,"ĠFL":8854,"oured":8855,"VE":8856,"ĠInst":8857,"ĠPerez":8858,"Ġtune":8859,"Ġcitizenship":8860,"Ġignore":8861,"Ġdoubles":8862,"IB":8863,"Ġprogrammes":8864,"inda":8865,"Ġentities":8866,"ĠInterior":8867,"Ġprompting":8868,"Ġwire":8869,"Ġtheatre":8870,"%)":8871,"Ġheels":8872,"ĠJu":8873,"Ġdeposits":8874,"Ġtrash":8875,"mond":8876,"she":8877,"iana":8878,"Ġislands":8879,"ĠTommy":8880,"Ġpub":8881,"Ġdiscipline":8882,"ĠSW":8883,"Ġmusicians":8884,"Ġembassy":8885,"ĠQB":8886,"hander":8887,"UES":8888,"ĠFerguson":8889,"Ġblocking":8890,"ahn":8891,"Ġfines":8892,"Ġtactics":8893,"Ġbullet":8894,"Ġequipped":8895,"Ġescaped":8896,"ĠSil":8897,"ĠPack":8898,"ĠAthletic":8899,"ĠMic":8900,"ĠDoes":8901,"ĠCarr":8902,"ĠChargers":8903,"ĠKyl":8904,"Ġzones":8905,"µ":8906,"iki":8907,"Ġgreatly":8908,"ĠMD":8909,"Ġimmigrant":8910,"ĠConstruction":8911,"ĠBorn":8912,"iment":8913,"ĠWade":8914,"Ġvisa":8915,"Ġgenuine":8916,"Ġelectronics":8917,"ĠSat":8918,"Ġsponsors":8919,"ĠMontana":8920,"Ġspell":8921,"ĠSachs":8922,"ĠEt":8923,"Ġfoster":8924,"Ġlocker":8925,"Ġexplaining":8926,"ĠAge":8927,"Ġgunman":8928,"Ġsauce":8929,"Ġcry":8930,"Ġstimulus":8931,"Ġarray":8932,"Ġcompare":8933,"Ġboats":8934,"Ġext":8935,"iders":8936,"ĠAst":8937,"ĠParks":8938,"ester":8939,"Ġ94":8940,"Ġrelating":8941,"Ġvegetables":8942,"Ġaccountable":8943,"Ġhyper":8944,"ĠWim":8945,"Ġnewest":8946,"ĠRome":8947,"ĠChancellor":8948,"CBS":8949,"Ġbusinessman":8950,"ĠDelaware":8951,"Ġlands":8952,"court":8953,"aria":8954,"Ġapproaching":8955,"cker":8956,"ĠSalt":8957,"ĠMak":8958,"Ġtreating":8959,"Ġsubsequently":8960,"ĠEll":8961,"xton":8962,"Ġ180":8963,"Ġdetermination":8964,"ĠSalman":8965,"ĠJoel":8966,"Ġclassified":8967,"Ġspan":8968,"Ġearthquake":8969,"ranked":8970,"Ġ96":8971,"ĠTiger":8972,"Ġadvocacy":8973,"mit":8974,"Ġcolleges":8975,"ĠYeah":8976,"ĠCaptain":8977,"Ġorange":8978,"Ġprojections":8979,"Ġelectrical":8980,"ĠMA":8981,"olog":8982,"ĠNewcastle":8983,"oppers":8984,"Ġrepresentation":8985,"Ġlawsuits":8986,"just":8987,"aced":8988,"ĠRace":8989,"ĠAqu":8990,"ĠBills":8991,"Ġexclusively":8992,"ĠProfile":8993,"Ġhometown":8994,"ĠStan":8995,"Ġstarring":8996,"Ġdeciding":8997,"ĠRating":8998,"ĠMedicare":8999,"ĠTransport":9000,"Ġmystery":9001,"ĠTa":9002,"ĠPad":9003,"ĠSwedish":9004,"ĠCarroll":9005,"about":9006,"Ġtorn":9007,"Ġnurse":9008,"NE":9009,"Ġwaited":9010,"ĠJeffrey":9011,"ĠUntil":9012,"Ġbone":9013,"ĠBobby":9014,"Ġpronounced":9015,"Ġpharmaceutical":9016,"ĠGallery":9017,"ĠMatch":9018,"Ġeconomists":9019,"ĠMarketing":9020,"face":9021,"ĠPetroleum":9022,"ories":9023,"ĠMets":9024,"ĠCore":9025,"billion":9026,"Ġexamination":9027,"ĠPorter":9028,"2016":9029,"Ġgolden":9030,"Ġsem":9031,"ĠDuterte":9032,"ĠJefferson":9033,"ĠTehran":9034,"ĠLeicester":9035,"ĠDA":9036,"Ġadapt":9037,"ĠDame":9038,"ĠRic":9039,"Ġunchanged":9040,"ect":9041,"Ġsections":9042,"kg":9043,"igned":9044,"Ġfilings":9045,"Ġreact":9046,"Ġurgent":9047,"Ġvessels":9048,"Ġspark":9049,"Ġbutter":9050,"ĠCons":9051,"Ġstating":9052,"Ġcorporations":9053,"ĠHus":9054,"Ġdamaging":9055,"raw":9056,"Ġequality":9057,"Two":9058,"ĠMills":9059,"iu":9060,"Ġobligation":9061,"ĠBrook":9062,"arian":9063,"Re":9064,"Ġphotographs":9065,"Ġepic":9066,"ĠStudent":9067,"ĠTherefore":9068,"Ġgod":9069,"ĠFILE":9070,"iqu":9071,"Ġdescribing":9072,"Ġproceed":9073,"Ġcas":9074,"ĠKat":9075,"ĠBra":9076,"Ġadequate":9077,"Ġpassage":9078,"Ġthanked":9079,"USA":9080,"ĠNeither":9081,"ĠLegislature":9082,"Ġfinances":9083,"Ġinst":9084,"ĵ":9085,"ĠAngels":9086,"Ġvet":9087,"ĠDead":9088,"Ex":9089,"Ġkicks":9090,"force":9091,"Ġsoy":9092,"ĠWindsor":9093,"Ġenhanced":9094,"Ġ1993":9095,"ĠCzech":9096,"Ġgradually":9097,"ĠMagic":9098,"Ġshadow":9099,"Ġneighborhoods":9100,"ĠRivers":9101,"Ġrapper":9102,"ĠGirl":9103,"ĠRot":9104,"Ġcrackdown":9105,"fish":9106,"Ġpreventing":9107,"Ġproduces":9108,"ĠMi":9109,"Ġnotified":9110,"Ġunderground":9111,"WE":9112,"Ġadmits":9113,"Ġboxing":9114,"Ġrefer":9115,"Ġcommitments":9116,"ĠWoman":9117,"Ġdenies":9118,"col":9119,"ĠSide":9120,"Ġambulance":9121,"ĠRodgers":9122,"Ġaftermath":9123,"Ġdeck":9124,"irmed":9125,"Ġerrors":9126,"ĠConvention":9127,"Ġcurb":9128,"ĠShop":9129,"ĠThai":9130,"Ġma":9131,"Ġrespected":9132,"ĠMVP":9133,"Ġborrowing":9134,"Ġcruise":9135,"ĠSure":9136,"Ġsentencing":9137,"ĠObamacare":9138,"ĠIr":9139,"ĠSale":9140,"ĠPete":9141,"Ġopenly":9142,"Ġstartup":9143,"rock":9144,"Ġcargo":9145,"Ġtelecom":9146,"ĠDownload":9147,"Ġextending":9148,"ĠCurrent":9149,"Ġcompetitions":9150,"ĠKids":9151,"Ġshy":9152,"ĠKerry":9153,"ĠNever":9154,"ĠDevils":9155,"Ġprim":9156,"Con":9157,"Ġcurve":9158,"Ġassumed":9159,"Ġadjust":9160,"Ġimmune":9161,"UE":9162,"ĠUr":9163,"Ġconventional":9164,"Ġgrandchildren":9165,"ĠBol":9166,"Ad":9167,"ĠMaduro":9168,"fi":9169,"ĠUAE":9170,"ĠOrgan":9171,"Ġindicating":9172,"iem":9173,"ĠAgainst":9174,"ĠAmbassador":9175,"ĠSeoul":9176,"Ġcriminals":9177,"how":9178,"put":9179,"Ġreminded":9180,"Ġparked":9181,"lich":9182,"Ġcontinent":9183,"Ġmatched":9184,"ĠNicole":9185,"Ġgenetic":9186,"Ġhumanity":9187,"ĠTem":9188,"Ġindicator":9189,"Ġvessel":9190,"Ġdefendant":9191,"ĠGriffin":9192,"jan":9193,"Ġvend":9194,"boro":9195,"Ġbrokerage":9196,"ĠFall":9197,"Ġmere":9198,"VILLE":9199,"Ġlasted":9200,"ĠMind":9201,"Ġpatch":9202,"ĠInsider":9203,"ĠComm":9204,"Ġtechnique":9205,"ĠIM":9206,"ĠCavaliers":9207,"Ġshame":9208,"Ġmil":9209,"oot":9210,"irt":9211,"Ġcop":9212,"ĠLeon":9213,"Ġfrozen":9214,"Ġslip":9215,"pton":9216,"Ġpanels":9217,"Ġpitching":9218,"Ġleather":9219,"ĠLogan":9220,"ĠNearly":9221,"urch":9222,"Ġinstructions":9223,"ĠRow":9224,"ĠKurdish":9225,"this":9226,"Ġlegendary":9227,"su":9228,"Ġstabbed":9229,"sters":9230,"Ġteenage":9231,"def":9232,"Ġoversight":9233,"Ġvolatile":9234,"Ġtransmission":9235,"ĠSgt":9236,"ĠIndigenous":9237,"ĠOxford":9238,"ĠCasey":9239,"Ġcor":9240,"Ġsalaries":9241,"Ġsponsor":9242,"Ġprescription":9243,"mat":9244,"ĠLeeds":9245,"ĠPakistani":9246,"Ġevil":9247,"Ġtables":9248,"ĠAbdul":9249,"Ġexpectation":9250,"Ġlegislature":9251,"ĠLin":9252,"¹":9253,"Ġcontractor":9254,"Ġshifting":9255,"Ġgenerous":9256,"ĠEddie":9257,"Ġpuck":9258,"utt":9259,"Ġdubbed":9260,"Ġnowhere":9261,"Ġbetting":9262,"Ġdisclose":9263,"Ĥ":9264,"ĠFashion":9265,"ĠHarper":9266,"handed":9267,"isha":9268,"ĠReds":9269,"Ġachievements":9270,"ume":9271,"Ġshootings":9272,"Ġadvisers":9273,"ĠEaster":9274,"Ġinternationally":9275,"ĠWi":9276,"ĠGandhi":9277,"ĠChristians":9278,"Ġrecruiting":9279,"Ġexperiment":9280,"Ġsol":9281,"Ġdifficulties":9282,"Ġinfluential":9283,"Ġhybrid":9284,"Ġformation":9285,"ĠBoulevard":9286,"Ġflags":9287,"Ġformula":9288,"front":9289,"Ġinclusion":9290,"ĠNone":9291,"ICE":9292,"Ġfilming":9293,"ĠLou":9294,"ĠReynolds":9295,"Ġpump":9296,"Ġexceptional":9297,"ANG":9298,"ĠCorporate":9299,"SAN":9300,"ĠHealthcare":9301,"ĠUkrainian":9302,"aron":9303,"Ġpants":9304,"Ġdrops":9305,"ete":9306,"ĠStudies":9307,"Ġwounds":9308,"END":9309,"Ġshower":9310,"Ġreviewing":9311,"ĠGreater":9312,"Ġ»":9313,"itors":9314,"alled":9315,"Ġsqu":9316,"ĠRonald":9317,"ĠInv":9318,"Ġtougher":9319,"Ġbalanced":9320,"Ġlined":9321,"Ġprinciple":9322,"Ġ1950":9323,"Ġleak":9324,"Be":9325,"Ġcircuit":9326,"Ġunfortunate":9327,"ĠGran":9328,"ĠFish":9329,"Ġfriendship":9330,"asp":9331,"OO":9332,"Ġobligations":9333,"Ġcoup":9334,"OK":9335,"Ġbreakdown":9336,"Ġhook":9337,"Ġresearcher":9338,"inated":9339,"ĠMarie":9340,"ĠGab":9341,"ĠWA":9342,"quez":9343,"General":9344,"ĠSwift":9345,"Ġgust":9346,"ĠCarol":9347,"ĠCentury":9348,"ĠOPEC":9349,"ĠRd":9350,"ĠCop":9351,"Ġsubjects":9352,"ĠComments":9353,"ases":9354,"Ġrelation":9355,"ĠEnvironment":9356,"ı":9357,"Ġgasoline":9358,"ĠLog":9359,"Ġicon":9360,"Ġprofitable":9361,"ĠRetail":9362,"ANC":9363,"Ġappealing":9364,"Ġvillages":9365,"Ġpizza":9366,"Ġmall":9367,"Ġtower":9368,"ĠLinda":9369,"Ġaccomplished":9370,"Ġpod":9371,"Ġleaked":9372,"ĠWed":9373,"Ġmer":9374,"Ġopposing":9375,"!'":9376,"Ġstomach":9377,"Ġrevealing":9378,"Ġho":9379,"DF":9380,"ĠSterling":9381,"Ġsolely":9382,"Ġpres":9383,"ĠCy":9384,"ĠLatest":9385,"ĠPitt":9386,"ĠThink":9387,"Ġcapability":9388,"aled":9389,"Ġexecuted":9390,"alling":9391,"ĠSilva":9392,"Ġrestricted":9393,"Ġdeclaration":9394,"Ġkilometres":9395,"rol":9396,"Ġidentifying":9397,"Ġdonors":9398,"vent":9399,"Ġcostly":9400,"ense":9401,"ĠSeeking":9402,"OURCE":9403,"iving":9404,"Ġplacing":9405,"tech":9406,"Ġbottles":9407,"writer":9408,"ĠSeahawks":9409,"oming":9410,"ĠArthur":9411,"ously":9412,"bin":9413,"ĠVa":9414,"Ġbias":9415,"Ġliability":9416,"ift":9417,"rak":9418,"aves":9419,"Ġcautious":9420,"ĠPrize":9421,"iley":9422,"ĠSharma":9423,"global":9424,"Ġwars":9425,"sm":9426,"ĠRemember":9427,"wind":9428,"ĠRichardson":9429,"ĠSum":9430,"ĠVincent":9431,"ĠRice":9432,"inf":9433,"Ġconsultation":9434,"range":9435,"Ġbacteria":9436,"Ġarchitecture":9437,"Ġpole":9438,"ĠMach":9439,"Ġcattle":9440,"Ġabused":9441,"being":9442,"ĠHERE":9443,"Ġfame":9444,"Ġhearings":9445,"ĠBrit":9446,"Ġjoins":9447,"ĠMcGregor":9448,"Ġoppose":9449,"Ġcheer":9450,"itting":9451,"imes":9452,"Ġusage":9453,"Ġstint":9454,"Ġoutlet":9455,"Ġshoppers":9456,"ĠBaptist":9457,"Ġinappropriate":9458,"ĠALSO":9459,"Ġstealing":9460,"Ġpledge":9461,"ĠRan":9462,"Ġphotographer":9463,"Ġprevented":9464,"Ġ01":9465,"ĠEngineering":9466,"ĠProducts":9467,"Ġuniverse":9468,"ĠMcCarthy":9469,"¿":9470,"graded":9471,"Ġinspection":9472,"Ġind":9473,"Fi":9474,"aren":9475,"Ġprotections":9476,"Ġsorts":9477,"ĠWorks":9478,"Ġbillionaire":9479,"ĠGay":9480,"ĠiPad":9481,"IX":9482,"Ġdefendants":9483,"band":9484,"Ġfarms":9485,"Ġhom":9486,"gal":9487,"iant":9488,"Ġnortheast":9489,"ĠJoint":9490,"Ġcanceled":9491,"Ġtoys":9492,"Ġrein":9493,"ĠTumblr":9494,"pees":9495,"ĠAut":9496,"Police":9497,"Ġaide":9498,"Ġachieving":9499,"Ġmund":9500,"ĠCommercial":9501,"first":9502,"Ġanticipate":9503,"iac":9504,"Ġprobation":9505,"hem":9506,"Ġports":9507,"ĠKer":9508,"Ġsupplier":9509,"ĠFather":9510,"ĠAnti":9511,"ashed":9512,"ĠTable":9513,"bledon":9514,"Ġunf":9515,"ĠRash":9516,"ĠLeBron":9517,"Car":9518,"bu":9519,"ĠDerek":9520,"Ġaccounted":9521,"ĠPri":9522,"nings":9523,"Ġreceives":9524,"lev":9525,"Ġbilateral":9526,"ĠList":9527,"ĠLG":9528,"ĠJazz":9529,"Ġrestored":9530,"Ġbattles":9531,"ials":9532,"Ġoccupied":9533,"Ġrepairs":9534,"Ġradar":9535,"ĠMLB":9536,"ĠNC":9537,"Ġflexible":9538,"ĠCommand":9539,"Ġcoat":9540,"ĠVir":9541,"ĠColts":9542,"ĠBC":9543,"Ġtwin":9544,"Ġprisoners":9545,"Ġslowed":9546,"hop":9547,"ĠInn":9548,"Ġconflicts":9549,"Ġmeasured":9550,"Ġautonomous":9551,"ĠBow":9552,"Ġdisc":9553,"inson":9554,"ĠSche":9555,"aire":9556,"ĠSU":9557,"ĠPeterson":9558,"Ġdrafted":9559,"ĠPelosi":9560,"ĠSoon":9561,"Ġmechanism":9562,"Ġaccountability":9563,"ĠNortheast":9564,"Ġfo":9565,"Ġanalytics":9566,"ĠEverything":9567,"Ġperceived":9568,"bers":9569,"Ġcelebrations":9570,"Ġinstruments":9571,"Ġstrip":9572,"ĠJuventus":9573,"Ġunfortunately":9574,"ĠGA":9575,"Ġwrestling":9576,"Ġstatue":9577,"vis":9578,"five":9579,"Ġmarine":9580,"ĠSamuel":9581,"Ġresponsibilities":9582,"hill":9583,"Ġrecruit":9584,"Ġreferee":9585,"ĠRail":9586,"ĠEagle":9587,"ĠCongressional":9588,"Ġbreathing":9589,"Ġbass":9590,"hit":9591,"Ġspreading":9592,"Ġevacuated":9593,"Ġintellectual":9594,"Ġsovereign":9595,"ocked":9596,"Ġslammed":9597,"Ġformerly":9598,"Ġarch":9599,"Ġdifficulty":9600,"ĠAFC":9601,"ĠFresh":9602,"Ġinvite":9603,"oner":9604,"ĠMich":9605,"Ġpitches":9606,"stock":9607,"Ġinitiated":9608,"ĠKu":9609,"ĠFlorence":9610,"yd":9611,"ĠFast":9612,"Ġmusician":9613,"ĠChile":9614,"anga":9615,"Ġdairy":9616,"Ġcontractors":9617,"ador":9618,"ĠPlanning":9619,"Ġultra":9620,"Ġprayer":9621,"Ġsuggestions":9622,"ĠEk":9623,"Ġrandom":9624,"ĠSullivan":9625,"Ġsensor":9626,"Ġhomicide":9627,"ĠIncome":9628,"Ġsettings":9629,"Ġacknowledge":9630,"ĠStay":9631,"Ġterminal":9632,"Ġ1991":9633,"West":9634,"hard":9635,"arc":9636,"Ġcombine":9637,"Ġprivately":9638,"Ġbarrier":9639,"Ġmedian":9640,"Ġwhereas":9641,"ĠTitans":9642,"Ġincentives":9643,"Ġhistorically":9644,"Ġindictment":9645,"Ġhiding":9646,"ĠPDT":9647,"Ġrebuild":9648,"hol":9649,"Ġpour":9650,"Ġairports":9651,"ĠEdinburgh":9652,"Ġappoint":9653,"ĠJul":9654,"Ġconfusion":9655,"Ġdam":9656,"ork":9657,"Ġcalculated":9658,"Ġhood":9659,"ĠTemple":9660,"ĠYorkshire":9661,"EP":9662,"ented":9663,"Ġapology":9664,"awi":9665,"Ġfacilitate":9666,"ĠSheffield":9667,"Ġrides":9668,"Ġcompelling":9669,"ĠGonzalez":9670,"roll":9671,"ONG":9672,"UP":9673,"ĠAj":9674,"pen":9675,"ĠVar":9676,"ĠIPO":9677,"ĠAnimal":9678,"Ġshifted":9679,"Ġ140":9680,"Ġtobacco":9681,"El":9682,"ild":9683,"Ġuncertain":9684,"Un":9685,"Ġcaps":9686,"Ġrecreational":9687,"ĠTu":9688,"Ġenc":9689,"More":9690,"iko":9691,"ĠEverton":9692,"ĠWalk":9693,"Ġmurdered":9694,"Ġpur":9695,"Ġdivisions":9696,"ivo":9697,"Ġfarming":9698,"Ġcourage":9699,"ped":9700,"Ġcrying":9701,"Ġattributed":9702,"ée":9703,"Ġimplementing":9704,"ĠWang":9705,"Ġspeeds":9706,"alk":9707,"aming":9708,"eries":9709,"Ġavoided":9710,"ĠMessi":9711,"Ġconsiderable":9712,"rt":9713,"Ġinauguration":9714,"ĠPH":9715,"Ġsoldier":9716,"Ġore":9717,"ollywood":9718,"otive":9719,"ĠAuburn":9720,"ĠSav":9721,"ĠPut":9722,"Ġemphasis":9723,"Ġaf":9724,"owed":9725,"Ġdiagnosis":9726,"Ġcart":9727,"Ġassisted":9728,"ĠOrder":9729,"ĠEstate":9730,"Ġintends":9731,"ĠCommon":9732,"Ġadventure":9733,"Ġbeliefs":9734,"Ġlasting":9735,"cel":9736,"Ġdeployment":9737,"tra":9738,"ĠStories":9739,"Ġquote":9740,"Ġfeared":9741,"Ġconvenience":9742,"Ġoptimism":9743,"Ġscientist":9744,"ĠEnterprise":9745,"ĠRex":9746,"ĠFel":9747,"Ġposes":9748,"Ġroot":9749,"Ġevacuation":9750,"Ġpresidents":9751,"ĠRather":9752,"Ġgrave":9753,"ĠHeights":9754,"Ġjumping":9755,"driven":9756,"Ġaluminum":9757,"Ġholders":9758,"Ġboot":9759,"iber":9760,"Ġprecious":9761,"uation":9762,"FP":9763,"uses":9764,"Ġcommentary":9765,"Ġadvances":9766,"ĠNissan":9767,"Ġbronze":9768,"Ġinspire":9769,"Ġstarters":9770,"ĠEvan":9771,"rah":9772,"body":9773,"Ġcrops":9774,"Ġseeds":9775,"Ġharsh":9776,"ĠHomeland":9777,"Ġenabled":9778,"ological":9779,"Ġworkshop":9780,"Ġchains":9781,"amps":9782,"Ġamongst":9783,"ĠBear":9784,"Ġcertified":9785,"ĠJulie":9786,"Ġmountains":9787,"VA":9788,"Ġfed":9789,"Ġbuyer":9790,"ahl":9791,"ĠBos":9792,"ĠCrystal":9793,"Ġquest":9794,"ĠStein":9795,"Ġacceptable":9796,"Ġunbeaten":9797,"iring":9798,"ural":9799,"Ġuncomfortable":9800,"Ġpartial":9801,"Ġsacrifice":9802,"ĠGrande":9803,"Ġarrangement":9804,"Ġpackaging":9805,"screen":9806,"Ġmirror":9807,"Ġsweep":9808,"Ġconnecting":9809,"Ġpanic":9810,"ĠJacksonville":9811,"ĠKremlin":9812,"Ġorigin":9813,"Brien":9814,"Ġnorthwest":9815,"Ġcarriers":9816,"ĠRiley":9817,"Ġaud":9818,"Ġappreciation":9819,"Ġeliminated":9820,"ĠAnalyst":9821,"CR":9822,"Ġfirearm":9823,"Ġaccommodate":9824,"Ġstructural":9825,"Ġappealed":9826,"Ġcharter":9827,"ressing":9828,"Ġalike":9829,"white":9830,"Ġslowdown":9831,"Ġweigh":9832,"ĠPalmer":9833,"ound":9834,"ĠConn":9835,"Ġbranches":9836,"Ġace":9837,"Ġinsists":9838,"yo":9839,"ĠLynn":9840,"ĠCC":9841,"ĠWithin":9842,"Ġcoll":9843,"Ġsustain":9844,"Ġemerge":9845,"ĠBattle":9846,"VER":9847,"Ġaviation":9848,"Ġenables":9849,"ĠProduction":9850,"ĠGrove":9851,"Ġnationally":9852,"ĠBaldwin":9853,"rent":9854,"Ġfirearms":9855,"irm":9856,"Ġconsiders":9857,"ĠCosby":9858,"ĠMcK":9859,"ĠEnt":9860,"Ġincumbent":9861,"iance":9862,"Ġgiants":9863,"Ġkan":9864,"Ġminimal":9865,"ivity":9866,"ĠSay":9867,"ĠNass":9868,"Ġlovely":9869,"ĠFurthermore":9870,"Ġdisplaced":9871,"Ġcontacts":9872,"NY":9873,"Ġtechnological":9874,"ancy":9875,"Ġant":9876,"ope":9877,"ĠFY":9878,"Ġfavorable":9879,"ĠVirgin":9880,"Ġcasual":9881,"ĠLat":9882,"Ġpopulations":9883,"Ġromance":9884,"Ġforgotten":9885,"Ġfleeing":9886,"Ġspecialty":9887,"Ġdrill":9888,"Ġapplying":9889,"Ġcocaine":9890,"rea":9891,"Ġheroin":9892,"Ġsweeping":9893,"ĠMaj":9894,"Ġtroubled":9895,"Ġcolleague":9896,"Ġedged":9897,"omes":9898,"ĠHappy":9899,"´":9900,"Ġmilitant":9901,"boy":9902,"aver":9903,"Yes":9904,"llo":9905,"Ġsupporter":9906,"ĠSubscribe":9907,"ĠBird":9908,"ĠGibson":9909,"Ġhill":9910,"Ġnewspapers":9911,"ĠPHOTO":9912,"Ġouting":9913,"Ġdefine":9914,"Ġann":9915,"Ġrobot":9916,"Ġregret":9917,"ĠCould":9918,"raz":9919,"Ġceiling":9920,"Ġorganizers":9921,"ĠTw":9922,"Ġcriticised":9923,"ĠJoh":9924,"ĠJe":9925,"ĠBulls":9926,"Ġteeth":9927,"ĠRanch":9928,"ĠAndrea":9929,"Ġconservatives":9930,"Ġmag":9931,"vey":9932,"Ġpredecessor":9933,"ĠJPMorgan":9934,"Ġdraws":9935,"umber":9936,"Ġvaccine":9937,"ĠDas":9938,"Ġdisappeared":9939,"ĠIron":9940,"Ġlitigation":9941,"vert":9942,"Ġbelong":9943,"ĠRet":9944,"owers":9945,"rain":9946,"controlled":9947,"ĠKil":9948,"Ġrehab":9949,"ĠAustria":9950,"Ġprivilege":9951,"Ġbounce":9952,"Ġbout":9953,"ĠIslamist":9954,"Ġtaxi":9955,"ody":9956,".'\"":9957,"Ġdos":9958,"shire":9959,"Ġaccidents":9960,"Ġdemonstration":9961,"His":9962,"ĠBO":9963,"ĠICE":9964,"van":9965,"File":9966,"ĠManning":9967,"ounded":9968,"Ġdirections":9969,"lled":9970,"Ġoffences":9971,"Ġlaptop":9972,"ĠUniversal":9973,"Ġmilestone":9974,"ĠNarendra":9975,"Ġnotion":9976,"Ġuns":9977,"ĠLower":9978,"Ġmidfield":9979,"Ġoutper":9980,"trans":9981,"ĠJa":9982,"three":9983,"Adds":9984,"Ġpressures":9985,"Ġprohibited":9986,"Ġutilities":9987,"Ġbes":9988,"ĠReporter":9989,"Ġcommodities":9990,"leton":9991,"Ġslower":9992,"EE":9993,"auer":9994,"Ġtablet":9995,"sl":9996,"iously":9997,"Ġaiming":9998,"eland":9999,"ĠNEXT":10000,"tered":10001,"IVE":10002,"onic":10003,"May":10004,"ĠMilitary":10005,"Mark":10006,"Ġlender":10007,"mate":10008,"Ġaboard":10009,"they":10010,"Ġrespondents":10011,"Ġconversion":10012,"Ġsecuring":10013,"Ġentity":10014,"ĠHarbor":10015,"ĠCu":10016,"Ġcats":10017,"ĠACC":10018,"ĠIbrahim":10019,"GL":10020,"Ġinvitation":10021,"Ġcond":10022,"ĠRecords":10023,"ĠAdrian":10024,"Ġbrave":10025,"Ġmineral":10026,"Ġsooner":10027,"Ġsatisfied":10028,"Ġpets":10029,"Ġnotably":10030,"ı":10031,"Ġmarking":10032,"ĠRO":10033,"ĠHaw":10034,"ĠVis":10035,"Ġmarketplace":10036,"ĠNat":10037,"ĠForward":10038,"ĠLeft":10039,"Ġaggravated":10040,"ĠClose":10041,"acey":10042,"Ġlandmark":10043,"Ġdisruption":10044,"ĠChallenge":10045,"ĠDays":10046,"ĠCoun":10047,"ahan":10048,"Ġaides":10049,"South":10050,"ĠDylan":10051,"ĠRavens":10052,"ĠNature":10053,"lli":10054,"Ġdiplomats":10055,"350":10056,"ĠDrake":10057,"tag":10058,"Ġlicensed":10059,"ĠDenmark":10060,"Ġcancel":10061,"Ġinstant":10062,"DI":10063,"Ġpunch":10064,"ĠJenkins":10065,"Ġstrengthening":10066,"des":10067,"-$":10068,"Ġallegation":10069,"Ġsizes":10070,"iza":10071,"Ġmentally":10072,"ĠResidents":10073,"acked":10074,"Ġsensors":10075,",'\"":10076,"illion":10077,"ĠChampion":10078,"Ġexcessive":10079,"Ġhum":10080,"ĠComp":10081,"rend":10082,"ĠLakes":10083,"Ġburst":10084,"Ġtrainer":10085,"Ġclearing":10086,"ĠSilicon":10087,"Ġ350":10088,"DE":10089,"ĠGates":10090,"ĠHorn":10091,"ests":10092,"ĠCourtesy":10093,"Ġbipartisan":10094,"Ġhabits":10095,"ĠAlexa":10096,"walk":10097,"Ġsnapped":10098,"ĠEight":10099,"itis":10100,"zel":10101,"Ġcustoms":10102,"Ġsouthwest":10103,"Ġvary":10104,"Because":10105,"Ġpayout":10106,"Ġaccelerate":10107,"ĠBarr":10108,"tu":10109,"Ġfined":10110,"cost":10111,"ĠTheater":10112,"ĠCorbyn":10113,"Ġstem":10114,"Ġundermine":10115,".;":10116,"Ġstays":10117,"Ġbreakthrough":10118,"Ġturnover":10119,"hot":10120,"Ġtriumph":10121,"Ġpainted":10122,"ĠWinnipeg":10123,"ĠKas":10124,"ĠStuart":10125,"irk":10126,"Am":10127,"Ġtrusted":10128,"aze":10129,"ĠLate":10130,"Ġaccessories":10131,"Ġmemorable":10132,"ĠFool":10133,"Ġrotation":10134,"ĠBulldogs":10135,"ĠChen":10136,"Ġpoised":10137,"ĠMonte":10138,"ĠClarke":10139,"leading":10140,"Ġvenues":10141,"Ġbeneficial":10142,"ĠLiam":10143,"ĠBrothers":10144,"ĠNeed":10145,"Ġconc":10146,"olly":10147,"ĠJulian":10148,"ogue":10149,"Ġfounding":10150,"Ġsidelines":10151,"Ġdeclare":10152,"ĠMember":10153,"Ġexamine":10154,"abs":10155,"Ġboundaries":10156,"ĠBrisbane":10157,"Ġlaunches":10158,"lor":10159,"ĠGa":10160,"Ġthr":10161,"expected":10162,"wal":10163,"ĠBarnes":10164,"Ġclashes":10165,"content":10166,"ĠClemson":10167,"iger":10168,"Mar":10169,"Ġaccord":10170,"Ġsoutheast":10171,"ģ":10172,"ĠStarbucks":10173,"osing":10174,"Ġseasonal":10175,"icking":10176,"Ġloyalty":10177,"Ġtent":10178,"ĠDy":10179,"Ġevident":10180,"Ġlobby":10181,"Ġtours":10182,"Ġbombing":10183,"uations":10184,"Ġrises":10185,"Ġdemonstrations":10186,"ĠWATCH":10187,"pin":10188,"Ġdeb":10189,"ĠDraft":10190,"rog":10191,"Ġseal":10192,"ĠPerformance":10193,"ĠLGBT":10194,"Ġsed":10195,"Ġgig":10196,"nan":10197,"Ġrainfall":10198,"Ġfabric":10199,"Ġmanages":10200,"Ġlifting":10201,"ĠMagazine":10202,"ĠCriminal":10203,"Ġhikes":10204,"Ġcatching":10205,"Ġ1989":10206,"OG":10207,"Ġdisappointment":10208,"Ġir":10209,"ĠEV":10210,"stown":10211,"pass":10212,"120":10213,"Ġmedals":10214,"ĠSimmons":10215,"Ġinaugural":10216,"ĠCorn":10217,"Ġmotorcycle":10218,"lets":10219,"ĠSkype":10220,"ét":10221,"Ġscary":10222,"opp":10223,"thirds":10224,"ĠMohamed":10225,"Ġteenagers":10226,"ANK":10227,"Ġserver":10228,"Ġouts":10229,"Ġdishes":10230,"four":10231,"dr":10232,"ĠOt":10233,"ĠSandy":10234,"ĠShane":10235,"orters":10236,"SH":10237,"Ġtouching":10238,"ĠNike":10239,"ĠHBO":10240,"driving":10241,"Ġplug":10242,"ĠBaseball":10243,"eling":10244,"hn":10245,"ulate":10246,"eed":10247,"ĠChristine":10248,"ĠGlobe":10249,"Ġethics":10250,"ĠTrevor":10251,"iya":10252,"Ġ360":10253,"Ġawaiting":10254,"Ġcounterpart":10255,"Ġsubsidies":10256,"pointers":10257,"Ġspy":10258,"ILL":10259,"Ġtakeover":10260,"ĠBeyond":10261,"Ġsurprisingly":10262,"TION":10263,"ĠSong":10264,"Ġni":10265,"Ġcommonly":10266,"Ġjack":10267,"Ġsubstitute":10268,"ews":10269,"Ġrecalls":10270,"ĠCommons":10271,"Ġsin":10272,"del":10273,"ĠMod":10274,"Ġpressing":10275,"ĠTelevision":10276,"ĠInside":10277,"ª":10278,"Ġbacklash":10279,"Ġcredible":10280,"ĠJenner":10281,"ĠPu":10282,"ĠStevens":10283,"ĠWE":10284,"Last":10285,"Ġinsurers":10286,"ĠJoin":10287,"bled":10288,"digit":10289,"Ġflooded":10290,"ĠShore":10291,"ĠTrophy":10292,"zing":10293,"ĠImmigration":10294,"Ġsuperior":10295,"IAN":10296,"Ġcasino":10297,"Ġenabling":10298,"Ġmeantime":10299,"Ġperformers":10300,"Ġproportion":10301,"Ġlawmaker":10302,"ĠConf":10303,"Ġconvert":10304,"Ġfarmer":10305,"Ġbu":10306,"ĠGE":10307,"ĠRepresentative":10308,"ĠBannon":10309,"ĠHelp":10310,"PT":10311,"formed":10312,"ĠSuperintendent":10313,"Ġfrustrating":10314,"ĠRegister":10315,"ĠPolitical":10316,"Ġboots":10317,"ĠRu":10318,"ĠSha":10319,"Ġinstrument":10320,"tor":10321,"ĠBelt":10322,"ĠWalsh":10323,"Ġrecipe":10324,"ilt":10325,"ĠClean":10326,"iors":10327,"Ġtwenty":10328,"iler":10329,"nder":10330,"Ġwinger":10331,"Ġwheat":10332,"ĠAviation":10333,"Ġcorrupt":10334,"Ġconnectivity":10335,"ĠVen":10336,"order":10337,"esc":10338,"break":10339,"Ġmetals":10340,"Ġtraditionally":10341,"Ġbell":10342,"Ġviolating":10343,"rough":10344,"Ġintroducing":10345,"Ġguided":10346,"ĠMol":10347,"Ġdesert":10348,"ĠBree":10349,"Le":10350,"ĠZone":10351,"ĠGlass":10352,"ĠEUR":10353,"ĠYahoo":10354,"Ġlaps":10355,"Ġdiffer":10356,"ĠHold":10357,"Ġtimely":10358,"Ġsuccessor":10359,"Ġcomic":10360,"Ġbears":10361,"Ġlicence":10362,"Ġreject":10363,"Ġsophisticated":10364,"Too":10365,"Ġobjectives":10366,"ĠId":10367,"urers":10368,"Ġraid":10369,"COM":10370,"Ġelect":10371,"ĠHampshire":10372,"Ġlens":10373,"Ġdesigners":10374,"Ġpresently":10375,"ĠRCMP":10376,"ĠEgyptian":10377,"ĠWalter":10378,"ĠWallace":10379,"Ġ2025":10380,"utics":10381,"ried":10382,"Ġrefuse":10383,"Ġsiblings":10384,"ĠNothing":10385,"Ġdressing":10386,"Ġnerve":10387,"AST":10388,"Ġuncertainties":10389,"Ġtale":10390,"ĠTalk":10391,"Ġissuing":10392,"shot":10393,"ĠTak":10394,"Ġacid":10395,"ĠNintendo":10396,"Ġwash":10397,"pd":10398,"ĠClaire":10399,"ĠScot":10400,"Ġsuits":10401,"ĠBayern":10402,"gest":10403,"Ġapplicable":10404,"Ġinteraction":10405,"ĠEnforcement":10406,"ĠRohingya":10407,"Ġjan":10408,"Ġunited":10409,"ĠCoalition":10410,"Ġlegislators":10411,"Ġdetectives":10412,"ĠSing":10413,"ĠBetween":10414,"ĠPoly":10415,"pool":10416,"mal":10417,"Ġreply":10418,"Ġschemes":10419,"ĠHolmes":10420,"ĠSenators":10421,"ĠVerizon":10422,"Ġwelcoming":10423,"ĠCricket":10424,"ĠMarco":10425,"ĠYears":10426,"ĠLiving":10427,"Ġcounterparts":10428,"ĠParadise":10429,"ĠTrad":10430,"#":10431,"iw":10432,"ĠSoccer":10433,"umbled":10434,"Ġdeceased":10435,"heim":10436,"Ġevaluation":10437,"Ġwrap":10438,"Ġmild":10439,"aji":10440,"ĠUCLA":10441,"ĠNative":10442,"president":10443,"ĠXbox":10444,"Ġenterprises":10445,"ĠSlam":10446,"oga":10447,"Rock":10448,"piece":10449,"ĠColeman":10450,"Ġcomparable":10451,"uba":10452,"Ġprovinces":10453,"ĠFormula":10454,"ipt":10455,"ô":10456,"Ġtick":10457,"ĠIMF":10458,"anch":10459,"atta":10460,"rew":10461,"However":10462,"LS":10463,"etta":10464,"ĠCustoms":10465,"SU":10466,"Ġpublishing":10467,"Ġinch":10468,"Ġkills":10469,"¤":10470,"ĠSus":10471,"ĠBeth":10472,"Ġsteam":10473,"jpg":10474,"pointer":10475,"Ġturnovers":10476,"Ġpowder":10477,"ĠUSB":10478,"ĠWildlife":10479,"ĠDirect":10480,"atively":10481,"ĠFerrari":10482,"Ġpleasure":10483,"ĠMatthews":10484,"Ġski":10485,"ography":10486,"ĠVermont":10487,"ĠMargaret":10488,"ĠMunich":10489,"Ġlayer":10490,"ĠProperty":10491,"Ġeconomics":10492,"ĠCrew":10493,"UK":10494,"Ġunnecessary":10495,"ĠGlasgow":10496,"Ġsealed":10497,"Ġclarity":10498,"Ġsurplus":10499,"ĠCanyon":10500,"ĠApart":10501,"Ġacceptance":10502,"ĠEllis":10503,"uster":10504,"rid":10505,"ĠHawks":10506,"Ġstatewide":10507,"Ġthreaten":10508,"ĠJail":10509,"Ġinclusive":10510,"Ġmud":10511,"Ġpat":10512,"Ġbitter":10513,"Ġalternatives":10514,"Ġaffiliate":10515,"Ġevaluate":10516,"ĠBaby":10517,"Ġperception":10518,"tim":10519,"Ġrefusing":10520,"Ġgrey":10521,"Ġarguably":10522,"Ġfirmly":10523,"ĠDark":10524,"Ġexcuse":10525,"ĠRaymond":10526,"Ġballots":10527,"inton":10528,"Ġ125":10529,"ĠCatherine":10530,"Ġsacks":10531,"ĠDeb":10532,"Ġworkout":10533,"web":10534,"Ġbatteries":10535,"breaking":10536,"ML":10537,"Ġunacceptable":10538,"ĠValentine":10539,"ĠYOU":10540,"ĠRT":10541,"Ġjurisdiction":10542,"Ġexamined":10543,"strom":10544,"ĠPocket":10545,"Ġcement":10546,"Ġuniversal":10547,"ĠOz":10548,"Ġkit":10549,"Ġchurches":10550,"Ġsuburban":10551,"ĠKushner":10552,"ĠDavidson":10553,"Sports":10554,"email":10555,"Ġrealistic":10556,"Ġintend":10557,"ĠGrey":10558,",''":10559,"Ġscholarship":10560,"Ġphilosophy":10561,"Ġwheels":10562,"Ġmotivation":10563,"eway":10564,"match":10565,"ĠDate":10566,"John":10567,"Ġcontrolling":10568,"750":10569,"aven":10570,"Ġfilmed":10571,"Ġ160":10572,"ĠBrock":10573,"ĠDetails":10574,"Ġlogistics":10575,"Ġassumptions":10576,"ĠStep":10577,"Ġfails":10578,"ĠNotre":10579,"Ġjuice":10580,"Ġcounting":10581,"Ġphotograph":10582,"Ġfortunate":10583,"Ġestablishing":10584,"ĠNJ":10585,"ĠWorkers":10586,"ĠQuinn":10587,"ĠHeather":10588,"Ġtimeline":10589,"Ġimported":10590,"ĠNASCAR":10591,"Ġexercises":10592,"Ġsearched":10593,"ĠRalph":10594,"alf":10595,"Ġgene":10596,"Ġdependent":10597,"én":10598,"iate":10599,"ĠBristol":10600,"Ġhung":10601,"Ġtropical":10602,"Ġintensity":10603,"ĠIdaho":10604,"ĠMull":10605,"Ġsuite":10606,"Ġblockchain":10607,"cz":10608,"ovich":10609,"Ġworn":10610,"ĠLE":10611,"AV":10612,"emi":10613,"Ġidentification":10614,"Ġtunnel":10615,"ĠARE":10616,"ĠArm":10617,"Ġoutrage":10618,"Ġtwist":10619,"uka":10620,"ĠGra":10621,"Ġjets":10622,"ĠThus":10623,"Ġcompound":10624,"Ġfinancially":10625,"2019":10626,"asse":10627,"Ġspare":10628,"ĠNoah":10629,"ĠMade":10630,"ĠMom":10631,"Ġphenomenon":10632,"Ġnurses":10633,"Ġoutlined":10634,"Ġpolit":10635,"ĠCarm":10636,"Ġleagues":10637,"Ġmath":10638,"Ġmodified":10639,"Ġwillingness":10640,"ĠAmanda":10641,"Ġgrandfather":10642,"Of":10643,"DR":10644,"Ġdip":10645,"ĠRAM":10646,"ĠChristie":10647,"Ġargues":10648,"ĠEX":10649,"ĠNine":10650,"ĠScroll":10651,"ĠTHIS":10652,"Pro":10653,"Ġkeys":10654,"Ġprocessor":10655,"Ġscam":10656,"ĠTraining":10657,"Ġhoney":10658,"Ĵ":10659,"Ġfacebook":10660,"ĠLegal":10661,"Ġaging":10662,"Ġspiritual":10663,"ĠHost":10664,"Ġlung":10665,"ĠUSC":10666,"Ġdirt":10667,"Ġfe":10668,"after":10669,"ĠDiana":10670,"Ġounce":10671,"date":10672,"ĠFinals":10673,"Ķ":10674,"Ġthorough":10675,"Ġviable":10676,"Ġanytime":10677,"Ġfost":10678,"orter":10679,"ware":10680,"ĠHolland":10681,"ĠMand":10682,"ĠSend":10683,"2013":10684,"ĠVolkswagen":10685,"Ġsuitable":10686,"ifies":10687,"Ġcomedian":10688,"Ġneighbours":10689,"ĠKnow":10690,"Ġcurious":10691,"ĠTwenty":10692,"ĠPrevention":10693,"ĠStephanie":10694,"Ġpilots":10695,"Ġstored":10696,"Ġdire":10697,"Ġfits":10698,"ision":10699,"ĠShell":10700,"Ġshifts":10701,"Ġpepper":10702,"Ġattendees":10703,"ĠName":10704,"hers":10705,"rip":10706,"Ġwatchdog":10707,"andy":10708,"Ġbio":10709,"Ġpublisher":10710,"powered":10711,"ĠCM":10712,"rian":10713,"ĠRand":10714,"wise":10715,"ĠJesse":10716,"Ġladies":10717,"ĠMetropolitan":10718,"ĠMicro":10719,"Ġkicking":10720,"Ġmeg":10721,"Ġclouds":10722,"Ġtrim":10723,"wear":10724,"ĠML":10725,"Ġconsists":10726,"Ġrig":10727,"Ġhonestly":10728,"GS":10729,"ĠNicholas":10730,"Ġcope":10731,"Ġpublish":10732,"working":10733,"bur":10734,"ĠNar":10735,"olds":10736,"aja":10737,"ĠSad":10738,"Ġclicking":10739,"Ġbids":10740,"ĠZuckerberg":10741,"Ġ900":10742,"Ġexam":10743,"ivers":10744,"Ġpray":10745,"Ġreader":10746,"ĠSeth":10747,"inem":10748,"Ġconfront":10749,"stra":10750,"AW":10751,"ĠGian":10752,"Ġaccordance":10753,"Ġinteract":10754,"ĠSharks":10755,"Ġfireworks":10756,"gment":10757,"illy":10758,"Ġconst":10759,"ARY":10760,"Ġprizes":10761,"Ġshoulders":10762,"Ġaccessed":10763,"Ġecosystem":10764,"Ġlicensing":10765,"La":10766,"Ġdedication":10767,"Ġdé":10768,"Ġyouths":10769,"lem":10770,"Ġtoy":10771,"ĠProm":10772,"ounding":10773,"rod":10774,"Ġ1000":10775,"ishes":10776,"Over":10777,"Ġgaps":10778,"Ġmissions":10779,"Ġrailway":10780,"Day":10781,"orp":10782,"ĠSchumer":10783,"Ġeclipse":10784,"Ġshell":10785,"ĠBY":10786,"Many":10787,"ĠRecord":10788,"Ġdrunk":10789,"ayan":10790,"Ġsuggestion":10791,"Ġdefenders":10792,"ĠNewton":10793,"Ġdisputes":10794,"Ġevolution":10795,"Ġcredibility":10796,"ĠTenn":10797,"Ġplain":10798,"size":10799,"cont":10800,"Ġlone":10801,"Ġfingers":10802,"BUR":10803,"ĠInvestigation":10804,"ĠQualcomm":10805,"var":10806,"Ġcountless":10807,"ĠRebecca":10808,"½":10809,"abi":10810,"Ġreflecting":10811,"ĠTurn":10812,"Ġinteractive":10813,"Ġincentive":10814,"second":10815,"offs":10816,"ĠBerkeley":10817,"ĠTexans":10818,"Ġheated":10819,"Ġscorer":10820,"ĠSharif":10821,"Ġmigrant":10822,"west":10823,"ĠHoliday":10824,"Ġwrist":10825,"Ġchairs":10826,"Ġrecommends":10827,"ĠWildcats":10828,"ĠPed":10829,"ĠQuarter":10830,"ĠIV":10831,"ĠArch":10832,"Ġstandings":10833,"Ġbombs":10834,"Ġcapped":10835,"Can":10836,"Ġcaring":10837,"ĠLah":10838,"lim":10839,"Ġdragged":10840,"ĠBeat":10841,"DB":10842,"Ġaired":10843,"Ġjeans":10844,"action":10845,"Ġgenerating":10846,"ĠGir":10847,"risk":10848,"lon":10849,"stage":10850,"âĤ¬":10851,"earing":10852,"ĠTogether":10853,"Ġreun":10854,"ĠCorey":10855,"ĠBak":10856,"Ġprestigious":10857,"Ġapplicants":10858,"here":10859,"ĠMattis":10860,"Ġridiculous":10861,"ĠLess":10862,"Ġrains":10863,"Ġpresenting":10864,"anti":10865,"Ġdisabilities":10866,"Ġapartments":10867,"storm":10868,"ĠHem":10869,"Ġhabit":10870,"ĠRuth":10871,"ĠNPR":10872,"nut":10873,"Ġappreciated":10874,"Ġseparation":10875,"uda":10876,"Ġminus":10877,"ĠPhotos":10878,"Ġblew":10879,"ĠVoice":10880,"Ġrallies":10881,"Ġfond":10882,"ĠTaking":10883,"yt":10884,"FE":10885,"ĠTory":10886,"ressed":10887,"ĠLy":10888,"Ġrocks":10889,"ĠRah":10890,"Ġelementary":10891,"nis":10892,"ĠPresidential":10893,"Ġnutrition":10894,"Ġbaseman":10895,"Ġsuperstar":10896,"ĠWa":10897,"lar":10898,"Ġstaged":10899,"ĠLearn":10900,"Ġbroadcaster":10901,"Ġboasts":10902,"Ġdoubts":10903,"rum":10904,"Ġbare":10905,"cap":10906,"Ġclimbing":10907,"ĠSelect":10908,"ĠCant":10909,"ĠNord":10910,"ĠBeck":10911,"ĠKad":10912,"ello":10913,"Ġenforce":10914,"ĠZe":10915,"ked":10916,"elly":10917,"ĠLED":10918,"ĠOperations":10919,"ĠLuk":10920,"Ġcertificate":10921,"Ġdeter":10922,"Ġspill":10923,"Ġgrain":10924,"league":10925,"Up":10926,"ĠKid":10927,"using":10928,"ĠJays":10929,"Ġoccasionally":10930,"ĠMI":10931,"yes":10932,"Ġdetect":10933,"Ġpropaganda":10934,"Ġneighboring":10935,"sub":10936,"avan":10937,"ĠAstros":10938,"oti":10939,"threatening":10940,"Ġshorter":10941,"INGS":10942,"Ġfeeding":10943,"Ġelevated":10944,"ĠWenger":10945,"Ġundergo":10946,"Ġpsychological":10947,"Ġautom":10948,"NP":10949,"anks":10950,"ĠNokia":10951,"Ġdrones":10952,"Ġrecognised":10953,"Ġheroes":10954,"agen":10955,"Ġparole":10956,"ĠBah":10957,"Ġhomeowners":10958,"ĠSweet":10959,"Ġinstances":10960,"ĠParish":10961,"ĠSL":10962,"Ġunw":10963,"Ġdelicious":10964,"¯":10965,"ĠInvestments":10966,"ĠPhilippine":10967,"inos":10968,"Ġmes":10969,"Ġbite":10970,"Ġcornerback":10971,"ĠHat":10972,"Ġdeserved":10973,"ologists":10974,"[":10975,"Ġwrongdoing":10976,"ĠTrent":10977,"ĠVe":10978,"ĠDeal":10979,"Mr":10980,"Ġovers":10981,"Ġhonors":10982,"ĠITV":10983,"Ġpayroll":10984,"Ġconfused":10985,"Ġelaborate":10986,"ange":10987,"World":10988,"ĠResort":10989,"ilia":10990,"ĠKr":10991,"Ġconclude":10992,"First":10993,"ĠDR":10994,"Ġpeer":10995,"Ġrunway":10996,"ĠPotter":10997,"cons":10998,"bad":10999,"si":11000,"ĠClimate":11001,"ĠHoll":11002,"Ġweighing":11003,"Ġepidemic":11004,"ĠBible":11005,"Ġhon":11006,"Ġrenew":11007,"Ġgambling":11008,"ĠNationals":11009,"itable":11010,"ĠOutlook":11011,"Ġreactions":11012,"ĠCos":11013,"ĠDana":11014,"India":11015,"ĠAirbus":11016,"power":11017,"watch":11018,"Ġstyles":11019,"Ġordinance":11020,"Ġcam":11021,"Ġinvent":11022,"ĠDurant":11023,"Ġexchanged":11024,"Ġyoga":11025,"ĠMichel":11026,"ĠWyoming":11027,"ĠPhase":11028,"ĠHannah":11029,"Ġtem":11030,"Ġfare":11031,"omer":11032,"Ġtrails":11033,"Ġquietly":11034,"ĠFourth":11035,"Ġwise":11036,"Ġappetite":11037,"Ġpedestrian":11038,"Ġfierce":11039,"hin":11040,"ako":11041,"Ġvacant":11042,"Ġdynamics":11043,"Ġbust":11044,"ĠGT":11045,"century":11046,"Ġpermitted":11047,"Ġfog":11048,"Ġrecruitment":11049,"ĠDue":11050,"Ġbro":11051,"Ġsil":11052,"ĠOpp":11053,"Ġphrase":11054,"ĠChip":11055,"ĠBase":11056,"Ġjazz":11057,"Ġenemies":11058,"Ġremainder":11059,"bles":11060,"Ġ105":11061,"ĠGur":11062,"Ġretiring":11063,"ĠCour":11064,"ĠSi":11065,"Ġinevitable":11066,"ĠAdvisory":11067,"ĠCampaign":11068,"ĠPeninsula":11069,"base":11070,"Ġjustify":11071,"inen":11072,"North":11073,"Ġfreezing":11074,"Ġphotography":11075,"Ġappointments":11076,"ĠTree":11077,"Os":11078,"Ġdivide":11079,"ĠMMA":11080,"Ġdeclines":11081,"ĠAbbott":11082,"ACH":11083,"ĠJah":11084,"Ġspr":11085,"Ġskilled":11086,"ĠTry":11087,"ANT":11088,"ael":11089,"ĠMcN":11090,"Ġtariff":11091,"generation":11092,"ĠMans":11093,"Or":11094,"Ġraped":11095,"Ġdisability":11096,"Ġnominations":11097,"Ġhappiness":11098,"ĠLSU":11099,"ĠInterstate":11100,"ĠDance":11101,"ĠMaking":11102,"Ġbailout":11103,"oro":11104,"ĠObviously":11105,"Ġinbox":11106,"football":11107,"hy":11108,"ĠCase":11109,"Ġentertaining":11110,"Ġhardest":11111,"ĠOpposition":11112,"Ġflip":11113,"ĠPirates":11114,"anu":11115,"ĠKlopp":11116,"Ġballistic":11117,"Ġprinted":11118,"ĠNFC":11119,"UST":11120,"Ġglasses":11121,"Ġrum":11122,"ĠDuncan":11123,"hal":11124,"Ġpreview":11125,"BER":11126,"dec":11127,"Ġsustainability":11128,"Ġaff":11129,"Ġhungry":11130,"service":11131,"avi":11132,"Ġsometime":11133,"Ġmod":11134,"ĠLib":11135,"oko":11136,"Ġfundraiser":11137,"Ġcrowded":11138,"mates":11139,"Ġcreativity":11140,"ĠHell":11141,"Ġtreaty":11142,"ĠSoftware":11143,"ĠRandy":11144,"ĠPolish":11145,"sa":11146,"ardi":11147,"Ġcab":11148,"ĠCamera":11149,"Ġlicenses":11150,"Ġ1988":11151,"Ġcontinuous":11152,"Ġpaired":11153,"Ġtally":11154,"Ġgrip":11155,"cho":11156,"Ġsurged":11157,"Ġpodium":11158,"Ġcontrary":11159,"SL":11160,"ĠResearchers":11161,"cing":11162,"Ġmi":11163,"Ġdisputed":11164,"Ġgrades":11165,"Ġseverely":11166,"ĠMcL":11167,"ondo":11168,"Ġshelters":11169,"Ġdomain":11170,"ĠSwitch":11171,"Ġtestify":11172,"case":11173,"omet":11174,"atch":11175,"ĠAff":11176,"Ġcasting":11177,"berger":11178,"Ġintimate":11179,"erc":11180,"plan":11181,"ĠPast":11182,"ĠUt":11183,"Ġapologized":11184,"ĠDet":11185,"alle":11186,"Ġwhilst":11187,"Ġpel":11188,"Ġexecute":11189,"Ġharmful":11190,"ĠRB":11191,"onda":11192,"ĠFul":11193,"II":11194,"Those":11195,"Ġcryptocurrency":11196,"Ġrealise":11197,"ĠAthens":11198,"ĠApplication":11199,"ORD":11200,"Ġmidst":11201,"ĠSem":11202,"Ġmessaging":11203,"Ġcousin":11204,"ĠMarsh":11205,"ĠAlmost":11206,"uto":11207,"wire":11208,"ĠManaging":11209,"Ġsends":11210,"ĠDerby":11211,"Ġpad":11212,"Ġdevoted":11213,"ĠWorking":11214,"ĠWestminster":11215,"Ġdirty":11216,"ements":11217,"ĠLew":11218,"door":11219,"Ġadvisor":11220,"ival":11221,"Ġsubscribe":11222,"Ġcredited":11223,"Ġpressed":11224,"Ġbrick":11225,"Ġrehabilitation":11226,"Ġ\"[":11227,"erry":11228,"Ġtransformed":11229,"arp":11230,"Ġreceivers":11231,"ĠFan":11232,"ĠKris":11233,"ĠCharlottesville":11234,"Ġste":11235,"Ġconstructed":11236,"Ġbroadly":11237,"ĠBetter":11238,"ĠJanet":11239,"Ġenthusiasm":11240,"ĠIrving":11241,"ĠConst":11242,"Everyone":11243,"agn":11244,"ĠCrawford":11245,"Ġregards":11246,"ĠBurns":11247,"Ġjokes":11248,"erg":11249,"ARD":11250,"apped":11251,"Ġtravelled":11252,"ĠPoor":11253,"ĠHolly":11254,"Ġcontainer":11255,"Ġinfected":11256,"Ġlean":11257,"ĠWould":11258,"Ġmagnitude":11259,"ĠDou":11260,"minded":11261,"Ġpastor":11262,"Ġwherever":11263,"ulation":11264,"Ġ1986":11265,"ĠMegan":11266,"Ġgraphic":11267,"Ġtalents":11268,"Ġkn":11269,"ĠEC":11270,"ĠMcM":11271,"ĠKon":11272,"eni":11273,"ĠEsc":11274,"inas":11275,"ĠNom":11276,"Ġchasing":11277,"arl":11278,"ĠHungary":11279,"Ġmainland":11280,"ĠDist":11281,"utes":11282,"Ġrubber":11283,"iat":11284,"ĠMorrison":11285,"ushing":11286,"iny":11287,"Ġcopies":11288,"ĠFat":11289,"agged":11290,"Ġfloating":11291,"ĠCurtis":11292,"Ġfatally":11293,"ĠManuel":11294,"Ġgraduates":11295,"nar":11296,"ĠKenny":11297,"Ġretreat":11298,"Ġretro":11299,"ĠPierre":11300,"listed":11301,"ĠDale":11302,"ding":11303,"Ġintentions":11304,"Ġsentences":11305,"ĠSere":11306,"Ġinvasion":11307,"Ġpremiums":11308,"ĠGardner":11309,"Ġshipments":11310,"Ġcol":11311,"bell":11312,"ilo":11313,"Ġworthy":11314,"Ġinterceptions":11315,"Ġcomplain":11316,"icle":11317,"ĠTah":11318,"ĠMt":11319,"ĠSyracuse":11320,"Since":11321,"aches":11322,"ĠCand":11323,"Ġinteractions":11324,"ĠShawn":11325,"nc":11326,"Ġtheaters":11327,"ART":11328,"Th":11329,"Ġalter":11330,"aley":11331,"imo":11332,"Ġresponders":11333,"kan":11334,"ĠDarren":11335,"Ġdeliveries":11336,"PI":11337,"125":11338,"Ġlaughing":11339,"ĠPatterson":11340,"Ġinfections":11341,"Ġtur":11342,"130":11343,"Ġhackers":11344,"Ġwarn":11345,"Ġfreeze":11346,"Ġscreaming":11347,"ĠEcho":11348,"ĠDom":11349,"MAN":11350,"ĠJoy":11351,"Ġbeneath":11352,"ĠHalf":11353,"Ġpatent":11354,"Ġugly":11355,"Ġlip":11356,"Ġnominees":11357,"ĠGrade":11358,"Ġinfluenced":11359,"Ġabilities":11360,"Ġlimiting":11361,"Ġsmell":11362,"Ġesc":11363,"ĠBernard":11364,"cs":11365,"ĠMyers":11366,"oted":11367,"Black":11368,"Ġlim":11369,"Ġsworn":11370,"ĠBlair":11371,"anes":11372,"ĠEvent":11373,"Ġmature":11374,"Ġpositioned":11375,"Ġerupted":11376,"grand":11377,"ĠTell":11378,"Ġbackdrop":11379,"Ġyeah":11380,"ĠClear":11381,"Ġsignificance":11382,"Ġpatience":11383,"ĠWing":11384,"Ġhorrible":11385,"Ġdeploy":11386,"ipe":11387,"Ġbitcoin":11388,"Ġcommitting":11389,"Ġdismiss":11390,"ĠBlood":11391,"ĠMeyer":11392,"selling":11393,"Ġregarded":11394,"Ġlottery":11395,"ĠLuther":11396,"Ġpipe":11397,"Ġcro":11398,"ĠANC":11399,"ĠSolar":11400,"Ġsimilarly":11401,"Ġham":11402,"ĠHonor":11403,"tar":11404,"gin":11405,"ĠArmstrong":11406,"Ġbrowser":11407,"agon":11408,"via":11409,"Ġentries":11410,"Ġinfl":11411,"Ġgraduation":11412,"Ġalleges":11413,"ĠLoading":11414,"Ġsuperb":11415,"ially":11416,"Ġadministrator":11417,"uls":11418,"Ġartistic":11419,"ĠANGEL":11420,"ĠBang":11421,"Ġfossil":11422,"¨":11423,"Ġpoly":11424,"ĠGuardiola":11425,"ĠPerth":11426,"Ġeducate":11427,"Cl":11428,"Ġcommittees":11429,"Ġforthcoming":11430,"Ġadjustments":11431,"count":11432,"Ġincoming":11433,"brook":11434,"ĠMinneapolis":11435,"Ġgown":11436,"ĠCroatia":11437,"host":11438,"Ġcompetitor":11439,"Ġlyrics":11440,"Ġbelonging":11441,"ĠFrances":11442,"ĠHaley":11443,"ĠBruins":11444,"Ġmask":11445,"ĠPv":11446,"dollar":11447,"Ġbowling":11448,"Ġjewelry":11449,"ĠJulia":11450,"Ġbroadband":11451,"ĠBhar":11452,"ĠArmed":11453,"vy":11454,"government":11455,"kov":11456,"Ġpremises":11457,"Ġjersey":11458,"Ġapplies":11459,"ĠFreeman":11460,"Ġgrows":11461,"ĠEquity":11462,"Ġmaterially":11463,"Ġfigured":11464,"ience":11465,"Ġmajors":11466,"ĠYe":11467,"ĠHey":11468,"oned":11469,"aping":11470,"Ġtoilet":11471,"ĠConnor":11472,"Ġavoiding":11473,"pos":11474,"Once":11475,"ĠRockets":11476,"ĠSnapchat":11477,"Go":11478,"Ġsolidarity":11479,"ĠAffordable":11480,"Ġdial":11481,"ĠOmar":11482,"xt":11483,"ĠVatican":11484,"anta":11485,"ĠSuperior":11486,"Ġbeaches":11487,"ĠKi":11488,"Ã¥":11489,"KY":11490,"Ġgro":11491,"ĠEmpire":11492,"Ġoccurs":11493,"Ġjoked":11494,"Ġquotes":11495,"ĠSaskatchewan":11496,"pert":11497,"Ġmaintains":11498,"olt":11499,"Ġupgrades":11500,"ĠCho":11501,"ĠAlexis":11502,"ĠHundreds":11503,"ĠBud":11504,"Ġcenturies":11505,"ĠInvestor":11506,"ĠGomez":11507,"Ġconceded":11508,"Ġexpressing":11509,"ĠIBM":11510,"Ġadvancing":11511,"ĠDollar":11512,"jer":11513,"Ġexceed":11514,"author":11515,"rist":11516,"seat":11517,"ĠPrimary":11518,"ĠForbes":11519,"ĠAlzheimer":11520,"Ġdevastated":11521,"Ġawful":11522,"ĠStudio":11523,"Ġbullpen":11524,"Ġmobility":11525,"Ġanalyze":11526,"lie":11527,"AFP":11528,"iche":11529,"ĠRoyals":11530,"Ġcoupled":11531,"Ġdug":11532,"ĠRing":11533,"Ġenvironments":11534,"national":11535,"ĠCongo":11536,"Ġalleging":11537,"wn":11538,"ulating":11539,"Ġur":11540,"Ġreaches":11541,"ĠPine":11542,"Ġthreshold":11543,"Ġtournaments":11544,"Ġheating":11545,"ĠGard":11546,"ĠHamas":11547,"Ġ«":11548,"ĠHolding":11549,"Ġpossibilities":11550,"ĠHassan":11551,"ĠMohammad":11552,"Ġoffenders":11553,"Ġautomated":11554,"Ġrealised":11555,"ouse":11556,"building":11557,"ĠDub":11558,"ĠGeneva":11559,"Ġfacial":11560,"ĠRestaurant":11561,"ĠNg":11562,"Ġtot":11563,"Ġgrace":11564,"ĠCP":11565,"Ġposter":11566,"hart":11567,"ĠNi":11568,"Ġreaff":11569,"Ġprov":11570,"Ġ111":11571,"ĠAid":11572,"Ġscrap":11573,"izers":11574,"ogen":11575,"Ġtissue":11576,"Ġvibrant":11577,"Ġrider":11578,"CD":11579,"ĠKitchen":11580,"Ġgenre":11581,"¬":11582,"depth":11583,"kind":11584,"Ġendorsed":11585,"Ġsimultaneously":11586,"Ġintern":11587,"ĠDrag":11588,"Ġembraced":11589,"Ġcounted":11590,"uj":11591,"ĠOg":11592,"Ġphysician":11593,"ĠIR":11594,"IST":11595,"ĠKir":11596,"Ġhacking":11597,"ĠSources":11598,"astic":11599,"growing":11600,"ĠWake":11601,"Ġhint":11602,"Ġcompiled":11603,"Ġreign":11604,"Ġcinema":11605,"Ġboosting":11606,"Ġaccommodation":11607,"ĠEuropa":11608,"Ġsubsidiaries":11609,"Ġclosures":11610,"ĠBil":11611,"ĠBou":11612,"wh":11613,"ĠAw":11614,"FT":11615,"hole":11616,"ĠNova":11617,"ĠNSW":11618,"Ġrap":11619,"Ġencourages":11620,"GR":11621,"ds":11622,"ĠMuk":11623,"ĠSurvey":11624,"ĠReagan":11625,"oning":11626,"Ġneighbouring":11627,"ĠMcCl":11628,"acht":11629,"Ġfinishes":11630,"ĠEsp":11631,"pat":11632,"Ġdestinations":11633,"ĠWagner":11634,"Ġconfronted":11635,"square":11636,"Ġpie":11637,"brand":11638,"hl":11639,"Ġabsent":11640,"Ġsurf":11641,"Ġrifle":11642,"ĠSS":11643,"ĠDeath":11644,"wich":11645,"Ġbeds":11646,"ĠLock":11647,"ĠAgu":11648,"atives":11649,"jee":11650,"Ġoral":11651,"Ġbudgets":11652,"Ġinspiring":11653,"IONS":11654,"works":11655,"Ġspirits":11656,"Ġcabin":11657,"Ġsatisfaction":11658,"Ġvoluntary":11659,"ĠMunicipal":11660,"Ġdeportation":11661,"ĠWriter":11662,"ĠVI":11663,"VERTISEMENT":11664,"/.":11665,"ĠSouthampton":11666,"aces":11667,"ĠHelen":11668,"ĠHum":11669,"110":11670,"Ġgarbage":11671,"through":11672,"Ġkingdom":11673,"MT":11674,"augh":11675,"Ġbizarre":11676,"ĠStarting":11677,"Ġwooden":11678,"ĠProgress":11679,"iron":11680,"sten":11681,"ĠSergio":11682,"ĠHR":11683,"Ġturnout":11684,"ĠAmericas":11685,"ĠSara":11686,"Ġagrees":11687,"apper":11688,"Ġbra":11689,"Ġrecycling":11690,"oom":11691,"Ġflee":11692,"Ġdistinct":11693,"IAL":11694,"aha":11695,"Ġfever":11696,"ĠPartnership":11697,"ĠYu":11698,"ĠPixel":11699,"ĠBlock":11700,"ĠMelissa":11701,"igg":11702,"Ġdecides":11703,"ĠNorman":11704,"Ġmas":11705,"held":11706,"ĠPD":11707,"Ġsheer":11708,"ĠDim":11709,"ĠCass":11710,"Ġcolumnist":11711,"ĠBros":11712,"Ġturnaround":11713,"ĠValue":11714,"ĠBachelor":11715,"awn":11716,"Ġassignment":11717,"ested":11718,"ĠJudiciary":11719,"Ġdiamond":11720,"Ġmus":11721,"Ġindigenous":11722,"lines":11723,"Ġ1984":11724,"igroup":11725,"ict":11726,"ĠJaguars":11727,"Ġlun":11728,"Ġprofiles":11729,"Ġcomputing":11730,"ĠBelgian":11731,"ĠLloyd":11732,"ĠGoing":11733,"Ġdisp":11734,"Ġ1987":11735,"eder":11736,"ĠVin":11737,"Ġgovern":11738,"Ġblend":11739,"ĠSebastian":11740,"ĠMidwest":11741,"iga":11742,"Ġspl":11743,"Ġtopping":11744,"Ġnetworking":11745,"ĠEmer":11746,"Ġoxygen":11747,"ĠInterest":11748,"ĠMoy":11749,"Ġtrader":11750,"Ġbay":11751,"Ġsticking":11752,"ĠMovement":11753,"Ġbidding":11754,"tax":11755,"Ġacademy":11756,"ĠMO":11757,"ĠSpirit":11758,"Ġhealing":11759,"wen":11760,"ĠPrix":11761,"cal":11762,"ĠOperating":11763,"Ġinstantly":11764,"ĠTonight":11765,"Ġsacked":11766,"Ġautomation":11767,"umps":11768,"ĠNey":11769,"March":11770,"ĠBuck":11771,"Ġconcentration":11772,"Here":11773,"Ġtravelers":11774,"Ġprotective":11775,"ĠMoody":11776,"Ġentrepreneur":11777,"Ġfac":11778,"kowski":11779,"Ġpreparations":11780,"Ġdominate":11781,"Ġspray":11782,"Ġdisturbing":11783,"ĠFraser":11784,"ĠCody":11785,"ashi":11786,"ĠPel":11787,"Ġrisky":11788,"Ġawkward":11789,"ĠVA":11790,"ails":11791,"Ġangle":11792,"Ġundergoing":11793,"Ġalbums":11794,"Ġafterwards":11795,"ĠNaw":11796,"uge":11797,"enter":11798,"ĠSussex":11799,"ĠRecently":11800,"Ġlikelihood":11801,"large":11802,"Ġsnaps":11803,"ibr":11804,"ĠMalcolm":11805,"Ġcru":11806,"Ġaltogether":11807,"Ġsetup":11808,"Ġtorture":11809,"Ġfiber":11810,"Ġquarterbacks":11811,"ĠGetting":11812,"ipping":11813,"ĠNorwegian":11814,"ĠMiles":11815,"ĠArnold":11816,"ĠDisease":11817,"Ġtends":11818,"ife":11819,"ĠCaroline":11820,"Ġnavigate":11821,"Ġbrush":11822,"ĠAssociates":11823,"Ġbath":11824,"ĠCenters":11825,"ĠMC":11826,"Ġtaxpayer":11827,"comp":11828,"Ġaccomplish":11829,"ĠTraffic":11830,"ĠBru":11831,"Ġgreenhouse":11832,"ĠMalaysian":11833,"ĠPur":11834,"ased":11835,"ĠKnicks":11836,"aters":11837,"Ġalt":11838,"ICK":11839,"Ġcalculations":11840,"Ġmindset":11841,"unch":11842,"Ġgu":11843,"Ġsteadily":11844,"Ġfiction":11845,"ĠPap":11846,"forming":11847,"ĠActor":11848,"ĠBerry":11849,"imp":11850,"ĠUpper":11851,"Ġassessed":11852,"Ġlawn":11853,"ĠRoh":11854,"Ġclearance":11855,"funded":11856,"Ġpret":11857,"ĠHom":11858,"VS":11859,"ĠTourism":11860,"ĠRy":11861,"ĠGonz":11862,"ĠStudios":11863,"Ġanchor":11864,"Ġrecognise":11865,"Ġcooperate":11866,"enny":11867,"aza":11868,"ĠMeet":11869,"Ġeventual":11870,"SW":11871,"ĠCounsel":11872,"ĠSave":11873,"Ġlucrative":11874,"Ġslim":11875,"ĠGreens":11876,"Ġchemistry":11877,"ĠSheikh":11878,"Ġbridges":11879,"business":11880,"ĠSaf":11881,"ĠGy":11882,"Ġprotocol":11883,"Ġnephew":11884,"ĠBrands":11885,"ĠCulture":11886,"orship":11887,"Ġ(£":11888,"ĠDell":11889,"astics":11890,"Ġproving":11891,"ĠMann":11892,"aca":11893,"Ġindoor":11894,"ĠUganda":11895,"ĠRomney":11896,"ĠStage":11897,"Ġward":11898,"ĠAmber":11899,"haw":11900,"Ġtw":11901,"Ġbullying":11902,"ĠCAR":11903,"Ġassociates":11904,"ĠHopkins":11905,"Ġsuburb":11906,"Ġaggressively":11907,"Ġpostponed":11908,"Ġbas":11909,"Ġburglary":11910,"ĠFound":11911,"Ġfloors":11912,"Any":11913,"Ġjam":11914,"Ġvisibility":11915,"Ġbenefited":11916,"ĠAud":11917,"aying":11918,"iku":11919,"ĠPas":11920,"ĠGPS":11921,"ĠOwens":11922,"Ġreluctant":11923,"ĠOlivia":11924,"ols":11925,"Ġemotion":11926,"ĠHeavy":11927,"Ġhostile":11928,"Ġfavorites":11929,"Ġfeat":11930,"ĠCord":11931,"ĠGO":11932,"Ġindicted":11933,"idal":11934,"ĠIL":11935,"Ħ":11936,"acer":11937,"ICH":11938,"oda":11939,"Ġrecipients":11940,"Ġtribal":11941,"Ġresist":11942,"ĠCritics":11943,"Ġsang":11944,"ĠMath":11945,"ĠBrighton":11946,"ĠKw":11947,"Ġlimitations":11948,"Ġinterception":11949,"onde":11950,"ĠRobertson":11951,"Ġenjoys":11952,"site":11953,"Ġwings":11954,"ĠCeltic":11955,"Ġrelaxed":11956,"Share":11957,"Ġwarrants":11958,"oco":11959,"Ġcritically":11960,"GC":11961,"Ġcute":11962,"Ġlaying":11963,"itude":11964,"ĠMediterranean":11965,"Ġwatches":11966,"Ġdisagree":11967,"ĠReturn":11968,"ARC":11969,"people":11970,"Ġtwelve":11971,"Ġoverdose":11972,"ĠLot":11973,"ĠFROM":11974,"ĠPeters":11975,"Ġadministrators":11976,"Ġslam":11977,"jar":11978,"OH":11979,"ĠInitiative":11980,"Ġteamed":11981,"ĠMajority":11982,"June":11983,"ĠPlaza":11984,"lake":11985,"Ġglimpse":11986,"Ġrings":11987,"Ġos":11988,"Ġmentor":11989,"have":11990,"Ġlanguages":11991,"Ġuncle":11992,"agu":11993,"ĠWine":11994,"ĠCategory":11995,"ĠIng":11996,"Ġcontests":11997,"ĠRosen":11998,"ĠWhatever":11999,"Ġdenying":12000,"ean":12001,"Ġspec":12002,"Ġgrad":12003,"Ġtenants":12004,"show":12005,"ĠGregory":12006,"Ġcontention":12007,"Ġunanimously":12008,"ĠPin":12009,"fa":12010,"ĠPink":12011,"Ġswitched":12012,"acre":12013,"ĠTrading":12014,"VP":12015,"ĠMaple":12016,"Neill":12017,"Ġdiscounts":12018,"alls":12019,"Ġsounded":12020,"Ġrumours":12021,"ĠCre":12022,"hall":12023,"ĠTele":12024,"Ġthankful":12025,"Ġsurveyed":12026,"UB":12027,"Ġdignity":12028,"Ġnod":12029,"Ġmisleading":12030,"ĠTX":12031,"ĠBurke":12032,"Ġmounting":12033,"Ġskies":12034,"Ġbesides":12035,"ĠGarrett":12036,"tha":12037,"Ġintelligent":12038,"Ġtanks":12039,"apping":12040,"ĠRat":12041,"aint":12042,"Ġentertain":12043,"ĠAbdullah":12044,"Ġsink":12045,"ĠLan":12046,"ĠManufacturing":12047,"NFL":12048,"Ġthemes":12049,"ĠHaven":12050,"ĠDavies":12051,"ĠKerr":12052,"ĠLen":12053,"Ġcourtroom":12054,"Ġfailures":12055,"Ġlately":12056,"ĠElectronics":12057,"Ġgorgeous":12058,"Ġnotification":12059,"Ġ2030":12060,"aved":12061,"Ġdeer":12062,"economic":12063,"ĠStatistics":12064,"Ġconfrontation":12065,"Ġgovernors":12066,"ĠHaram":12067,"ĠLGBTQ":12068,"Ġprocessed":12069,"ĠDuchess":12070,"Ġdowns":12071,"Ġpork":12072,"Ġhumor":12073,"ocese":12074,"Ġneeding":12075,"Ġmidterm":12076,"ĠOval":12077,"Ġcorners":12078,"Ġtablets":12079,"eds":12080,"vere":12081,"Ġattacker":12082,"Paul":12083,"pee":12084,"ĠAlice":12085,"Ġrenowned":12086,"Ġ09":12087,"ocking":12088,"Ġcreditors":12089,"ĠPedro":12090,"ĠPhone":12091,"Ġsurveys":12092,"ĠWelsh":12093,"Ġcow":12094,"Ġbuilds":12095,"Ġ000":12096,"ĠAzerbaijan":12097,"ĠYad":12098,"Ġinfant":12099,"Ġmotorists":12100,"Ġpoorly":12101,"Ġmedications":12102,"Ġstupid":12103,"ĠCastro":12104,"user":12105,"antly":12106,"alty":12107,"ĠCond":12108,"issa":12109,"ĠIvan":12110,"Ġcostume":12111,"Ġ08":12112,"Ġhence":12113,"Ġdangers":12114,"Ġbullish":12115,"Life":12116,"Ġflavor":12117,"ĠCharleston":12118,"Ġbikes":12119,"Ġworkshops":12120,"Ġarranged":12121,"Ġcontender":12122,"Ġsequel":12123,"ĠPlant":12124,"Ġdonor":12125,"Ġfactories":12126,"rict":12127,"ellen":12128,"Ġrobots":12129,"ĠWor":12130,"ĠDirectors":12131,"ĠPeru":12132,"Ġqueen":12133,"ĠTimothy":12134,"ĠToo":12135,"Ġobservers":12136,"Ġears":12137,"Ġbel":12138,"link":12139,"uns":12140,"Ġhomers":12141,"Ġadjacent":12142,"Ġconfidential":12143,"Ġstunned":12144,"iden":12145,"illed":12146,"ESS":12147,"Ġconvenient":12148,"ĠLindsey":12149,"por":12150,"upp":12151,"Ġborrow":12152,"ĠAhmad":12153,"ORT":12154,"Ġrelate":12155,"ĠSelf":12156,"ĠVanguard":12157,"utter":12158,"ĠBranch":12159,"ĠBolton":12160,"bat":12161,"Ġoutright":12162,"fighters":12163,"ĠBed":12164,"Ġpes":12165,"inski":12166,"Ġgunshot":12167,"Ġprinting":12168,"ĠSent":12169,"vern":12170,"Ġharvest":12171,"Ġbubble":12172,"Ġrefund":12173,"Ġfuels":12174,"Ġdive":12175,"Ġdiplomat":12176,"Ġpile":12177,"ĠVery":12178,"rot":12179,"ĠSearch":12180,"ĠJoyce":12181,"ĠPruitt":12182,"ĠLevel":12183,"ĠBP":12184,"ĠLac":12185,"had":12186,"Ġexpenditure":12187,"ĠMadd":12188,"Ġpockets":12189,"ĠClippers":12190,"ĠDear":12191,"ĠGive":12192,"Ġhal":12193,"Ġvertical":12194,"Ġwholesale":12195,"what":12196,"ĠSpringfield":12197,"ayed":12198,"ĠSom":12199,"Ġsecrets":12200,"Ġcharts":12201,"iar":12202,"ibility":12203,"LAND":12204,"Ġbearing":12205,"Ġprom":12206,"Ġtab":12207,"Ġsheets":12208,"ĠGL":12209,"Ġendless":12210,"opening":12211,"ĠOwen":12212,"Ġunderneath":12213,"ĠErik":12214,"ĠDACA":12215,"Ġsteering":12216,"Ġfootprint":12217,"ĠRoma":12218,"ĠDucks":12219,"ĠEllen":12220,"ĠProfessional":12221,"ĠGardens":12222,"Ġgoalie":12223,"Ġshine":12224,"Ġturmoil":12225,"Ġhunger":12226,"ĠâĢĭ":12227,"active":12228,"hey":12229,"Ġblessed":12230,"ason":12231,"oping":12232,"ĠThousands":12233,"Ġdose":12234,"ĠLor":12235,"Ġevolved":12236,"Ġcharities":12237,"ĠPE":12238,"ĠRub":12239,"ws":12240,"Ġmist":12241,"ĠShen":12242,"Ġbiological":12243,"ĠTweet":12244,"Ġcollections":12245,"Ġsubstantially":12246,"inner":12247,"Ġbattled":12248,"ĠCong":12249,"Hold":12250,"wp":12251,"Ġwells":12252,"Ġsake":12253,"Ġunrest":12254,"ĠKurt":12255,"Ġripped":12256,"itation":12257,"Ġneighbourhood":12258,"Ġinv":12259,"Ġcad":12260,"ĠCuban":12261,"ĠWealth":12262,"Ġtuition":12263,"Ġdeclaring":12264,"sch":12265,"orne":12266,"Ġwondered":12267,"ĠChaff":12268,"Ġdealer":12269,"ĠNumber":12270,"Mobile":12271,"Ġscratch":12272,"Ġprepares":12273,"ĠSens":12274,"ĠIstanbul":12275,"ĠPanama":12276,"ĠCay":12277,"Ġallocation":12278,"itutional":12279,"Ġhar":12280,"ĠNazi":12281,"ĠSund":12282,"Ġwarehouse":12283,"Ġbackyard":12284,"ĠIll":12285,"Ġunlawful":12286,"ĠReform":12287,"Ġbasement":12288,"ĠHi":12289,"ĠPictures":12290,"Ġtransfers":12291,"ĠSell":12292,"Ġfluid":12293,"Ġambitions":12294,"wife":12295,"Ġintensive":12296,"Ġsteals":12297,"Ġfestive":12298,"ĠHayes":12299,"Ġrestoration":12300,"Ġbranded":12301,"Journal":12302,"Ġmacro":12303,"Ġconsole":12304,"ĠMelania":12305,"ĠRahul":12306,"Ġdisposal":12307,"Ġcult":12308,"Ġpetrol":12309,"Ġtires":12310,"Ġkidnapping":12311,"Ġ115":12312,"Ġswap":12313,"ĠSud":12314,"Ġblown":12315,"ĠHindu":12316,"ĠBeckham":12317,"ĠGul":12318,"Ġfixture":12319,"Ġwisdom":12320,"Ġmines":12321,"fort":12322,"Ġrivers":12323,"ĠCyber":12324,"Ġtouches":12325,"race":12326,"Ġrelax":12327,"Ġcrashes":12328,"Ġconstituency":12329,"Ġ1979":12330,"Ġbureau":12331,"Ġinterface":12332,"Ġdetected":12333,"ĠBio":12334,"Ġhighlighting":12335,"ames":12336,"Ġcorresponding":12337,"great":12338,"Ġgray":12339,"Ġadvantages":12340,"ĠME":12341,"ĠAbbas":12342,"Ġnaked":12343,"rington":12344,".),":12345,"ĠFace":12346,"third":12347,"Ġtranscript":12348,"ples":12349,"Good":12350,"ĠArctic":12351,"Ġtolerance":12352,"reat":12353,"green":12354,"ĠMik":12355,"Ġoutreach":12356,"Ġrolls":12357,"Ġgen":12358,"Ġsupplied":12359,"Ġguarantees":12360,"aug":12361,"Ġsemif":12362,"ounds":12363,"running":12364,"Ġfitting":12365,"ĠRisk":12366,"iveness":12367,"family":12368,"Ġti":12369,"ĠIsaac":12370,"Ġdump":12371,"ĠPatricia":12372,"Ġpassport":12373,"ĠRhode":12374,"Who":12375,"log":12376,"Ġstat":12377,"Ġrat":12378,"ango":12379,"SB":12380,"ĠMaur":12381,"Ġsmiling":12382,"Ġstrikeouts":12383,"Ġpupils":12384,"Ġcomplications":12385,"ĠAdvanced":12386,"ĠMonetary":12387,"ĠTall":12388,"ĠALL":12389,"Ġcontributor":12390,"ĠAdvertising":12391,"Ġhorrific":12392,"Ġcompeted":12393,"ĠKenneth":12394,"Ġhailed":12395,"Ġbones":12396,"Ġbolster":12397,"ĠBoss":12398,"Ġhospitalized":12399,"ĠTelegraph":12400,"ĠIndependence":12401,"Ġdr":12402,"ĠHang":12403,"Ġdocumented":12404,"Ġsubtle":12405,"invest":12406,"Ġbounced":12407,"ĠMAN":12408,"Ġprofession":12409,"Ń":12410,"Ġexcellence":12411,"ĠInspector":12412,"ĠBL":12413,"Ġdisrupt":12414,"ĠWinston":12415,"ĠCommunist":12416,"ĠSharon":12417,"Ġmechanical":12418,"Ġtreats":12419,"Ġdesperately":12420,"ĠIndy":12421,"ĠGi":12422,"ĠComposite":12423,"ĠHeath":12424,"aser":12425,"ĠCardiff":12426,"ilit":12427,"Ġeased":12428,"Ġprospective":12429,"Ġcommissioned":12430,"Ġtire":12431,"Ġalign":12432,"Ġgesture":12433,"Ġweakened":12434,"URE":12435,"SN":12436,"Ġnationals":12437,"Ġrelies":12438,"ĠIRS":12439,"ĠCount":12440,"Ġmedicines":12441,"Ġcongress":12442,"Ġstranger":12443,"Qu":12444,"lessly":12445,"ĠQueens":12446,"ĠAlleg":12447,"uing":12448,"ĠWy":12449,"ĠMiguel":12450,"idi":12451,"Ġcivic":12452,"ĠPetro":12453,"endo":12454,"Obviously":12455,"Ġreflection":12456,"ĠStop":12457,"ĠFitzgerald":12458,"placed":12459,"shore":12460,"Ġcorrectly":12461,"ĠNE":12462,"amy":12463,"ĠCT":12464,"some":12465,"ĠMb":12466,"oi":12467,"ĠHogan":12468,"ĠInnovation":12469,"ĠVilla":12470,"ĠCAN":12471,"ĠCemetery":12472,"into":12473,"Ġquestionable":12474,"Ġcreator":12475,"rug":12476,"Ġsemifinals":12477,"mission":12478,"Ġcle":12479,"ĠWaters":12480,"ĠNixon":12481,"ĠBT":12482,"Ġassuming":12483,"ĠJer":12484,"ĠClay":12485,"pack":12486,"ĠCool":12487,"may":12488,"Ġdecor":12489,"Ġspike":12490,"ĠSomalia":12491,"ĠKarn":12492,"ĠDamascus":12493,"Shares":12494,"Ġsus":12495,"ĠMoss":12496,"Ġ1985":12497,"Ġsuperintendent":12498,"ĠResults":12499,"Ġspends":12500,"prom":12501,"Ġshipped":12502,"Ġlaundering":12503,"ĠLeslie":12504,"Ġmeteor":12505,"Ġabandon":12506,"Ġdeliberately":12507,"ĠSentinel":12508,"Ġfascinating":12509,"Ġenrollment":12510,"ĠExperts":12511,"ĠSimilarly":12512,"ĠCuomo":12513,"bor":12514,"Ġune":12515,"neutral":12516,"Ġhamstring":12517,"Ġnegotiated":12518,"zes":12519,"ĠLeo":12520,"ĠDoctor":12521,"Ġcurriculum":12522,"ĠFocus":12523,"Ġtravels":12524,"Ġbeverage":12525,"ĠIncluding":12526,"tz":12527,"type":12528,"ĠRange":12529,"Ġfloods":12530,"Ġcoached":12531,"Ġdominance":12532,"letico":12533,"ĠRafael":12534,"Ġpredictions":12535,"Ġprosperity":12536,"ĠCav":12537,"Ġclinics":12538,"ĠBanking":12539,"ĠComing":12540,"ears":12541,"ĠKaepernick":12542,"ĠBlvd":12543,"Ġretained":12544,"isions":12545,"Ġko":12546,"Ġensemble":12547,"Ġprecise":12548,"Ġcompact":12549,"MD":12550,"ĠJet":12551,"ached":12552,"ĠTru":12553,"ĠBass":12554,"ĠIcon":12555,"Ġexcluding":12556,"sur":12557,"Ġconstruct":12558,"Ġvoiced":12559,"pan":12560,"Ġinability":12561,"Ġexc":12562,"Ġmate":12563,"Ġtrailing":12564,"Ġsuccessive":12565,"Ġbets":12566,"Ġgauge":12567,"Ġminorities":12568,"ĠIND":12569,"ĠVel":12570,"ĠGP":12571,"oid":12572,"bon":12573,"Ġpred":12574,"Ġdash":12575,"Ġperformer":12576,"Ġoccasional":12577,"aken":12578,"mes":12579,"America":12580,"Ġliver":12581,"Sp":12582,"Big":12583,"Ġwildfires":12584,"ĠJackie":12585,"ĠLed":12586,"ĠFinland":12587,"Ġjurors":12588,"olic":12589,"urance":12590,"ĠEdge":12591,"open":12592,"Ġscenarios":12593,"Ġglory":12594,"entry":12595,"ĠCoffee":12596,"rep":12597,"ĠChand":12598,"ĠVas":12599,"ĠIslamabad":12600,"Ġbur":12601,"ĠFle":12602,"ĠEdition":12603,"Ġshoe":12604,"ï¸ı":12605,"**":12606,"tle":12607,"ĠEb":12608,"keeping":12609,"ĠBasketball":12610,"ĠVon":12611,"ĠCF":12612,"MENT":12613,"amm":12614,"ĠFernando":12615,"Ġcompares":12616,"ĠDouble":12617,"Ġconvictions":12618,"Ġatop":12619,"Ġcops":12620,"Ġremembers":12621,"Ġlacking":12622,"dom":12623,"itate":12624,"ĠBeauty":12625,"Ġdevelops":12626,"ĠGor":12627,"Ġfunctional":12628,"ĠCOUNTY":12629,"ĠUpon":12630,"Ġsprint":12631,"Ġinjection":12632,"Ġminors":12633,"ĠTamil":12634,"ĠGat":12635,"101":12636,"ety":12637,"Ġdrum":12638,"Ġtasked":12639,"Ġpact":12640,"Ġ170":12641,"MR":12642,"ĠRamos":12643,"Ġcandy":12644,"Sc":12645,"iced":12646,"Ġsupermarket":12647,"Ġworrying":12648,"Ġsellers":12649,"ĠTag":12650,".:":12651,"Ġmixture":12652,"oting":12653,"Bl":12654,"ĠLl":12655,"ĠJal":12656,"ican":12657,"ĠBid":12658,"country":12659,"ĠStrategy":12660,"Ġadverse":12661,"Ġplunged":12662,"ĠMit":12663,"Ġstark":12664,"aton":12665,"Ġbooking":12666,"Tr":12667,"Ġcontainers":12668,"Ġvintage":12669,"ĠPit":12670,"Ġsurfaced":12671,"Ġindependently":12672,"Ġdetection":12673,"ĠBeyon":12674,"Ġcasualties":12675,"Ġstabbing":12676,"oved":12677,"Ġbarred":12678,"Ġthereby":12679,"Ġpartnered":12680,"Ġposing":12681,"ĠShannon":12682,"ĠChapel":12683,"Ġtechnically":12684,"uous":12685,"»":12686,"ometer":12687,"Ġwildfire":12688,"share":12689,"heart":12690,"Ġammunition":12691,"Ġthrive":12692,"ĠStre":12693,"GP":12694,"cé":12695,"ĠMonaco":12696,"goal":12697,"ĠUm":12698,"ĠHSBC":12699,"ĠHilton":12700,"ĠViv":12701,"ĠKell":12702,"Ġdecisive":12703,"Ġmotive":12704,"amo":12705,"feld":12706,"ĠWH":12707,"iry":12708,"ulu":12709,"ĠSchneider":12710,"Ġcampaigning":12711,"Ġseparately":12712,"igo":12713,"ĠED":12714,"ĠRamirez":12715,"Ġmetro":12716,"ĠPatel":12717,"ĠChi":12718,"ĠAudi":12719,"Ġcharacteristics":12720,"Ġrestart":12721,"Ġkeyboard":12722,"ĠSD":12723,"his":12724,"biz":12725,"ĠSoft":12726,"ĠGrammy":12727,"Ġcontested":12728,"Ġweekends":12729,"Ġ112":12730,"Ġcycling":12731,"Ġhealthier":12732,"ija":12733,"Ġheader":12734,"Ġemploy":12735,"İ":12736,"Ġshortages":12737,"ĠAsk":12738,"ĠIvanka":12739,"Ġpartisan":12740,"Ġflowing":12741,"Ġcave":12742,"ENS":12743,"Ġups":12744,"read":12745,"ouch":12746,"Ġ102":12747,"Ġforming":12748,"bot":12749,"bie":12750,"Ġenrolled":12751,"Ġconcussion":12752,"Ġaffidavit":12753,"Ġmysterious":12754,"uries":12755,"ĠMang":12756,"Ġauthentic":12757,"Ġmetrics":12758,"ĠTwins":12759,"Ġprep":12760,"IJ":12761,"Ġdesired":12762,"ĠDiv":12763,"wall":12764,"ĠTab":12765,"Ġcompet":12766,"Ġrelied":12767,"Ġinequality":12768,"Ġmanual":12769,"ĠBucks":12770,"agging":12771,"Ġcorporation":12772,"Ġbanner":12773,"Ġgraphics":12774,"Ġaccurately":12775,"ĠMeeting":12776,"Ġconsult":12777,"ser":12778,"Ġprotesting":12779,"Ġhurting":12780,"omed":12781,"tes":12782,"Ġrode":12783,"Ġstartups":12784,"Ġhanding":12785,"ĠNest":12786,"Ġconsistency":12787,"anned":12788,"dem":12789,"ĠLyon":12790,"ĠCompetition":12791,"Ġtricky":12792,"Ġcos":12793,"ĠBengals":12794,"arry":12795,"Ġunderwent":12796,"ĠKit":12797,"à":12798,"uploads":12799,"Ġskate":12800,"Ġ''":12801,"Ġjun":12802,"ĠContent":12803,"focused":12804,"lat":12805,"ĠExp":12806,"ought":12807,"Ġnightmare":12808,"ĠExpect":12809,"Ġprecisely":12810,"ĠMonica":12811,"Ġlobbying":12812,"ĠChester":12813,"ĠInvest":12814,"Former":12815,"Ġimminent":12816,"ĠNL":12817,"Ġcomparing":12818,"ĠChes":12819,"ede":12820,"ĠNobel":12821,"mers":12822,"ĠKin":12823,"ĠBoko":12824,"ount":12825,"Ġthoroughly":12826,"Ġscattered":12827,"sharing":12828,"markets":12829,"ĠMis":12830,"Ġambition":12831,"Ġpreference":12832,"Ġeffectiveness":12833,"rio":12834,"Ġheavyweight":12835,"Ġovert":12836,"anya":12837,"ĠKanye":12838,"ishi":12839,"Ġrewards":12840,"uled":12841,"bach":12842,"Ġemphasized":12843,"Ġapologize":12844,"ĠRecent":12845,"!!":12846,"Ġanimated":12847,"ĠExxon":12848,"Ġfruits":12849,"Ġstripped":12850,"fold":12851,"ĠIndonesian":12852,"ller":12853,"Ġdementia":12854,"Ġkidney":12855,"Ġhalted":12856,"years":12857,"Ġconcerts":12858,"Ġrefers":12859,"ĠFri":12860,"Your":12861,"irl":12862,"Ġleap":12863,"jud":12864,"ĠHugh":12865,"ĠFO":12866,"Ġsore":12867,"Ġkil":12868,"ĠMate":12869,"cci":12870,"Ġsetback":12871,"Ġtightening":12872,"keeper":12873,"ĠAlbany":12874,"Ġpolicymakers":12875,"Ġdisorders":12876,"ĠCBC":12877,"ĠDiaz":12878,"Ġmaps":12879,"Ġroutinely":12880,"Ġverify":12881,"Ġbash":12882,"ĠJinping":12883,"Ġdisasters":12884,"ĠMonroe":12885,"ĠLouise":12886,"JP":12887,"ĠNevertheless":12888,"Ġconcessions":12889,"ĠPog":12890,"going":12891,"ĠFifth":12892,"ĠJill":12893,"ICT":12894,"ĠFM":12895,"ĠSugar":12896,"ĠBarb":12897,"Ġmidway":12898,"Ġtin":12899,"ĠPic":12900,"ĠPL":12901,"Ġleaks":12902,"Ġgrief":12903,"Ġtattoo":12904,"`":12905,"Ġment":12906,"ĠNu":12907,"Ġmarry":12908,"Ġdiving":12909,"Ġ1982":12910,"Ġcoin":12911,"ĠPoc":12912,"Ġstarred":12913,"ĠRiverside":12914,"Ġsidelined":12915,"Ġminers":12916,"STON":12917,"Ġbelongs":12918,"ĠSantos":12919,"ĠTechnical":12920,"aco":12921,"Ġadvise":12922,"Ġstreams":12923,"Ġcooler":12924,"ĠHE":12925,"Ġordering":12926,"ĠTask":12927,"ĠACT":12928,"ĠAnton":12929,"Ġcertification":12930,"ĠLeafs":12931,"ĠTS":12932,"ĠSerbia":12933,"azi":12934,"inks":12935,"ĠEST":12936,"Ġrelay":12937,"°":12938,"Ġdisappearance":12939,"ĠRomania":12940,"Ġoven":12941,"Ġowed":12942,"ĠStrip":12943,"ulated":12944,"UC":12945,"ITE":12946,"bling":12947,"Then":12948,"ppy":12949,"Ġunlimited":12950,"Ġcalories":12951,"Ġmerchandise":12952,"Ġblonde":12953,"ĠSpicer":12954,"performing":12955,"Ġimpl":12956,"Ġplates":12957,"Ġmosque":12958,"Ġdemon":12959,"Ġought":12960,"Ġdumped":12961,"Ġtracked":12962,"even":12963,"Ġstabil":12964,"imet":12965,"ĠLiga":12966,"ugh":12967,"ther":12968,"agar":12969,"Ġarchitect":12970,"Ġallocated":12971,"ĠJoey":12972,"Ġmarathon":12973,"master":12974,"ĠBert":12975,"Ġast":12976,"ĠEbola":12977,"ĠConservation":12978,"nic":12979,"Ġparallel":12980,"Ġinmate":12981,"Ġlocate":12982,"Ġdistribute":12983,"guard":12984,"Ġtackling":12985,"ential":12986,"Ġvi":12987,"Ġcups":12988,"Ġrhythm":12989,"Ġendured":12990,"ĠHub":12991,"ois":12992,"ĠLiberals":12993,"ĠRedskins":12994,"ĠEP":12995,"ĠKnox":12996,"fr":12997,"Ġmassacre":12998,"oka":12999,"Ġcompl":13000,"raft":13001,"ĠPublished":13002,"Ġattraction":13003,"ĠStephens":13004,"ility":13005,"ĠPul":13006,"ĠCapt":13007,"Ġexploded":13008,"Ġexceeded":13009,"lying":13010,"Ġcal":13011,"Mart":13012,"Ġpaintings":13013,"inate":13014,"ĠBrendan":13015,"Ġfortune":13016,"onductor":13017,"Ġphysicians":13018,"ĠStudy":13019,"ĠBul":13020,"ĠModern":13021,"HD":13022,"ĠBour":13023,"Ġtying":13024,"Ġ1967":13025,"Ġlighter":13026,"Ġtoss":13027,"inspired":13028,"Ġgreeted":13029,"Ġcycl":13030,"Ġverified":13031,"Ġmerit":13032,"sign":13033,"lder":13034,"Ġdebts":13035,"ĠSnyder":13036,"Ġamendments":13037,"Ġindicators":13038,"ĠDortmund":13039,"then":13040,"ĠListen":13041,"ĠFB":13042,"ref":13043,"ĠIoT":13044,"ĠBrewers":13045,"ĠLeadership":13046,"ĠNicolas":13047,"ĠBody":13048,"Ġsam":13049,"ĠAdvisor":13050,"Ġcord":13051,"Ġabuses":13052,"ĠPortuguese":13053,"Ġflown":13054,"VR":13055,"Ġconsumed":13056,"Ġreass":13057,"Ġalien":13058,"Ġrivalry":13059,"ĠREPORT":13060,"ĠRush":13061,"Ġdirecting":13062,"Ġsearches":13063,"ĠHP":13064,"ĠRoll":13065,"ĠFay":13066,"ĠClare":13067,"Ġhaul":13068,"Ġriot":13069,"Ġsettlements":13070,"Ġnorm":13071,"Ġaccelerated":13072,"ĠLok":13073,"Ġclever":13074,"Ġhyd":13075,"Ġstats":13076,"ĠHull":13077,"kers":13078,"Ġbuys":13079,"uter":13080,"Ġfue":13081,"https":13082,"UD":13083,"Ġisolation":13084,"Ġsuspend":13085,"ĠRules":13086,"ĠCircle":13087,"ĠHopefully":13088,"played":13089,"â̳":13090,"ĠPRE":13091,"sim":13092,"edd":13093,"ĠProperties":13094,"Ġbeans":13095,"Ġrevive":13096,"ĠBir":13097,"oug":13098,"Ġmob":13099,"Ġshowdown":13100,"iman":13101,"Ġpap":13102,"Ġvol":13103,"wu":13104,"Ġdiver":13105,"Ġpill":13106,"ĠMarlins":13107,"ĠLamar":13108,"Ġpersistent":13109,"Ġcondolences":13110,"ĠThor":13111,"Ab":13112,"Ġimpress":13113,"ĠRaptors":13114,"Ġreferences":13115,"Ġstiff":13116,"ĠBash":13117,"eding":13118,"Ġmurders":13119,"ĠGene":13120,"ĠManila":13121,"Ġbrokers":13122,"Ms":13123,"start":13124,"ĠDhabi":13125,"etz":13126,"Ġsubmission":13127,"ĠSchmidt":13128,"ĠPersonal":13129,"ĠBeverly":13130,"ĠMovie":13131,"ĠLamb":13132,"Ġplacement":13133,"Ġfolk":13134,"Ġfrequency":13135,"Ġplanted":13136,"Ġtwins":13137,"prov":13138,"rec":13139,"Ġpermanently":13140,"Ġcoordination":13141,"ĠCart":13142,"Ġobstacles":13143,"Ġliterature":13144,"Ġtu":13145,"Ġchill":13146,"ĠReserved":13147,"Ġlovers":13148,"ĠOutside":13149,"Ġslideshow":13150,"ĠGru":13151,"Ġty":13152,"Ġsalad":13153,"Ġlaboratory":13154,"ĠHolt":13155,"Ġ103":13156,"urb":13157,"ĠOrganisation":13158,"ĠAndrews":13159,"Ġrecipient":13160,"arch":13161,"Ġbleeding":13162,"ĠPand":13163,"Ġoverturned":13164,"Ġlistened":13165,"Ġclause":13166,"Ġnationalist":13167,"Ġresumed":13168,"ĠCout":13169,"ĠPride":13170,"Ġlayers":13171,"ĠBella":13172,"Ġreversed":13173,"Ġpriest":13174,"ĠFX":13175,"Ġalbeit":13176,"Ġhalfway":13177,"Ġcotton":13178,"ĠCarey":13179,"ĠTE":13180,"OCK":13181,"Ġbuck":13182,"ributes":13183,"ea":13184,"Ġfancy":13185,"ĠBuc":13186,"Ġbans":13187,"uters":13188,"Ġliabilities":13189,"ĠSou":13190,"ĠBernie":13191,"Ġintervene":13192,"food":13193,"ĠNDP":13194,"Ġinsist":13195,"Ġcontracted":13196,"hawk":13197,"),\"":13198,"ĠDawn":13199,"Ġmol":13200,"Ġcommissioners":13201,"Ġstranded":13202,"Ġoverwhelmed":13203,"Ġrecipes":13204,"Ġva":13205,"Ġrad":13206,"Ġscare":13207,"rez":13208,"Ġeliminating":13209,"Ġresc":13210,"ĠBreak":13211,"chn":13212,"Ġdelight":13213,"iot":13214,"Ġfreely":13215,"TI":13216,"ĠBluetooth":13217,"ĠMonth":13218,"ĠFlor":13219,"ĠFreddie":13220,"Ġtrailed":13221,"Ġinvestigative":13222,"Ġimposing":13223,"Ġattracting":13224,"awk":13225,"ĠSherman":13226,"Ġsucceeded":13227,"Ġvent":13228,"Ġreconciliation":13229,"ĠCel":13230,"ĠThroughout":13231,"ĠDowntown":13232,"ĠBrother":13233,"Ġtraditions":13234,"Ġmir":13235,"Ġstamp":13236,"tery":13237,"etti":13238,"isch":13239,"tic":13240,"Ġbanning":13241,"loss":13242,"ĠSpeedway":13243,"Ġstalled":13244,"ĠEN":13245,"ASH":13246,"thing":13247,"ĠAppeals":13248,"rac":13249,"Ġdistress":13250,"ĠConservatives":13251,"ĠPremium":13252,"usa":13253,"Ġslump":13254,"imm":13255,"ĠSupp":13256,"ĠWong":13257,"Ġdistant":13258,"Ġ104":13259,"Ġtide":13260,"ĠNorfolk":13261,"ĠYang":13262,"Ġsmashed":13263,"ĠBarrett":13264,"inho":13265,"Ġrobbed":13266,"ĠFarmers":13267,"filled":13268,"BT":13269,"Ġautumn":13270,"Ġtemple":13271,"ĠJacobs":13272,"Ġprecipitation":13273,"ĠHours":13274,"ĠFlight":13275,"Ġbeside":13276,"ĠOre":13277,"!)":13278,"ĠTurnbull":13279,"Ġpig":13280,"Ġcooling":13281,"Ġservers":13282,"oriented":13283,"Ġlocks":13284,"ĠSears":13285,"aving":13286,"ĠQuick":13287,"ĠGlob":13288,"ĠMining":13289,"Ġhorizon":13290,"arians":13291,"ĠOm":13292,"writing":13293,"Ġbelieving":13294,"Ġbon":13295,"Ġmounted":13296,"Ġpunt":13297,"ucci":13298,"uzz":13299,"cul":13300,"Ġkiss":13301,"ĠOnt":13302,"ĠCyprus":13303,"Ġrelying":13304,"Ġpiano":13305,"Ġcure":13306,"Ġcontinuously":13307,"ĠNobody":13308,"ĠBund":13309,"osis":13310,"ĠAurora":13311,"ĠBach":13312,"ĠKendall":13313,"Ġechoed":13314,"iable":13315,"Ġconscious":13316,"Ġmonster":13317,"omo":13318,"proof":13319,"ĠNate":13320,"Ġfilmmaker":13321,"ĠNaj":13322,"Ġvendor":13323,"ĠFoot":13324,"ĠChang":13325,"ĠFest":13326,"Ġselfie":13327,"Ġenters":13328,"ĠConor":13329,"ĠMosul":13330,"ĠWHAT":13331,"Ġwa":13332,"ĠGamb":13333,"osta":13334,"Ġcautioned":13335,"ĠTucker":13336,"ĠAirways":13337,"Ġvisitor":13338,"Ġ·":13339,"ĠRevolution":13340,"aching":13341,"Ġearliest":13342,"ĠQuality":13343,"Ġshorts":13344,"ube":13345,"ĠOperation":13346,"ĠSabha":13347,"Ġstrengths":13348,"ikes":13349,"Ġsexy":13350,"Ġrot":13351,"ibles":13352,"Ġcolours":13353,"THE":13354,"ailed":13355,"Ġwoke":13356,"ĠEmbassy":13357,"Ġinfamous":13358,"rov":13359,"State":13360,"â̦.":13361,"Ġpond":13362,"Ġcapt":13363,"fore":13364,"De":13365,"Ġedited":13366,"self":13367,"Hey":13368,"Ġportrait":13369,"ĠManufact":13370,"ĠStand":13371,"Ġcontenders":13372,"':":13373,"acker":13374,"Ġwithdrawn":13375,"ĠBraves":13376,"ĠHosp":13377,"changing":13378,"ĠBag":13379,"Ġadjustment":13380,"ĠCousins":13381,"ĠAAP":13382,"Ġfi":13383,"Ġoutdoors":13384,"Ġlacked":13385,"BM":13386,"ĠWHO":13387,"ĠPST":13388,"ĠLuck":13389,"Ġassisting":13390,"ĠGround":13391,"ĠTeen":13392,"ĠOle":13393,"Ġembarrassing":13394,"ĠWalt":13395,"ĠVision":13396,"ĠFal":13397,"ĠZoo":13398,"ĠWorth":13399,"ĠFloyd":13400,"ĠGujarat":13401,"Ġtipped":13402,"Ġfam":13403,"ĠDad":13404,"Ġworship":13405,"Ġtyre":13406,"Ġrebuilding":13407,"Ġqualities":13408,"ĠLives":13409,"Ġbeats":13410,"Ġ450":13411,"Ġexisted":13412,"ĠGeorg":13413,"Ġpoured":13414,"rows":13415,"ĠOx":13416,"ĠSid":13417,"Ġmac":13418,"Ġteaches":13419,"ĠEli":13420,"alla":13421,"Ġdownside":13422,"ĠBend":13423,"non":13424,"ĠArmenia":13425,"Ġcultures":13426,"ĠMae":13427,"Ġduration":13428,"ĠAthletics":13429,"Ġjuvenile":13430,"Ġlid":13431,"Ġbankers":13432,"Ġoverview":13433,"wy":13434,"Ġorbit":13435,"Vs":13436,"because":13437,"Ps":13438,"ĠFran":13439,"Ġtouring":13440,"Ġwary":13441,"Ġ106":13442,"Ġlaser":13443,"ĠVij":13444,"âĦ¢":13445,"Ġsurrender":13446,"press":13447,"rees":13448,"NO":13449,"ĠShortly":13450,"ĠKor":13451,"edu":13452,"Ġhatred":13453,"Ġtee":13454,"Ġfamously":13455,"Ġkeeper":13456,"ND":13457,"Ġreduces":13458,"HC":13459,"Ġhay":13460,"Ġunnamed":13461,"ĠTes":13462,"Ġattackers":13463,"ĠFew":13464,"ĠRichards":13465,"Ġ1968":13466,"Ġspeeches":13467,"Ġcybersecurity":13468,"ĠInfrastructure":13469,"Ġ07":13470,"ENCE":13471,"uties":13472,"Ġanxious":13473,"ĠGang":13474,"Ġannouncements":13475,"lette":13476,"oret":13477,"ĠRockies":13478,"ĠEmployees":13479,"ĠThrones":13480,"Ġhugely":13481,"Ġclin":13482,"ĠHob":13483,"Ġfraction":13484,"ĠOfficial":13485,"ĠMariners":13486,"ĠElse":13487,"Ġsanctuary":13488,"ĠPhotograph":13489,"Ġreopen":13490,"lf":13491,"hm":13492,"vest":13493,"Ġspeeding":13494,"Ġtooth":13495,"ĠShi":13496,"ĠTitle":13497,"ĠMes":13498,"ĠJobs":13499,"fair":13500,"ĠDanish":13501,"ĠMalik":13502,"Ġlaughed":13503,"Ġnavy":13504,"ĠActress":13505,"ĠWilliamson":13506,"overs":13507,"Ġreckless":13508,"Ġjo":13509,"otic":13510,"Ġassaulting":13511,"Ġpri":13512,"ĠPi":13513,"Ġlesser":13514,"Ġtit":13515,"Ġdat":13516,"Ġnail":13517,"ĠMarathon":13518,"ĠGren":13519,"ĠDol":13520,"Ġjointly":13521,"Ġamended":13522,"mine":13523,"ĠBashar":13524,"ĠHyundai":13525,"Ġuncovered":13526,"Ġeducated":13527,"atti":13528,"pres":13529,"ĠBRE":13530,"Ġya":13531,"Bank":13532,"odd":13533,"lit":13534,"ĠLinks":13535,"Ġswitching":13536,"itte":13537,"ĠSind":13538,"erved":13539,"Ġ**":13540,"Ġpositively":13541,"Ġfrankly":13542,"Ġrevenge":13543,"ĠTrinity":13544,"ĠCDC":13545,"Ġthreatens":13546,"Ġhammer":13547,"NET":13548,"ĠMut":13549,"Ġsy":13550,"Ġunidentified":13551,"icken":13552,"Ġdrills":13553,"Ġtense":13554,"Ġforeigners":13555,"OST":13556,"Ġethical":13557,"ĠDurham":13558,"ĠQual":13559,"Ġterritories":13560,"Ġid":13561,"hor":13562,"enders":13563,"Mc":13564,"OV":13565,"percent":13566,"Ġdom":13567,"Ġupward":13568,"Ġamb":13569,"Ġvisas":13570,"zan":13571,"Ãĥ":13572,"Ġundocumented":13573,"Ġsuburbs":13574,"Ġhydro":13575,"ĠJob":13576,"ĠAdelaide":13577,"oya":13578,"ĠSR":13579,"ĠMick":13580,"Ġconsolidation":13581,"Ġemotionally":13582,"ĠHop":13583,"Her":13584,"Ġloses":13585,"ĠMoto":13586,"eled":13587,"Ġregulated":13588,"ental":13589,"Ġencountered":13590,"Ġhop":13591,"ĠTrafford":13592,"Ġsticks":13593,"Ġveto":13594,"Ġexpose":13595,"Ġstretched":13596,"fin":13597,"inance":13598,"chair":13599,"ĠGareth":13600,"ĠPil":13601,"ĠHammond":13602,"Ġserial":13603,"omy":13604,"Ġcellphone":13605,"ĠClara":13606,"Ġreacted":13607,"ĠNic":13608,"ĠHomes":13609,"ĠBroadcasting":13610,"ĠFut":13611,"ĠSupply":13612,"assing":13613,"ĠNewman":13614,"Ġcharitable":13615,"ĠClayton":13616,"Ġsovereignty":13617,"Ġconvincing":13618,"ĠPrincipal":13619,"ĠHigher":13620,"ĠCut":13621,"ĠCarrie":13622,"ĠSpot":13623,"Sometimes":13624,"ĠJar":13625,"ĠConsider":13626,"ieu":13627,"Ġrefinery":13628,"Ġbloody":13629,"wheel":13630,"Ġcryptocurrencies":13631,"Fund":13632,"ĠSunderland":13633,"ĠEvents":13634,"âĢĭ":13635,"Ġaccidentally":13636,"deep":13637,"Ġfranc":13638,"bec":13639,"ĠHartford":13640,"Ġstellar":13641,"wright":13642,"kick":13643,"UG":13644,"ĠBeast":13645,"Ġrefusal":13646,"ĠRoberto":13647,"ĠDixon":13648,"ĠDiane":13649,"name":13650,"asts":13651,"ĠCharter":13652,"Ġfueled":13653,"Ġcontents":13654,"Ġaccessing":13655,"Ġtroubles":13656,"Ġtops":13657,"Ġdebuted":13658,"icating":13659,"Ġinvestigator":13660,"Ġsubscribing":13661,"Ġcoordinated":13662,"ĠFil":13663,"six":13664,"teen":13665,"Ġwithdrew":13666,"ĠGilbert":13667,"Ġ1983":13668,"arsity":13669,"Ġimagination":13670,"Ġhandgun":13671,"ĠAlibaba":13672,"Ġbug":13673,"Ġ107":13674,"ĠCOMP":13675,"ĠSomething":13676,"Ġreliability":13677,"ĠFCC":13678,"ĠFowler":13679,"Ġsingled":13680,"nom":13681,"Ġknocking":13682,"Ġmeddling":13683,"Ġdetermining":13684,"reports":13685,"Ġshade":13686,"ĠSN":13687,"anto":13688,"Ġcomplaining":13689,"ĠNan":13690,"WS":13691,"Ġyoungsters":13692,"Il":13693,"ĠKaw":13694,"ĠProp":13695,"ĠCell":13696,"ĠHurricanes":13697,"Ġpublicity":13698,"ĠXin":13699,"rial":13700,"ICO":13701,"Ġsupervision":13702,"ĠSpotify":13703,"ĠNewport":13704,"Ġprince":13705,"anche":13706,"Ġsubscriber":13707,"ĠVic":13708,"ACT":13709,"ĠRaf":13710,"ĠActing":13711,"Ġcollusion":13712,"pet":13713,"isl":13714,"Ġcommerce":13715,"Health":13716,"ĠAbraham":13717,"pri":13718,"Ġlightweight":13719,"Ġinsurer":13720,"Like":13721,"Ġhelmet":13722,"Ġevac":13723,"look":13724,"ĠNaval":13725,"160":13726,"ĠFleet":13727,"vol":13728,"Ġexpired":13729,"ĠKlein":13730,"ĠEmmy":13731,"ABLE":13732,"ĠMorocco":13733,"ĠTrip":13734,"uted":13735,"Ġnos":13736,"ĠVista":13737,"mas":13738,"ĠRocky":13739,"ĠFlint":13740,"enberg":13741,"ĠBrow":13742,"Ġsignatures":13743,"Ġpolar":13744,"ajo":13745,"Ġendorsement":13746,"Ġreservations":13747,"LIN":13748,"anny":13749,"elli":13750,"last":13751,"Ġoversee":13752,"cm":13753,"ĠOilers":13754,"Are":13755,"Ġjudiciary":13756,"onte":13757,"ĠTrack":13758,"Ġsupervisor":13759,"erk":13760,"isher":13761,"Ġintact":13762,"Ġslid":13763,"icals":13764,"paid":13765,"ĠMAR":13766,"lement":13767,"ĠLiu":13768,"ĠLarge":13769,"ĠWings":13770,"pect":13771,"ĠRum":13772,"Ġanalyzed":13773,"Ġemploys":13774,"arte":13775,"ims":13776,"ĠEventually":13777,"Ġaffiliated":13778,"Ġhospitality":13779,"ĠSprint":13780,"Ġresolutions":13781,"Ġliquor":13782,"ĠNAFTA":13783,"ANY":13784,"Ġradiation":13785,"ĠProv":13786,"Ġpause":13787,"ĠTMZ":13788,"Ġelbow":13789,"Ġresilience":13790,"ĠParents":13791,"mus":13792,"ĠSafe":13793,"Ġinterpretation":13794,"Ġraced":13795,"IND":13796,"KR":13797,"Ġhinted":13798,"ĠErin":13799,"ĠBahrain":13800,"Ġcredentials":13801,"eless":13802,"Ġprocurement":13803,"ĠWebb":13804,"ĠLowe":13805,"ĠNak":13806,"ĠLearning":13807,"zh":13808,"Ġdipped":13809,"ĠSuite":13810,"Ġmisdemeanor":13811,"ALE":13812,"Ġstrengthened":13813,"ĠSophie":13814,"Ġconfirms":13815,"Ġrac":13816,"gey":13817,"Ġshootout":13818,"Ġble":13819,"Ġcircles":13820,"ĠChef":13821,"Ġcomprised":13822,"ĠSantiago":13823,"Ġfeud":13824,"beat":13825,"Ġstaffers":13826,"Ġacute":13827,"ski":13828,"Ġpolled":13829,"ĠKur":13830,"ĠJen":13831,"ĠUltimately":13832,"anded":13833,"ĠHoney":13834,"Ġannounces":13835,"Ġamateur":13836,"around":13837,"Ġfunctioning":13838,"group":13839,"ĠSqu":13840,"Where":13841,"Ġvoid":13842,"ĠSandra":13843,"isers":13844,"Ġhelicopters":13845,"ĠGym":13846,"ĠWol":13847,"mouth":13848,"Ġsubjected":13849,"ici":13850,"ually":13851,"ĠWash":13852,"ĠLindsay":13853,"ĠVers":13854,"Ġjumps":13855,"Ġneglect":13856,"ĠKuwait":13857,"fund":13858,"ĭ":13859,"ather":13860,"lly":13861,"ei":13862,"Although":13863,".''":13864,"Ġunhappy":13865,"Ġpills":13866,"Ġmagical":13867,"Ġdro":13868,"Ġinviting":13869,"ĠJohnston":13870,"oving":13871,"450":13872,"ĠMerc":13873,"Ġadmitting":13874,"Ġinsisting":13875,"ĠCru":13876,"ĠResource":13877,"oir":13878,"Ġcomplexity":13879,"ĠRoth":13880,"ĠCher":13881,"July":13882,"raf":13883,"Ġaggregate":13884,"Ġhelm":13885,"uclear":13886,"olan":13887,"Ġoffenses":13888,"ĠWolves":13889,"ĠFu":13890,"ĠPierce":13891,"Ġemailed":13892,"ĠStra":13893,"Ġpedestrians":13894,"ĠER":13895,"ĠConway":13896,"Ġblowing":13897,"CLOSE":13898,"hab":13899,"ĠGreene":13900,"Ġconfessed":13901,"ĠTorres":13902,"ĠHolocaust":13903,"Ġrepay":13904,"Ġdemonstrates":13905,"ĠPool":13906,"gent":13907,"Ġdeleted":13908,"Ġ$$":13909,"ĠSO":13910,"Ġdri":13911,"ĠNeg":13912,"ĠVP":13913,"ĠPF":13914,"ĠPrep":13915,"Ġorganizing":13916,"icker":13917,"Ġmanufactured":13918,"enson":13919,"adas":13920,"Ġwines":13921,"Ġmachinery":13922,"Ġspecialists":13923,"ĠDetective":13924,"ĠDL":13925,"Op":13926,"Ġquicker":13927,"ĠPenguins":13928,"Engine":13929,"zone":13930,"Ġsequence":13931,"ĠLost":13932,"Ġwarmer":13933,"ĠEthiopia":13934,"Ġaffirmed":13935,"fest":13936,"resses":13937,"Ġsoap":13938,"Ġbooth":13939,"Ġnotorious":13940,"amin":13941,"Ġpursued":13942,"ĠCer":13943,"ĠSB":13944,"Ġlivestock":13945,"Ġtrace":13946,"Ġrespects":13947,"arden":13948,"April":13949,"Ġ128":13950,"ĠSaid":13951,"ennial":13952,"Ġnamely":13953,"ĠBot":13954,"Ġ108":13955,"ĠLem":13956,"nell":13957,"Ġconfirming":13958,"Ġlogged":13959,"Ġprofound":13960,"elo":13961,"ĠChambers":13962,"RT":13963,"Ġnewer":13964,"Ġsideline":13965,"ĠCardinal":13966,"este":13967,"Ġnarrowly":13968,"Ġcompromised":13969,"Ġpolicing":13970,"Ġporn":13971,"Ġarc":13972,"Ġlearnt":13973,"INE":13974,"step":13975,"ĠDomin":13976,"Ġwaist":13977,"Ġboycott":13978,"mitted":13979,"iffs":13980,"ground":13981,"ĠMaterials":13982,"Ġceasefire":13983,"Right":13984,"ĠZen":13985,"estyle":13986,"Thank":13987,"ĠOnePlus":13988,"ĠMLS":13989,"Ġconstituents":13990,"oster":13991,"ĠProsecutor":13992,"Ġpriorit":13993,"ĠDebbie":13994,"ĠExpand":13995,"uv":13996,"Ġintegrate":13997,"Ġimmun":13998,"Ġdisciplinary":13999,"ĠImm":14000,"Ġja":14001,"Ġgardens":14002,"ĠHim":14003,"obe":14004,"Ġhitter":14005,"Ġbullets":14006,"Ġevolving":14007,"ĠScientists":14008,"Michael":14009,"ĠDO":14010,"Ġunbelievable":14011,"Ġlooming":14012,"Ġdownturn":14013,"Ġmentality":14014,"Ġreopened":14015,"Ġash":14016,"ĠChapman":14017,"Ġloop":14018,"ĠUT":14019,"ĠTier":14020,"Ġunaware":14021,"Ġgratitude":14022,"Ġperforms":14023,"olk":14024,"Ġ\"(":14025,"Ġlacks":14026,"Ġinstructed":14027,"ĠRecreation":14028,"sample":14029,"Ġrequesting":14030,"Canada":14031,"Ġsupposedly":14032,"ĠHardy":14033,"Ġholder":14034,"change":14035,"ĠDominic":14036,"ĠXavier":14037,"Ġlig":14038,"Ġcandid":14039,"ĠRab":14040,"Ġconferences":14041,"ĠBurton":14042,"Dr":14043,"Ġmunicipalities":14044,"Ġcrushed":14045,"Ġseekers":14046,"ĠCitizens":14047,"Ġheightened":14048,"ĠCasino":14049,"Ġdesktop":14050,"Ġwhoever":14051,"ĠImpact":14052,"Ġcocktail":14053,"Ġphilanthrop":14054,"ĠSAN":14055,"ĠPreston":14056,"Ġobesity":14057,"Ġrestrict":14058,"ĠKab":14059,"ĠProvidence":14060,"Ġscar":14061,"ĠChart":14062,"Ġbosses":14063,"ĠRate":14064,"Ġsav":14065,"pay":14066,"Ġtransplant":14067,"ĠNoble":14068,"child":14069,"Ġconclusions":14070,"FI":14071,"Ġsack":14072,"Ġexperimental":14073,"holder":14074,"oca":14075,"herty":14076,"ĠMT":14077,"Ġcatcher":14078,"LY":14079,"Ġgrams":14080,"reet":14081,"Ġadaptation":14082,"Ġhumble":14083,"Ġbot":14084,"Ġidentical":14085,"ication":14086,"ifer":14087,"ĠCrow":14088,"Ġregain":14089,"ĠLightning":14090,"Ġkg":14091,"Ġcomposed":14092,"Ġcorrespondent":14093,"Ġreunion":14094,"Ġobserve":14095,"Ġcomprising":14096,"Ġimpeachment":14097,"Ġresh":14098,"Ġlemon":14099,"ĠSnap":14100,"Ġproprietary":14101,"een":14102,"ourt":14103,"Ġdetective":14104,"Ġlabels":14105,"Ġcorridor":14106,"ĠClinic":14107,"Ġarra":14108,"ĠPearl":14109,"Ġinformal":14110,"ĠUnd":14111,"ĠVenezuelan":14112,"Ġpeninsula":14113,"Ġdefeating":14114,"Ġsyndrome":14115,"iere":14116,"Ġspite":14117,"bag":14118,"aran":14119,"Ġspecialized":14120,"ĠAA":14121,"ĠLyn":14122,"Ġinstrumental":14123,"Smith":14124,"Ġpivotal":14125,"Ġnightclub":14126,"ĠCob":14127,"Ġcolorful":14128,"Ġartwork":14129,"Ġ1981":14130,"Ġdawn":14131,"erville":14132,"uated":14133,"ief":14134,"Ġlinking":14135,"ĠOw":14136,"Ġappreci":14137,"Ġreductions":14138,"elling":14139,"Ġsalmon":14140,"bb":14141,"ĠPhillip":14142,"yle":14143,"Ġassure":14144,"Ġdiscretion":14145,"Ġefficiently":14146,"ĠMau":14147,"abil":14148,"Ġintentionally":14149,"Ġactivated":14150,"Ġimmense":14151,"ĠStrategic":14152,"Ġcheating":14153,"ĠTrend":14154,"ĠSamantha":14155,"Ġcomple":14156,"Ġhack":14157,"ĠSerie":14158,"ĠText":14159,"Ġstylish":14160,"ĠFaith":14161,"ĠGST":14162,"Ġexterior":14163,"Ġblessing":14164,"Ġblanket":14165,"Ġcooked":14166,"Ġretaliation":14167,"Ġtro":14168,"Ġshelves":14169,"rose":14170,"ĠGram":14171,"Ġsho":14172,"ĠArgentine":14173,"Ġclerk":14174,"specific":14175,"Ġagreeing":14176,"Ġstandout":14177,"black":14178,"Ġtrending":14179,"Ġviolate":14180,"Get":14181,"ño":14182,"ĠOpt":14183,"ĠFrankfurt":14184,"ĠFranco":14185,"eness":14186,"Ġlining":14187,"Ġzoo":14188,"oil":14189,"lia":14190,"rab":14191,"Ġorganize":14192,"Ġwoods":14193,"Ġscan":14194,"Ġurgency":14195,"Ġoccurring":14196,"Ġreliance":14197,"Ġconcepts":14198,"Ġeligibility":14199,"0000":14200,"ĠBrief":14201,"Ġabusive":14202,"ĠBench":14203,"Ġrub":14204,"ĠDil":14205,"Ġmount":14206,"Ġmaturity":14207,"ĠNut":14208,"nee":14209,"enc":14210,"Ġgunfire":14211,"ĠKill":14212,"Ġgates":14213,"Ġflower":14214,"iol":14215,"Ġshaped":14216,"Ġundoubtedly":14217,"Ġbackgrounds":14218,"ĠComplex":14219,"\":{\"":14220,"Ġnaming":14221,"Ġmonument":14222,"Ġoh":14223,"Ġembedded":14224,"Ġbang":14225,"ĠKro":14226,"Ġaggression":14227,"ĠMits":14228,"During":14229,"ĠEp":14230,"iners":14231,"ĠAnaheim":14232,"Ġrom":14233,"Ġoutgoing":14234,"Ġfulfill":14235,"Ġreminds":14236,"Ġren":14237,"à¤":14238,"ĠSue":14239,"Ġrefresh":14240,"Ġlif":14241,"Ġfil":14242,"ĠLead":14243,"Ġregulate":14244,"ĠTeachers":14245,"Ġclarify":14246,"obs":14247,"Ġblasted":14248,"ĠAx":14249,"Ġflavors":14250,"Ġmega":14251,"Ġhurdles":14252,"Ġinspector":14253,"ĠSalvador":14254,"Ġprescribed":14255,"Ġrenovation":14256,"OUR":14257,"Ġutil":14258,"ĠBradford":14259,"Ġwasted":14260,"Ġlineman":14261,"Ġpalm":14262,"icate":14263,"Ġoverseeing":14264,"otted":14265,"ĠRapids":14266,"Ġjustified":14267,"aby":14268,"Ġextends":14269,"Ġoath":14270,"bow":14271,"ĠRivera":14272,"Jan":14273,"ĠImran":14274,"Ġforests":14275,"ĠShel":14276,"ĠBrun":14277,"Ġaerial":14278,"ĠNOW":14279,"PAR":14280,"Ġbeverages":14281,"ettel":14282,"Ġfragile":14283,"Ġcodes":14284,"Į":14285,"abel":14286,"Watch":14287,"road":14288,"Ġdismissal":14289,"ĠRosa":14290,"Ġcrunch":14291,"²":14292,"Ġinnovations":14293,"Ġhabitat":14294,"Ġforefront":14295,"ĠKoch":14296,"ĠChevrolet":14297,"Ġwheelchair":14298,"Ġconsiderably":14299,"Ġexpenditures":14300,"Ġtexts":14301,"Ġprompt":14302,"Ġskating":14303,"Ġpetroleum":14304,"ĠICC":14305,"Ġvit":14306,"fit":14307,"Ġprolonged":14308,"ĠLucy":14309,"Ġcho":14310,"Ġrocked":14311,"ĠBrom":14312,"Ġfreed":14313,"Ġyours":14314,"ĠEden":14315,"Ġmonitored":14316,"asted":14317,"Ġoversees":14318,"ieri":14319,"Ġideology":14320,"ĠFine":14321,"tering":14322,"Top":14323,"Ġdamp":14324,"uta":14325,"Ġlethal":14326,"Ġpurple":14327,"udge":14328,"ĠChemical":14329,"ĠPetersburg":14330,"Ġwarns":14331,"Ġcollectively":14332,"Ġâ":14333,"Ġplaintiffs":14334,"ĠBoris":14335,"Ġsheep":14336,"oves":14337,"ĠAuthor":14338,"Ġcampuses":14339,"Ġdestroying":14340,"Ġgloves":14341,"Ġcease":14342,"Ġdelegates":14343,"Ġpreceded":14344,"realDonaldTrump":14345,"Ġforwards":14346,"erton":14347,"ĠBuzzFeed":14348,"Ġoccupation":14349,"ĠLegion":14350,"Ġstir":14351,"Ġshale":14352,"Ġterrific":14353,"Ġnewborn":14354,"Ġstandoff":14355,"OWN":14356,"Ġmuscles":14357,"ĠHerman":14358,"ĠLiz":14359,"ĠExperience":14360,"ĠSuccess":14361,"ĠHispanic":14362,"ĠCCTV":14363,"Ġcomplement":14364,"ĠBing":14365,"Ġprem":14366,"ĠJohannes":14367,"Ġdent":14368,"itar":14369,"ĠHein":14370,"ĠNicola":14371,"Ġconcludes":14372,"ĠKhal":14373,"Ġparish":14374,"Ġshaking":14375,"ĠSchw":14376,"mod":14377,"ĠLil":14378,"ña":14379,"ĠBog":14380,"ĠFight":14381,"Ġgre":14382,"Ġfel":14383,"Ġheal":14384,"err":14385,"TM":14386,"airo":14387,"health":14388,"Ġswings":14389,"Ġtier":14390,"anka":14391,"ribune":14392,"emouth":14393,"ĠBloom":14394,"Ġowing":14395,"Tech":14396,"Ġdough":14397,"Ġbatch":14398,"ĠLion":14399,"ĠZamb":14400,"Ġcrashing":14401,"ĠXL":14402,"ppers":14403,"ĠDoctors":14404,"ĠSor":14405,"video":14406,"Ġcigarettes":14407,"ĠBoxing":14408,"Ġconstitute":14409,"Ġconcentrate":14410,"ĠArmenian":14411,"Ġsemester":14412,"position":14413,"emic":14414,"ĠNYC":14415,"ĠCampus":14416,"Ġalternate":14417,"Ġexped":14418,"Ġpublishers":14419,"2015":14420,"Ġunanimous":14421,"ĠPrevious":14422,"Ġwellness":14423,"ĠCreative":14424,"edy":14425,"AGE":14426,"ĠCavs":14427,"Ġ1978":14428,"Ġfu":14429,"ĠTata":14430,"ĠChoice":14431,"Ġwoes":14432,"ĠCable":14433,"Ġ~":14434,"ĠGem":14435,"Ġconsolidated":14436,"ĠManitoba":14437,"Cloud":14438,"Ġrounded":14439,"ĠVentura":14440,"Ġshark":14441,"Ġdresses":14442,"Ġtraction":14443,"eda":14444,"Ġdiv":14445,"Ġdental":14446,"Wh":14447,"ĠGig":14448,"ĠBoyd":14449,"ĠTransit":14450,"Ġtelevised":14451,"SON":14452,"ĠVince":14453,"Ġcloses":14454,"apt":14455,"ĠWheeler":14456,"ĠTyson":14457,"Ġforensic":14458,"Ġpunished":14459,"Ġseas":14460,"Ġnavigation":14461,"Ġprecedent":14462,"Ġextremist":14463,"Ġcomposite":14464,"PO":14465,"Ġsurvivor":14466,"ĠVale":14467,"gars":14468,"HT":14469,"ĠRiyadh":14470,"Ġrevival":14471,"ĠPayne":14472,"Ġcollaborative":14473,"ĠCustomers":14474,"ĠPf":14475,"Ġproves":14476,"erve":14477,"Ġelev":14478,"ĠPaper":14479,"Ġchore":14480,"Ġthriller":14481,"Ġstraw":14482,"cock":14483,"Gu":14484,"Ġaligned":14485,"ĠChronicle":14486,"Ġshouting":14487,"Ġ1976":14488,"Ġlightning":14489,"Ġworlds":14490,"ĠOpening":14491,"enton":14492,"ĠAna":14493,"ĠGol":14494,"ĠTechn":14495,"lis":14496,"Ġorientation":14497,"ĠArri":14498,"ĠPG":14499,"ross":14500,"Ġsank":14501,"LOS":14502,"ĠAllison":14503,"Ġsmiles":14504,"USD":14505,"Ġkits":14506,"Bar":14507,"ĠBri":14508,"Ġounces":14509,"ĠNielsen":14510,"eno":14511,"Ġ109":14512,"Ġnorms":14513,"Ġskip":14514,"180":14515,"Ġmonitors":14516,"2012":14517,"Ġincorporate":14518,"Ġmechanisms":14519,"ĠHack":14520,"ĠBomb":14521,"ĠGavin":14522,"ĠNatalie":14523,"Ġdiscusses":14524,"Ġassembled":14525,"Ġcognitive":14526,"owner":14527,"Ġgenuinely":14528,"Ġdisappear":14529,"ĠAK":14530,"Ġstal":14531,"Ġsoup":14532,"ĠFinn":14533,"Ġcares":14534,"Ġfinest":14535,"Ġtuned":14536,"ende":14537,"ĠStefan":14538,"Ġaccompanying":14539,"î":14540,"Maybe":14541,"Ġoffender":14542,"TT":14543,"Ġ212":14544,"Ġvolleyball":14545,"needed":14546,"Ġquo":14547,"Ġdim":14548,"ĠHistorical":14549,"ĠLance":14550,"gmail":14551,"ĠGate":14552,"Ġdemonstrators":14553,"Ġdy":14554,"cia":14555,"ĠSteele":14556,"ĠJoan":14557,"ĠKerala":14558,"KA":14559,"ĠElectoral":14560,"Ġpaths":14561,"ø":14562,"Ne":14563,"Ġaccepts":14564,"Ġlowering":14565,"Ġportions":14566,"ĠValencia":14567,"Ġfestivals":14568,"Ġgeneric":14569,"usk":14570,"ĠVernon":14571,"ĠOrioles":14572,"Ġrenewal":14573,"Ġbelonged":14574,"Ġbreathe":14575,"Ġ220":14576,"Ġrecruited":14577,"Ġlogic":14578,"Ġrecreation":14579,"Ġverbal":14580,"ĠHaz":14581,"double":14582,"Ġfavourites":14583,"Ġfundamentals":14584,"ĠSoc":14585,"360":14586,"SO":14587,"Ġalerted":14588,"Ġbriefed":14589,"ĠBruno":14590,"Ġseating":14591,"Ġfreight":14592,"ĠAmer":14593,"Ġwished":14594,"table":14595,"growth":14596,"ĠWent":14597,"Ġhilarious":14598,"Ġthroat":14599,"bet":14600,"gon":14601,"Ġample":14602,"hee":14603,"ĠHood":14604,"ĠIceland":14605,"ĠAnkara":14606,"iang":14607,"Ġpracticing":14608,"azer":14609,"Ġleaf":14610,"Ġhottest":14611,"Ġmarginal":14612,"Ġrevelations":14613,"ĠPrices":14614,"ĠLar":14615,"times":14616,"Ġhandles":14617,"ĠNaz":14618,"Ġinstitute":14619,"Ġtranslate":14620,"ĠJP":14621,"Ġsoared":14622,"Ġconsume":14623,"ĠTap":14624,"ĠCelebrity":14625,"ĠMayweather":14626,"ĠOracle":14627,"Ġmor":14628,"ANA":14629,"Ġpaperwork":14630,"aste":14631,"Ġdil":14632,"Ġdecorated":14633,"Ġpromotional":14634,"ĠMerrill":14635,"Ġappliances":14636,"ĠCOP":14637,"Ġlips":14638,"ĠBrennan":14639,"ĠMile":14640,"ĠNetworks":14641,"ĠComment":14642,"ĠIb":14643,"ĠAgg":14644,"IDE":14645,"Ġinitiate":14646,"Ġknockout":14647,"Ġbargain":14648,"Ġaccordingly":14649,"bee":14650,"ĠGerald":14651,"Ġproblematic":14652,"Ġtrap":14653,"Ġfinalists":14654,"addy":14655,"would":14656,"Ġstrictly":14657,"ĠRamsey":14658,"Ġdownward":14659,"Ġextract":14660,"Ġfamed":14661,"ĠOUT":14662,"Ġinduct":14663,"ĠAuckland":14664,"Ġpoetry":14665,"mos":14666,"ĠGuinea":14667,"management":14668,"ohan":14669,"ĠGuide":14670,"aily":14671,"umping":14672,"Ġenacted":14673,"ĠEye":14674,"vision":14675,"umi":14676,"aped":14677,"Ġbicycle":14678,"ĠHouth":14679,"ĠNAS":14680,"Ġtapped":14681,"wer":14682,"otti":14683,"EA":14684,"Ġsurprises":14685,"ĠUpdate":14686,"ĠPun":14687,"ĠMiz":14688,"ĠOro":14689,"Ġcostumes":14690,"title":14691,"Ġsurviving":14692,"According":14693,"themed":14694,"ĠPeoples":14695,"Se":14696,"Ġassociations":14697,"hett":14698,"Time":14699,"Ġessay":14700,"Ġmu":14701,"ĠScore":14702,"ĠSpani":14703,"ĠSEE":14704,"Ġmales":14705,"Ġrage":14706,"EU":14707,"ĠYellow":14708,"rupt":14709,"Ġapparel":14710,"Ġsweat":14711,"Ġnearest":14712,"zman":14713,"Ġanticipation":14714,"Ġinjuring":14715,"Ġousted":14716,"chan":14717,"ĠAlert":14718,"Ġber":14719,"atal":14720,"Com":14721,"Ġ04":14722,"Ġafterward":14723,"edge":14724,"ĠBooker":14725,"lex":14726,"ĠWhole":14727,"Ġtoughest":14728,"ĠMaharashtra":14729,"lier":14730,"ĠTennis":14731,"Ġhandy":14732,"ĠMetal":14733,"ĠiTunes":14734,"ĠDiscovery":14735,"Ġcompassion":14736,"ĠLIVE":14737,"Ġeconomically":14738,"Ġendangered":14739,"GO":14740,"Ġmound":14741,"word":14742,"ĠTouch":14743,"ogo":14744,"Ġincomes":14745,"when":14746,"ĠAside":14747,"Ġscandals":14748,"Ġfunctionality":14749,"ĠAer":14750,"Ġcouncils":14751,"Ġdenial":14752,"140":14753,"Ġimplied":14754,"Ġoutfits":14755,"Ġsuited":14756,"Ġ1973":14757,"ĠPizza":14758,"Ġdebates":14759,"record":14760,"Ġhype":14761,"ĠRus":14762,"ĠRobbie":14763,"Ġtouted":14764,"ĠSharp":14765,"Ġbeings":14766,"Ġslavery":14767,"encies":14768,"ĠRooney":14769,"Ġnan":14770,"Ġraids":14771,"Ġinstructor":14772,"Market":14773,"Ġshook":14774,"Ġdeliberate":14775,"ĠNorthwestern":14776,"ĠEss":14777,"Ġwhatsoever":14778,"ĠConfederate":14779,"YS":14780,"ĠCameroon":14781,"ĠFlip":14782,"Yeah":14783,"Ġwashing":14784,"mand":14785,"ĠLex":14786,"Ġissuance":14787,"Ġniche":14788,"Ġfold":14789,"ĠWendy":14790,"Ġhy":14791,"Ġbucket":14792,"ĠVW":14793,"ĠCairo":14794,"ĠSK":14795,"ĠKang":14796,"Ġintake":14797,"Ġhills":14798,"anz":14799,"©":14800,"ugu":14801,"ĠFortunately":14802,"ĠMarqu":14803,"Ġimprisonment":14804,"oking":14805,"Ġdistributors":14806,"zie":14807,"Ġstip":14808,"ĠWire":14809,"Ġcouncillors":14810,"Ġsue":14811,"ĠRegardless":14812,"ĠEnc":14813,"Ġbaking":14814,"ĠVenture":14815,"Ġintriguing":14816,"Ġupheld":14817,"ĠActive":14818,"Ġgenes":14819,"ĠDawson":14820,"ĠPreviously":14821,"ĠRac":14822,"Ġmetric":14823,"Files":14824,"ĠiPhones":14825,"ĠWelcome":14826,"Ġburns":14827,"ĠScreen":14828,"ashes":14829,"ĠApr":14830,"Ġtheories":14831,"san":14832,"ĠRenault":14833,"ĠSinger":14834,"Ġfounders":14835,"Russian":14836,"ĠBelfast":14837,"Ġimagined":14838,"ĠPlanet":14839,"ĠCatalan":14840,"ĠRochester":14841,"Ġevolve":14842,"ĠOT":14843,"Ġpassword":14844,"Ġhomelessness":14845,"Ġbacklog":14846,"Ġpresenter":14847,"Ġfal":14848,"ISH":14849,"ĠEM":14850,"icked":14851,"Ġunlock":14852,"city":14853,"Ġnegotiation":14854,"Ġdancers":14855,"dan":14856,"ĠCOL":14857,"VC":14858,"boat":14859,"Ġoverly":14860,"deal":14861,"lander":14862,"Ġdiss":14863,"ICS":14864,"Ġfifty":14865,"Ġowe":14866,"Ġprisons":14867,"ifications":14868,"wo":14869,"ĠAu":14870,"Ġapiece":14871,"ĠCourtney":14872,"Ġ1975":14873,"Ġsurpass":14874,"Ġidentities":14875,"Ġintegral":14876,"Ġdocumentation":14877,"Ġelegant":14878,"ĠIg":14879,"Ġdear":14880,"Ġ113":14881,"ĠGupta":14882,"Ġcontentious":14883,"rish":14884,"Ġclues":14885,"Ġadditions":14886,"Ġep":14887,"rus":14888,"Ġcentered":14889,"ĠPhillies":14890,"father":14891,"Ġborough":14892,"Ġbuttons":14893,"Ġdeported":14894,"ĠREC":14895,"ĠAlready":14896,"eh":14897,"hur":14898,"Ġupbeat":14899,"omen":14900,"Ġdetailing":14901,"Ġwr":14902,"Ġvaried":14903,"ĠEconomics":14904,"Ġensures":14905,"ĠCivic":14906,"Ġunpaid":14907,"sold":14908,"ĠHil":14909,"ĠMult":14910,"ĠRising":14911,"ĠMini":14912,"Ġneuro":14913,"Ġpenal":14914,"Ġneighbour":14915,"ĠChavez":14916,"Ġjew":14917,"ĠVIP":14918,"Connor":14919,"ĠTalking":14920,"Ġcorrection":14921,"Ġstandpoint":14922,"roads":14923,"ĠWool":14924,"Ġverification":14925,"Ġmic":14926,"olf":14927,"Ġexemption":14928,"Ġfilter":14929,"Ġballoon":14930,"leases":14931,"ician":14932,"ĠSpr":14933,"Ġtoe":14934,"Ġunconstitutional":14935,"Ġmanslaughter":14936,"Ġtossed":14937,"ĠMeg":14938,"ATIONS":14939,"ACK":14940,"ĠRouge":14941,"ĠHansen":14942,"ĠHook":14943,"Out":14944,"ĠHorse":14945,"ĠBath":14946,"ĠAlways":14947,"Ġincorporated":14948,"Ġconjunction":14949,"ĠFit":14950,"Ġexamining":14951,"Ġwallet":14952,"Ġensured":14953,"Ġacclaimed":14954,"ippers":14955,"Ġbeneficiaries":14956,"Ġunexpectedly":14957,"Ġexploit":14958,"ĠWillie":14959,"Ġcomb":14960,"ĠWalton":14961,"rica":14962,"icky":14963,"Ġate":14964,"ĠPadres":14965,"Ġrib":14966,"Ġsnacks":14967,"ĠFernandez":14968,"ĠMachine":14969,"ction":14970,"Ġillnesses":14971,"ĠHoffman":14972,"ĠSpaceX":14973,"Ġju":14974,"Ġswift":14975,"Ġembark":14976,"ĠRailway":14977,"Ġmeasuring":14978,"agers":14979,"arsh":14980,"Ġessence":14981,"angle":14982,"Ġolive":14983,"ĠCommander":14984,"iggs":14985,"Ġrewarded":14986,"Ġdispatched":14987,"Ġplayground":14988,"½":14989,"ĠProgramme":14990,"Ġstudios":14991,"Ġskeptical":14992,"ĠOlymp":14993,"ĠKeys":14994,"ĠSunshine":14995,"amba":14996,"ĠDonna":14997,"Ġlightly":14998,"Ġobtaining":14999,"Ġpoisoning":15000,"Ġaz":15001,"Ġ1972":15002,"Ġunconscious":15003,"ECT":15004,"Ġlied":15005,"ĠKaz":15006,"Ġ06":15007,"ĠMoving":15008,"Ġnum":15009,"oral":15010,"Ġassessments":15011,"Ġscholarships":15012,"Ġevacuate":15013,"ĠSunni":15014,"Ġquake":15015,"Ġfort":15016,"ques":15017,"ĠAlonso":15018,"Ġthread":15019,"Ġsqueeze":15020,"arat":15021,"oly":15022,"ĠAlphabet":15023,"uting":15024,"icio":15025,"ĠRetirement":15026,"ither":15027,"Ġasleep":15028,"Ġpairs":15029,"Ġmanufacture":15030,"ĠHazard":15031,"Ġsidewalk":15032,"Ġwears":15033,"ĠCraft":15034,"emen":15035,"ieth":15036,"Ġbypass":15037,"ĠLancaster":15038,"Ġflour":15039,"charge":15040,"ĠCLICK":15041,"Ġpotatoes":15042,"ĠKarachi":15043,"Ġvalley":15044,"Ġsights":15045,"Ġfallout":15046,"ords":15047,"BN":15048,"Ġsunshine":15049,"Ġundertaken":15050,"Ġcontestants":15051,"Ġaccomplishments":15052,"Ġconditioning":15053,"Ġcel":15054,"ĠHalifax":15055,"Ġaccent":15056,"***":15057,"Ġpitchers":15058,"Ġadopting":15059,"Ġjustices":15060,"Ġrip":15061,"ince":15062,"Ġelimination":15063,"Ġaerospace":15064,"ĠBeer":15065,"ĠBasin":15066,"Ġunwanted":15067,"goers":15068,"isco":15069,"ĠTwin":15070,"ĠDesert":15071,"rix":15072,"Ġdarkness":15073,"ĠDunn":15074,"City":15075,"pop":15076,"Ġ1969":15077,"ataka":15078,"Ġtal":15079,"Ġautism":15080,"ĠMcLaren":15081,"ĠUEFA":15082,"Ġclassrooms":15083,"ĠLeave":15084,"Americans":15085,"las":15086,"Ġqui":15087,"Ġundefeated":15088,"otto":15089,"ĠNRA":15090,"ĠPorsche":15091,"Ġnuts":15092,"oys":15093,"ĠMethodist":15094,"Ġatt":15095,"Ġtweeting":15096,"children":15097,"eller":15098,"Ġinquiries":15099,"Ġmillennials":15100,"ĠWembley":15101,"INS":15102,"Ġautopsy":15103,"ĠElon":15104,"ĠHicks":15105,"ugg":15106,"Ġwreck":15107,"ĠComcast":15108,"Ġstones":15109,"public":15110,"ĠKem":15111,"bedroom":15112,"ļ":15113,"itated":15114,"Ġsemic":15115,"uman":15116,"Cal":15117,"ANN":15118,"ĠGaz":15119,"Ġundisclosed":15120,"ĠPlanned":15121,"ĠYale":15122,"ĠIST":15123,"lies":15124,"ĠStanding":15125,"Ġrelieved":15126,"EO":15127,"Ġgraduating":15128,"park":15129,"ĠâĢķ":15130,"Ġpensions":15131,"rave":15132,"ĠWonder":15133,"AZ":15134,"Ġcosting":15135,"Ġeditors":15136,"Ġtotaled":15137,"Ġspacecraft":15138,"meter":15139,"Ġ02":15140,"ĠNikki":15141,"sworth":15142,"ĠCrit":15143,"asha":15144,"Ġknees":15145,"Ġhats":15146,"uity":15147,"ĠPanther":15148,"Ġtan":15149,"ĠBuzz":15150,"ĠGlad":15151,"ĠPleasant":15152,"SM":15153,"Ġtricks":15154,"Ġplac":15155,"ĠDanielle":15156,"Ġours":15157,"Ġwashed":15158,"haven":15159,"Ġdrain":15160,"ĠUttar":15161,"Ġapple":15162,"Ġjunk":15163,"Ġturkey":15164,"ĠDug":15165,"Ġdiplomacy":15166,"Ġempire":15167,"Ġpinch":15168,"Ġferry":15169,"ĠDustin":15170,"Ġ03":15171,"Ġelder":15172,"Everything":15173,"ĠProgressive":15174,"ution":15175,"VI":15176,"dam":15177,"Ġlever":15178,"ĠAustralians":15179,"Ġconsequence":15180,"itan":15181,"Ġcondemn":15182,"Ġneg":15183,"ĠOverview":15184,"Ġsuccesses":15185,"Ġprobable":15186,"ĠMirror":15187,"mor":15188,"verse":15189,"Ġevaluating":15190,"ĠBes":15191,"Ġimm":15192,"Ġharness":15193,"Ġresilient":15194,"ĠBuild":15195,"Ġstraightforward":15196,"ADE":15197,"Ġgrandparents":15198,"Ġmarched":15199,"ĠKiev":15200,"Ġchiefs":15201,"oha":15202,"Ġvest":15203,"kn":15204,"enda":15205,"ĠSev":15206,"Ġbatters":15207,"ĠJos":15208,"ĠQue":15209,"ĠCourse":15210,"ĠCorner":15211,"ĠMess":15212,"Ġmourn":15213,"keepers":15214,"ĠRegina":15215,"Everybody":15216,"Ġtrajectory":15217,"Ġdefenseman":15218,"ĠArticles":15219,"Ġspur":15220,"ĠPhD":15221,"Ġpipes":15222,"Ġduck":15223,"Ġcombining":15224,"ĠHit":15225,"ĠGeorgetown":15226,"ĠBee":15227,"Cor":15228,"Ġcomposition":15229,"Ġconnects":15230,"ĠMARK":15231,"taker":15232,"Ġcertainty":15233,"Ġhefty":15234,"ĠHezbollah":15235,"ĠShip":15236,"Ġmalicious":15237,"AI":15238,"Ġbits":15239,"Ġstyl":15240,"Ġimpaired":15241,"ĠCBI":15242,"Despite":15243,"othe":15244,"ĠRyder":15245,"ĠAlf":15246,"ifa":15247,"Ind":15248,"Ġblaming":15249,"ĠToledo":15250,"EW":15251,"ĠEssex":15252,"iated":15253,"ĠAberdeen":15254,"ANCE":15255,"Ġpossess":15256,"Ġsuperhero":15257,"Ġoverhead":15258,"quet":15259,"ĠRicky":15260,"Ġdock":15261,"ĠTelecom":15262,"Ġshelf":15263,"³":15264,"Ġmaritime":15265,"Ġportrayed":15266,"ĠYesterday":15267,"Ġcollided":15268,"Ġcookies":15269,"ĠCul":15270,"Ġindexes":15271,"Ġnaval":15272,"oval":15273,"105":15274,"ĠWeber":15275,"chief":15276,"arma":15277,"ĠRey":15278,"Ġauditor":15279,"ĠMarion":15280,"ĠMartha":15281,"ĠSally":15282,"Ġsedan":15283,"ĠAlison":15284,"nce":15285,"Es":15286,"ĠParade":15287,"Ġpharmacy":15288,"ĠKre":15289,"loe":15290,"cks":15291,"Ġmitigate":15292,"Ġdesigning":15293,"Ġ2024":15294,"Ġportable":15295,"Ġimproves":15296,"ĠAMD":15297,"Ġexcluded":15298,"CON":15299,"ĠOscars":15300,"Ġfixtures":15301,"comb":15302,"ĠBerg":15303,"Ġbother":15304,"Ġboring":15305,"Ġobservation":15306,"ĠCad":15307,"Ġrecordings":15308,"ĠCultural":15309,"Ġweaken":15310,"Ġaccuse":15311,"ĠAbd":15312,"abor":15313,"115":15314,"uffle":15315,"Ġhighways":15316,"atham":15317,"empt":15318,"ĠDeer":15319,"ĠEDT":15320,"ĠWait":15321,"athan":15322,"Ġaccumulated":15323,"Ġguilt":15324,"Ġexempt":15325,"Ġdiluted":15326,"ĠJamal":15327,"Ġshit":15328,"cross":15329,"Ġeve":15330,"Ġshirts":15331,"Ġsatisfy":15332,"ĠPaulo":15333,"AH":15334,"sic":15335,"ĠChloe":15336,"ĠCities":15337,"ĠSwansea":15338,"Ġprecision":15339,"ĠTracy":15340,"ping":15341,"Ġcontinually":15342,"Ġdemographic":15343,"Ġcliff":15344,"Ġjaw":15345,"isted":15346,"ĠDevelop":15347,"ĠAJ":15348,"Ġaisle":15349,"ĠLionel":15350,"Ġpredominantly":15351,"Ġmel":15352,"Ġlifelong":15353,"hs":15354,"Ġshouted":15355,"lad":15356,"Ġdest":15357,"Ġpacks":15358,"ĠKath":15359,"ĠCruise":15360,"fired":15361,"oder":15362,"hua":15363,"Ġgoodbye":15364,"Ġinterfere":15365,"eca":15366,"Ġré":15367,"atum":15368,"itas":15369,"ĠLodge":15370,"ĠWald":15371,"Ġmidday":15372,"umble":15373,"asting":15374,"©":15375,"ĠLeg":15376,"ĠNepal":15377,"Ġchased":15378,"idge":15379,"Ġconv":15380,"Ġfraudulent":15381,"Ġopera":15382,"Ġshr":15383,"ĠUniverse":15384,"ĠJerome":15385,"Ġ1977":15386,"ĠDancing":15387,"ĠRS":15388,"±":15389,"eks":15390,"Ġchic":15391,"Ġpunish":15392,"Ġpropose":15393,"arin":15394,"ĠChop":15395,"ĠAhead":15396,"ĠGallagher":15397,"ĠBangkok":15398,"ĠShelby":15399,"ĠNS":15400,"Ġcheek":15401,"onia":15402,"Ġrelegation":15403,"ĠHind":15404,"ĠCory":15405,"Ġfingerprint":15406,"Ġstrive":15407,"Ġmm":15408,"igs":15409,"Ġholy":15410,"Ġfavored":15411,"ĠSomeone":15412,"ĠLatino":15413,"ĠPatt":15414,"Ġchallenger":15415,"ĠCotton":15416,"Sw":15417,"itten":15418,"ĠXI":15419,"ĠStat":15420,"ĠDIS":15421,"Ġautomakers":15422,"Ġevaluated":15423,"ĠArc":15424,"Ġpersuade":15425,"Af":15426,"Ġreunited":15427,"Ġabs":15428,"Ġbride":15429,"Ġpurely":15430,"uce":15431,"uded":15432,"Ġsettling":15433,"Ġlodged":15434,"Ġfixing":15435,"Ġsuccession":15436,"ĠAlfred":15437,"ĠAlvarez":15438,"mac":15439,"ĠFont":15440,"Ġcontra":15441,"affle":15442,"Ġcopied":15443,"Ġmasses":15444,"ĠElections":15445,"ĠThan":15446,"Ġsoaring":15447,"jay":15448,"Ġsuing":15449,"Ġconcentrated":15450,"Ġconvey":15451,"Ġ240":15452,"gs":15453,"ĠNeal":15454,"Ġnasty":15455,"ĠLB":15456,"odi":15457,"ĠSergei":15458,"Ġthumb":15459,"Ġservants":15460,"Ġrevelation":15461,"Ġdischarge":15462,"ĠBright":15463,"ĠBent":15464,"ĠChrysler":15465,"mill":15466,"ĠImagine":15467,"Ġreceptions":15468,"Ġpersonalities":15469,"Ġsilly":15470,"ĠLoc":15471,"ĠZero":15472,"HI":15473,"rice":15474,"Ġgar":15475,"far":15476,"enh":15477,"ĠBiden":15478,"ĠEntreprene":15479,"Ġassumption":15480,"Ġnicely":15481,"ĠEither":15482,"|":15483,"ĠNW":15484,"ĠKens":15485,"ĠNolan":15486,"Ġowning":15487,"atures":15488,"ĠPastor":15489,"ĠRegistration":15490,"Ġexperiments":15491,"Ġassurance":15492,"Ġhashtag":15493,"oint":15494,"ĠBin":15495,"Ġqualification":15496,"center":15497,"Ġausterity":15498,"ĠPers":15499,"Ġscoop":15500,"Ġpros":15501,"ĠFields":15502,"Ġfur":15503,"ĠJas":15504,"Ġplanting":15505,"security":15506,"ĠTrain":15507,"ĠKathy":15508,"demand":15509,"ĠLev":15510,"Ġtut":15511,"tier":15512,"QU":15513,"Ġexploitation":15514,"Ġignoring":15515,"ĠSex":15516,"Ġadapted":15517,"Ġdisastrous":15518,"Ġempower":15519,"Ġcreators":15520,"ĠLay":15521,"ĠDragon":15522,"ĠWyn":15523,"Ġ1974":15524,"acious":15525,"performance":15526,"ĠTiffany":15527,"isting":15528,"Ġindividually":15529,"ĠLeading":15530,"ĠSask":15531,"Ġcatastrophic":15532,"Ġpunched":15533,"ĠVienna":15534,"Ġsurgical":15535,"Gr":15536,"odo":15537,"Ġgem":15538,"ĠMinority":15539,"Ġmice":15540,"ĠHistoric":15541,"ĠKot":15542,"caster":15543,"Ġsuff":15544,"journal":15545,"Ġpresumably":15546,"ĠBit":15547,"inary":15548,"Ġbre":15549,"Ġenhancing":15550,"Ġgru":15551,"ĠRunning":15552,"hardt":15553,"Ġtroubling":15554,"Ġpumps":15555,"ĠProspect":15556,"etic":15557,"Ġmartial":15558,"Ġcouncillor":15559,"atra":15560,"ths":15561,"ĠSark":15562,"ĠChamp":15563,"scoring":15564,"ĠWel":15565,"rup":15566,"Ġterrifying":15567,"ĠCatch":15568,"Ġinspections":15569,"Ġpornography":15570,"bra":15571,"ĠKeeping":15572,"Ġbanker":15573,"angers":15574,"ĠCrimea":15575,"ĠDisclosure":15576,"iba":15577,"Ġturf":15578,"Ġschedules":15579,"ĠJorge":15580,"ĠAcross":15581,"Ġsolving":15582,"Ġsensation":15583,"ĠWW":15584,"cial":15585,"atz":15586,"Ġlion":15587,"Ġcertificates":15588,"itive":15589,"ĠWes":15590,"ĠPrison":15591,"ĠPlayStation":15592,"duty":15593,"Ġvariable":15594,"Ġstrangers":15595,"istrates":15596,"vs":15597,"Ġreigning":15598,"Ġsliding":15599,"ĠShin":15600,"Ġtelecommunications":15601,"Ġinstalling":15602,"Ġrecogn":15603,"Ġsubway":15604,"too":15605,"ĠMcKin":15606,"ĠStoke":15607,"Ġsensitivity":15608,"bas":15609,"Ġsan":15610,"Ġ(-":15611,"ĠSuarez":15612,"Ġaverages":15613,"ammu":15614,"ĠFen":15615,"Ġrefined":15616,"outh":15617,"Ġcob":15618,"ĠLaz":15619,"essa":15620,"Ġpositioning":15621,"Three":15622,"Ġoils":15623,"Ġassaults":15624,"Ġcompanion":15625,"ĠFlash":15626,"ĠMam":15627,"ĠTill":15628,"Ġblues":15629,"ĠJae":15630,"ĠPier":15631,"Ġbedrooms":15632,"ĠHawkins":15633,"ĠCornell":15634,"Ġanswering":15635,"Ġsec":15636,"Ġrecognizes":15637,"Red":15638,"ĠJamaica":15639,"Ġinsurgents":15640,"Ġbrace":15641,"Ġra":15642,"ĠTai":15643,"ocation":15644,"ignment":15645,"Ġreasonably":15646,"inating":15647,"Ġbonuses":15648,"Ġsandwich":15649,"Ġinadequate":15650,"Ġdelicate":15651,"Ġadorable":15652,"Ġpalace":15653,"Ġsmallest":15654,"Ġpractically":15655,"ĠCrosby":15656,"Ġlevy":15657,"Ġlend":15658,"boards":15659,"shaped":15660,"Ġvulnerability":15661,"ĠKelley":15662,"Ġsponsorship":15663,"ract":15664,"Ġslew":15665,"Ġfederation":15666,"ĠLal":15667,"acies":15668,"ĠFamilies":15669,"Ġproposing":15670,"Ġhyp":15671,"elected":15672,"inkle":15673,"ĠSays":15674,"ĠApollo":15675,"ĠWis":15676,"imer":15677,"Ġcombines":15678,"Ġtim":15679,"ĠQuestion":15680,"Ġborrowers":15681,"Ġswiftly":15682,"ĠMagn":15683,"Ġheadphones":15684,"Russia":15685,"Ġtongue":15686,"Ġbye":15687,"nn":15688,"Ġseller":15689,"ĠWord":15690,"Tom":15691,"ĠDevin":15692,"ĠSurrey":15693,"Ġquad":15694,"Ġcourthouse":15695,"gi":15696,"ĠGrill":15697,">":15698,"Ġrational":15699,"ĠFlames":15700,"ĠCham":15701,"Ġvacuum":15702,"ĠRays":15703,"Ġescalating":15704,"Ġouter":15705,"Ġstretches":15706,"ĠSpeed":15707,"Ġnegatively":15708,"Ġabsorb":15709,"ĠAustrian":15710,"Ġslice":15711,"ĠDiet":15712,"Ġbun":15713,"Ġtactical":15714,"ĠCBD":15715,"Ġedges":15716,"Ġnest":15717,"Ġstrained":15718,"ulates":15719,"ĠTina":15720,"Net":15721,"ķ":15722,"ĠGos":15723,"God":15724,"White":15725,"Ġproudly":15726,"usion":15727,"ĠArlington":15728,"ĠNear":15729,"ĠMaxwell":15730,"Ġbomber":15731,"Ġcared":15732,"Ġapprovals":15733,"Ġexams":15734,"ĠEconomy":15735,"Ġposters":15736,"ĠHampton":15737,"ĠPere":15738,"ĠContract":15739,"Ġhoused":15740,"Ġinstruction":15741,"ĠJess":15742,"Ġacre":15743,"Ġcongestion":15744,"ĠGener":15745,"Ġdioxide":15746,"Ġvar":15747,"ĠAlexandria":15748,"ĠSpider":15749,"Ġcoins":15750,"Ġ225":15751,"Ġterritorial":15752,"ĠSPD":15753,"Ġfloat":15754,"null":15755,"Ġcalculate":15756,"ĠDin":15757,"eto":15758,"Ġcows":15759,"Ġpunct":15760,"Ġexpire":15761,"Ġkidnapped":15762,"Ġcou":15763,"Ġattitudes":15764,"ĠLeh":15765,"ĠHero":15766,"ĠKabul":15767,"Ġcubic":15768,"Ġdigits":15769,"ĠRES":15770,"Ġpipelines":15771,"icide":15772,"ĠSingle":15773,"Ġhurts":15774,"ĠMaz":15775,"ĠPak":15776,"Ġslate":15777,"Ġmultimedia":15778,"ADA":15779,"Mexico":15780,"ĠRelease":15781,"chard":15782,"Ġgarlic":15783,"ĠFletcher":15784,"Ġaforementioned":15785,"Ġ05":15786,"ĠParkway":15787,"Ġfirefighter":15788,"Ġcounseling":15789,"utions":15790,"Cap":15791,"Ġconsultants":15792,"ĠMeh":15793,"ouring":15794,"ĠDI":15795,"mic":15796,"phones":15797,"Ġencounters":15798,"ĠHapp":15799,"Ġcartoon":15800,"flight":15801,"Ġundertake":15802,"ĠHans":15803,"Ġplunge":15804,"ĠParenthood":15805,"Ġkickoff":15806,"ĠCelsius":15807,"ĠRas":15808,"ĠDund":15809,"ounce":15810,"Ġpurse":15811,"Ġmortality":15812,"Ġbrains":15813,"Ġconglomerate":15814,"ĠObserver":15815,"ĠSector":15816,"ĠApparently":15817,"Ġblank":15818,"iston":15819,"Ġweighs":15820,"gro":15821,"ĠPaw":15822,"ĠCOM":15823,"ĠPurdue":15824,"Ġnetted":15825,"ĠLinux":15826,"Mike":15827,"Ġfaithful":15828,"Ġmagazines":15829,"Ġheadquartered":15830,"ĠIps":15831,"Ġindications":15832,"Look":15833,"ĠElite":15834,"Ġsupreme":15835,"Ġchunk":15836,"ĠSz":15837,"ĠVine":15838,"rise":15839,"ĠYas":15840,"general":15841,"ĠOpera":15842,"Ġpriests":15843,"Assad":15844,"Ġaunt":15845,"Ġwhopping":15846,"enzie":15847,"Ġvegan":15848,"Ġinflux":15849,"ĠConsult":15850,"Ġwaiver":15851,"Having":15852,"inning":15853,"Ġproximity":15854,"Ġclassical":15855,"ĠIslanders":15856,"Ġadvertisers":15857,"ĠCe":15858,"ĠSochi":15859,"Ġmemoir":15860,"ĠPlaying":15861,"yers":15862,"Ġstud":15863,"Ġobservations":15864,"Ġadmire":15865,"Ġhiking":15866,"Ġbatter":15867,"Ġconfusing":15868,"Ġprecaution":15869,"kil":15870,"clusive":15871,"opoulos":15872,"ĠWestbrook":15873,"ĠTanzania":15874,"ĠCedar":15875,"usted":15876,"Ġdestructive":15877,"ĠIndies":15878,"osi":15879,"ĠAmid":15880,"Ġintercepted":15881,"Ġpartnering":15882,"Ġsubstances":15883,"ĠSuns":15884,"Ġpromotes":15885,"bird":15886,"Gen":15887,"aper":15888,"ĠEy":15889,"Ġterrain":15890,"Ġ1930":15891,"zon":15892,"Ġbreed":15893,"broken":15894,"uchin":15895,"ĠPrim":15896,"ĠRoland":15897,"Ġfitted":15898,"Ġprotects":15899,"Ġ114":15900,"RP":15901,"Ġdisrupted":15902,"ĠBaylor":15903,"oren":15904,"ĠKeen":15905,"Ġmansion":15906,"Ġgrassroots":15907,"ĠVictory":15908,"Ġbarn":15909,"Ġdepreciation":15910,"oped":15911,"immer":15912,"Ġgarnered":15913,"ĠLip":15914,"ĠTob":15915,"Ġcreatures":15916,"ooter":15917,"Ġconsortium":15918,"obi":15919,"ĠMonster":15920,"arks":15921,"turn":15922,"Ġsketch":15923,"Ġpredicting":15924,"Ġminimize":15925,"ĠEthan":15926,"anson":15927,"ĠAdjusted":15928,"ĠHornets":15929,"ĠNZ":15930,"ĠKathleen":15931,"ĠKier":15932,"ĠMercury":15933,"Ġghost":15934,"Ġhaw":15935,"ĠDemand":15936,"ĠCollection":15937,"ĠFortune":15938,"Ġcruel":15939,"Ġfurious":15940,"ĠKun":15941,"ĠSalem":15942,"Ġunsuccessful":15943,"ĠLomb":15944,"ĠFury":15945,"ahi":15946,"Ġenthusiastic":15947,"Ġsurgeries":15948,"ACE":15949,"Ġroller":15950,"ĠStamford":15951,"Being":15952,"Dec":15953,"check":15954,"Ġaffection":15955,"Ġgifted":15956,"Ġenerg":15957,"Ġvarying":15958,"ĠCharl":15959,"Ġsolved":15960,"ĠNV":15961,"Ġlaptops":15962,"Ġkindness":15963,"mart":15964,"ĠPenny":15965,"Ġ116":15966,"ĠFeder":15967,"ĠCisco":15968,"Ġeducators":15969,"Ġminim":15970,"Ġgangs":15971,"Ġfestivities":15972,"ĠOriginal":15973,"yre":15974,"rying":15975,"Ġtighter":15976,"ĠMalta":15977,"Ġshield":15978,"interest":15979,"Ġbuoy":15980,"Ġsupplement":15981,"ĠSof":15982,"Ġok":15983,"Ġprosecuted":15984,"Ġinterventions":15985,"Ġseize":15986,"Ġcaravan":15987,"ĠCarlson":15988,"ĠEnterprises":15989,"ĠChristina":15990,"ĠWellington":15991,"Ġaltered":15992,"TP":15993,"Ġexpresses":15994,"Ġcomfortably":15995,"Ġstaffing":15996,"afa":15997,"itu":15998,"saving":15999,"Ġinflammation":16000,"hatt":16001,"ĠMiranda":16002,"icious":16003,"Ġgrabbing":16004,"ĠANY":16005,"Ġobjections":16006,"Ġdot":16007,"cle":16008,"Ġrelates":16009,"Ġtribe":16010,"Ġboarding":16011,"ĠEpisode":16012,"ĠEnjoy":16013,"arding":16014,"Ġathletics":16015,"Ġflies":16016,"Ġmortgages":16017,"ruct":16018,"Ġink":16019,"ĠKC":16020,"ĠSecondary":16021,"Ġfer":16022,"ĠQaeda":16023,"OA":16024,"Frank":16025,"track":16026,"ĠChandler":16027,"Ġenv":16028,"ĠLeaders":16029,"ĠKemp":16030,"Ġunsafe":16031,"sponsored":16032,"San":16033,"ĠUsers":16034,"PE":16035,"ĠAccount":16036,"otta":16037,"ĠMix":16038,"ĠCindy":16039,"En":16040,"Ġ175":16041,"Ġoverlooked":16042,"Ġpublications":16043,"Ġrewarding":16044,"Ġexplicit":16045,"Ġnotch":16046,"Ġspecifics":16047,"Ġdesignation":16048,"ĠAppeal":16049,"Ġcontingent":16050,"Ġcage":16051,"ĠKol":16052,"ĠJohns":16053,"ĠReach":16054,"ĠTin":16055,"ĠAfricans":16056,"Ġprec":16057,"ĠRural":16058,"ĠDw":16059,"Ġuphold":16060,"Ġsuffers":16061,"Ġweed":16062,"inst":16063,"Ġcancellation":16064,"ĠShaun":16065,"Ġleve":16066,"Ġdivisive":16067,"Ġhel":16068,"Ġfatigue":16069,"ĠSchwartz":16070,"ĠKirst":16071,"Ġarise":16072,"Ġgrandson":16073,"ĠLawson":16074,"Ġcollaborate":16075,"Ġparticipant":16076,"ĠBryce":16077,"Ġinfield":16078,"mid":16079,"Ġut":16080,"Ġnotices":16081,"Ġsneak":16082,"ĠPAR":16083,"Chris":16084,"Ġutilize":16085,"ĠByron":16086,"ĠZhang":16087,"PF":16088,"Ġoverwhelmingly":16089,"Ġvegetable":16090,"Ġabsurd":16091,"ĠChem":16092,"etime":16093,"Ġenvoy":16094,"Ġlover":16095,"length":16096,"Ġrevolutionary":16097,"ĠYam":16098,"Ġshutting":16099,"mt":16100,"super":16101,"ĠToby":16102,"ĠCoca":16103,"Ġproposition":16104,"Ġembracing":16105,"Ġversatile":16106,"ĠWalking":16107,"Ġillicit":16108,"Ġnude":16109,"Ġunpredictable":16110,"take":16111,"Ġgotta":16112,"ĠXiaomi":16113,"Ġinstit":16114,"ĠPep":16115,"ĠPearson":16116,"Ġrejection":16117,"stead":16118,"Ġmut":16119,"Ġoutspoken":16120,"ĠBaghdad":16121,"ĠFly":16122,"Ġwholly":16123,"ĠRM":16124,"ĠFa":16125,"Ġcleaner":16126,"frey":16127,"ĠHab":16128,"ĠLiber":16129,"Ġwhereabouts":16130,"Ġchefs":16131,"Ġalumni":16132,"Ġstopp":16133,"dd":16134,"forward":16135,"rast":16136,"ĠNash":16137,"ĠCort":16138,"Ġpotent":16139,"Ġmold":16140,"Ġdistinctive":16141,"chip":16142,"ĠBrunswick":16143,"Ġpopulist":16144,"Ġplagued":16145,"eka":16146,"ĠIOC":16147,"ugs":16148,"ĠDob":16149,"Ġmagn":16150,"asser":16151,"hew":16152,"Ġcapturing":16153,"oos":16154,"Ġcrystal":16155,"Ġalarming":16156,"Ġ135":16157,"iating":16158,"Ġnap":16159,"umar":16160,"ĠExpl":16161,"Ġupgrading":16162,"Ġdecl":16163,"Ġoverturn":16164,"ARK":16165,"linked":16166,"ĠContinued":16167,"Ġslumped":16168,"ĠGaga":16169,"iful":16170,"ĠPosted":16171,"ĠRecommended":16172,"Ġsnake":16173,"Ġexplosives":16174,"Ġhind":16175,"Ġcontempt":16176,"Ġmock":16177,"NBA":16178,"Ġstall":16179,"Ġorganisers":16180,"Ġingredient":16181,"Ġblockbuster":16182,"ĠStream":16183,"ĠLeah":16184,"Pic":16185,"Ġventures":16186,"oman":16187,"Ġweakening":16188,"Ġmaximize":16189,"Ġdigging":16190,"uez":16191,"Ġdistinction":16192,"ĠMali":16193,"Ġcontaminated":16194,"Ġhij":16195,"Ġcrafts":16196,"Fl":16197,"Ġcloset":16198,"ĠRapp":16199,"Ġtowers":16200,"Ġamenities":16201,"Ġopioids":16202,"Ġcontend":16203,"load":16204,"ĠJol":16205,"ĠBooks":16206,"Ġsim":16207,"Ġthrilling":16208,"Ġmeter":16209,"ĠMultiple":16210,"Ġarbitration":16211,"Ġcracked":16212,"Pl":16213,"Ġphotographers":16214,"Te":16215,"ĠSidd":16216,"Ġexplored":16217,"170":16218,"Ġpleasant":16219,"ĠCapitals":16220,"ĠRi":16221,"ĠRandall":16222,"overed":16223,"Ġchar":16224,"ĠEverybody":16225,"ĠPolitics":16226,"Ġmoisture":16227,"Ġthriving":16228,"ĠScotia":16229,"arded":16230,"imb":16231,"ĠFantasy":16232,"Ġcemetery":16233,"ĠPath":16234,"eur":16235,"ĠSec":16236,"ĠPlatform":16237,"Ġdeparted":16238,"ĠVIDEO":16239,"ĠPant":16240,"ĠSyn":16241,"Ġ230":16242,"bleacher":16243,"live":16244,"Ġprob":16245,"Ġgymn":16246,"Ġjudged":16247,"orns":16248,"Ġstemming":16249,"umbling":16250,"ĠHew":16251,"ĠCheryl":16252,"Ġconsciousness":16253,"cos":16254,"ĠTate":16255,"CNN":16256,"Ġrecognizing":16257,"meg":16258,"Ġpant":16259,"ulk":16260,"MM":16261,"ĠPrescott":16262,"ĠMarcel":16263,"anas":16264,"Ġhappier":16265,"mag":16266,"ĠLov":16267,"Ġspreads":16268,"ĠSample":16269,"Ġpopped":16270,"HR":16271,"ĠMitt":16272,"Ġ00":16273,"Ġlabeled":16274,"Ġaspirations":16275,"?)":16276,"Ġloads":16277,"ĠBritt":16278,"hurst":16279,"ĠTeams":16280,"Ġextremists":16281,"ĠClement":16282,"lings":16283,"shirts":16284,"cheon":16285,"ĠDEL":16286,"ĠLocation":16287,"Ġpresentations":16288,"ĠFalcon":16289,"Ġtoddler":16290,"kl":16291,"Ġprone":16292,"Ġcommemor":16293,"ĠStanton":16294,"201":16295,"Ġranges":16296,"Ġfielder":16297,"Ġattends":16298,"rade":16299,"Ġproactive":16300,"Ġhostage":16301,"ĠGriffith":16302,"ockey":16303,"ĠAdding":16304,"ĠAFL":16305,"gas":16306,"istics":16307,"Ġsurgeon":16308,"Ġtsunami":16309,"2014":16310,"Ġconstraints":16311,"cu":16312,"Ġsurrendered":16313,"azed":16314,"ĠAirbnb":16315,"650":16316,"zed":16317,"Ġinjustice":16318,"dog":16319,"full":16320,"ĠHear":16321,"Ġsprawling":16322,"Ġhomeland":16323,"ĠSG":16324,"anced":16325,"Ġpools":16326,"ĠCE":16327,"Ġbeers":16328,"AE":16329,"ĠJac":16330,"Ġrecurring":16331,"Writing":16332,"Ġgenius":16333,"ĠFrost":16334,"Ġgrounded":16335,"Ġallege":16336,"lessness":16337,"Ġjumper":16338,"Ġvicious":16339,"Ġsecretly":16340,"Ġhacked":16341,"ĠAmsterdam":16342,"ibu":16343,"Ġ1971":16344,"ĠRosenstein":16345,"nick":16346,"arge":16347,"Ġladder":16348,"elled":16349,"Ġsatellites":16350,"Ġassassination":16351,"ĠDepot":16352,"built":16353,"Ġunrelated":16354,"maid":16355,"ĠDod":16356,"ĠVanderbilt":16357,"Ġboundary":16358,"ĠStafford":16359,"ĠBry":16360,"Ġtribunal":16361,"Ġoutings":16362,"Ġquantity":16363,"imming":16364,"ĠBlacks":16365,"Br":16366,"eri":16367,"uffed":16368,"Ġexplicitly":16369,"ĠBieber":16370,"AKING":16371,"Ġphotographed":16372,"ĠPolit":16373,"Ġpremature":16374,"hered":16375,"ĠVi":16376,"Ġmarsh":16377,"casters":16378,"ĠKra":16379,"Ġdried":16380,"Ġcafe":16381,"eting":16382,"Ġshaping":16383,"aram":16384,"orf":16385,"Ġrichest":16386,"Ġhurricanes":16387,"Ġcommands":16388,"Gl":16389,"anth":16390,"Ġstunt":16391,"Ġyearly":16392,"Ġdefeats":16393,"Ġconsultancy":16394,"call":16395,"Ġlag":16396,"adh":16397,"ĠPalestine":16398,"Ġcustomized":16399,"ĠScar":16400,"ĠWesley":16401,"ready":16402,"Ġpersist":16403,"Ġpacking":16404,"ono":16405,"Ġdischarged":16406,"Ġpouring":16407,"sburg":16408,"Ġreconsider":16409,"ĠMethod":16410,"enez":16411,"cill":16412,"Ġsecular":16413,"pers":16414,"Ġple":16415,"ELS":16416,"ĠMine":16417,"Ġpushes":16418,"Us":16419,"Ġframes":16420,"ĠNets":16421,"ĠSiem":16422,"ĠHitler":16423,"kill":16424,"Ġrented":16425,"Ġcharm":16426,"Ġpulls":16427,"ĠTide":16428,"Ġinsufficient":16429,"itted":16430,"Care":16431,"iera":16432,"Ġcouch":16433,"aders":16434,"ext":16435,"ĠCitizen":16436,"Ġlogical":16437,"ĠMeadows":16438,"ĠDenis":16439,"ĠDrivers":16440,"Ġrepublic":16441,"Ġadvising":16442,"Ġparamedics":16443,"insky":16444,"illard":16445,"encia":16446,"Ġkh":16447,"Ġrh":16448,"Ġfinalized":16449,"Ġreins":16450,"ĠFarrell":16451,"Ġsteer":16452,"Ġproxy":16453,"unes":16454,"ĠSoul":16455,"ĠCopper":16456,"ĠKenyan":16457,"amped":16458,"conference":16459,"sted":16460,"ĠLon":16461,"Ġreplay":16462,"ĠBle":16463,"Ġvibe":16464,"Ġportfolios":16465,"sea":16466,"Ġbeautifully":16467,"Ġairs":16468,"ĠRap":16469,"ĠKatrina":16470,"Ġberth":16471,"gold":16472,"ĠIsaiah":16473,"iques":16474,"elson":16475,"Ġrelentless":16476,"ĠHighland":16477,"ĠPhilippe":16478,"ĠFol":16479,"Ġenduring":16480,"enz":16481,"Ġaer":16482,"icing":16483,"ĠHTC":16484,"Ġdoping":16485,"ĠAlb":16486,"Ġsom":16487,"icia":16488,"Ġcoroner":16489,"Ġdamn":16490,"Ġ119":16491,"Ġwiped":16492,"ĠAuditor":16493,"hern":16494,"ĠJew":16495,"endra":16496,"osp":16497,"ĠRory":16498,"Ġshapes":16499,"ĠPablo":16500,"Ġforemost":16501,"ĠHos":16502,"ĠCunningham":16503,"145":16504,"ĠRecovery":16505,"!!!":16506,"western":16507,"Ġimaging":16508,"ĠRookie":16509,"ĠMTV":16510,"Ġunc":16511,"ĠSporting":16512,"Ġpatrons":16513,"ĠCoverage":16514,"ĠObservatory":16515,"Ġfishermen":16516,"ĠProvince":16517,"ĠAston":16518,"ĠOsh":16519,"ĠWeekend":16520,"Ġrecruits":16521,"Ġdensity":16522,"FM":16523,"ĠGorsuch":16524,"ĠErie":16525,"lining":16526,"Ġshowcased":16527,"ĠRubio":16528,"Ġchaotic":16529,"Ġattractions":16530,"Ġhug":16531,"ĠHerbert":16532,"ĠRespond":16533,"Ġhappily":16534,"Ġtor":16535,"ĠOTHER":16536,"runner":16537,"ĠShakespeare":16538,"Ġstretching":16539,"ĠJudy":16540,"wyn":16541,"ĠCafe":16542,"Ġgreens":16543,"ĠHend":16544,"Ġglam":16545,"iation":16546,"ĠKingston":16547,"Ġincremental":16548,"Live":16549,"ĠBraun":16550,"USS":16551,"reb":16552,"Ġimperative":16553,"Ġsympathy":16554,"Ġrefuge":16555,"Ġadministered":16556,"rance":16557,"ĠLiberia":16558,"Ġmobil":16559,"heads":16560,"Ġinevitably":16561,"ĠEugene":16562,"ĠBerkshire":16563,"ĠHarbour":16564,"ĠTrends":16565,"TB":16566,"Ġdeficits":16567,"Ġlistings":16568,"Ġreadings":16569,"Ġtumor":16570,"Ġoffic":16571,"opy":16572,"Ġdistracted":16573,"Ġappropriately":16574,"ĠWillis":16575,"Ġskirt":16576,"ĠTea":16577,"Ġshades":16578,"Ġbargaining":16579,"Ġretention":16580,"ĠConcert":16581,"ĠMeteor":16582,"ĠCustom":16583,"Ġinputs":16584,"ĠSah":16585,"enta":16586,"Love":16587,"ĠBurg":16588,"ĠCynthia":16589,"ĠMoses":16590,"ubb":16591,"Ġpeoples":16592,"dh":16593,"ĠFro":16594,"bean":16595,"Ġcigarette":16596,"tta":16597,"umm":16598,"Ġphenomenal":16599,"Ġyelling":16600,"Ġinaug":16601,"Ġconven":16602,"ĠGore":16603,"request":16604,"Ġcolonial":16605,"ĠAleppo":16606,"Ġdemolition":16607,"Ġamounted":16608,"Ġstaggering":16609,"Ġclips":16610,"Ġinconsistent":16611,"ĠMilton":16612,"ĠWireless":16613,"ĠReno":16614,"ĠPerkins":16615,"Ġunusually":16616,"Ġmemor":16617,"Ġhectares":16618,"Ġlat":16619,"central":16620,"ĠDig":16621,"ĠMarina":16622,"ĠPartner":16623,"daily":16624,"your":16625,"Reilly":16626,"Ġpope":16627,"phy":16628,"Ġassessing":16629,"ĠRodrigo":16630,"wi":16631,"Ġcompatible":16632,"imate":16633,"Ġgentle":16634,"ĠRhodes":16635,"Brexit":16636,"ieve":16637,"Ġbreaches":16638,"Ġchopped":16639,"Ġcancers":16640,"VEL":16641,"Ġsluggish":16642,"ĠUltra":16643,"ĠUl":16644,"Ġcrises":16645,"ONE":16646,"ĠEquipment":16647,"Ġcater":16648,"Ġadjourn":16649,"Ġreadily":16650,"ĠRolling":16651,"ĠBott":16652,"inel":16653,"ĠRule":16654,"Ġgrind":16655,"ĠHussain":16656,"ussie":16657,"Ġdepressed":16658,"ĠImperial":16659,"ongo":16660,"Ġuniforms":16661,"Ġ117":16662,"Ġchambers":16663,"ĠDum":16664,"ifi":16665,"ĠBetty":16666,"ĠTA":16667,"Ġpromotions":16668,"itary":16669,"Ġcried":16670,"Ġbranding":16671,"ĠBahamas":16672,"ĠDat":16673,"Ġantibiotics":16674,"ĠAus":16675,"Ġumbrella":16676,"Ġgradual":16677,"Ġaltercation":16678,"Ġlure":16679,"ĠJakarta":16680,"Ġunified":16681,"chin":16682,"ettes":16683,"ĠRwanda":16684,"ulations":16685,"Ġbrink":16686,"Ġbroadcasting":16687,"ĠArtist":16688,"Ġrecon":16689,"Ġaqu":16690,"ĠServ":16691,"999":16692,"ĠParticipants":16693,"ĠVentures":16694,"fight":16695,"Ġactivism":16696,"Ġstructured":16697,"Ġportal":16698,"Ġtendency":16699,"ĠAssociate":16700,"Ġcalf":16701,"ĠOrd":16702,"ĠTi":16703,"ĠFrancois":16704,"uary":16705,"ĠVik":16706,"urchase":16707,"Ġfried":16708,"Ġbooming":16709,"Ġparticles":16710,"amas":16711,"INA":16712,"Super":16713,"supp":16714,"urring":16715,"ĠWatts":16716,"affer":16717,"ĠDEC":16718,"Ġroadway":16719,"border":16720,"Ġsequ":16721,"entially":16722,"ieg":16723,"Ġcamping":16724,"Ġ750":16725,"Ġcycles":16726,"ĠReese":16727,"ĠFellow":16728,"isters":16729,"ĠVehicle":16730,"kies":16731,"ĠJonas":16732,"Ġfoundations":16733,"ĠNigel":16734,"Ġstab":16735,"Ġcongressman":16736,"ĠWichita":16737,"antes":16738,"Ġprogression":16739,"Ġditch":16740,"lik":16741,"Ġsid":16742,"Ġele":16743,"ĠMund":16744,"Ġstairs":16745,"lete":16746,"Ġlingering":16747,"Ġsadly":16748,"Ġay":16749,"Em":16750,"Ġdeadliest":16751,"soon":16752,"Ġtangible":16753,"Ġabusing":16754,"Ġcomprises":16755,"vil":16756,"ĠBun":16757,"Ġdoubling":16758,"Ġcommun":16759,"Ġslogan":16760,"Ġloading":16761,"Ġshallow":16762,"Ġattributes":16763,"Che":16764,"Ġcheering":16765,"Ġrefuses":16766,"cam":16767,"bes":16768,"hon":16769,"ĠSpartans":16770,"cept":16771,"ĠComputer":16772,"ĠCanberra":16773,"ĠWARNING":16774,"Ġstuffed":16775,"block":16776,"ĠJennings":16777,"ĠAU":16778,"atin":16779,"Ġom":16780,"Ġbachelor":16781,"Ġprediction":16782,"ĠWinner":16783,"agne":16784,"Ġrob":16785,"ĠKatherine":16786,"Ġli":16787,"ĠHumph":16788,"ĠPEOPLE":16789,"IRO":16790,"Cola":16791,"Ġguitarist":16792,"isen":16793,"ĠHighlights":16794,"Ġwelcomes":16795,"Ġprisoner":16796,"Ġpsychology":16797,"Ġextradition":16798,"Ġrou":16799,"ĠLund":16800,"Ġthoughtful":16801,"RY":16802,"orman":16803,"Alex":16804,"Ġlaughter":16805,"Ġfumble":16806,"Ġsynthetic":16807,"Ġdigit":16808,"ĠRoc":16809,"ĠFactory":16810,"ellery":16811,"ishment":16812,"ilar":16813,"ĠEarl":16814,"ĠSutton":16815,"ĠJur":16816,"ĠAllan":16817,"ĠKoreans":16818,"uki":16819,"Ġculinary":16820,"PU":16821,"Stock":16822,"stars":16823,"ĠDayton":16824,"beck":16825,"Ġinstability":16826,"ĠBring":16827,"Ġbreeding":16828,"Ġmiracle":16829,"bons":16830,"Ġdonating":16831,"ĠKick":16832,"ĠSag":16833,"afi":16834,"Ġharassed":16835,"asm":16836,"Their":16837,"inity":16838,"Ġacademics":16839,"Ġstatute":16840,"ĠAmit":16841,"Ġpressured":16842,"east":16843,"\"),":16844,"iso":16845,"220":16846,"Ġairplane":16847,"ĠMcCabe":16848,"ctions":16849,"ĠMesa":16850,"Ġsensational":16851,"ĠFE":16852,"ĠNeigh":16853,"Ġbribery":16854,"Ġflaws":16855,"Ġfemales":16856,"Ġmisses":16857,"ĠColor":16858,"ĠVietnamese":16859,"ĠMental":16860,"Unfortunately":16861,"ĠPont":16862,"Ġ1940":16863,"dry":16864,"ĠGazette":16865,"ĠAns":16866,"Ġwhistle":16867,"Ġsymbolic":16868,"Ġpossessions":16869,"ĠDriver":16870,"Ġbracket":16871,"ĠReign":16872,"oji":16873,"Ġoct":16874,"Ġtube":16875,"ĠFelix":16876,"Ġtranslated":16877,"Ġpromptly":16878,"ĠErnest":16879,"arth":16880,"Ġdumb":16881,"Ġinfluences":16882,"taking":16883,"Ġprivat":16884,"erers":16885,"Ġmalware":16886,"Ġpredictable":16887,"Ġtighten":16888,"Ġheights":16889,"Ġfairness":16890,"facing":16891,"Ġrematch":16892,"Ġpoet":16893,"Ġfundamentally":16894,"Ġcoveted":16895,"Ġlivelihood":16896,"ĠABOUT":16897,"Ġsourced":16898,"Ġdeferred":16899,"Ġslashed":16900,"ĠSchultz":16901,"Ġtriggering":16902,"ĠShiv":16903,"Ġlithium":16904,"ahead":16905,"Ġleisure":16906,"Ġbackpack":16907,"ilateral":16908,"ĠNuclear":16909,"ĠLeone":16910,"ĠNice":16911,"Ġenthusiasts":16912,"September":16913,"Ġenroll":16914,"ĠWear":16915,"erey":16916,"angs":16917,"such":16918,"Ġunpopular":16919,"Ġdisciplined":16920,"Ġshrinking":16921,"ĠBrewing":16922,"ĠReally":16923,"Ġdirective":16924,"175":16925,"Ġnotifications":16926,"Ġfortunes":16927,"ĠHour":16928,"ĠGan":16929,"ĠChurchill":16930,"ĠDodge":16931,"ĠJeep":16932,"Ġsour":16933,"Ġderived":16934,"Ġft":16935,"riv":16936,"Ġlaundry":16937,"Ġfentanyl":16938,"ĠSioux":16939,"achi":16940,"workers":16941,"Ġworkload":16942,"rooms":16943,"ĠQU":16944,"ĠTruth":16945,"Ġdefenses":16946,"Ġdunk":16947,"IJ":16948,"Ġderby":16949,"ĠMotion":16950,"ĠMayo":16951,"ĠIke":16952,"Ġpreferences":16953,"Ġped":16954,"elman":16955,"moon":16956,"Ġshoots":16957,"ĠNoel":16958,"Ġmilit":16959,"ĠCambodia":16960,"ĠMLA":16961,"Ġhonoured":16962,"fast":16963,"Ġalgorithms":16964,"Ġstormed":16965,"NT":16966,"Benz":16967,"Ġvaccines":16968,"Ġmarching":16969,"Ġ118":16970,"ĠWilmington":16971,"GM":16972,"coin":16973,"Ġunderwater":16974,"ĠClearly":16975,"Ġorgans":16976,"mir":16977,"Ġdenounced":16978,"pless":16979,"imal":16980,"ĠKom":16981,"Ġfatalities":16982,"Ġyoungster":16983,"Ġthirty":16984,"Ġinternally":16985,"222":16986,"Ġdemonstrating":16987,"Ġbusiest":16988,"Ġperpetrators":16989,"Ġstun":16990,"Both":16991,"ĠMcCoy":16992,"gn":16993,"ĠDalton":16994,"ĠDAY":16995,"Ġsacred":16996,"Ġconsuming":16997,"Ġ(+":16998,"ĠPioneer":16999,"ĠApplications":17000,"ĠBolt":17001,"ĠBarkley":17002,"ĠExpo":17003,"ĠLore":17004,"ĠPrivacy":17005,"ĠHarley":17006,"Ġtractor":17007,"Ġtenth":17008,"ĠHaiti":17009,"ÃŃn":17010,"ĠTVs":17011,"ĠCathedral":17012,"Ġunite":17013,"Ġbinding":17014,"oks":17015,"ĠJenny":17016,"Ġcaller":17017,"ĠIngram":17018,"ĠPrairie":17019,"Ġrunoff":17020,"Ġasserted":17021,"icit":17022,"ĠSie":17023,"102":17024,"ĠMB":17025,"Ġobstruction":17026,"Ġgroom":17027,"Ġtolerate":17028,"Ġcans":17029,"forth":17030,"Ġvillain":17031,"Ġdefining":17032,"ĠFrenchman":17033,"otte":17034,"Ġcontr":17035,"clock":17036,"onder":17037,"Ġprolific":17038,"ĠElectronic":17039,"ĠSak":17040,"annie":17041,"ASS":17042,"Ġmultinational":17043,"Associated":17044,"IZ":17045,"ĠBelle":17046,"Ġmand":17047,"asis":17048,"Mac":17049,"Ġpretend":17050,"ĠCommunication":17051,"Ġheartbreaking":17052,"ĠShepherd":17053,"ĠBIG":17054,"mph":17055,"ĠShield":17056,"ĠLiv":17057,"ĠStatus":17058,"Ġbikini":17059,"Ġranch":17060,"Ġpeacefully":17061,"ITCH":17062,"bourne":17063,"ĠVariety":17064,"Ġstationed":17065,"Ġhed":17066,"Ġexhausted":17067,"Ġsurpassed":17068,"Ġcatalyst":17069,"Ġsmuggling":17070,"uating":17071,"Ġ123":17072,"Ġdup":17073,"ĠSul":17074,"conf":17075,"jit":17076,"Ġmaiden":17077,"asta":17078,"ĠCalvin":17079,"borne":17080,"Ġgrim":17081,"Ġtort":17082,"cott":17083,"olas":17084,"NR":17085,"Ġbreakout":17086,"ĠHun":17087,"ĠGuatemala":17088,"Ġhistorian":17089,"ĠLawyers":17090,"ĠDisplay":17091,"Ġobstruct":17092,"ĠOsborne":17093,"Ġtherapies":17094,"ĠAub":17095,"Ġinjunction":17096,"stroke":17097,"Ġseafood":17098,"Ġhazardous":17099,"ĠWolver":17100,"ĠViolence":17101,"ĠBillion":17102,"ĠLetter":17103,"ĠWorldwide":17104,"Real":17105,"Ġexpires":17106,"Ġflawed":17107,"European":17108,"Ġrigorous":17109,"ĠSimilar":17110,"ĠSurface":17111,"ĠEF":17112,"mys":17113,"ĠFunds":17114,"ographer":17115,"Ġtribes":17116,"Ġspouse":17117,"Ġunsure":17118,"aways":17119,"Ġtrainers":17120,"arie":17121,"ĠZar":17122,"ĠComedy":17123,"ĠLit":17124,"ĠNoon":17125,"Ġgallon":17126,"Ġconsulate":17127,"ĠBras":17128,"iology":17129,"onies":17130,"ĠBelichick":17131,"ĠRoot":17132,"ĠLux":17133,"ĠSed":17134,"ĠTos":17135,"Ġinherited":17136,"tw":17137,"Ġdeaf":17138,"Ġdriveway":17139,"jah":17140,"ĠScientific":17141,"ĠNottingham":17142,"both":17143,"awan":17144,"Ġnut":17145,"ĠLebanese":17146,"ĠAAA":17147,"ĠSuzuki":17148,"ĠBU":17149,"ells":17150,"Ġspecify":17151,"ĠNotes":17152,"Ġvoluntarily":17153,"ĠMolly":17154,"Ġoutskirts":17155,"Ġbehaviors":17156,"Ġmilitia":17157,"Ġsplash":17158,"Ġpersonalized":17159,"ĠFiat":17160,"ĠKind":17161,"ĠTruck":17162,"py":17163,"ĠWIN":17164,"dist":17165,"itational":17166,"APP":17167,"ĠPelicans":17168,"ĠGam":17169,"mel":17170,"Ġmandated":17171,"Ġbalances":17172,"ĠWizards":17173,"iary":17174,"ĠAvailable":17175,"Ġkay":17176,"jin":17177,"eyed":17178,"Ġsterling":17179,"Ġconcealed":17180,"ĠFedEx":17181,"ĠPO":17182,"ĠJacqu":17183,"anted":17184,"eme":17185,"ĠDefensive":17186,"manship":17187,"Ġreliever":17188,"Ġshortstop":17189,"Ġphot":17190,"ĠGain":17191,"ĠConcern":17192,"due":17193,"Ġalgorithm":17194,"fell":17195,"ĠMountains":17196,"icians":17197,"Ġhonoring":17198,"Ġuploaded":17199,"Ġtore":17200,"GH":17201,"orde":17202,"ĠCoin":17203,"ĠAven":17204,"Ġliterary":17205,"Before":17206,"Ġtactic":17207,"Ġsocially":17208,"ĠSik":17209,"Ġthermal":17210,"Ġhor":17211,"price":17212,"Ġrooted":17213,"arrow":17214,"Ġcirculating":17215,"Ġlaughs":17216,"ĠLines":17217,"lig":17218,"Ġjudgement":17219,"....":17220,"Ġsewer":17221,"Ġdancer":17222,"ĠPens":17223,"Ġsig":17224,"ische":17225,"wives":17226,"Ġgran":17227,"ĠBron":17228,"ĠHyde":17229,"yards":17230,"Ġcandidacy":17231,"Ġhey":17232,"Ġcontributors":17233,"ĠUpdated":17234,"Ġ190":17235,"Ġhalls":17236,"Ġemphas":17237,"ĠCherry":17238,"Ġrim":17239,"Ġbilled":17240,"Ġbaked":17241,"ĠPopular":17242,"lb":17243,"Ġgravity":17244,"Under":17245,"Ġreservation":17246,"organ":17247,"ĠPict":17248,"ĠWhitney":17249,"Ġonboard":17250,"NEY":17251,"ĠBreaking":17252,"Ġflagged":17253,"rar":17254,"ĠBasic":17255,"ĠDomestic":17256,"ĠPent":17257,"Ġvigilant":17258,"Ġzoning":17259,"Fire":17260,"Ġcorrected":17261,"isbury":17262,"ĠLaure":17263,"ĠDevon":17264,"print":17265,"ĠTopics":17266,"ĠFuel":17267,"Ġcirculation":17268,"ĠPratt":17269,"Ġskiing":17270,"Ġtornado":17271,"dep":17272,"ĠUnless":17273,"ifting":17274,"Ġfool":17275,"should":17276,"Ġinspectors":17277,"Ġprotested":17278,"Ġba":17279,"ussia":17280,"Ġspun":17281,"grass":17282,"phone":17283,"Ġpotato":17284,"ĠBehind":17285,"cil":17286,"Ġconcession":17287,"Ġapplause":17288,"ĠChin":17289,"Ġceremonies":17290,"pit":17291,"Ġtraumatic":17292,"Ġbasics":17293,"Ġparameters":17294,"ĠMoz":17295,"ĠAIDS":17296,"Ph":17297,"Ġjudging":17298,"Ġlecture":17299,"Ġmunicipality":17300,"Ġcardiac":17301,"ogan":17302,"pir":17303,"could":17304,"Channel":17305,"Ġshattered":17306,"ĠAV":17307,"continental":17308,"chie":17309,"ibi":17310,"ĠOy":17311,"Mon":17312,"ĠCN":17313,"WC":17314,"Ġdistributor":17315,"ĠSavannah":17316,"Ġcleaned":17317,"ĠFlores":17318,"Ġembarrassed":17319,"Ġclay":17320,"Ġvolcano":17321,"Ġstressful":17322,"Ġsummoned":17323,"ĠSeg":17324,"Ġstatistical":17325,"ĠShak":17326,"Ġadequately":17327,"worthy":17328,"fighting":17329,"alan":17330,"Ġnecessity":17331,"Ġresidency":17332,"Ġsober":17333,"arius":17334,"ĠTaj":17335,"mount":17336,"wards":17337,"Ġaesthetic":17338,"Coin":17339,"ĠDew":17340,"were":17341,"SK":17342,"Ġpowerhouse":17343,"Ġcleanup":17344,"ĠWITH":17345,"ĠHers":17346,"ĠRao":17347,"ĠFlyers":17348,"Ġdominating":17349,"issued":17350,"ĠMcGr":17351,"Ġinsurgency":17352,"Ġburial":17353,"ĠPlains":17354,"ensive":17355,"ĠPresent":17356,"Mo":17357,"Ġnerves":17358,"Ġsmoothly":17359,"staff":17360,"Ġrestoring":17361,"ĠGeneration":17362,"Ġcommuters":17363,"ĠLegend":17364,"ĠGad":17365,"lied":17366,"Ġissuer":17367,"ĠDozens":17368,"Ġphases":17369,"ĠWu":17370,"ĠTunisia":17371,"ĠPacers":17372,"Ġdur":17373,"ĠIG":17374,"annon":17375,"sided":17376,"Ġvo":17377,"ĠNI":17378,"Ġvitamin":17379,"Ġsoc":17380,"Ġimmunity":17381,"Ġgenerates":17382,"ĠMcGu":17383,"Ġexplores":17384,"Ġassistants":17385,"Ġstems":17386,"ushed":17387,"ĠZak":17388,"ĠOwners":17389,"Ġvariant":17390,"ardy":17391,"ĠNewark":17392,"ĠCatalonia":17393,"Ġautonomy":17394,"Ġgreet":17395,"Ġawait":17396,"ĠLuckily":17397,"ĠTicket":17398,"ĠSTOR":17399,"asy":17400,"Ġincorrect":17401,"Ġconsisting":17402,"Ġperspectives":17403,"ĠQuint":17404,"Ġtotaling":17405,"Ġnortheastern":17406,"Ġcharacterized":17407,"Ġsurfaces":17408,"nation":17409,"Ġprevents":17410,"ĠSho":17411,"Ġelectorate":17412,"Ġshortfall":17413,"chy":17414,"aws":17415,"ĠAddress":17416,"Ġdefensively":17417,"quel":17418,"chester":17419,"Ġterr":17420,"ahu":17421,"lined":17422,"ĠNev":17423,"unn":17424,"Def":17425,"pc":17426,"ĠSig":17427,"Ġnonetheless":17428,"ĠSundays":17429,"ĠBAS":17430,"Ġpolicemen":17431,"ĠGoal":17432,"apa":17433,"Ġrope":17434,"Ġoutage":17435,"ĠPaso":17436,"Ġsadness":17437,"ĠGrowing":17438,"ĠKyr":17439,"Ġale":17440,"ĠBreitbart":17441,"ĠVia":17442,"ĠBrig":17443,"idence":17444,"Ġ145":17445,"quire":17446,"Ġdistraction":17447,"ĠOdd":17448,"ĠSimply":17449,"ĠNin":17450,"Ġcompetent":17451,"ded":17452,"iper":17453,"ĠKaty":17454,"ĠSolomon":17455,"Ġfeeds":17456,"ĠMort":17457,"ĠRica":17458,"affe":17459,"Ġcooperating":17460,"Ġarrivals":17461,"Ġdelete":17462,"ĠAth":17463,"Ġtrustees":17464,"Ġtub":17465,"Ġsaga":17466,"otes":17467,"ĠCJ":17468,"Ġexited":17469,"stakes":17470,"Ġinflu":17471,"2000":17472,"ĠDonovan":17473,"ĠNur":17474,"Ġoutline":17475,"Ġaudition":17476,"oked":17477,"ĠJag":17478,"money":17479,"Ġcardiovascular":17480,"song":17481,"ĠOften":17482,"ĠGoff":17483,"ĠOaks":17484,"Will":17485,"acon":17486,"Ġ?":17487,"Har":17488,"ĠLambert":17489,"atoon":17490,"ĠAF":17491,"ĠMavericks":17492,"nia":17493,"ĠChennai":17494,"\"},\"":17495,"Ġpairing":17496,"mad":17497,"ause":17498,"ĠRide":17499,"111":17500,"ĠFallon":17501,"ĠHyder":17502,"ĠPiper":17503,"Ġfilmmakers":17504,"icon":17505,"ĠBeau":17506,"Ġbutt":17507,"lot":17508,"Ġrifles":17509,"Ġsunglasses":17510,"ĠTRA":17511,"Ġmagnetic":17512,"arty":17513,"ĠYo":17514,"ĠWeight":17515,"?!":17516,"ether":17517,"Ġaspir":17518,"Ġhunters":17519,"Ġcontamination":17520,"Ben":17521,"political":17522,"],\"":17523,"ĠBever":17524,"Ġmonuments":17525,"won":17526,"auc":17527,"Ġexpressions":17528,"Ġlakes":17529,"iao":17530,"abin":17531,"Ġpleading":17532,"Ġdiscounted":17533,"Ġdisappoint":17534,"ĠTW":17535,"craft":17536,"Ġsocieties":17537,"ĠAugusta":17538,"Ġbott":17539,"Ġmarker":17540,"ĠWrestling":17541,"CBC":17542,"athy":17543,"ĠAZ":17544,"Ġfabulous":17545,"valued":17546,"Ġoptical":17547,"Ġshaken":17548,"OSS":17549,"ĠImp":17550,"ĠAUD":17551,"inals":17552,"Ġrevital":17553,"Ġcontroller":17554,"Ġgrasp":17555,"uling":17556,"ĠFrederick":17557,"ague":17558,"bull":17559,"ĠLadies":17560,"Ġdisruptive":17561,"Ġbenefiting":17562,"Ġverge":17563,"ĠDak":17564,"Ġgrabs":17565,"ĠPAC":17566,"GN":17567,"ĠMcMahon":17568,"rob":17569,"ĠEspecially":17570,"ĠChrome":17571,"ĠBundesliga":17572,"104":17573,"Ġliberty":17574,"ĠSF":17575,"Ġvarieties":17576,"East":17577,"Ġgrowers":17578,"Ġsocialist":17579,"Ġunemployed":17580,"AMI":17581,"Ġtotals":17582,"ĠGib":17583,"Ġdefect":17584,"ĠOrtiz":17585,"ĠPerfect":17586,"Ġpraying":17587,"ISS":17588,"Ġul":17589,"Ġthrust":17590,"osc":17591,"ĠOtherwise":17592,"Ġobsessed":17593,"Ġ650":17594,"ĠWebsite":17595,"Ġspectators":17596,"ĠScout":17597,"ĠBoone":17598,"ĠDillon":17599,"Ġabortions":17600,"lect":17601,"utz":17602,"Ġvillagers":17603,"Ġaccelerating":17604,"Ġslap":17605,"Ġvague":17606,"Ġjurisdictions":17607,"League":17608,"ĠUruguay":17609,"Ġobstacle":17610,"Ġmanufactures":17611,"Ġcampaigned":17612,"ĠAdvance":17613,"ĠNort":17614,"emer":17615,"Ġ1964":17616,"Ġirre":17617,"Ġprog":17618,"ĠFeatured":17619,"Ġcommute":17620,"Ġhandset":17621,"akis":17622,"ĠArs":17623,"tail":17624,"iker":17625,"Ġcrafted":17626,"Ġupl":17627,"ĠMarcos":17628,"Looking":17629,"Ġseated":17630,"ĠBoat":17631,"Ġreadiness":17632,"ĠLLP":17633,"otechnology":17634,"facebook":17635,"ĠScouts":17636,"ĠEar":17637,"ĠAdv":17638,"ĠDemocracy":17639,"NI":17640,"oci":17641,"ĠSnapdragon":17642,"Saturday":17643,"ĠPra":17644,"ĠCoastal":17645,"ĠVoters":17646,"ĠLeigh":17647,"ohn":17648,"orry":17649,"Ġtechnicians":17650,"armed":17651,"Ġshrink":17652,"Ġspinning":17653,"agram":17654,"320":17655,"liner":17656,"ĠContest":17657,"ĠCountries":17658,"Ġfarewell":17659,"ĠCW":17660,"aris":17661,"Ġstorytelling":17662,"Ġpasser":17663,"Ġsailing":17664,"control":17665,"Ġdissent":17666,"ĠRih":17667,"Ġedit":17668,"Ġspoilers":17669,"itched":17670,"ĠBentley":17671,"Ġcant":17672,"mn":17673,"ĠMacy":17674,"Ġindefinitely":17675,"Ġvill":17676,"Ġmeth":17677,"ĠEL":17678,"Ġoptional":17679,"Ġremark":17680,"ĠVanessa":17681,"ã":17682,"Ġmasks":17683,"ĠProvincial":17684,"Ġculprit":17685,"ĠTol":17686,"Ġsnack":17687,"ĠInfinity":17688,"ĠPub":17689,"Ġbrakes":17690,"Ġclar":17691,"Ġinception":17692,"love":17693,"Ġwonders":17694,"Ġforged":17695,"ĠCEOs":17696,"Ġspecifications":17697,"irst":17698,"ension":17699,"ĠMarin":17700,"det":17701,"Ġordeal":17702,"ĠFeed":17703,"December":17704,"Ġstrokes":17705,"fect":17706,"orial":17707,"Ġshowcasing":17708,"Ġstack":17709,"UAL":17710,"ĠAlexandra":17711,"Ġpoison":17712,"ĠFry":17713,"ĠCars":17714,"Ġprototype":17715,"ĠUSDA":17716,"ĠIF":17717,"flows":17718,"Ġtailored":17719,"ĠGear":17720,"Ġmyth":17721,"Ġplatinum":17722,"seven":17723,"founded":17724,"encing":17725,"ĠTip":17726,"ĠMald":17727,"Ġgeopolitical":17728,"112":17729,"Ġenqu":17730,"ĠNR":17731,"ĠNadu":17732,"leen":17733,"ĠTat":17734,"Ġcolon":17735,"ĠSize":17736,"Ġvis":17737,"Ġbere":17738,"ĠAnnie":17739,"ĠWatkins":17740,"Ġpumping":17741,"cur":17742,"ĠBates":17743,"Ġslug":17744,"miss":17745,"Ġforecasting":17746,"source":17747,"Ġacknowledges":17748,"Ġprosecute":17749,"Ġtestament":17750,"Ġcum":17751,"ems":17752,"Ġsocks":17753,"ĠSame":17754,"Ġcompetitiveness":17755,"Ġdefinitive":17756,"Ġintensified":17757,"Ġsatisfying":17758,"Ġphysics":17759,"ĠHarden":17760,"Ġsubsidy":17761,"Men":17762,"ĠPaddock":17763,"Ġworkouts":17764,"ĠSaw":17765,"Ġcrisp":17766,"ĠBezos":17767,"ĠVote":17768,"Ġguiding":17769,"anged":17770,"Ġstaple":17771,"ŀ":17772,"ules":17773,"ĠAvengers":17774,"Ġoptim":17775,"ĠBuffett":17776,"Ġtimetable":17777,"oust":17778,"HE":17779,"ĠGrab":17780,"Have":17781,"cca":17782,"Ġwaived":17783,"Ġretaining":17784,"Ġaber":17785,"Ġoffline":17786,"Ġvigil":17787,"books":17788,"ĠRein":17789,"Ġacknowledging":17790,"ĠDoyle":17791,"Ġproteins":17792,"Ġmixing":17793,"ĠAlcohol":17794,"ĠJD":17795,"Ġsyn":17796,"Ġthieves":17797,"Ġhomemade":17798,"Ġfeminist":17799,"ĠRoosevelt":17800,"ĠCoal":17801,"Ġwishing":17802,"ĠSIGN":17803,"ĠLad":17804,"Ġempathy":17805,"ĠBrooke":17806,"ĠMash":17807,"inations":17808,"''":17809,"ulators":17810,"Ġdrastically":17811,"Ġfloral":17812,"ĠGuild":17813,"Ġundercover":17814,"ĠLaboratory":17815,"ĠRank":17816,"Ġrestraining":17817,"Ġparagraph":17818,"Ġpersona":17819,"ĠEmployment":17820,"ogs":17821,"ĠGw":17822,"ĠMedal":17823,"Ġwildly":17824,"fare":17825,"ĠCNBC":17826,"photo":17827,"Ġtransforming":17828,"Ġtermination":17829,"still":17830,"INT":17831,"Ġbal":17832,"ĠEconom":17833,"ĠLarson":17834,"Ġheck":17835,"Ġquantitative":17836,"Ġemergence":17837,"esta":17838,"Ġknot":17839,"Ġwhale":17840,"ĠðŁĺ":17841,"Ġperimeter":17842,"Ġempowerment":17843,"Ġmg":17844,"Ġrents":17845,"Ġrefreshing":17846,"Ġleasing":17847,"Ġpatents":17848,"andi":17849,"Ġfathers":17850,"Ġunse":17851,"Ġprocessors":17852,"Down":17853,"Ġreversal":17854,"veh":17855,"andal":17856,"ĠKov":17857,"Blue":17858,"Ġspecializes":17859,"Link":17860,"ĠConsidering":17861,"ĠEdmund":17862,"Ġneo":17863,"agger":17864,"rg":17865,"Ġseverity":17866,"Ġcour":17867,"RL":17868,"ĠTeresa":17869,"Ġgallons":17870,"Ġacquitted":17871,"Ġaccompl":17872,"Ġcracks":17873,"Ġsciences":17874,"Club":17875,"Ġpredicts":17876,"ĠVu":17877,"Ġhints":17878,"ĠZack":17879,"Ġrefurb":17880,"Ġdestabil":17881,"ĠSamar":17882,"ĠInfo":17883,"fs":17884,"Ġratios":17885,"Ġinherent":17886,"ĠContinental":17887,"Ġtreasure":17888,"Ġcaucus":17889,"Ġenact":17890,"orporated":17891,"ineries":17892,"Ġtastes":17893,"main":17894,"Ġsq":17895,"ickson":17896,"corruption":17897,"ulture":17898,"ĠGoodman":17899,"ĠLing":17900,"ĠSup":17901,"Ġexposing":17902,"immers":17903,"Ġresponds":17904,"heimer":17905,"Air":17906,"ĠFigures":17907,"Ġlongstanding":17908,"ĠAnalytics":17909,"Ġenforced":17910,"Ġnickname":17911,"Ġclinch":17912,"ĠCarpenter":17913,"ĠPharma":17914,"Ġconstructive":17915,"Ġgel":17916,"ĠSham":17917,"ĠTOP":17918,"ĠDerrick":17919,"ör":17920,"birds":17921,"ĠTong":17922,"ĠBatman":17923,"ĠRouhani":17924,"ĠOlive":17925,"ĠRiv":17926,"Ġdessert":17927,"Ġguides":17928,"Ġsag":17929,"Ġchemotherapy":17930,"Ġslept":17931,"ĠFranc":17932,"ĠDunk":17933,"writers":17934,"ĠÃĹ":17935,"Ġ401":17936,"Ġoutfielder":17937,"ĠHamburg":17938,"izu":17939,"Ġscr":17940,"Ġcomparisons":17941,"Ġwhites":17942,"Ġtraits":17943,"Ġcollateral":17944,"LEY":17945,"ideshow":17946,"Ġstatutory":17947,"Ġruin":17948,"Ġsituated":17949,"tem":17950,"Ġinject":17951,"rage":17952,"550":17953,"Ġfactions":17954,"ĠNaomi":17955,"cutting":17956,"Ġcommunicating":17957,"Ġrailroad":17958,"Ġsparking":17959,"Ġrespiratory":17960,"ĠWebster":17961,"ĠCarbon":17962,"Ġundertaking":17963,"Ġcomposer":17964,"ĠFigure":17965,"Ġspecified":17966,"Video":17967,"uber":17968,"Ġsexuality":17969,"lected":17970,"ĠBurger":17971,"ĠCards":17972,"SR":17973,"ĠLie":17974,"Ġrecount":17975,"Ġexceeding":17976,"Ġquoting":17977,"ĠJama":17978,"ĠVictorian":17979,"Ġsway":17980,"ĠGes":17981,"ĠSI":17982,"ĠKazakhstan":17983,"Ġaccusation":17984,"etr":17985,"Ah":17986,"Ġproc":17987,"Ġlamb":17988,"ĠMorales":17989,"ĠLily":17990,"Ġderail":17991,"Ġcontributes":17992,"iddle":17993,"ĠConcord":17994,"Ġelectr":17995,"Ġequip":17996,"Ġquantum":17997,"Ġthereafter":17998,"Ġarrange":17999,"Ġraided":18000,"ĠMove":18001,"ĠSang":18002,"ĠGaming":18003,"Ġbiology":18004,"ĠAmnesty":18005,"Ġdemise":18006,"ĠBarton":18007,"Ġqualifier":18008,"ANI":18009,"Ġundersc":18010,"Ġroyalty":18011,"ĠINC":18012,"Ġsne":18013,"ariat":18014,"ĠWan":18015,"Ġcluster":18016,"quin":18017,"Ġwhales":18018,"ĠFear":18019,"ĠBrew":18020,"Ġdeport":18021,"airs":18022,"Ġcensus":18023,"OUS":18024,"Ġrespectful":18025,"bone":18026,"Ġwaivers":18027,"friend":18028,"Ġsystemic":18029,"ĠDion":18030,"James":18031,"ĠAdmission":18032,"Ġstigma":18033,"ĠTIME":18034,"Ġunderpin":18035,"ĠWitnesses":18036,"Ġdigs":18037,"Ġgenocide":18038,"Ġstaging":18039,"rolled":18040,"Ġspecially":18041,"oop":18042,"Ġbaseline":18043,"ĠRF":18044,"avis":18045,"Ġvocals":18046,"COL":18047,"LD":18048,"Ġimpending":18049,"ĠCaldwell":18050,"Ġaluminium":18051,"Ġstra":18052,"ĠTayyip":18053,"Ġadmissions":18054,"falls":18055,"Ġrealizing":18056,"oen":18057,"ĠRV":18058,"ĠMog":18059,"Ġadvocating":18060,"ĠPepper":18061,"lived":18062,"ĠWick":18063,"Facebook":18064,"ĠSpect":18065,"Ġshout":18066,"Ġfractured":18067,"vet":18068,"Ġ1966":18069,"Ġcompensate":18070,"ĠVolume":18071,"Ġcategor":18072,"ĠHuntington":18073,"Free":18074,"OUGH":18075,"local":18076,"Sch":18077,"uti":18078,"Ġburger":18079,"Ġbush":18080,"Ġimpacting":18081,"Ġfrost":18082,"tti":18083,"ĠFresno":18084,"onz":18085,"shaw":18086,"ĠLibyan":18087,"Ġassert":18088,"ĠLegacy":18089,"ĠIE":18090,"ĠKinder":18091,"ĠHorizon":18092,"Ġtum":18093,"Ġsignaled":18094,"ĠFors":18095,"Ġspeedy":18096,"rang":18097,"ĠFT":18098,"Ġselecting":18099,"Ġpale":18100,"WD":18101,"Ġprobability":18102,"OUND":18103,"istrate":18104,"Ġsens":18105,"ocating":18106,"Ġinterpret":18107,"Ġpuzzle":18108,"Ġinland":18109,"Ġmanipulation":18110,"Sal":18111,"Ġfulfilling":18112,"ĠMcMaster":18113,"Make":18114,"jun":18115,"giving":18116,"ĠNiagara":18117,"Ġscholars":18118,"ALT":18119,"ĠSteam":18120,"omin":18121,"ĠSau":18122,"ĠDowning":18123,"Ġgy":18124,"ĠTit":18125,"ĠLav":18126,"ĠPepsi":18127,"Ġdumping":18128,"ĠDetect":18129,"ĠTDs":18130,"ĠKob":18131,"ĠSY":18132,"Ġpioneer":18133,"Ġ_":18134,"Ġclarified":18135,"ĠTests":18136,"opic":18137,"ĠMN":18138,"ĠBowman":18139,"umin":18140,"Ġwidow":18141,"Ġrallying":18142,"ĠPull":18143,"Ġprojection":18144,"Ġescalation":18145,"Ġlibraries":18146,"ĠFounder":18147,"ĠHugo":18148,"ĠStyle":18149,"Ġfreelance":18150,"Ġlisteners":18151,"Ġdiscovering":18152,"ĠPlans":18153,"Ġfranchises":18154,"ĠPam":18155,"Ġfarther":18156,"UI":18157,"opers":18158,"103":18159,"ublished":18160,"keys":18161,"aky":18162,"Ġinnov":18163,"¦":18164,"ĠDrum":18165,"Ġwraps":18166,"ĠCongressman":18167,"ĠVenus":18168,"fake":18169,"ĠBronx":18170,"ĠDinner":18171,"faced":18172,"Ġbackward":18173,"inge":18174,"Ġarsenal":18175,"ĠAce":18176,"uden":18177,"fre":18178,"Ġspa":18179,"ĠSaunders":18180,"ĠMatter":18181,"ĠSpons":18182,"Ġconsultations":18183,"ĠRuss":18184,"Ġsculpture":18185,"Ġuncommon":18186,"Nov":18187,"pg":18188,"otherapy":18189,"Ġgol":18190,"ĠBlazers":18191,"Ġadvises":18192,"ĠRegulatory":18193,"ĠBoyle":18194,"Äģ":18195,"Ġcuisine":18196,"Ġencouragement":18197,"yp":18198,"eny":18199,"ĠOrchestra":18200,"ĠChicken":18201,"Ġ1965":18202,"ĠPret":18203,"ĠCooperation":18204,"ĠDevices":18205,"ĠRodney":18206,"ĠHonduras":18207,"ĠEgg":18208,"Ġchurn":18209,"Ġclutch":18210,"ĠBernstein":18211,"Ġain":18212,"Ġformidable":18213,"ĠFacility":18214,"Ġpag":18215,"mons":18216,"bol":18217,"Ġliteracy":18218,"Ġsubmissions":18219,"ĠHulu":18220,"ĠConstitutional":18221,"ĠIsh":18222,"ĠPaula":18223,"olve":18224,"Ġabundance":18225,"ĠAla":18226,"ĠEcuador":18227,"Ġreconstruction":18228,"Ġcrush":18229,"reek":18230,"ĠÂŃ":18231,"ibo":18232,"Ġpracticed":18233,"Ġpac":18234,"rett":18235,"Ġpasta":18236,"Ġresp":18237,"ĠFlag":18238,"pal":18239,"Ġcommenting":18240,"Ġrecap":18241,"âĢĶâĢĶ":18242,"ĠToy":18243,"ĠMeredith":18244,"Ġreceipt":18245,"Ġseparating":18246,"ĠMap":18247,"Ġmogul":18248,"ĠBurlington":18249,"Ġger":18250,"Ġcoordinate":18251,"grad":18252,"Ġescalated":18253,"Ġproceeded":18254,"turned":18255,"Ġupt":18256,"hum":18257,"ĠWere":18258,"Whether":18259,"Ġenjoyable":18260,"energy":18261,"Ġprohibit":18262,"Ġhurdle":18263,"Ġdivorced":18264,"Ġcommentator":18265,"GT":18266,"ATH":18267,"Ġtravellers":18268,"Ġpopulated":18269,"ĠVo":18270,"ĠRebels":18271,"Ġspurred":18272,"Ġideological":18273,"Ġelephant":18274,"keyes":18275,"Pat":18276,"Ġlinger":18277,"Ġreps":18278,"Ġcocktails":18279,"ĠKristen":18280,"istically":18281,"Ġgunmen":18282,"Ġ1920":18283,"Ġquart":18284,"National":18285,"Ġexceptions":18286,"kat":18287,"priced":18288,"ĠHarold":18289,"ĠPistons":18290,"Ġcompounds":18291,"Ġmouse":18292,"Ġexhibits":18293,"ĠBurk":18294,"Ġclassmates":18295,"Ġcirculated":18296,"Ġattributable":18297,"ĠBaton":18298,"Ġorganizer":18299,"Ġdurable":18300,"Ġsingers":18301,"ĠOman":18302,"Ġhydrogen":18303,"Ġslash":18304,"Ġaccidental":18305,"ĠAbrams":18306,"KS":18307,"itty":18308,"Ġrust":18309,"Ġselections":18310,"porting":18311,"ĠEmanuel":18312,"XX":18313,"ĠThornton":18314,"Ġcolumns":18315,"Ġsentiments":18316,"fun":18317,"Ġplight":18318,"ĠSister":18319,"ĠMaggie":18320,"hya":18321,"Daniel":18322,"Ġplung":18323,"orio":18324,"ĠYorker":18325,"ĠSaturdays":18326,"Ġloc":18327,"aye":18328,"illon":18329,"ĠConsulting":18330,"pled":18331,"ĠZin":18332,"ĠFarms":18333,"ĠGiuliani":18334,"ĠMIN":18335,"ĠHanson":18336,"ĠComplete":18337,"ourke":18338,"oche":18339,"ĠJord":18340,"Ġprofessors":18341,"ĠWILL":18342,"ĠCron":18343,"Ġdorm":18344,"Ġcracking":18345,"tur":18346,"ORS":18347,"Ant":18348,"Ġdeduction":18349,"ĠSIM":18350,"igue":18351,"ĠValent":18352,"ĠEthereum":18353,"ĠSunny":18354,"ĠExtra":18355,"ivan":18356,"ĠFo":18357,"Ġleases":18358,"ibe":18359,"Ġ1800":18360,"Ġslapped":18361,"emaker":18362,"Ġfa":18363,"rien":18364,"ĠPeriod":18365,"ĠES":18366,"ĠBlu":18367,"Ġpreserving":18368,"Ġsmarter":18369,"mans":18370,"Ġgest":18371,"zu":18372,"nu":18373,"Ġdivest":18374,"roc":18375,"ĠFlood":18376,"Given":18377,"ĠNorton":18378,"Ġgranting":18379,"Ġdealings":18380,"Ġgeographic":18381,"esa":18382,"Ġcub":18383,"Ġcriticizing":18384,"ĠCub":18385,"Ġsurroundings":18386,"ĠInternal":18387,"Ġsle":18388,"Ġcrushing":18389,"ĠPP":18390,"izations":18391,"ĠAbdel":18392,"Joe":18393,"ĠVisitors":18394,"ĠCarly":18395,"INGTON":18396,"ĠGC":18397,"ĠWB":18398,"Ġgently":18399,"·":18400,"though":18401,"ĠAlto":18402,"Ġresting":18403,"ĠPerson":18404,"ĠTon":18405,"Ġbore":18406,"ĠClar":18407,"Ġmot":18408,"Ġbathrooms":18409,"ĠTypically":18410,"Ġdisconnect":18411,"Ġtightly":18412,"ĠHarvest":18413,"ĠHed":18414,"ĠGermans":18415,"atar":18416,"Ġkeynote":18417,"Ġimproper":18418,"fil":18419,"Ġintens":18420,"iev":18421,"Ġmedi":18422,"Ġtenant":18423,"Ġfootsteps":18424,"uli":18425,"Ġlegalization":18426,"106":18427,"ĠLexington":18428,"folio":18429,"Ġ½":18430,"ĠRita":18431,"Ġbattered":18432,"inka":18433,"ĠJavaScript":18434,"ĠMusical":18435,"ĠTalent":18436,"Ġlounge":18437,"Ġintimidation":18438,"ikh":18439,"ĠFam":18440,"Ġtherapeutic":18441,"Ġbalancing":18442,"Ġrocky":18443,"liners":18444,"ĠPredators":18445,"Ġregistering":18446,"Ġdiligence":18447,"ĠRover":18448,"ĠDot":18449,"Ġterminated":18450,"ĠEdu":18451,"Ġcharming":18452,"ĠPLAY":18453,"ĠFact":18454,"ĠCi":18455,").\"":18456,"ĠWrestle":18457,"hun":18458,"Ġopenings":18459,"Ġfou":18460,"Ġ126":18461,"spe":18462,"ĠAW":18463,"Ġbud":18464,"ĠTemper":18465,"ĠOrthodox":18466,"Ġprogressed":18467,"tre":18468,"Ġtasting":18469,"Ġscrutin":18470,"ĠLima":18471,"Ġlayout":18472,"Ġlitter":18473,"ijk":18474,"ĠParkinson":18475,"ĠAnfield":18476,"Ġdevelopmental":18477,"Ġheaven":18478,"ĠWoodward":18479,"index":18480,"Ġpistol":18481,"Ġreson":18482,"ĠWS":18483,"Ġemb":18484,"ĠLap":18485,"ĠPle":18486,"lington":18487,"ĠSit":18488,"Ġabruptly":18489,"ĠSenegal":18490,"ĠYates":18491,"aceutical":18492,"ĠJak":18493,"ĠHastings":18494,"iste":18495,"ĠDB":18496,"ĠAgent":18497,"Ġpreservation":18498,"ĠLank":18499,"ĠSuffolk":18500,"Ġboo":18501,"essed":18502,"Ġempowering":18503,"enne":18504,"Ġrecycled":18505,"Ġstrateg":18506,"Ġbrake":18507,"135":18508,"ĠStef":18509,"ĠFlake":18510,"ĠGregg":18511,"ĠRent":18512,"Ġinstallment":18513,"FW":18514,"ĠCran":18515,"obo":18516,"ml":18517,"ĠJade":18518,"Ġaccuses":18519,"ĠNvidia":18520,"Ġburg":18521,"High":18522,"Ġbothered":18523,"ĠBenn":18524,"Ġinterrupted":18525,"Ġtrek":18526,"Ġserv":18527,"Ġpatron":18528,"Ġdictator":18529,"owa":18530,"jad":18531,"ĠTulsa":18532,"Ġboil":18533,"Ġdisplaying":18534,"Ġcinem":18535,"awaited":18536,"¸":18537,"Ġreacts":18538,"ĠDee":18539,"ĠGron":18540,"igation":18541,"Ġservic":18542,"capt":18543,"Ġinsane":18544,"ĠVeteran":18545,"umen":18546,"End":18547,"ĠCream":18548,"Ġextremism":18549,"ĠMalone":18550,"Col":18551,"Ġsafeguard":18552,"Ġtomatoes":18553,"die":18554,"Ġchamp":18555,"zero":18556,"ĠPRES":18557,"Ġchoir":18558,"Ġpediatric":18559,"Ġprivileged":18560,"Ġdownstream":18561,"Business":18562,"ĠFighting":18563,"atable":18564,"Ġsums":18565,"Ġinsult":18566,"arten":18567,"ĠWikiLeaks":18568,"Ġpads":18569,"Ġretali":18570,"ĠHunts":18571,"Ġindie":18572,"ĠShields":18573,"ĠMortgage":18574,"oses":18575,"ampton":18576,"ĠVideos":18577,"ĠPER":18578,"itionally":18579,"ĠKimmel":18580,"sum":18581,"trade":18582,"acity":18583,"marked":18584,"ĠAngus":18585,"Ġtemper":18586,"Ġseizure":18587,"Ġfictional":18588,"utton":18589,"eva":18590,"Rs":18591,"Ġintra":18592,"ĠRequest":18593,"ppe":18594,"ĠeBay":18595,"ĠUSS":18596,"Ġ1500":18597,"Ġpossessing":18598,"Ġbacon":18599,"ĠSexual":18600,"ĠBuff":18601,"Ġslaughter":18602,"Ġjur":18603,"zhou":18604,"suit":18605,"ĠCha":18606,"ĠBuk":18607,"crime":18608,"ĠEasy":18609,"ĠChain":18610,"aq":18611,"ĠPall":18612,"flation":18613,"225":18614,"oup":18615,"109":18616,"ĠMcKenzie":18617,"Ġclearer":18618,"ĠDogs":18619,"oration":18620,"Ġsubs":18621,"Follow":18622,"ĠShirley":18623,"Ġadjusting":18624,"ĠEFF":18625,"Ġflipped":18626,"Ġconform":18627,"ĠLaurent":18628,"Ġcircular":18629,"ĠNOR":18630,"Ġmort":18631,"Ġtexture":18632,"avour":18633,"Ġflex":18634,"ĠHedge":18635,"ðŁĺ":18636,"Ġtrophies":18637,"ĠINV":18638,"Ġboast":18639,"ĠTyr":18640,"ĠNichols":18641,"ĠSpa":18642,"Ġcheered":18643,"Ġprey":18644,"reach":18645,"Ġbreached":18646,"ĠRegions":18647,"ĠLyft":18648,"ĠTul":18649,"ĠKore":18650,"Ġendure":18651,"ĠCover":18652,"\").":18653,"ĠSavage":18654,"ère":18655,"reens":18656,"Ġnic":18657,"sector":18658,"Ġweaknesses":18659,"Ġreboot":18660,"Ġ210":18661,"Ġimagery":18662,"ĠFrem":18663,"Ġclue":18664,"ĠLars":18665,"Ġfaction":18666,"hetic":18667,"Ġallied":18668,"ĠMarvin":18669,"Ġmethodology":18670,"ĠTN":18671,"Ġutter":18672,"Ġ270":18673,"ĠVolvo":18674,"oline":18675,"ĠACLU":18676,"Ġindirect":18677,"Ġminer":18678,"ĠBale":18679,"ĠStrange":18680,"ĠFuller":18681,"Ġexpelled":18682,"ĠTropical":18683,"Ġremotely":18684,"ĠTIM":18685,"Ġinnocence":18686,"Ġconfined":18687,"Ġfares":18688,"Ġprevalent":18689,"Ġdesp":18690,"House":18691,"azar":18692,"Ġgestures":18693,"ĠCES":18694,"ĠDM":18695,"eal":18696,"ĠÐ":18697,"Ġburnt":18698,"Ġframed":18699,"ĠDani":18700,"Ġhol":18701,"ĠCannes":18702,"ĠHayden":18703,"Ġwardrobe":18704,"ĠAssange":18705,"ĠSamp":18706,"bay":18707,"sky":18708,"ĠHence":18709,"ĠGrizzlies":18710,"rates":18711,"laws":18712,"ĠMandela":18713,"ĠHoover":18714,"rics":18715,"charged":18716,"Ġexclude":18717,"Ġpassive":18718,"Ġcontinuation":18719,"Ġblunt":18720,"Ġvac":18721,"ĠEmerging":18722,"rench":18723,"tv":18724,"ĠHollow":18725,"ĠOC":18726,"Ġadvisors":18727,"Ġrendered":18728,"ĠBernardino":18729,"ĠSupporters":18730,"ronic":18731,"Ġchancellor":18732,"Ġ1963":18733,"Ġuranium":18734,"Ġak":18735,"ĠOptions":18736,"ermott":18737,"ĠBerger":18738,"ibia":18739,"Ġexplosions":18740,"Ġimpairment":18741,"Ġhail":18742,"Ġalley":18743,"Ġcruelty":18744,"ĠClarence":18745,"Ġvariations":18746,"Ġrealm":18747,"Ġrenovations":18748,"ĠNorwich":18749,"Ġbelongings":18750,"Ġmerchants":18751,"ĠMinisters":18752,"ĠDodd":18753,"Ġviewer":18754,"Ġneutrality":18755,"quer":18756,"ĠPrinceton":18757,"dead":18758,"arest":18759,"GET":18760,"ĠCanadiens":18761,"ĠIgn":18762,"clear":18763,"Mal":18764,"ĠBridges":18765,"ĠHayward":18766,"Ġremarked":18767,"ingle":18768,"Ġsob":18769,"Ġdepart":18770,"beans":18771,"Ġpreserved":18772,"ĠFairfax":18773,"Ġforgot":18774,"ĠBeh":18775,"Rob":18776,"Ġcooperative":18777,"ullah":18778,"Ġmates":18779,"Ġrang":18780,"Ġthigh":18781,"Ġabducted":18782,"Ġchaired":18783,"ĠHearts":18784,"Ġidentifies":18785,"ĠBuckingham":18786,"ijn":18787,"ĠJab":18788,"Ġclashed":18789,"feed":18790,"sites":18791,"ĠCareer":18792,"exp":18793,"ĠBuccaneers":18794,"scape":18795,"Ġupdating":18796,"Ġintentional":18797,"ĠGuam":18798,"ĠBreakfast":18799,"ĠHag":18800,"Media":18801,"Ġtapping":18802,"Ġpics":18803,"Ġeaten":18804,"Ġpremise":18805,"Kim":18806,"ĠStorage":18807,"Ġextensively":18808,"Ġoutrageous":18809,"ĠSadly":18810,"Global":18811,"¢":18812,"leaning":18813,"CM":18814,"Ġeasiest":18815,"ument":18816,"Ġ122":18817,"Ġdaunting":18818,"ISE":18819,"Ġsunset":18820,"Ġreset":18821,"Ġbent":18822,"Trust":18823,"ĠCaleb":18824,"ĠRut":18825,"ĠBast":18826,"ETS":18827,"iencies":18828,"Ġpu":18829,"ature":18830,"Ġrealities":18831,"omi":18832,"Ġsoda":18833,"Ġunveil":18834,"ĠGoldberg":18835,"opes":18836,"Ġuprising":18837,"ĠMR":18838,"Ġendorse":18839,"Ġsail":18840,"Ġconverting":18841,"Ġglamorous":18842,"ĠHollande":18843,"108":18844,"isky":18845,"Ġcushion":18846,"240":18847,"Ġadventures":18848,"Ġantitrust":18849,"ĠStockholm":18850,"pace":18851,"ĠVald":18852,"ĠTransfer":18853,"ERT":18854,"ĠMcInt":18855,"Ġsurging":18856,"ogn":18857,"Ġlauded":18858,"ĠZam":18859,"ĠRough":18860,"TOR":18861,"Ġwed":18862,"Ġorigins":18863,"ĠEld":18864,"oso":18865,"Ġsupplying":18866,"ĠPetty":18867,"ĠTwe":18868,"ĠDenise":18869,"ĠBec":18870,"Ġbehave":18871,"Ġ121":18872,"estone":18873,"ĠBoulder":18874,"ĠBlackhawks":18875,"ĠWyatt":18876,"Ġfiguring":18877,"ĠDeborah":18878,"agi":18879,"significant":18880,"Ġasthma":18881,"Ġmessy":18882,"mpire":18883,"Ġax":18884,"Ġaspiring":18885,"ĠNH":18886,"ĠGina":18887,"heavy":18888,"ĠVick":18889,"ÃŃs":18890,"something":18891,"Ġbodily":18892,"Ġunauthorized":18893,"ĠActually":18894,"ĠOH":18895,"Ġmicrophone":18896,"allah":18897,"Ġrampant":18898,"Ġrelocated":18899,"Ġwidening":18900,"ĠCait":18901,"nel":18902,"ĠBlackBerry":18903,"Ġprofessionally":18904,"ĠInterestingly":18905,"Ġbarbecue":18906,"Ġresisting":18907,"ĠNunes":18908,"disc":18909,"Ġgroundbreaking":18910,"orable":18911,"ĠRegulation":18912,"Ġborrowed":18913,"Ġleaking":18914,"Ġlengths":18915,"Ġunveiling":18916,"houses":18917,"Ġ155":18918,"ĠBillboard":18919,"icion":18920,"Times":18921,"ĠZoe":18922,"ĠAbby":18923,"bus":18924,"ĠMinutes":18925,"ributed":18926,"Ġparap":18927,"Ġfertil":18928,"ABC":18929,"ĠIsle":18930,"Ġtherapist":18931,"Ġgubernatorial":18932,"ĠAust":18933,"ĠLoan":18934,"Bo":18935,"ĠNRL":18936,"rag":18937,"Clear":18938,"Ġrevision":18939,"Ġflesh":18940,"BD":18941,"iji":18942,"Ġproductions":18943,"Ġcoconut":18944,"ĠMcCorm":18945,"ĠDash":18946,"Ġgeography":18947,"hearted":18948,"Ġarson":18949,"Ġgoaltender":18950,"Ġbelly":18951,"Ġqualifications":18952,"ĠActiv":18953,"Ġhooked":18954,"ĠHungarian":18955,"Ġprotocols":18956,"inking":18957,"Ġfronts":18958,"ĠKuala":18959,"ĠToys":18960,"ĠFitness":18961,"Ġwarfare":18962,"Ġoutp":18963,"ĠQuestions":18964,"Ġwel":18965,"ĠShan":18966,"ĠMorton":18967,"ĠRomero":18968,"Ġglance":18969,"ĠTay":18970,"Ġsneakers":18971,"ĠSymphony":18972,"Ġinspect":18973,"enna":18974,"Nobody":18975,"Ġscrapped":18976,"ĠDeVos":18977,"ĠDominican":18978,"Ġplanets":18979,"anova":18980,"Ġnotify":18981,"Ġincurred":18982,"Ġunders":18983,"Ġdetainees":18984,"ĠMarriott":18985,"electric":18986,"ĠKes":18987,"union":18988,"ĠWatt":18989,"ATING":18990,"Ġslipping":18991,"Ġraft":18992,"Ġresisted":18993,"Ġcred":18994,"tern":18995,"Ġflurry":18996,"Line":18997,"Ġconsulted":18998,"Ġanalyzing":18999,"107":19000,"ĠWide":19001,"¶":19002,"human":19003,"ĠFEMA":19004,"Ġsmash":19005,"Ġcorps":19006,"Ġbarric":19007,"Ġcollar":19008,"ĠTB":19009,"without":19010,"ĠCanucks":19011,"Ġneedle":19012,"ĠSidney":19013,"ĠLauderdale":19014,"Ġglove":19015,"ilee":19016,"pic":19017,"Ġbenef":19018,"ĠHydro":19019,"ĠDisc":19020,"ĠArg":19021,"Ġtermin":19022,"Ġsympath":19023,"Ġpest":19024,"ĠCoff":19025,"Ġadvancement":19026,"social":19027,"pol":19028,"ĠEmails":19029,"Ġstacked":19030,"ibly":19031,"ĠAlbion":19032,"Ġfist":19033,"hero":19034,"ĠMarian":19035,"asia":19036,"Ġtownship":19037,"Ġslick":19038,"Ġmodeling":19039,"achers":19040,"ĠArgent":19041,"ĠSUN":19042,"arde":19043,"Ġpinned":19044,"Ġhitters":19045,"Ġdare":19046,"ictions":19047,"arily":19048,"Ġsting":19049,"Ġprimaries":19050,"appointed":19051,"Ġformats":19052,"Ġglitter":19053,"Ġpatches":19054,"Ġstrategically":19055,"Ġaka":19056,"Ġyielded":19057,"BY":19058,"Ġjeopard":19059,"ĠVand":19060,"Ġcrowned":19061,"Ġoccupants":19062,"Ġtanker":19063,"ĠVisa":19064,"Great":19065,"Ġseasoned":19066,"ĠAviv":19067,"Ġfiery":19068,"Ġderivatives":19069,"Ġdiverted":19070,"Ġacqu":19071,"Ġsandwiches":19072,"ĠLorenzo":19073,"Ġpardon":19074,"ĠBarber":19075,"ĠAgricultural":19076,"ĠPhilly":19077,"Ġregrets":19078,"ĠMillions":19079,"ĠFrazier":19080,"Ġtreasury":19081,"ĠKenn":19082,"Ġdestined":19083,"olved":19084,"Back":19085,"leader":19086,"lyss":19087,"ĠReyes":19088,"001":19089,"bags":19090,"ĠStandards":19091,"ĠExcellence":19092,"ĠMaid":19093,"ĠAnthem":19094,"FIELD":19095,"Ġrevived":19096,"ĠQuad":19097,"Ġdistinguished":19098,"Ġweighted":19099,"Ġritual":19100,"Ġinvites":19101,"wana":19102,"iture":19103,"ĠCI":19104,"ĠMAY":19105,"Ġunfairly":19106,"ĠKP":19107,"ĠMidlands":19108,"Ġmint":19109,"uers":19110,"Ġcatalog":19111,"arant":19112,"Ġlosers":19113,"Ġscheduling":19114,"esar":19115,"Ġtransferring":19116,"Ġbankrupt":19117,"Ġmethamphetamine":19118,"ĠEsk":19119,"ĠTreatment":19120,"ĠResponse":19121,"Ġhomework":19122,"ĠBald":19123,"Ġembarrassment":19124,"Ġpoorest":19125,"ĠPlatinum":19126,"ĠFac":19127,"Ġunleashed":19128,"Ġbrighter":19129,"002":19130,"Ġdisl":19131,"ĠLowry":19132,"ived":19133,"ĠDemon":19134,"ĠNonetheless":19135,"arro":19136,"ĠCONT":19137,"ifted":19138,"ĠFreder":19139,"isson":19140,"Ġrout":19141,"ARA":19142,"Ġswinging":19143,"Oct":19144,"Ġliable":19145,"Ġleaning":19146,"Ġlungs":19147,"380":19148,"ĠProcess":19149,"ĠCov":19150,"terrorism":19151,"Ġresistant":19152,"Ġpumped":19153,"Ġtripled":19154,"Semitism":19155,"ĠMia":19156,"Ġpenetration":19157,"ĠLutheran":19158,"BU":19159,"odes":19160,"Ġspanning":19161,"utch":19162,"Trans":19163,"ĠVolunteers":19164,"Ġpathway":19165,"Ġinfectious":19166,"Ġdrastic":19167,"ĠEngineers":19168,"Ġprincess":19169,"acts":19170,"usting":19171,"utive":19172,"achel":19173,"DO":19174,"Ġpave":19175,"ĠHerrera":19176,"Ġnearing":19177,"help":19178,"Ġembarked":19179,"Ġmodes":19180,"ĠDriving":19181,"Ġopting":19182,"Best":19183,"Ġbehavioral":19184,"Ġcables":19185,"App":19186,"otion":19187,"ĠExt":19188,"ĠSinclair":19189,"ĠInsp":19190,"Ġsinking":19191,"Next":19192,"ĠLumpur":19193,"ĠShadow":19194,"Donald":19195,"itals":19196,"Ġmentions":19197,"floor":19198,"Ġconsiderations":19199,"ĠSquad":19200,"ĠPlate":19201,"dos":19202,"Friday":19203,"Hopefully":19204,"arre":19205,"Ġalum":19206,"\":\"/":19207,"Ġfet":19208,"anza":19209,"Ġdign":19210,"ĠNguyen":19211,"ĠRutgers":19212,"ĠSew":19213,"Ġfilters":19214,"ofi":19215,"Ġunavailable":19216,"ranking":19217,"Ġrefining":19218,"ĠUNC":19219,"Ġmax":19220,"yll":19221,"Ġhandsome":19222,"Ġutterly":19223,"See":19224,"ĠStores":19225,"Ke":19226,"ĠAdvoc":19227,"ordon":19228,"umbles":19229,"Ġbugs":19230,"olar":19231,"ĠCork":19232,"Ġtoken":19233,"Ġauthorization":19234,"Ġconscience":19235,"Ġrepl":19236,"edi":19237,"owitz":19238,"iven":19239,"Ġlieu":19240,"Ġlifts":19241,"Lean":19242,"Ġmagnificent":19243,"ĠFilms":19244,"onents":19245,"Ġ***":19246,"Green":19247,"ĠAdvocate":19248,"ĠArrow":19249,"Ġblows":19250,"Ġexploited":19251,"fly":19252,"ĠAmar":19253,"ĠNOTICE":19254,"Ġsincere":19255,"found":19256,"ĠRud":19257,"Ġcy":19258,"ĠHeidi":19259,"Ġempowered":19260,"Ġweakest":19261,"ĠKru":19262,"Credit":19263,"aunted":19264,"Ġexotic":19265,"aning":19266,"Ġaw":19267,"ĠMulti":19268,"Ġanimation":19269,"850":19270,"ĠCounter":19271,"ĠNit":19272,"alli":19273,"Ġcapitalize":19274,"Ġexecuting":19275,"Ġdescent":19276,"ovi":19277,"ĠKimberly":19278,"headed":19279,"Ġmentioning":19280,")-":19281,"ĠSpecifically":19282,"ayette":19283,"ihad":19284,"ĠIss":19285,"Ġdisagreed":19286,"ĠKum":19287,"Ġurges":19288,"Ġpermitting":19289,"Ġpy":19290,"isp":19291,"Ġhygiene":19292,"Ġmourning":19293,"Ġcyclists":19294,"cats":19295,"FER":19296,"cycl":19297,"Ġnewcomers":19298,"Ġplead":19299,"Ġmend":19300,"secret":19301,"fan":19302,"Ġtranslates":19303,"unit":19304,"ĠTank":19305,"drive":19306,"ĠSite":19307,"Ġacceleration":19308,"ĠEnrique":19309,"ĠElaine":19310,"Ġstaring":19311,"Ġbackwards":19312,"Ġot":19313,"Ġvot":19314,"ĠHK":19315,"Ġfian":19316,"ĠLockheed":19317,"Ġmanifest":19318,"ĠZurich":19319,"pad":19320,"ĠRav":19321,"flow":19322,"Ġmoms":19323,"ĠSolid":19324,"ĠReady":19325,"aughlin":19326,"Ġreminding":19327,"ĠCOR":19328,"Ġoptimal":19329,"ĠCrisis":19330,"Ġcholesterol":19331,"ĠGerard":19332,"Ġfest":19333,"Ġsanction":19334,"Ġdragging":19335,"inent":19336,"ĠBravo":19337,"Ġamend":19338,"aval":19339,"Ġpoem":19340,"Ġinvasive":19341,"Ġlandsc":19342,"leigh":19343,"Ġheadache":19344,"ĠMuse":19345,"ĠTurning":19346,"girl":19347,"cess":19348,"Ġfalsely":19349,"Ġplaintiff":19350,"Ġheavier":19351,"Ġrumored":19352,"Ġeleven":19353,"ĠConsumers":19354,"ĠOriginally":19355,"ĠStatement":19356,"bors":19357,"Ġrevoked":19358,"ĠOmaha":19359,"Fox":19360,"ĠKle":19361,"Ġvault":19362,"Ġoutdated":19363,"umes":19364,"ĠArk":19365,"Ġapologised":19366,"Ġrockets":19367,"ĠMarines":19368,"Ġcaptures":19369,"ĠMW":19370,"ĠWalters":19371,"ĠFactor":19372,"Ġensuing":19373,"ĠSession":19374,"oons":19375,"Ġ132":19376,"gt":19377,"ĠPoints":19378,"Ġexhaust":19379,"ĠOsaka":19380,"heed":19381,"Ġhandic":19382,"amber":19383,"inging":19384,"Ġll":19385,"Ġescorted":19386,"Ġfloated":19387,"Ġmerge":19388,"Ġcompliment":19389,"ĠVC":19390,"Ġinsulin":19391,"ĠDebt":19392,"ça":19393,"Ġpens":19394,"Ġassertion":19395,"Ġredevelopment":19396,"moderate":19397,"Ġleftist":19398,"ĠBA":19399,"Ġherd":19400,"Ġinsecurity":19401,"liter":19402,"Ġcommence":19403,"ĠCaucus":19404,"Ġnovels":19405,"ĠChevron":19406,"Ġerosion":19407,"ĠNicholson":19408,"ĠRoof":19409,"ĠVolunteer":19410,"Ġcompelled":19411,"Ġcongratulated":19412,"ĠPanel":19413,"Ġov":19414,"idelity":19415,"Ġspect":19416,"Ġbee":19417,"ĠAssistance":19418,"Ġterrified":19419,"iew":19420,"Ġweekday":19421,"ĠHiggins":19422,"special":19423,"ubs":19424,"anton":19425,"Ġbribes":19426,"Ġneat":19427,"ĠCliff":19428,"Ġdisqualified":19429,"ĠND":19430,"Ġvers":19431,"andra":19432,"Ġgraft":19433,"value":19434,"Ġportray":19435,"Ġdaytime":19436,"ksh":19437,"Ġconsist":19438,"Ġhonesty":19439,"ĠTimber":19440,"ĠNich":19441,"Ġinvented":19442,"ĠBuch":19443,"Ġskull":19444,"Ġtags":19445,"Ġ124":19446,"ighth":19447,"Ġrelaxing":19448,"Online":19449,"Ġsanctioned":19450,"Sport":19451,"ĠCove":19452,"Ġcomics":19453,"MW":19454,"AMA":19455,"mother":19456,"Home":19457,"ĠCustomer":19458,"Ġstrides":19459,"ĠWins":19460,"Ġrollout":19461,"ĠWeaver":19462,"Ġshuttle":19463,"Ġsteak":19464,"Ġglorious":19465,"ĠToll":19466,"Ġtrustee":19467,"Ġinstallations":19468,"ĠOpportunity":19469,"Ġoper":19470,"horse":19471,"Ġaided":19472,"irus":19473,"Ġsleek":19474,"Ġyelled":19475,"ĠSocialist":19476,"Ġapplaud":19477,"ĠWah":19478,"Ġdevote":19479,"Ġdh":19480,"Ġarchitectural":19481,"ĠMAC":19482,"centric":19483,"ĠSense":19484,"illas":19485,"ĠArchbishop":19486,"glass":19487,"Ġallowance":19488,"Ġbundle":19489,"andon":19490,"eight":19491,"ĠKare":19492,"haus":19493,"ĠAndreas":19494,"Ġdoll":19495,"RAM":19496,"Ġvolunteering":19497,"ĠRaleigh":19498,"Ġbees":19499,"Ġnickel":19500,"Ġgenerosity":19501,"Ġhomeowner":19502,"ĠLieutenant":19503,"Ġlandfall":19504,"ĠRenew":19505,"ĠGiving":19506,"ĠContribut":19507,"aret":19508,"ulf":19509,"Ġreinforce":19510,"ĠSalv":19511,"ĠVenice":19512,"Ġfreedoms":19513,"ĠTools":19514,"Ġ1962":19515,"ĠWarm":19516,"majority":19517,"Ġpleas":19518,"oding":19519,"plant":19520,"Ġtow":19521,"ĠBlanc":19522,"ĠPipeline":19523,"ĠMoor":19524,"Ġrefrain":19525,"ĠExplore":19526,"language":19527,"cers":19528,"ĠWT":19529,"sent":19530,"ĠNun":19531,"Ġplastics":19532,"acas":19533,"Ġdisruptions":19534,"Ġdiscomfort":19535,"enko":19536,"Ġimprisoned":19537,"Copyright":19538,"Ġmyriad":19539,"Ġparenting":19540,"Ġspree":19541,"NBC":19542,"Ġonion":19543,"ĠIsraelis":19544,"ĠRA":19545,"Ġrelocate":19546,"113":19547,"ĠHir":19548,"ĠDre":19549,"ĠDry":19550,"ĠONE":19551,"ĠAdministrator":19552,"Ġprints":19553,"ĠGret":19554,"Ġundergraduate":19555,"ĠLif":19556,"avers":19557,"ĠCarney":19558,"Ġapex":19559,"Ġlenses":19560,"Ġliberals":19561,"gb":19562,"ĠWhereas":19563,"Ġcountryside":19564,"amine":19565,"ĠTerminal":19566,"Ġintr":19567,"ĠTrey":19568,"ALS":19569,"Ġcontinental":19570,"Ġselfies":19571,"FILE":19572,"ĠUnity":19573,"Ġauthoritarian":19574,"Ġoriginated":19575,"ĠExcept":19576,"yna":19577,"Ġmonet":19578,"Ġundermining":19579,"ĠGS":19580,"pi":19581,"iq":19582,"Ġslides":19583,"ĠSummary":19584,"Ġpains":19585,"cluding":19586,"Ġequation":19587,"locked":19588,"Ġfraternity":19589,"Ġwithstand":19590,"Ġdevastation":19591,"Ġdemo":19592,"late":19593,"Ġpunches":19594,"Ġgeared":19595,"nen":19596,"ĠBowie":19597,"attle":19598,"Ġpolitic":19599,"ĠGle":19600,"mented":19601,"ĠCoordinator":19602,"Ġupwards":19603,"ĠMega":19604,"angled":19605,"Ġengineered":19606,"Ġluggage":19607,"ĠWen":19608,"ĠSergeant":19609,"Ġkindergarten":19610,"ĠPortsmouth":19611,"uddin":19612,"ket":19613,"oba":19614,"Ġoscill":19615,"esse":19616,"ĠOlson":19617,"ĠBorough":19618,"Ġsupplements":19619,"ĠEvening":19620,"ANE":19621,"Ġlava":19622,"Ġgearing":19623,"setting":19624,"urgical":19625,"asty":19626,"ĠDaytona":19627,"Ġbrewery":19628,"Ġpledges":19629,"rounder":19630,"ulous":19631,"ĠHancock":19632,"rex":19633,"Ġram":19634,"Ġproceeding":19635,"ĠMurdoch":19636,"Ġdowngrade":19637,"Ġstatues":19638,"Ġdebated":19639,"ĠSleep":19640,"Ġ144":19641,"ĠRuby":19642,"ĠFi":19643,"123":19644,"ĠArabic":19645,"Ġlasts":19646,"ĠIvy":19647,"ĠWid":19648,"rown":19649,"stick":19650,"?'\"":19651,"ĠSTEM":19652,"Ġsensible":19653,"htar":19654,"Ġharbor":19655,"Ġcra":19656,"ĠAlbum":19657,"ĠCarnival":19658,"Ġimplies":19659,"agement":19660,"ĠInitially":19661,"Ġchooses":19662,"Jeff":19663,"ĠHig":19664,"Ġtam":19665,"Ġlump":19666,"ucks":19667,"Ġrepatri":19668,"ĠMercy":19669,"zza":19670,"Ġ365":19671,"ĠRicardo":19672,"ogram":19673,"Ġundergone":19674,"system":19675,"Ġtel":19676,"ĠKee":19677,"ully":19678,"istas":19679,"Ġgrains":19680,"ĠTomorrow":19681,"ĠRC":19682,"ĠTurk":19683,"Ġfreshmen":19684,"ĠAway":19685,"ĠSach":19686,"ĠUltimate":19687,"Ġoffensively":19688,"ismo":19689,"Ġteaser":19690,"ĠJud":19691,"Ġlegitimacy":19692,"opt":19693,"ĠCobb":19694,"Ġrejecting":19695,"ĠSolo":19696,"ĠArcher":19697,"Ġsoutheastern":19698,"ĠPlain":19699,"ĠLoss":19700,"Ġminerals":19701,"ĠMari":19702,"Ġscrambling":19703,"ĠPeak":19704,"Ġhavoc":19705,"rings":19706,"Ġunofficial":19707,"ĠHaj":19708,"director":19709,"ĠCanal":19710,"ĠNSA":19711,"ĠEaton":19712,"ĠPART":19713,"ĠCommissioners":19714,"Ġwellbeing":19715,"resa":19716,"Ġunderstandable":19717,"dates":19718,"ĠSorry":19719,"Ġastonishing":19720,"Ġrevise":19721,"ĠEc":19722,"ĠLack":19723,"endi":19724,"endale":19725,"also":19726,"Ġcolder":19727,"Ġheel":19728,"Ġcellular":19729,"Conn":19730,"ĠThur":19731,"Ġmassage":19732,"olla":19733,"clus":19734,"Ġtoilets":19735,"ĠCelebr":19736,"Ġtackled":19737,"Ġchorus":19738,"ETA":19739,"anca":19740,"ĠOLED":19741,"Ġpunk":19742,"ĠBrain":19743,"ĠNuggets":19744,"Ġseamless":19745,"make":19746,"atted":19747,"ĠRog":19748,"ĠPatch":19749,"Ġruined":19750,"Ins":19751,"Ġconsolidate":19752,"Ġgospel":19753,"ĠCaption":19754,"Ġoverweight":19755,"Ġscreened":19756,"ĠKraft":19757,"ĠBain":19758,"breaker":19759,"ĠFeinstein":19760,"ĠDoc":19761,"Ġdeepest":19762,"ĠOL":19763,"Ġtunes":19764,"Ġrightly":19765,"ĠLanc":19766,"ĠBrotherhood":19767,"Ġpoultry":19768,"ĠPure":19769,"Ġstimulate":19770,"Ġdiscourse":19771,"ĠStark":19772,"Ġmuseums":19773,"ention":19774,"Ġtaxation":19775,"ĠAkron":19776,"ayer":19777,"ĠKirby":19778,"farm":19779,"oser":19780,"Ġcommend":19781,"Ġunarmed":19782,"ensions":19783,"Ġsuperst":19784,"Ġoceans":19785,"Ġmisuse":19786,"LO":19787,"ĠByrne":19788,"ĠMaritime":19789,"Ġdense":19790,"Ġexcuses":19791,"Ġsuppose":19792,"ĠMarks":19793,"Ġrainy":19794,"Ġreplicate":19795,"Ġboutique":19796,"ĠRenaissance":19797,"jas":19798,"icted":19799,"Ġreferenced":19800,"ĠTir":19801,"ĠHatch":19802,"ĠCry":19803,"ĠPayPal":19804,"Ġfulfil":19805,"ĠHawaiian":19806,"come":19807,"ĠThirty":19808,"Ġ260":19809,"ĠYak":19810,"Ġangles":19811,"Ġlandlord":19812,"Ġlavish":19813,"Women":19814,"ĠNT":19815,"Ġreinforced":19816,"Ġprevail":19817,"ĠCommunities":19818,"Ġfootwear":19819,"Ġassurances":19820,"Ġlb":19821,"Ġairing":19822,"Ġresorts":19823,"ĠFiji":19824,"ĠShay":19825,"Ġprevailing":19826,"many":19827,"Ġimpe":19828,"ĠDul":19829,"Ġsymbols":19830,"zb":19831,"ĠCere":19832,"Ġapplauded":19833,"Ġsoundtrack":19834,"Ġdrunken":19835,"ĠEuropeans":19836,"Ġherds":19837,"moving":19838,"WR":19839,"ĠHindi":19840,"Ġwaking":19841,"Jo":19842,"Andrew":19843,"rosse":19844,"ĠLegislative":19845,"Ġdisgrace":19846,"Nothing":19847,"ĠBulgaria":19848,"Ġhumidity":19849,"Ġtranslation":19850,"Ġmeasurements":19851,"Ġvying":19852,"ĠBrid":19853,"Max":19854,"Ġdir":19855,"unci":19856,"Ġdefines":19857,"Ġperfection":19858,"ancers":19859,"Matt":19860,"ĠShinzo":19861,"ĠPresidents":19862,"Ġginger":19863,"onna":19864,"existing":19865,"rika":19866,"enced":19867,"ĠBray":19868,"Ġgall":19869,"Ġdisrespect":19870,"ĠCumber":19871,"Ġcontestant":19872,"ucky":19873,"anticipated":19874,"abled":19875,"LLOW":19876,"Bel":19877,"ĠKear":19878,"Ġstoryline":19879,"Ġrigs":19880,"ĠScots":19881,"ĠChap":19882,"ĠThankfully":19883,"Ġcommunist":19884,"ĠAdviser":19885,"Ġregist":19886,"Ġannoying":19887,"ĠDVD":19888,"Ġethic":19889,"ĠFilipino":19890,"ĠAdidas":19891,"Ġbilling":19892,"Ġalleviate":19893,"Ġsmoked":19894,"Ġhazard":19895,"EV":19896,"Ag":19897,"baum":19898,"Ġdoses":19899,"Ġoutcry":19900,"Ġinclined":19901,"Ġpsychologist":19902,"itzer":19903,"January":19904,"Ġmornings":19905,"aught":19906,"Ġsurreal":19907,"ĠCannon":19908,"avy":19909,"ĠCris":19910,"cf":19911,"Ġinterpreted":19912,"Ġpersecution":19913,"vation":19914,"Ġupfront":19915,"ĠWaste":19916,"Ġmills":19917,"Ġbombings":19918,"ĠHeaven":19919,"ĠFlat":19920,"Ġboxer":19921,"Ġavenues":19922,"Invest":19923,"ĠZika":19924,"Ġbackstage":19925,"idas":19926,"eston":19927,"ead":19928,"Ġbishops":19929,"Ġrender":19930,"Ġfootballer":19931,"Ġspilled":19932,"Only":19933,"Ġsaddened":19934,"ĠAbove":19935,"inator":19936,"tro":19937,"onen":19938,"ĠAMC":19939,"Ġstringent":19940,"Ġfooting":19941,"ĠGhost":19942,"Ġtexting":19943,"ĠCPI":19944,"ĠUW":19945,"Ġaccol":19946,"iries":19947,"ĠFlex":19948,"ĠCarolyn":19949,"Andre":19950,"Ġsiege":19951,"Muslim":19952,"Ġautomobile":19953,"reci":19954,"Ġdean":19955,"atre":19956,"Ġwax":19957,"Ġwo":19958,"ĠDuffy":19959,"Ġfiance":19960,"Ġfib":19961,"Ġeagle":19962,"ĠCatal":19963,"Ġinfants":19964,"Ġsubmitting":19965,"Ġdownhill":19966,"Ġstaffer":19967,"ĠLights":19968,"Ġeater":19969,"ĠCaliforn":19970,"Ġsupervisors":19971,"ĠPy":19972,"Ġcondemnation":19973,"Ġsci":19974,"Ġhated":19975,"Ġtil":19976,"ĠLavrov":19977,"Ġsab":19978,"Ġmotors":19979,"Ġlogging":19980,"ĠOwn":19981,"Ġpi":19982,"Ġrepeating":19983,"ĠDOJ":19984,"enary":19985,"ĠChow":19986,"fat":19987,"Ġbalcony":19988,"orie":19989,"NING":19990,"ĠUnified":19991,"Neil":19992,"Bill":19993,"ĠSims":19994,"uten":19995,"LV":19996,"ĠEMS":19997,"Ġsip":19998,"Ġreplaces":19999,"ichi":20000,"ĠFig":20001,"ĠCharity":20002,"Ġpeek":20003,"Ġrack":20004,"Ġcousins":20005,"Ġresolving":20006,"Ġthrone":20007,"ĠEngine":20008,"ĠChak":20009,"Ġlamented":20010,"Ġwipe":20011,"Ġnutrients":20012,"ĠChat":20013,"AMP":20014,"ĠOprah":20015,"uming":20016,"serving":20017,"Ġfir":20018,"Ġlandlords":20019,"neck":20020,"Ġupload":20021,"Ġunspecified":20022,"Ġicy":20023,"´":20024,"Ġze":20025,"Ġprohibits":20026,"ĠFI":20027,"Res":20028,"ĠEff":20029,"hell":20030,"umbo":20031,"Ġreceipts":20032,"Ġoperatives":20033,"stant":20034,"Ġwives":20035,"ĠCinema":20036,"Ġnegligence":20037,"Ġgases":20038,"ĠLau":20039,"Ġbrew":20040,"August":20041,"never":20042,"Ġpenned":20043,"Ġincomplete":20044,"ĠZh":20045,"esi":20046,"Ġranged":20047,"apolis":20048,"Ġwithdrawing":20049,"ĠLevi":20050,"ĠLevy":20051,"ĠDaly":20052,"Ġdelaying":20053,"ĠMSNBC":20054,"ĠCyrus":20055,"ĠNutrition":20056,"NN":20057,"Ġwinding":20058,"Ġglow":20059,"ĠMY":20060,"Ġgoodwill":20061,"ĠMON":20062,"Ġslots":20063,"ĠNina":20064,"ĠFIR":20065,"ĠLTE":20066,"ĠInnov":20067,"dev":20068,"ctic":20069,"Ġanalyses":20070,"ĠBangalore":20071,"Ġtales":20072,"Ġovercame":20073,"ĠThurs":20074,"Ġcherry":20075,"ĠNou":20076,"ĠFlowers":20077,"1000":20078,"updated":20079,"rieve":20080,"ĠBeautiful":20081,"iak":20082,"Ġplayback":20083,"Ġheadset":20084,"Ġashamed":20085,"Min":20086,"Ġadm":20087,"ĠLucky":20088,"ĠTucson":20089,"Ġentirety":20090,"ranging":20091,"ĠVance":20092,"kered":20093,"image":20094,"ĠGord":20095,"War":20096,"Ġsimilarities":20097,"dig":20098,"ĠJude":20099,"Ġlonely":20100,"hra":20101,"ĠStaples":20102,"ĠACA":20103,"Ġmeasurement":20104,"Ġcooper":20105,"ATER":20106,"ĠMeng":20107,"Ġbarring":20108,"190":20109,"ĠBatt":20110,"Ġreproductive":20111,"ĠRowe":20112,"Ġsubsid":20113,"Ġslogans":20114,"ugar":20115,"ĠKeller":20116,"ingham":20117,"fuel":20118,"Ġhid":20119,"afe":20120,"Ġindul":20121,"cash":20122,"Ġstressing":20123,"ĠMIT":20124,"Ġtrump":20125,"ancer":20126,"ĠPes":20127,"ĠMint":20128,"Ġcrossover":20129,"ĠWeiss":20130,"ĠElvis":20131,"ĠPermanent":20132,"ĠKhalid":20133,"Ġunjust":20134,"Ġexceptionally":20135,"Ġfut":20136,"Ġavid":20137,"ĠEthics":20138,"Ġutilized":20139,"Ġfeasibility":20140,"Ġcatering":20141,"Press":20142,"wayne":20143,"October":20144,"Ġfavors":20145,"Ġobsession":20146,"Ġmelt":20147,"Ġmug":20148,"ĠMK":20149,"Ġapples":20150,"Ġvine":20151,"cliffe":20152,"Ġgrat":20153,"Ġspells":20154,"ounced":20155,"Ġdecree":20156,"issy":20157,"Team":20158,"Ġdeploying":20159,"Feb":20160,"Ġmiserable":20161,"Ġwat":20162,"ĠBust":20163,"ĠNorris":20164,"ĠTimberwolves":20165,"Ġangered":20166,"ĠArn":20167,"oft":20168,"rome":20169,"Ġadvertisements":20170,"onal":20171,"Ġnun":20172,"Ġtorque":20173,"Ġslave":20174,"Ġnonsense":20175,"Ġcoy":20176,"Ġcites":20177,"Game":20178,"Ġarchitects":20179,"playing":20180,"Ġgener":20181,"Ġsocio":20182,"Ġmeditation":20183,"Ġforgive":20184,"Ġsmiled":20185,"%),":20186,"Ġpers":20187,"ĠSoph":20188,"Ġoccupy":20189,"atton":20190,"Ġwitnessing":20191,"Ġapologise":20192,"Ġpredecessors":20193,"ĠCassidy":20194,"Ġtallied":20195,"NER":20196,"Ġtract":20197,"ĠHolder":20198,"ĠPav":20199,"Ġjackets":20200,"Mel":20201,"raud":20202,"Ġexercising":20203,"ĠChung":20204,"ĠAmin":20205,"athi":20206,"ĠMem":20207,"Ġracked":20208,"Ġcarved":20209,"ĠMickey":20210,"ĠLafayette":20211,"Ġgrill":20212,"ĠINFORMATION":20213,"usc":20214,"ĠPromotion":20215,"yson":20216,"istry":20217,"Ġfulfilled":20218,"Ġrestraint":20219,"Ġpopping":20220,"ĠSlater":20221,"Ġmercy":20222,"aden":20223,"Ġsubmarine":20224,"ĠBowling":20225,"dogs":20226,"ĠSwe":20227,"Ġnoticeable":20228,"Ġbis":20229,"ĠPremiership":20230,"Ġspat":20231,"ĠTow":20232,"ĠWand":20233,"Ġmechanics":20234,"while":20235,"ĠBenson":20236,"Ġmolecules":20237,"Ġcrosses":20238,"Ġrecalling":20239,"ĠCertainly":20240,"HAM":20241,"Ġsever":20242,"ĠRudy":20243,"ĠDUI":20244,"OLD":20245,"ĠTobacco":20246,"Ġsubdued":20247,"Ġquota":20248,"TF":20249,"Ġflats":20250,"Ġemphasize":20251,"Ġbelts":20252,"ĠOpinion":20253,"Ġpiled":20254,"ĠSpark":20255,"ĠElias":20256,"Ġclassification":20257,"ĠHands":20258,"ĠCV":20259,"Ġtoast":20260,"Ġcandle":20261,"atching":20262,"short":20263,"ĠDup":20264,"Ġult":20265,"bats":20266,"Ġmarketers":20267,"ĠAvery":20268,"ĠColbert":20269,"ĠIk":20270,"ĠVac":20271,"ĠJackets":20272,"Ġmerits":20273,"eli":20274,"PORT":20275,"Ġelevator":20276,"irming":20277,"effective":20278,"Ġgroceries":20279,"Ġhi":20280,"ĠINTER":20281,"ĠSAP":20282,"ĠNYPD":20283,"ĠKY":20284,"Ġangel":20285,"Ġspectacle":20286,"ré":20287,"ĠRoche":20288,"Ġinsects":20289,"Ġcommenced":20290,"ĠFoley":20291,"Ġdarker":20292,"ĠUg":20293,"ĠMostly":20294,"Ġtermed":20295,"uci":20296,"ĠExec":20297,"ĠBrittany":20298,"Ġharmony":20299,"Ġadvocated":20300,"Ġparcel":20301,"ĠHots":20302,"Ġmonarch":20303,"ĠSiri":20304,"odge":20305,"ĠPag":20306,"Ġprogressing":20307,"grounds":20308,"Ġonstage":20309,"Ġwarmth":20310,"ĠWon":20311,"Ġviolates":20312,"ĠSaudis":20313,"Ġbumper":20314,"Ġpatrols":20315,"ĠBarron":20316,"Ġindoors":20317,"Ġtar":20318,"Each":20319,"Val":20320,"Ġapplicant":20321,"ĠCater":20322,"Ġclassics":20323,"ĠThreat":20324,"Ġwrapping":20325,"ĠIdlib":20326,"anking":20327,"Did":20328,"adia":20329,"ĠRig":20330,"ĠBram":20331,"ĠLaurie":20332,"ĠHair":20333,"ĠCannabis":20334,"Ġdaylight":20335,"ĠNorm":20336,"ĠRip":20337,"sin":20338,"unta":20339,"Pass":20340,"ĠAcad":20341,"ĠCummings":20342,"Ġtheirs":20343,"ĠDistribution":20344,"especially":20345,"Ġgrilled":20346,"Ġaffiliates":20347,"ĠVander":20348,"ĠCath":20349,"ĠProductions":20350,"ĠTrek":20351,"230":20352,"Ġcasinos":20353,"ĠCain":20354,"atu":20355,"idget":20356,"ĠWinds":20357,"Ġunanswered":20358,"Ġintercept":20359,"ĠMarty":20360,"Ġrefin":20361,"Ġlieutenant":20362,"cas":20363,"Chief":20364,"average":20365,"ilot":20366,"Ġscrimmage":20367,"ĠMud":20368,"speaking":20369,"ĠFranken":20370,"ĠTories":20371,"Ġabstract":20372,"awar":20373,"ĠTerms":20374,"dal":20375,"ĠFur":20376,"Ġhumour":20377,"rh":20378,"Ġsitu":20379,"aed":20380,"ĠFIN":20381,"Ġtranscripts":20382,"approved":20383,"ĠParsons":20384,"Ġpigs":20385,"Ġrepayment":20386,"ĠARM":20387,"ĠElliot":20388,"ĠLevine":20389,"Ġtagged":20390,"pun":20391,"ĠDwight":20392,"Ġconfiguration":20393,"sis":20394,"ĠAdult":20395,"Ġearthquakes":20396,"Ġcreature":20397,"ĠMRI":20398,"Ġmach":20399,"Ġprescriptions":20400,"cover":20401,"Ġministries":20402,"Ġinaccurate":20403,"ĠLabs":20404,"ĠMGM":20405,"Ġtomato":20406,"Ġeng":20407,"Ġopposes":20408,"owan":20409,"Ġmapping":20410,"Ġconsum":20411,"online":20412,"eters":20413,"code":20414,"Aug":20415,"Point":20416,"branded":20417,"pling":20418,"ĠCalder":20419,"Oper":20420,"ĠMiddles":20421,"Ġchampagne":20422,"ĠTues":20423,"Ġsampling":20424,"Ġenergetic":20425,"rano":20426,"ĠStyles":20427,"Ġneglected":20428,"ĠDamon":20429,"Ġendanger":20430,"Ġsouthwestern":20431,"ĠATM":20432,"ĠDuck":20433,"engers":20434,"Ġdan":20435,"yth":20436,"Ġbou":20437,"ĠDecl":20438,"Gold":20439,"Ġprojecting":20440,"Google":20441,"ĠHussein":20442,"Ġaccomplishment":20443,"itarian":20444,"Ġgossip":20445,"ĠRai":20446,"ril":20447,"ĠSke":20448,"Ġpsychiatric":20449,"ĠMacBook":20450,"ĠAdobe":20451,"ĠHodg":20452,"Ġaccompany":20453,"Ġadvertised":20454,"Ġreminiscent":20455,"Ġgeographical":20456,"Ġconvertible":20457,"IK":20458,"CTV":20459,"Ġcommunal":20460,"Ġchim":20461,"Ġselfish":20462,"Ġdrilled":20463,"Ġtortured":20464,"Ġblacks":20465,"noon":20466,"Ġmanifesto":20467,"ĠRichie":20468,"acco":20469,"Im":20470,"Ġdebit":20471,"ĠSNP":20472,"perfect":20473,"gard":20474,"ĠRatio":20475,"Ġstubborn":20476,"Ġaccumulation":20477,"Ġcongregation":20478,"Ġkissing":20479,"Ġkillers":20480,"ĠAbbey":20481,"von":20482,"ĠFuj":20483,"ĠIsabel":20484,"NB":20485,"ĠNish":20486,"ĠJulius":20487,"ĠZimmer":20488,"Ġuncover":20489,"dar":20490,"isle":20491,"ĠCompar":20492,"Ġcounselor":20493,"ĠSok":20494,"ĠCumm":20495,"ĠHip":20496,"Ġurgently":20497,"Ġrentals":20498,"Ġapproving":20499,"Ġirrigation":20500,"Ġprostate":20501,"ĠJudicial":20502,"ĠSubmit":20503,"ĠTanner":20504,"attack":20505,"emb":20506,"Ġreclaim":20507,"Ġec":20508,"Ġbrutality":20509,"Ġcommanding":20510,"Ġreasoning":20511,"Roy":20512,"ĠElect":20513,"ĠMobil":20514,"anding":20515,"Ġmirrors":20516,"Israel":20517,"Ġpavement":20518,"Ġoverdue":20519,"ĠMd":20520,"street":20521,"Ġthrill":20522,"pora":20523,"azon":20524,"Ġbrewing":20525,"enge":20526,"ĠDisaster":20527,"Ġbuilder":20528,"ods":20529,"utsch":20530,"Ġterminals":20531,"ĠBaird":20532,"enburg":20533,"Ġhast":20534,"Ġbrass":20535,"Ġparental":20536,"enture":20537,"ĠConduct":20538,"Ġexpands":20539,"luck":20540,"mur":20541,"ĠBj":20542,"Ġadministrations":20543,"ĠOlivier":20544,"oux":20545,"Ġnarrowed":20546,"winner":20547,"Ġmakeshift":20548,"ĠVAT":20549,"ĠJavier":20550,"-,":20551,"Ġsystematic":20552,"Ġenforcing":20553,"emin":20554,"ĠAudio":20555,"United":20556,"gener":20557,"ĠKara":20558,"ivas":20559,"ĠPretty":20560,"ĠLob":20561,"Ġpetitions":20562,"ĠMercer":20563,"ampa":20564,"product":20565,"Ġdistributing":20566,"Ġtunnels":20567,"Ġcondo":20568,"ĠRSS":20569,"ĠCarlo":20570,"Ġpumpkin":20571,"Ġsto":20572,"Ġassumes":20573,"oway":20574,"hiba":20575,"lection":20576,"Ġgam":20577,"ĠAires":20578,"Ġtransmitted":20579,"Ġtrousers":20580,"Ġcheers":20581,"ĠJensen":20582,"Ġemer":20583,"Ġsimpler":20584,"Ġcolored":20585,"ĠSustainable":20586,"Ġinstruct":20587,"Ġpoles":20588,"Ġsupervised":20589,"Ġinteg":20590,"ĠMoreno":20591,"boarding":20592,"igrant":20593,"ĠYoga":20594,"Ġenvironmentally":20595,"Ġsacrifices":20596,"Ġshores":20597,"Ġ127":20598,"Ġestranged":20599,"Ġintoxicated":20600,"Ġemergencies":20601,"ĠKosovo":20602,"yang":20603,"Ġfastball":20604,"Ġpackaged":20605,"LAN":20606,"Ġhurry":20607,"ĠManny":20608,"Ġporch":20609,"Ġcuriosity":20610,"ĠKend":20611,"thouse":20612,"ĠTou":20613,"mun":20614,"Ġwaving":20615,"Ġpasswords":20616,"ĠSwan":20617,"Ġprefers":20618,"ĠCorrections":20619,"aic":20620,"Ġejected":20621,"Ġdossier":20622,"ĠChal":20623,"Ġfacto":20624,"Ġspine":20625,"leck":20626,"Ġrestriction":20627,"Ġdisagreement":20628,"grown":20629,"ĠEdgar":20630,"Ġquantities":20631,"ĠRapid":20632,"Ġpals":20633,"Ġspared":20634,"Ġremarkably":20635,"ructure":20636,"Ġbackers":20637,"ĠGoals":20638,"cles":20639,"rolling":20640,"ĠBlasio":20641,"Ġorchestra":20642,"ologies":20643,"ĠRise":20644,"Power":20645,"Ġuptick":20646,"atha":20647,"ĠMob":20648,"Ġshotgun":20649,"downs":20650,"ĠBorg":20651,"Ġmorale":20652,"Call":20653,"wave":20654,"ĠDuc":20655,"Ġunwilling":20656,"oad":20657,"Ġbusinessmen":20658,"Ġrefriger":20659,"Ġgamers":20660,"Ġcele":20661,"Ġprecip":20662,"Ġrenegoti":20663,"OY":20664,"ĠPharm":20665,"Ġresponsive":20666,"Ġservant":20667,"eye":20668,"Ġraping":20669,"vas":20670,"Ġgroin":20671,"ĠMelvin":20672,"ĠKurds":20673,"Ġstricter":20674,"ĠMum":20675,"ients":20676,"Ġstandalone":20677,"Ġforums":20678,"Ġcommemorate":20679,"Far":20680,"ĠTelegram":20681,"Ġscreenings":20682,"ĠLeonardo":20683,"ighton":20684,"ĠDOWN":20685,"Ġmodule":20686,"Ġremedy":20687,"Ġ280":20688,"Su":20689,"ĠBecker":20690,"ĠGast":20691,"prem":20692,"ĠInto":20693,"oyle":20694,"114":20695,"Ġadhere":20696,"Report":20697,"ĠJaneiro":20698,"ĠKry":20699,"Pakistan":20700,"Ġrobotic":20701,"ande":20702,"Ġoverlooking":20703,"ĠTreaty":20704,"Ġrect":20705,"yne":20706,"Ġbattlefield":20707,"ĠGeoff":20708,"Ġearns":20709,"ĠMiner":20710,"Ġteased":20711,"Ġexemptions":20712,"Ġvacancy":20713,"oku":20714,"Ġvulnerabilities":20715,"ĠRou":20716,"Ġobserv":20717,"Ġoverlook":20718,"Ġcorrespond":20719,"Ġtheatrical":20720,"Ġrobotics":20721,"ĠCompl":20722,"ĠPasadena":20723,"laden":20724,"Ġvastly":20725,"olit":20726,"Ġjustification":20727,"Ġtampering":20728,"ĠSutherland":20729,"ĠMens":20730,"Ġinvisible":20731,"uren":20732,"ĠAshton":20733,"owl":20734,"Ġdisqual":20735,"ĠEva":20736,"Ġfriction":20737,"ĠIrvine":20738,"Ġaliens":20739,"ĠPension":20740,"ĠAssets":20741,"ĠBenedict":20742,"ittal":20743,"Ġsword":20744,"Ġunderwear":20745,"ĠFarmer":20746,"Ġtimber":20747,"Ġdependence":20748,"ĠTang":20749,"Ġ165":20750,"ĠNazis":20751,"Ġpunching":20752,"ĠGloria":20753,"usat":20754,"Ġluxurious":20755,"chuk":20756,"ĠCot":20757,"Ġregained":20758,"Ġreassure":20759,"Ġhello":20760,"Ġante":20761,"Ġnegotiators":20762,"Add":20763,"paced":20764,"ér":20765,"Ġdemolished":20766,"Ann":20767,"joy":20768,"ĠJenna":20769,"Apple":20770,"Ġdisturbance":20771,"Ġcommissions":20772,"ĠPolitico":20773,"along":20774,"Ġnem":20775,"Ġauctions":20776,"ruck":20777,"ĠOD":20778,"ofer":20779,"Play":20780,"Ġcarn":20781,"vez":20782,"Ġtents":20783,"Ġcongratulate":20784,"ĠLiquid":20785,"ĠCoyotes":20786,"uku":20787,"ĠAllah":20788,"Ġbend":20789,"Ġcanvas":20790,"ĠClifford":20791,"Ġvolunteered":20792,"Luc":20793,"bp":20794,"ĠCensus":20795,"ĠShot":20796,"Ġanonymously":20797,"ĠAnglo":20798,"ĠBayer":20799,"ĠAber":20800,"ĠCorrectional":20801,"Ġhardship":20802,"ĠBuenos":20803,"ĠDaw":20804,"Ġbaskets":20805,"Ġupstairs":20806,"Ġmindful":20807,"ĠLCD":20808,"ĠBlackburn":20809,"ĠHale":20810,"477":20811,"Ġcircus":20812,"ĠDragons":20813,"Ġrubble":20814,"rb":20815,"Ġheadaches":20816,"aunt":20817,"itus":20818,"Ġscaled":20819,"ĠComic":20820,"asio":20821,"ĠNordic":20822,"Per":20823,"Ġbombers":20824,"ilitation":20825,"Ġindirectly":20826,"ĠHod":20827,"andan":20828,"operation":20829,"Ġpuppy":20830,"ĠMats":20831,"Ġstewards":20832,"roup":20833,"Ġmemorandum":20834,"Ġpatio":20835,"const":20836,"ĠBold":20837,"ĠKaiser":20838,"Following":20839,"Ġcompat":20840,"Ġsidewalks":20841,"ĠFitzpatrick":20842,"Ġsunlight":20843,"ĠLever":20844,"ĠBecky":20845,"icles":20846,"ĠProbably":20847,"Ġgarner":20848,"ĠTomas":20849,"Ġblankets":20850,"uga":20851,"jiang":20852,"Ġrevel":20853,"ĠHutch":20854,"llers":20855,"Ġtrimmed":20856,"ĠSTR":20857,"ĠKR":20858,"ĠPike":20859,"ĠASS":20860,"Bay":20861,"Ġdiagnostic":20862,"ĠSteph":20863,"Ġtoured":20864,"ĠAvoid":20865,"vic":20866,"Without":20867,"ĠClinical":20868,"Ġblo":20869,"undo":20870,"ĠBoise":20871,"Ġspeculated":20872,"ĠProt":20873,"vention":20874,"Ġscholar":20875,"ĠSta":20876,"Featured":20877,"ĠPrev":20878,"Ġpenny":20879,"ĠHath":20880,"rawn":20881,"Ġrenovated":20882,"ĠFried":20883,"itol":20884,"uddle":20885,"Ġinquest":20886,"Ġmetropolitan":20887,"lights":20888,"Ġtempo":20889,"onom":20890,"ĠImport":20891,"Asia":20892,"Ġowes":20893,"Ġmagistrate":20894,"ĠFriedman":20895,"Ġcontacting":20896,"Ġstrains":20897,"Ġhomage":20898,"Ġlent":20899,"ception":20900,"git":20901,"Ġlively":20902,"Ġscra":20903,"WW":20904,"ön":20905,"rill":20906,"Jack":20907,"ĠShank":20908,"iani":20909,"Ġdecreasing":20910,"MON":20911,"ĠSupervisor":20912,"ĠCats":20913,"ĠFusion":20914,"Ġracially":20915,"ĠTara":20916,"ĠPurchase":20917,"ĠRally":20918,"ĠGraph":20919,"ĠHello":20920,"hest":20921,"ĠVarg":20922,"Ġdrowned":20923,"ĠThu":20924,"ĠWet":20925,"ĠEug":20926,"Ġrainbow":20927,"Ġtelev":20928,"ĠAmir":20929,"Based":20930,"Ġcookie":20931,"uding":20932,"Ġcontracting":20933,"Ġobjected":20934,"Ġfork":20935,"acent":20936,"ĠTil":20937,"ĠLilly":20938,"ĠEur":20939,"Ġhormone":20940,"Ġnails":20941,"ĠFischer":20942,"Ġpier":20943,"EMENT":20944,"Ġeruption":20945,"visory":20946,"Ġspeculate":20947,"apan":20948,"ĠJub":20949,"ĠHuckabee":20950,"string":20951,"stay":20952,"Ġsustaining":20953,"VM":20954,"Ġpriv":20955,"Ġclos":20956,"Ġdownloaded":20957,"ĠIv":20958,"Ġfinanced":20959,"ĠSao":20960,"ĠEverett":20961,"rene":20962,"ĠWo":20963,"ĠPiet":20964,"Ġengulfed":20965,"Ġexiting":20966,"uni":20967,"horn":20968,"Ġgrav":20969,"ection":20970,"Ġdrainage":20971,"Ġfuelled":20972,"Ġorganizational":20973,"bike":20974,"ĠAreas":20975,"Ġpoliceman":20976,"ĠFirm":20977,"ĠSlide":20978,"Ġrand":20979,"ĠJedi":20980,"Ge":20981,"really":20982,"Manchester":20983,"ĠWise":20984,"parent":20985,"Ġlad":20986,"Ġurine":20987,"ĠColombian":20988,"geon":20989,"Ġ1961":20990,"Mania":20991,"Ġgraph":20992,"Ġcod":20993,"fred":20994,"Ġeffic":20995,"ĠGateway":20996,"asket":20997,"Ġdiminished":20998,"Mass":20999,"Ġ205":21000,"Long":21001,"Ġgranddaughter":21002,"Ġshining":21003,"Semitic":21004,"Ġarising":21005,"Ġ330":21006,"ĠDU":21007,"ĠZah":21008,"Ġexclusion":21009,"ĠClaus":21010,"Ġven":21011,"oine":21012,"ĠAPI":21013,"reve":21014,"Ġmilitias":21015,"Ġfro":21016,"Ġwaved":21017,"ĠLuxembourg":21018,"Ġdiamonds":21019,"Ġstabilize":21020,"Ġqueue":21021,"ĠSponsor":21022,"Ġeldest":21023,"ĠLud":21024,"Ġwasting":21025,"Ġdimension":21026,"Ġmotorcycles":21027,"ucker":21028,"ĠTav":21029,"Ġsupremacy":21030,"Take":21031,"ĠCPU":21032,"cup":21033,"Ġdisregard":21034,"Ġenvelope":21035,"ĠCah":21036,"Ġproposes":21037,"ĠMaurice":21038,"Ġhobby":21039,"Ġharmon":21040,"Ġribbon":21041,"ĠOrigin":21042,"Ġbuilders":21043,"Ġconj":21044,"Ġcert":21045,"eat":21046,"ĠStern":21047,"ulia":21048,"vals":21049,"cling":21050,"Ġprovocative":21051,"Ġsofter":21052,"Ġ1948":21053,"Ġremod":21054,"ĠSob":21055,"Ġmaxim":21056,"Ġblueprint":21057,"oit":21058,"ĠGarner":21059,"Ġfibre":21060,"search":21061,"ĠWrite":21062,"270":21063,"Ġclergy":21064,"ĠPalo":21065,"obile":21066,"Mad":21067,"Ġclown":21068,"Ġtraced":21069,"280":21070,"ĠAlberto":21071,"Ġdrums":21072,"ĠFridays":21073,"ĠStrat":21074,"stated":21075,"ĠStevenson":21076,"Pr":21077,"Ġboasted":21078,"ĠBrees":21079,"ĠDonn":21080,"ĠMaya":21081,"Ġrelieve":21082,"Ġ1080":21083,"Ġcheapest":21084,"Ġuniquely":21085,"Ġjungle":21086,"Ġprevalence":21087,"Ġoutfield":21088,"ĠMaps":21089,"Ġaccustomed":21090,"pac":21091,"Ġcombinations":21092,"ĠSoros":21093,"stad":21094,"Ġket":21095,"Ġdisgusting":21096,"ĠOFF":21097,"irs":21098,"Ġbiased":21099,"Ġpaved":21100,"iked":21101,"utterstock":21102,"ocal":21103,"Ġsurround":21104,"ĠGuang":21105,"Ġspear":21106,"ĠBellev":21107,"ortun":21108,"Rec":21109,"acho":21110,"Ġfrightening":21111,"Ġtyres":21112,"normal":21113,"ĠYan":21114,"ĠWarsaw":21115,"ĠBod":21116,"ourse":21117,"199":21118,"Ver":21119,"erent":21120,"Ġsparkling":21121,"Ġchanting":21122,"Ġ1945":21123,"Ġturbo":21124,"Ġhazards":21125,"IRE":21126,"ĠRonnie":21127,"Ġsplitting":21128,"ĠMatte":21129,"roph":21130,"Ġtended":21131,"Ġvandalism":21132,"alis":21133,"SY":21134,"Ġoversaw":21135,"Happy":21136,"ĠTC":21137,"275":21138,"Ġeco":21139,"ĠKers":21140,"Ġextensions":21141,"ĠFlan":21142,"ĠCena":21143,"ĠDowns":21144,"Ġdrummer":21145,"Ġawaited":21146,"ĠACL":21147,"Ġlegends":21148,"ĠRollins":21149,"hend":21150,"Ġdeparting":21151,"Ġtha":21152,"Ġunre":21153,".(":21154,"Ġfaded":21155,"Ġretirees":21156,"vid":21157,"Ġentrants":21158,"ĠStella":21159,"arer":21160,"Ġteaspoon":21161,"ĠSheridan":21162,"irc":21163,"ĠRelief":21164,"ĠButt":21165,"Ġris":21166,"Ġundermined":21167,"Ġsunk":21168,"Sam":21169,"kamp":21170,"riot":21171,"rating":21172,"Ġclubhouse":21173,"Ġpeaked":21174,"ĠSki":21175,"Ġairstrikes":21176,"Ġconce":21177,"ĠCPR":21178,"Ġesp":21179,"ĠWave":21180,"ĠColiseum":21181,"outheastern":21182,"Ġtrou":21183,"Ġfeather":21184,"ĠSoy":21185,"ĠBihar":21186,"Ġintervened":21187,"mits":21188,"colored":21189,"330":21190,"Ġprocession":21191,"apeake":21192,"ité":21193,"riel":21194,"Ġmart":21195,"afer":21196,"ĠGuests":21197,"ĠPie":21198,"Ġshiny":21199,"ĠSixers":21200,"ĠRoads":21201,"Ġkicker":21202,"ĠCrimes":21203,"Ġfrontier":21204,"ansen":21205,"November":21206,"smith":21207,"ĠLaun":21208,"fried":21209,"weet":21210,"ĠGrass":21211,"Ġsanitation":21212,"ĠEat":21213,"ĠParts":21214,"ĠTun":21215,"amar":21216,"ĠJupiter":21217,"ĠFS":21218,"Ġunsc":21219,"ĠDone":21220,"Ġleveraging":21221,"Ġtucked":21222,"Ġineffective":21223,"Ġriots":21224,"wei":21225,"ĠAttend":21226,"Ġpertaining":21227,"amen":21228,"monds":21229,"Ġmism":21230,"serious":21231,"ĠViol":21232,"rous":21233,"Ġ129":21234,"uebl":21235,"umption":21236,"tri":21237,"ĠWedding":21238,"Ġtroopers":21239,"ĠTHR":21240,"olving":21241,"leys":21242,"Med":21243,"Ġseparatists":21244,"Ġimper":21245,"ĠFrontier":21246,"Ġwhit":21247,"ĠMutual":21248,"Ġrested":21249,"Ġunhealthy":21250,"gang":21251,"Ġresearching":21252,"ĠColonel":21253,"Ġaffordability":21254,"ĠRegarding":21255,"ĠWend":21256,"ĠMellon":21257,"Ġplots":21258,"Ġcanal":21259,"PER":21260,"ĠShopping":21261,"etry":21262,"Ġoccurrence":21263,"Ġgraves":21264,"BF":21265,"ĠKau":21266,"indust":21267,"Ġbeard":21268,"uate":21269,"ĠProdu":21270,"ĠSomali":21271,"ishers":21272,"ĠFell":21273,"ĠHutchinson":21274,"Ġhust":21275,"Ġillustration":21276,"Ġ//":21277,"Ġsharks":21278,"Ġcoincidence":21279,"Ġremake":21280,"Ġmural":21281,"course":21282,"ĠSultan":21283,"arse":21284,"Ġwhip":21285,"ĠPodcast":21286,"Ġtightened":21287,"Ġdenim":21288,"Ġlandfill":21289,"future":21290,"Ġsuperv":21291,"Hand":21292,"Ġpraising":21293,"ĠEly":21294,"ĠGust":21295,"ĠMayer":21296,"Ġorphan":21297,"Ġrepaired":21298,"ĠPir":21299,"Ġspiral":21300,"husband":21301,"ienne":21302,"iatric":21303,"Ġmarriages":21304,"Ġhorn":21305,"plain":21306,"ĠLum":21307,"ession":21308,"ĠFeatures":21309,"Ġbreakup":21310,"Ġentrepreneurship":21311,"rina":21312,"Ġembargo":21313,"Ġcapitalism":21314,"ĠMinor":21315,"Ġpromo":21316,"Ġexcel":21317,"Japan":21318,"Ġworsening":21319,"Ġstumbled":21320,"Ġpins":21321,"Ġswipe":21322,"Ġexile":21323,"Ġseparatist":21324,"ĠBian":21325,"Ġrelocation":21326,"Ġcommanders":21327,"Ġdowned":21328,"Ġblogger":21329,"packed":21330,"ĠSchn":21331,"Ġwaterfront":21332,"ĠYus":21333,"Ġnegotiator":21334,"Ġfavourable":21335,"Iran":21336,"oulder":21337,"Ġcance":21338,"Ġvind":21339,"angel":21340,"Ġauthenticity":21341,"Ġtowel":21342,"bul":21343,"ĠNeville":21344,"ĠBuddhist":21345,"fields":21346,"uly":21347,"Ġniece":21348,"Ġcorrections":21349,"Ġassignments":21350,"ĠSchl":21351,"Ġharmed":21352,"375":21353,"Ġwounding":21354,"ĠPosition":21355,"Ġsupermarkets":21356,"Ġdisclosures":21357,"Ġ185":21358,"esp":21359,"ĠMcCull":21360,"ĠMale":21361,"Ġsailors":21362,"mis":21363,"ĠSophia":21364,"Ġunfolded":21365,"owell":21366,"ĠScarborough":21367,"Ġentrepreneurial":21368,"118":21369,"ogy":21370,"ĠLikewise":21371,"Ġswung":21372,"Ġdrawings":21373,"Ġdrafting":21374,"ĠSimple":21375,"ĠFilip":21376,"arf":21377,"Ġfade":21378,"Ġmerged":21379,"ĠLeaf":21380,"sun":21381,"Ġflame":21382,"Ġindices":21383,"ĠCreate":21384,"ittle":21385,"ĠWer":21386,"ĠMond":21387,"Ġoz":21388,"ĠSmoke":21389,"Ġreplies":21390,"ĠDH":21391,"Ġjud":21392,"ĠFalk":21393,"Ġ---":21394,"Ġconstitutes":21395,"Ġtheat":21396,"119":21397,"Ġintermediate":21398,"vill":21399,"ĠGow":21400,"ĠHut":21401,"ł":21402,"155":21403,"ĠLocated":21404,"ĠDoor":21405,"Ġsliced":21406,"aru":21407,"Ġtearing":21408,"defense":21409,"oyer":21410,"Ġprodu":21411,"Ġseminar":21412,"asso":21413,"Ġpeaks":21414,"Ġconceal":21415,"Ġcrypto":21416,"Ġsetbacks":21417,"ĠAlicia":21418,"ĠFAA":21419,"Ġcontinuity":21420,"Ġcatastrophe":21421,"Ġbeg":21422,"Ġscales":21423,"apixel":21424,"Ġsalon":21425,"Ste":21426,"Ġlesbian":21427,"Ġanticip":21428,"Ġutilization":21429,"Ġchickens":21430,"Ġspinal":21431,"ĠJuliet":21432,"ĠFas":21433,"prising":21434,"ĠSalvation":21435,"Ġ138":21436,"Ġutilizing":21437,"âĢ¢":21438,"ĠMessenger":21439,"Ġrebellion":21440,"ĠAlexand":21441,"Ġinsect":21442,"Ġribs":21443,"ĠBild":21444,"Ġmonopoly":21445,"Queen":21446,"ĠNaples":21447,"Ġ133":21448,"Ġhourly":21449,"Ġego":21450,"Ġpencil":21451,"ĠPew":21452,"Ġdesirable":21453,"vant":21454,"ĠLAT":21455,"Ġperpet":21456,"lish":21457,"Ġ201":21458,"Ġdistances":21459,"Ġdistressed":21460,"Work":21461,"Ġtattoos":21462,"Ġstereotypes":21463,"istent":21464,"ĠCoral":21465,"fo":21466,"Ġpayable":21467,"Ġakin":21468,"ĠLis":21469,"ĠFinding":21470,"Ġsusceptible":21471,"ĠKiw":21472,"Ġforgiveness":21473,"ĠMoment":21474,"ĠDmitry":21475,"Ġrenov":21476,"Ġquint":21477,"ĠWaterloo":21478,"ĠReality":21479,"Ġstray":21480,"ĠBeaver":21481,"Ġbites":21482,"Ġelusive":21483,"Ġvirtue":21484,"Ġgadgets":21485,"Ġlandslide":21486,"ĠHealthy":21487,"Ġpits":21488,"Donnell":21489,"Ġirony":21490,"uct":21491,"Ġpractitioners":21492,"Ġreck":21493,"governmental":21494,"Ġatomic":21495,"Ġmotiv":21496,"Ġpolic":21497,"Ġcommunicated":21498,"ĠHS":21499,"Ġcriticize":21500,"Ġsynerg":21501,"Del":21502,"ĠRoe":21503,"Ġinspirational":21504,"ĠWarning":21505,"pel":21506,"Ġnevertheless":21507,"Ġdespair":21508,"Ġ(.":21509,"Ġfearing":21510,"Ġgrop":21511,"tree":21512,"Ġtrusts":21513,"Ġinterviewing":21514,"amic":21515,"Ġscor":21516,"ject":21517,"Another":21518,"pose":21519,"Ġdepicted":21520,"ĠPhotography":21521,"ĠLenovo":21522,"ĠEpic":21523,"ĠBoot":21524,"GI":21525,"enses":21526,"Class":21527,"arity":21528,"Ġservicing":21529,"ĠHann":21530,"Ġawe":21531,"Ġoverdoses":21532,"ĠFinnish":21533,"Ġpav":21534,"ĠPCs":21535,"SEC":21536,"ĠStro":21537,"Ġattracts":21538,"Ġapprehended":21539,"128":21540,"Ġunstable":21541,"ĠOutdoor":21542,"Ġcloth":21543,"ĠUlster":21544,"Ġvisually":21545,"Ġsculpt":21546,"Ġsufficiently":21547,"ĠKendrick":21548,"Ġengages":21549,"Ġknives":21550,"ĠGut":21551,"Ġarbit":21552,"osition":21553,"Ġemoji":21554,"Ġpinpoint":21555,"Ġremembering":21556,"rence":21557,"ĠVish":21558,"Ġimproperly":21559,"Ġranc":21560,"Ġupstream":21561,"Ġcheckpoint":21562,"Ġrash":21563,"eson":21564,"Ġtoes":21565,"260":21566,"Ġinvalid":21567,"Ġonions":21568,"Ġlashed":21569,"ĠDong":21570,"Ġprovisional":21571,"ĠFern":21572,"Ġirresponsible":21573,"actively":21574,"ĠKnown":21575,"Ġben":21576,"ĠBlank":21577,"Ġactresses":21578,"paying":21579,"Ġsyrup":21580,"isman":21581,"Ġeducating":21582,"Sunday":21583,"ifiable":21584,"Post":21585,"Ġcalculation":21586,"Ġhesitate":21587,"ĠIncreasing":21588,"Ġreeling":21589,"ĠDairy":21590,"ensing":21591,"Ġmaternity":21592,"Ø":21593,"./":21594,"ĠElm":21595,"Ġweddings":21596,"ĠYard":21597,"117":21598,"ĠRocket":21599,"OF":21600,"Ġtreasurer":21601,"Ġrattled":21602,"ĠDrop":21603,"arel":21604,"ĠFulton":21605,"ĠGiant":21606,"ĠFloor":21607,"Jet":21608,"ikk":21609,"ĠBucs":21610,"ostics":21611,"reme":21612,"ĠRouse":21613,"Ġdeliber":21614,"ĠEle":21615,"Ġconducts":21616,"ĠBlog":21617,"connected":21618,"Ġprayed":21619,"Ġcolourful":21620,"Ġaugmented":21621,"Ġbatted":21622,"Ġrelevance":21623,"ĠRomanian":21624,"acqu":21625,"ĠChel":21626,"ĠClo":21627,"ĠGraves":21628,"Ġchees":21629,"ĠGibbs":21630,"CLE":21631,"Ġfertility":21632,"Ġambul":21633,"Ġspecs":21634,"ĠIRA":21635,"ĠBooth":21636,"ithe":21637,"ĠPlayoff":21638,"ammed":21639,"Ġcollaborating":21640,"Ġlunar":21641,"Ġconfronting":21642,"Ġattribute":21643,"King":21644,"riz":21645,"Ġcasualty":21646,"acia":21647,"waters":21648,"Ġpaving":21649,"Ġcaregivers":21650,"nor":21651,"Ġreacting":21652,"ĠHash":21653,"Ġsqueezed":21654,"Ġexert":21655,"ĠMichele":21656,"ĠConc":21657,"ĠHep":21658,"Ġsewage":21659,"wart":21660,"GY":21661,"Ġdiscourage":21662,"ĠFir":21663,"Ġtextile":21664,"ĠSpice":21665,"ĠFah":21666,"Ġcomplainant":21667,"Ġinstinct":21668,"camp":21669,"ĠEdison":21670,"ĠVIDEOS":21671,"LM":21672,"ĠSands":21673,"About":21674,"Ġdisk":21675,"brid":21676,"Ġmuted":21677,"ACC":21678,"Ġwre":21679,"event":21680,"Ġicons":21681,"Express":21682,"udes":21683,"ĠBeatles":21684,"color":21685,"ĠHaas":21686,"ĠWolfe":21687,"ĠYOUR":21688,"Ġaccessibility":21689,"ĠCornwall":21690,"Ġing":21691,"Ġatrocities":21692,"weather":21693,"ĠDominion":21694,"ĠMIL":21695,"ĠLara":21696,"Ġunravel":21697,"Ġmaneuver":21698,"Ġfoam":21699,"ribe":21700,"CI":21701,"Ġcandles":21702,"acs":21703,")(":21704,"coon":21705,"ĠPurple":21706,"ĠGovernors":21707,"ĠKeystone":21708,"ĠYuk":21709,"file":21710,"Ġviol":21711,"gery":21712,"370":21713,"train":21714,"Ġgunshots":21715,"olin":21716,"Ġviruses":21717,"ĠTex":21718,"hours":21719,"Ġprev":21720,"ĠRid":21721,"ected":21722,"ĠVog":21723,"riers":21724,"Ġmurdering":21725,"ĠIz":21726,"Ġdeliberations":21727,"arming":21728,"unda":21729,"Ġrink":21730,"ĠDrugs":21731,"idered":21732,"Ġforge":21733,"Ġexpansive":21734,"VIEW":21735,"ĠBots":21736,"Ġswitches":21737,"KO":21738,"atten":21739,"Ġvariants":21740,"ĠVirtual":21741,"ĠCoch":21742,"yon":21743,"ĠKai":21744,"Ġbullied":21745,"iday":21746,"version":21747,"Ġlib":21748,"ĠCec":21749,"igated":21750,"ĠTRUMP":21751,"ĠPod":21752,"Ġtoppled":21753,"Ġeyeing":21754,"ĠPatients":21755,"techn":21756,"Ġhampered":21757,"Ġavert":21758,"ĠScheme":21759,"ĠCorm":21760,"Ġpony":21761,"Ġzoom":21762,"abo":21763,"Ġsleeves":21764,"lane":21765,"ĠLester":21766,"ĠDane":21767,"Ġcough":21768,"Ġsignings":21769,"HER":21770,"Ġsibling":21771,"Ġredemption":21772,"Ġstockp":21773,"ĠAlgeria":21774,"Ġpadd":21775,"ĠBrenda":21776,"uchi":21777,"Ġtransporting":21778,"Ġspeculative":21779,"ĠSek":21780,"abal":21781,"Ġshipment":21782,"oker":21783,"Ġwarranty":21784,"atan":21785,"Ġblister":21786,"ĠCelebration":21787,"Ġwal":21788,"Ġlac":21789,"Ġprioritize":21790,"ression":21791,"BP":21792,"Ġcollaborated":21793,"ĠNewsletter":21794,"ĠDamian":21795,"ĠResidential":21796,"Ġgra":21797,"Ġfeasible":21798,"ĠCrest":21799,"ĠBean":21800,"ĠSturgeon":21801,"ĠTale":21802,"ĠContin":21803,"ĠMush":21804,"Ġrocking":21805,"ĠMane":21806,"ĠHumane":21807,"resistant":21808,"ĠFra":21809,"highest":21810,"fts":21811,"Ġamassed":21812,"ĠPavilion":21813,"ĠSkin":21814,"Ġunfold":21815,"Ġresur":21816,"ĠPET":21817,"model":21818,"Ġemploying":21819,"Ġrude":21820,"Ġirrelevant":21821,"angu":21822,"Page":21823,"PN":21824,"igator":21825,"ĠReb":21826,"ĠArrest":21827,"ĠGund":21828,"Ġmalls":21829,"zhen":21830,"wed":21831,"Ġdaring":21832,"Ġfactual":21833,"ĠGent":21834,"Ġinforming":21835,"ĠStri":21836,"ĠLounge":21837,".]":21838,"ĠTribunal":21839,"ĠMoines":21840,"Ġshadows":21841,"generated":21842,"fulness":21843,"Ġheartfelt":21844,"ĠLivingston":21845,"ĠClerk":21846,"Ġnationalism":21847,"ĠMiche":21848,"balls":21849,"anos":21850,"agle":21851,"Ġprejudice":21852,"Ġevenly":21853,"Ġswearing":21854,"Ġexits":21855,"Ġcondemning":21856,"Ġvanilla":21857,"club":21858,"ĠFunding":21859,"ĠDover":21860,"Ġhots":21861,"Ġfres":21862,"Ġgoodness":21863,"ĠMcKay":21864,"Ġbulls":21865,"avia":21866,"129":21867,"Ġ1947":21868,"Ġdefamation":21869,"ĠMoran":21870,"irms":21871,"ĠFitz":21872,"ĠRossi":21873,"urated":21874,"Ġvariation":21875,"ĠBauer":21876,"ĠSchro":21877,"Ġcolony":21878,"ĠParliamentary":21879,"ikan":21880,"Ġstirring":21881,"ĠSheldon":21882,"Ġaccessory":21883,"ĠUtilities":21884,"Ġnab":21885,"Ġpract":21886,"Ġherein":21887,"ĠRole":21888,"ĠMant":21889,"Ġpharm":21890,"Ġ215":21891,"ĠNGO":21892,"ĠAnything":21893,"ĠMacedonia":21894,"Ġbree":21895,"ĠWTO":21896,"Chicago":21897,"ĠProtect":21898,"quarters":21899,"ĠGrassley":21900,"ĠInteractive":21901,"ĠInterview":21902,"Ġ550":21903,"Ġastronauts":21904,"Ġfreak":21905,"ĠIntegrated":21906,"Ġindict":21907,"Ġgenerators":21908,"acio":21909,"Kevin":21910,"Ġvaccination":21911,"Ġblockade":21912,"ĠSons":21913,"Ġcapita":21914,"ĠAnita":21915,"ĠExport":21916,"ĠNex":21917,"ĠAram":21918,"Ġzinc":21919,"Ġrevamped":21920,"Ġselective":21921,"Ġmanipulate":21922,"ĠBedford":21923,"ĠBattery":21924,"Ġqualifiers":21925,"lean":21926,"Ġscrew":21927,"film":21928,"ror":21929,"ĠEllison":21930,"ombo":21931,"ĠOst":21932,"165":21933,"Ġslaves":21934,"ĠPayton":21935,"Ġbarg":21936,"Ġrugged":21937,"ĠWinn":21938,"ĠHammer":21939,"ĠUPS":21940,"Euro":21941,"Ġunfamiliar":21942,"Ġdistract":21943,"Ġbuffer":21944,"ledge":21945,"Ġtrunk":21946,"Ġ320":21947,"122":21948,"Ġdilemma":21949,"Ġpra":21950,"Ġutmost":21951,"Ġcampaigners":21952,"icular":21953,"eful":21954,"�":21955,"ĠHQ":21956,"neau":21957,"Ġsir":21958,"test":21959,"Company":21960,"Ġrescind":21961,"ardon":21962,"MG":21963,"Gov":21964,"ĠRaz":21965,"Ġrod":21966,"fed":21967,"Ġpsych":21968,"Ġunin":21969,"ĠArbor":21970,"Ġnewcomer":21971,"ĠEdwin":21972,"raising":21973,"quist":21974,"Ġdiscoveries":21975,"Steve":21976,"Ġscramble":21977,"js":21978,"Ġacoustic":21979,"Ġdeterioration":21980,"Ġobserving":21981,"ĠWinning":21982,"ĠSaban":21983,"idy":21984,"Ġoverd":21985,"Ġscouting":21986,"Ġpunitive":21987,"ĠShelter":21988,"Ġmocked":21989,"Ġdreamed":21990,"Ġinvaluable":21991,"LP":21992,"standard":21993,"Ġrecounted":21994,"ĠSabres":21995,"points":21996,"Ġfringe":21997,"ĠBarker":21998,"alian":21999,"ĠPROV":22000,"Ġcartel":22001,"Ġovercrowd":22002,"tain":22003,"Year":22004,"ĠWelfare":22005,"ĠChr":22006,"Ġintroduces":22007,"ĠDoing":22008,"ĠGlover":22009,"Ġdeteriorating":22010,"Par":22011,"Ġattendant":22012,"ĠMold":22013,"ĠFlying":22014,"ovan":22015,"Ġoptimize":22016,"Ġchapters":22017,"Ġdull":22018,"gay":22019,"ĠATP":22020,"ĠKah":22021,"ainer":22022,"feet":22023,"Ġjoking":22024,"Ġdisadvantage":22025,"Rep":22026,"Ġtwisted":22027,"Ġslain":22028,"Ġcomprise":22029,"Ġrestricting":22030,"Ġdispos":22031,"Ġshaky":22032,"Ġembattled":22033,"owe":22034,"conscious":22035,"oken":22036,"Ġmistaken":22037,"ĠDra":22038,"Ġreservoir":22039,"Ġspate":22040,"Scott":22041,"avor":22042,"Ġqual":22043,"amel":22044,"hunt":22045,"ĠChevy":22046,"Ġclaw":22047,"Ġwitch":22048,"ĠZimmerman":22049,"arium":22050,"Ġrubbish":22051,"Ġstrings":22052,"Ġdoc":22053,"Ġplaque":22054,"ĠCyr":22055,"Ġflourish":22056,"Ġworthwhile":22057,"Ġbanners":22058,"ĠLemon":22059,"ĠRainbow":22060,"Ġconsisted":22061,"ĠHOW":22062,"Ñ":22063,"Ġblogs":22064,"CLUS":22065,"eely":22066,"Ġbeast":22067,"ĠMai":22068,"Ġhostility":22069,"eros":22070,"Ġforeseeable":22071,"ĠCorker":22072,"ĠWEEK":22073,"visors":22074,"ressive":22075,"ĠViktor":22076,"Ġbureaucracy":22077,"Ġ256":22078,"ĠFeel":22079,"ĠAdventure":22080,"Ġefficacy":22081,"ĠInstitution":22082,"ĠHarbaugh":22083,"ĠPractice":22084,"ĠChristianity":22085,"Thanks":22086,"Ġfridge":22087,"idel":22088,"Ġeff":22089,"Ġvein":22090,"terms":22091,"Ġignorance":22092,"Ġscream":22093,"Ġwit":22094,"ĠRousse":22095,"ĠWillow":22096,"Ġhallway":22097,"former":22098,"Ġshooters":22099,"ĠReporting":22100,"Ġgal":22101,"Ġsavvy":22102,"rand":22103,"Ġremed":22104,"ĠBaron":22105,"inar":22106,"Ġseizures":22107,"ĠThorn":22108,"ĠProtesters":22109,"ĠRevolutionary":22110,"think":22111,"ĠCabrera":22112,"Four":22113,"ĠRudd":22114,"Ġprost":22115,"ĠBottom":22116,"Port":22117,"nas":22118,"ifax":22119,"Wire":22120,"Ġtokens":22121,"antis":22122,"ĠSOU":22123,"ĠMilk":22124,"asters":22125,"Ġshrimp":22126,"Ġcakes":22127,"blue":22128,"ifty":22129,"View":22130,"adium":22131,"fen":22132,"zyk":22133,"ĠEmil":22134,"Ġdismay":22135,"Ġtilt":22136,"aska":22137,"Young":22138,"Ġpredators":22139,"Ġovershadowed":22140,"mitt":22141,"ĠSemin":22142,"ĠSchiff":22143,"ĠClarkson":22144,"212":22145,"210":22146,"Ġvanished":22147,"Ġmesh":22148,"ĠBurnett":22149,"ĠMent":22150,"ĠBlind":22151,"ĠPatriot":22152,"ĠVil":22153,"Ġflick":22154,"ĠTowns":22155,"ĠWhites":22156,"Ġspice":22157,"ĠMode":22158,"Ġnominate":22159,"Ġwrest":22160,"ĠAshes":22161,"Ġrows":22162,"ĠClint":22163,"Ġgentleman":22164,"utan":22165,"athlon":22166,"ĠIntermediate":22167,"hews":22168,"Ġoffended":22169,"ĠPaige":22170,"ĠFinch":22171,"ĠAboriginal":22172,"positive":22173,"Stop":22174,"Ġrenting":22175,"Ġ[â̦]":22176,"ĠHert":22177,"Ġvegetation":22178,"apes":22179,"ĠCanon":22180,"appa":22181,"Ġabst":22182,"ĠKatz":22183,"Ġsurfing":22184,"aghan":22185,"ĠPresidency":22186,"Ġscaling":22187,"ĠSas":22188,"Ġpeanut":22189,"Ġrecommending":22190,"cious":22191,"endez":22192,"eker":22193,"ĠKamp":22194,"Ġsitcom":22195,"Ġcrust":22196,"women":22197,"ĠJes":22198,"ĠWhe":22199,"ĠWarwick":22200,"Ġepit":22201,"ĠAlc":22202,"Ġdictate":22203,"ĠSPORTS":22204,"ĠLanguage":22205,"Ġindicative":22206,"ĠMacDonald":22207,"Ġreorgan":22208,"Ġ`":22209,"ARS":22210,"Ġliberation":22211,"Ġbless":22212,"Ġreflective":22213,"Ġà¤":22214,"Ġdesires":22215,"ĠHank":22216,"ĠLaunch":22217,"Ġrotating":22218,"ĠStones":22219,"Ġcoordinating":22220,"ĠZeit":22221,"Ġskepticism":22222,"ĠAlam":22223,"ĠTrout":22224,"ĠSMS":22225,"ĠCrescent":22226,"ĠTeacher":22227,"Ġfury":22228,"Ġeyebrows":22229,"onga":22230,"ĠPilot":22231,"ĠRutherford":22232,"Ġinterstate":22233,"established":22234,"Ġbaggage":22235,"Ġ131":22236,"riks":22237,"mil":22238,"Ġneon":22239,"Ġqueer":22240,"ourced":22241,"ĠKash":22242,"ĠEleven":22243,"illes":22244,"ĠOpportun":22245,"Ġstre":22246,"Washington":22247,"ĠDifferent":22248,"Ġexempl":22249,"Ġboarded":22250,"Ġrogue":22251,"ĠDNC":22252,"rone":22253,"Ġreversing":22254,"nine":22255,"ĠIvory":22256,"itating":22257,"uve":22258,"Ġfracture":22259,"255":22260,"ĠAssessment":22261,"Ġsubjective":22262,"Ġfluct":22263,"ĠJaguar":22264,"Ġstride":22265,"Ġreapp":22266,"ĠGrow":22267,"against":22268,"ĠMedina":22269,"scenes":22270,"ĠNieto":22271,"Ġsou":22272,"ĠFleming":22273,"Ġnarcotics":22274,"ĠBere":22275,"ĠBub":22276,"ĠAck":22277,"Ġvinyl":22278,"ĠCopy":22279,"ĠGarland":22280,"ĠDuty":22281,"Ġinn":22282,"Ġmerchant":22283,"Ġactivate":22284,"Ġglowing":22285,"ettle":22286,"ĠBran":22287,"Ġsilk":22288,"anco":22289,"TL":22290,"ĠFurn":22291,"Ġwithheld":22292,"Ġpulse":22293,"ĠGU":22294,"BUS":22295,"ĠHyper":22296,"Ġpicnic":22297,"Ġpositives":22298,"ĠParamount":22299,"Ġ737":22300,"Ġenlisted":22301,"ĠValerie":22302,"false":22303,"ĠChocolate":22304,"ĠSTAR":22305,"Ġdescended":22306,"Ġtasty":22307,"ĠDaesh":22308,"ĠNed":22309,"Ġcomplimentary":22310,"Ġdepicting":22311,"ĠHavana":22312,"college":22313,"Ġtraces":22314,"Ġundue":22315,"ĠSisters":22316,"aum":22317,"ĠCourier":22318,"ĠOng":22319,"ĠSparks":22320,"ongs":22321,"ĠYong":22322,"URR":22323,"los":22324,"Ġhorsepower":22325,"confidence":22326,"ĠPett":22327,"ĠMeasure":22328,"Ġmarches":22329,"zig":22330,"ĠTOR":22331,"Ġexported":22332,"ĠRak":22333,"ĠInvestigations":22334,"Ġterminate":22335,"ĠTian":22336,"Ġmasters":22337,"ĠDS":22338,"Ġoutraged":22339,"ĠCups":22340,"ĠWeir":22341,"exec":22342,"Ġjourneys":22343,"Ġabide":22344,"Ġavail":22345,"ĠStreets":22346,"Ġfixes":22347,"Ġcocoa":22348,"Ġabundant":22349,"Ġhubs":22350,"mort":22351,"Ġrobberies":22352,"ĠBark":22353,"Ġprecautions":22354,"Ġhammered":22355,"ometric":22356,"mith":22357,"ĠMcCann":22358,"ĠJaw":22359,"ĠQuest":22360,"ĠMcF":22361,"Ġlob":22362,"Ġlegalized":22363,"Ġquirky":22364,"Ġtrailers":22365,"ĠIndividual":22366,"Ġcumulative":22367,"Ġenlarge":22368,"Ġconvoy":22369,"olen":22370,"got":22371,"landers":22372,"Ġscanner":22373,"Ġscans":22374,"ĠEg":22375,"prof":22376,"Ġhosp":22377,"ĠColo":22378,"Ġerr":22379,"Ġdeval":22380,"ĠUsually":22381,"Ġbul":22382,"ummy":22383,"Ġtandem":22384,"occupied":22385,"Ġmandates":22386,"ĠSwim":22387,"121":22388,"ussed":22389,"EF":22390,"Ġfries":22391,"Until":22392,"rc":22393,"Ġbadge":22394,"Ġstrips":22395,"Ġmagnet":22396,"Ġarchive":22397,"stan":22398,"ĠDeadline":22399,"Ġdisposable":22400,"Ġbob":22401,"Ġnorthwestern":22402,"Jul":22403,"ĠSAL":22404,"Ġinfluencing":22405,"Ġdevil":22406,"ĠEllie":22407,"cms":22408,"ingo":22409,"888":22410,"Ġcosmetic":22411,"Also":22412,"Ġyacht":22413,"Ġlazy":22414,"Ġmerc":22415,"Ġabsorbed":22416,"harm":22417,"116":22418,"Ġsubpoena":22419,"Ġcounters":22420,"ĠLori":22421,"Ġrandomly":22422,"nea":22423,"waves":22424,"Ġrelie":22425,"ĠKiss":22426,"Ġchassis":22427,"Ġbakery":22428,"Images":22429,"ĠHolden":22430,"Ġamazed":22431,"Ġalignment":22432,"ĠPowers":22433,"Ġlabelled":22434,"Ġstaunch":22435,"Ġsignaling":22436,"Ġsenate":22437,"Ġunconventional":22438,"ĠAlternative":22439,"Ġambassadors":22440,"ĠVPN":22441,"atics":22442,"Ġmosquito":22443,"ĠScholarship":22444,"Ġhelpless":22445,"alone":22446,"ZA":22447,"chel":22448,"Ġconstituencies":22449,"ĠCafé":22450,"Ġhatch":22451,"ĠRupert":22452,"Ġrendering":22453,"Ġreinstated":22454,"Ġinterval":22455,"Texas":22456,"ĠAHL":22457,"February":22458,"review":22459,"Ġgle":22460,"Ġfals":22461,"Ġmarkers":22462,"Ġgovernmental":22463,"ĠPos":22464,"Ġarose":22465,"every":22466,"Ġrulings":22467,"obar":22468,"Govern":22469,"gren":22470,"isan":22471,"Ġmarketed":22472,"Click":22473,"Ġord":22474,"Ġballoons":22475,"asers":22476,"ĠHorton":22477,"pub":22478,"ĠAerospace":22479,"Ġflank":22480,"Ġmolecular":22481,"bour":22482,"nuts":22483,"Ġalliances":22484,"Ġbenchmarks":22485,"ocate":22486,"stadt":22487,"ĠGoodwin":22488,"lap":22489,"ĠFactors":22490,"Never":22491,"ĠNem":22492,"Ġroadside":22493,"orth":22494,"Ġexhibited":22495,"ĠPearce":22496,"ĠOlsen":22497,"Ġpostal":22498,"ĠLiberation":22499,"reen":22500,"mary":22501,"Ġropes":22502,"Ġlarg":22503,"Ġgob":22504,"boys":22505,"ĠSax":22506,"Ġreimbursement":22507,"ĠVie":22508,"ĠCatholics":22509,"ĠMartial":22510,"Ġpremiered":22511,"Ġawaits":22512,"ĠUnderstanding":22513,"ĠBelarus":22514,"ĠVor":22515,"ogi":22516,"iaz":22517,"Ġvictorious":22518,"Ġancestors":22519,"Ġwreckage":22520,"Ġoppression":22521,"ĠChildhood":22522,"Ġwidth":22523,"ĠPlymouth":22524,"ĠFifty":22525,"Ġoccupancy":22526,"etts":22527,"ĠFiscal":22528,"lifting":22529,"ĠTraditional":22530,"Ġnostalgia":22531,"Law":22532,"Ġlays":22533,"Ġarresting":22534,"Ġanticipating":22535,"Ġinsults":22536,"ĠExtension":22537,"Ġgenerator":22538,"ummer":22539,"Ġageing":22540,"Ġbouncing":22541,"ember":22542,"ĠWAR":22543,"ĠNico":22544,"ĠWow":22545,"ĠRaven":22546,"flower":22547,"ĠCrim":22548,"bh":22549,"Ġundo":22550,"Ġburgers":22551,"roud":22552,"ĠAtkinson":22553,"ĠYEAR":22554,"Ġpoorer":22555,"ICA":22556,"ĠSchedule":22557,"Ġstronghold":22558,"ĠMillennium":22559,"Ġ###":22560,"ilda":22561,"ĠGH":22562,"Ġupscale":22563,"aldi":22564,"ĠResolution":22565,"Ġswelling":22566,"Ġgrieving":22567,"ĠNile":22568,"ĠTig":22569,"ERY":22570,"ooth":22571,"BALL":22572,"Ġballet":22573,"Ġbucks":22574,"ĠUV":22575,"akin":22576,"Ġchilling":22577,"Ġdatabases":22578,"ĠGD":22579,"section":22580,"Ġhires":22581,"Ġmul":22582,"Ġsen":22583,"ĠTownsend":22584,"Ġinspected":22585,"ilic":22586,"Ġdiscriminatory":22587,"fol":22588,"Ġalcoholic":22589,"ĠHoff":22590,"Carl":22591,"Ġvicinity":22592,"lein":22593,"ĠEco":22594,"ĠGovern":22595,"Ġsecrecy":22596,"aned":22597,"ĠDUP":22598,"Ġ570":22599,"Ġsow":22600,"Ġstalls":22601,"Ġinsulting":22602,"ĠDT":22603,"Ġinforms":22604,"fitting":22605,"ĠDepending":22606,"ĠMelanie":22607,"ĠThom":22608,"path":22609,"Ġadmired":22610,"Peter":22611,"idents":22612,"ielding":22613,"ĠShanahan":22614,"TD":22615,"Things":22616,"sn":22617,"Ġconstituted":22618,"Ġ137":22619,"Ġderailed":22620,"ĠBonnie":22621,"Ġgraffiti":22622,"Ġearnest":22623,"Ġcompliant":22624,"blown":22625,"Ġalle":22626,"prise":22627,"Ġfocal":22628,"Ġgentlemen":22629,"ĠTalks":22630,"Ġpassports":22631,"Ġdeprived":22632,"Ġdude":22633,"ĠNath":22634,"Ġgoverned":22635,"Ġsac":22636,"Ġcastle":22637,"qv":22638,"Ġtolerated":22639,"ĠSci":22640,"close":22641,"ĠDynamics":22642,"Ġflashing":22643,"yk":22644,"ĠConsolid":22645,"Ġinherently":22646,"ĠForrest":22647,"Gene":22648,"Public":22649,"Ġloser":22650,"runners":22651,"Ġprudent":22652,"Ġpioneering":22653,"ĠHowe":22654,"ĠButter":22655,"ĠArabian":22656,"acha":22657,"ĠBBQ":22658,"ĠMineral":22659,"Ġdestiny":22660,"Ġretrieve":22661,"ĠBav":22662,"reth":22663,"oby":22664,"ĠGrid":22665,"Ġgrievances":22666,"ĠTips":22667,"Ġadamant":22668,"Ġdiets":22669,"Ġmilestones":22670,"Ġcollects":22671,"ĠLaboratories":22672,"ĠWC":22673,"Ġpostp":22674,"Ġdams":22675,"ĠOEM":22676,"Ġrumor":22677,"Ġlocking":22678,"Ġemission":22679,"Ġqueries":22680,"Jones":22681,"Ġlang":22682,"ĠAcqu":22683,"ĠMedium":22684,"ĠTreasurer":22685,"Sept":22686,"FB":22687,"Ġintegrating":22688,"Ġbolstered":22689,"Ġincorporating":22690,"encers":22691,"Ġirregularities":22692,"Ġnom":22693,"iod":22694,"ĠAi":22695,"Ġsor":22696,"anked":22697,"Ġrehears":22698,"fig":22699,"ĠBug":22700,"hoff":22701,"Ġtrooper":22702,"Ġgalaxy":22703,"amon":22704,"ĠAtlas":22705,"Ġsolicit":22706,"Ġsings":22707,"ĠInstructions":22708,"ĠMig":22709,"thinking":22710,"ĠCostco":22711,"Ġbreasts":22712,"Ġportraits":22713,"ĠCock":22714,"Ġsubscriptions":22715,"Ġpine":22716,"Ġhaunted":22717,"ĠMED":22718,"eer":22719,"ega":22720,"ĠZa":22721,"ENN":22722,"ĠWinners":22723,"aith":22724,"safe":22725,"Ġ143":22726,"ĠWeston":22727,"ĠLansing":22728,"ĠLaurel":22729,"ocrat":22730,"ograph":22731,"Ġmatchups":22732,"ĠFriend":22733,"Ġdigest":22734,"Ġdimensions":22735,"azing":22736,"Ġtipping":22737,"Ġenrich":22738,"gart":22739,"argo":22740,"Ġoutbreaks":22741,"Ġsalvage":22742,"ĠErica":22743,"Ġmodules":22744,"ĠPDF":22745,"ĠGoods":22746,"oots":22747,"2011":22748,"Ġinterrupt":22749,"Ġradi":22750,"ĠSimone":22751,"vell":22752,"ĠSV":22753,"extremely":22754,"Ġstadiums":22755,"ĠRox":22756,"Ġconflicting":22757,"Ġyouthful":22758,"ĠUM":22759,"series":22760,"Ġded":22761,"Ġfielding":22762,"Pre":22763,"itled":22764,"Ġstreamed":22765,"Ġapprentices":22766,"ĠAlec":22767,"ĠGap":22768,"ĠPrem":22769,"Ġleased":22770,"Ġdeepening":22771,"Ġbounds":22772,"Ġrethink":22773,"ĠVoting":22774,"ĠScha":22775,"blood":22776,"ĠReeves":22777,"Ġbells":22778,"Ġcollector":22779,"ĠCrimson":22780,"ĠWheat":22781,"207":22782,"ĠHB":22783,"ĠBCC":22784,"Ġsync":22785,"ĠAnders":22786,"Ġthanking":22787,"Ġlayoffs":22788,"Ġfoolish":22789,"Ġcustod":22790,"Ġelephants":22791,"Ġcorrelation":22792,"ĠHarding":22793,"ĠGPU":22794,"ĠBarnett":22795,"Ġol":22796,"Ġalarms":22797,"Ġfluctuations":22798,"shop":22799,"Ġcommentators":22800,"ĠAlpine":22801,"Ġmur":22802,"Ġbiotech":22803,"Ġunlocked":22804,"ouri":22805,"roe":22806,"ĠPayment":22807,"ĠPOL":22808,"ĠGuest":22809,"Ġphrases":22810,"ĠBuilt":22811,"erves":22812,"Ġnutritional":22813,"205":22814,"ourage":22815,"Related":22816,"Come":22817,"ĠSAT":22818,"Ġgatherings":22819,"Ġsquads":22820,"Ġorganising":22821,"Ġministerial":22822,"Ġkilomet":22823,"ĠJump":22824,"ĠStrength":22825,"ĠFerr":22826,"Ġillustrated":22827,"ĠOber":22828,"Ġextrad":22829,"Ġlimitation":22830,"idis":22831,"ĠMonths":22832,"ifts":22833,"Ġmotives":22834,"Ġmaternal":22835,"Ġbait":22836,"Ġadversity":22837,"Twitter":22838,"ĠUni":22839,"Ġgrappling":22840,"Ġbowls":22841,"ĠHib":22842,"ĠCopenhagen":22843,"Ġsergeant":22844,"Ġintro":22845,"Ġscrambled":22846,"ĠExc":22847,"Ġshowcases":22848,"Ġplotting":22849,"Ġsym":22850,"ĠNah":22851,"berries":22852,"itching":22853,"conn":22854,"istle":22855,"ĠBeginning":22856,"asley":22857,"ĠMeadow":22858,"ĠCra":22859,"Ġsupremacist":22860,"Ġsweats":22861,"production":22862,"innon":22863,"ovo":22864,"Ġscept":22865,"Ġdrowning":22866,"ĠEh":22867,"Ġdecorations":22868,"Ġsympathetic":22869,"raction":22870,"Ġ195":22871,"ripp":22872,"ĠNotice":22873,"charging":22874,"ĠDIY":22875,"ĠJin":22876,"Ġskinny":22877,"Ġmaj":22878,"Ġwhisk":22879,"Ġcongreg":22880,"RAL":22881,"Ġvolley":22882,"Ġestablishments":22883,"Ġcite":22884,"Miss":22885,"Int":22886,"iola":22887,"ĠBare":22888,"KING":22889,"ools":22890,"private":22891,"Ġflaw":22892,"Ġwires":22893,"Ġideals":22894,"oub":22895,"Ġ\"'":22896,"ĠCompet":22897,"ĠStatements":22898,"ĠHDR":22899,"rm":22900,"Ġbegging":22901,"uffs":22902,"Ġdispatch":22903,"Ġskipped":22904,"Ġlabs":22905,"hawks":22906,"Ġexpl":22907,"Ġpatriotic":22908,"ussions":22909,"Ġportrayal":22910,"ĠBudapest":22911,"ĠCod":22912,"Ġextingu":22913,"smart":22914,"Ġburdens":22915,"ĠDrama":22916,"Ġaltitude":22917,"Ġpursuant":22918,"à¥":22919,"atari":22920,"cot":22921,"Ġhotline":22922,"ooters":22923,"ĠRolls":22924,"Ġjeopardy":22925,"oids":22926,"Ġpageant":22927,"149":22928,"Ġdistinguish":22929,"support":22930,"ĠHighlands":22931,"ĠErnst":22932,"ĠHole":22933,"pering":22934,"ĠHasan":22935,"Ġrece":22936,"Ġirregular":22937,"Ġdisturbed":22938,"Ġcoupon":22939,"ĠElijah":22940,"oise":22941,"Ġfriendships":22942,"girlfriend":22943,"Ġrampage":22944,"arers":22945,"Ġdispens":22946,"assion":22947,"Ġtentative":22948,"ĠExploration":22949,"fashioned":22950,"ĠInstit":22951,"Ġthemed":22952,"ĠKurdistan":22953,"ĠCAL":22954,"ĠSweeney":22955,"Ġransom":22956,"Ġstamps":22957,"ĠSchwe":22958,"ĠLucia":22959,"124":22960,"omore":22961,"Ġmotivate":22962,"ĠWorcester":22963,"wald":22964,"CAR":22965,"iken":22966,"andro":22967,"ffic":22968,"ĠRehab":22969,"Ġgrou":22970,"Ġcontrollers":22971,"ĠHai":22972,"nz":22973,"Ġartillery":22974,"ĠMish":22975,"Ġregistry":22976,"Ġfrontman":22977,"ĠCharg":22978,"orneys":22979,"ĠPRESS":22980,"Ġperceptions":22981,"ĠMcGee":22982,"AU":22983,"mg":22984,"Off":22985,"ĠNGOs":22986,"chemical":22987,"Ġbrun":22988,"ĠHav":22989,"Ġlace":22990,"Ġ202":22991,"Ġdefer":22992,"Ġinjected":22993,"Ġgluten":22994,"ĠRin":22995,"ĠAvalanche":22996,"Ġcorpor":22997,"ĠPamela":22998,"Ġfills":22999,"ĠReve":23000,"ĠMonument":23001,"Ġnationalists":23002,"ĠIQ":23003,"adden":23004,"ĠLoop":23005,"Ġ134":23006,"Reg":23007,"click":23008,"bush":23009,"ĠKub":23010,"ipes":23011,"Ġtoggle":23012,"ĠRae":23013,"Ġburgl":23014,"Ġholistic":23015,"ronics":23016,"Ġprominence":23017,"jack":23018,"Ġfinan":23019,"icates":23020,"Ġvel":23021,"important":23022,"Thursday":23023,"chet":23024,"Ġrefunds":23025,"ĠElder":23026,"ĠOwner":23027,"Ġtakeaway":23028,"Pe":23029,"ĠToro":23030,"Tim":23031,"fix":23032,"before":23033,"ĠMotorola":23034,"Ġlev":23035,"Term":23036,"ĠSne":23037,"Ġmisinformation":23038,"ĠSinai":23039,"Ġnitrogen":23040,"Ġ203":23041,"Ġescaping":23042,"Ġjunction":23043,"ĠSantana":23044,"ĠYemeni":23045,"Ġwhipped":23046,"ĠStephenson":23047,"Ġattire":23048,"ĠBard":23049,"atically":23050,"ĠFaul":23051,"ĠSym":23052,"resh":23053,"ĠMG":23054,"Sub":23055,"ĠCarmen":23056,"Ġig":23057,"ĠSanford":23058,"ĠYa":23059,"cycle":23060,"Ġencryption":23061,"ĠScal":23062,"ĠChest":23063,"ĠMadonna":23064,"agin":23065,"ĠDHS":23066,"ĠCed":23067,"YR":23068,"Ġtruce":23069,"ĠBike":23070,"Ġfoes":23071,"ĠSlovakia":23072,"adal":23073,"Rain":23074,"OPE":23075,"Ġlockdown":23076,"Ġunilateral":23077,"Ġoverseen":23078,"Ġblames":23079,"Ġbarrage":23080,"aan":23081,"uds":23082,"ĠRust":23083,"ĠHC":23084,"cox":23085,"ĠAllied":23086,"ĠJosé":23087,"pected":23088,"Ġunp":23089,"Ġsomeday":23090,"Ġdeductions":23091,"icial":23092,"ĠPRO":23093,"ĠIntern":23094,"Ġhemp":23095,"Ġkilograms":23096,"Ġnets":23097,"ĠBACK":23098,"early":23099,"outed":23100,"Ġrelegated":23101,"Ġ1958":23102,"ĠMustang":23103,"Ġgamble":23104,"Ġprostitution":23105,"ĠPapa":23106,"Ġinexpensive":23107,"GHz":23108,"Ġjerseys":23109,"Ġmisery":23110,"VIS":23111,"ĠRAW":23112,"Ġthri":23113,"Ġaffiliation":23114,"small":23115,"Ġflashed":23116,"Ġcoastline":23117,"Ġgard":23118,"Ġsv":23119,"Ġwaits":23120,"itton":23121,"London":23122,"Ġaccus":23123,"ĠCharge":23124,"Ġincub":23125,"Ġwanna":23126,"ĠAwareness":23127,"abies":23128,"ĠUh":23129,"Ġpersuaded":23130,"ĠThames":23131,"Ġcurated":23132,"Ī":23133,"Ġbrutally":23134,"Ġrooftop":23135,"Ġoy":23136,"Ġ1900":23137,"bery":23138,"Ġuphill":23139,"Ġinteracting":23140,"Ġchilly":23141,"ERE":23142,"Ġcapsule":23143,"ĠSaul":23144,"ocker":23145,"Ġdeserving":23146,"ĠBowen":23147,"ĠReaders":23148,"ĠWriters":23149,"Ġartifacts":23150,"ĠRanger":23151,"reau":23152,"Ġimperson":23153,"Ġhears":23154,"ĠMaher":23155,"neg":23156,"Ġmantra":23157,"Ġmull":23158,"Ġelders":23159,"ĠAmtrak":23160,"Ġspouses":23161,"ĠHak":23162,"Ġopenness":23163,"Ġprevailed":23164,"Ġfortnight":23165,"Pal":23166,"ride":23167,"Ġillustrate":23168,"dominated":23169,"trust":23170,"ī":23171,"ĠFemale":23172,"ĠSlim":23173,"Ġdesc":23174,"ĠKathryn":23175,"Ġdeepen":23176,"TAIN":23177,"eredith":23178,"Ġchanted":23179,"ĠHector":23180,"bread":23181,"ĠIsa":23182,"Ġvolcanic":23183,"Ġah":23184,"owners":23185,"aquin":23186,"Ġmelting":23187,"Ġpreschool":23188,"ocus":23189,"ĠMast":23190,"ĠMyr":23191,"Ġsuppress":23192,"Ġversatility":23193,"ĠNEC":23194,"Ġhoax":23195,"Ġmutually":23196,"ĠNeb":23197,"ĠWheel":23198,"kit":23199,"abl":23200,"again":23201,"ĠSonny":23202,"rift":23203,"Ġsweater":23204,"Ġinund":23205,"ĠTaco":23206,"ĠBout":23207,"Ġnonprofits":23208,"Ġmodify":23209,"Ġprofessionalism":23210,"ĠGould":23211,"ĠGuerrero":23212,"Ġterribly":23213,"ĠBenz":23214,"Ġcountered":23215,"Ġbean":23216,"ĠPhelps":23217,"Ġprowess":23218,"bc":23219,"Ġfeast":23220,"Ġ5000":23221,"Ġrevisit":23222,"Ġchin":23223,"agent":23224,"Ġtones":23225,"Ġextraction":23226,"ĠPosts":23227,"oin":23228,"Ġattain":23229,"Ġgardening":23230,"earned":23231,"ĠOtto":23232,"player":23233,"Ġscams":23234,"ĠHonolulu":23235,"ĠAppro":23236,"ĠHIGH":23237,"Ġdwell":23238,"Islam":23239,"leaders":23240,"Ġlegisl":23241,"expl":23242,"ĠChoi":23243,"Ġfrenzy":23244,"Ġcommercially":23245,"Ġlbs":23246,"Ġgateway":23247,"ĠAndersen":23248,"emia":23249,"lez":23250,"Ġresidences":23251,"office":23252,"ĠHelsinki":23253,"olia":23254,"Ġwolf":23255,"Ġstyling":23256,"ĠJunction":23257,"ĠPeyton":23258,"udo":23259,"ĠDorothy":23260,"Ġfreshly":23261,"ĠJulio":23262,"ĠSunset":23263,"ĠMadden":23264,"Ġissu":23265,"Ġsounding":23266,"sports":23267,"Ġmassively":23268,"ĠRahman":23269,"Ġpresided":23270,"Instead":23271,"Ġ136":23272,"ĠHowell":23273,"beit":23274,"Ġprosperous":23275,"Ġwrongly":23276,"ĠRaqqa":23277,"ĠCes":23278,"Ġbuddy":23279,"Ġchatting":23280,"Ġfencing":23281,"Ġtant":23282,"ocated":23283,"ALK":23284,"Ġsnapping":23285,"euro":23286,"Ryan":23287,"ĠRecogn":23288,"ucked":23289,"Ġpurported":23290,"ĠCann":23291,"Ġintimidating":23292,"Ġrulers":23293,"ĠMarse":23294,"Art":23295,"ĠAadhaar":23296,"Ġvows":23297,"Ġhunter":23298,"ourmet":23299,"ĠVarious":23300,"2009":23301,"anie":23302,"Ġcompassionate":23303,"ĠParking":23304,"Ġmalaria":23305,"Ġamnesty":23306,"Ġworsened":23307,"ĠTitan":23308,"Ġcrossings":23309,"drug":23310,"Ġaddicted":23311,"Ġremorse":23312,"ĠDestiny":23313,"Dear":23314,"Ġhur":23315,"Ġimplicated":23316,"Ġplayful":23317,"Ġripe":23318,"Ġsizable":23319,"Ġcrab":23320,"Ġliqu":23321,"Ġdrib":23322,"Ġcontraction":23323,"cro":23324,"ĠGus":23325,"Ġdoomed":23326,"Ġmog":23327,"ĠMonitor":23328,"Count":23329,"Ġsadd":23330,"Ġwrestler":23331,"Ġrestraints":23332,"Ġraging":23333,"185":23334,"Ġtapes":23335,"Ġmitigation":23336,"ocratic":23337,"Ġvib":23338,"ĠSnowden":23339,"aldo":23340,"Ġweights":23341,"Ġ1959":23342,"ucc":23343,"ĠCoc":23344,"Log":23345,"ĠStev":23346,"Ġdealership":23347,"Ġtrademarks":23348,"iru":23349,"Ġbeneficiary":23350,"Ġlegislator":23351,"Ġdeadlines":23352,"Ġcosmetics":23353,"ĠTammy":23354,"ĠCombined":23355,"Ġeducator":23356,"athon":23357,"Ġcombo":23358,"fu":23359,"appropriate":23360,"nington":23361,"ĠLiberties":23362,"missions":23363,"opard":23364,"ĠMondays":23365,"Ġfetch":23366,"Ġhers":23367,"jon":23368,"ukes":23369,"zek":23370,"Ġvetting":23371,"yet":23372,"Ġfacilitating":23373,"ĠStras":23374,"character":23375,"ĠHeads":23376,"Ġclim":23377,"ĠAlbuquerque":23378,"Ġbind":23379,"Ġconcluding":23380,"ĠBasically":23381,"rail":23382,"ĠTCU":23383,"ĠDepression":23384,"Ġhem":23385,"ĠHue":23386,"Ġpand":23387,"Ġscoreboard":23388,"Av":23389,"Ġidol":23390,"compl":23391,"Ġredesign":23392,"ĠJarrett":23393,"Ġfavoured":23394,"ĠINS":23395,"Ġpropelled":23396,"Ġevasion":23397,"Ġwidened":23398,"Ġwastewater":23399,"nard":23400,"responsive":23401,"Ġdemographics":23402,"engine":23403,"ĠBrewer":23404,"ĠBaxter":23405,"ront":23406,"ĠColon":23407,"Ġpromoter":23408,"Ġgenres":23409,"ovsky":23410,"build":23411,"urate":23412,"ĠCohn":23413,"design":23414,"Ġturbulent":23415,"Ġcurtain":23416,"310":23417,"ĠLamp":23418,"ĠBonds":23419,"church":23420,"Ġdeterrent":23421,"Ġdictatorship":23422,"acement":23423,"haul":23424,"Ġspir":23425,"Ġconceived":23426,"Ġstern":23427,"sit":23428,"Ġsingular":23429,"ĠYog":23430,"Ġconditional":23431,"Ġide":23432,"lund":23433,"Ġautop":23434,"ĠBEST":23435,"ĠJed":23436,"Ġrationale":23437,"Ġalarmed":23438,"Ġshovel":23439,"ĠProb":23440,"ĠMao":23441,"ĠBurgess":23442,"Ġ1953":23443,"above":23444,"ĠManson":23445,"Ġdismal":23446,"ĠFrankie":23447,"Ġtempted":23448,"Ġunderdog":23449,"ribing":23450,"ENCY":23451,"ĠDele":23452,"Las":23453,"places":23454,"Ġnotoriously":23455,"ĠAkin":23456,"Ġglut":23457,"Ġseamlessly":23458,"Ġrecess":23459,"written":23460,"ĠTJ":23461,"occ":23462,"ĠTerritory":23463,"ĠAIR":23464,"ĠDiagn":23465,"Ġvacancies":23466,"Ġcultivation":23467,"ĠAless":23468,"Ġrenamed":23469,"ĠMahmoud":23470,"bright":23471,"Ġvisibly":23472,"Ġnas":23473,"erred":23474,"ĠCarn":23475,"Ġtriggers":23476,"Ġpunishing":23477,"Ġluc":23478,"ĠBett":23479,"Ġbeam":23480,"ĠCheng":23481,"aina":23482,"Ġdetermines":23483,"ĠGerry":23484,"Ġshocks":23485,"Ġstainless":23486,"Ġdefects":23487,"ĠCinem":23488,"Ġtorrent":23489,"Ġresurgence":23490,"Ġcoral":23491,"Ġblitz":23492,"ĠGel":23493,"Ġstemmed":23494,"gur":23495,"Ġlymph":23496,"zzo":23497,"Ġspearheaded":23498,"Ġlicences":23499,"';":23500,"Ġarbitrary":23501,"ĠUzbek":23502,"Ġthief":23503,"reaching":23504,"Ġcand":23505,"ĠEA":23506,"ĠParaly":23507,"ĠEmerson":23508,"ĠSergey":23509,"ĠScher":23510,"ĠWr":23511,"rowing":23512,"Ġ3000":23513,"Ġmighty":23514,"elight":23515,"mAh":23516,"Ġcelebr":23517,"ĠConclusion":23518,"ĠCathy":23519,"Ġpolished":23520,"uddled":23521,"ewski":23522,"Ġfucking":23523,"Ġinterfering":23524,"Ġlandscapes":23525,"Ġfearful":23526,"ĠDetention":23527,"%).":23528,"ĠTT":23529,"Ġbleak":23530,"Ġindebted":23531,"Ġcheat":23532,"Ġconsolation":23533,"ĠPace":23534,"raine":23535,"Ġhonorary":23536,"420":23537,"Ġtechnician":23538,"ĠComprehensive":23539,"Ġfences":23540,"Ġwearable":23541,"ĠMarilyn":23542,"stru":23543,"Ġdrained":23544,"ĠGibraltar":23545,"lag":23546,"Ġdisorderly":23547,"Ġproclaimed":23548,"Ġcapacities":23549,"Ġretains":23550,"ĠVid":23551,"oshi":23552,"ĠEid":23553,"Ġanalytical":23554,"ominium":23555,"ĠExaminer":23556,"ĠNAACP":23557,"ocol":23558,"rev":23559,"ĠRim":23560,"ĠWoody":23561,"ĠMcKenna":23562,"ĠLennon":23563,"ĠEmploy":23564,"Fort":23565,"psy":23566,"Ġsphere":23567,"oday":23568,"ĠChick":23569,"ĠCompared":23570,"ĠIranians":23571,"ĠAccountability":23572,"itchie":23573,"ĠDickinson":23574,"Ġflock":23575,"Ġeclips":23576,"Ġnat":23577,"anke":23578,"ĠNeighborhood":23579,"Ġ141":23580,"Ġscarce":23581,"Ġcreations":23582,"lists":23583,"Ġuseless":23584,"Ġcriticisms":23585,"Ġruler":23586,"ĠHick":23587,"arya":23588,"worker":23589,"alam":23590,"Angelo":23591,"otle":23592,"Ġnewsletters":23593,"Ġerected":23594,"Ġzip":23595,"ĠBirthday":23596,"Ġdogged":23597,"Ġdanced":23598,"Ġconfession":23599,"Ġvomiting":23600,"ickers":23601,"Ġfox":23602,"Ġdeduct":23603,"Ġstresses":23604,"poll":23605,"ĠRadar":23606,"Ġengagements":23607,"Ġexaminer":23608,"Ġopportun":23609,"Ġlongevity":23610,"Ġbanana":23611,"carbon":23612,"uo":23613,"ĠLT":23614,"Ġsynagogue":23615,"Ġblackmail":23616,"INK":23617,"Ġfle":23618,"ĠGutierrez":23619,"Ġracket":23620,"Ġevenings":23621,"Ġdietary":23622,"ĠKok":23623,"Ġfaulty":23624,"Ġabandoning":23625,"ĠFlow":23626,"quest":23627,"estead":23628,"Ġbir":23629,"Ġsuicidal":23630,"ĠGift":23631,"ĠMissing":23632,"ĠMazda":23633,"ĠRib":23634,"ĠJourney":23635,"Ġconcede":23636,"Ġbrushed":23637,"Tw":23638,"andowski":23639,"ĠYun":23640,"Bride":23641,"zai":23642,"awatts":23643,"Ġcha":23644,"Ġspans":23645,"SF":23646,"Ġshells":23647,"planned":23648,"ĠGeographic":23649,"ĠVent":23650,"Ġfav":23651,"Ġinterrogation":23652,"Ġvaries":23653,"ĠPlat":23654,"operative":23655,"avid":23656,"Ġgreatness":23657,"ĠStrait":23658,"ĠSelling":23659,"Ġlawful":23660,"Ġlyn":23661,"Ġfunnel":23662,"Ġpundits":23663,"ties":23664,"Ġpneumonia":23665,"Ġcommencement":23666,"Ġbrisk":23667,"fires":23668,"ĠHTML":23669,"ĠSevent":23670,"Ġhistor":23671,"Ġ147":23672,"olls":23673,"Ġpian":23674,"Little":23675,"Ġcommercials":23676,"Ġdeteriorated":23677,"Ġbasin":23678,"Ġprohibition":23679,"Ġrestrictive":23680,"Ġtom":23681,"ĠPulse":23682,"vale":23683,"Ġmim":23684,"ĠLyons":23685,"ĠTrinidad":23686,"data":23687,"195":23688,"ĠPain":23689,"vor":23690,"ĠDirectorate":23691,"Wow":23692,"essential":23693,"Ġemerges":23694,"ĠDoors":23695,"Ġunde":23696,"Ġarchives":23697,"ĠIX":23698,"ĠAman":23699,"oric":23700,"ĠOper":23701,"nothing":23702,"Ġ142":23703,"igr":23704,"rust":23705,"ĠBYU":23706,"ĠBom":23707,"Ġrift":23708,"ĠAbs":23709,"ĠJenn":23710,"Ġrookies":23711,"hoe":23712,"Ġunderage":23713,"eden":23714,"Ġroasted":23715,"Ġenrol":23716,"Ġerased":23717,"Ġfreeway":23718,"Sil":23719,"Ġplanner":23720,"Ġconfess":23721,"ĠDual":23722,"ĠHeadquarters":23723,"bottom":23724,"Ġstatistic":23725,"ĠPush":23726,"Ġanim":23727,"ITT":23728,"Ġexecutions":23729,"Hub":23730,"ĠStick":23731,"Ġobscure":23732,"oven":23733,"Ġcoats":23734,"unc":23735,"Morning":23736,"Ġnit":23737,"mie":23738,"Ġcurves":23739,"gew":23740,"ĠAnniversary":23741,"members":23742,"ĠAbsolutely":23743,"Ġapt":23744,"otional":23745,"ĠGin":23746,"izo":23747,"Ġpretending":23748,"arak":23749,"Ġorganise":23750,"Ġroyalties":23751,"ĠCamden":23752,"Ġsausage":23753,"Inst":23754,"Ġchalk":23755,"ĠSurf":23756,"ĠSunrise":23757,"Ġmoder":23758,"aido":23759,"loving":23760,"lus":23761,"Ġoblig":23762,"Ġmotions":23763,"Ġclarification":23764,"ĠOM":23765,"Ġbishop":23766,"Ġexhibitions":23767,"ĠRifle":23768,"ĠPhot":23769,"ĠHM":23770,"ATIONAL":23771,"Ġwid":23772,"Ġreside":23773,"ĠPV":23774,"OOK":23775,"ĠTue":23776,"Ġ1200":23777,"Ġ1957":23778,"Ġespionage":23779,"ĠAPPLIC":23780,"Ġblasts":23781,"fter":23782,"Ġimmensely":23783,"ĠLots":23784,"Ġinflammatory":23785,"anging":23786,"Ġtumultuous":23787,"identified":23788,"Ġstead":23789,"ĠAch":23790,"Ãī":23791,"Ġbub":23792,"hler":23793,"olution":23794,"Ġshun":23795,"Ġnull":23796,"Ġunused":23797,"ĠObs":23798,"Ġinsol":23799,"ĠAttack":23800,"ertain":23801,"Ġdefiant":23802,"Through":23803,"ĠArmour":23804,"Ġsimulation":23805,"UCK":23806,"Ġinfluenza":23807,"Ġonset":23808,"Ġbored":23809,"Ġsouls":23810,"Ġreferees":23811,"Ġcollaborations":23812,"ĠLer":23813,"Ġcreepy":23814,"Ġanaly":23815,"ĠEffect":23816,"orting":23817,"Card":23818,"Ġdice":23819,"Ġharvesting":23820,"235":23821,"sty":23822,"ĠMcCartney":23823,"Ġsalute":23824,"UMP":23825,"Ġherb":23826,"ĠAbuse":23827,"ĠRamadan":23828,"Ġsuck":23829,"trained":23830,"ĠPhysical":23831,"iren":23832,"anches":23833,"erie":23834,"Ġhangs":23835,"Ġcataly":23836,"Ġintuitive":23837,"assi":23838,"Ġtechn":23839,"Ġjugg":23840,"Ġgameplay":23841,"Ġapolog":23842,"Ġfifteen":23843,"Ġgalleries":23844,"Ġoutlines":23845,"patient":23846,"ĠPotential":23847,"Ġethnicity":23848,"Ġharbour":23849,"Ġoverthrow":23850,"ĠLung":23851,"Ġwarehouses":23852,"ĠMonitoring":23853,"Ġmentors":23854,"Ġsized":23855,"Ġenvisioned":23856,"Ġgin":23857,"DT":23858,"Ġpropel":23859,"ĠKul":23860,"ference":23861,"estic":23862,"ĠLego":23863,"Ġdinners":23864,"ĠMoe":23865,"designed":23866,"ĠSusp":23867,"ĠBrick":23868,"qua":23869,"IDS":23870,"ĠBam":23871,"athe":23872,"Ġslices":23873,"Ġbottled":23874,"thy":23875,"producing":23876,"ĠTerror":23877,"professional":23878,"ĠKis":23879,"erto":23880,"ĠVehicles":23881,"Ġbeforehand":23882,"Ġdetrimental":23883,"weights":23884,"Ġallowances":23885,"Williams":23886,"ĠSyrians":23887,"ĠSto":23888,"Ġcozy":23889,"reditation":23890,"ensen":23891,"ĠSard":23892,"Ġroy":23893,"ooting":23894,"ĠReserv":23895,"ominated":23896,"emate":23897,"ĠTot":23898,"ĠCarnegie":23899,"ĠThib":23900,"ĠMarshal":23901,"Ġ152":23902,"Ġmayors":23903,"inery":23904,"ĠFiona":23905,"ĠCadillac":23906,"ivated":23907,"Ġeagerly":23908,"ĠOffensive":23909,"Ġastronaut":23910,"ĠVital":23911,"Ġcane":23912,"Ġquitting":23913,"ĠLone":23914,"Ġcensorship":23915,"ĠWelch":23916,"ĠUd":23917,"Ġmarquee":23918,"ĠDip":23919,"Ġwhereby":23920,"Ġtiger":23921,"gem":23922,"Ġconserv":23923,"Ġpresumed":23924,"ĠEntry":23925,"ffer":23926,"ĠProceed":23927,"Ġbrawl":23928,"ĠJaime":23929,"Ġecho":23930,"Ġadvancements":23931,"Ġtransitional":23932,"erick":23933,"Ġbully":23934,"anan":23935,"Ġreinvent":23936,"ĠLetters":23937,"Ġbricks":23938,"ĠSmy":23939,"Ġtowering":23940,"gging":23941,"299":23942,"orian":23943,"dimensional":23944,"ĠForty":23945,"ĠSinn":23946,"ushi":23947,"ĠSurveillance":23948,"enabled":23949,"ĠMous":23950,"ĠVive":23951,"Marcus":23952,"Ġvom":23953,"Ġcreek":23954,"Ġlime":23955,"Ġseismic":23956,"ĠFork":23957,"Ġembroiled":23958,"marks":23959,"Ġherald":23960,"ĠSonia":23961,"â̦\"":23962,"wired":23963,"Ġobliged":23964,"ĠProjects":23965,"lde":23966,"ĠRiders":23967,"Ġovercoming":23968,"Mail":23969,"ĠLawn":23970,"ĠHawk":23971,"figure":23972,"ĠWritten":23973,"Ġens":23974,"Ġspacious":23975,"target":23976,"ĠRecep":23977,"ĠSAM":23978,"Ġentertained":23979,"Ġignited":23980,"ĠCENT":23981,"ogenic":23982,"Ġunatt":23983,"Ġexceeds":23984,"Ġ--------------------------------":23985,"Ġpillars":23986,"ĠBorders":23987,"ickey":23988,"Ġextinction":23989,"Ġviability":23990,"Ġtumors":23991,"ĠWilkinson":23992,"ĠKEY":23993,"Ġbins":23994,"ĠReported":23995,"Sm":23996,"ĠExclusive":23997,"ĠChilean":23998,"info":23999,"Ġwilderness":24000,"did":24001,"absolutely":24002,"pillar":24003,"Ġelites":24004,"ĠPreview":24005,"ixie":24006,"Mont":24007,"ribut":24008,"dream":24009,"Ġplanners":24010,"ĠSomerset":24011,"Ġenvis":24012,"ĠStall":24013,"Ġelevate":24014,"ographies":24015,"rama":24016,"Ha":24017,"Ġamidst":24018,"oho":24019,"Ġrejects":24020,"Jim":24021,"Ġmarginally":24022,"Ġusher":24023,"arez":24024,"ĠHawth":24025,"Ġsprink":24026,"ĠOffer":24027,"Ġanchored":24028,"ucking":24029,"ĠGarn":24030,"ĠConserv":24031,"Ġsocietal":24032,"Ġbrowsing":24033,"Ġbidder":24034,"burgh":24035,"ĠRunner":24036,"Ġtrendy":24037,"verts":24038,"imposed":24039,"ĠPatton":24040,"lements":24041,"Ġspicy":24042,"Ġswe":24043,"ĠStrike":24044,"Ġclam":24045,"ĠYankee":24046,"ĠKT":24047,"ĠGreenwood":24048,"ĠWays":24049,"Ġ2050":24050,"Ġattach":24051,"ĠShim":24052,"Ġmeltdown":24053,"Ġassemble":24054,"ĠUPDATE":24055,"Ġscout":24056,"Brown":24057,"ĠKobe":24058,"Ġpostpone":24059,"liness":24060,"allo":24061,"rief":24062,"ĠGerm":24063,"ĠFD":24064,"ĠReggie":24065,"ĠUnivers":24066,"ĠShepard":24067,"Ġcancell":24068,"ĠRomeo":24069,"ĠWarrior":24070,"ench":24071,"ifier":24072,"Ġprivileges":24073,"Ġsenses":24074,"Ġimpoverished":24075,"ĠPostal":24076,"encer":24077,"ĠConrad":24078,"Ġprinter":24079,"Ġinflicted":24080,"ĠGamble":24081,"ĠHeroes":24082,"132":24083,"Ġrevisions":24084,"Ġunsuccessfully":24085,"ĠHeisman":24086,"Ġstamped":24087,"inding":24088,"ĠLuna":24089,"Ġreinvest":24090,"ducers":24091,"ĠPassword":24092,"Leod":24093,"Ġcompounded":24094,"',\"":24095,"ogging":24096,"Ġprobing":24097,"ĠPBS":24098,"ĠMU":24099,"ĠWhenever":24100,"Ġsped":24101,"ĠCompetitive":24102,"isans":24103,"opa":24104,"Ġcleric":24105,"Ġvivid":24106,"à¸":24107,"126":24108,"Ġinconvenience":24109,"udi":24110,"Ġimmersive":24111,"Ġdiversion":24112,"Ġlogs":24113,"Ġspying":24114,"inct":24115,"Ġlitres":24116,"Ġmetallic":24117,"identally":24118,"FX":24119,"Ġloudly":24120,"Ġnursery":24121,"Ġcollectors":24122,"ĠKart":24123,"Ġescalate":24124,"Ġringing":24125,"Ġprocedural":24126,"Ġdisrupting":24127,"ĠEthiopian":24128,"ĠCFL":24129,"Ġillustrates":24130,"Ġperks":24131,"official":24132,"325":24133,"Ġmillennial":24134,"Ġbreadth":24135,"Ġmelted":24136,"Ġ850":24137,"ĠBake":24138,"donald":24139,"ĠGrac":24140,"Ġseeded":24141,"ĠDiscount":24142,"idates":24143,"Ġdrift":24144,"Ġcaptive":24145,"Ġseriousness":24146,"Ġrepercussions":24147,"Ġdisciplines":24148,"Ġthesis":24149,"Ġsleeve":24150,"ses":24151,"Monday":24152,"Ġthwart":24153,"ĠLic":24154,"Ġquadru":24155,"ĠPresbyterian":24156,"Ġreactors":24157,"ĠSuzanne":24158,"ewater":24159,"Ġlam":24160,"Ġbreastfeeding":24161,"Ġrats":24162,"ĠArtists":24163,"Ġdomestically":24164,"Ġdecom":24165,"ĠArms":24166,"basketball":24167,"Ġscrub":24168,"ĠTeddy":24169,"beh":24170,"ĠBetsy":24171,"ĠNursing":24172,"Ġdescriptions":24173,"127":24174,"gil":24175,"itional":24176,"Ġchampioned":24177,"ĠCalling":24178,"Ġrealization":24179,"ĠBuddy":24180,"hou":24181,"ĠDire":24182,"ĠHuff":24183,"Ġlipstick":24184,"Ray":24185,"Ġflare":24186,"belt":24187,"Ġbrightest":24188,"Ġmalfunction":24189,"ĠManor":24190,"Ġsaturated":24191,"rays":24192,"ĠDW":24193,"ixed":24194,"ĠSlovenia":24195,"seen":24196,"ĠCause":24197,"arios":24198,"ASE":24199,"Ġrend":24200,"ĠTBA":24201,"Ġlecturer":24202,"attering":24203,"Ġaffluent":24204,"CEO":24205,"Ġbreathtaking":24206,"ĠGiles":24207,"irth":24208,"ĠPhilips":24209,"Ġposture":24210,"ĠTSA":24211,"heit":24212,"Ġmenace":24213,"ricks":24214,"ĠAden":24215,"ĠReich":24216,"iggle":24217,"ĠShutterstock":24218,"Ġcourageous":24219,"edia":24220,"Staff":24221,"Ġdivert":24222,"ĠCir":24223,"Ġguessing":24224,"apers":24225,"ĠBritons":24226,"lé":24227,"Ġconvened":24228,"ĠSerbian":24229,"Ġricher":24230,"Ġcock":24231,"Ġdeposited":24232,"company":24233,"Ġdelic":24234,"sensitive":24235,"tank":24236,"ĠPatty":24237,"mia":24238,"onomous":24239,"cn":24240,"Ġclamp":24241,"ĠAcademic":24242,"Ġprosecuting":24243,"ĠTransparency":24244,"Ġdeflation":24245,"Ġdashboard":24246,"ĠDress":24247,"Ġlin":24248,"mu":24249,"ĠGoodell":24250,"Ġlav":24251,"ĠTwelve":24252,"Ġflavour":24253,"Ġfiercely":24254,"Ġbloom":24255,"ĠHaf":24256,"ĠGrad":24257,"LET":24258,"ĠSeeing":24259,"oxide":24260,"Ġmenus":24261,"char":24262,"adoes":24263,"combe":24264,"Street":24265,"ĠRidley":24266,"Ġdepicts":24267,"ĠPred":24268,"ÑĢ":24269,"British":24270,"Ġbumps":24271,"Ġlamp":24272,"ĠDesmond":24273,"ĠPB":24274,"Ġfrag":24275,"tin":24276,"ĠSharing":24277,"Ġdesperation":24278,"Ġcommuter":24279,"igrants":24280,"ĠShapiro":24281,"Ġkinda":24282,"Ġimpartial":24283,"ĠJewel":24284,"Ġcongratulations":24285,"Ġcompost":24286,"Ġadmiration":24287,"Ġpaycheck":24288,"ĠAnonymous":24289,"enger":24290,"Mer":24291,"ĠGospel":24292,"ĠEth":24293,"ĠMH":24294,"Ġfem":24295,"ĠTrial":24296,"Ġdepths":24297,"ĠApplied":24298,"Ġgrit":24299,"Ġerase":24300,"sid":24301,"comm":24302,"}":24303,"Ġretreated":24304,"Ġanalysed":24305,"ĠRegular":24306,"ĠPesh":24307,"ICAL":24308,"pei":24309,"ĠReilly":24310,"ĠTrib":24311,"Ġbooths":24312,"Ġdrank":24313,"Ġcoma":24314,"Ġharvested":24315,"ĠCHAR":24316,"Ġbutterfly":24317,"Ġsailed":24318,"ĠDrink":24319,"eping":24320,"ATCH":24321,"ĠLegends":24322,"Ġinsured":24323,"Ġwholes":24324,"ĠBis":24325,"ĠShea":24326,"ighter":24327,"Ġsnakes":24328,"ĠGunn":24329,"ĠPoss":24330,"Ġdispar":24331,"Ġbombshell":24332,"Ġscanning":24333,"340":24334,"choice":24335,"cool":24336,"\"âĢĶ":24337,"ĠTheo":24338,"rine":24339,"ĠJacques":24340,"Ġdisadvantaged":24341,"Ġparamount":24342,"igate":24343,"stat":24344,"anski":24345,"Ġoutsourcing":24346,"Ġpopulous":24347,"Ġbinge":24348,"ĠOrganic":24349,"urban":24350,"Ġyogurt":24351,"Ġretweet":24352,"osen":24353,"cially":24354,"215":24355,"Ġeditions":24356,"Ġburgeoning":24357,"efully":24358,"ĠThousand":24359,"Ġreplacements":24360,"ĠAmazing":24361,"rator":24362,"icy":24363,"Ġintensify":24364,"Sen":24365,"ĠQuincy":24366,"powers":24367,"ĠAur":24368,"ĠZion":24369,"stal":24370,"Ġpillar":24371,"ĠErit":24372,"ĠPerform":24373,"aston":24374,"Eric":24375,"Ġunh":24376,"IFF":24377,"950":24378,"ĠEngineer":24379,"ĠLands":24380,"Ġdubious":24381,"fy":24382,"ĠWI":24383,"ĠSv":24384,"ĠHendricks":24385,"ĠKod":24386,"Ġoutlining":24387,"ĠCorrespond":24388,"amus":24389,"worst":24390,"arter":24391,"coni":24392,"Ġhierarchy":24393,"ĠTHAT":24394,"Ġexce":24395,"Ġrailways":24396,"Ġmasked":24397,"lene":24398,"Ġoutset":24399,"Ġavalanche":24400,"Ġnicknamed":24401,"Ġ702":24402,"Lee":24403,"Ġ139":24404,"ĠSixth":24405,"365":24406,"nda":24407,"Ġaccountant":24408,"Ġobese":24409,"Ġgrape":24410,"Ġimpunity":24411,"ĠYorkers":24412,"Ġguardian":24413,"icity":24414,"Ġcentrist":24415,"Ġwaterways":24416,"ursed":24417,"Ġhopeless":24418,"header":24419,"Ġtack":24420,"Ġric":24421,"umn":24422,"Ġvalve":24423,"Ġtread":24424,"ĠCST":24425,"Ġhepatitis":24426,"ctor":24427,"ĠRED":24428,"Ġsolitary":24429,"NW":24430,"Ġceremonial":24431,"Ġfoe":24432,"Ġling":24433,"Jason":24434,"ĠLisbon":24435,"Ġ1955":24436,"ĠHeller":24437,"Ġkin":24438,"essen":24439,"Ġturbines":24440,"shi":24441,"Ġlodge":24442,"Ġveterinary":24443,"ĠBoll":24444,"ĠConfederation":24445,"ĠJournalists":24446,"Ġtug":24447,"ĠStarr":24448,"Ġpiles":24449,"Way":24450,"adel":24451,"orean":24452,"Ġoft":24453,"Ġshortcomings":24454,"ĠSheila":24455,"Ġbackbone":24456,"III":24457,"ĠDarwin":24458,"ĠTunis":24459,"Ġsuspicions":24460,"Ġdisagreements":24461,"Ġ247":24462,"illery":24463,"'\"":24464,"Ġsegregation":24465,"ohl":24466,"Ġinstincts":24467,"ĠPoo":24468,"nih":24469,"parency":24470,"uddy":24471,"esting":24472,"asses":24473,"ĠIntroduction":24474,"ĠSirius":24475,"Local":24476,"orous":24477,"Ġrehearsal":24478,"Ġdemol":24479,"Ġtraffickers":24480,"Ġupsetting":24481,"Ġheir":24482,"death":24483,"ĠMoments":24484,"Los":24485,"Ġatmospheric":24486,"aints":24487,"ĠDianne":24488,"Ġlikewise":24489,"ĠMing":24490,"auga":24491,"Ġfirsthand":24492,"Ġnarratives":24493,"ĠAstron":24494,"ĠExtreme":24495,"Ġhorns":24496,"ĠSana":24497,"Ġrecapt":24498,"ĠMist":24499,"ĠRandolph":24500,"connect":24501,"Ġindecent":24502,"Ġforty":24503,"Ġjihadists":24504,"azes":24505,"Ġdread":24506,"Ġgrapes":24507,"Ġremoves":24508,"Ġscreamed":24509,"ĠCrus":24510,"ikers":24511,"Ġsnapshot":24512,"ĠCalls":24513,"Cons":24514,"Ġlettuce":24515,"ĠPig":24516,"urable":24517,"jured":24518,"ILY":24519,"ĠJessie":24520,".).":24521,"Pay":24522,"Tra":24523,"----------------":24524,"ĠUnits":24525,"ĠPlayboy":24526,"Ġarthritis":24527,"Ġafforded":24528,"insk":24529,"ĠFake":24530,"ĠLies":24531,"ĠBaltic":24532,"oyal":24533,"ĠVest":24534,"Ġrusher":24535,"Ġincorporates":24536,"ĠMM":24537,"ĠDru":24538,"ĠWare":24539,"ĠSammy":24540,"ĠGob":24541,"ĠRuk":24542,"Ġ146":24543,"ĠCrowd":24544,"Ġduel":24545,"irts":24546,"Ġsourcing":24547,"hp":24548,"ĠJava":24549,"bred":24550,"ĠRefer":24551,"Ġuninsured":24552,"Ġslope":24553,"256":24554,"Ġregulating":24555,"Ġfundra":24556,"Ġinserted":24557,"ĠNickel":24558,"ĠConsumption":24559,"ĠRomo":24560,"Atlantic":24561,"Ġenclave":24562,"Ġpegged":24563,"Ġdirects":24564,"mbudsman":24565,"ĠDES":24566,"Ob":24567,"Ġlimbs":24568,"Ġbury":24569,"ILA":24570,"Ġstew":24571,"Ġbreeze":24572,"Ġabrupt":24573,"ĠGott":24574,"ĠClaude":24575,"Ġgenetically":24576,"Ġrigid":24577,"ĠDudley":24578,"ĠNer":24579,"registered":24580,"Ġentrenched":24581,"Ġextortion":24582,"ĠNurs":24583,"Ġcontingency":24584,"etter":24585,"Ġrejo":24586,"Ġprotagonist":24587,"Ġcounselling":24588,"ĠVit":24589,"aware":24590,"ĠMonsanto":24591,"GG":24592,"Ġincarcerated":24593,"Ġabduction":24594,"Ġreferencing":24595,"Germany":24596,"uates":24597,"reck":24598,"Ġtram":24599,"Ġchron":24600,"Ġmish":24601,"ĠVes":24602,"ĠTire":24603,"Ġvandal":24604,"ĠCrazy":24605,"ĠLifetime":24606,"ĠSpectrum":24607,"celer":24608,"Ġmotto":24609,"hang":24610,"Ġblade":24611,"gel":24612,"Ġbiography":24613,"Ġallegiance":24614,"hod":24615,"hap":24616,"ptic":24617,"acle":24618,"ĠBlade":24619,"ĠBoh":24620,"Ġ149":24621,"Ġchang":24622,"Ġcanned":24623,"Ġfacilitated":24624,"actor":24625,"iologist":24626,"Ġrebuilt":24627,"Ġawake":24628,"Ġmayoral":24629,"ĠEuros":24630,"Ġdangerously":24631,"MK":24632,"Ġreplica":24633,"Ġcoinc":24634,"blog":24635,"ĠEra":24636,"Ġrelinqu":24637,"quite":24638,"ondon":24639,"rosso":24640,"tun":24641,"Ġtouchscreen":24642,"Ġpops":24643,"ousing":24644,"efficient":24645,"Ġ148":24646,"Ġconced":24647,"although":24648,"Ġ1956":24649,"Ġmortar":24650,"ĠCave":24651,"ĠJung":24652,"urer":24653,"Ġillusion":24654,"ĠBerman":24655,"intend":24656,"Ġcoping":24657,"Dem":24658,"tion":24659,"estation":24660,"ĠSounds":24661,"Ġnavigating":24662,"Ġsperm":24663,"Ġreligions":24664,"Ġfol":24665,"Ġheroic":24666,"FD":24667,"Ġhesitant":24668,"asure":24669,"Ġredeem":24670,"Adam":24671,"Ġfireplace":24672,"vertis":24673,"ĠSung":24674,"290":24675,"iland":24676,"ĠUpdates":24677,"OTUS":24678,"ĠPTSD":24679,"Ġhelmets":24680,"\"?":24681,"Ġslashing":24682,"Ġscouts":24683,"Ġspelling":24684,"ĠInitial":24685,"draw":24686,"Ġchallengers":24687,"Ġsupremacists":24688,"Ġpilgrims":24689,"Ġasc":24690,"ĠFill":24691,"ĠPau":24692,"Ġjewel":24693,"ĠMalt":24694,"icip":24695,"Ġinhabitants":24696,"Ġmetre":24697,"ahar":24698,"Comp":24699,"atches":24700,"inv":24701,"Ġcyclist":24702,"ĠQC":24703,"Ġmanually":24704,"ĠAnchorage":24705,"Ġdiscarded":24706,"Ġconsolid":24707,"Ġnavig":24708,"ĠAnimals":24709,"ĠPole":24710,"esson":24711,"Ġ1954":24712,"Ġsorted":24713,"Ġmadness":24714,"ĠBrigade":24715,"ĠGenesis":24716,"Ġdismissing":24717,"ĠPanasonic":24718,"Ġdizz":24719,"ĠEducational":24720,"ĠKO":24721,"ĠPill":24722,"ĠGIF":24723,"Ġbol":24724,"Ġwards":24725,"Ġcontroversies":24726,"Chinese":24727,"Ġantics":24728,"Ġreliant":24729,"ĠMoff":24730,"Ġethanol":24731,"Ġtorch":24732,"rights":24733,"ĠHabit":24734,"arton":24735,"rera":24736,"ĠSasha":24737,"abella":24738,"Ġproliferation":24739,"Ġsincerely":24740,"communication":24741,"ĠNay":24742,"ĠChattanooga":24743,"ounces":24744,"ĠNXT":24745,"ĠEmir":24746,"Ġmanipulated":24747,"Ġharassing":24748,"wat":24749,"Ġbouts":24750,"Book":24751,"Ġhovering":24752,"ĠScan":24753,"ship":24754,"ĠAngola":24755,"ĠLC":24756,"Ġruins":24757,"Ġsexist":24758,"zar":24759,"Ġpledging":24760,"ober":24761,"Ġembold":24762,"Ġobjection":24763,"Ġboasting":24764,"MIN":24765,"Ġherbs":24766,"Ġgears":24767,"ĠIc":24768,"stre":24769,"him":24770,"Ġhomicides":24771,"cki":24772,"castle":24773,"counter":24774,"ĠCAS":24775,"ĠReasons":24776,"ĠDeclaration":24777,"Ġsimplify":24778,"Ġfared":24779,"Ġescort":24780,"Ġkidn":24781,"ĠHamm":24782,"Ġnailed":24783,"Ġaccommodations":24784,"Ġmodifications":24785,"rible":24786,"Ġwool":24787,"EDIT":24788,"2010":24789,"Ġauthentication":24790,"Ġgoat":24791,"hom":24792,"Ġfederally":24793,"ĠRath":24794,"Ġspiked":24795,"Ġmisrepresent":24796,"Ġavenue":24797,"Ġbroadcasts":24798,"ĠEstonia":24799,"ennes":24800,"ĠMare":24801,"ption":24802,"ĠKag":24803,"Ġcircumstance":24804,"orrow":24805,"isons":24806,"ĠCollabor":24807,"Ġstroll":24808,"ĠCPS":24809,"soft":24810,"iral":24811,"apo":24812,"usky":24813,"poke":24814,"Ġwoo":24815,"ĠElena":24816,"ĠLastly":24817,"Ġlinemen":24818,"Canadian":24819,"ĠAnyway":24820,"Ġsubstantive":24821,"ĠCurt":24822,"Ġard":24823,"ĠYosh":24824,"ĠBuchanan":24825,"Ġrevolving":24826,"Ġspecials":24827,"Ġshrine":24828,"Ġlumber":24829,"Ġorchestrated":24830,"kie":24831,"azy":24832,"Ġexpiration":24833,"ĠDaryl":24834,"ĠPatri":24835,"better":24836,"2020":24837,"ĠFav":24838,"ĠOP":24839,"OTT":24840,"Ġflush":24841,"ĠSikh":24842,"Ġecosystems":24843,"ĠBET":24844,"eared":24845,"audio":24846,"ĠFahrenheit":24847,"police":24848,"Ġincarceration":24849,"Ġerupt":24850,"ĠDamien":24851,"ĠHague":24852,"ulz":24853,"ĠAgents":24854,"ĠBanner":24855,"Ġconductor":24856,"ĠAjax":24857,"arson":24858,"Ġrests":24859,"Ġeurozone":24860,"Ġfelon":24861,"Ġcurator":24862,"morning":24863,"Ġevidenced":24864,"ĠNeh":24865,"Ġmattress":24866,"Ġtast":24867,"Ġfueling":24868,"ĠOccup":24869,"Ġbake":24870,"ĠZac":24871,"meaning":24872,"Ill":24873,"ĠHau":24874,"ĠLaden":24875,"Ġbald":24876,"Mary":24877,"oky":24878,"atri":24879,"Ġtracker":24880,"OTA":24881,"catching":24882,"ĠUnderground":24883,"ĠHuffPost":24884,"ĠAtkins":24885,"oglu":24886,"Ġauthorised":24887,"Ġroutines":24888,"ĠHof":24889,"veland":24890,"Ġlangu":24891,"Ġprot":24892,"ĠHyd":24893,"integ":24894,"Ġbravery":24895,"Ġviolin":24896,"Ġdelightful":24897,"Ġticks":24898,"iton":24899,"Ġreap":24900,"Ġoversized":24901,"ĠPitch":24902,"Ġprized":24903,"Ġfusion":24904,"fact":24905,"acting":24906,"Ġfullback":24907,"Ġpolite":24908,"Ġswear":24909,"Ġconfiscated":24910,"ĠStud":24911,"Ġfielded":24912,"rito":24913,"covered":24914,"financial":24915,"bill":24916,"HK":24917,"OTOS":24918,"loaded":24919,"Ġmarble":24920,"ĠDiplom":24921,".âĢĶ":24922,"Ġeats":24923,"Ġbackfield":24924,"Ġtimeframe":24925,"Ġvegetarian":24926,"Ġswaps":24927,"ĠMines":24928,"igor":24929,"ĠLenn":24930,"ĠDP":24931,"ordered":24932,"ĠShark":24933,"Ġquant":24934,"erence":24935,"Ġashes":24936,"ĠBuckley":24937,"ophobia":24938,"Ġwarranted":24939,"Rose":24940,"Ġunreasonable":24941,"ĠJav":24942,"Ġpalette":24943,"Ġjoints":24944,"Ġadvent":24945,"Ġnoteworthy":24946,"ĠNicol":24947,"ĠChristensen":24948,"Ġplummeted":24949,"ayers":24950,"Ġdefends":24951,"Ġcontended":24952,"ĠCongratulations":24953,"kish":24954,"ĠHannity":24955,"Ġgroundwater":24956,"ĠKramer":24957,"Ġerect":24958,"Ġappet":24959,"ĠKardash":24960,"Ġexacerbated":24961,"Ġexplanations":24962,"vious":24963,"eport":24964,"---":24965,"icism":24966,"ĠNatasha":24967,"ĠGeoffrey":24968,"estro":24969,"Article":24970,"Ġincidence":24971,"Ġprovoked":24972,"elf":24973,"Ġinsistence":24974,"ĠOUR":24975,"Ġfertilizer":24976,"Ġstickers":24977,"ĠGators":24978,"ĠLanding":24979,"ĠDON":24980,"sta":24981,"ĠRobbins":24982,"Ġpixels":24983,"ĠHoy":24984,"imated":24985,"ĠÃī":24986,"â":24987,"Ġsimpl":24988,"Other":24989,"245":24990,"Ġforcibly":24991,"'.\"":24992,"Ġsmashing":24993,"Ġmosquitoes":24994,"Ġpaints":24995,"Ġdebating":24996,"enty":24997,"ĠIB":24998,"leaf":24999,"ĠDah":25000,"Ġreferral":25001,"pired":25002,"Ġbrunch":25003,"gie":25004,"Ġvict":25005,"ribute":25006,"Ġbloggers":25007,"Ġgum":25008,"ĠAdmiral":25009,"France":25010,"ĠPK":25011,"ĠSaturn":25012,"Ġinflated":25013,"WAR":25014,"Ġscenic":25015,"usal":25016,"their":25017,"Ġcontends":25018,"Ġpathways":25019,"inis":25020,"Ġawarding":25021,"Ġmisled":25022,"Ġeternal":25023,"Ġexaminations":25024,"Ġpoker":25025,"Ġsafest":25026,"Ġchildcare":25027,"aday":25028,"Ġpreceding":25029,"ĠCollective":25030,"Ġrespectable":25031,"ographical":25032,"Ġoak":25033,"00000":25034,"ĠCorridor":25035,"oran":25036,"133":25037,"Ġmushrooms":25038,"gaard":25039,"ĠOmega":25040,"ĠNaturally":25041,"anim":25042,"Ġcaptains":25043,"Ġtang":25044,"Ġlobbyists":25045,"ĠSug":25046,"Ġsucc":25047,"249":25048,"ENG":25049,"134":25050,"Ġsolic":25051,"ĠAdded":25052,"ĠSuicide":25053,"ĠFULL":25054,"ĠStrauss":25055,"ĠDiesel":25056,"Ġtempting":25057,"acist":25058,"ĠDelivery":25059,"Ġquiz":25060,"ĠPARK":25061,"Ġcollisions":25062,"Ġrestrained":25063,"purpose":25064,"ĠChanges":25065,"Ġabsentee":25066,"Ġprobes":25067,"hib":25068,"Ġcul":25069,"Ġpetty":25070,"Ġnecess":25071,"Ġcues":25072,"OME":25073,"Ġinadvertently":25074,"urity":25075,"ĠStuff":25076,"FG":25077,"Ġwrestlers":25078,"Ġpaste":25079,"ĠRoku":25080,"Ġcardboard":25081,"aires":25082,"Ġvariables":25083,"ĠSaras":25084,"ĠFif":25085,"Ġinvests":25086,"ĠDiscover":25087,"ĠFix":25088,"Thomas":25089,"ĠLunch":25090,"lv":25091,"camera":25092,"Step":25093,"Ġresumes":25094,"ĠSacred":25095,"ĠShooting":25096,"Ġnoble":25097,"Ġslopes":25098,"Ġont":25099,"Ġtwists":25100,"Very":25101,"Ġbigotry":25102,"ĠTib":25103,"Ġmos":25104,"Ġwarrior":25105,"Ġbroadcasters":25106,"Ġubiquitous":25107,"ameda":25108,"Ġchess":25109,"Special":25110,"Ġconver":25111,"Ġdeleg":25112,"endant":25113,"Ġfoil":25114,"Ġlush":25115,"Ġtaxed":25116,"Mag":25117,"ahs":25118,"Ġtablespoons":25119,"scription":25120,"clamation":25121,"ĠCertain":25122,"ĠDiversity":25123,"Ġhairst":25124,"ĠBrewery":25125,"Ġshedding":25126,"Cla":25127,"Ġpenis":25128,"ĠMurder":25129,"Park":25130,"uner":25131,"iments":25132,"ĠOVER":25133,"hus":25134,"Ġtabloid":25135,"Chart":25136,"Ġvouchers":25137,"ĠCoord":25138,"Ġmethane":25139,"ĠFisheries":25140,"ĠKham":25141,"includes":25142,"ĠSuperman":25143,"ensed":25144,"isure":25145,"Amazon":25146,"Ġvacated":25147,"heet":25148,"Ġroast":25149,"Ġlegalize":25150,"ĠTut":25151,"Ġsignage":25152,"init":25153,"Ġthefts":25154,"202":25155,"Ġstatic":25156,"Ġchants":25157,"Bob":25158,"Ġdiscretionary":25159,"Ġendurance":25160,"Ġcollegiate":25161,"Ġcorridors":25162,"Ġslack":25163,"ĠLash":25164,"Az":25165,"Series":25166,"Ġnonpartisan":25167,"ĠMcGill":25168,"Ġuneven":25169,"ulsive":25170,"eu":25171,"Ġpil":25172,"Ġfisheries":25173,"Ġonslaught":25174,"fiction":25175,"holding":25176,"Ġcheated":25177,"Ġtraumat":25178,"lasting":25179,"Ġmultitude":25180,"ĠThr":25181,"ĠBreast":25182,"Ġ1600":25183,"ĠMatth":25184,"Ġdiminish":25185,"ĠFTC":25186,"Ġgram":25187,"ĠResident":25188,"Ġfading":25189,"Ġmarginalized":25190,"ĠLite":25191,"ĠCarlton":25192,"Ġerad":25193,"Welcome":25194,"ĠFaw":25195,"iddy":25196,"Ġparticip":25197,"Ġcz":25198,"Ġtexted":25199,"Ġsuites":25200,"ĠForever":25201,"Ġrendition":25202,"rait":25203,"ĠPrague":25204,"Ġsponsoring":25205,"Ġcompos":25206,"ĠBeacon":25207,"144":25208,"Ġpupil":25209,"Ġintricate":25210,"Ġathleticism":25211,"Ġoptimization":25212,"Ġloot":25213,"polit":25214,"ĠOtt":25215,"Whatever":25216,"uno":25217,"ĠConstable":25218,"esville":25219,"Ġlookout":25220,"ĠAircraft":25221,"Ġspo":25222,"Ġcorrobor":25223,"Ġhiatus":25224,"ĠKnowing":25225,"ĠHamp":25226,"Ġspe":25227,"Ġstoring":25228,"Ġshakes":25229,"uran":25230,"Ġsickness":25231,"Ġliber":25232,"ĠAdministrative":25233,"Ġpleasing":25234,"ĠEqual":25235,"ĠConversation":25236,"Ġalgae":25237,"Ġlobbyist":25238,"ĠHelena":25239,"ptions":25240,"Ġfaire":25241,"ĠGone":25242,"ĠWiggins":25243,"Robert":25244,"Ġlistens":25245,"ĠDaisy":25246,"Ġsticky":25247,"sale":25248,"ĠMarijuana":25249,"ĠSSD":25250,"ĠTool":25251,"once":25252,"ĠHarmon":25253,"mobile":25254,"Ġdetain":25255,"Money":25256,"Ġflawless":25257,"forced":25258,"Ġguru":25259,"Ġairspace":25260,"ĠArchie":25261,"ĠGender":25262,"ĠMeat":25263,"abilities":25264,"ĠBD":25265,"Open":25266,"Ġoutsider":25267,"issue":25268,"Ġlearns":25269,"natural":25270,"Ġvinegar":25271,"ĠSUB":25272,"ĠRecon":25273,"blers":25274,"Ġsniff":25275,"Ġsuppression":25276,"Ġsaf":25277,"urger":25278,"Ġbunker":25279,"asaki":25280,"ĠSpartan":25281,"ĠTok":25282,"Ġrav":25283,"Ġfoc":25284,"Sean":25285,"etric":25286,"Ġballpark":25287,"ĠHerb":25288,"ĠBM":25289,"ĠPublishing":25290,"Ġroadmap":25291,"pered":25292,"Ġpredator":25293,"ĠBlockchain":25294,"Ġvalidity":25295,"ĠGlou":25296,"ĠYamaha":25297,"Ġadop":25298,"Ġswamp":25299,"Ġcomplied":25300,"Ky":25301,"Greg":25302,"casts":25303,"john":25304,"ĠBosnia":25305,"Ġcinematic":25306,"ĠTavern":25307,"Ġfrustrations":25308,"eryl":25309,"Ġfairy":25310,"UNCH":25311,"ĠTus":25312,"Corp":25313,"ĠNug":25314,"closed":25315,"Ġexercised":25316,"urden":25317,"Ġdigitally":25318,"137":25319,"ĠVictims":25320,"Ġreluctance":25321,"ELL":25322,"ĠTribe":25323,"chall":25324,"Ġwhiskey":25325,"ogl":25326,"Ġmater":25327,"ĠBac":25328,"Ġapartheid":25329,"ĠMBA":25330,"mot":25331,"ĠIre":25332,"®,":25333,"ĠChic":25334,"Ġtimed":25335,"ĠDome":25336,"efer":25337,"Ġobserver":25338,"unky":25339,"ĠKant":25340,"Ġundrafted":25341,"Ġsimplicity":25342,"onds":25343,"Ġstoked":25344,"Ġ1949":25345,"Ġransomware":25346,"ĠPow":25347,"ĠAngelo":25348,"ĠAmbrose":25349,"adjusted":25350,"Guard":25351,"138":25352,"ĠKaplan":25353,"stri":25354,"Ġcries":25355,"NF":25356,"atro":25357,"Ġavocado":25358,"illian":25359,"Ġsculptures":25360,"Ġelevation":25361,"Ġinspires":25362,"Ġgenerals":25363,"arb":25364,"chell":25365,"ĠJournalism":25366,"ĠHybrid":25367,"ĠCaller":25368,"vec":25369,"Lu":25370,"Ġresemble":25371,"bys":25372,"erving":25373,"antz":25374,"Ġwiden":25375,"vised":25376,"Ev":25377,"Ġdiagn":25378,"ĠMakes":25379,"Ġcer":25380,"ĠPats":25381,"single":25382,"sche":25383,"struct":25384,"Ġdissolved":25385,"Ġtimeout":25386,"Ġenhancement":25387,"CF":25388,"Ġindust":25389,"ĠDed":25390,"ĠZo":25391,"CB":25392,"Ġpesticides":25393,"ĠRubin":25394,"George":25395,"opal":25396,"Ġmotel":25397,"critical":25398,"Ġcollapsing":25399,"ĠShal":25400,"tex":25401,"Ġcomplementary":25402,"Ġoust":25403,"ĠFlu":25404,"Ġexporting":25405,"Ġdifferential":25406,"north":25407,"ĠFG":25408,"Ġspoon":25409,"sha":25410,"Ġdismantle":25411,"elta":25412,"Ġjar":25413,"space":25414,"Smart":25415,"mere":25416,"Ð":25417,"ĠGillespie":25418,"Lo":25419,"ĠMead":25420,"capacity":25421,"ĠIssue":25422,"050":25423,"ĠVall":25424,"Ġdisgr":25425,"Ġmeme":25426,"Ġpard":25427,"Ġcompensated":25428,"ĠKet":25429,"major":25430,"ĠBren":25431,"Ġheed":25432,"131":25433,"Ġcm":25434,"Ġdazzling":25435,"ĠCheese":25436,"Ġmonumental":25437,"Ġyielding":25438,"Read":25439,"Ġgrinding":25440,"Ang":25441,"Ġdefiance":25442,"Ġintimidated":25443,"Ġ310":25444,"Ġoutsiders":25445,"houn":25446,"Ma":25447,"ĸ":25448,"ĠForget":25449,"ĠSans":25450,"Ġunfolding":25451,"ĠSap":25452,"ĠLak":25453,"Ġsectarian":25454,"ĠDaddy":25455,"oxy":25456,"hitting":25457,"Ġdetectors":25458,"ĠRee":25459,"Ġbroaden":25460,"Ġslaying":25461,"Ġsuspending":25462,"Ġinvestig":25463,"Tuesday":25464,"Ġantibiotic":25465,"ĠShiite":25466,"igi":25467,"ĠExternal":25468,"ĠPhotographer":25469,"Ġerratic":25470,"NJ":25471,"ĠDock":25472,"Ġoutweigh":25473,"rants":25474,"Ġlobster":25475,"Ġreactor":25476,"Ġunrealistic":25477,"ĠAudrey":25478,"ĠYor":25479,"Anyone":25480,"Ġfraught":25481,"е":25482,"ĠWester":25483,"fc":25484,"ĠDunham":25485,"ĠLug":25486,"allow":25487,"139":25488,"Ġparity":25489,"Ġhorizontal":25490,"ijuana":25491,"Ġcivilization":25492,"ĠGins":25493,"Ġsmokers":25494,"ĠDiabetes":25495,"Five":25496,"ĠDG":25497,"Ġunderscores":25498,"Ġelabor":25499,"ĠLub":25500,"ĠDevil":25501,"Ġ154":25502,"ĠGuarant":25503,"ĠPandora":25504,"Ġexcav":25505,"Ġaccuser":25506,"Ġrevolt":25507,"Ġinstructors":25508,"Ġire":25509,"ographic":25510,"ĠCLE":25511,"Ġexpedition":25512,"ould":25513,"Ġstriving":25514,"south":25515,"onis":25516,"ĠSwed":25517,"MY":25518,"ĠLevin":25519,"Ġcarp":25520,"ĠArchitects":25521,"Ġ{":25522,"Ġcovert":25523,"Ġcooled":25524,"ĠStaten":25525,"Ġspecializing":25526,"ĠHazel":25527,"Ġlen":25528,"ighty":25529,"Ġbrilliantly":25530,"Phil":25531,"Ġlament":25532,"Australia":25533,"203":25534,"Ġticking":25535,"Ġadjud":25536,"Ġroommate":25537,"ĠSheet":25538,"capital":25539,"167":25540,"Ġendeavor":25541,"Ġaver":25542,"Ġdues":25543,"ĠCycl":25544,"oried":25545,"Va":25546,"loading":25547,"Ġpremie":25548,"Ġregimes":25549,"ĠAly":25550,"Ġperennial":25551,"Ġconsoles":25552,"Ġironic":25553,"ichael":25554,"Ġvigorously":25555,"Ġtransmit":25556,"gary":25557,"eking":25558,"Ġjails":25559,"ĠEpiscopal":25560,"eddy":25561,"Ġidle":25562,"Ġsafeguards":25563,"Ġdwindling":25564,"NOR":25565,"torn":25566,"ĠEvangel":25567,"ĠPlastic":25568,"ĠTerm":25569,"Ġforwarded":25570,"avage":25571,"Ġrefrigerator":25572,"arna":25573,"ĠGuinness":25574,"ĠCandy":25575,"Ġbotched":25576,"seller":25577,"Ġpul":25578,"grades":25579,"oshenko":25580,"earth":25581,"nette":25582,"Ġtraps":25583,"Ġtarn":25584,"Ġmilitar":25585,"ĠAriel":25586,"Ġtubes":25587,"ulo":25588,"Water":25589,"edin":25590,"Ġmarvel":25591,"chenko":25592,"ĠElk":25593,"spect":25594,"coe":25595,"ĠIllustrated":25596,"Ġruthless":25597,"etermined":25598,"Ġdys":25599,"Ġbreaching":25600,"gee":25601,"Nick":25602,"Ġcruiser":25603,"Ġciv":25604,"Ġdou":25605,"Ġ;":25606,"deb":25607,"ĠAsheville":25608,"Ġbiting":25609,"Ġyo":25610,"Courtesy":25611,"Ġroses":25612,"ĠConsequently":25613,"Ġrevis":25614,"Ġconfinement":25615,"next":25616,"produced":25617,"Ġmoratorium":25618,"Ġkne":25619,"eties":25620,"Ġplethora":25621,"Ġceleb":25622,"FIN":25623,"Ġdepartures":25624,"ĠWynne":25625,"abilia":25626,"ĠCourts":25627,"olis":25628,"Ġcereal":25629,"Ġblended":25630,"333":25631,"ĠLun":25632,"Ġrepe":25633,"Ġmathematics":25634,"Ġpharmacies":25635,"Center":25636,"Ġwhist":25637,"pine":25638,"Ġperm":25639,"Ġcustomary":25640,"Ġhormones":25641,"Ġcleansing":25642,"Ġconfidentiality":25643,"Ġmascot":25644,"Ġslippery":25645,"Ġmediation":25646,"Ġpodcasts":25647,"Ġcoating":25648,"Ġconveyed":25649,"Ġgir":25650,"ĠNurse":25651,"DM":25652,"Ġlured":25653,"orted":25654,"Ġolig":25655,"ritz":25656,"ĠINF":25657,"Ġtirelessly":25658,"Ġdoorstep":25659,"Ġtomb":25660,"Ġwithholding":25661,"irling":25662,"Ġhog":25663,"Ġ156":25664,"Ġgau":25665,"chem":25666,"raid":25667,"Ġtrolls":25668,"Ġ182":25669,"ĠColumb":25670,"Ġtissues":25671,"Ġnaive":25672,"Ġlect":25673,"Central":25674,"Sign":25675,"168":25676,"Ġbribe":25677,"ĠDoll":25678,"ĠTripoli":25679,"Ġfunk":25680,"Ġplaza":25681,"Ġmechanic":25682,"mem":25683,"Ġmonkey":25684,"grid":25685,"Ġtainted":25686,"ĠNicaragua":25687,"pelling":25688,"ĠXia":25689,"ammers":25690,"Ġorth":25691,"ICAN":25692,"Ġrant":25693,"Ġdiary":25694,"ĠHarrington":25695,"Ġimply":25696,"Qaeda":25697,"Ġworsen":25698,"Ġcrafting":25699,"ĠShir":25700,"Ġcoincided":25701,"Ġsnatched":25702,"ileen":25703,"sei":25704,"Ġsurgeons":25705,"directed":25706,"Ġcompulsory":25707,"Ġnowadays":25708,"ĠLI":25709,"ĠRebel":25710,"Ġlions":25711,"ĠJR":25712,"scar":25713,"ĠRespons":25714,"Ġscroll":25715,"ĠErd":25716,"iety":25717,"\";":25718,"ĠBone":25719,"ĠRumble":25720,"ĠKS":25721,"ĠLaur":25722,"kell":25723,"ĠBirds":25724,"agic":25725,"Ġsimmer":25726,"Ġrunaway":25727,"Ġ162":25728,"auna":25729,"Ġdialog":25730,"Ġlouder":25731,"esque":25732,"RR":25733,"Ġbloss":25734,"Ġcaliber":25735,"nery":25736,"Ġhauled":25737,"Ġbacterial":25738,"ĠVanity":25739,"ĠPrograms":25740,"omew":25741,"ĠMama":25742,"Ġarr":25743,"Ġdod":25744,"ĠJarvis":25745,"ĠFIRST":25746,"Ġinjections":25747,"ĠBallard":25748,"Ġmedically":25749,"angan":25750,"ĠNewfoundland":25751,"Ġfracking":25752,"Ġbast":25753,"outing":25754,"Ġmercury":25755,"Ġwatershed":25756,"ĠAmateur":25757,"Ġ153":25758,"escal":25759,"Ġpainter":25760,"creat":25761,"Ġperceive":25762,"Ġgent":25763,"attacks":25764,"worked":25765,"Ġimporting":25766,"Indian":25767,"Ġconvict":25768,"clad":25769,"Ġbudding":25770,"Ġambient":25771,"ĠWitness":25772,"letes":25773,"Ġbuffet":25774,"Ġneedles":25775,"Ġcoding":25776,"Ġchoke":25777,"Ġcorrespondence":25778,"Ġgods":25779,"Ġdances":25780,"Ġsteadfast":25781,"cert":25782,"Ġroaming":25783,"between":25784,"weak":25785,"Jer":25786,"jandro":25787,"Ġdiscouraged":25788,"Ġfruition":25789,"ĠØ":25790,"ĠKop":25791,"ULL":25792,"efe":25793,"imble":25794,"obb":25795,"ulla":25796,"Ġaccredited":25797,"Ġlectures":25798,"bil":25799,"why":25800,"Ġgreeting":25801,"ĠBoost":25802,"Ġmailed":25803,"Ġtroop":25804,"Ġfrig":25805,"Ġrese":25806,"Ġscratched":25807,"Stars":25808,"ĠRailroad":25809,"ĠIdol":25810,"Ġsuccumbed":25811,"ĠWeeks":25812,"ffe":25813,"Ġjihadist":25814,"ITION":25815,"Ġthreads":25816,"ĠGenerally":25817,"Ġmedieval":25818,"Ġquotas":25819,"ĠFerry":25820,"rique":25821,"Ġprod":25822,"ĠEduc":25823,"rive":25824,"Ġensued":25825,"Cy":25826,"Ġinfring":25827,"Ġprank":25828,"Ġfrontline":25829,"Ġcompletes":25830,"upe":25831,"Ġmanageable":25832,"Ġpoems":25833,"otten":25834,"igne":25835,"threat":25836,"ĠDri":25837,"ĠLINK":25838,"Calif":25839,"ĠDos":25840,"ulent":25841,"Ġaids":25842,"Ġslips":25843,"umped":25844,"Ġstyled":25845,"Ġdisproportionately":25846,"ĠDish":25847,"ĠUncle":25848,"andel":25849,"Ġrecharge":25850,"rators":25851,"ĠSPR":25852,"Ġguarded":25853,"ĠGreatest":25854,"ĠSkills":25855,"ĠNob":25856,"ĠDesk":25857,"ĠCros":25858,"Ġwrit":25859,"Ġquery":25860,"ORTS":25861,"Ġbundled":25862,"Ġgib":25863,"Ġeth":25864,"iesta":25865,"Ġevade":25866,"dict":25867,"straight":25868,"Met":25869,"present":25870,"Ġdiff":25871,"Ġdere":25872,"ĠSpl":25873,"Ġrepr":25874,"ĠBeard":25875,"Ġvain":25876,"Ġappointing":25877,"ĠVisual":25878,"caps":25879,"gado":25880,"ĠRican":25881,"ĠPose":25882,"endor":25883,"Ġ222":25884,"ĠLear":25885,"Ġconstructing":25886,"Dan":25887,"ĠSpears":25888,"ĠTherapy":25889,"pta":25890,"Ġrehabilit":25891,"Ġrisked":25892,"ĠGuer":25893,"HF":25894,"Ġ301":25895,"Ġliking":25896,"Ġmodular":25897,"eree":25898,"ĠMAT":25899,"ĠHomeless":25900,"Ġstove":25901,"erd":25902,"hash":25903,"ĠAchilles":25904,"ĠBeta":25905,"Ġincl":25906,"Ġgunned":25907,"ĠCrab":25908,"ĠMara":25909,"Ġinvaded":25910,"ulatory":25911,"ATA":25912,"angering":25913,"onso":25914,"Ġallocate":25915,"Ġgarment":25916,"itudes":25917,"ĠHuang":25918,"Ġstaples":25919,"ĠAlban":25920,"Ġtrough":25921,"Ġupright":25922,"tie":25923,"Ġexploits":25924,"ĠVaughan":25925,"ĠDarrell":25926,"Ġassortment":25927,"ĠChill":25928,"Ġlearners":25929,"aqu":25930,"Ġexplode":25931,"ĠChong":25932,"bt":25933,"opl":25934,"Ġaltern":25935,"Ġ151":25936,"fur":25937,"ULT":25938,"HOU":25939,"ĠMemory":25940,"Ġboosts":25941,"ynes":25942,"priv":25943,"Ġtimeless":25944,"Ġcurtail":25945,"ĠCary":25946,"ĠHud":25947,"Ġexclus":25948,"Ġ275":25949,"Ġfry":25950,"ĠVera":25951,"Ġdefied":25952,"ĠDust":25953,"Ġenvision":25954,"ĠPhilipp":25955,"Ġenhancements":25956,"ĠLIB":25957,"ggy":25958,"ĠAzure":25959,"esis":25960,"Ġcharismatic":25961,"Ġcoincide":25962,"inged":25963,"ĠChoose":25964,"Ġsizeable":25965,"136":25966,"Ġpronounce":25967,"ĠPositive":25968,"Ġideally":25969,"Ġechoes":25970,"Ġcottage":25971,"Ġencrypted":25972,"Prime":25973,"Ġá":25974,"Ġflashes":25975,"Group":25976,"Ġ501":25977,"heat":25978,"atility":25979,"ĠTesting":25980,"pex":25981,"WT":25982,"154":25983,"annah":25984,"Ġcompromising":25985,"Ġinactive":25986,"Ġdisparity":25987,"Ġgruesome":25988,"ĠFeather":25989,"ĠMandal":25990,"Ġthereof":25991,"ĠProducer":25992,"Ġprofiling":25993,"Ġlogistical":25994,"Ġcornerstone":25995,"ĠClaudia":25996,"Congress":25997,"ĠDill":25998,"ophone":25999,"Ġcameo":26000,"ĠCutler":26001,"Ġcraz":26002,"throw":26003,"ĠKasich":26004,"Ġexploiting":26005,"ĠSeas":26006,"agles":26007,"ĠGeological":26008,"ĠStub":26009,"ĠUps":26010,"MER":26011,"Ġmem":26012,"itution":26013,"Ġunderstandably":26014,"Ġcontractual":26015,"warming":26016,"qi":26017,"Sky":26018,"whelming":26019,"Ġcurse":26020,"ĠAren":26021,"Ġ265":26022,"ĠGree":26023,"Ġpresiding":26024,"Works":26025,"stones":26026,"Ġappalling":26027,"plex":26028,"dj":26029,"aunting":26030,"Ġimag":26031,"Ġsexism":26032,"ĠVert":26033,"ĠRag":26034,"ĠBliss":26035,"posium":26036,"div":26037,"Ġexperimenting":26038,"Ass":26039,"Lago":26040,"worthiness":26041,"ĠBerk":26042,"ĠDisneyland":26043,"Ġexaggerated":26044,"iliation":26045,"ĠFP":26046,"Ġprincipals":26047,"Miami":26048,"ropri":26049,"PLE":26050,"iona":26051,"ĠPokemon":26052,"apse":26053,"Ġbubbles":26054,"INC":26055,"ĠCaps":26056,"ĠBrowne":26057,"sing":26058,"Ġcafé":26059,"Ġceilings":26060,"frame":26061,"ĠIrwin":26062,"ATS":26063,"dated":26064,"Ġprotester":26065,"Ġtaps":26066,"ĠOslo":26067,"Ù":26068,"Ġconcentrations":26069,"Ġdistributions":26070,"Ġglucose":26071,"ĠRudolph":26072,"Ġtowels":26073,"Ġâĸº":26074,"Ġneighbourhoods":26075,"Ġinduction":26076,"Ġglaring":26077,"Ġannexation":26078,"Ġunsustainable":26079,"ĠTend":26080,"Ġthumbs":26081,"iegel":26082,"cript":26083,"gor":26084,"closure":26085,"thought":26086,"Ġpaddle":26087,"Ġemulate":26088,"Ġdiameter":26089,"Ġtailor":26090,"ĠCorpor":26091,"icable":26092,"ĠPrin":26093,"Ġadminister":26094,"ĠJudd":26095,"ĠColleg":26096,"aund":26097,"ĠPond":26098,"ĠNOTE":26099,"Ġcombating":26100,"Ġinvention":26101,"ĠOculus":26102,"ĠRepl":26103,"iscal":26104,"Ġtrilogy":26105,"anian":26106,"ATT":26107,"ĠCoke":26108,"DL":26109,"ĠLup":26110,"living":26111,"Ġadvertise":26112,"ĠConnie":26113,"amping":26114,"Ġsung":26115,"ORY":26116,"ĠTet":26117,"Ġsplits":26118,"Ġreconnect":26119,"Ġlou":26120,"mut":26121,"ulator":26122,"Ġstrap":26123,"Ġswallow":26124,"rote":26125,"Ġexec":26126,"ffen":26127,"ĠCombine":26128,"ĠTreat":26129,"Ġsorrow":26130,"ĠNotably":26131,"ĠSever":26132,"rette":26133,"Ġwherein":26134,"Ġtransitioning":26135,"Ġtrout":26136,"Ġcockpit":26137,"Ġcrawl":26138,"Ġferv":26139,"Ġliquids":26140,"Ġtsp":26141,"atell":26142,"Ġmeasles":26143,"Ġjug":26144,"Ac":26145,"ĠKD":26146,"ĠMoose":26147,"Ġvans":26148,"chain":26149,"ĠPapua":26150,"plet":26151,"Wednesday":26152,"lynn":26153,"chery":26154,"budget":26155,"Tony":26156,"ĠBacon":26157,"Ġstirred":26158,"ĠSpecialist":26159,"Ġcounterfeit":26160,"а":26161,"Ġdifferentiate":26162,"Ġmuscular":26163,"ĠTheodore":26164,"Ġlooms":26165,"ĠXX":26166,"ottage":26167,"Ġbenches":26168,"ĠMunicip":26169,"Po":26170,"ĠHeck":26171,"Ġscars":26172,"ĠNim":26173,"ÙĬ":26174,"ĠIngredients":26175,"Ġecological":26176,"ĠAWS":26177,"Ġdispose":26178,"Ġmattered":26179,"Ġ720":26180,"Ġpatriotism":26181,"ĠGrind":26182,"Ġcurved":26183,"opia":26184,"ĠLiqu":26185,"Ġevangelical":26186,"tto":26187,"ĠMaterial":26188,"ĠShowtime":26189,"ĠBS":26190,"Ġcheckpoints":26191,"Ġcrippling":26192,"ĠBalance":26193,"stress":26194,"bearing":26195,"Ġ216":26196,"ĠGuards":26197,"Ġlinebackers":26198,"Ġoffending":26199,"Ġsands":26200,"umbnail":26201,"atorial":26202,"Ġliberties":26203,"ĠGW":26204,"ĠPulitzer":26205,"ĠAlvin":26206,"ĠFAC":26207,"ĠStrategies":26208,"Ġreiter":26209,"ĠRestaur":26210,"ĠLithuania":26211,"ĠSwanson":26212,"terror":26213,"ĠMaurit":26214,"Ġparadise":26215,"zzle":26216,"owment":26217,"ĠWP":26218,"Ġsodium":26219,"Ġfuturistic":26220,"Ġdots":26221,"Anthony":26222,"Though":26223,"Ġstripes":26224,"Ġorig":26225,"ultz":26226,"Ġ340":26227,"KK":26228,"umer":26229,"ivery":26230,"Ġplacebo":26231,"Ġdemocrat":26232,"Ġsubmerged":26233,"ĠHidden":26234,"pieces":26235,"Ġasteroid":26236,"ĠGraphic":26237,"Ġadvert":26238,"sil":26239,"Ġdreaming":26240,"Ġnationality":26241,"Ġfostering":26242,"daughter":26243,"ĠSavings":26244,"Ġmischief":26245,"ĠClair":26246,"ĠBundy":26247,"Ġblatant":26248,"Ġtabs":26249,"qa":26250,"severe":26251,"attered":26252,"Ġgreed":26253,"Ġresembles":26254,"Ġnominal":26255,"Ġineligible":26256,"wealth":26257,"fax":26258,"payers":26259,"Ġdisplacement":26260,"itute":26261,"Ġunpleasant":26262,"ĠPom":26263,"lif":26264,"edo":26265,"ĠNP":26266,"Inter":26267,"Ġcohort":26268,"ĠStacy":26269,"ĠDai":26270,"Ġhistories":26271,"alin":26272,"273":26273,"Ġdram":26274,"ĠKand":26275,"Ġexpectancy":26276,"ansson":26277,"Ġlimbo":26278,"ĠPolar":26279,"Ġdivine":26280,"oused":26281,"Ġshel":26282,"ĠProblem":26283,"achment":26284,"Ġâĸł":26285,"shoot":26286,"antam":26287,"ĠHerz":26288,"Ġ157":26289,"Ġpreventive":26290,"keye":26291,"Sing":26292,"Ġcharacteristic":26293,"Ġcasually":26294,"ĠTaiwanese":26295,"md":26296,"ĠHubbard":26297,"imon":26298,"Ġsect":26299,"148":26300,"Ġmartyr":26301,"stud":26302,"Ġcongrat":26303,"ĠSWAT":26304,"ĠTheory":26305,"INAL":26306,"opping":26307,"ply":26308,"ĠKindle":26309,"uu":26310,"ĠLith":26311,"kaya":26312,"ĠActivity":26313,"uously":26314,"ĠJeb":26315,"tell":26316,"ĠSpin":26317,"ĠExplorer":26318,"Ġfolded":26319,"ĠCanterbury":26320,"ĠStur":26321,"Ġminiature":26322,"Ġmultif":26323,"ĠPressure":26324,"angling":26325,"ĠOverse":26326,"Ġresides":26327,"Ġimpressions":26328,"Ġauthored":26329,"265":26330,"Ġallergies":26331,"143":26332,"ĠJi":26333,"Ġsticker":26334,"ĠAccord":26335,"Ġcaste":26336,"Ġseparates":26337,"ĠFein":26338,"Daily":26339,"179":26340,"ĠScores":26341,"ĠAuction":26342,"hea":26343,"Ġdisclosing":26344,"ĠTacoma":26345,"Ġverse":26346,"ĠBeg":26347,"Ġfabrics":26348,"aez":26349,"Ġattachment":26350,"isy":26351,"Christ":26352,"Ġaddictive":26353,"Ġvir":26354,"Week":26355,"ĠPlum":26356,"croft":26357,"itivity":26358,"ĠExhibition":26359,"Ġbruised":26360,"Ġmimic":26361,"rers":26362,"Ġanal":26363,"Ġunintended":26364,"Ġpall":26365,"atts":26366,"ĠWarn":26367,"Ġslows":26368,"WH":26369,"Ġembro":26370,"nec":26371,"Ġ168":26372,"285":26373,"ologic":26374,"Ġhob":26375,"ĠPeel":26376,"Mill":26377,"eps":26378,"Ġrobbers":26379,"ĠDahl":26380,"semble":26381,"omics":26382,"toe":26383,"ĠLoch":26384,"Ġreproduction":26385,"ĠCullen":26386,"Ġimplants":26387,"Ġwow":26388,"ĠSTATE":26389,"vt":26390,"Ġdepleted":26391,"Ġbreweries":26392,"Ġhateful":26393,"Ġgast":26394,"Ġhollow":26395,"Ġradically":26396,"ographed":26397,"ĠFog":26398,"onian":26399,"ĠSequ":26400,"Ġdisrespectful":26401,"Dis":26402,"ĠExper":26403,"pron":26404,"ĠAmelia":26405,"ĠSage":26406,"bath":26407,"Ġtransformative":26408,"Ġtremendously":26409,"Ġpillow":26410,"ĠNormal":26411,"Cont":26412,"ĠMedic":26413,"educated":26414,"Ġredesigned":26415,"Ġkneeling":26416,"Ġinh":26417,"Ġroofs":26418,"Ġhandmade":26419,"Ġprotracted":26420,"ĠIsn":26421,"ĠCapacity":26422,"Ġsquash":26423,"ĠVega":26424,"Ġfats":26425,"ĠCertified":26426,"ointed":26427,"Ġpricey":26428,"ĠBasil":26429,"Ġfreezer":26430,"Ġscent":26431,"Ġpizz":26432,"ĠArd":26433,"Ġdistractions":26434,"Ġviolently":26435,"ĠHess":26436,"Ġfunc":26437,"Ġundert":26438,"Ġrejuven":26439,"Ġdisbelief":26440,"cluded":26441,"named":26442,"ĠFailure":26443,"kus":26444,"Ġhostages":26445,"ĠSahara":26446,"Ġ1944":26447,"Leary":26448,"ĠPrel":26449,"enza":26450,"ĠAlly":26451,"ĠKak":26452,"Ġcounselors":26453,"ĠGale":26454,"ĠHok":26455,"ĠSold":26456,"Ġhacker":26457,"Ġhun":26458,"Ġbung":26459,"Ġdeclares":26460,"Ġinfringement":26461,"OOD":26462,"Ġdoub":26463,"jam":26464,"Ġallergy":26465,"ĠShipping":26466,"Ġmedic":26467,"Ġaccommod":26468,"Ġdocumenting":26469,"Ġcompanions":26470,"Ġmodelling":26471,"Ġcarriage":26472,"ĠCherokee":26473,"Ġtresp":26474,"Ġtaxable":26475,"ĠActivities":26476,"ĠCrane":26477,"bots":26478,"ĠRusso":26479,"Ġstocked":26480,"ervation":26481,"Ġcoffin":26482,"aign":26483,"guards":26484,"Ġonwards":26485,"Ġfrank":26486,".*":26487,"unic":26488,"Ġcens":26489,"enic":26490,"ruit":26491,"rained":26492,"Ġadapting":26493,"aments":26494,"Ġstagnant":26495,"azaar":26496,"ĠHarlem":26497,"Ġ158":26498,"ysis":26499,"Ġbraking":26500,"Ġdipping":26501,"Ġclan":26502,"ĠShu":26503,"Ġprops":26504,"qualified":26505,"Ġmistakenly":26506,"ĠStalin":26507,"Ġaddicts":26508,"ĠCALL":26509,"ropolis":26510,"aten":26511,"pec":26512,"ĠDro":26513,"ĠFellowship":26514,"ĠSupporting":26515,"loc":26516,"uben":26517,"499":26518,"Bro":26519,"Ġpots":26520,"Ġchunks":26521,"wr":26522,"ĠColonial":26523,"ĠArchitecture":26524,"Ġconstrained":26525,"Ġenvelop":26526,"ĠIronically":26527,"aban":26528,"Ġapparatus":26529,"Ġcue":26530,"Ġborne":26531,"ĠRoz":26532,"ilton":26533,"Ġtheoretical":26534,"ĠWatching":26535,"Ġfuck":26536,"ĠSilk":26537,"ĠSTE":26538,"bler":26539,"ĠPOST":26540,"ĠUpton":26541,"Ġsummons":26542,"ĠCum":26543,"ĠKL":26544,"Ġrelaxation":26545,"ĠDuff":26546,"Ġincumb":26547,"ĠRedd":26548,"Ġstature":26549,"Ġcanv":26550,"added":26551,"Ġremedies":26552,"ĠISO":26553,"ĠDecker":26554,"Ġafloat":26555,"Ġstartling":26556,"ĠBethlehem":26557,"Ġrealizes":26558,"find":26559,"ĠAra":26560,"Ġphased":26561,"arov":26562,"Ġhalting":26563,"ĠWindow":26564,"Ġdentist":26565,"Ġtumble":26566,"Ġvalidation":26567,"Ġcarve":26568,"ĠIPS":26569,"Ġirrit":26570,"ĠEssential":26571,"Ġfluids":26572,"rons":26573,"Ġimplant":26574,"Ġnuisance":26575,"ĠShelley":26576,"ĠGemini":26577,"Ġpharmac":26578,"iction":26579,"Ġtaped":26580,"ĠGovernments":26581,"ruly":26582,"Ġscant":26583,"Ġprominently":26584,"Ġreim":26585,"unning":26586,"arted":26587,"ĠMatters":26588,"Ġ1918":26589,"ĠPros":26590,"atel":26591,"ĠBattalion":26592,"onduct":26593,"talk":26594,"ĠTinder":26595,"ĠInstant":26596,"ĠKern":26597,"Ġbuckets":26598,"ĠGroups":26599,"Ġmetaphor":26600,"cloud":26601,"ĠString":26602,"Ohio":26603,"Ġcaffeine":26604,"Old":26605,"Ġdefinite":26606,"ĠNikola":26607,"ĠLords":26608,"icol":26609,")?":26610,"Ġenjoyment":26611,"Ġfamine":26612,"Ġdefinitions":26613,"ĠJem":26614,"Check":26615,"Ġaiding":26616,"ĠMé":26617,"Ġrenewables":26618,"Ġsightings":26619,"footed":26620,"Box":26621,"Ġgoats":26622,"Ġshack":26623,"AX":26624,"ĠMonk":26625,"ĠGraduate":26626,"Ġmeats":26627,"handle":26628,"147":26629,"rys":26630,"Ġunsub":26631,"Pont":26632,"uble":26633,"440":26634,"Ġeyel":26635,"thro":26636,"Ġcreep":26637,"^^^^":26638,"Ġpopcorn":26639,"Ġcompression":26640,"sal":26641,"ouf":26642,"Ġrepairing":26643,"Think":26644,"Ġdoubtful":26645,"ĠLooks":26646,"Ġtaller":26647,"Ġsul":26648,"sf":26649,"give":26650,"ĠGau":26651,"Ġrevered":26652,"EMBER":26653,"Ġsloppy":26654,"ersen":26655,"Ġvitamins":26656,"ĠImprovement":26657,"Ġprogresses":26658,"Ġdiploma":26659,"semb":26660,"ustain":26661,"Ġchant":26662,"Ġbumped":26663,"Ġsabotage":26664,"nant":26665,"Ġrabbit":26666,"Ġdividing":26667,"ĠDefender":26668,"Ġlik":26669,"Ġirrespective":26670,"cade":26671,"ĠSter":26672,"touch":26673,"EMA":26674,"Ġparted":26675,"ĠBAR":26676,"hung":26677,"Ġannoyed":26678,"Ġhinder":26679,"Ġexamines":26680,"oan":26681,"ĠBoe":26682,"Ġaggreg":26683,"ĠChu":26684,"ĠUCS":26685,"IGHTS":26686,"pez":26687,"ĠUNESCO":26688,"Ġwindshield":26689,"Martin":26690,"Ġwithhold":26691,"does":26692,"Ġbruising":26693,"Ġdeterior":26694,"bourg":26695,"ĠTowers":26696,"JD":26697,"England":26698,"Ġequivalents":26699,"Ġrazor":26700,"Ġreassuring":26701,"Ġident":26702,"Ġ208":26703,"reath":26704,"ceans":26705,"Ġpatrolling":26706,"eve":26707,"pots":26708,"itative":26709,"Ġsided":26710,"Ġsofa":26711,"Ġunborn":26712,"Ġaug":26713,"Ġperpetual":26714,"effect":26715,"represented":26716,"Ġrails":26717,"ĠSummers":26718,"ĠMOR":26719,"ĠSlow":26720,"ĠExpert":26721,"Ġshameful":26722,"Ġaudits":26723,"Sl":26724,"ĠBurr":26725,"adow":26726,"ĠWAY":26727,"anic":26728,"ĠIslamists":26729,"ĠStranger":26730,"pse":26731,"amaz":26732,"ĠPeggy":26733,"ĠSeventh":26734,"Ġscreenplay":26735,"ĠGriff":26736,"Ireland":26737,"142":26738,"Ġneural":26739,"ĠFernand":26740,"ainment":26741,"ĠMigration":26742,"ureen":26743,"ĠSCH":26744,"Sullivan":26745,"ĠWag":26746,"ĠREG":26747,"Ġ420":26748,"inky":26749,"ĠNewspaper":26750,"School":26751,"Ok":26752,"ĠKrishna":26753,"Ġ480":26754,"erald":26755,"Ġskipping":26756,"Ġharrowing":26757,"158":26758,"rogen":26759,"Ġbetrayal":26760,"Ġculmination":26761,"ĠCirc":26762,"Ġ211":26763,"stro":26764,"ĠTrace":26765,"Ġheaviest":26766,"td":26767,"ĠHenri":26768,"epend":26769,"RB":26770,"arella":26771,"umbai":26772,"Ġcrem":26773,"ĠDistribut":26774,"ruff":26775,"Ġscreams":26776,"Ġscathing":26777,"girls":26778,"Ġtiles":26779,"ĠEvil":26780,"usp":26781,"Ġknowledgeable":26782,"Ġrestitution":26783,"ĠWiFi":26784,"Ġitiner":26785,"exper":26786,"oris":26787,"ĠPokémon":26788,"iane":26789,"produ":26790,"ĠAchievement":26791,"Ġbrunt":26792,"ĠSurgery":26793,"Ġpragmatic":26794,"Ber":26795,"ĠKejriwal":26796,"cus":26797,"Ġconsensual":26798,"acet":26799,"ĠSecondly":26800,"Ġdivul":26801,"uca":26802,"Ġbusted":26803,"emies":26804,"ĠMou":26805,"Ġ217":26806,"Ġexcludes":26807,"ĠSamoa":26808,"Ġlofty":26809,"ĠSic":26810,"ĠRemem":26811,"dn":26812,"Ġeradicate":26813,"Ġpies":26814,"Ġscenery":26815,"ATTLE":26816,"ĠWAS":26817,"Ġinnovate":26818,"ĠEverest":26819,"Ġsynonymous":26820,"izen":26821,"Ġeuth":26822,"ĠFIA":26823,"ITIES":26824,"ĠSuddenly":26825,"Ġforay":26826,"pell":26827,"ÄŁ":26828,"licensed":26829,"Ġfra":26830,"Ġblasting":26831,"autical":26832,"ĠBlizzard":26833,"orer":26834,"Ġchili":26835,"ĠSylvia":26836,"except":26837,"tec":26838,"ĠResistance":26839,"young":26840,"usions":26841,"iotic":26842,"ĠDreams":26843,"ĠArchives":26844,"Ġunleash":26845,"ĠPract":26846,"Ġlikened":26847,"Ġga":26848,"Ġdisappearing":26849,"Ġunnoticed":26850,"Ġfrightened":26851,"arms":26852,"ĠCAD":26853,"Ġcoloured":26854,"ĠSigns":26855,"oing":26856,"Ġvodka":26857,"ruption":26858,"otions":26859,"isal":26860,"ĠBecome":26861,"Ġswoop":26862,"reating":26863,"Ġchoking":26864,"Ġunforgettable":26865,"258":26866,"packs":26867,"345":26868,"ĠAutumn":26869,"Ġther":26870,"399":26871,"ĠFaculty":26872,"Ġ1933":26873,"ĠNormally":26874,"orge":26875,"ĠTess":26876,"ĠChrom":26877,"Ġscripts":26878,"Ġbiking":26879,"Act":26880,"Ġgrazing":26881,"ĠLabrador":26882,"ĠLey":26883,"Ġwandering":26884,"Ġfend":26885,"ĠPolk":26886,"ĠKeane":26887,"ĠBeef":26888,"elope":26889,"ĠApproximately":26890,"Ġ1952":26891,"personal":26892,"Ġhistorians":26893,"ĠMcDonnell":26894,"must":26895,"LES":26896,"iking":26897,"Ġtherm":26898,"Ġhumane":26899,"Ġcrowdfunding":26900,"ĠBenefits":26901,"Land":26902,"Ġanalog":26903,"agency":26904,"ĠCrowley":26905,"Ġbirths":26906,"Ġobj":26907,"Ġfren":26908,"ĠSalmon":26909,"bies":26910,"Ġreve":26911,"216":26912,"Ġbetrayed":26913,"Ġinduced":26914,"acles":26915,"Ġtrad":26916,"Ġforgiven":26917,"Ġearners":26918,"208":26919,"Ġxen":26920,"Ġunle":26921,"Ġnecklace":26922,"Ġgravel":26923,"Ġsalads":26924,"Ġgrooming":26925,"California":26926,"Ġpossessed":26927,"Ġproclamation":26928,"Ġsequences":26929,"ream":26930,"FOX":26931,"arkin":26932,"ĠTRAN":26933,"Ġpurs":26934,"ĠLoans":26935,"Ġsacrificed":26936,"Ġiceberg":26937,"Phill":26938,"Ġgalvan":26939,"Ġsmugglers":26940,"formation":26941,"onson":26942,"ĠVaughn":26943,"Ġdoctrine":26944,"ĠEyes":26945,"Ġunmanned":26946,"states":26947,"Ġdetermin":26948,"almost":26949,"Ġeviction":26950,"Ġtid":26951,"ARR":26952,"Ġcooks":26953,"Bad":26954,"ĠCamb":26955,"Ġlinear":26956,"229":26957,"ĠCooke":26958,"ĠPurch":26959,"join":26960,"ĠCult":26961,"ĠRefugee":26962,"Ġslamming":26963,"ĠðŁij":26964,"Ġpedal":26965,"ĠVeronica":26966,"Ġlandowners":26967,"ĠYel":26968,"ĠWorkshop":26969,"antic":26970,"Ġdysfunction":26971,"Ġ229":26972,"Ġculturally":26973,"Ġinfuri":26974,"ĠEck":26975,"sem":26976,"Ġwired":26977,"ĠWerner":26978,"lov":26979,"ĠJasper":26980,"Ġvehemently":26981,"ĠSpy":26982,"lift":26983,"ĠNab":26984,"ĠPound":26985,"ĠHanna":26986,"Ġleveled":26987,"WOOD":26988,"tm":26989,"ĠKitt":26990,"Ġconve":26991,"nat":26992,"Ġjog":26993,"IVER":26994,"Ġmemes":26995,"Ġseaw":26996,"ector":26997,"Ġsprayed":26998,"Ġvaccinated":26999,"Europe":27000,"Ġmustard":27001,"ĠMahm":27002,"Ġ214":27003,"Research":27004,"iminary":27005,"Ġconcerted":27006,"Detroit":27007,"Ġkios":27008,"Ġplummet":27009,"Ġvisuals":27010,"247":27011,"Ġ228":27012,"development":27013,"ĠPascal":27014,"acial":27015,"ĠSeasons":27016,"ĠTL":27017,"480":27018,"ĠReader":27019,"Ġexpulsion":27020,"Ġchoked":27021,"Ġdevotion":27022,"ĠSTAT":27023,"urred":27024,"Ġfascinated":27025,"Ġstealth":27026,"NL":27027,"Ġbooster":27028,"Kat":27029,"ĠPriebus":27030,"Ġaux":27031,"ĠHate":27032,"ĠThing":27033,"Ġabnormal":27034,"Ġcalmly":27035,"Ġdedicate":27036,"cause":27037,"Ġisolate":27038,"ĠPai":27039,"Ġsuspensions":27040,"Ġpoisoned":27041,"ission":27042,"Ġprohibiting":27043,"353":27044,"banks":27045,"Ġkissed":27046,"ĠBegin":27047,"atis":27048,"LI":27049,"Ġshaft":27050,"ĠGuth":27051,"ĠBoo":27052,"Ġcinnamon":27053,"Ġverbally":27054,"ĠRabbi":27055,"Ġmonsters":27056,"done":27057,"ĠClyde":27058,"Ġspar":27059,"ĠCage":27060,"ĠPersons":27061,"305":27062,"ĠMons":27063,"Ġjealous":27064,"Ġswirling":27065,"know":27066,"Ġprote":27067,"Ġcruising":27068,"Ġduly":27069,"Ġchapel":27070,"Ġgroove":27071,"bps":27072,"ĠKelvin":27073,"iom":27074,"aer":27075,"bomb":27076,"Christian":27077,"Ġgigs":27078,"+.":27079,"ĠWei":27080,"Ġfarmland":27081,"otally":27082,"Ġequitable":27083,"ĠCBO":27084,"chool":27085,"amara":27086,"Ġwealthiest":27087,"ĠMeans":27088,"Ġ235":27089,"ĠUk":27090,"steps":27091,"raham":27092,"nerg":27093,"Ġclad":27094,"Ġsled":27095,"ĠMorrow":27096,"152":27097,"ĠRece":27098,"Ġplausible":27099,"Ġbisexual":27100,"artments":27101,"Ġveh":27102,"ĠLoft":27103,"bly":27104,"ĠCONC":27105,"automatic":27106,"Ġmasterpiece":27107,"ĠSpringer":27108,"Ġtendencies":27109,"Ro":27110,"Ġresentment":27111,"Ġadversely":27112,"Ġbandwidth":27113,"ĠDAV":27114,"Ġtun":27115,"Ġpuppies":27116,"ĠBundes":27117,"ĠHort":27118,"ĠGarfield":27119,"Ġenlist":27120,"Ġmont":27121,"gd":27122,"Ġrooting":27123,"Dream":27124,"Ġfulfillment":27125,"chal":27126,"182":27127,"prop":27128,"159":27129,"Ġcourtyard":27130,"iard":27131,"ĠSle":27132,"Ġoperative":27133,"Ġpublishes":27134,"ĠProposition":27135,"Ġcritique":27136,"Ġredist":27137,"wang":27138,"ĠNep":27139,"DD":27140,"Ġbonding":27141,"141":27142,"ĠAssault":27143,"-'":27144,"Ġlodging":27145,"itters":27146,"cigarettes":27147,"Ġ__":27148,"ĠLaf":27149,"GF":27150,"ĠAnat":27151,"ĠStephan":27152,"214":27153,"ĠKass":27154,"Ġviz":27155,"Ġpiling":27156,"Ġfugitive":27157,"ĠCurrency":27158,"ĠCrypto":27159,"Ġfaux":27160,"ĠPing":27161,"ĠLia":27162,"igl":27163,"Ġadversaries":27164,"ĠYPG":27165,"ĠComb":27166,"ĠYar":27167,"heny":27168,"Ġoverhe":27169,"Fest":27170,"emy":27171,"Ever":27172,"Ġ370":27173,"Ġsecretive":27174,"ĠSEN":27175,"ĠMEM":27176,"PRESS":27177,"ĠBirth":27178,"kos":27179,"Ġprecarious":27180,"irting":27181,"ĠUI":27182,"Ġoccupying":27183,"olute":27184,"Ġperiodic":27185,"eon":27186,"iens":27187,"ĠRH":27188,"Win":27189,"Ġplaybook":27190,"Ġexodus":27191,"ĠSkinner":27192,"Ġorderly":27193,"ĠVed":27194,"ouses":27195,"Ġescal":27196,"Ġbenign":27197,"Ġbots":27198,"ĠWhis":27199,"Ġappra":27200,"FOR":27201,"ĠChromebook":27202,"_____":27203,"990":27204,"athed":27205,"Ġspirited":27206,"illi":27207,"Ġbicycles":27208,"orse":27209,"ifestyle":27210,"orno":27211,"ĠDept":27212,"JA":27213,"Ġnausea":27214,"Ġpervasive":27215,"velop":27216,"commun":27217,"ĠUniversities":27218,"Ġremnants":27219,"Ġdisarm":27220,"ĠBoots":27221,"Ġprin":27222,"...\"":27223,"quila":27224,"Ġcautiously":27225,"uper":27226,"onto":27227,"din":27228,"Ġvelocity":27229,"Ġconspiring":27230,"ĠMX":27231,"Ġemphasizing":27232,"Ġâĸ":27233,"ĠStam":27234,"Ġspices":27235,"Ġairplanes":27236,"uty":27237,"culture":27238,"ĠPetr":27239,"Ġglor":27240,"ĠExcel":27241,"ĠSpeech":27242,"Ġharmless":27243,"ĠPend":27244,"ĠCrossing":27245,"ĠDocument":27246,"Ġramifications":27247,"ĠCroatian":27248,"ĠKiller":27249,"Ġmultim":27250,"Ġdiscontinued":27251,"Ġcherished":27252,"ĠMaker":27253,"aspers":27254,"ĠBlooming":27255,"ĠMata":27256,"offic":27257,"Ġsettlers":27258,"ĠPlenty":27259,"ĠInstitutes":27260,"ĠArpaio":27261,"Pool":27262,"ĠSubst":27263,"Ġ380":27264,"Ġdecidedly":27265,"ollah":27266,"Den":27267,"ĠJiang":27268,"ĠAmos":27269,"Grand":27270,"ĠTurns":27271,"meyer":27272,"Ġconducive":27273,"Ġpoignant":27274,"abortion":27275,"Ġnotebook":27276,"Ġshelling":27277,"common":27278,"ĠPavel":27279,"Ġhumid":27280,"Ġinappropriately":27281,"????":27282,"Ġsoar":27283,"Ġdynasty":27284,"Ġresearched":27285,"ĠYon":27286,"Ġmaple":27287,"Ġwedge":27288,"mass":27289,"ĠTM":27290,"USE":27291,"eln":27292,"Ġgloss":27293,"rigan":27294,"steen":27295,"ĠDeV":27296,"Ġdebacle":27297,"Christmas":27298,"Ġtweaks":27299,"grab":27300,"Ġprofoundly":27301,"Ġcampaigner":27302,"ĠSeal":27303,"Ġiteration":27304,"Ġsigh":27305,"Ġunfounded":27306,"Ġframing":27307,"Ġrecognizable":27308,"Ġseizing":27309,"legal":27310,"Ġproportions":27311,"omers":27312,"rek":27313,"Ġscreenshot":27314,"itsu":27315,"ĠOG":27316,"ĠYing":27317,"ĠMississ":27318,"295":27319,"Ġlandsl":27320,"Ġpsychiatrist":27321,"sov":27322,"arine":27323,"Ju":27324,"Ġflo":27325,"apple":27326,"hof":27327,"wig":27328,"ĠENT":27329,"Ġenthusiast":27330,"Such":27331,"ĠArtificial":27332,"happy":27333,"oton":27334,"ĠFram":27335,"ĠRemove":27336,"Ġsmear":27337,"Ġjer":27338,"Ġtopp":27339,"Ġimbalance":27340,"ĠWords":27341,"Ġcoffers":27342,"olina":27343,"Ġrigged":27344,"uction":27345,"idding":27346,"Ġdispensaries":27347,"Ġdermat":27348,"Ġshutter":27349,"idental":27350,"Ġcontinu":27351,"Ġhumility":27352,"Ġbulbs":27353,"Ġ207":27354,"lass":27355,"ĠBeirut":27356,"ĠUlt":27357,"urry":27358,"NEWS":27359,"Ġfeminine":27360,"Ġsimulated":27361,"Ġcharger":27362,"mom":27363,"ĠCreed":27364,"Ġwolves":27365,"essions":27366,"created":27367,"ifiers":27368,"Ġdissemin":27369,"ĠDarling":27370,"umann":27371,"Ġmarrying":27372,"Ġshred":27373,"avin":27374,"Ġbudgetary":27375,"Ġmedicinal":27376,"ulin":27377,"seys":27378,"agues":27379,"Ġextracted":27380,"ĠFlower":27381,"Ġcontinents":27382,"ĠWish":27383,"Ġdivides":27384,"ĠDing":27385,"Ġinsulation":27386,"respect":27387,"ĠABS":27388,"Ġreconcile":27389,"keep":27390,"ILD":27391,"Ġgenome":27392,"Ġ410":27393,"ĠSweep":27394,"Ġharass":27395,"Ġfrantic":27396,"ĠEE":27397,"dad":27398,"Ġaperture":27399,"rought":27400,"Ġhugs":27401,"Ġdrying":27402,"Ġoverrun":27403,"Space":27404,"Ġperiodically":27405,"Ġbrightness":27406,"atched":27407,"kee":27408,"ĠITS":27409,"ĠSpokane":27410,"ĠSeaf":27411,"Ġdesks":27412,"ĠEisen":27413,"ĠOPS":27414,"Ġcider":27415,"Ġacceler":27416,"ĠAthlet":27417,"2008":27418,"ĠGuid":27419,"ĠManip":27420,"Ġmould":27421,"Ġmisguided":27422,"Ġbrow":27423,"Ġmanagerial":27424,"Ġhugged":27425,"Ġfurnish":27426,"ĠHarmony":27427,"ĠHebrew":27428,"Ġtyph":27429,"Ġdecreases":27430,"Ġimpetus":27431,"Ġcontagious":27432,"Ġunch":27433,"209":27434,"Ġswell":27435,"ĠHuffington":27436,"Ġpubs":27437,"Ġadequ":27438,"amoto":27439,"rir":27440,"Ġpristine":27441,"Ġanx":27442,"ĠSecure":27443,"Ġenrichment":27444,"ĠVAL":27445,"Ġsummed":27446,"Ġconfidently":27447,"ĠProfit":27448,"ĠFrog":27449,"ĠLena":27450,"ĠFUN":27451,"Ġbruises":27452,"Ġuproar":27453,"coll":27454,"ĠImpro":27455,"Ġflair":27456,"146":27457,"ĠBrend":27458,"Ġ166":27459,"Ġenhances":27460,"ĠDent":27461,"Ġdegener":27462,"Ġproponents":27463,"ĠInspired":27464,"Ġramps":27465,"Ġwisely":27466,"Western":27467,"Ġtart":27468,"Ġsteered":27469,"Ġtreason":27470,"dropping":27471,"Ġtransc":27472,"ĠScarlett":27473,"ĠEzekiel":27474,"Ġpivot":27475,"esame":27476,"Show":27477,"Ġdiscontent":27478,"ĠJudith":27479,"ĠPutting":27480,"Ġblessings":27481,"Ġhardcore":27482,"Ġtray":27483,"Ġdiscern":27484,"oley":27485,"ouk":27486,"Ġwil":27487,"Ġintolerance":27488,"157":27489,"ĠRelative":27490,"ĠLynd":27491,"Ġwhistleblower":27492,"Ġincon":27493,"ĠTao":27494,"Ġindefinite":27495,"Ġguardians":27496,"Ġagon":27497,"ĠInstruments":27498,"Ġexistential":27499,"AAF":27500,"vind":27501,"Ġbrazen":27502,"condition":27503,"Ġratified":27504,"fam":27505,"ĠHin":27506,"ĠMichaels":27507,"204":27508,"ĠKats":27509,"ITS":27510,"ISON":27511,"prone":27512,"Ġboiling":27513,"Ġprolong":27514,"Ġnoticing":27515,"resident":27516,"brance":27517,"ĠFolk":27518,"Ġdesserts":27519,"uton":27520,"Web":27521,"ĠLongh":27522,"ĠReef":27523,"Going":27524,"ĠCarb":27525,"Sur":27526,"complete":27527,"ĠSloan":27528,"ĠClubs":27529,"ĠSadd":27530,"Ġshrugged":27531,"Ġedible":27532,"ĠTyp":27533,"thal":27534,"ĠRocks":27535,"ĠClive":27536,"Ġkidding":27537,"ĠCrom":27538,"ĠTurks":27539,"ĠWak":27540,"Ġeyewitness":27541,"ĠHass":27542,"collar":27543,"Ġsucceeding":27544,"Ġinsert":27545,"Ġ224":27546,"ĠBret":27547,"Ġneurological":27548,"Ġrewrite":27549,"imil":27550,"ultimate":27551,"ĠJeremiah":27552,"Ġliaison":27553,"Ġpedd":27554,"direct":27555,"ĠYi":27556,"ĠMAD":27557,"ĠOrion":27558,"oyd":27559,"ĠLOC":27560,"release":27561,"Ġinvestigates":27562,"ĠApache":27563,"û":27564,"ĠVend":27565,"Ġcynical":27566,"ĠHelm":27567,"ĠMovies":27568,"tops":27569,"Ġsinister":27570,"Ġunparalleled":27571,"Ġspikes":27572,"Ġoverlap":27573,"enstein":27574,"Ġhypocrisy":27575,"Plus":27576,"Ġexpansions":27577,"Ġvow":27578,"Ġdetonated":27579,"Ġfellowship":27580,"Ġsolicitor":27581,"ĠNewtown":27582,"mony":27583,"ĠLod":27584,"ĠDevelopers":27585,"ateg":27586,"ibus":27587,"Ġcrumbling":27588,"ĠWein":27589,"ĠKlan":27590,"gio":27591,"ĠPhys":27592,"ĠAntarctica":27593,"368":27594,"Ġseam":27595,"Ġautomobiles":27596,"ĠTEAM":27597,"bern":27598,"Ġmanic":27599,"Ġsanct":27600,"Ġequals":27601,"Est":27602,"Ġincentiv":27603,"ĠHawking":27604,"nin":27605,"Ġresonate":27606,"bid":27607,"Ġtelescope":27608,"endon":27609,"ĠVacc":27610,"Ġregretted":27611,"Ġ1300":27612,"ĠForestry":27613,"BOOK":27614,"Ġgroundwork":27615,"Ġessays":27616,"ĠIndo":27617,"Pierre":27618,"ĠChau":27619,"Ġapologies":27620,"killers":27621,"ĠMoroccan":27622,"0001":27623,"336":27624,"Ra":27625,"Ġparcels":27626,"Ġleaned":27627,"Ġthankfully":27628,"ĠSplit":27629,"Ġlobbied":27630,"ĠDegree":27631,"Ġrisking":27632,"assy":27633,"Ġsupplemental":27634,"little":27635,"Ġeclectic":27636,"Ġ206":27637,"ealing":27638,"206":27639,"Ġrepo":27640,"Ġhose":27641,"ayn":27642,"lux":27643,"Ġbeliever":27644,"')":27645,"ĠHide":27646,"vance":27647,"ĠEinstein":27648,"Ġdepos":27649,"Ġfray":27650,"Ġki":27651,"Ġinternship":27652,"ĠHou":27653,"Vis":27654,"Ġstare":27655,"ĠBreed":27656,"option":27657,"Ġvisionary":27658,"Ġmins":27659,"Ġbitten":27660,"ancies":27661,"ĠShake":27662,"Ġtemplate":27663,"Ġliner":27664,"Ġmuster":27665,"appro":27666,"ĠMubarak":27667,"esty":27668,"mong":27669,"actory":27670,"Ġheadphone":27671,"ĠPrec":27672,"Ġwaive":27673,"Ron":27674,"ĠHearing":27675,"Ġimperfect":27676,"Ġsealing":27677,"Ġlocating":27678,"Ġculminated":27679,"chio":27680,"channel":27681,"lust":27682,"ĠLowell":27683,"woods":27684,"Ġsoak":27685,"Ġforbidden":27686,"Ġdetached":27687,"unct":27688,"ĠHunger":27689,"ĠPatient":27690,"ĠPolo":27691,"Saharan":27692,"Jon":27693,"athered":27694,"ĠSignal":27695,"Six":27696,"Ġstatistically":27697,"ITH":27698,"artment":27699,"ĠCU":27700,"Ġhates":27701,"qual":27702,"Ġcapitalist":27703,"ATES":27704,"ĠDesc":27705,"Ġhandcuffed":27706,"Ġindulge":27707,"ĠReligious":27708,"German":27709,"housing":27710,"Ġdismantling":27711,"Ġconventions":27712,"dain":27713,"chairs":27714,"Ġloos":27715,"Ġknowingly":27716,"Var":27717,"Ġhusbands":27718,"eez":27719,"asion":27720,"ĠIssa":27721,"Ġswollen":27722,"Ġ1946":27723,"Ġheadlined":27724,"Chelsea":27725,"Ġignorant":27726,"Ġperipheral":27727,"Note":27728,"Ġaxe":27729,"Ġnicotine":27730,"ĠSanctuary":27731,"Ġ1917":27732,"Ġwithdrawals":27733,"uits":27734,"Hot":27735,"Ġreimburse":27736,"probably":27737,"ĠAdapt":27738,"industrial":27739,"answer":27740,"orus":27741,"ĠMell":27742,"Talk":27743,"Ġcontemplating":27744,"omas":27745,"Ġtaxis":27746,"Ġencompasses":27747,"rations":27748,"ĠLatvia":27749,"Ġhumiliating":27750,"Ġloft":27751,"tight":27752,"rium":27753,"Ġlogin":27754,"ĠBulletin":27755,"Ġturtles":27756,"EAR":27757,"349":27758,"Radio":27759,"ĠBord":27760,"151":27761,"kk":27762,"pocket":27763,"Ġdove":27764,"348":27765,"Ġtemptation":27766,"ĠCoy":27767,"those":27768,"ĠDest":27769,"ishly":27770,"rn":27771,"Ġmammals":27772,"ĠTub":27773,"arial":27774,"ĠPersian":27775,"Ġdaddy":27776,"Zen":27777,"Ġps":27778,"Ġ]":27779,"Field":27780,"adiq":27781,"Ġmeaningless":27782,"Ġprimer":27783,"Ġ1942":27784,"Ġ!":27785,"625":27786,"Ġfashionable":27787,"ĠTheft":27788,"ĠHAVE":27789,"christ":27790,"Ġperil":27791,"Ġrepealing":27792,"Ġbuff":27793,"Ġodor":27794,"Ġstalking":27795,"ĠDems":27796,"iences":27797,"Ġunilaterally":27798,"odies":27799,"ĠQuite":27800,"Ġbloodshed":27801,"Ġinfect":27802,"Ġreminders":27803,"Ġchop":27804,"Ġevapor":27805,"877":27806,"Ġhorrified":27807,"ĠFruit":27808,"rams":27809,"Ġinsecure":27810,"cester":27811,"ĠNationwide":27812,"Ġmocking":27813,"Ret":27814,"Ġcomplying":27815,"sav":27816,"Ġali":27817,"Family":27818,"Ĩ":27819,"Ġdishonest":27820,"Ġincorrectly":27821,"LOAD":27822,"ĠGand":27823,"ourcing":27824,"obby":27825,"ĠPetersen":27826,"Something":27827,"Ġravaged":27828,"limited":27829,"Ġrituals":27830,"ĠKnowledge":27831,"ĠUtility":27832,"Ġdoom":27833,"Ġsheds":27834,"ĠGael":27835,"ĠMillennials":27836,"ĠMonthly":27837,"Ġdomination":27838,"Ġrapport":27839,"spot":27840,"ĠPrest":27841,"ĠHA":27842,"ushes":27843,"Ġtact":27844,"Richard":27845,"Ġgritty":27846,"Does":27847,"ĠTNT":27848,"Ġdownfall":27849,"Wood":27850,"ĠPrediction":27851,"ĠPour":27852,"ĠFraud":27853,"ĠSyndrome":27854,"166":27855,"Ġliteral":27856,"Ġaddict":27857,"ĠLoud":27858,"hens":27859,"ĠAccounts":27860,"distance":27861,"Ġclassmate":27862,"Ġsalv":27863,"Ġunlucky":27864,"Ġpartying":27865,"ĠKou":27866,"ĠSNAP":27867,"%-":27868,"Ġdelegate":27869,"Ġstrikers":27870,"ĠSlate":27871,"Ġarticulate":27872,"390":27873,"Ġinqu":27874,"Ġdiscredit":27875,"ĠPriv":27876,"ploy":27877,"ĠMarketplace":27878,"ĠTune":27879,"visor":27880,"Ġwrestle":27881,"Ġkindly":27882,"ĠCollect":27883,"Ġcirc":27884,"ĠRemain":27885,"Ġ192":27886,"contin":27887,"Ġ325":27888,"Ġsevered":27889,"isations":27890,"Ġmuddy":27891,"Ġtaxing":27892,"ĠRepresent":27893,"ĠSty":27894,"rology":27895,"ĠJudges":27896,"ĠBronze":27897,"ĠApplic":27898,"Ġarrow":27899,"consuming":27900,"ĠFeaturing":27901,"Ġspies":27902,"Ġnoises":27903,"ĠColony":27904,"lost":27905,"Ġopp":27906,"Ġdeem":27907,"ĠGarc":27908,"icent":27909,"ptroller":27910,"liest":27911,"Ġoutward":27912,"ĠUser":27913,"Ġintimidate":27914,"156":27915,"Ġjab":27916,"ANGE":27917,"Jay":27918,"ĠPoverty":27919,"ACA":27920,"Ġrife":27921,"Ġfaint":27922,"ĠAcceler":27923,"tall":27924,"ĠUNITED":27925,"ĠFighter":27926,"ĠGilmore":27927,"Ġsod":27928,"amura":27929,"Ġpredictive":27930,"Ġpolish":27931,"ĠDD":27932,"Ġfabricated":27933,"ĠDag":27934,"Ġfatty":27935,"Ġplague":27936,"Ġexhib":27937,"ĠAdvent":27938,"Ġ1941":27939,"ERSON":27940,"initely":27941,"Ġloneliness":27942,"ĠEquality":27943,"Ġuntrue":27944,"Ġonlook":27945,"Ġfragmented":27946,"ruce":27947,"Ġdistrust":27948,"Ġscal":27949,"ĠCors":27950,"Ġrobbing":27951,"cultural":27952,"clusion":27953,"ĠObi":27954,"sels":27955,"ĠEvidence":27956,"ĠSac":27957,"Ġfragments":27958,"Ġflipping":27959,"ĠRabbit":27960,"Ġdisproportionate":27961,"ĠCreat":27962,"Ġlabeling":27963,"ĠGri":27964,"Ġ161":27965,"ĠEditors":27966,"holm":27967,"adr":27968,"Ĭ":27969,"tailed":27970,"Ġrenters":27971,"Ġnoodles":27972,"Ġcompetence":27973,"Ġpanc":27974,"uration":27975,"Ġacids":27976,"Ġconfid":27977,"rival":27978,"AAA":27979,"kson":27980,"Ġrecreate":27981,"153":27982,"Ġ164":27983,"ĠOlympia":27984,"ĠUnlimited":27985,"ĠShock":27986,"ĠTeaching":27987,"ĠHouses":27988,"resso":27989,"ĠMaw":27990,"Ġreplen":27991,"Ġprotestors":27992,"bey":27993,"Ġsurve":27994,"Ġemphasizes":27995,"223":27996,"ĠEsther":27997,"ĠNikol":27998,"Ġprosecutions":27999,"ĠFreed":28000,"Ġposs":28001,"OTE":28002,"ĠPrayer":28003,"Ġsquarely":28004,"Ġtir":28005,"adv":28006,"Ġbogus":28007,"Ġwrongful":28008,"Ġembell":28009,"Ġseldom":28010,"Ġpossesses":28011,"Er":28012,"ĠAlternatively":28013,"Ġinstituted":28014,"rr":28015,"Ġvocational":28016,"eval":28017,"ĠComics":28018,"Ġstumbling":28019,"335":28020,"Ġdragon":28021,"vine":28022,"services":28023,"Ġcrit":28024,"irens":28025,"Ġlayered":28026,"orb":28027,"Ġdominates":28028,"ĠMarx":28029,"period":28030,"avering":28031,"Ġbrigade":28032,"Ġchem":28033,"ĠEvolution":28034,"ĠSuk":28035,"Ġ209":28036,"ĠMalk":28037,"Ġtallest":28038,"recogn":28039,"ĠCraw":28040,"Ġell":28041,"ĠCaesar":28042,"php":28043,"ĠSurvivors":28044,"sd":28045,"itsch":28046,"ambo":28047,"Ġashore":28048,"acular":28049,"rost":28050,"Ġmurderer":28051,"Ġcasts":28052,"ĠEconomist":28053,"ĠWeapons":28054,"Ġnostalgic":28055,"Skip":28056,"REAM":28057,"Pa":28058,"Ġjournals":28059,"ĠSitting":28060,"Union":28061,"Att":28062,"ĠMaxim":28063,"Ġpurportedly":28064,"Ġrespecting":28065,"ĠMAX":28066,"seed":28067,"Ġjuicy":28068,"ĠGallup":28069,"Ġmileage":28070,"adier":28071,"Ġbod":28072,"DER":28073,"Ġsummers":28074,"icult":28075,"ipl":28076,"ĠDeng":28077,"Ġsmells":28078,"Ġivory":28079,"Ġ255":28080,"Id":28081,"DEN":28082,"Ġ159":28083,"Due":28084,"ĠLighting":28085,"ĠSurely":28086,"Ġsund":28087,"ĠKessler":28088,"immigrant":28089,"Ġtragedies":28090,"ĠOxy":28091,"ĠFixed":28092,"ĠBalk":28093,"Ġoriented":28094,"pher":28095,"Ġkitchens":28096,"Ġhips":28097,"Ġtweak":28098,"Ġtuna":28099,"ĠCla":28100,"Ġdislike":28101,"ussy":28102,"Ġoutnumbered":28103,"Ġplumbing":28104,"Ġcogn":28105,"ĠThrow":28106,"ĠTER":28107,"urally":28108,"ĠMurd":28109,"Ġcreamy":28110,"Ġresiding":28111,"otics":28112,"Ġfingerprints":28113,"!,":28114,"Ġpaused":28115,"ĠMilo":28116,"Ġhomosexuality":28117,"Ġresponsibly":28118,"iop":28119,"UCT":28120,"Ġsucceeds":28121,"ĠCRE":28122,"ĠThatcher":28123,"Ġcurrents":28124,"Ġarises":28125,"Ġwaterproof":28126,"Ġamp":28127,"ĠClaims":28128,"177":28129,"Ġsubpoen":28130,"Ġvig":28131,"ĠNeuro":28132,"Ġblur":28133,"ĠPaint":28134,"campus":28135,"Ġtoughness":28136,"ĠButton":28137,"Neal":28138,"ĠDEN":28139,"ĠNir":28140,"ĠAxel":28141,"EEP":28142,"Ġpint":28143,"Ġagile":28144,"odor":28145,"Ġessentials":28146,"ĠMov":28147,"ĠVenezuel":28148,"Ġexchanging":28149,"ĠNegative":28150,"Mil":28151,"Key":28152,"Ġbuzzing":28153,"ĠStew":28154,"Ġrebuke":28155,"Ġdepl":28156,"ĠKoz":28157,"Ġ163":28158,"Ġshines":28159,"NZ":28160,"Ġcarnage":28161,"cases":28162,"Ġwarmed":28163,"ĠGreenwich":28164,"College":28165,"Ġneedy":28166,"301":28167,"ĠMü":28168,"culation":28169,"Ġ440":28170,"425":28171,"atories":28172,"Ġsatisfactory":28173,"ĠFib":28174,"ĠElim":28175,"developed":28176,"Ġvacations":28177,"Ġpeculiar":28178,"Ġvets":28179,"onest":28180,"ĠPug":28181,"Ġlifestyles":28182,"zzi":28183,"Ġprovoke":28184,"bah":28185,"arger":28186,"ĠVirt":28187,"Sales":28188,"annel":28189,"ĠMeth":28190,"ivating":28191,"Ġrevoke":28192,"ĠAgenda":28193,"ĠIch":28194,"Ġsensit":28195,"ĠAzerbai":28196,"ĠBombay":28197,"Ġuncon":28198,"river":28199,"Ġapr":28200,"actic":28201,"ĠSubaru":28202,"Ġbanquet":28203,"Ġcontradict":28204,"tek":28205,"Football":28206,"igent":28207,"Ġreintrodu":28208,"ĠInsight":28209,"Ġsystematically":28210,"Ġboun":28211,"ĠFishing":28212,"Ġstri":28213,"ĠOB":28214,"Ġstair":28215,"Wall":28216,"ĠAllow":28217,"Ġcaramel":28218,"169":28219,"Ġcafes":28220,"Ġcalcium":28221,"Ġ169":28222,"Ġportraying":28223,"Ġdiscriminate":28224,"Ġunrestricted":28225,"Ġmant":28226,"Ġscarcity":28227,"Ġfeminism":28228,"ĠJJ":28229,"ĠOversight":28230,"ĠCue":28231,"Ġinexperienced":28232,"Ġdrafts":28233,"Ġ1939":28234,"nm":28235,"forest":28236,"ĠHonour":28237,"Ġceramic":28238,"Ġdownstairs":28239,"Ġboon":28240,"Ġmorality":28241,"Ġhorrifying":28242,"Rad":28243,"justice":28244,"Ġmosques":28245,"Ġcurfew":28246,"Ġsurrogate":28247,"Ġreimb":28248,"enth":28249,"pressure":28250,"beam":28251,"Ġwhirlwind":28252,"ĠRecession":28253,"ĠTours":28254,"Ġclusters":28255,"ĠQuant":28256,"Jonathan":28257,"project":28258,"Ġ777":28259,"ĠNOAA":28260,"abis":28261,"Ġdeficiencies":28262,"Ġsuicides":28263,"Ġfoothold":28264,"ĠYah":28265,"imeter":28266,"URN":28267,"Ġcultivate":28268,"Ġnoisy":28269,"Ġ1951":28270,"Ġpressuring":28271,"ĠDeals":28272,"ĠProphet":28273,"ĠWikipedia":28274,"INESS":28275,"ĠShine":28276,"ĠCalled":28277,"ĠSole":28278,"ĠZhou":28279,"Ġasphalt":28280,"armac":28281,"ĠScorp":28282,"ĠUnknown":28283,"ĠPAT":28284,"Heart":28285,"Ġguessed":28286,"Ġsushi":28287,"Ġheartbeat":28288,"Ġconcent":28289,"eret":28290,"plin":28291,"Ġweeds":28292,"Ġbombed":28293,"ĠTerrorism":28294,"Rich":28295,"Ġblades":28296,"Ġhaunt":28297,"Ġstorefront":28298,"Ġthwarted":28299,"access":28300,"ĠLydia":28301,"LINE":28302,"Ġpregnancies":28303,"Ġripping":28304,"ĠBelieve":28305,"spoken":28306,"inian":28307,"sed":28308,"ĠBrass":28309,"econom":28310,"current":28311,"Ġvoc":28312,"Ġmodeled":28313,"Ġpeppers":28314,"otech":28315,"ĠOption":28316,"Connell":28317,"isel":28318,"Ġcompel":28319,"Ġjuveniles":28320,"ĠNET":28321,"ĠEXP":28322,"Ġparadigm":28323,"Des":28324,"Ġ204":28325,"employed":28326,"Ġdurability":28327,"Ġ245":28328,"Ġbillionaires":28329,"violent":28330,"ĠCooperative":28331,"TOP":28332,"ĠGarry":28333,"ĠSoldiers":28334,"Ġdared":28335,"Ġvoucher":28336,"Ġblends":28337,"gue":28338,"Ġadventurous":28339,"Ġorganisms":28340,"Ġgaze":28341,"Ġcrap":28342,"Coach":28343,"omon":28344,"ĠWheels":28345,"ĠGrayson":28346,"Ġrecy":28347,"grave":28348,"Ġallergic":28349,"Ġreef":28350,"Ġbeginnings":28351,"ĠRuff":28352,"Ġclout":28353,"structed":28354,"315":28355,"ĠGeorgian":28356,"say":28357,"Ġsprings":28358,"ĠAsus":28359,"Ġrepaid":28360,"ĠGuys":28361,"ticket":28362,"Ġunb":28363,"ĠCertificate":28364,"ĠSTORY":28365,"cin":28366,"Ġpassions":28367,"Ġmediocre":28368,"Ġlackluster":28369,"vernight":28370,"kids":28371,"ĠWife":28372,"politics":28373,"ĠHimal":28374,"oddy":28375,"ensus":28376,"ĠGustav":28377,"binding":28378,"ĠIndividuals":28379,"Ġmaize":28380,"Ġhoop":28381,"ĠChanging":28382,"Ġlessen":28383,"Ġarranging":28384,"ĠFukushima":28385,"ĠTrying":28386,"ĠMage":28387,"Ġskeleton":28388,"ĠTec":28389,"289":28390,"Ġrecl":28391,"ĠFIL":28392,"Gs":28393,"ĠOdyssey":28394,"ĠProcessing":28395,"ilion":28396,"Ġsubsidized":28397,"Ġabdomen":28398,"Ġanalyse":28399,"music":28400,"clean":28401,"Ġunfinished":28402,"Ġdownloads":28403,"Ġmorally":28404,"Ġ218":28405,"Ġtrib":28406,"Keep":28407,"ĠSER":28408,"FY":28409,"Ġaust":28410,"Ġdiscovers":28411,"ĠGROUP":28412,"ĠMachines":28413,"Ġeroded":28414,"Ġominous":28415,"Ġbrightly":28416,"IME":28417,"Ġwicked":28418,"ĠTrou":28419,"Ġvisions":28420,"Kay":28421,"reported":28422,"Ġbog":28423,"ĠQuin":28424,"ĠSigma":28425,"urned":28426,"ixon":28427,"Ġharming":28428,"Ġcheckout":28429,"inet":28430,"much":28431,"Ġcherish":28432,"ĠByrd":28433,"ĠSamson":28434,"WP":28435,"orders":28436,"boa":28437,"Ġbron":28438,"oki":28439,"ĠRR":28440,"Ġsuitcase":28441,"Ġfeathers":28442,"ĠChristy":28443,"Islamic":28444,"Ġamusement":28445,"ĠISS":28446,"intensive":28447,"Qaida":28448,"Ġneurons":28449,"Ġwagon":28450,"ĠTek":28451,"Ġdolls":28452,"ĠShoot":28453,"Ġunderestimate":28454,"Ġstreamlined":28455,"Ġfractures":28456,"Ġcathedral":28457,"Ġeliminates":28458,"helle":28459,"Ġcitrus":28460,"risis":28461,"Ġimpecc":28462,"istries":28463,"ĠHog":28464,"vote":28465,"pas":28466,"Ġassign":28467,"ĠSongs":28468,"ĠMiracle":28469,"kas":28470,"zynski":28471,"Ġcrane":28472,"Ġadulthood":28473,"ĠBenefit":28474,"ĠGrimes":28475,"Ġpayday":28476,"ablished":28477,"Ġcenterpiece":28478,"Ġhassle":28479,"ĠAppalachian":28480,"follow":28481,"Ġ290":28482,"ĠRL":28483,"ĠDoe":28484,"Ġacclaim":28485,"Ġlevied":28486,"Ġtossing":28487,"Ġcarrots":28488,"ĠDarius":28489,"161":28490,"Ġoffspring":28491,"ĠJury":28492,"ĠTPP":28493,"CAP":28494,"Ġenvironmentalists":28495,"Ġrays":28496,"267":28497,"Ser":28498,"Ġcaptivity":28499,"Ġappellate":28500,"ĠElectricity":28501,"ĠEnough":28502,"232":28503,"Ġfisher":28504,"Ġbrilliance":28505,"Ġpraises":28506,"aunch":28507,"Ġsolicitation":28508,"Ġadolescent":28509,"Ġinferior":28510,"checks":28511,"Set":28512,"Ġmutations":28513,"ĠLatinos":28514,"ĠLicense":28515,"ĠAme":28516,"hirt":28517,"ĠChun":28518,"Ġdeeds":28519,"ldon":28520,"Ġmammoth":28521,"Ġturtle":28522,"rule":28523,"Ken":28524,"Ġvoyage":28525,"gram":28526,"Ġconquer":28527,"Ġretaliate":28528,"ĠPJ":28529,"ĠViking":28530,"Ġsafegu":28531,"ordinary":28532,"ĠArbit":28533,"ĠDigest":28534,"Die":28535,"Ġbureaucratic":28536,"Ġhonorable":28537,"Ġcafeteria":28538,"ĠRAF":28539,"ĠPlaces":28540,"ĠKlu":28541,"Cam":28542,"ĠBiology":28543,"ĠCycling":28544,"imore":28545,"Ġstripping":28546,"Ġwarriors":28547,"Ġbursting":28548,"Ġlapse":28549,"Ġversa":28550,"Ġclicked":28551,"ogh":28552,"Ġ\"â̦":28553,"Ġdiligently":28554,"ĠMiy":28555,"ĠCorpus":28556,"Ġredef":28557,"Ġ176":28558,"ĠInstrument":28559,"ĠOECD":28560,"Ġstro":28561,"Ġmicrowave":28562,"Santa":28563,"Ġpars":28564,"Social":28565,"iffe":28566,"itability":28567,"Equ":28568,"Ġnud":28569,"legged":28570,"ĠTud":28571,"lav":28572,"Ġinterpreter":28573,"alcohol":28574,"Ġimposition":28575,"Ġdwelling":28576,"Ġ1400":28577,"].\"":28578,"ĠIw":28579,"RM":28580,"Ġ555":28581,"Ġparalyzed":28582,"mind":28583,"rans":28584,"adin":28585,"French":28586,"Ġliar":28587,"Represent":28588,"Ġstrapped":28589,"orate":28590,"Ġrigging":28591,"Ġinterrog":28592,"Ġsparse":28593,"ento":28594,"ĠThem":28595,"Ġbaseless":28596,"Ġbuildup":28597,"Ġundecided":28598,"isms":28599,"Ġabduct":28600,"Ġflowed":28601,"Ġprestige":28602,"Ġhacks":28603,"Ġpanicked":28604,"Cast":28605,"ĠKrish":28606,"umat":28607,"Ġantique":28608,"Ġbitters":28609,"Ġentitlement":28610,"Ġstandby":28611,"Ten":28612,"said":28613,"ĠConditions":28614,"events":28615,"Ġobey":28616,"Ġshortest":28617,"etting":28618,"Ġconcentrating":28619,"ĠNeeds":28620,"234":28621,"Ġintrigued":28622,"enting":28623,"ĠXen":28624,"ĠAlger":28625,"seekers":28626,"anish":28627,"Ġ172":28628,"âĢij":28629,"Ġsilicon":28630,"Ġstandardized":28631,"ĠFountain":28632,"essel":28633,"Ġapproves":28634,"Ġsucked":28635,"gone":28636,"ĠBriggs":28637,"brother":28638,"Ġartisan":28639,"ĠContinuing":28640,"vir":28641,"Ġsubmarines":28642,"ĠInk":28643,"program":28644,"ĠNexus":28645,"ĠCoco":28646,"Ġconceptual":28647,"Ġmatt":28648,"aughters":28649,"Ġbaths":28650,"Ġbeaut":28651,"ĠEmerald":28652,"ĠParties":28653,"248":28654,"completely":28655,"esan":28656,"Ġdiarrhea":28657,"Ġ1100":28658,"borg":28659,"ĠBroken":28660,"Ġreiterate":28661,"Ġsorting":28662,"ONS":28663,"Ġ177":28664,"Ġadmin":28665,"ĠMandatory":28666,"Ġsymptom":28667,"Ġpaced":28668,"Remember":28669,"Ġabdominal":28670,"Ġswapped":28671,"Ġtransitions":28672,"IFA":28673,"pretty":28674,"ĠJC":28675,"Ġallotted":28676,"ĠShows":28677,"Arthur":28678,"Ġsoften":28679,"dozen":28680,"Mah":28681,"Ġextinguished":28682,"Ġreelection":28683,"Ġdeployments":28684,"Ġsturdy":28685,"Ġdownright":28686,"Ġjams":28687,"ĠOptim":28688,"Ġhumiliation":28689,"cd":28690,"Ġbunk":28691,"sie":28692,"NAT":28693,"ilies":28694,"Ġimplying":28695,"Ġ<":28696,"Ġhomepage":28697,"242":28698,"Ġey":28699,"Ġdict":28700,"Ġslender":28701,"Ġforehead":28702,"ĠCecil":28703,"Ġshrunk":28704,"ĠExit":28705,"Ġexpressly":28706,"Ġseals":28707,"ĠThiel":28708,"umni":28709,"Ġdamning":28710,"ĠVS":28711,"ulum":28712,"BBC":28713,"URES":28714,"Ġinhal":28715,"Ġfont":28716,"Ġworkplaces":28717,"ĠPUBLIC":28718,"ĠHorror":28719,"Bs":28720,"arta":28721,"ĠBread":28722,"Ġstret":28723,"Ġethos":28724,"Ġstabilized":28725,"Ġconvers":28726,"ĠInqu":28727,"Ġjudgments":28728,"ĠContemporary":28729,"221":28730,"Ġzombie":28731,"VD":28732,"Ġmisunderstanding":28733,"Ġspam":28734,"ĠPapers":28735,"Ġcrocod":28736,"ENA":28737,"ĠJuven":28738,"ĠAbram":28739,"Ġbursts":28740,"atto":28741,"Ġturbulence":28742,"tty":28743,"sexual":28744,"Ġwaning":28745,"community":28746,"Government":28747,"Ġtranspl":28748,"??":28749,"Getting":28750,"ĠRare":28751,"prime":28752,"Ġlooting":28753,"Ġvalidate":28754,"ĠCreating":28755,"ĠCorruption":28756,"Ġspit":28757,"ĠFavorite":28758,"Kar":28759,"Ġadaptive":28760,"ĠART":28761,"Ġtorso":28762,"ĠIdent":28763,"Ġsubdivision":28764,"azo":28765,"Ġconsequently":28766,"Ġrotate":28767,"ĠWit":28768,"Ġestab":28769,"managed":28770,"ĠBound":28771,"Ġskim":28772,"198":28773,"ĠCorona":28774,"ĠâĿ":28775,"Ġwording":28776,"buck":28777,"iph":28778,"patrick":28779,"Help":28780,"flying":28781,"Ġracer":28782,"Ġfisherman":28783,"____":28784,"ackers":28785,"Ġpersisted":28786,"Ġmyths":28787,"Ġgarn":28788,"ologue":28789,"ĠApprentice":28790,"Ġhereby":28791,"Ġvulgar":28792,"ĠGinger":28793,"Ġtrait":28794,"ĠIdea":28795,"Ġfigur":28796,"ĠSchwarzenegger":28797,"ĠSafari":28798,"178":28799,"ĠAsians":28800,"775":28801,"ĠTriangle":28802,"Ġdemons":28803,"ĠOv":28804,"Ġanime":28805,"Broad":28806,"Ġmolecule":28807,"Ġdeposition":28808,"Ġbiodiversity":28809,"modern":28810,"Ġwallets":28811,"NH":28812,"planes":28813,"rats":28814,"ĠSeed":28815,"Ġ174":28816,"umed":28817,"Ġtouting":28818,"gre":28819,"ĠSEAL":28820,"Ġperpetrator":28821,"ĠGerrard":28822,"Ġallocations":28823,"Ġworsh":28824,"payment":28825,"bett":28826,"ĠIssues":28827,"ennis":28828,"eering":28829,"ĠMV":28830,"yi":28831,"hak":28832,"Ġ167":28833,"Ġorchestr":28834,"224":28835,"Ġsup":28836,"Ġleukemia":28837,"osures":28838,"575":28839,"Ġnoticeably":28840,"Ġparamilitary":28841,"ĠTHERE":28842,"Ġwaged":28843,"igrated":28844,"Ġdocumentaries":28845,"Ġsenseless":28846,"Ġbark":28847,"Ġgenetics":28848,"ĠAlbania":28849,"ĠCrypt":28850,"ĠSEO":28851,"Ġnightly":28852,"Ġfaults":28853,"279":28854,"ĠFerdinand":28855,"ĠSylv":28856,"Ġcalam":28857,"ĠMuller":28858,"ĠSpielberg":28859,"Boy":28860,"ĠUrs":28861,"Ġrug":28862,"Ġcolonies":28863,"ĠFunk":28864,"Ġlyric":28865,"ĠATT":28866,"anni":28867,"ĠNB":28868,"Ġthorn":28869,"Ġpertinent":28870,"188":28871,"Ġpartic":28872,"Head":28873,"Pad":28874,"Palestinian":28875,"ĠBarg":28876,"anical":28877,"beaut":28878,"onge":28879,"Ġgigantic":28880,"travel":28881,"Ġdownloading":28882,"Contin":28883,"whe":28884,"plane":28885,"Wil":28886,"IDA":28887,"Ele":28888,"ĠPAL":28889,"Ġbeams":28890,"ĠProud":28891,"ramer":28892,"Ġindependents":28893,"Ġtranslator":28894,"ĠBrah":28895,"ĠTrooper":28896,"aylor":28897,"pson":28898,"Ġguise":28899,"Ġdiffering":28900,"Ġtopple":28901,"ichen":28902,"ĠSeymour":28903,"deg":28904,"ĠMixed":28905,"Ġinvoluntary":28906,"Ġcountdown":28907,"ĠNarc":28908,"ĠAdults":28909,"Ġcoaster":28910,"Ġ342":28911,"ĠAcquisition":28912,"mone":28913,"Ġpenchant":28914,"Brian":28915,"Gh":28916,"Pres":28917,"enei":28918,"Ġreefs":28919,"ĠMaver":28920,"Ġdevised":28921,"ĠIMP":28922,"vict":28923,"Ġagility":28924,"ĠPayments":28925,"respected":28926,"Ġtuning":28927,"ĠFACE":28928,"actions":28929,"Ġyell":28930,"ĠLeaving":28931,"Ġsnowy":28932,"Saudi":28933,"Ġformations":28934,"Ġairborne":28935,"Ġdeed":28936,"ooks":28937,"Ġnamesake":28938,"Ġpunishable":28939,"Ġagg":28940,"oths":28941,"ĠFamous":28942,"ĠDeposit":28943,"Ġinduce":28944,"189":28945,"Ġhesitation":28946,"ĠBrowse":28947,"ople":28948,"reys":28949,"henko":28950,"Ġsecretaries":28951,"Ġintersections":28952,"Ġdiminishing":28953,"ints":28954,"Ġ1934":28955,"ĠInvestigative":28956,"ĠMexicans":28957,"ĠMahar":28958,"ibur":28959,"Ġstocking":28960,"gross":28961,"Ġasbestos":28962,"Ġagitation":28963,"ĠBST":28964,"Overall":28965,"Ġheats":28966,"ĠSpan":28967,"Ġimped":28968,"Ġtrusting":28969,"Pet":28970,"Ġegregious":28971,"Ġcomedians":28972,"zin":28973,"WIN":28974,"Ġchats":28975,"Ġexploding":28976,"ĠTort":28977,"Ġembraces":28978,"Ġneut":28979,"verson":28980,"ouncing":28981,"ĠFiber":28982,"Ġbaker":28983,"Ġunstoppable":28984,"ĠDial":28985,"cars":28986,"Marc":28987,"164":28988,"volt":28989,"Ġceased":28990,"EFF":28991,"Ġpromoters":28992,"Ġcircuits":28993,"Ġexcise":28994,"Ġseminars":28995,"ĠTiny":28996,"ĠImportant":28997,"ĠTup":28998,"Ġoutburst":28999,"ĠSOC":29000,"ĠWWII":29001,"Ġmerging":29002,"highly":29003,"ĠGmail":29004,"ozy":29005,"ĠKB":29006,"Ġlaboratories":29007,"knit":29008,"ĠClosed":29009,"Ġsurrounds":29010,"ĠVet":29011,"Ġcere":29012,"vard":29013,"ĠDeadpool":29014,"text":29015,"Ġinfusion":29016,"Ġcuc":29017,"ĠAtl":29018,"Ġbustling":29019,"ĠSettings":29020,"Ġ193":29021,"ryan":29022,"184":29023,"186":29024,"Ġswat":29025,"rane":29026,"Ġepidem":29027,"lando":29028,"Ġtestifying":29029,"Ġmoistur":29030,"ĠTens":29031,"Ġexemplary":29032,"ĠPump":29033,"Ġforcefully":29034,"ĠFare":29035,"Ġcomplicate":29036,"Fe":29037,"Di":29038,"ĠThy":29039,"Ġcompartment":29040,"ĠFiesta":29041,"Would":29042,"fitted":29043,"Ġcull":29044,"Ġcomedic":29045,"cyl":29046,"Ġwhichever":29047,"stic":29048,"Ġ213":29049,"Ġspills":29050,"Ġplasma":29051,"Ġdisguise":29052,"ĠCompass":29053,"ĠImmun":29054,"Ġscarf":29055,"Ġdisperse":29056,"Ġreckon":29057,"ĠTaste":29058,"root":29059,"ĠGAME":29060,"xx":29061,"Ġhomophobic":29062,"Ġdimin":29063,"/#":29064,"Ġ178":29065,"Ġgems":29066,"lio":29067,"informed":29068,"ample":29069,"XT":29070,"Ġrepression":29071,"ĠTakes":29072,"Ġhabitats":29073,"Ġmountainous":29074,"ĠMcH":29075,"ENC":29076,"Mobil":29077,"Ġreel":29078,"ĠTI":29079,"Ġauthorize":29080,"ĠAccept":29081,"ĠMetall":29082,"CCC":29083,"Ġwetlands":29084,"ĠWitch":29085,"heading":29086,"Ġintervals":29087,"ĠWitt":29088,"hene":29089,"Ġcomforting":29090,"ollen":29091,"ERN":29092,"ooky":29093,"etch":29094,"Ġassailant":29095,"announced":29096,"elin":29097,"plate":29098,"920":29099,"eating":29100,"induced":29101,"ĠIgor":29102,"ĠAmph":29103,"Ġpatented":29104,"posing":29105,"Ġextraordinarily":29106,"Ġfearless":29107,"mortem":29108,"ĠDraw":29109,"ĠRend":29110,"Son":29111,"ridden":29112,"ĠAdvantage":29113,"Ġ305":29114,"Ġroared":29115,"Str":29116,"Ġradioactive":29117,"Ġslur":29118,"ĠRear":29119,"affles":29120,"ĠPon":29121,"Ġost":29122,"umbs":29123,"ĠSlack":29124,"athom":29125,"baby":29126,"213":29127,"ĠSpending":29128,"ĠAccordingly":29129,"Ġclocks":29130,"archs":29131,"Ġsmugg":29132,"Ġmastermind":29133,"ĠKlaus":29134,"alpha":29135,"Ġspoiled":29136,"264":29137,"Pod":29138,"Ġflared":29139,"Ġcomposure":29140,"ĠCAM":29141,"Ġrestruct":29142,"Ġtasted":29143,"ĠKimber":29144,"Ġupheaval":29145,"CHAR":29146,"ĠGeo":29147,"itations":29148,"Ġbegged":29149,"UX":29150,"Authorities":29151,"ĠEngel":29152,"ĠHOME":29153,"Ġratt":29154,"Ġquickest":29155,"475":29156,"ĠSting":29157,"ĠICO":29158,"yu":29159,"Ġdefy":29160,"Prince":29161,"cards":29162,"Ġovertake":29163,"Ġretrieved":29164,"ĠNavajo":29165,"Ġpastry":29166,"ĠLange":29167,"Ġentrusted":29168,"ĠCull":29169,"aler":29170,"Ġdinosaurs":29171,"Ġbragging":29172,"ĠAlley":29173,"meier":29174,"ĠAssuming":29175,"Ġana":29176,"omatic":29177,"Brend":29178,"acted":29179,"Ġexhaustive":29180,"Ġunfit":29181,"Several":29182,"gap":29183,"Ġtet":29184,"228":29185,"Sk":29186,"302":29187,"Ġdeflect":29188,"Ġ179":29189,"226":29190,"Ġadorned":29191,"ĠSpread":29192,"Ġthirds":29193,"ĠSemi":29194,"Ġdescend":29195,"Ġaccumulate":29196,"Ġflavours":29197,"Ġinvoked":29198,"ĠAnge":29199,"Ġprofess":29200,"unks":29201,"ĠKickstarter":29202,"ENTS":29203,"ĠRw":29204,"Ġchatter":29205,"ĠPOS":29206,"Ġcollaborators":29207,"ĠEW":29208,"ĠMarkus":29209,"Ġimpair":29210,"Ġbolt":29211,"Ġglue":29212,"Ġloosely":29213,"ĠSUM":29214,"Ġhydraulic":29215,"Ġpredatory":29216,"Charles":29217,"cond":29218,"Ġspawned":29219,"Fr":29220,"174":29221,"Ġtame":29222,"Ġaggrav":29223,"Ġchrist":29224,"true":29225,"ivable":29226,"Ġhen":29227,"ĠKut":29228,"Ġskyrocket":29229,"Ġeg":29230,"Ġveterinarian":29231,"ĠStats":29232,"Kit":29233,"Ġbiologist":29234,"Spe":29235,"Ġantenna":29236,"Ġsust":29237,"fill":29238,"Ġpayload":29239,"227":29240,"Ġlivestream":29241,"ORN":29242,"ĠAbel":29243,"Ġdeception":29244,"ussen":29245,"Britain":29246,"partisan":29247,"Ġbrowse":29248,"Ġmelan":29249,"172":29250,"ĠNumerous":29251,"ĠMansion":29252,"Ġassailants":29253,"£":29254,"olerance":29255,"Ġdirectives":29256,"ĠInteg":29257,"zers":29258,"Ġduct":29259,"ĠHonestly":29260,"ĠImmediately":29261,"ixty":29262,"Ġdiagnose":29263,"Ġimplication":29264,"ĠiPads":29265,"testers":29266,"riots":29267,"Ġrespons":29268,"XP":29269,"pes":29270,"875":29271,"Ġ199":29272,"ĠPoe":29273,"303":29274,"Ġailments":29275,"ĠCarrier":29276,"Ġeject":29277,"Ġrestroom":29278,"Drive":29279,"manufact":29280,"Ġcompens":29281,"Ġglossy":29282,"Ġrecovers":29283,"Ġthinner":29284,"Ġdescendants":29285,"antle":29286,"Beaut":29287,"competitive":29288,"ĠRobotics":29289,"Ġpretext":29290,"233":29291,"Ġflanked":29292,"ĠâĻ":29293,"Ġguts":29294,"Ġwee":29295,"Ġaccents":29296,"mc":29297,"Ġgrapp":29298,"ĠNathaniel":29299,"ĠMikhail":29300,"Ġobligated":29301,"Ġmanoeuv":29302,"Ġechoing":29303,"Ġ189":29304,"ĠDevice":29305,"isd":29306,"Ġloopholes":29307,"Ġbehold":29308,"ĠMerry":29309,"Ġfunn":29310,"Ġnuanced":29311,"667":29312,"ELY":29313,"ĠTasmania":29314,"ĠSaddam":29315,"Ġquizz":29316,"military":29317,"cient":29318,"Ġoutlaw":29319,"ĠAudit":29320,"ĠBoom":29321,"Ġcrim":29322,"asured":29323,"ĠApps":29324,"ĠKush":29325,"onica":29326,"Ġamput":29327,"signed":29328,"ĠMEN":29329,"ĠRosenberg":29330,"Ġvide":29331,"ĠDirection":29332,"Ġfountain":29333,"TW":29334,"ĠCARE":29335,"Ġreassured":29336,"Food":29337,"Ġdepressing":29338,"ĠWhilst":29339,"reatment":29340,"Ġspelled":29341,"Ġhipp":29342,"ĠPeach":29343,"hound":29344,"Harry":29345,"Ġcatalogue":29346,"ĠCommun":29347,"Ġnurture":29348,"rush":29349,"ĠPopulation":29350,"ĠNTS":29351,"ĠElectrical":29352,"rounded":29353,"Ġblending":29354,"Ġ223":29355,"alities":29356,"ilation":29357,"eas":29358,"estate":29359,"Ġnarrowing":29360,"ĠTreasure":29361,"192":29362,"Ġwhims":29363,"Ġrobber":29364,"Ġsoaked":29365,"nian":29366,"Ġcongest":29367,"ĠYosemite":29368,"notes":29369,"icer":29370,"ĠGuardians":29371,"ĠFrozen":29372,"Ġ187":29373,"Ġhandcuffs":29374,"Someone":29375,"Ġenshr":29376,"gency":29377,"ĠCube":29378,"Ġprinters":29379,"Ġundercut":29380,"ĠSolution":29381,"rosis":29382,"ĠHumanity":29383,"Ġsucks":29384,"ĠSick":29385,"Tax":29386,"Ġtablespoon":29387,"ĠTrin":29388,"ĠArchive":29389,"Mom":29390,"ĠSAY":29391,"Ġdrifting":29392,"ĠFarage":29393,"Ġforging":29394,"WM":29395,"ĠEleanor":29396,"USH":29397,"Ġemph":29398,"Ġcareless":29399,"Ġspew":29400,"Ġinsensitive":29401,"Ġawhile":29402,"Ġcit":29403,"opened":29404,"ĠFem":29405,"Ġvapor":29406,"Ġdownt":29407,"ylene":29408,"Ġclut":29409,"Ġculp":29410,"1990":29411,"Ġdisgruntled":29412,"Students":29413,"uttering":29414,"gyn":29415,"vre":29416,"Ġrapes":29417,"division":29418,"ĠCalendar":29419,"tal":29420,"icts":29421,"caliber":29422,"ĠFighters":29423,"ĠUnc":29424,"163":29425,"ĠRogue":29426,"Ġregistrations":29427,"Ġundermines":29428,"ĠPunch":29429,"Ġdramas":29430,"176":29431,"Ġslider":29432,"ĠFlore":29433,"ر":29434,"Ġbru":29435,"inelli":29436,"Ġdisparities":29437,"ا":29438,"Ġreferrals":29439,"ĠCharges":29440,"Ġbreeds":29441,"ĠMEP":29442,"288":29443,"Ġmouths":29444,"Ġsideways":29445,"Ġbelievers":29446,"ppard":29447,"Ġhotter":29448,"Ġunderestimated":29449,"Ġjelly":29450,"525":29451,"ĠCMS":29452,"ĠWeiner":29453,"Ġguarding":29454,"Ġampl":29455,"ĠKidd":29456,"UF":29457,"orient":29458,"max":29459,"Ash":29460,"Ġwander":29461,"Ġ..........":29462,"ĠDempsey":29463,"ĠToken":29464,"chat":29465,"Justin":29466,"equipped":29467,"ĠBI":29468,"Ġsins":29469,"Ġnond":29470,"ursion":29471,"Ġcoc":29472,"Ġmailing":29473,"ĠArchitect":29474,"Ġhaunting":29475,"Ġpont":29476,"Ġascertain":29477,"Ġwig":29478,"Ġskysc":29479,"Ġarg":29480,"ĠItalians":29481,"/?":29482,"Ġ----------------------------------------------------------------":29483,"ĠPrecision":29484,"EPA":29485,"Ġhotly":29486,"Ġcircumvent":29487,"ĠEcc":29488,"Ġmerch":29489,"akov":29490,"Ġunab":29491,"heres":29492,"Ġsubcommittee":29493,"ĠDiscuss":29494,"ĠChallenger":29495,"crafted":29496,"Ġcanine":29497,"osphere":29498,"Ġspider":29499,"Ġteachings":29500,"atos":29501,"Ġuniversally":29502,"Ġturbine":29503,"ĠLO":29504,"ĠMAG":29505,"Ġpassers":29506,"Ġroundup":29507,"Ġdenounce":29508,"ĠSpiegel":29509,"until":29510,"Ġshaved":29511,"Ġdisdain":29512,"Nazi":29513,"Ġnewfound":29514,"Ġspontaneous":29515,"Ġmash":29516,"ĠDispatch":29517,"Ġsunrise":29518,"ogged":29519,"Ġfuss":29520,"Ġeas":29521,"acci":29522,"ĠTarg":29523,"Ġhash":29524,"lict":29525,"Ġmisc":29526,"ĠSched":29527,"guy":29528,"linger":29529,"warm":29530,"ipel":29531,"ĠGork":29532,"Ġdispatcher":29533,"Ġ315":29534,"Ġfinely":29535,"Ġreliably":29536,"Ġrupt":29537,"Ġnegligent":29538,"Ġendorsements":29539,"ĠOrient":29540,"Ġelectro":29541,"haired":29542,"Ġphysique":29543,"wine":29544,"Ġadolescents":29545,"Ġ184":29546,"alth":29547,"Ġvalidated":29548,"izzard":29549,"ĠPeck":29550,"Ġemblem":29551,"status":29552,"ĠJungle":29553,"orius":29554,"Ġeccentric":29555,"Ġfolding":29556,"poor":29557,"ĠTHC":29558,"appers":29559,"Ġscripted":29560,"239":29561,"ĠPreferred":29562,"digital":29563,"Ġsharper":29564,"Ġportrays":29565,"rative":29566,"238":29567,"Ġ183":29568,"Ġuneasy":29569,"ĠRI":29570,"Ġvil":29571,"171":29572,"Ġspoil":29573,"ĠPricing":29574,"ĠHardware":29575,"Ġ188":29576,"Ġhorrendous":29577,"Ġostensibly":29578,"nah":29579,"Ġgadget":29580,"ADS":29581,"coat":29582,"Ġexhausting":29583,"Ġdraining":29584,"arate":29585,"ĠBulgarian":29586,"emo":29587,"Ġhier":29588,"Ġguitars":29589,"ieties":29590,"assed":29591,"ĠYaz":29592,"Ġaggress":29593,"ĠBG":29594,"vik":29595,"Ġneatly":29596,"Ġpixel":29597,"Ġintimacy":29598,"ĠRug":29599,"Ġ512":29600,"Ġnarrated":29601,"Ġmast":29602,"ĠNos":29603,"ĠHung":29604,"reciation":29605,"ĠChandra":29606,"Ġbios":29607,"ĠEnded":29608,"lique":29609,"ĠCambod":29610,"Ġworrisome":29611,"ĠEQ":29612,"Ġnovelist":29613,"ĠDynamic":29614,"ĠMIC":29615,"Ġdisposed":29616,"Ġbrackets":29617,"Ġhaircut":29618,"ĠLana":29619,"Ġlull":29620,"Ġbillboard":29621,"ĠReverend":29622,"ĠNAV":29623,"borgh":29624,"Ġadrenaline":29625,"Ġseeming":29626,"ĠPCB":29627,"ĠBridgewater":29628,"Ġsquirrel":29629,"262":29630,"write":29631,"Ġstabilization":29632,"wild":29633,"Ġsecession":29634,"Ġpacket":29635,"AMES":29636,"licted":29637,"Ġmalnutrition":29638,"claimed":29639,"Ġcharred":29640,"Ġtragically":29641,"Published":29642,"Ġrepealed":29643,"ĠSawyer":29644,"ĠMormon":29645,"resolution":29646,"ĠSaud":29647,"Henry":29648,"Ġdiscontin":29649,"Ġsnag":29650,"danger":29651,"Ġmixes":29652,"Ġupbringing":29653,"Ġlimb":29654,"ĠFantastic":29655,"Sim":29656,"ĠAugustine":29657,"ĠGreeks":29658,"cod":29659,"ĠHistorically":29660,"mire":29661,"register":29662,"ĠKund":29663,"Ġdebilitating":29664,"Chat":29665,"ĠTau":29666,"ï":29667,"lower":29668,"pie":29669,"Ġ430":29670,"Ġnascent":29671,"Ġ375":29672,"Ġbum":29673,"WI":29674,"Netflix":29675,"whether":29676,"Ġdearly":29677,"eff":29678,"PRES":29679,"Ġlandmarks":29680,"Ġculminating":29681,"Ġmigrate":29682,"balanced":29683,"Ġregulars":29684,"Ġmodification":29685,"Ġdips":29686,"ĠRedmond":29687,"ationally":29688,"atsu":29689,"Ġphilosophical":29690,"Ġtyping":29691,"Ġunreal":29692,"Ġboiled":29693,"Ġblight":29694,"Ġdru":29695,"ĠGaddafi":29696,"Ġnour":29697,"Ġsequential":29698,"Ġaugment":29699,"ĠEuras":29700,"ĠWiley":29701,"endar":29702,"Ġacronym":29703,"esteem":29704,"ĠMajesty":29705,"Ġgrips":29706,"Ġobsolete":29707,"nos":29708,"Made":29709,"ogie":29710,"ĠLiver":29711,"ĠDonetsk":29712,"Ġdynam":29713,"tel":29714,"bring":29715,"Ġknit":29716,"Ġfirepower":29717,"Ġprepaid":29718,"ĠRaphael":29719,"Ġsensing":29720,"720":29721,"WN":29722,"Nor":29723,"puted":29724,"Ġbureaucrats":29725,"ĠAdjust":29726,"Ġintensely":29727,"Ġsunscreen":29728,"Ho":29729,"ĠYelp":29730,"ĠPU":29731,"ĠSerge":29732,"ĠCyp":29733,"ELF":29734,"ĠGuns":29735,"Ġteamwork":29736,"ĠBib":29737,"ĠMaintenance":29738,"perate":29739,"Ġwiping":29740,"Ġcharcoal":29741,"ordan":29742,"International":29743,"Ġbehaving":29744,"Ġsoftened":29745,"ĠIncreased":29746,"Ġunfl":29747,"470":29748,"Ġinformative":29749,"Ġnovelty":29750,"Ġavoidance":29751,"Ġteasing":29752,"matic":29753,"Ġmaid":29754,"ĠPell":29755,"Ġcounterterrorism":29756,"ĠGabe":29757,"ications":29758,"ĠConnection":29759,"ĠInquiry":29760,"isin":29761,"orama":29762,"Ġcorpse":29763,"Ġpractitioner":29764,"itto":29765,"UA":29766,"Ġforestry":29767,"Ġlic":29768,"Ġrevolves":29769,"Ġcalculating":29770,"Ġpuppet":29771,"ulously":29772,"ĠPebble":29773,"Dep":29774,"Ġupholding":29775,"Ġcarving":29776,"Ġwartime":29777,"Ġenvy":29778,"Ġencro":29779,"ĠPunk":29780,"ĠAdminist":29781,"ucha":29782,"Ġbattleground":29783,"Ġlol":29784,"uable":29785,"Ġunheard":29786,"ĠSpur":29787,"phony":29788,"Ġcarc":29789,"ĠSut":29790,"Ġpollutants":29791,"Cr":29792,"Ġvigorous":29793,"355":29794,"ĠMarriage":29795,"Ġstaffed":29796,"fecture":29797,"ĠArabs":29798,"supported":29799,"Ġmanpower":29800,"ĠSatellite":29801,"None":29802,"Ġqueues":29803,"Ġinsightful":29804,"Ġinterchange":29805,"Rel":29806,"Ġsolemn":29807,"Ġsmuggled":29808,"upt":29809,"Ġ171":29810,"Ġparallels":29811,"intelligence":29812,"punk":29813,"Ġrecycle":29814,"Ġdecorative":29815,"Ġshar":29816,"arrell":29817,"iances":29818,"ĠBolivia":29819,"Ġstrengthens":29820,"430":29821,"Ġhardships":29822,"Ġsignalling":29823,"Ġunthinkable":29824,"READ":29825,"Ġtad":29826,"picked":29827,"Ġarmor":29828,"Ġcores":29829,"ĠMatrix":29830,"Ġdj":29831,"Ġevolutionary":29832,"ĠBermuda":29833,"OE":29834,"organized":29835,"Ġrelentlessly":29836,"sol":29837,"ĠMamm":29838,"Ġpounding":29839,"Weather":29840,"Ġrab":29841,"Ġsweets":29842,"funding":29843,"ĠHUD":29844,"ĠSoldier":29845,"reed":29846,"released":29847,"Ġcontainment":29848,"alid":29849,"ĠNikon":29850,"Ġcervical":29851,"Ġign":29852,"Ġalias":29853,"Ġoptimized":29854,"Ġasserting":29855,"ĠAFTER":29856,"Ġflatt":29857,"Ġdinosaur":29858,"ĠRefugees":29859,"ĠAnch":29860,"Ġadjustable":29861,"Ġroaring":29862,"Ġpilgrimage":29863,"Ġcowboy":29864,"Ġentails":29865,"ractions":29866,"EY":29867,"undy":29868,"ĠKuh":29869,"inges":29870,"ĠTerra":29871,"ĠEscape":29872,"Ġrundown":29873,"Ġstriped":29874,"KN":29875,"ocations":29876,"IDENT":29877,"IGH":29878,"Ġavoids":29879,"Moh":29880,"ĠLS":29881,"lbs":29882,"ĠAttempt":29883,"Ġtriangle":29884,"Ġclimax":29885,"Ġhp":29886,"Ġallot":29887,"learning":29888,"ĠJFK":29889,"Justice":29890,"OUT":29891,"ĠHER":29892,"ĠLect":29893,"Ġtrench":29894,"edar":29895,"Ġreservoirs":29896,"uid":29897,"rf":29898,"162":29899,"Ġinterfered":29900,"Ġemit":29901,"these":29902,"444":29903,"ĠLeather":29904,"essing":29905,"ĠEighth":29906,"uckle":29907,"Breaking":29908,"Ġunresolved":29909,"Ġgoose":29910,"252":29911,"platform":29912,"atus":29913,"Ġcomplexion":29914,"ĠBUS":29915,"Ġstruct":29916,"middle":29917,"Sat":29918,"ĠWHERE":29919,"LB":29920,"redible":29921,"vered":29922,"Louis":29923,"ĠBaz":29924,"Eye":29925,"safety":29926,"Ġhypothetical":29927,"Ġbowel":29928,"Ġuntouched":29929,"312":29930,"ĠPric":29931,"Ġastounding":29932,"meet":29933,"Aaron":29934,"ĠWoo":29935,"236":29936,"ĠShape":29937,"Ġdrifted":29938,"Ġtile":29939,"ĠGrim":29940,"Ġundeniable":29941,"Ġ..":29942,"Ġradius":29943,"Ġovarian":29944,"ĠSeriously":29945,"verning":29946,"Ġassertions":29947,"oxic":29948,"231":29949,"ĠViz":29950,"Jackson":29951,"ĠSno":29952,"Ġboycot":29953,"okingly":29954,"ousse":29955,"proclaimed":29956,"Ġblazing":29957,"Ġinefficient":29958,"Ġfig":29959,"Ġbooze":29960,"259":29961,"agus":29962,"statement":29963,"Ġlocom":29964,"Ġtacos":29965,"Ġmemos":29966,"gender":29967,"ĠOrt":29968,"263":29969,"Ġintervening":29970,"Soc":29971,"University":29972,"ĠPis":29973,"ĠReturns":29974,"ĠPAN":29975,"Ġultrasound":29976,"Ġcoherent":29977,"tracking":29978,"rieved":29979,"383":29980,"Ġqualitative":29981,"uld":29982,"ĠGiovanni":29983,"Ġstorylines":29984,"Ġdarkest":29985,"Ġvelvet":29986,"RIP":29987,"Ġcompatibility":29988,"Ġtroll":29989,"CN":29990,"Found":29991,"ĠOu":29992,"Ġtease":29993,"Ġvested":29994,"Ġprovocation":29995,"Ġimprovised":29996,"Ġactivation":29997,"unte":29998,"ĠMonteneg":29999,"ĠJOHN":30000,"ĠReact":30001,"Ġpolluted":30002,"217":30003,"Ġmushroom":30004,"Ġdisconnected":30005,"ĠVoices":30006,"asu":30007,"Ġsensory":30008,"REE":30009,"Ġmonarchy":30010,"Ġ173":30011,"doing":30012,"involved":30013,"ĠJonah":30014,"Ġtoxins":30015,"Ġtv":30016,"Ġacademia":30017,"IQ":30018,"Mor":30019,"ĠStraight":30020,"ĠRN":30021,"ĠâĹı":30022,"Ġpear":30023,"187":30024,"Ġendeavors":30025,"ĠTurbo":30026,"Ġducks":30027,"ĠRamsay":30028,"Ġoutpatient":30029,"Ġcomprehend":30030,"UNE":30031,"Ġbriefings":30032,"total":30033,"Ġmigr":30034,"always":30035,"Ġmoot":30036,"ĠRider":30037,"Ġbiblical":30038,"Form":30039,"Ġcurry":30040,"Ġexquisite":30041,"385":30042,"244":30043,"Ġattendants":30044,"Ġcabinets":30045,"nton":30046,"Baby":30047,"Honestly":30048,"ĠFIRE":30049,"211":30050,"itech":30051,"ĠProsper":30052,"Ġchops":30053,"odic":30054,"Rod":30055,"job":30056,"orset":30057,"ĠAry":30058,"obic":30059,"ĠNil":30060,"isable":30061,"Ġorche":30062,"Ġtrivial":30063,"ĠZy":30064,"ĠXP":30065,"Ġendorsing":30066,"ĠLIM":30067,"adish":30068,"237":30069,"ĠLaws":30070,"heid":30071,"ĠSignature":30072,"ĠVern":30073,"ĠBland":30074,"ansk":30075,"Ġrepository":30076,"ĠPetra":30077,"Enter":30078,"Ġtruths":30079,"Ġbordering":30080,"Ġpenn":30081,"Ġsimplified":30082,"zn":30083,"ĠCree":30084,"Ġ181":30085,"Hi":30086,"ĠGreenberg":30087,"Ġprematurely":30088,"ĠSass":30089,"Ġwrecked":30090,"Ġheinous":30091,"415":30092,"Turn":30093,"zl":30094,"amental":30095,"ĠBraz":30096,"fing":30097,"ĠAngle":30098,"ĠPhantom":30099,"agra":30100,"ĠShack":30101,"Ġhomegrown":30102,"Ġalright":30103,"AME":30104,"ĠKN":30105,"Ġclicks":30106,"Ġmanned":30107,"ĠScope":30108,"Ġextras":30109,"Ġclinicians":30110,"321":30111,"African":30112,"Ġjuices":30113,"Ġrefere":30114,"****":30115,"ambling":30116,"since":30117,"Ġvoic":30118,"QB":30119,"ĠAtmospheric":30120,"Mat":30121,"Ġperpetrated":30122,"ĠSteps":30123,"Fit":30124,"Ġsilenced":30125,"Ġbonded":30126,"Ġquantify":30127,"Houston":30128,"ocracy":30129,"Ġfreeing":30130,"pipe":30131,"corn":30132,"rones":30133,"ooked":30134,"ĠSuz":30135,"Ġunaccount":30136,"196":30137,"Ġlogos":30138,"ĠFurious":30139,"ĠSpart":30140,"urst":30141,"itri":30142,"ĠZub":30143,"ĠActual":30144,"Ġslee":30145,"Ġgag":30146,"Ġmetabolism":30147,"ĠDesigned":30148,"Ġpedigree":30149,"Ġcoolest":30150,"âĿ":30151,"iuses":30152,"ĠYellowstone":30153,"Ġinformant":30154,"Ġushered":30155,"ĠGarg":30156,"thel":30157,"Hop":30158,"Ġrepetitive":30159,"flag":30160,"Ġunmarked":30161,"ĠBrave":30162,"Ġincur":30163,"reading":30164,"ppel":30165,"lah":30166,"ateurs":30167,"286":30168,"ĠAtomic":30169,"Ġappliance":30170,")'":30171,"traditional":30172,"Ġdads":30173,"Ġregimen":30174,"Ġinfrared":30175,"Ġdotted":30176,"Ġtails":30177,"Ġhorrors":30178,"uments":30179,"Ġdub":30180,"lighting":30181,"Ġunearthed":30182,"assisted":30183,"ĠSpiel":30184,"trial":30185,"Ġpersever":30186,"MAX":30187,"Ġicing":30188,"Energy":30189,"Ġ1943":30190,"move":30191,"Error":30192,"Ġliter":30193,"ĠCly":30194,"Ari":30195,"Ġgranite":30196,"Ġcropped":30197,"ĠRD":30198,"ĠREM":30199,"TX":30200,"Ġdispleasure":30201,"ĠComfort":30202,"Ġunsettling":30203,"Ġscratching":30204,"866":30205,"eton":30206,"560":30207,"Ġcommonplace":30208,"Ġreproduced":30209,"ggie":30210,"Ġschooling":30211,"Ġreprim":30212,"Ġdarling":30213,"huge":30214,"ĠDante":30215,"cp":30216,"heastern":30217,"Ġeduc":30218,"Digital":30219,"Ġwrath":30220,"Ġwatering":30221,"ĠTail":30222,"Ġdegradation":30223,"530":30224,"usive":30225,"ĠXu":30226,"ĠAH":30227,"Ġclassy":30228,"ĠSET":30229,"Ġcriminally":30230,"dependent":30231,"ĠAlps":30232,"Ġnotwithstanding":30233,"Ġfamiliarity":30234,"ĠAPP":30235,"aurus":30236,"gments":30237,"Mid":30238,"Ġepilepsy":30239,"Ġresemblance":30240,"brush":30241,"Ġ333":30242,"Ġliberated":30243,"ĠBeng":30244,"ĠLans":30245,"Ġtraff":30246,"ihu":30247,"establish":30248,"Ġcort":30249,"Rick":30250,"Ġplugged":30251,"onement":30252,"ĠAccounting":30253,"Ġreconstruct":30254,"Pop":30255,"Ġincapable":30256,"aho":30257,"ĠDexter":30258,"Ġpitted":30259,"Ġbathing":30260,"Ġdun":30261,"Ġexplor":30262,"ĠMidnight":30263,"Ġactiv":30264,"iann":30265,"likely":30266,"acons":30267,"owicz":30268,"Ġnegativity":30269,"Ġfreel":30270,"ewitness":30271,"Ġinj":30272,"Stephen":30273,"Ġshredded":30274,"Ġprepar":30275,"Script":30276,"Ġcorrectional":30277,"Ġcommits":30278,"hai":30279,"activity":30280,"Imp":30281,"Ġstumble":30282,"Ġcache":30283,"ĠPromise":30284,"Ġprecinct":30285,"Ġmulticultural":30286,"Ġsubstitutes":30287,"Ġshortened":30288,"ovable":30289,"Ġfasting":30290,"Ġinfused":30291,"Ġbulldo":30292,"alm":30293,"Ġadjoining":30294,"Ġmultiplayer":30295,"ĠAlien":30296,"Ġpund":30297,"ethyl":30298,"Ġbliss":30299,"ĠDecision":30300,"Ġbab":30301,"Ġangrily":30302,"another":30303,"oled":30304,"ainted":30305,"ĠPriest":30306,"Ġdraped":30307,"ĠPersonally":30308,"Ġstomp":30309,"ĠWolfgang":30310,"Ġoste":30311,"itches":30312,"Ġhoops":30313,"ĠJO":30314,"Ġsche":30315,"ĠZan":30316,"Ġcleans":30317,"Ġclimbs":30318,"Ġelectronically":30319,"243":30320,"ocy":30321,"gall":30322,"ĠREAL":30323,"Ġmurky":30324,"Ġmodernization":30325,"tub":30326,"Really":30327,"Ġlax":30328,"Ġdoubted":30329,"yden":30330,"ĠPrevent":30331,"UTERS":30332,"Ġoverride":30333,"ĠSAF":30334,"Ġcoun":30335,"Ġexcerpts":30336,"Ġmotivations":30337,"Ġdecency":30338,"Ġastronomers":30339,"orical":30340,"Ġaltering":30341,"Ġ232":30342,"described":30343,"omic":30344,"Ġexh":30345,"Ġknocks":30346,"ĠRiot":30347,"ĠPurs":30348,"equal":30349,"pleting":30350,"llan":30351,"ĠSOL":30352,"iator":30353,"ILE":30354,"ĠWM":30355,"Ġdefences":30356,"Ġforearm":30357,"Toronto":30358,"526":30359,"Ġacne":30360,"Ġthirteen":30361,"itiz":30362,"akable":30363,"charges":30364,"Ġinaction":30365,"Ġbred":30366,"Ġdeficiency":30367,"Ġintrigue":30368,"opoly":30369,"ĠCamer":30370,"ĠMelt":30371,"Ġunlawfully":30372,"Ġpenetrate":30373,"ĠUsed":30374,"ĠDirty":30375,"Ġexcerpt":30376,"ĠYen":30377,"ĠCARD":30378,"Ġcher":30379,"ĠChallenges":30380,"ieves":30381,"Ġambush":30382,"Data":30383,"eeks":30384,"Ġgiveaway":30385,"Ġpawn":30386,"Ġtransf":30387,"renched":30388,"Ġmoderately":30389,"Ġnumbered":30390,"ĠIntegrity":30391,"ĠHOU":30392,"ĠHDMI":30393,"Royal":30394,"LT":30395,"ĠDirk":30396,"izon":30397,"Ġ227":30398,"Ġdisagrees":30399,"ĠNinth":30400,"Ġincrement":30401,"ĠGlory":30402,"suff":30403,"Ġartery":30404,"ĠEmployee":30405,"bum":30406,"ĠEditorial":30407,"Kh":30408,"ĠPremiere":30409,"ĠWeld":30410,"ĠIncluded":30411,"Ġmathematical":30412,"Ġexponentially":30413,"Ġhandwritten":30414,"ĠMAS":30415,"Ġindiscrim":30416,"Ġnutrient":30417,"ĠSelection":30418,"Ġ219":30419,"hyd":30420,"Ġdeton":30421,"æ":30422,"dark":30423,"ĠFidel":30424,"Ġmonkeys":30425,"Ġnutritious":30426,"Ġheadlights":30427,"oller":30428,"piring":30429,"ĠDefenders":30430,"Ġdrown":30431,"elong":30432,"Ġfloats":30433,"graduate":30434,"Ġprosper":30435,"ĠNamed":30436,"ĠEating":30437,"ECK":30438,"establishment":30439,"XM":30440,"Ġsoaking":30441,"278":30442,"Ġlistener":30443,"Ġsimultaneous":30444,"olutions":30445,"payer":30446,"Ġcustomize":30447,"ĠROCK":30448,"Ġaltar":30449,"ĠExercise":30450,"anky":30451,"ĠProfession":30452,"sever":30453,"ĠMerchant":30454,"RF":30455,"ĠCombat":30456,"Ġlegality":30457,"fledged":30458,"Ġdiapers":30459,"lves":30460,"Ġlur":30461,"Ġignores":30462,"ĠProtocol":30463,"Ġrepresentations":30464,"ĠBlumenthal":30465,"ĠLime":30466,"romptu":30467,"Ġbesieged":30468,"dl":30469,"Ġsighting":30470,"ĠParm":30471,"ĠServer":30472,"ĠBenghazi":30473,"estival":30474,"Ġplaylist":30475,"ĠUng":30476,"ĠQuantum":30477,"Ġcompromises":30478,"ĠSurvivor":30479,"ĠMobility":30480,"Ġbounty":30481,"ophers":30482,"ISA":30483,"need":30484,"uese":30485,"Ġorn":30486,"218":30487,"Ġ530":30488,"Ġbuddies":30489,"Ġagendas":30490,"ĠFeldman":30491,"ĠÃĸ":30492,"ĠBMC":30493,"ĠServe":30494,"Ent":30495,"ĠKH":30496,"ĠINT":30497,"Ġlittered":30498,"Ġvisitation":30499,"mist":30500,"Ġdupl":30501,"Ġrouted":30502,"ĠAmount":30503,"Dev":30504,"ĠConv":30505,"Ġslams":30506,"ĠVeterinary":30507,"bold":30508,"Ġ186":30509,"ĠDOT":30510,"builder":30511,"Ġdecay":30512,"ĠHemp":30513,"pelled":30514,"Ġmankind":30515,"Tonight":30516,"Ġeffortlessly":30517,"ĠBUT":30518,"Ġhostilities":30519,"formerly":30520,"alon":30521,"ĠCrash":30522,"humane":30523,"Ġmayhem":30524,"ĠBudd":30525,"Ġdisinformation":30526,"Ġ226":30527,"Ġprototypes":30528,"__":30529,"IVERS":30530,"izzy":30531,"ĠMight":30532,"ĠPip":30533,"pour":30534,"INO":30535,"ĠLL":30536,"Ġwiret":30537,"Ġresorted":30538,"ĠTanaka":30539,"ĠDOES":30540,"Earlier":30541,"HO":30542,"Ġmoniker":30543,"ĠFang":30544,"ĠHua":30545,"bered":30546,"adding":30547,"194":30548,"STR":30549,".\")":30550,"cop":30551,"ĠFlags":30552,"ĠColleges":30553,"ĠUz":30554,"Ġsparks":30555,"Ġparadox":30556,"Marie":30557,"Strong":30558,"Ġstrawberry":30559,"Ġnurturing":30560,"Ġfax":30561,"Tor":30562,"killer":30563,"burse":30564,"Ġattachments":30565,"Ġpup":30566,"Ġexhaustion":30567,"Ġwhisky":30568,"isu":30569,"ologically":30570,"iership":30571,"Ġlamps":30572,"Ġshuff":30573,"Ġcentralized":30574,"ĠNeedless":30575,"Ġgrenade":30576,"Ġrouter":30577,"Ġoptics":30578,"ivering":30579,"Ġpioneers":30580,"ĠHug":30581,"Ġhandguns":30582,"010":30583,"Ġbailed":30584,"uana":30585,"197":30586,"Ġdistorted":30587,"ĠEssentially":30588,"ĠSilent":30589,"Ġcomparative":30590,"Music":30591,"ĠMUS":30592,"Bur":30593,"ĠComet":30594,"ĠWinchester":30595,"IGN":30596,"Mod":30597,"ĠCandidate":30598,"Ġdysfunctional":30599,"ĠCeleb":30600,"Ġhitch":30601,"api":30602,"Ġidiot":30603,"Ġunsupported":30604,"gat":30605,"inker":30606,"Ġredevelop":30607,"Ġdwind":30608,"Ġforgetting":30609,"ĠRost":30610,"Ġremembrance":30611,"Na":30612,"mopolitan":30613,"Ġberries":30614,"Ġmarital":30615,"Vol":30616,"ĠClosing":30617,"ĠHindus":30618,"itism":30619,"Ġrover":30620,"Ġmysteries":30621,"ĠNig":30622,"ucing":30623,"Ġfabrication":30624,"Ġgarments":30625,"Ġwield":30626,"ĠCompton":30627,"357":30628,"Ġoxide":30629,"chron":30630,"ĠThought":30631,"Ġcomed":30632,"ĠEpstein":30633,"ĠBART":30634,"orative":30635,"ĠKahn":30636,"adan":30637,"APH":30638,"cum":30639,"Ġloophole":30640,"ĠGoPro":30641,"osit":30642,"Ġspecification":30643,"ĠAPR":30644,"Ġdrains":30645,"Ġconserve":30646,"ĠMorse":30647,"Ġcalorie":30648,"ĠCheney":30649,"station":30650,"Ġevangel":30651,"Ġspraying":30652,"lections":30653,"Ġenclosure":30654,"Ġcommanded":30655,"ĠOrganizations":30656,"Ġimb":30657,"mins":30658,"ĠTobias":30659,"Ve":30660,"ĠNau":30661,"183":30662,"ĠGuantanamo":30663,"173":30664,"Ġrequisite":30665,"Ġderivative":30666,"Ġpopulism":30667,"Ġcultivated":30668,"lord":30669,"uler":30670,"ĠDEA":30671,"inally":30672,"Ġdemonstr":30673,"trip":30674,"ĠFirefox":30675,"246":30676,"confirmed":30677,"Anne":30678,"Ġtamp":30679,"ĠHousehold":30680,"amous":30681,"Meet":30682,"Ġdashed":30683,"pire":30684,"Ġinex":30685,"Ġloosen":30686,"272":30687,"famous":30688,"ĠHeard":30689,"Ġhindsight":30690,"Ġdepot":30691,"ĠCutting":30692,"ĠMouse":30693,"Ġgeological":30694,"number":30695,"OUN":30696,".,\"":30697,"Ġmoderation":30698,"ĠUNHCR":30699,"Ġdomains":30700,"eco":30701,"Ġcrater":30702,"Ġ510":30703,"kid":30704,"Ġcylinders":30705,"ĠClasses":30706,"Kn":30707,"Ġcarcin":30708,"ĠHunting":30709,"irit":30710,"ARP":30711,"anting":30712,"ĠMarino":30713,"ĠRESP":30714,"ifle":30715,"Ġ239":30716,"fman":30717,"Ġtheoretically":30718,"Ġdistraught":30719,"Ġstaircase":30720,"Ġexpel":30721,"Ġlord":30722,"Ġbehaviours":30723,"Ġprescribing":30724,"ographs":30725,"ĠNewly":30726,"Ġpatiently":30727,"Ġskyline":30728,"udos":30729,"Ġrepertoire":30730,"Ġhover":30731,"mint":30732,"Ġclears":30733,"Ġkale":30734,"ĠSco":30735,"ĠCoulter":30736,"Ġpancreat":30737,"pu":30738,"995":30739,"Ġincompetent":30740,"2007":30741,"Ġgripping":30742,"enable":30743,"Ġreinforcing":30744,"ĠFee":30745,"education":30746,"ĠKuro":30747,"Ġbowed":30748,"Ġshave":30749,"ĠMean":30750,"xi":30751,"Ġinciting":30752,"atters":30753,"Ġecstatic":30754,"hog":30755,"Ġclauses":30756,"Ġsubt":30757,"Ġbehaved":30758,"tains":30759,"Liverpool":30760,"Ġstrives":30761,"ĠKev":30762,"ĠFramework":30763,"defined":30764,"Ġrecounts":30765,"array":30766,"tips":30767,"Ġartificially":30768,"fits":30769,"Clearly":30770,"mediate":30771,"Ġunseen":30772,"Ġthugs":30773,"ĠLent":30774,"Ġ1938":30775,"Ġgenital":30776,"ĠSonic":30777,"ĠWarehouse":30778,"pler":30779,"Ġunm":30780,"Ġpackets":30781,"ĠMET":30782,"ealous":30783,"ographers":30784,"Ġlabou":30785,"Core":30786,"+,":30787,"parable":30788,"Ġstrat":30789,"Ġinvitations":30790,"Ġsouven":30791,"Ġbillboards":30792,"ĠRegulations":30793,"Ġdwarf":30794,"Ġtoler":30795,"Ġprose":30796,"Ġestates":30797,"Ġmetabolic":30798,"ĠSuff":30799,"ĠFirstly":30800,"Ġpolio":30801,"Ġchick":30802,"ĠDaughter":30803,"Ġsubstant":30804,"ĠIdentity":30805,"umbers":30806,"ĠFacts":30807,"Ġfrust":30808,"Ġdissip":30809,"ĠDeck":30810,"Hy":30811,"ĠBirch":30812,"Ġhurled":30813,"democracy":30814,"nered":30815,"eper":30816,"Ġcerebral":30817,"181":30818,"Ġhalves":30819,"abit":30820,"balance":30821,"ĠTibet":30822,"Ġhandheld":30823,"ĠDough":30824,"Ġprogrammed":30825,"hw":30826,"Ġoutlawed":30827,"ĠSerious":30828,"Ġironically":30829,"Ġmanipulating":30830,")\"":30831,"juries":30832,"Ġfragrance":30833,"crete":30834,"ĠHHS":30835,"cience":30836,"Ġcosmic":30837,"Ġforeclosure":30838,"Ġpercentages":30839,"Bus":30840,"Ġenticing":30841,"extra":30842,"ĠShy":30843,"ĠÂ¥":30844,"Ġheadsets":30845,"imensional":30846,"Ġlux":30847,"Ġresidual":30848,"Ġmantle":30849,"ĠSJ":30850,"ĠPeaks":30851,"ĠFinger":30852,"Ġunfolds":30853,"anity":30854,"Ġresettlement":30855,"ĠWeak":30856,"ĠBeen":30857,"Ġ198":30858,"Ġangels":30859,"ĠFarn":30860,"peace":30861,"Ġcapac":30862,"Ġhue":30863,"Ġlust":30864,"traumatic":30865,"laun":30866,"Ġstrawberries":30867,"Ġherbal":30868,"Ġconversions":30869,"ĠHeld":30870,"Ġprescribe":30871,"Its":30872,"ĠDartmouth":30873,"Ġfashioned":30874,"460":30875,"BLE":30876,"international":30877,"Ġlumin":30878,"Ġplantation":30879,"ilde":30880,"490":30881,"Ġeuph":30882,"Ġdisgust":30883,"Ġaspire":30884,"medical":30885,"Ġsocialism":30886,"Ġdissolve":30887,"Wal":30888,"Ġadmittedly":30889,"Ġsewing":30890,"ĠAcer":30891,"Ġtul":30892,"Ġfacilit":30893,"Ġgrandma":30894,"ĠFeeling":30895,"Ġobst":30896,"ĠFranz":30897,"ĠPalin":30898,"ĠIncrease":30899,"gets":30900,"ĠImam":30901,"âĢİ":30902,"Ġcoincides":30903,"urrence":30904,"Ġlifes":30905,"Lab":30906,"Ham":30907,"angelo":30908,"Wild":30909,"Ġvetoed":30910,"Ġventilation":30911,"olid":30912,"Summer":30913,"Ġfacade":30914,"neys":30915,"ĠWOM":30916,"ĠBenny":30917,"ĠMarried":30918,"squ":30919,"ĠReflect":30920,"return":30921,"elia":30922,"olding":30923,"Ġrefine":30924,"ĠMadness":30925,"innacle":30926,"posts":30927,"287":30928,"fruit":30929,"274":30930,"icator":30931,"ĠVoy":30932,"Ġunsett":30933,"Ġfant":30934,"Ġtreaties":30935,"Ġcrystals":30936,"Ġhijacked":30937,"words":30938,"ĠReleased":30939,"Save":30940,"Ġcannon":30941,"Ġanomaly":30942,"Ġbeacon":30943,"Ġcrippled":30944,"Ġbundles":30945,"Ġuntreated":30946,"Ġhappiest":30947,"Ġgalaxies":30948,"Ġoccupational":30949,"416":30950,"Dar":30951,"Ġcrank":30952,"Ġappropriation":30953,"asking":30954,"mens":30955,"Ġdetector":30956,"Ġskewed":30957,"Ġpoke":30958,"254":30959,"Ġhypertension":30960,"apolog":30961,"Ġevaluations":30962,"blocks":30963,"Ġpow":30964,"GEN":30965,"Ġscalp":30966,"Ġarrogant":30967,"AIDS":30968,"ority":30969,"Ġredirect":30970,"Ġderogatory":30971,"Ġlateral":30972,"495":30973,"rolley":30974,"brew":30975,"Ġbabys":30976,"Ġmuff":30977,"ĠRequ":30978,"Ġdime":30979,"Ġwonderfully":30980,"Ġtreasures":30981,"ĠNES":30982,"Ġponds":30983,"Ġimpulse":30984,"Ġdetecting":30985,"Ġgrin":30986,"Ġbrid":30987,"Ġshoved":30988,"Ġpurge":30989,"irteen":30990,"OTHER":30991,"ÙĦ":30992,"irsch":30993,"ĠOcc":30994,"193":30995,"Ġfodder":30996,"wrote":30997,"meric":30998,"posal":30999,"Ġwinters":31000,"ĠJuice":31001,"hub":31002,"Ġcontrasting":31003,"Brazil":31004,"Ġflashy":31005,"uffer":31006,"technology":31007,"Children":31008,"Ġcatapult":31009,"owsky":31010,"ĠEclipse":31011,"abeth":31012,"ĠParticip":31013,"Ġlaud":31014,"ĠQuiet":31015,"Ġsimulations":31016,"Ġsacrificing":31017,"Ġpreaching":31018,"Ġvoicing":31019,"itizen":31020,"Ġgn":31021,"Ġsans":31022,"Ġ285":31023,"ĠRobot":31024,"Ġ1936":31025,"Ġsham":31026,"ĠKislyak":31027,"ĠGCC":31028,"tale":31029,"ĠShades":31030,"Ġsediment":31031,"Ġconveniently":31032,"Give":31033,"mounted":31034,"Ġpeel":31035,"Jun":31036,"ĠEisenhower":31037,"Ġdiplom":31038,"ĠPreservation":31039,"Ġaffirm":31040,"Ġtaboo":31041,"ĠGarr":31042,"ĠApply":31043,"prim":31044,"Ġausp":31045,"Ġtextbook":31046,"Ġforfeit":31047,"icides":31048,"Ġundis":31049,"DJ":31050,"Ġ\"...":31051,"ĠXperia":31052,"Ġfurry":31053,"Australian":31054,"Ġpreach":31055,"Ġparamed":31056,"Ġ196":31057,"agos":31058,"ĠRIP":31059,"Ġ408":31060,"ĠQuarterly":31061,"ĠQuentin":31062,"Ġdeft":31063,"ĠVlad":31064,"massive":31065,"apore":31066,"Ġquestionnaire":31067,"secution":31068,"ĠTunnel":31069,"ĠAssist":31070,"BILITY":31071,"everything":31072,"vich":31073,"Ġcomparatively":31074,"heng":31075,"ETH":31076,"ĠiPod":31077,"Ġinsurgent":31078,"Ġtestosterone":31079,"191":31080,"Ġmoons":31081,"Ġgripped":31082,"Ġstrang":31083,"pects":31084,"ĠSERVICE":31085,"Ġnumb":31086,"Ġmeasurable":31087,"Ġdismantled":31088,"Ġdepict":31089,"Ġretake":31090,"Light":31091,"Ġaquatic":31092,"useum":31093,"judicial":31094,"Ġ****":31095,"Ġrosters":31096,"certain":31097,"Ġhypothesis":31098,"2002":31099,"Snow":31100,"Ġpounded":31101,"ĠZel":31102,"ĠTrem":31103,"iversity":31104,"219":31105,"Jen":31106,"ĠAdventures":31107,"Ġcylinder":31108,"Ġbanging":31109,"Ġbalk":31110,"analy":31111,"ĠHust":31112,"ookie":31113,"ĠReturning":31114,"Ġpods":31115,"analysis":31116,"ĠTruman":31117,"Ġorg":31118,"Ġsar":31119,"Ġdred":31120,"ĠTelecommunications":31121,"ĠSven":31122,"carry":31123,"ĠLOVE":31124,"Ġparting":31125,"asar":31126,"utations":31127,"itic":31128,"Ġactu":31129,"Ġbananas":31130,"ĠNights":31131,"410":31132,"Still":31133,"Ġtweaked":31134,"went":31135,"Ġtoddlers":31136,"irted":31137,"Ġpaed":31138,"ĠWink":31139,"Ġviewpoint":31140,"ĠHelic":31141,"Ġhandshake":31142,"Ġpoaching":31143,"Ġrounding":31144,"268":31145,"ĠNVIDIA":31146,"Ġsquat":31147,"Ġtowed":31148,"Ġhandler":31149,"Ġconspir":31150,"Ġadditionally":31151,"CENT":31152,"ĠÃľ":31153,"article":31154,"ĠTough":31155,"NM":31156,"Rem":31157,"Ġstunts":31158,"ILS":31159,"ĠLM":31160,"Connect":31161,"ĠParagu":31162,"Ġcomplexities":31163,"Ġhugging":31164,"Ġabolish":31165,"ricting":31166,"ĠItems":31167,"Ġtemples":31168,"ĠSeat":31169,"ĠRubber":31170,"Ġindic":31171,"ĠVitamin":31172,"Ġcitations":31173,"Ġarmored":31174,"---------------":31175,"ĠNeo":31176,"ippy":31177,"Que":31178,"Ġrag":31179,"Ġlov":31180,"630":31181,"Ġadept":31182,"orbit":31183,"253":31184,"412":31185,"Ġbutterflies":31186,"Ġoutl":31187,"ĠCycle":31188,"Ġaesthetics":31189,"ĠTwitch":31190,"405":31191,"factor":31192,"ðŁij":31193,"ĠCircus":31194,"Posted":31195,"Ġintroductory":31196,"ĠStack":31197,"atoes":31198,"Ġfurn":31199,"ĠHond":31200,"Ġbipolar":31201,"ĠAging":31202,"inches":31203,"Ġincompetence":31204,"Ġaloud":31205,"Imagine":31206,"Ġsepar":31207,"Ġmanip":31208,"ophobic":31209,"inion":31210,"bek":31211,"Ġquer":31212,"ĠArmen":31213,"Ġhumorous":31214,"Ġmundane":31215,"Ġapologizing":31216,"Ġpioneered":31217,"Ġ303":31218,"282":31219,"Ġcalming":31220,"orious":31221,"760":31222,"Ġstitches":31223,"Ġthrottle":31224,"Ġspinach":31225,"urities":31226,"ĠCologne":31227,"Ġripple":31228,"Cs":31229,"Cent":31230,"Should":31231,"Ġaffinity":31232,"amount":31233,"ĠMISS":31234,"Ġsage":31235,"Ġamusing":31236,"Ġsnatch":31237,"clair":31238,"ĠGuess":31239,"bench":31240,"ĠMoj":31241,"nuclear":31242,"Ġfid":31243,"ĠVM":31244,"ĠGN":31245,"brainer":31246,"Ġcurled":31247,"Ġbushes":31248,"icably":31249,"Ġcreeping":31250,"Ġveil":31251,"ĠALS":31252,"ESPN":31253,"ulsion":31254,"ĠGTX":31255,"ĠANN":31256,"Ġcomplicit":31257,"assault":31258,"IOR":31259,"Ġpolymer":31260,"Ġestimating":31261,"277":31262,"alog":31263,"Ġglimps":31264,"Ġreinforces":31265,"Ġtextbooks":31266,"Ġdictated":31267,"ĠReyn":31268,"latable":31269,"ĠOrth":31270,"520":31271,"Ġtrickle":31272,"ĠWrong":31273,".[":31274,"ĠDesigner":31275,"304":31276,"ĠInner":31277,"Ġrave":31278,"ppa":31279,"ĠGim":31280,"Ġswath":31281,"Ġcarts":31282,"atlantic":31283,"Ġpersists":31284,"ĠDeveloper":31285,"Ġgoodies":31286,"isive":31287,"Inf":31288,"ĠSaving":31289,"loop":31290,"tions":31291,"Ġabusers":31292,"Ġclot":31293,"Ġmesmer":31294,"Ġdeg":31295,"Ġskirts":31296,"257":31297,"Ġunreliable":31298,"ĠCOMM":31299,"Ġ194":31300,"Ġfledgling":31301,"administ":31302,"Israeli":31303,"ĠBarbie":31304,"ĠJeanne":31305,"Ġgenerously":31306,"ĠStruct":31307,"ĠZap":31308,"Ġvetted":31309,"ĠViolet":31310,"Ġ),":31311,"Ġembarrass":31312,"bang":31313,"ĠProvider":31314,"getting":31315,"alg":31316,"Ġunconditional":31317,"ĠHulk":31318,"ĠWad":31319,"utation":31320,"Ġpointless":31321,"Ġdeprivation":31322,"Ġstarving":31323,"ĠImpossible":31324,"ĠStir":31325,"Ġknack":31326,"anse":31327,"Ġsecurely":31328,"Ġply":31329,"395":31330,"Pack":31331,"liv":31332,"Ġridden":31333,"alks":31334,"308":31335,"male":31336,"Ġbitterly":31337,"Ġirrational":31338,"Members":31339,"ported":31340,"qq":31341,"ractor":31342,"Ġinflict":31343,"ĠBoehner":31344,"Ġthickness":31345,"Ġdome":31346,"ĠInflu":31347,"Ġheap":31348,"Ġmirrored":31349,"Ġconstituent":31350,"Ġfertile":31351,"Ġvaping":31352,"266":31353,"riages":31354,"Ġembassies":31355,"Ġpersu":31356,"ĠMacArthur":31357,"issions":31358,"Main":31359,"aths":31360,"onne":31361,"circ":31362,"Ġsweating":31363,"quartered":31364,"Ġsax":31365,"Ġ540":31366,"Ġreputable":31367,"Ġsatire":31368,"Ġpastors":31369,"ventional":31370,"Mic":31371,"female":31372,"Ġpity":31373,"appropri":31374,"voc":31375,"hei":31376,"Ġimperial":31377,"Ġcorrective":31378,"Ġresent":31379,"Ġtempered":31380,"Ġdiffers":31381,"Hamilton":31382,"Ġsaddle":31383,"Ġgrenades":31384,"ĠQuart":31385,"onymous":31386,"til":31387,"Ġdepiction":31388,"Ġdisreg":31389,"Ġpetitioner":31390,"Ġfret":31391,"ĠEns":31392,"Emer":31393,"540":31394,"opathy":31395,"vertisements":31396,"Ġsketches":31397,"venth":31398,"Ġautomate":31399,"Ġjihad":31400,"iping":31401,"Ġtert":31402,"ĠSop":31403,"ships":31404,"Ġdeceptive":31405,"ĠPryor":31406,"ĠGorge":31407,"ĠMeridian":31408,"rero":31409,"affected":31410,"Ġlame":31411,"660":31412,"rub":31413,"Hello":31414,"ĠNumbers":31415,"269":31416,"Ġmarg":31417,"Fran":31418,"640":31419,"Ġcath":31420,"winter":31421,"ĠMosque":31422,"Ġreckoning":31423,"ĠImaging":31424,"Ġmutation":31425,"ĠMild":31426,"Ġkidnap":31427,"Ġnav":31428,"Ġferocious":31429,"Ġdusty":31430,"Cele":31431,"ĠFoss":31432,"Ġregrett":31433,"lymp":31434,"Ġcoli":31435,"Ġstereo":31436,"Ġforesee":31437,"alties":31438,"Ġresusc":31439,"Full":31440,"wash":31441,"ĠINST":31442,"ĠPars":31443,"Ġcoated":31444,"ĠHT":31445,"Ġdiscord":31446,"Ġreforming":31447,"CAN":31448,"Ġblink":31449,"Ġlubric":31450,"Ġmishand":31451,"ensible":31452,"existent":31453,"secondary":31454,"ĠDoesn":31455,"terrorist":31456,"Ġriff":31457,"custom":31458,"ĠDET":31459,"Ġreusable":31460,"ĠCRA":31461,"ĠScalia":31462,"Ġaccelerator":31463,"Ġpropag":31464,"ĠMID":31465,"ework":31466,"Ġlooted":31467,"oscope":31468,"eners":31469,"ruction":31470,"Ġbarr":31471,"Ġviewership":31472,"Ġlends":31473,"obil":31474,"ĠRoots":31475,"ĠCame":31476,"ibel":31477,"Ġglobalization":31478,"lab":31479,"information":31480,"Ġcoordin":31481,"Ġglitch":31482,"Ġworms":31483,"Ġslurs":31484,"Ġcontemplated":31485,"ĠPenal":31486,"Ġ191":31487,"Ġ221":31488,"Ġexposes":31489,"Ġ248":31490,"ĠASP":31491,"Ġdependency":31492,"urga":31493,"pdf":31494,"Ġvibr":31495,"clone":31496,"ossible":31497,"ĠUtt":31498,"serv":31499,"ĠLevant":31500,"maybe":31501,"MU":31502,"ĠLunar":31503,"Ġbystanders":31504,"Ġcapitals":31505,"Ġpreacher":31506,"thin":31507,"Ġunderscore":31508,"Ġ('":31509,"Ġmedd":31510,"Ġautobiography":31511,"Ġpersistence":31512,"Ġarming":31513,"Ġappalled":31514,"Ġcontradictory":31515,"Ġreciproc":31516,"Ġtakedown":31517,"tan":31518,"Ġnecessities":31519,"itans":31520,"ĠAlas":31521,"Ġsegregated":31522,"ĠResponsibility":31523,"ĠSHOW":31524,"ISIS":31525,"Ġpengu":31526,"Ġumb":31527,"ĠHO":31528,"HB":31529,"ĠChou":31530,"Ġalluded":31531,"Ġharms":31532,"bara":31533,"ĠWOR":31534,"Sorry":31535,"Ġstarvation":31536,"Ġspilling":31537,"Ġcarb":31538,"annis":31539,"ĠGarrison":31540,"Ġmillionaire":31541,"ifling":31542,"ĠCancel":31543,"Ġimprint":31544,"Ġborrower":31545,"455":31546,"ĠCic":31547,"Ġexposures":31548,"dest":31549,"Ġunn":31550,"Ġ802":31551,"Ġadherence":31552,"prints":31553,"Ġweary":31554,"Ġwaging":31555,"Ġ1937":31556,"ĠKepler":31557,"%;":31558,"Ġdefective":31559,"ĠReps":31560,"ĠGranted":31561,"Ġdisco":31562,"ĠRanking":31563,"erno":31564,"Ġarchaeological":31565,"sq":31566,"Ġcapit":31567,"Ġfleets":31568,"Ġinventor":31569,"iffin":31570,"Ġspotting":31571,"ĠSHARES":31572,"309":31573,"Hard":31574,"save":31575,"241":31576,"ĠThinking":31577,"XY":31578,"Ġhavens":31579,"Ġmessed":31580,"crop":31581,"Ġperme":31582,"Ġtimelines":31583,"ĠGarage":31584,"Ġplateau":31585,"together":31586,"fox":31587,"Ġfailings":31588,"ĠTight":31589,"ĠPhysics":31590,"ĠScholars":31591,"Ġpans":31592,"Fall":31593,"Ġhull":31594,"GER":31595,"Ġbourbon":31596,"ceived":31597,"Ġsteroids":31598,"Ġhamb":31599,"Ġinterpretations":31600,"Ġcush":31601,"Chair":31602,"Ġinformational":31603,"aryn":31604,"Ġwoven":31605,"Ġamen":31606,"Bre":31607,"Ġrefreshed":31608,"York":31609,"ĠBlast":31610,"Editor":31611,"Ġmotivating":31612,"ĠReason":31613,"Florida":31614,"Ġdreaded":31615,"Ġstationary":31616,"Ġbil":31617,"doors":31618,"Ġslightest":31619,"Ġcombustion":31620,"Ġfascination":31621,"Ġstraps":31622,"scribed":31623,"Ġexhibiting":31624,"Ġsimplest":31625,"Gar":31626,"Ġprogressives":31627,"claim":31628,"ocket":31629,"Ġexoner":31630,"ĠNETWORK":31631,"Brad":31632,"Ġ197":31633,"Ġnightmares":31634,"Ġillust":31635,"among":31636,"ĠGreenpeace":31637,"Ġoval":31638,"Ġblocker":31639,"3000":31640,"ĠMemor":31641,"Ġmids":31642,"Ġconfuse":31643,"YN":31644,"cow":31645,"Ġdispensary":31646,"telling":31647,"Ġentail":31648,"Ġneurolog":31649,"Ġbroth":31650,"Ġpron":31651,"ĠAnswer":31652,"thank":31653,"Ġintersect":31654,"Ġclinging":31655,"ĠKilling":31656,"Ġcohesion":31657,"Ġcategorized":31658,"Ġtangled":31659,"ĠASC":31660,"Arsenal":31661,"ĠAutomatic":31662,"580":31663,"sac":31664,"Ġshady":31665,"consumer":31666,"hetically":31667,"NV":31668,"Ġoverl":31669,"holes":31670,"ĠDonation":31671,"tera":31672,"score":31673,"library":31674,"Ġsmoother":31675,"Ġcoasts":31676,"Ġintercourse":31677,"Ġunfavorable":31678,"erb":31679,"Hel":31680,"Ġbiases":31681,"Ġinheritance":31682,"Ġsuppressed":31683,"ĠRecommend":31684,"iculture":31685,"ighting":31686,"inguished":31687,"idences":31688,"operated":31689,"Ġhors":31690,"Ġshrug":31691,"aila":31692,"ĠConsortium":31693,"Ġveins":31694,"uria":31695,"ĠSmithsonian":31696,"ĠAX":31697,")âĢĶ":31698,"given":31699,"JC":31700,"Ġreneg":31701,"Ġprincip":31702,"Ġextinct":31703,"Golden":31704,"ASON":31705,"Ġstatutes":31706,"292":31707,"ĠGOOD":31708,"ĠGreenland":31709,"ĠRasmussen":31710,"ATHER":31711,"Ġdeserted":31712,"ĠHitchcock":31713,"Ġqualifies":31714,"Ġdreadful":31715,"Ġsupers":31716,"Ġtendon":31717,"oter":31718,"ĠFate":31719,"Ġrestrooms":31720,"igating":31721,"Sher":31722,"Name":31723,"orph":31724,"ĠCritical":31725,"rox":31726,"Ġdefunct":31727,"Ġcanoe":31728,"Ġbiscuits":31729,"Ġwomb":31730,"808":31731,"istar":31732,"Ġroar":31733,"aundering":31734,"iewicz":31735,"ĠNM":31736,"ĠChamberlain":31737,"Ġ233":31738,"ĠCoat":31739,"Ġ999":31740,"aft":31741,"Ġlurking":31742,"ĠPist":31743,"Ġfollower":31744,"Ġcareg":31745,"ÙĨ":31746,"ĠThin":31747,"ZZ":31748,"ĠGI":31749,"ĠVintage":31750,"Ġpainstaking":31751,"Ġgloom":31752,"Ġtbsp":31753,"Ġwhim":31754,"ĠMask":31755,"rugged":31756,"Ġwritings":31757,"stantial":31758,"luence":31759,"ordable":31760,"akia":31761,"Ġassassinated":31762,"Wind":31763,"Ġdemeanor":31764,"Night":31765,"rape":31766,"ĠBringing":31767,"Ġshields":31768,"ĠAntarctic":31769,"Ġfruitful":31770,"ĠBuster":31771,"ĠLois":31772,"Ġ302":31773,"Style":31774,"ĠRIS":31775,"Ġdissatisfaction":31776,"ulp":31777,"ĠLaser":31778,"Ġdisposition":31779,"ĠAnk":31780,"Ġabsorbing":31781,"276":31782,"Ġvolcan":31783,"Ġleftover":31784,"yah":31785,"ĠVaj":31786,"Ġunsolved":31787,"oland":31788,"Ġstained":31789,"Ġpathetic":31790,"ylan":31791,"Ġknots":31792,"immigration":31793,"ieving":31794,"Coming":31795,"Commerce":31796,"ĠHurt":31797,"drawn":31798,"Ġaxis":31799,"Ġdye":31800,"ĠNora":31801,"ĠPortal":31802,"Ġsuspense":31803,"ĠExactly":31804,"Ġpowering":31805,"ĠClock":31806,"Ġdrawer":31807,"ĠSpike":31808,"Ġhallmark":31809,"aber":31810,"ĠTrainer":31811,"UV":31812,"Ġredundant":31813,"Tour":31814,"Ġdesignate":31815,"Ġredress":31816,"ĠUb":31817,"cake":31818,"oded":31819,"Ġkings":31820,"iates":31821,"Ġcoupons":31822,"Ġextremes":31823,"Elect":31824,"Ġcitation":31825,"Ġdirectory":31826,"Ġtranspired":31827,"cele":31828,"gence":31829,"5000":31830,"ostic":31831,"Ġraining":31832,"ĠSight":31833,"videos":31834,"phthal":31835,"llor":31836,"Ġappraisal":31837,"Ġdetox":31838,"Ġelecting":31839,"Ġordinances":31840,"Ġlifespan":31841,"Ref":31842,"Ġilluminated":31843,"Ġforfe":31844,"Making":31845,"ĠWorst":31846,"ĠTP":31847,"Ġfullest":31848,"ĠISIL":31849,"ĠRates":31850,"Ġyeast":31851,"sett":31852,"ĠYok":31853,"innie":31854,"edition":31855,"ĠGoldstein":31856,"Ġunaff":31857,"god":31858,"Ġzo":31859,"rums":31860,"Ġopaque":31861,"ĠHist":31862,"Yesterday":31863,"AMS":31864,"aband":31865,"005":31866,"illary":31867,"ĠSplash":31868,"Ġaccrued":31869,"Ell":31870,"Ġnominating":31871,"ĠBroadcast":31872,"ĠWhip":31873,"ARM":31874,"Ġunnecessarily":31875,"brown":31876,"429":31877,"ansky":31878,"Ġextravagant":31879,"Malley":31880,"wage":31881,"Ġexempted":31882,"Ġtypo":31883,"Ġesports":31884,"ĠStru":31885,"ĠPython":31886,"Ġsaint":31887,"ĠCSI":31888,"ĠPowder":31889,"Ġdisguised":31890,"ĠSubway":31891,"Ġprecursor":31892,"ĠWizard":31893,"Johnson":31894,"icas":31895,"Ġdefaults":31896,"!).":31897,"ebra":31898,"jected":31899,"Ġunaccompanied":31900,"HH":31901,"Ġproced":31902,"clinical":31903,"Ġmitigating":31904,"ĠSoup":31905,"ĠFunny":31906,"344":31907,"Hall":31908,"Ġscalable":31909,"Ġshimmer":31910,"Ġunderstatement":31911,"zeb":31912,"icus":31913,"Ġretract":31914,"IDER":31915,"ieft":31916,"iii":31917,"ĠEmperor":31918,"Ġvoltage":31919,"343":31920,"Rest":31921,"ĠButcher":31922,"Ġlaced":31923,"Ġsalty":31924,"Ġfourteen":31925,"Ġoxy":31926,"Ġraged":31927,"Ġforg":31928,"Ġcaveat":31929,"Ġponder":31930,"process":31931,"Ġghosts":31932,"ĠGoose":31933,"didn":31934,"stood":31935,"amation":31936,"Ġvillains":31937,"contract":31938,"Ġbooted":31939,"ĠDidn":31940,"ĠSalon":31941,"Ġlewd":31942,"ĠFritz":31943,"Ġorganis":31944,"Ġpuzzles":31945,"ĠRX":31946,"Ġcurtains":31947,"ĠPackage":31948,"Ġrebate":31949,"Ġspokes":31950,"Ġoccupant":31951,"Ġfooled":31952,"appy":31953,"Ġyourselves":31954,"Ġmaths":31955,"Ġ630":31956,"bos":31957,"ĠHeb":31958,"APS":31959,"Ġbulletin":31960,"Ġpests":31961,"Ġlum":31962,"ĠHAS":31963,"users":31964,"idated":31965,"Ġpalpable":31966,"ĠFeature":31967,"ĠPKK":31968,"Ġdetriment":31969,"Ġbamboo":31970,"Ġimmersed":31971,"ĠDud":31972,"Ġion":31973,"icc":31974,"ĠIris":31975,"ĠBeats":31976,"Ġimprobable":31977,"Ġfuner":31978,"Ġsprung":31979,"ĠLieberman":31980,"ĠSTA":31981,"venge":31982,"Ġtreacherous":31983,"Ġpreced":31984,"Ġsniper":31985,"ĠGOLD":31986,"ĠSUR":31987,"Nic":31988,"ĠROB":31989,"Camp":31990,"Ġhooks":31991,"oling":31992,"Ġbolst":31993,"339":31994,"heter":31995,"Ġbracelet":31996,"Ġbreat":31997,"307":31998,"ĠTrader":31999,"ĠPixar":32000,"hist":32001,"Ġmenacing":32002,"Ġgrizz":32003,"294":32004,"Ġillustrious":32005,"Ġtransact":32006,"Ġspoiler":32007,"ĠWORK":32008,"Road":32009,"Ġblackout":32010,"Ġencomp":32011,"proven":32012,"ĠFriendship":32013,"Ġentrances":32014,"Ġprofessions":32015,"Ġinsin":32016,"Ġrecorder":32017,"Ġformulation":32018,"govern":32019,"Ġpainfully":32020,"ĠRepe":32021,"eeds":32022,"cru":32023,"ĠDir":32024,"Ġtriumphant":32025,"Ġignition":32026,"xy":32027,"Ġintrusion":32028,"ĠEAR":32029,"RES":32030,"Ġration":32031,"ĠTaken":32032,"Ġcages":32033,"Ġpeg":32034,"Ġcommem":32035,"680":32036,"ĠRite":32037,"Ġfolder":32038,"Ġvertically":32039,"Ġcheeks":32040,"pick":32041,"Ġcrispy":32042,"Ġsqueezing":32043,"ĠBene":32044,"ĠTrailer":32045,"ĠKM":32046,"acceptable":32047,"ĠSetting":32048,"Ġsupernatural":32049,"ĠEz":32050,"Ġvenom":32051,"ĠFrey":32052,"Ġpulp":32053,"Had":32054,"centered":32055,"metics":32056,"Kent":32057,"ĠDOI":32058,"kr":32059,"ĠWHEN":32060,"Ġtakeoff":32061,"isf":32062,"uko":32063,"Ġquasi":32064,"Ġveggies":32065,"Ġpesticide":32066,"Ġstimulating":32067,"Ġacknowledgement":32068,"Ġattained":32069,"ĠBackground":32070,"281":32071,"317":32072,"ĠTrees":32073,"Ġdetractors":32074,"Ġannouncer":32075,"Ġjoyful":32076,"ĠElf":32077,"istration":32078,"phi":32079,"Ġprogressively":32080,"mini":32081,"Ġcontraception":32082,"asca":32083,"ishops":32084,"Ġmisunderstood":32085,"Ġinitiating":32086,"ĠConversely":32087,"338":32088,"080":32089,"idation":32090,"ĠGoes":32091,"Ġimprov":32092,"Ġswapping":32093,"Vict":32094,"Ġdevoid":32095,"fighter":32096,"ĠMori":32097,"Ġvoy":32098,"ĠElev":32099,"ĠAim":32100,"Ġtrustworthy":32101,"Leg":32102,"675":32103,"ĠPossible":32104,"Crunch":32105,"ĠRings":32106,"Ġphony":32107,"Ġbladder":32108,"ĠChall":32109,"Spot":32110,"oak":32111,"Was":32112,"ĠFAM":32113,"ĠAGA":32114,"ĠFifa":32115,"Ġenclosed":32116,"Ġanthrop":32117,"faith":32118,"ĠAux":32119,"Ġgracious":32120,"roller":32121,"Ġdowntime":32122,"swing":32123,"Ġcamouflage":32124,"ĠCosts":32125,"Ġliv":32126,"ricular":32127,"ĠUran":32128,"Ġdisapproval":32129,"Ġpropriet":32130,"bits":32131,"Ġmafia":32132,"ĠSCHOOL":32133,"ĠPrepar":32134,"button":32135,"Almost":32136,"Ġpastoral":32137,"ĠDove":32138,"Hol":32139,"Ġimposes":32140,"ĠDram":32141,"lys":32142,"ĠSAS":32143,"Ġwiring":32144,"271":32145,"ĠModels":32146,"Ġoutpost":32147,"etics":32148,"Ġinsulted":32149,"ĠMongolia":32150,"Ġoverth":32151,"Haw":32152,"ĠHomer":32153,"itta":32154,"raining":32155,"Ġevidently":32156,"raphic":32157,"impact":32158,"Ġfranch":32159,"Ġ2100":32160,"Ġapproximate":32161,"Ġcartoons":32162,"Ġbackups":32163,"umbing":32164,"Ġforceful":32165,"ĠShad":32166,"Ġsurges":32167,"Ġperf":32168,"Ġdele":32169,"Ġquieter":32170,"ĠHorowitz":32171,"ĠDX":32172,"anners":32173,"ĠNinja":32174,"ĠScript":32175,"ĠElise":32176,"collect":32177,"Ġgrading":32178,"ĠBethesda":32179,"Kids":32180,"ĠTelephone":32181,"Ġpreferring":32182,"Ġreconcil":32183,"Ġmango":32184,"ĠHail":32185,"ĠCitizenship":32186,"Master":32187,"cular":32188,"Ġstuffing":32189,"ĠAlive":32190,"ALLY":32191,"Ġchi":32192,"ĠDynam":32193,"ĠRosenthal":32194,"Ġpurity":32195,"Ġtemp":32196,"ĠHAL":32197,"employ":32198,"Ġplentiful":32199,"ĠComed":32200,"Ġstacks":32201,"ĠHuge":32202,"ĠOlder":32203,"Ġsclerosis":32204,"ONY":32205,"Ġfilmmaking":32206,"chance":32207,"Cry":32208,"Ġworkflow":32209,"ĠPersonnel":32210,"awed":32211,"ĠColumn":32212,"Ġuncomp":32213,"Ġdiscriminated":32214,"Ġpts":32215,"Ġallev":32216,"ĠKinn":32217,"meal":32218,"Ġnovice":32219,"Ġcrest":32220,"Ġhearty":32221,"Ġlowers":32222,"inqu":32223,"ĠPlayoffs":32224,"ĠHyp":32225,"Ġautos":32226,"Ġindec":32227,"Ġnighttime":32228,"Ġreflex":32229,"306":32230,"disciplinary":32231,"ophe":32232,"contact":32233,"Ġachievable":32234,"Ġslab":32235,"ĠMessage":32236,"ĠVMware":32237,"ĠDia":32238,"REG":32239,"Ġconfisc":32240,"ĠMechan":32241,"Ġphenomena":32242,"Ġsequencing":32243,"Ġshaming":32244,"Ġcompilation":32245,"ĠAges":32246,"Ġmastered":32247,"Ġagony":32248,"Ġrestrain":32249,"ĠLyme":32250,"Which":32251,"ĠBarney":32252,"ĠConcept":32253,"Ġsuperheroes":32254,"ĠPsychology":32255,"Ġreminis":32256,"violence":32257,"Lead":32258,"Da":32259,"VEN":32260,"ERC":32261,"ĠVoter":32262,"Ġbetray":32263,"Ġsavage":32264,"driver":32265,"IFT":32266,"Chain":32267,"angler":32268,"'-":32269,"lain":32270,"ĠRatt":32271,"bis":32272,"iverse":32273,"Ġdensely":32274,"Ġuncom":32275,"Ġunsuspecting":32276,"Ġstimulation":32277,"diff":32278,"Ġskins":32279,"ĠRiding":32280,"ategic":32281,"ĠUnderstand":32282,"occup":32283,"ĠCooking":32284,"Ġschizophrenia":32285,"ĠKoen":32286,"Ġcomrades":32287,"HY":32288,"Ġfab":32289,"ĠRowling":32290,"Allen":32291,"ĠJUL":32292,"Ġembryos":32293,"UU":32294,"ĠCAT":32295,"Ġtidy":32296,"finger":32297,"ĠCake":32298,"Ġrightfully":32299,"religious":32300,"Ġ407":32301,"Gal":32302,"408":32303,"Ġgrievance":32304,"Ġswallowed":32305,"251":32306,"283":32307,"ĠBarcl":32308,"opter":32309,"Ġpedoph":32310,"Ġcured":32311,"Ġestablishes":32312,"increasing":32313,"tics":32314,"articles":32315,"Ġunethical":32316,"authored":32317,"Ġanchors":32318,"ĠContra":32319,"Ġventured":32320,"ĠCoh":32321,"Ġpuff":32322,"heddar":32323,"Ġomission":32324,"Ġdich":32325,"ceed":32326,"Ġscares":32327,"Ġdoctoral":32328,"293":32329,"ĠUnt":32330,"Ġdop":32331,"ĠInjury":32332,"ificantly":32333,"ĠRift":32334,"ĠOrders":32335,"Ġmobilize":32336,"particularly":32337,"Ġchilled":32338,"Reports":32339,"redibly":32340,"ĠGuru":32341,"Ġvalleys":32342,"Ġtextures":32343,"Ġreuse":32344,"roit":32345,"unts":32346,"Ġirreversible":32347,"Ġwarships":32348,"Ġpus":32349,"Ġpeeled":32350,"Ġthirst":32351,"Ġgrapple":32352,"busters":32353,"Ġnort":32354,"ĠDates":32355,"Safe":32356,"Ġbirthplace":32357,"hemoth":32358,"Ġvile":32359,"Ġ306":32360,"Ram":32361,"activated":32362,"ĠAero":32363,"Ġbutcher":32364,"ĠKnock":32365,"Ġdisturb":32366,"Ġtotality":32367,"tted":32368,"Ġlegit":32369,"cking":32370,"nikov":32371,"Ġfavoring":32372,"lang":32373,"Ġrightful":32374,"orum":32375,"!!!!":32376,"ĠMinute":32377,"Ġpostings":32378,"Java":32379,"510":32380,"Ġmicrobes":32381,"Ġsixteen":32382,"entimes":32383,"Ġbulb":32384,"Ġgoalt":32385,"Ġhumiliated":32386,"ansom":32387,"roach":32388,"Ġgrouping":32389,"hari":32390,"Ġcler":32391,"Ġstared":32392,"ĠSymptoms":32393,"Ġbasil":32394,"Whenever":32395,"ĠWhoever":32396,"Oil":32397,"ĠJericho":32398,"ĠAlm":32399,"Pol":32400,"Hur":32401,"Ġupro":32402,"ĠSpo":32403,"hammer":32404,"Mur":32405,"ĠTorch":32406,"Ġfrequencies":32407,"ĠExpansion":32408,"Ġparalysis":32409,"igon":32410,"ĠSail":32411,"Ġsilently":32412,"Ġrevolver":32413,"Ġstockpile":32414,"Ġpessimistic":32415,"ESA":32416,"Ġdisclaim":32417,"Ġdemocracies":32418,"ĠTales":32419,"ĠAngry":32420,"ĠWhitman":32421,"ĠOri":32422,"Ġtransitioned":32423,"behind":32424,"ĠLAN":32425,"Ġcav":32426,"ĠJazeera":32427,"KC":32428,"ĠInspect":32429,"irty":32430,"ĠAin":32431,"ĠOrig":32432,"Ġobscene":32433,"Ġdormant":32434,"Ġharb":32435,"ĠWiz":32436,"ĠAdolf":32437,"Ġvic":32438,"Ġdenouncing":32439,"Ġye":32440,"aques":32441,"Ġomn":32442,"Ġassemblies":32443,"nosis":32444,"Ġadmon":32445,"Ġanguish":32446,"Ġvag":32447,"YE":32448,"ĠMacro":32449,"Ġrubbing":32450,"Ġreplicated":32451,"Moon":32452,"ĠGuitar":32453,"Ġcentimeters":32454,"amily":32455,"ĠAmes":32456,"Ġchlorine":32457,"Perhaps":32458,"Ġpartisans":32459,"soc":32460,"Ġvagina":32461,"Ġtrove":32462,"ĠYES":32463,"Ġtherapists":32464,"Ġnods":32465,"Ġhanged":32466,"Ġridge":32467,"Ġhaz":32468,"ĠmacOS":32469,"Ġske":32470,"ĠShia":32471,"Ġsteril":32472,"Ġalmond":32473,"ĠRockefeller":32474,"Ġintrinsic":32475,"Certainly":32476,"Ġsublime":32477,"Earn":32478,"abet":32479,"Ġframeworks":32480,"ogical":32481,"ilst":32482,"ipal":32483,"Ġrescuing":32484,"ĠWatergate":32485,"Ġ231":32486,"ĠNano":32487,"ighthouse":32488,"olph":32489,"Ġ312":32490,"Ġhealed":32491,"ĠTomb":32492,"Ġsubst":32493,"Ġsulph":32494,"ĠNewsp":32495,"ĠLama":32496,"venue":32497,"387":32498,"productive":32499,"ĠNEED":32500,"minus":32501,"ĠPages":32502,"cand":32503,"ĠClover":32504,"ĠForensic":32505,"ryn":32506,"ogle":32507,"ocr":32508,"Ġvaccinations":32509,"cies":32510,"ĠMek":32511,"Ġunaffected":32512,"Ġfetal":32513,"ĠDino":32514,"Ġhemisphere":32515,"Ġfroze":32516,"ĠPeg":32517,"Ġmicroscope":32518,"Ġmoderates":32519,"ĠGEN":32520,"ĠHawai":32521,"Ġstagn":32522,"Absolutely":32523,"practice":32524,"IBLE":32525,"cture":32526,"ĠAshe":32527,"Ġcondoms":32528,"Ġpoked":32529,"training":32530,"Ġintermedi":32531,"347":32532,"Ġcardinal":32533,"ĠSpoon":32534,"Ġsupp":32535,"Ġpreviews":32536,"Service":32537,"ĠBeam":32538,"Ġtranscend":32539,"Fresh":32540,"Sure":32541,"Ġ4000":32542,"idential":32543,"ĠCoinbase":32544,"Ġworkings":32545,"ĠPI":32546,"Ġpassionately":32547,"Ġdecisively":32548,"ĠInspection":32549,"Ġinvoke":32550,"Ġstain":32551,"Ġcleaners":32552,"Ġregulates":32553,"Ġshone":32554,"ĠEVERY":32555,"istance":32556,"map":32557,"Ġredu":32558,"Ġoccupies":32559,"Ġprocure":32560,"acket":32561,"roman":32562,"Ġilleg":32563,"Ġleaps":32564,"yond":32565,"Ġyarn":32566,"ĠLTD":32567,"ĠCONTR":32568,"ĠRestoration":32569,"ĠCDs":32570,"Ġdrinkers":32571,"ĠJordanian":32572,"Ġabl":32573,"Ġdisparate":32574,"Ġprimed":32575,"ĠFirearms":32576,"artz":32577,"Ġindispensable":32578,"Ter":32579,"Ġfright":32580,"Ġmarkedly":32581,"Ġroam":32582,"ĠJurassic":32583,"Ġfeder":32584,"Ġpepp":32585,"ĠDV":32586,"Ġpancakes":32587,"sweet":32588,"Ġunmatched":32589,"Ġassembling":32590,"Ultimately":32591,"Ġendeavour":32592,"Ġluckily":32593,"Ġbitch":32594,"Ġelegance":32595,"eers":32596,"drop":32597,"credit":32598,"Ġscourge":32599,"ĠMinimum":32600,"Ġimpatient":32601,"Ġhunted":32602,"ĠGoddard":32603,"Kal":32604,"Ġmined":32605,"Ġcalves":32606,"Ġ234":32607,"Ġplank":32608,"Ġinjecting":32609,"ĠKaufman":32610,"ĠCompliance":32611,"tone":32612,"Ġ345":32613,"Ġdazz":32614,"ĠClarks":32615,"Ġcomprehens":32616,"Ġpist":32617,"Ġrhythms":32618,"Ġreserv":32619,"337":32620,"ĠIDF":32621,"Ġshouts":32622,"midt":32623,"323":32624,"Ġsoothing":32625,"Ġadministr":32626,"Ġgloomy":32627,"Ġfutile":32628,"ĠProhibition":32629,"upon":32630,"ĠAnglic":32631,"seeking":32632,"Ġdodge":32633,"Ds":32634,"ĠGrants":32635,"editor":32636,"ĠInquis":32637,"Ġ1929":32638,"decl":32639,"ĠPorts":32640,"ĠCure":32641,"ĠDPRK":32642,"oct":32643,"Ġvocabulary":32644,"Ġcling":32645,"298":32646,"Ġpeac":32647,"Ġantibodies":32648,"dor":32649,"ĠWorse":32650,"Ġsmelled":32651,"Ġleash":32652,"MED":32653,"Ġdisinteg":32654,"Ġtruthful":32655,"Ġsalesman":32656,"Ġsquares":32657,"susp":32658,"Ġcraving":32659,"Ġwizard":32660,"moral":32661,"ĠQué":32662,"Anything":32663,"Ġfalsehood":32664,"ARI":32665,"Ġcoworkers":32666,"Ġthy":32667,"outher":32668,"Ġbrushing":32669,"ĠProtest":32670,"ĠMF":32671,"abba":32672,"lead":32673,"ĠExhibit":32674,"Ga":32675,"ĠFranks":32676,"Ġdictates":32677,"illegal":32678,"Ġrelayed":32679,"Ġploy":32680,"ĠاÙĦ":32681,"ĠDocuments":32682,"Ġtint":32683,"ĠYuan":32684,"Ġdepended":32685,"Mir":32686,"ĠIntrodu":32687,"Ġrecourse":32688,"oqu":32689,"ĠTED":32690,"Ġdifferentiated":32691,"ĠWalls":32692,"Ġsentimental":32693,"Ġantis":32694,"retion":32695,"comes":32696,"ĠWORLD":32697,"Ġcoax":32698,"ĠTatt":32699,"ĠGingrich":32700,"2006":32701,"ĠBrut":32702,"Second":32703,"posed":32704,"shots":32705,"Ġ313":32706,"idian":32707,"alking":32708,"Ġdens":32709,"Ġgif":32710,"akings":32711,"Ġkeywords":32712,"Ġchast":32713,"Ġadversary":32714,"Ġnick":32715,"iasis":32716,"ĠLegisl":32717,"Ġcoff":32718,"ĠOriental":32719,"ĠMorg":32720,"ĠHAR":32721,"Ġlegalizing":32722,"Ġbanter":32723,"ĠTart":32724,"ĠTRI":32725,"Ġantagon":32726,"ĠGF":32727,"oler":32728,"ĠUFO":32729,"Therefore":32730,"ĠOsama":32731,"ĠStructure":32732,"apps":32733,"Ġpee":32734,"ĠSomehow":32735,"ĠOverwatch":32736,"ĠCasual":32737,"Ġdishon":32738,"SEE":32739,"ctive":32740,"andering":32741,"ĠTransformation":32742,"Andy":32743,"ĠFever":32744,"Ġspectator":32745,"Ġlash":32746,"Ġprotector":32747,"apy":32748,"Ġexhilar":32749,"aroo":32750,"Ġmamm":32751,"Ġbystand":32752,"acky":32753,"Ġdigestive":32754,"Ġamplified":32755,"Ġalpha":32756,"continue":32757,"Low":32758,"Ġdisgusted":32759,"356":32760,"script":32761,"Ġgenerational":32762,"ĠPassenger":32763,"sight":32764,"Ġcout":32765,"Ġhone":32766,"ulse":32767,"Ġignite":32768,"284":32769,"gow":32770,"Ġbinary":32771,"Ġincess":32772,"Review":32773,"607":32774,"ĠSurprise":32775,"Ġirritation":32776,"ĠBarth":32777,"ĠGum":32778,"Ġvideot":32779,"ĠFres":32780,"asons":32781,"Ġcollaborator":32782,"fal":32783,"ĠGon":32784,"Ġsettles":32785,"regular":32786,"Ġmiscarriage":32787,"cube":32788,"Ġsubord":32789,"ĠRegistered":32790,"Ġnotions":32791,"zzy":32792,"Ġrevert":32793,"OFF":32794,"Ġhasht":32795,"ĠPNG":32796,"Ġunimaginable":32797,"builders":32798,"Taylor":32799,"ĠPAY":32800,"Ġ).":32801,"Ġ238":32802,"ĠLAST":32803,"MAS":32804,"Ġillustrations":32805,"Ġparody":32806,"Ġdispersed":32807,"ĠRoses":32808,"Ġestimation":32809,"ĠGets":32810,"Patrick":32811,"CHA":32812,"Ġmisdem":32813,"agate":32814,"alter":32815,"Ġgeo":32816,"Ġenormously":32817,"Ġarrogance":32818,"Ġpert":32819,"Ġmeta":32820,"ĠJuno":32821,"iov":32822,"imov":32823,"Ġchores":32824,"acan":32825,"Paris":32826,"313":32827,"Lewis":32828,"Ġwillingly":32829,"ERA":32830,"Ġencaps":32831,"ilk":32832,"Ġnodes":32833,"Ġenzyme":32834,"want":32835,"Ġtolerant":32836,"Ġcondos":32837,"Ġasserts":32838,"Ġcanon":32839,"Ġscanned":32840,"bishop":32841,"Ġperched":32842,"util":32843,"ĠBonus":32844,"create":32845,"ĠFuk":32846,"Ġmotif":32847,"Ġcontemplate":32848,"ĠBEN":32849,"imir":32850,"Ġacadem":32851,"uvian":32852,"ĠIdeas":32853,"ĠCY":32854,"Ġants":32855,"Ġprostitutes":32856,"2005":32857,"Spring":32858,"ĠBarrel":32859,"ĠAunt":32860,"ĠLudwig":32861,"ĠHerm":32862,"PRO":32863,"obiles":32864,"rack":32865,"STER":32866,"ucket":32867,"Ġmun":32868,"Ġ419":32869,"ICES":32870,"Ġcardio":32871,"Ġtrenches":32872,"Nation":32873,"yahoo":32874,"Ġburd":32875,"Ġnost":32876,"Ġappropriations":32877,"ĠChili":32878,"Josh":32879,"GW":32880,"Ġoppressed":32881,"ĠBEFORE":32882,"Ġmurderous":32883,"Pen":32884,"achable":32885,"Ġrive":32886,"Ġculmin":32887,"Ġdefin":32888,"ĠMord":32889,"idate":32890,"ĠChim":32891,"ource":32892,"ĠElectro":32893,"orthy":32894,"Ġcalendars":32895,"regation":32896,"Ġretrospect":32897,"ĠTribal":32898,"ĠHes":32899,"Ġcran":32900,"Ġcreditor":32901,"Ġfibers":32902,"note":32903,"idays":32904,"ĠSebast":32905,"ĠKitty":32906,"Ġplainly":32907,"ĠLAPD":32908,"Ġtrumpet":32909,"ĠAppropriations":32910,"Hill":32911,"ĠVeget":32912,"296":32913,"lated":32914,"othes":32915,"ibrarian":32916,"Listen":32917,"nex":32918,"WHO":32919,"Ġshampoo":32920,"Ġclaimants":32921,"Ġisol":32922,"Ġunchecked":32923,"Ġmov":32924,"umo":32925,"ĠLens":32926,"Ġdiscreet":32927,"Ġrespectfully":32928,"Ġreclaimed":32929,"ĠHatt":32930,"thus":32931,"ĠFlo":32932,"Ġsumm":32933,"phas":32934,"ĠHaitian":32935,"Ġstrife":32936,"Ġabound":32937,"verted":32938,"Ġpatronage":32939,"449":32940,"Ġprelim":32941,"ĠZhu":32942,"ĠRevel":32943,"adic":32944,"Ġminded":32945,"ĠStability":32946,"Ġresembling":32947,"Ġvending":32948,"ischer":32949,"Ġkisses":32950,"Ġsuperiority":32951,"Ġinfinite":32952,"ISC":32953,"880":32954,"Ġappease":32955,"VO":32956,"404":32957,"ECH":32958,"gam":32959,"River":32960,"metal":32961,"determination":32962,"Cook":32963,"Ġbuds":32964,"Ġ(%)":32965,"ĠCreated":32966,"Ġstrut":32967,"Ġ425":32968,"Ġverte":32969,"ĠOrb":32970,"Ġweaving":32971,"261":32972,"Ġflyers":32973,"spons":32974,"ĠCovenant":32975,"570":32976,"Ġintangible":32977,"ĠBJ":32978,"ĠStead":32979,"ĠBrune":32980,"pain":32981,"independent":32982,"Ball":32983,"witch":32984,"ĠIon":32985,"Ġpupp":32986,"Cash":32987,"ĠConvert":32988,"Ġimpede":32989,"broad":32990,"onew":32991,"Ġsynergy":32992,"Ġcoined":32993,"620":32994,"ivalent":32995,"ĠInfect":32996,"ĠAqua":32997,"Together":32998,"ĠChemistry":32999,"ĠURL":33000,"ampion":33001,"Ġdeclarations":33002,"Ġaffirmative":33003,"umper":33004,"ĠTarant":33005,"Ġstereotype":33006,"Ġbookstore":33007,"incre":33008,"Ġchipset":33009,"Ġangst":33010,"Jose":33011,"laus":33012,"Ġheater":33013,"ipers":33014,"Ġeminent":33015,"hook":33016,"sticks":33017,"ĠCoul":33018,"Ġmildly":33019,"SG":33020,"Ġworm":33021,"Ġdisable":33022,"Ġperfume":33023,"ISTER":33024,"Ġgathers":33025,"ĠLotus":33026,"hyp":33027,"actus":33028,"Ġdistinctly":33029,"fifth":33030,"!),":33031,"ĠCrunch":33032,"Ġcohesive":33033,"Ġfortunately":33034,"Ġninety":33035,"Ġcartels":33036,"empl":33037,"Direct":33038,"Ġcommuting":33039,"ĠSX":33040,"ractive":33041,"Ġtranslating":33042,"ĠAQ":33043,"Ġslay":33044,"abuse":33045,"ĠProc":33046,"ĠCantor":33047,"ĠTas":33048,"Sir":33049,"Thom":33050,"ĠCHRIST":33051,"Ġreceptive":33052,"ĠCornel":33053,"Arab":33054,"Ġgrammar":33055,"Ġhandlers":33056,"Ġalloy":33057,"Ġthinly":33058,"adem":33059,"Ġproponent":33060,"ĠPVC":33061,"Ġstump":33062,"tom":33063,"rets":33064,"iciency":33065,"780":33066,"Ġ311":33067,"ĠClapper":33068,"ITAL":33069,"Ùħ":33070,"Ġnarrator":33071,"Ġblond":33072,"Ġintermittent":33073,"Ġcollabor":33074,"646":33075,"Ġmetast":33076,"Ġregeneration":33077,"ĠLegendary":33078,"Ġgenitals":33079,"Ġbartender":33080,"atson":33081,"Okay":33082,"Ġpassages":33083,"Ġsubstituted":33084,"orr":33085,"ALTH":33086,"Ġartic":33087,"Ġascent":33088,"Ġmatured":33089,"Ġterminology":33090,"served":33091,"ĠDeliver":33092,"Ġattic":33093,"anges":33094,"Ġrenaissance":33095,"Ġbleed":33096,"claimer":33097,"onse":33098,"Sec":33099,"Ġparticle":33100,"aneous":33101,"ateur":33102,"Ġzeal":33103,"ĠPets":33104,"Working":33105,"ĠRespect":33106,"Ġsermon":33107,"ĠProvided":33108,"Ġfilibuster":33109,"Ġabolished":33110,"reviewed":33111,"cription":33112,"Ġrevers":33113,"atered":33114,"435":33115,"Ġwhe":33116,"ometown":33117,"UFC":33118,"products":33119,"Winter":33120,"Ġ304":33121,"Ġsporadic":33122,"orough":33123,"EB":33124,"ĠAgric":33125,"ĠMTA":33126,"wic":33127,"Ġpowerless":33128,"Ġcarrot":33129,"ww":33130,"Ġabsorption":33131,"ĠTyphoon":33132,"Turkey":33133,"Ġproclaim":33134,"Ġhikers":33135,"Ġpractise":33136,"/$":33137,"Ġfingertips":33138,"Ġbaff":33139,"vu":33140,"Ġans":33141,"plug":33142,"Ġacquaintance":33143,"itement":33144,"ihar":33145,"Ġreluctantly":33146,"Ġforc":33147,"Ġguarant":33148,"ĠWanted":33149,"Walk":33150,"addle":33151,"unders":33152,"Fred":33153,"Ġtides":33154,"ĠBai":33155,"Ġcountering":33156,"raper":33157,"ursions":33158,"ĠFlav":33159,"pared":33160,"raised":33161,"Ñı":33162,"ĠDiff":33163,"Ġreload":33164,"ourses":33165,"ĠBurning":33166,"Ġwand":33167,"Ġledger":33168,"Ġcoughing":33169,"ĠLoren":33170,"Nazis":33171,"Ġcompile":33172,"Eight":33173,"icultural":33174,"yy":33175,"Ġ1932":33176,"Run":33177,"AIN":33178,"Ġattractiveness":33179,"ĠOmn":33180,"Ġconfer":33181,"compliance":33182,"Ġembed":33183,"Steven":33184,"2001":33185,"Ġdecre":33186,"Ġprompts":33187,"ĠHare":33188,"Ġleaping":33189,"Ġslaughtered":33190,"Ġforfeiture":33191,"342":33192,"Charl":33193,"CDC":33194,"ographically":33195,"Ġduplicate":33196,"Ġdistracting":33197,"examination":33198,"Ġpeas":33199,"Ġcatchy":33200,"Ġdives":33201,"ĠAda":33202,"Hay":33203,"Ġenthusiastically":33204,"Ġfunky":33205,"kay":33206,"EVA":33207,"Ġpsychologists":33208,"Ġancestry":33209,"iyah":33210,"ifter":33211,"nob":33212,"518":33213,"rouse":33214,"Ġchord":33215,"Ġcone":33216,"Ġbarracks":33217,"ĠRoyale":33218,"ĠIntegration":33219,"Ġtrolling":33220,"ĠSynt":33221,"andals":33222,"ĠGrain":33223,"ĠNeck":33224,"618":33225,"Ġrapist":33226,"pins":33227,"Ġwitty":33228,"Ġdehydration":33229,"arlane":33230,"Ġimmoral":33231,"Ġaccum":33232,"ĠMcAuliffe":33233,"slow":33234,"Ġinjust":33235,"Ġ1700":33236,"Ġcarbs":33237,"Ġintel":33238,"Non":33239,"isks":33240,"Tre":33241,"Ġinterviewer":33242,"sam":33243,"Ġdelve":33244,"Ġadmirable":33245,"ĠROM":33246,"ĠHispanics":33247,"Ġimpart":33248,"Ġunderrated":33249,"Ġvictimized":33250,"ĠPsych":33251,"ppings":33252,"Ġ610":33253,"pole":33254,"Ġdiner":33255,"ĠScale":33256,"Ġunforeseen":33257,"surprisingly":33258,"opus":33259,"ĠCOURT":33260,"Ġjuggling":33261,"ĠFacilities":33262,"Aid":33263,"ĠHPV":33264,"Ġcrawling":33265,"flu":33266,"etary":33267,"ĠHarriet":33268,"329":33269,"ĠSod":33270,"ĠBiological":33271,"birth":33272,"ribed":33273,"Ġpulses":33274,"396":33275,"eways":33276,"ĠAlma":33277,"nov":33278,"015":33279,"ricane":33280,"agna":33281,"Ak":33282,"ĠClaim":33283,"Ġpref":33284,"Ġinterfaces":33285,"ĠADHD":33286,"604":33287,"ZE":33288,"venture":33289,"Ġascend":33290,"ĠGou":33291,"Ġpriceless":33292,"redo":33293,"kw":33294,"Conf":33295,"Ġmah":33296,"Ġpoets":33297,"Ġstalk":33298,"Ġencamp":33299,"Ġhopped":33300,"Ġmelody":33301,"JECT":33302,"eming":33303,"Ġbewild":33304,"aternal":33305,"uchs":33306,"dit":33307,"ĠTransmission":33308,"Lake":33309,"Ġatoms":33310,"ĠThoughts":33311,"ilts":33312,"volume":33313,"Ġsocioeconomic":33314,"atisf":33315,"Ġnarr":33316,"zinski":33317,"ymes":33318,"episode":33319,"Ġinherit":33320,"Ġintending":33321,"Ġarenas":33322,"uras":33323,"burning":33324,"334":33325,"teenth":33326,"Ġsophistication":33327,"Ġscreenshots":33328,"Ġautistic":33329,"lip":33330,"paper":33331,"Ġmonopol":33332,"799":33333,"forms":33334,"ocrats":33335,"Ġpineapple":33336,"Ġbegs":33337,"Ġpersecuted":33338,"Ġsubscribed":33339,"Ġelic":33340,"ĠPRESIDENT":33341,"297":33342,"Ġpreferential":33343,"Ġpyramid":33344,"Ġconvergence":33345,"Ġwob":33346,"Project":33347,"ĠAluminum":33348,"ĠJPM":33349,"ĠBAT":33350,"Ġdolphins":33351,"018":33352,"healthy":33353,"ĠCG":33354,"ĠEffective":33355,"worm":33356,"ĠEas":33357,"olicited":33358,"ĠUSE":33359,"ĠCaval":33360,"Ġswirl":33361,"Ġspaghetti":33362,"Ġinward":33363,"Republican":33364,"Ġpublicized":33365,"Ġeconomical":33366,"Ġsalsa":33367,"ĠTitanic":33368,"dot":33369,"Ġcontro":33370,"ĠBangl":33371,"iban":33372,"ĠKlux":33373,"Ġhinges":33374,"610":33375,"Ġvalves":33376,"profits":33377,"Wonder":33378,"Ġorient":33379,"Ġsque":33380,"Ġprivatization":33381,"Obama":33382,"Thousands":33383,"ĠTasman":33384,"Ġmaze":33385,"eem":33386,"Ġsurvives":33387,"istant":33388,"Ġenriched":33389,"Ġencl":33390,"Ġcompliments":33391,"ĠShoes":33392,"Ġinsanity":33393,"consider":33394,"agog":33395,"Ġbaffled":33396,"Ġ°":33397,"ĠWordPress":33398,"qus":33399,"usual":33400,"stall":33401,"Deb":33402,"ĠRothschild":33403,"Ġesche":33404,"Ġsoph":33405,"Ġambiguous":33406,"negative":33407,"Ġdiscouraging":33408,"Alexander":33409,"319":33410,"Ġsummon":33411,"ipation":33412,"000000":33413,"Ġminimalist":33414,"Ġenraged":33415,"777":33416,"Ġplanetary":33417,"Ġthroughput":33418,"Ġtemperament":33419,"ĠNIC":33420,"ileged":33421,"minster":33422,"ĠPLEASE":33423,"Ġexagger":33424,"ĠDescription":33425,"Ġagitated":33426,"Ġimmortal":33427,"Ġrenders":33428,"Ġcharisma":33429,"sequ":33430,"Ġmajorities":33431,"Ġfreaking":33432,"ĠAdvice":33433,"Ġembodies":33434,"stable":33435,"Ġcustomization":33436,"started":33437,"ĠAutism":33438,"Ġparticipates":33439,"ĠUTC":33440,"Marco":33441,"Ġoddly":33442,"Ġantiqu":33443,"ĠPear":33444,"ĠFey":33445,"Ġcertify":33446,"Ġdisillusion":33447,"ĠPhysicians":33448,"obl":33449,"855":33450,"Ġelim":33451,"Ġ335":33452,"Ol":33453,"ĠSear":33454,"Ġnuances":33455,"past":33456,"Sa":33457,"ĠSlov":33458,"Ġfiltered":33459,"Ġanalogy":33460,"Ġformulate":33461,"Ġarmies":33462,"Ġpuls":33463,"fters":33464,"ilipp":33465,"ĠHOT":33466,"485":33467,"ĠAfghans":33468,"Ġtopical":33469,"ĠBunny":33470,"seeing":33471,"Ġeloqu":33472,"Ġkidneys":33473,"ĠDEM":33474,"pent":33475,"Ġhus":33476,"stores":33477,"ĠProtestant":33478,"Comm":33479,"label":33480,"Kings":33481,"ĠPurpose":33482,"â̦..":33483,"Ġaccumulating":33484,"calling":33485,"Ġgiveaways":33486,"Ġpredicament":33487,"Ġtyp":33488,"Ġtraveler":33489,"003":33490,"impro":33491,"fac":33492,"Ġmapped":33493,"itious":33494,"Ġmasculinity":33495,"Ġtantal":33496,"ĠDJs":33497,"Ġviewpoints":33498,"Burn":33499,"ĠWii":33500,"pak":33501,"ĠEB":33502,"Ġhinge":33503,"Ġfacets":33504,"Ġphotographic":33505,"Ġcompiling":33506,"Ġdecks":33507,"Ġarticulated":33508,"Federal":33509,"crim":33510,"llah":33511,"Ġfiasco":33512,"ĠLIST":33513,"oute":33514,"ĠDraper":33515,"ĠLaos":33516,"Ġclimbers":33517,"raph":33518,"ĠDek":33519,"WAY":33520,"Ġgreets":33521,"Ġoppressive":33522,"otor":33523,"otiation":33524,"\":[":33525,"Record":33526,"mining":33527,"Town":33528,"Ġfavorably":33529,"ĠYoutube":33530,"William":33531,"Ġlan":33532,"â̲":33533,"ĠSpec":33534,"Ġtranquil":33535,"ĠClient":33536,"oln":33537,"celona":33538,"Ġrealistically":33539,"Ġmisplaced":33540,"ĠBie":33541,"bye":33542,"Yo":33543,"465":33544,"ĠMadagascar":33545,"oplan":33546,"arist":33547,"Ġconfines":33548,"Ġï":33549,"awks":33550,"Ġpiracy":33551,"Ġunwelcome":33552,"Intel":33553,"Ġparanoid":33554,"CLAIM":33555,"Ġblush":33556,"united":33557,"Ġmotivational":33558,"ĠVII":33559,"Ġdiabetic":33560,"Ġantiv":33561,"Ġdissect":33562,"Ġbestselling":33563,"Ġfluffy":33564,"ĠRemote":33565,"Ġvert":33566,"Correct":33567,"Ġcolossal":33568,"Ġcontrasts":33569,"Ġcirca":33570,"ĠDamage":33571,"Ġunrel":33572,"Ġdiscrepancy":33573,"ĠCIS":33574,"ĠCLASS":33575,"ilty":33576,"Ġsynopsis":33577,"emed":33578,"cakes":33579,"ibal":33580,"inea":33581,"ienced":33582,"Ġimplicit":33583,"ĠLOOK":33584,"Ġsilhouette":33585,"affiliated":33586,"ĠHalo":33587,"377":33588,"Ġlyr":33589,"ĠVide":33590,"herent":33591,"Ġbadges":33592,"plays":33593,"orea":33594,"Ġjammed":33595,"cancer":33596,"ĠYep":33597,"racted":33598,"ĠDisability":33599,"Ġfooth":33600,"friends":33601,"Ġbloated":33602,"Bet":33603,"ĠAntioch":33604,"Ġintrodu":33605,"Ġannexed":33606,"ivism":33607,"ĠFlickr":33608,"pants":33609,"Ġinterruption":33610,"645":33611,"ĠIly":33612,"ĠOss":33613,"ĠAMA":33614,"Ġpolitely":33615,"Ġnatives":33616,"Ġrushes":33617,"enges":33618,"ĠHarm":33619,"Ġdestroyer":33620,"ĠEstimates":33621,"Ġtransforms":33622,"Ġinvariably":33623,"Ġcac":33624,"iency":33625,"599":33626,"Ġconstitutionally":33627,"Ġrappers":33628,"ĠSettlement":33629,"icz":33630,"Ġhardened":33631,"citizens":33632,"Ġcircling":33633,"Ġtrapping":33634,"Ġguaranteeing":33635,"690":33636,"agher":33637,"Ġarcade":33638,"Ġfanc":33639,"Ġslapping":33640,"OPS":33641,"Ġmasse":33642,"Ġpudding":33643,"Jac":33644,"ĠGraphics":33645,"Ġuptake":33646,"?,":33647,"Fair":33648,"ĠSatan":33649,"uffy":33650,"ĠGuatem":33651,"ĠTransaction":33652,"Ġunlocking":33653,"ĠLINE":33654,"Ġapprehens":33655,"Ġglean":33656,"291":33657,"Ġexacerbate":33658,"ĠTrave":33659,"ĠTrop":33660,"Supp":33661,"Ġqueens":33662,"cart":33663,"Ġscrolling":33664,"Ġox":33665,"cone":33666,"Matthew":33667,"ĠDIRECT":33668,"Ġbacker":33669,"Ġthyroid":33670,"Sarah":33671,"ĠEDIT":33672,"ĠActivision":33673,"352":33674,"Ġreinforcements":33675,"Ġding":33676,"Ġplush":33677,"Ġpeanuts":33678,"ĠFant":33679,"ĠPediatrics":33680,"Ġaccommodating":33681,"ĠPractices":33682,"Answer":33683,"racial":33684,"ĠConstant":33685,"740":33686,"strength":33687,"apist":33688,"Ġsynthes":33689,"ĠLeap":33690,"ĠFabric":33691,"Ġbrainstorm":33692,"obia":33693,"Ġconception":33694,"Ġtuberculosis":33695,"Ġmajestic":33696,"ĠTitus":33697,"ĠTee":33698,"Ġlikeness":33699,"ĠSEA":33700,"lite":33701,"Ġ950":33702,"sufficient":33703,"Ġtrem":33704,"Ġharshly":33705,"Ġredacted":33706,"Ġwelding":33707,"Ġperplex":33708,"Ġpoetic":33709,"Ġinsignificant":33710,"Ġware":33711,"Ġwandered":33712,"Ġmete":33713,"ĠSTART":33714,"Ġweaponry":33715,"opsy":33716,"shadow":33717,"Ġobsc":33718,"hare":33719,"ĠOPEN":33720,"Ġdiligent":33721,"Girls":33722,"Ġinitials":33723,"Start":33724,"ĠBrookings":33725,"ombs":33726,"Ġlashes":33727,"essor":33728,"Ġgravy":33729,"ĠUbuntu":33730,"Tree":33731,"Ġ435":33732,"Ġcellar":33733,"Ġaquarium":33734,"ĠPodesta":33735,"361":33736,"ĠController":33737,"Ġeru":33738,"reasonable":33739,"Ġpermissions":33740,"725":33741,"Ġadministering":33742,"Ġflirt":33743,"Ġfleeting":33744,"asive":33745,"Ġsubcontract":33746,"Ġfascist":33747,"Ġcabbage":33748,"science":33749,"Ġboiler":33750,"ioned":33751,"Ġintegrates":33752,"Ġresidue":33753,"KEY":33754,"Ġwi":33755,"Ġsquared":33756,"Unless":33757,"Ġmute":33758,"ĠTuc":33759,"Ġverb":33760,"Gary":33761,"Ġexperimentation":33762,"fee":33763,"chini":33764,"Ġmarrow":33765,"ĠBalt":33766,"Ġnodded":33767,"tn":33768,"Ġmissionary":33769,"OTO":33770,"Ġoptimum":33771,"555":33772,"Ġwhipping":33773,"aunts":33774,"ĠScene":33775,"Ġcharacterize":33776,"Ġretrospective":33777,"Ġutilizes":33778,"Ġhastily":33779,"older":33780,"ĠPW":33781,"Ġsleepy":33782,"020":33783,"ĠAcid":33784,"Ġridiculously":33785,"Ġgigg":33786,"649":33787,"Ġcrus":33788,"ĠShame":33789,"ĠTorn":33790,"finding":33791,"IPS":33792,"Ġplat":33793,"ometers":33794,"Ġamphib":33795,"ellow":33796,"ĠSpecies":33797,"commercial":33798,"Ġvirgin":33799,"Ġdarn":33800,"Ġsorely":33801,"Ġrespondent":33802,"Ġray":33803,"ĠCONS":33804,"Ġunequivocally":33805,"server":33806,"Ġdrip":33807,"ĠRazor":33808,"Ban":33809,"ĠHMS":33810,"Ġhijab":33811,"ĠMuss":33812,"Ġsandy":33813,"Ġaversion":33814,"Ġoverarching":33815,"Ġultr":33816,"ĠIraqis":33817,"Ġuninterrupted":33818,"Ġrouting":33819,"Ġundone":33820,"independence":33821,"gra":33822,"ysics":33823,"inflammatory":33824,"cussion":33825,"ĠDefinitely":33826,"Ġelastic":33827,"peer":33828,"ĠGiov":33829,"ĠMandarin":33830,"Ġscratches":33831,"Ġphysicist":33832,"Ġbestowed":33833,"usually":33834,"OULD":33835,"igration":33836,"Human":33837,"Dead":33838,"osph":33839,"bott":33840,"doctoral":33841,"Ġbending":33842,"Ġconfigurations":33843,"psych":33844,"db":33845,"ĠUD":33846,"Ġarteries":33847,"orically":33848,"Ġblasphemy":33849,"jj":33850,"checking":33851,"adian":33852,"IRD":33853,"ĠDialogue":33854,"Ġshielded":33855,"ĠVox":33856,"Dave":33857,"Ġturb":33858,"ĠMassive":33859,"ĠBMI":33860,"ĠNF":33861,"uced":33862,"ickle":33863,"ishable":33864,"Ġembody":33865,"ÙĪ":33866,"Senior":33867,"ĠResult":33868,"try":33869,"egu":33870,"401":33871,"ĠLoyal":33872,"Ġperilous":33873,"Ġdissu":33874,"Ġmythology":33875,"ĠWax":33876,"Jesus":33877,"ĠMotorsport":33878,"Ġadvis":33879,"ĠAki":33880,"ISM":33881,"tested":33882,"Ġplag":33883,"Ġriches":33884,"ĠOCT":33885,"ĠLocke":33886,"BG":33887,"Ġ460":33888,"rawl":33889,"ĠTermin":33890,"Ġ295":33891,"Ġchopping":33892,"KT":33893,"Ġconverts":33894,"Ask":33895,"alse":33896,"ĠKeynes":33897,"Ġrefuted":33898,"Ġrabbits":33899,"Ġbilingual":33900,"urse":33901,"ĠSalad":33902,"odiac":33903,"Ġsolidly":33904,"Dam":33905,"Ġpp":33906,"rities":33907,"Rah":33908,"itness":33909,"Ġsixty":33910,"332":33911,"cold":33912,"Ġhindered":33913,"Ġclipped":33914,"Ġreceptor":33915,"ĠHoms":33916,"Ġdusk":33917,"Ġarchae":33918,"LR":33919,"Ġrods":33920,"Ġ257":33921,"ĠSith":33922,"ĠPumpkin":33923,"ellation":33924,"ĠWD":33925,"Ġdecriminal":33926,"Ġusable":33927,"Ġcheerful":33928,"ĠInform":33929,"Ġbrushes":33930,"vier":33931,"ĠBrush":33932,"590":33933,"boost":33934,"guided":33935,"ĠMJ":33936,"Ġsatirical":33937,"ortion":33938,"efficiency":33939,"Ġstrands":33940,"ĠWilde":33941,"Ġreproduce":33942,"verage":33943,"Ġlug":33944,"Ġhist":33945,"offer":33946,"Ġcollapses":33947,"Ġclerks":33948,"Ġairstrike":33949,"IPP":33950,"iscover":33951,"Ġnefarious":33952,"Ġstripe":33953,"Ġbona":33954,"ocon":33955,"Ġpunishments":33956,"ITED":33957,"ĠAltern":33958,"testing":33959,"Ġeerie":33960,"erous":33961,"Ġcaves":33962,"Ġcondemns":33963,"ĠDropbox":33964,"inese":33965,"axis":33966,"ĠRegistry":33967,"ĠMong":33968,"Ġbullies":33969,"Ġdocks":33970,"ĠAlter":33971,"rella":33972,"446":33973,"ĠDare":33974,"Ġvirtues":33975,"Ġdont":33976,"Value":33977,"ENE":33978,"received":33979,"Ġseaf":33980,"476":33981,"ilon":33982,"ĠKits":33983,"Ġrarity":33984,"Ġnurt":33985,"skin":33986,"ĠUL":33987,"ĠRegiment":33988,"terior":33989,"hate":33990,"ĠEstimated":33991,"ĠSilence":33992,"Ġorganism":33993,"ĠSigned":33994,"ĠIA":33995,"bite":33996,"Ġthicker":33997,"Ġeyeb":33998,"Ġjournalistic":33999,"ĠDisp":34000,"margin":34001,"Dri":34002,"Ġcomplexes":34003,"Ġimaginary":34004,"Ġrefuel":34005,"Ġmeticulous":34006,"Dub":34007,"Ġhaze":34008,"860":34009,"Ġproverbial":34010,"Ġozone":34011,"cale":34012,"resent":34013,"Ġdiscrete":34014,"boats":34015,"Ġ343":34016,"ĠRET":34017,"Ġsailor":34018,"hair":34019,"gear":34020,"Ġmalt":34021,"Ġpeach":34022,"ĠRabb":34023,"699":34024,"318":34025,"ĠVerge":34026,"Fin":34027,"ĠMighty":34028,"ierce":34029,"403":34030,"Ġdisenfranch":34031,"bass":34032,"nice":34033,"Ġsinks":34034,"ĠLaugh":34035,"367":34036,"ĠZur":34037,"Ġtravers":34038,"ĠMystery":34039,"onsense":34040,"ĠMonarch":34041,"Ġleapt":34042,"ergy":34043,"porate":34044,"display":34045,"ilet":34046,"Ġendemic":34047,"Bern":34048,"Ġpulmonary":34049,"Ġbroch":34050,"ĠManziel":34051,"Lyn":34052,"Repe":34053,"lda":34054,"hands":34055,"Ġtroublesome":34056,"Jordan":34057,"UTION":34058,"ĠALP":34059,"ĠLEG":34060,"Ġreconnaissance":34061,"ĠRNA":34062,"letters":34063,"ĠYounger":34064,"ĠLW":34065,"ĠSensor":34066,"388":34067,"Ġwielding":34068,"spr":34069,"Ġancestral":34070,"331":34071,"OTH":34072,"ĠAxis":34073,"irement":34074,"ĠCompact":34075,"voice":34076,"Ġpercussion":34077,"Ġendeav":34078,"Kate":34079,"ĠJACK":34080,"ĠMagnus":34081,"Ġinterconnected":34082,"ĠTraff":34083,"demon":34084,"Ġardent":34085,"ĠSomers":34086,"andum":34087,"346":34088,"heartedly":34089,"ayne":34090,"Design":34091,"melon":34092,"ĠCarib":34093,"Ġ1935":34094,"intention":34095,"cape":34096,"cend":34097,"organic":34098,"373":34099,"ĠRevival":34100,"ĠBLACK":34101,"Ġaspiration":34102,"yellow":34103,"bodied":34104,"Ġcrave":34105,"ĠIntelligent":34106,"ĠUnique":34107,"tab":34108,"386":34109,"ĠNess":34110,"Official":34111,"Stay":34112,"Ġcreat":34113,"iliary":34114,"rified":34115,"ĠPok":34116,"Ġabolition":34117,"Ka":34118,"ĠCourage":34119,"ĠDickens":34120,"rophic":34121,"ĠFAR":34122,"Ġfurnished":34123,".âĢĵ":34124,"rete":34125,"Ġvaginal":34126,"hner":34127,"ĠLONG":34128,"imates":34129,"ĠLiter":34130,"ĠMeasures":34131,"ĠBelg":34132,"\"-":34133,"ĠRaider":34134,"enario":34135,"rification":34136,"ĠFISA":34137,"ĠStab":34138,"Ġnar":34139,"mund":34140,"Tenn":34141,"Ġwakes":34142,"Ġcharg":34143,"okers":34144,"assment":34145,"Ġsiph":34146,"Ġludicrous":34147,"670":34148,"Ġcompositions":34149,"Ġpinnacle":34150,"ĠRankings":34151,"ĠTelescope":34152,"secure":34153,"Ġib":34154,"Ġaptly":34155,"paste":34156,"ĠJUST":34157,"RD":34158,"herry":34159,"sung":34160,"Ġmig":34161,"naires":34162,"Ġmigrated":34163,"Base":34164,"Ġamazingly":34165,"Ġunregulated":34166,"published":34167,"ĠPIT":34168,"ĠMissile":34169,"extreme":34170,"ĠAlone":34171,"skilled":34172,"ĠRamp":34173,"Ġcamer":34174,"Ġflyer":34175,"Ġbrewers":34176,"ĠReference":34177,"ĠMOV":34178,"ĠLep":34179,"Ġentitle":34180,"ivals":34181,"ĠPIN":34182,"Ġbatches":34183,"Ġunexplained":34184,"Ġenergies":34185,"Ġblurred":34186,"enged":34187,"orig":34188,"WF":34189,"olves":34190,"ĠPicks":34191,"ĠTwice":34192,"arranted":34193,"Ġmembrane":34194,"ĠMoonlight":34195,"Ġsulfur":34196,"Ġpurposely":34197,"Ġfumes":34198,"Ġ(#":34199,"onics":34200,"ivities":34201,"rollers":34202,"Ġflattering":34203,"felt":34204,"Ġintoxication":34205,"Bridge":34206,"ĠFallout":34207,"Ġcreatively":34208,"Ġpsychologically":34209,"Ġdespicable":34210,"gae":34211,"820":34212,"VERS":34213,"Ġtidal":34214,"Ġcarbohydrates":34215,"strip":34216,"Ġgravitational":34217,"Ġfeds":34218,"ĠZhao":34219,"legates":34220,"Ġ307":34221,"String":34222,"ĠRepair":34223,"Ġ1928":34224,"orses":34225,"atography":34226,"Boston":34227,"Ġasymm":34228,"ĠSomebody":34229,"Van":34230,"ĠSovereign":34231,"Ġnotoriety":34232,"Ġsimulate":34233,"ĠDiscussion":34234,"ĠTransition":34235,"Ġcopying":34236,"antage":34237,"ĠRodrig":34238,"Ġindifference":34239,"Ġ580":34240,"Ġastronomical":34241,"Ġscrews":34242,"840":34243,"inates":34244,"ĠStreaming":34245,"Ġentit":34246,"ĠLiterature":34247,"369":34248,"805":34249,"OTS":34250,"о":34251,"img":34252,"inness":34253,"Ġreverber":34254,"Ġpartition":34255,"Short":34256,"Ġmoist":34257,"Ġspoof":34258,"ĠDesire":34259,"orce":34260,"Ġcrammed":34261,"Ġunfor":34262,"Pan":34263,"ingen":34264,"Ġrelat":34265,"Mother":34266,"ĠGn":34267,"altern":34268,"Ġresurg":34269,"Ġcramped":34270,"ĠCitadel":34271,"Ġlaureate":34272,"Ġanalys":34273,"Ġnuns":34274,"ĠTie":34275,"activ":34276,"ĠSurprisingly":34277,"ĠProtective":34278,"ĠRedemption":34279,"Ġendlessly":34280,"Ġfists":34281,"spl":34282,"ĠKron":34283,"ĠExamples":34284,"Especially":34285,"Ġprejud":34286,"ĠSchwar":34287,"Ġ237":34288,"ĠPlants":34289,"ĠUNDER":34290,"Ġlasers":34291,"Ġsher":34292,"Ġgoddess":34293,"Ġwipes":34294,"409":34295,"ĠGTA":34296,"Ġhybrids":34297,"rowd":34298,"ĠMILL":34299,"ĠNUM":34300,"ĠGeek":34301,"ĠTWO":34302,"ĠTimbers":34303,"Ġresembled":34304,"ĠGRE":34305,"Bring":34306,"Ġcompressed":34307,"ĠOral":34308,"379":34309,"Ġwrench":34310,"LCS":34311,"Ġhomosexual":34312,"Kelly":34313,"Ġhump":34314,"ĠSicily":34315,"Ġperished":34316,"aos":34317,"doesn":34318,"scrib":34319,"Charlie":34320,"Ġshuffle":34321,"372":34322,"cedented":34323,"402":34324,"Ġtiers":34325,"Ġinteracted":34326,"ĠHG":34327,"ĠJere":34328,"ĠBRA":34329,"ĠDOC":34330,"things":34331,"Ġfaiths":34332,"Ġgirlfriends":34333,"Ġfortified":34334,"develop":34335,"ĠKus":34336,"iability":34337,"rase":34338,"iotics":34339,"ĠChern":34340,"boxes":34341,"abol":34342,"idan":34343,"emon":34344,"ĠJudaism":34345,"ĠSituation":34346,"ĠGrimm":34347,"Ġgou":34348,"ĠVictim":34349,"backer":34350,"Ġanimosity":34351,"ĠHorizons":34352,"ĠKazakh":34353,"Ġgrossly":34354,"ĠTac":34355,"yg":34356,"366":34357,"Ġcheaply":34358,"Ġformulated":34359,"ĠDangerous":34360,"offensive":34361,"Ġsauces":34362,"Ġkeyboards":34363,"666":34364,"Ġcanopy":34365,"Inc":34366,"astered":34367,"iesel":34368,"Ġadv":34369,"currency":34370,"Ġscapego":34371,"plings":34372,"ĠBDS":34373,"Ġstrangely":34374,"today":34375,"ĠEgyptians":34376,"Ġcoron":34377,"often":34378,"ĠTransformers":34379,"ĠAfterwards":34380,"reated":34381,"Ġpoisonous":34382,"Ġgeographically":34383,"Ġmell":34384,"Cross":34385,"Ġdeductible":34386,"ĠZionist":34387,"Ġcutter":34388,"ĠRP":34389,"ĠImag":34390,"Ġoverflow":34391,"358":34392,"ĠADD":34393,"bones":34394,"Ġflattened":34395,"ĠGREEN":34396,"Ġlaure":34397,"haps":34398,"ĠCellular":34399,"kens":34400,"363":34401,"ĠSmash":34402,"ĠSpeak":34403,"ĠMaiden":34404,"Ġgreedy":34405,"ĠManit":34406,"Ġfacet":34407,"ĠGPA":34408,"Ġracks":34409,"popular":34410,"322":34411,"ĠBars":34412,"avement":34413,"359":34414,"Ġpomp":34415,"Ġregisters":34416,"Fs":34417,"ĠLoving":34418,"ĠTaxi":34419,"concert":34420,"ĠArchae":34421,"Ġcurls":34422,"ĠSpit":34423,"ĠLIFE":34424,"Ġinvade":34425,"rolog":34426,"wreck":34427,"Ġconflicted":34428,"Ġ970":34429,"Ġexiled":34430,"Ġchew":34431,"udging":34432,"Ġexper":34433,"ĠFt":34434,"rius":34435,"ĠXer":34436,"~":34437,"Ġbandwagon":34438,"Fore":34439,"Cat":34440,"Ġoverflowing":34441,"Ġradios":34442,"Much":34443,"Ġfacilitates":34444,"ĠCaf":34445,"ĠQing":34446,"Use":34447,"Ġmang":34448,"Ġpissed":34449,"ĠOuter":34450,"within":34451,"ĠSchr":34452,"ĠSherlock":34453,"Ġ336":34454,"Ġcasc":34455,"chens":34456,"incent":34457,"Ġcultivating":34458,"ampions":34459,"Ġwasteful":34460,"adays":34461,"sets":34462,"ĠLF":34463,"watching":34464,"Ġabandonment":34465,"ĠJesuit":34466,"Ġlegislatures":34467,"regnancy":34468,"ĠColt":34469,"Ġinterns":34470,"Ġundertook":34471,"ĠIPA":34472,"ĠInstall":34473,"nsics":34474,"washer":34475,"Ġbeginners":34476,"ĠDiseases":34477,"Ġlimp":34478,"ĠESA":34479,"Basically":34480,"Ġprud":34481,"LED":34482,"Ġgrease":34483,"ousel":34484,"Ġrotten":34485,"ĠCele":34486,"facts":34487,"ĠLouie":34488,"ĠISI":34489,"481":34490,"Ġsett":34491,"Ġtoug":34492,"ĠReck":34493,"OUNT":34494,"ĠFou":34495,"Ġinhibitor":34496,"gru":34497,"bane":34498,"1980":34499,"ĠPanc":34500,"Ġsuperficial":34501,"Ġauthoritative":34502,"ĠVOL":34503,"790":34504,"Ġcrusade":34505,"airy":34506,"Ġemphatically":34507,"Ġflourishing":34508,"Ġ416":34509,"Ġheroine":34510,"inx":34511,"Ġanch":34512,"stretched":34513,"ĠRegener":34514,"ĠAncient":34515,"evaluate":34516,"Ġantibody":34517,"ĠEston":34518,"ĠAeg":34519,"Ġboldly":34520,"TN":34521,"ĠPercentage":34522,"Ġ747":34523,"Ġrapt":34524,"ĠEdited":34525,"Earth":34526,"phal":34527,"ĠXXX":34528,"arling":34529,"ĠReligion":34530,"Ġ503":34531,"forces":34532,"Ġendpoint":34533,"Miller":34534,"Ba":34535,"Ġdisappears":34536,"andre":34537,"Ġconnector":34538,"407":34539,"ĠTOUR":34540,"aura":34541,"ĠRazer":34542,"UPDATE":34543,"Ġcalib":34544,"original":34545,"ĠMonkey":34546,"Ir":34547,"Ġexacerb":34548,"killing":34549,"Ġforb":34550,"native":34551,"Ġpoking":34552,"Ġveiled":34553,"mails":34554,"Ġalphabet":34555,"Ġawkwardly":34556,"ĠNames":34557,"Ġspiders":34558,"ĠParam":34559,"ĠColour":34560,"Ġunification":34561,"ĠPione":34562,"Ġoffend":34563,"Ġscoff":34564,"ĠSAR":34565,"ĠBuildings":34566,"edes":34567,"ĠAke":34568,"Ġfirmware":34569,"Madison":34570,"policy":34571,"ĠComputing":34572,"ĠRW":34573,"Ġfluent":34574,"Ġdece":34575,"Ġswore":34576,"Ġrestaur":34577,"Ġpresses":34578,"ophon":34579,"Ġphilosopher":34580,"ften":34581,"Ġintruder":34582,"Ġleng":34583,"ĠCowboy":34584,"cled":34585,"Ġmeticulously":34586,"ĠPair":34587,"ĠEND":34588,"Ġcapsules":34589,"Ġauxiliary":34590,"Ġverses":34591,"Ġsheltered":34592,"Ġexplorer":34593,"ĠWolverine":34594,"auts":34595,"Ġinhibitors":34596,"ĠPeng":34597,"ĠValve":34598,"imar":34599,"Ġchuck":34600,"ĠRecording":34601,"Ġardu":34602,"Test":34603,"Ġinterven":34604,"Ġchrome":34605,"months":34606,"tap":34607,"ĠManz":34608,"format":34609,"ĠBalkans":34610,"Ġannex":34611,"uder":34612,"ĠAAC":34613,"Ġdisturbances":34614,"354":34615,"asms":34616,"ĠTad":34617,"puting":34618,"Ġfateful":34619,"imen":34620,"Ġaudi":34621,"ĠNewsweek":34622,"Around":34623,"Ġretribution":34624,"Ġsugars":34625,"Ġescapes":34626,"Ġlegitim":34627,"ĠProof":34628,"Ġmisogyn":34629,"cit":34630,"Ġclutching":34631,"exist":34632,"Ġrevol":34633,"Ġdiscs":34634,"discrimination":34635,"Ġstout":34636,"aline":34637,"ĠRandom":34638,"364":34639,"Ġapprehension":34640,"Ġmockery":34641,"Ġfossils":34642,"ĠStress":34643,"Ġbenefic":34644,"exc":34645,"lude":34646,"Small":34647,"Ġgh":34648,"Ġobserves":34649,"ĠSUP":34650,"Ġbrewer":34651,"ĠESP":34652,"Ġomitted":34653,"multiple":34654,"Ġminimizing":34655,"Ġtaco":34656,"Ġindifferent":34657,"medi":34658,"available":34659,"Ġ252":34660,"Ġsanity":34661,"ĠCookie":34662,"mostly":34663,"near":34664,"NASA":34665,"Ġlowly":34666,"seless":34667,"Ġobsess":34668,"itous":34669,"Dispatch":34670,"Ġcanyon":34671,"Ġbriefs":34672,"Say":34673,"ĠNato":34674,"ĠSpend":34675,"Ġ242":34676,"ĠEthernet":34677,"Ġmatte":34678,"ĠStim":34679,"hetics":34680,"Ġflourished":34681,"389":34682,"ĠMcA":34683,"695":34684,"Ġoverr":34685,"Ġtorment":34686,"Ġpirate":34687,"ĠJohann":34688,"roversial":34689,"ĠUnemployment":34690,"breakers":34691,"ĠMessages":34692,"tones":34693,"Ġtagging":34694,"Ġfrog":34695,"Jewish":34696,"Ġmessenger":34697,"Ġexasper":34698,"ernaut":34699,"Ġnarrower":34700,"ĠCatalyst":34701,"ĠSecrets":34702,"Ġadj":34703,"ĠFug":34704,"Ġaura":34705,"Ġtherape":34706,"mber":34707,"Ġcaliphate":34708,"Ġretreating":34709,"ĠComput":34710,"Ġburying":34711,"Ġail":34712,"Ġgriev":34713,"lins":34714,"825":34715,"tten":34716,"ifully":34717,"ĠTrials":34718,"igma":34719,"Ġ1914":34720,"Ġcoordinates":34721,"ocusing":34722,"ĠFeng":34723,"ĠWhale":34724,"Ġshorten":34725,"Ġcorrectness":34726,"evil":34727,"network":34728,"Ġreactive":34729,"assuming":34730,"ĠLaksh":34731,"games":34732,"Ġruining":34733,"excluding":34734,"annels":34735,"º":34736,"Ġrubbed":34737,"aleb":34738,"flex":34739,"iped":34740,"ĠLimit":34741,"allowed":34742,"ĠDMV":34743,"ĠLD":34744,"Ġstamina":34745,"conduct":34746,"Ġmislead":34747,"lib":34748,"ĠEminem":34749,"Ġpayoff":34750,"Ġkernel":34751,"Ġsweeps":34752,"Ġsonic":34753,"ĠKodi":34754,"unique":34755,"Ġsurrog":34756,"Michigan":34757,"Ġattest":34758,"Ġdummy":34759,"ĠStellar":34760,"ĠSquadron":34761,"ĠHait":34762,"ĠSpirits":34763,"605":34764,"ĠHemisphere":34765,"legram":34766,"ĠRack":34767,"opol":34768,"Ġfreshwater":34769,"cession":34770,"Ġabort":34771,"ĠLOG":34772,"Ġfuzzy":34773,"Ġcrystall":34774,"illation":34775,"ĠFreddy":34776,"Ġsalvation":34777,"Ġjuxtap":34778,"weekly":34779,"usha":34780,"456":34781,"Ġ660":34782,"ĠGlacier":34783,"Ġnegatives":34784,"Ġillegitimate":34785,"ĠProtein":34786,"Moore":34787,"Der":34788,"Ġinfancy":34789,"Again":34790,"ALD":34791,"Leon":34792,"ĠIdeally":34793,"fresh":34794,"730":34795,"Ġgamb":34796,"Ġscrewed":34797,"wow":34798,"Ġembodied":34799,"ĠCinderella":34800,"341":34801,"ĠPiano":34802,"Ġbroccoli":34803,"Ġmats":34804,"ĠZheng":34805,"cream":34806,"anut":34807,"ĠZig":34808,"Columb":34809,"ĠTibetan":34810,"Death":34811,"Ġstren":34812,"ĠVertical":34813,"Ġratification":34814,"Ġprincipally":34815,"ELD":34816,"Ġforbid":34817,"Ġamalg":34818,"blind":34819,"auri":34820,"stery":34821,"Ġbarley":34822,"FBI":34823,"ĠHex":34824,"925":34825,"Domin":34826,"oat":34827,"Ġswayed":34828,"ĠKKK":34829,"ĠTaxes":34830,"Ġker":34831,"eeper":34832,"ĠAwakens":34833,"ĠPix":34834,"ĠKING":34835,"dc":34836,"Ren":34837,"Ġlegitimately":34838,"ĠTriumph":34839,"ĠSites":34840,"ĠSai":34841,"tl":34842,"painted":34843,"ĠWaiting":34844,"starting":34845,"parents":34846,"ĠDuo":34847,"eele":34848,"upper":34849,"ĠInvestig":34850,"Ġeighteen":34851,"Ġcorrelated":34852,"ĠCascade":34853,"acca":34854,"ĠAlph":34855,"ĠPolic":34856,"ĠEVs":34857,"Ġworthless":34858,"ĠIndust":34859,"auld":34860,"ĠYiannopoulos":34861,"ĠEzra":34862,"Ġmorphed":34863,"Ġoriginating":34864,"mania":34865,"Ġsparing":34866,"Ġextrem":34867,"cre":34868,"ults":34869,"mare":34870,"classified":34871,"Ġparachute":34872,"Ġmistrust":34873,"ONT":34874,"Mind":34875,"Ġthru":34876,"707":34877,"ĠTwain":34878,"Ġmelodies":34879,"ĠDanger":34880,"ĠDPS":34881,"Ġderive":34882,"Ġdissolution":34883,"Ġchildbirth":34884,"Ġ415":34885,"fork":34886,"solid":34887,"loads":34888,"ĠCGI":34889,"378":34890,"ĠShed":34891,"Face":34892,"Ġcomet":34893,"iceps":34894,"ĠReduction":34895,"Fly":34896,"jp":34897,"ĠAnimation":34898,"Luke":34899,"Ġabiding":34900,"Ġdevise":34901,"ĠAe":34902,"Ġflux":34903,"Ġbras":34904,"Ġfracturing":34905,"Ġinventive":34906,"ĠGranger":34907,"Ġsap":34908,"inducing":34909,"Ġreviewers":34910,"Officers":34911,"ĠWHY":34912,"Ġamplify":34913,"Ġentr":34914,"Ġslit":34915,"457":34916,"Ġreformed":34917,"ĠPhi":34918,"Ġtempt":34919,"Ġcontradiction":34920,"585":34921,"ĠMaced":34922,"371":34923,"kinson":34924,"robe":34925,"ĠHunters":34926,"astern":34927,"criminal":34928,"jew":34929,"Ġdecentralized":34930,"bands":34931,"Ġavatar":34932,"ĠBarrier":34933,"Ġcharacterization":34934,"student":34935,"Ġgays":34936,"Ġspecialize":34937,"ĠJudging":34938,"Ġinitiation":34939,"Ġshove":34940,"Ġpirates":34941,"Ġfictitious":34942,"ĠPoker":34943,"ĠElsa":34944,"ĠTECH":34945,"handedly":34946,"Ġglued":34947,"Ġclinically":34948,"Ġinaccessible":34949,"Ġderegulation":34950,"Ġprohib":34951,"Ġdangling":34952,"Ġnoses":34953,"Ġstash":34954,"اØ":34955,"ESH":34956,"Ġmonstrous":34957,"Ġcrept":34958,"ĠCharm":34959,"Ġbeh":34960,"Ġshuts":34961,"Ġ236":34962,"imedia":34963,"445":34964,"Du":34965,"Ġafar":34966,"ĠRout":34967,"Ġflares":34968,"Utah":34969,"Ġ808":34970,"Ġjewels":34971,"2004":34972,"Ġrecal":34973,"Gas":34974,"ĠExcellent":34975,"Ġpitfalls":34976,"ĠDrawing":34977,"viously":34978,"angered":34979,"changes":34980,"Ġpasture":34981,"talking":34982,"Ġinequ":34983,"Ġbicycl":34984,"Cost":34985,"423":34986,"bard":34987,"Ġanterior":34988,"ecast":34989,"CHR":34990,"397":34991,"masters":34992,"706":34993,"ĠFinish":34994,"Yet":34995,"study":34996,"ĠCogn":34997,"Ġloaf":34998,"Ġspatial":34999,"ĠParad":35000,"batch":35001,"Ġvents":35002,"Ġspins":35003,"ĠAddiction":35004,"Ġcondone":35005,"Ġproble":35006,"English":35007,"ĠRomans":35008,"ĠSaying":35009,"ĠKling":35010,"Universal":35011,"ivist":35012,"Ġskirm":35013,"Ġ2500":35014,"Ġ263":35015,"aired":35016,"ĠMartian":35017,"ĠCompensation":35018,"lation":35019,"ĠSalam":35020,"LGBT":35021,"ĠDart":35022,"strike":35023,"vasive":35024,"ILLE":35025,"Ġimaginative":35026,"ĠEuph":35027,"Financial":35028,"Ġholog":35029,"orah":35030,"crit":35031,"ĠOswald":35032,"512":35033,"ĠUri":35034,"Ġdiscrepancies":35035,"Ġbeads":35036,"ĠShots":35037,"Mem":35038,"Ġhunts":35039,"Ġsubtly":35040,"Ġ470":35041,"ĠVigil":35042,"Ġsew":35043,"ĠBurma":35044,"igm":35045,"ighed":35046,"swe":35047,"Ġ251":35048,"Ġdeceit":35049,"Ġphysi":35050,"iflower":35051,"ĠCert":35052,"Ġchewing":35053,"rax":35054,"ĠMER":35055,"icient":35056,"Les":35057,"Ġ390":35058,"Ġperjury":35059,"Ġfiltering":35060,"770":35061,"Ġpoppy":35062,"Ġbland":35063,"ĠNasa":35064,"Ġorbiting":35065,"ĠRipple":35066,"otal":35067,"ĠRyu":35068,"ĠShap":35069,"ĠJian":35070,"Ġpiv":35071,"ĠNeptune":35072,"rary":35073,"Ġunavoidable":35074,"Ġguideline":35075,"Ġwaterfall":35076,"inators":35077,"ĠLogic":35078,"ĠPlug":35079,"role":35080,"Ġalterations":35081,"ĠSett":35082,"ĠFeld":35083,"Ġfreezes":35084,"Ġbedrock":35085,"ĠVIEW":35086,"ovation":35087,"Ġneedless":35088,"ĠIU":35089,"ignant":35090,"ĠConfeder":35091,"316":35092,"fine":35093,"Ġjars":35094,"gotten":35095,"Bron":35096,"Ġmindfulness":35097,"imating":35098,"Ġhysteria":35099,"Ġhurried":35100,"Ġinfantry":35101,"ĠNYU":35102,"tags":35103,"Penn":35104,"Ġtracing":35105,"ĠSwing":35106,"ĠIo":35107,"Ġreckoned":35108,"ĠRecall":35109,"ĠVersion":35110,"314":35111,"Ġecology":35112,"Ġarmoured":35113,"Ġresonance":35114,"970":35115,"Ġvigilance":35116,"Ġrede":35117,"ĠBohem":35118,"Ġchau":35119,"ĠDevi":35120,"Ġtru":35121,"))":35122,"Put":35123,"Ġflavored":35124,"ĠClown":35125,"Senate":35126,"ĠScandinavian":35127,"mable":35128,"Residents":35129,"ĠFranchise":35130,"Ġprecincts":35131,"Prem":35132,"ĠNeutral":35133,"coal":35134,"Ġdelinqu":35135,"Mus":35136,"UME":35137,"Ġtedious":35138,"roots":35139,"ĠCondition":35140,"ĠIntercept":35141,"017":35142,"itives":35143,"Ġdefinitively":35144,"Ġobliter":35145,"Ġclandestine":35146,"Ġstagnation":35147,"Ġblindness":35148,"abiding":35149,"Ġremix":35150,"feeding":35151,"Ġunrecogn":35152,"2003":35153,"960":35154,"381":35155,"Ġbulky":35156,"xia":35157,"ivered":35158,"inic":35159,"ĠSoci":35160,"ĠYards":35161,"Ġhides":35162,"Film":35163,"Ġtestim":35164,"Ġblacklist":35165,"Deep":35166,"Standard":35167,"ĠClash":35168,"Ġriddled":35169,"Ġdiseng":35170,"ĠTRE":35171,"ĠIDs":35172,"Ġmigrating":35173,"protect":35174,"Ġgraded":35175,"Ġvaguely":35176,"ĠCharacter":35177,"382":35178,"ĠMOD":35179,"Eng":35180,"Ġmobilized":35181,"Ġsincerity":35182,"Ġ317":35183,"sighted":35184,"ownt":35185,"ĠâĢİ":35186,"umpy":35187,"Ġitching":35188,"ĠVerd":35189,"cook":35190,"Ġsimulator":35191,"players":35192,"Early":35193,"infeld":35194,"Ġmaximizing":35195,"Philipp":35196,"ĠPhotoshop":35197,"Ġdestroys":35198,"Ġbefriend":35199,"Ġfilthy":35200,"ĠIncident":35201,"gha":35202,"Ġcomplicity":35203,"Ġmessing":35204,"YA":35205,"ĠNegro":35206,"adows":35207,"374":35208,"Ġpip":35209,"cean":35210,"Ġ1924":35211,"Sent":35212,"represent":35213,"Ġdeems":35214,"ĠRue":35215,"Ġtitanium":35216,"Ġmanners":35217,"â̦â̦":35218,"bare":35219,"Ġusur":35220,"mma":35221,"ĠPanda":35222,"ulus":35223,"ĠSlav":35224,"324":35225,"ĠMole":35226,"^":35227,"micro":35228,"foreign":35229,"lest":35230,"ocular":35231,"ĠUniv":35232,"ĠFrag":35233,"Ġshepherd":35234,"Ġelectron":35235,"ĠFSA":35236,"Ġunl":35237,"dose":35238,"Ġimmersion":35239,"ĠDeL":35240,"Ġbiomedical":35241,"Anna":35242,"Ġskillet":35243,"Ġrecre":35244,"Ġtrillions":35245,"voy":35246,"Ġnormalized":35247,"radio":35248,"cue":35249,"urbed":35250,"Ġthinkers":35251,"328":35252,"327":35253,"ĠForge":35254,"505":35255,"Ġunbearable":35256,"olini":35257,"Ġdisinfect":35258,"Ġshaving":35259,"Ġtoxicity":35260,"453":35261,"Ġheterosexual":35262,"Baltimore":35263,"Ġstool":35264,"lr":35265,"ĠMk":35266,"Ġantidote":35267,"Dark":35268,"810":35269,"Ġirritated":35270,"ĠSUPPORT":35271,"Chance":35272,"bent":35273,"ĠZelda":35274,"ĠPenguin":35275,"ifled":35276,"Ġarte":35277,"705":35278,"Ġcondol":35279,"izza":35280,"ĠCK":35281,"Ġprojector":35282,"ravings":35283,"Ġ1919":35284,"Ġburner":35285,"ĠSchwarz":35286,"Oregon":35287,"Ġridicule":35288,"Ġinstructional":35289,"Ġ\"#":35290,"ĠDign":35291,"Ġkitten":35292,"Ġconstit":35293,"iration":35294,"Speed":35295,"ecycle":35296,"ĠFalse":35297,"ĠDealer":35298,"Could":35299,"655":35300,"outside":35301,"Ġworldview":35302,"Ġ246":35303,"Ġspitting":35304,"595":35305,"MN":35306,"ĠComes":35307,"ingu":35308,"Ġenzymes":35309,"Ġcompass":35310,"Ġexclaimed":35311,"ĠMalays":35312,"Ġ1916":35313,"Ġcoloring":35314,"Ġrepeats":35315,"Ġsoils":35316,"Ġtrivia":35317,"ĠIsles":35318,"Const":35319,"ĠFiction":35320,"665":35321,"Ġcriminality":35322,"ĠZi":35323,"384":35324,"ĠWilderness":35325,"ĠCanary":35326,"ĠVs":35327,"и":35328,"ĠAPIs":35329,"Ġbehest":35330,"Ġeb":35331,"ĠHipp":35332,"Ġpreempt":35333,"Ġevoke":35334,"Ġinept":35335,"tele":35336,"447":35337,"ĠGarmin":35338,"Ġpursuits":35339,"351":35340,"Ġcliché":35341,"ĠJihad":35342,"Ġ308":35343,"ĠSnake":35344,"ĠAnnounce":35345,"Nearly":35346,"!'\"":35347,"Ġ1927":35348,"saw":35349,"Ġabhor":35350,"Plan":35351,"rawled":35352,"ĠRiy":35353,"ensor":35354,"Fal":35355,"quick":35356,"odynamic":35357,"Ġsubstitution":35358,"Ġprovoking":35359,"Operation":35360,"rupulous":35361,"Ġsweetness":35362,"folk":35363,"ĠDefault":35364,"Ġstarved":35365,"ĠPrinting":35366,"urious":35367,"ĠTracker":35368,"them":35369,"Ġleth":35370,"Ġemptied":35371,"Ġfootprints":35372,"ilian":35373,"Ġbattalion":35374,"Ġprophet":35375,"Ġrailing":35376,"Ġhect":35377,"rouch":35378,"lees":35379,"Ġideologies":35380,"Ġ254":35381,"ĠGods":35382,"ĠAvalon":35383,"Ġfrontrunner":35384,"ĠPork":35385,"ĠPipe":35386,"Ġscaven":35387,"Ġming":35388,"Ġerg":35389,"Ġ520":35390,"Ġhatched":35391,"asant":35392,"ĠHI":35393,"Ġpend":35394,"Ġ288":35395,"Prom":35396,"achev":35397,"ĠEcology":35398,"enforcement":35399,"467":35400,"dule":35401,"Ġrealism":35402,"ĠTypes":35403,"USB":35404,"utra":35405,"ĠHiroshima":35406,"Ġcontradicted":35407,"393":35408,"ĠDSL":35409,"Ġtherein":35410,"ĠReconstruction":35411,"Ġ243":35412,"irled":35413,"479":35414,"ĠWhats":35415,"Currently":35416,"ĠPOWER":35417,"ĠHiro":35418,"ĠBreath":35419,"ĠYourself":35420,"Ġlantern":35421,"376":35422,"É":35423,"ĠHumans":35424,"Lady":35425,"Ġdissemination":35426,"ecake":35427,"ĠChao":35428,"flat":35429,"Ġinspecting":35430,"stration":35431,"Ġidentifiable":35432,"CV":35433,"ĠLobby":35434,"function":35435,"Roll":35436,"DIV":35437,"Tell":35438,"Ġfasc":35439,"ĠAOL":35440,"HM":35441,"Keefe":35442,"Ġporous":35443,"Ġsmoot":35444,"existence":35445,"ĠDeg":35446,"Ġdivor":35447,"isner":35448,"allas":35449,"Bloomberg":35450,"Ġdictators":35451,"ĠGeh":35452,"Ġsilicone":35453,"Ġdab":35454,"Ġmashed":35455,"Ġpric":35456,"might":35457,"ĠBLM":35458,"Ġpatriarch":35459,"Microsoft":35460,"ĠAds":35461,"Ġcoronary":35462,"ĠContrary":35463,"Ġdra":35464,"ĠStarted":35465,"Ġbuckle":35466,"lear":35467,"accept":35468,"Within":35469,"bd":35470,"interested":35471,"bia":35472,"POR":35473,"motion":35474,"ĠFounders":35475,"ĠCassandra":35476,"ĠPassion":35477,"Ġbehavioural":35478,"ĠHealing":35479,"Ġmarkings":35480,"Ġsnowball":35481,"Ġridiculed":35482,"phase":35483,"Ġunto":35484,"aque":35485,"uggets":35486,"Ġfrantically":35487,"Ġcoward":35488,"Ġinconvenient":35489,"Taking":35490,"Afee":35491,"Ġtwisting":35492,"930":35493,"ĠSieg":35494,"ĠGit":35495,"Ġcurs":35496,"ĠGlas":35497,"ĠSignificant":35498,"Ġachieves":35499,"Ġpreferably":35500,"Ġcondensed":35501,"Ġfetus":35502,"Ġunivers":35503,"Ġpse":35504,"Access":35505,"Ġintertwined":35506,"been":35507,"quit":35508,"ĠLEGO":35509,"Ġimagining":35510,"454":35511,"Ġplains":35512,"sequently":35513,"pull":35514,"Fast":35515,"Pot":35516,"yles":35517,"AIR":35518,"Ġblatantly":35519,"eki":35520,"ilated":35521,"ĠMembership":35522,"Ġ262":35523,"Ġ}":35524,"Ġexcavation":35525,"Ġethn":35526,"addin":35527,"Ġfoundational":35528,"ceptions":35529,"ĠViet":35530,"exempt":35531,"Ġmicrophones":35532,"Ġ244":35533,"778":35534,"Ġdwar":35535,"attery":35536,"502":35537,"ĠKik":35538,"Ġinspir":35539,"ĠMaximum":35540,"Ġvengeance":35541,"Ġetched":35542,"outine":35543,"552":35544,"Ġunicorn":35545,"gged":35546,".�":35547,"ĠBlackwell":35548,"ĠStatue":35549,"Ġdissidents":35550,"ĠKaine":35551,"Ġdeforestation":35552,"ĠScholar":35553,"Ġpleasantly":35554,"ÑĤ":35555,"398":35556,"ĠRUN":35557,"arent":35558,"Ġundeniably":35559,"Ġtechnologically":35560,"Ġconsciously":35561,"ĠEther":35562,"Ġproportional":35563,"Ġlaund":35564,"ĠRye":35565,"Ġambiguity":35566,"Ġunmist":35567,"Terror":35568,"ciplinary":35569,"ĠImproved":35570,"hesis":35571,"Ġcooker":35572,"elsen":35573,"Ġguerrilla":35574,"opped":35575,"ATURE":35576,"Ġrequ":35577,"Ġunprepared":35578,"Ġcamel":35579,"Ġfitt":35580,"Sex":35581,"edged":35582,"Ġrecurrent":35583,"ctuary":35584,"ĠCompare":35585,"ĠServing":35586,"Tri":35587,"Ġtransient":35588,"ĠBees":35589,"Ġcovenant":35590,"Ġfantasies":35591,"Ġespresso":35592,"draft":35593,"baugh":35594,"Ġdemocratically":35595,"ĠBans":35596,"ĠManual":35597,"ĠTurtle":35598,"ennett":35599,"achy":35600,"ĠClim":35601,"Ġdescending":35602,"Ġprow":35603,"Ġinconsistencies":35604,"Player":35605,"Ġoblivious":35606,"ĠWonderland":35607,"nav":35608,"aughter":35609,"Ġlod":35610,"Ġ403":35611,"ĠPolaris":35612,"ĠLeia":35613,"ĠInfantry":35614,"Sy":35615,"ĠMeter":35616,"Ġautoimmune":35617,"Ġdiagnoses":35618,"Ġtrespass":35619,"011":35620,"wrong":35621,"ĠGREAT":35622,"Ġtelescopes":35623,"shows":35624,"Pac":35625,"olation":35626,"Ġclerics":35627,"Ġdissenting":35628,"406":35629,"Ġetiquette":35630,"Ġdeterrence":35631,"765":35632,"Ġove":35633,"Has":35634,"Pak":35635,"ा":35636,"ĠNec":35637,"Ġsociology":35638,"witz":35639,"Ġkittens":35640,"Ġcontinual":35641,"Ġoverlapping":35642,"Ġmonks":35643,"ĠMechanical":35644,"Captain":35645,"ocial":35646,"ĠFalling":35647,"ĠCorrection":35648,"ĠTrouble":35649,"Ġslog":35650,"Ġ253":35651,"Ġemanating":35652,"Ġwidest":35653,"PROV":35654,"Japanese":35655,"urat":35656,"Ġboxed":35657,"ĠCases":35658,"Ġjarring":35659,"Fix":35660,"'?":35661,"ĠStrateg":35662,"Republic":35663,"ovy":35664,"362":35665,"ĠMothers":35666,"Ġstreaks":35667,"Ġlocalized":35668,"ĠONLY":35669,"Ġeh":35670,"ĠObject":35671,"Ġstub":35672,"Fre":35673,"ĠScarlet":35674,"Ġmultip":35675,"ĠMaul":35676,"ĠProblems":35677,"cest":35678,"Ġmortal":35679,"Ġarche":35680,"ulet":35681,"Ġfuller":35682,"ĠGER":35683,"Si":35684,"mr":35685,"ĠPowerful":35686,"boxing":35687,"ĠPeer":35688,"Jean":35689,"ĠTF":35690,"Ġplural":35691,"optim":35692,"Jimmy":35693,"ĠFriendly":35694,"Mex":35695,"Ġdepri":35696,"PK":35697,"Ġwaitress":35698,"eph":35699,"arrass":35700,"ikawa":35701,"feel":35702,"Finally":35703,"fourth":35704,"394":35705,"conom":35706,"VT":35707,"Ġeleg":35708,"ivot":35709,"Ġharsher":35710,"ĠPepe":35711,"ĠImpl":35712,"Ġankles":35713,"idity":35714,"ĠPrepare":35715,"Rather":35716,"Ġconservatism":35717,"Ġunquestion":35718,"ribution":35719,"ĠPatent":35720,"ĠDeluxe":35721,"ĠAE":35722,"007":35723,"Ġprag":35724,"bg":35725,"Ġpalate":35726,"Ġintric":35727,"ossom":35728,"Ġspac":35729,"ĠSpotlight":35730,"Seven":35731,"amacare":35732,"ĠGotham":35733,"Ġencompass":35734,"Ġnicer":35735,"ĠLauder":35736,"Ġscaff":35737,"worn":35738,"442":35739,"Ġpropri":35740,"443":35741,"ĠCompos":35742,"ĠIniti":35743,"inth":35744,"Ġrehe":35745,"Prov":35746,"Ġgri":35747,"ossip":35748,"ĠModest":35749,"quiet":35750,"Ġwealthier":35751,"Ġ241":35752,"icum":35753,"Ġcommunism":35754,"Ġhelpers":35755,"Ġbellig":35756,"Ġ405":35757,"uttered":35758,"Ġbitterness":35759,"nl":35760,"474":35761,"Ġvitality":35762,"blank":35763,"ĠLeth":35764,"PAC":35765,"326":35766,"ĠNapoleon":35767,"Ġ299":35768,"ĠReviews":35769,"ĠSect":35770,"Ġstrongh":35771,"ĠTube":35772,"Ġwoodland":35773,"Ġhumming":35774,"411":35775,"Alpha":35776,"Ġundet":35777,"Ġmounts":35778,"Officials":35779,"igning":35780,"830":35781,"ĠStamp":35782,"ubby":35783,"424":35784,"Ġoutlandish":35785,"Ġjerk":35786,"Ġradiant":35787,"Ġcubes":35788,"Director":35789,"Ġatro":35790,"vous":35791,"Sab":35792,"Ġpretended":35793,"Ġ620":35794,"975":35795,"Sham":35796,"Ġpotassium":35797,"ĠAttention":35798,"gly":35799,"opens":35800,"ĠWorker":35801,"porter":35802,"Ġsplendid":35803,"embed":35804,"Je":35805,"ĠMeal":35806,"Ġsurname":35807,"Usually":35808,"Ġtimer":35809,"Ġweave":35810,"irin":35811,"ĠGenetics":35812,"ensual":35813,"Ġmerry":35814,"Ġapprehend":35815,"utsche":35816,"strate":35817,"Ġsupplementary":35818,"ĠRoundup":35819,"upid":35820,"Ġmiraculous":35821,"ĠHUN":35822,"Ġglaciers":35823,"weed":35824,"ĠSuggest":35825,"XL":35826,"authors":35827,"Ġbarking":35828,"ĠUKIP":35829,"leased":35830,"ĠRAD":35831,"Ġfide":35832,"Ġphen":35833,"Ġscanners":35834,"Parents":35835,"ĠBlaze":35836,"Ġtweaking":35837,"Ġelaborated":35838,"Ġsusp":35839,"iscovered":35840,"Ġthighs":35841,"Ġradicals":35842,"ULTS":35843,"aggressive":35844,"endants":35845,"Hon":35846,"Ġcorrecting":35847,"391":35848,"pps":35849,"ĠTerritories":35850,"Ġconferred":35851,"crazy":35852,"utor":35853,"ĠSurvival":35854,"Ġbrowsers":35855,"ĠConflict":35856,"pn":35857,"Ġdeprive":35858,"riage":35859,"ilan":35860,"à¦":35861,"949":35862,"Congratulations":35863,"radical":35864,"ĠHits":35865,"powerful":35866,"Ġcrypt":35867,"745":35868,"ĠRegistrar":35869,"ophile":35870,"ĠElement":35871,"cooked":35872,"ĠTwilight":35873,"Ġdemos":35874,"IER":35875,"Ġstricken":35876,"Magic":35877,"abby":35878,"ĠSack":35879,"ĠShrine":35880,"Nev":35881,"Probably":35882,"ĠWisdom":35883,"ulpt":35884,"opher":35885,"Ġcolonel":35886,"atl":35887,"Tem":35888,"kun":35889,"ĠIndie":35890,"Putin":35891,"jection":35892,"areth":35893,"ĠBullet":35894,"Ġsmartest":35895,"ĠEsper":35896,"Ġproficiency":35897,"Ġcessation":35898,"Ġmars":35899,"ĠDATA":35900,"sup":35901,"Ġostr":35902,"Jane":35903,"Ġpathogens":35904,"hd":35905,"ĠNK":35906,"Ġhorribly":35907,"regulated":35908,"Ġesteemed":35909,"ĠChinatown":35910,"Ġvibration":35911,"Ġoverboard":35912,"ĠRhod":35913,"Ġfeces":35914,"otation":35915,"Ġcryptic":35916,"Bal":35917,"OPER":35918,"Ġaffirmation":35919,"Ġmenstrual":35920,"Ġuntold":35921,"Ġanecdotes":35922,"ĠHOUSE":35923,"Ġcape":35924,"311":35925,"ittance":35926,"ĠRemy":35927,"ĠWaves":35928,"ĠCOVER":35929,"ordinate":35930,"Ġrestricts":35931,"Samsung":35932,"Ġplantations":35933,"olver":35934,"Better":35935,"ĠExplos":35936,"Ġnasal":35937,"ĠSyri":35938,"ĠPerl":35939,"Ġlatency":35940,"othermal":35941,"Sweet":35942,"ĠRyzen":35943,"ĠYuri":35944,"Ġsmack":35945,"Ġcrow":35946,"aniel":35947,"iological":35948,"Ġmonk":35949,"Ġtutorial":35950,"ĠAure":35951,"Ġcliffs":35952,"ameron":35953,"umers":35954,"ĠMour":35955,"Ġunorthodox":35956,"Ġgulf":35957,"Ġintrusive":35958,"ĠVIII":35959,"ĠFF":35960,"Ġenlarged":35961,"Ġspheres":35962,"ĠCheap":35963,"ĠAmend":35964,"Ġ::":35965,"Ġpacing":35966,"ĠStartup":35967,"ĠDating":35968,"racist":35969,"ĠDivine":35970,"Ġpollen":35971,"ĠMeaning":35972,"ĠLei":35973,"ĠMOT":35974,"ĠARC":35975,"legate":35976,"Ġbrav":35977,"Ross":35978,"redit":35979,"414":35980,"ringe":35981,"perhaps":35982,"SPA":35983,"Southern":35984,"Front":35985,"undrum":35986,"Ġassorted":35987,"ĠDawkins":35988,"ĠWrap":35989,"Ġconsequential":35990,"ĠFuji":35991,"458":35992,"Ġunst":35993,"Bon":35994,"acter":35995,"Trade":35996,"ingers":35997,"ĠClin":35998,"Ġstimul":35999,"arah":36000,"inois":36001,"urdy":36002,"Ġobsessive":36003,"Zone":36004,"Ġprimitive":36005,"unctions":36006,"Ġadapter":36007,"Ġassures":36008,"Daddy":36009,"Ġunsatisf":36010,"441":36011,"Ġ1910":36012,"Ġsecondly":36013,"truth":36014,"RED":36015,"040":36016,"Pope":36017,"venants":36018,"Ġestim":36019,"Ġhemorrh":36020,"Ġexcruciating":36021,"459":36022,"Ġboils":36023,"ieved":36024,"Storm":36025,"Ġmanifestation":36026,"Ġinsulated":36027,"fb":36028,"Ġclassify":36029,"Mbps":36030,"Ġinclination":36031,"Ġaur":36032,"Ġpolarized":36033,"Ġoccupations":36034,"Secretary":36035,"Ġcustomizable":36036,"scribe":36037,"Ġadjunct":36038,"Ġ1922":36039,"rived":36040,"ocative":36041,"Friends":36042,"Oak":36043,"Ġpsyche":36044,"Ġwrinkles":36045,"anthrop":36046,"Ġcoercion":36047,"enos":36048,"Ġvariability":36049,"hma":36050,"phot":36051,"ĠXander":36052,"ĠDiss":36053,"Ġtigers":36054,"ahoo":36055,"focus":36056,"rical":36057,"grow":36058,"Ġseminal":36059,"Ġdisciples":36060,"Cas":36061,"Hundreds":36062,"Ġscissors":36063,"correct":36064,"Ġfascism":36065,"imoto":36066,"Ġnudity":36067,"charg":36068,"Ġrusty":36069,"ĠLyndon":36070,"Ġanomalies":36071,"onial":36072,"ĠiCloud":36073,"Ġannoy":36074,"Ġdistortion":36075,"Lou":36076,"ĠGiul":36077,"eyes":36078,"870":36079,"uum":36080,"ĠUltr":36081,"Action":36082,"cigarette":36083,"igators":36084,"kj":36085,"Ġ323":36086,"uine":36087,"Score":36088,"Ġmans":36089,"Security":36090,"Ġarom":36091,"ĠBoards":36092,"Ġwrists":36093,"602":36094,"Ġastronomy":36095,"Ġresin":36096,"width":36097,")/":36098,"Ġconcurrent":36099,"unless":36100,"606":36101,"ĠMagnet":36102,"Ġauthorizing":36103,"ĠJunk":36104,"atical":36105,"Ġauthent":36106,"zac":36107,"413":36108,"ĠGrape":36109,"Ġcircled":36110,"Ġooz":36111,"Ġvisceral":36112,"ointment":36113,"Ġincendiary":36114,"ĠBourbon":36115,"Ġgimmick":36116,"vette":36117,"Stan":36118,"Ġdetachment":36119,"488":36120,"Ġmisogyny":36121,"Ġenlight":36122,"utic":36123,"Ġinquire":36124,"ĠBEL":36125,"ascular":36126,"ĠWasserman":36127,"Dallas":36128,"Ġconstellation":36129,"Ġdystopian":36130,"504":36131,"ĠOptical":36132,"Ġsilhou":36133,"Girl":36134,"ĠGong":36135,"ĠHighest":36136,"????????":36137,"Sav":36138,"ocity":36139,"leted":36140,"Ġattrition":36141,"ĠExpedition":36142,"ĠKilled":36143,"501":36144,"ONES":36145,"dat":36146,"Ġglyphosate":36147,"Ġplugs":36148,"Ġlact":36149,"Fla":36150,"fps":36151,"riger":36152,"Ġparagraphs":36153,"Ġinnate":36154,"ĠFoo":36155,"aternity":36156,"ĠGry":36157,"Ġoneself":36158,"642":36159,"Iowa":36160,"oodle":36161,"ĠCoconut":36162,"ĠChess":36163,"ommel":36164,"Ġmagnesium":36165,"Ġairliner":36166,"Ġexceedingly":36167,"ĠCreator":36168,"YouTube":36169,"Ġsleeper":36170,"Ġlonging":36171,"ĠPercy":36172,"Ġmatrix":36173,"Ġâľ":36174,"Ġbarren":36175,"Mrs":36176,"Ġinvading":36177,"Ġincom":36178,"Ġemperor":36179,"Ġip":36180,"irie":36181,"Ġpredictably":36182,"ĠBless":36183,"Ġsuperpower":36184,":-":36185,"Ġpropensity":36186,"easy":36187,"educ":36188,"ĠPolly":36189,"Ġcumbersome":36190,"Ġcollide":36191,"016":36192,"Ġtransports":36193,"Ġscraps":36194,"below":36195,"Ġhairs":36196,"mentation":36197,"Ġevolves":36198,"ĠFallen":36199,"Ġunsurprisingly":36200,"Ġcuff":36201,"Ġ249":36202,"mental":36203,"ĠCamel":36204,"Ġ337":36205,"Clinton":36206,"Ġdecad":36207,"ĠSTEP":36208,"ĠTestament":36209,"Ġirresistible":36210,"ĠACE":36211,"Ġhamm":36212,"ĠTerr":36213,"Ġcaul":36214,"iggins":36215,"Ġproficient":36216,"resp":36217,"Ġheirs":36218,"Ġ321":36219,"dress":36220,"ĠClothing":36221,"Ġ560":36222,"Ġ264":36223,"ĠRobb":36224,"Ġfrail":36225,"Ġoptimizing":36226,"615":36227,"ĠRefuge":36228,"rowth":36229,"washing":36230,"Ġgenders":36231,"indu":36232,"ĠNAT":36233,"Ġleans":36234,"Ġeyed":36235,"Ġhilar":36236,"vice":36237,"wolf":36238,"Ġfatig":36239,"ococ":36240,"ĠCarry":36241,"Community":36242,"Clark":36243,"itably":36244,"sv":36245,"448":36246,"Ġnumer":36247,"Ġ1925":36248,"ĠBehavioral":36249,"ĠScream":36250,"Ġgeek":36251,"rake":36252,"ĠTTC":36253,"Ġadditives":36254,"ĠBye":36255,"ylon":36256,"Ġfoliage":36257,"ateral":36258,"rapnel":36259,"Science":36260,"Ġrecollection":36261,"thening":36262,"ĠUbisoft":36263,"ĠLur":36264,"ĠOkinawa":36265,"ĠProvision":36266,"ferred":36267,"ĠGrounds":36268,"Ġhops":36269,"aterial":36270,"Ġacad":36271,"Ġengulf":36272,"ĠApex":36273,"frequency":36274,"relations":36275,"ĠCorvette":36276,"ĠRepeat":36277,"Ġanew":36278,"Ġhes":36279,"ĠLair":36280,"ĠPSP":36281,"foundation":36282,"Band":36283,"ĠPublisher":36284,"Ġreciprocal":36285,"Ġ287":36286,"Ġpir":36287,"Adams":36288,"Ġprostitute":36289,"ĠMecca":36290,"ectomy":36291,"Ġskew":36292,"ĠLol":36293,"Voice":36294,"ĠCalais":36295,"ISION":36296,"rue":36297,"Ġgaping":36298,"prot":36299,"Ġ6000":36300,"Ġtilted":36301,"Ġgoofy":36302,"Stand":36303,"Ġfellows":36304,"Ġcurly":36305,"ĠPOW":36306,"Ġlore":36307,"Ġinhabited":36308,"ĠIdentification":36309,"Metro":36310,"Ġdispel":36311,"Ġinvoking":36312,"Ġdeleting":36313,"Ġstigmat":36314,"ĠDalai":36315,"Ġequate":36316,"Ġmascara":36317,"endered":36318,"ĠNYT":36319,"ĠCommittees":36320,"rians":36321,"ĠOlympus":36322,"ĠQR":36323,"ĠDrinking":36324,"Ġbatt":36325,"andr":36326,"computer":36327,"Senator":36328,"ĠTwist":36329,"ĠNoise":36330,"Ġcheesy":36331,"Ġ1931":36332,"Ġtyranny":36333,"Ġnegligible":36334,"ĠBok":36335,"Ġwebpage":36336,"ĠHEAD":36337,"ĠNovel":36338,"Ġquarry":36339,"Ġexpressive":36340,"Ġforgiving":36341,"Among":36342,"asin":36343,"ĠSuc":36344,"Democrats":36345,"795":36346,"Ġaback":36347,"¨":36348,"ĠNeon":36349,"392":36350,"ĠRNC":36351,"ĠPROC":36352,"sein":36353,"Ros":36354,"Ġemot":36355,"ĠASA":36356,"ĠSeb":36357,"ĠExtended":36358,"atern":36359,"Ġpsychedelic":36360,"Fil":36361,"ĠOrwell":36362,"ĠSOS":36363,"Ġconceive":36364,"Ġhobbies":36365,"Ġspecimens":36366,"ĠTEXT":36367,"sometimes":36368,"Mario":36369,"orpor":36370,"ĠTemporary":36371,"Ġapocalypse":36372,"Ġcounterproductive":36373,"ĠQUEST":36374,"ĠCargo":36375,"Amb":36376,"Ġoptic":36377,"groups":36378,"Ġparanoia":36379,".?":36380,"sounding":36381,"mediately":36382,"System":36383,"ubi":36384,"Ġuttered":36385,"Ġgraphs":36386,"âĢĭâĢĭ":36387,"Ġscientifically":36388,"Ġbluntly":36389,"Ġhopping":36390,"Fun":36391,"ĠSUPER":36392,"Ġrobe":36393,"VB":36394,"ĠQuote":36395,"Ġincarnation":36396,"Ġtreadmill":36397,"Ġ1915":36398,"Ġbart":36399,"669":36400,"Ġhoc":36401,"Ġ309":36402,"Ġimprovis":36403,"Ġhut":36404,"Ġmixer":36405,"ĠCt":36406,"span":36407,"Ġwatered":36408,"Ġpatriot":36409,"Ġdehyd":36410,"laughs":36411,"ĠFancy":36412,"ĠVoc":36413,"Ġintellect":36414,"ĠTid":36415,"Ġnesting":36416,"Tel":36417,"Ġ()":36418,"letter":36419,"ĠSeems":36420,"Ops":36421,"ĠContents":36422,"ript":36423,"hani":36424,"Ġrecru":36425,"Ġpickups":36426,"repair":36427,"Throughout":36428,"bear":36429,"Ġconquered":36430,"656":36431,"Ġmalf":36432,"Ġordained":36433,"755":36434,"ĠReprodu":36435,"brain":36436,"ĠOuts":36437,"ĠWage":36438,"Ru":36439,"________":36440,"ĠLAW":36441,"ĠWass":36442,"Ġcomplication":36443,"Fri":36444,"Ġregener":36445,"Wait":36446,"577":36447,"Ġmisconception":36448,"Ġbombardment":36449,"Ġunloaded":36450,"Ġdictionary":36451,"IU":36452,"025":36453,"etically":36454,"ĠNarr":36455,"repe":36456,"Ġassigning":36457,"Rail":36458,"Ġnotebooks":36459,"Ġingest":36460,"Ġrpm":36461,"Ġalienated":36462,"ĠCredits":36463,"Ġindis":36464,"ĠGathering":36465,"aration":36466,"-+-+-+-+":36467,"Ġori":36468,"Ġsr":36469,"ndra":36470,"Ġlibertarian":36471,"Ġcoerced":36472,"ording":36473,"Ġtranqu":36474,"Ġelbows":36475,"549":36476,"Ġping":36477,"ĠRELE":36478,"ĠYanuk":36479,"Ġmaneuvers":36480,"ĠTrojan":36481,"IFIED":36482,"ĠViolent":36483,"è":36484,"Ġlest":36485,"Ġarrows":36486,"frog":36487,"anty":36488,"WB":36489,"ĠSeen":36490,"648":36491,"Ġclutter":36492,"ĠBender":36493,"Ġpessim":36494,"ĠTeg":36495,"Asian":36496,"IFIC":36497,"Ġexponential":36498,"Ġsponge":36499,"rite":36500,"ĠDAM":36501,"Ġtacit":36502,"ĠZoom":36503,"Ġolds":36504,"Ġonward":36505,"ĠSandwich":36506,"missible":36507,"isol":36508,"940":36509,"Ġinciner":36510,"ĠTrick":36511,"Ġawakening":36512,"Ġdart":36513,"ĠCouch":36514,"respons":36515,"ĠElephant":36516,"ĠPluto":36517,"ĠTags":36518,"itcher":36519,"644":36520,"702":36521,"Ġelectrons":36522,"ĠMyth":36523,"ĠAad":36524,"Danny":36525,"Ġcraw":36526,"ĠCertification":36527,"Ġtending":36528,"Ġpellets":36529,"Ġamused":36530,"ĠAuschwitz":36531,"ĠAppl":36532,"iris":36533,"ashion":36534,"walking":36535,"Ġabnorm":36536,"Cro":36537,"?:":36538,"ĠIcelandic":36539,"ĠAvailability":36540,"Ġcann":36541,"Opt":36542,"buster":36543,"ĠQuartz":36544,"Executive":36545,"tracks":36546,"igel":36547,"MIT":36548,"ĠTracking":36549,"Ġconditioned":36550,"Ġsampled":36551,"ĠGenius":36552,"Ġsubstit":36553,"ĠSiberia":36554,"Ġfrequ":36555,"historic":36556,"okin":36557,"OWS":36558,"1500":36559,"warts":36560,"ĠEtsy":36561,"licks":36562,"ĠSmooth":36563,"unity":36564,"515":36565,"Ġperk":36566,"aida":36567,"forts":36568,"ĠUA":36569,"RIC":36570,"Spain":36571,"ĠWired":36572,"cuts":36573,"Ġfurnace":36574,"ĠTOTAL":36575,"ĠTables":36576,"662":36577,"Fab":36578,"Ġquaint":36579,"ĠWorlds":36580,"ĠCabin":36581,"atche":36582,"List":36583,"ĠVO":36584,"Ġkeyword":36585,"Ġ258":36586,"Farm":36587,"timer":36588,"ĠVolt":36589,"Build":36590,"pressed":36591,"*,":36592,"Ġ324":36593,"aiman":36594,"TING":36595,"Ġsneaking":36596,"cery":36597,"Ġcrib":36598,"ĠIllust":36599,"later":36600,"Ġcompar":36601,"Ġpropulsion":36602,"647":36603,"ĠTrails":36604,"Ġperiphery":36605,"steel":36606,"Ġvividly":36607,"ĠConver":36608,"eatured":36609,"427":36610,"463":36611,"Ġapprox":36612,"spin":36613,"Ġconfigured":36614,"inside":36615,"razy":36616,"account":36617,"anye":36618,"riend":36619,"Ġbows":36620,"809":36621,"ĠDEF":36622,"ĠRez":36623,"Fans":36624,"ĠDF":36625,"Ġstains":36626,"ĠAtom":36627,"ĠConce":36628,"ĠTOM":36629,"ĠELECT":36630,"Ġdisappro":36631,"019":36632,"afia":36633,"ĠTemperature":36634,"Ġextracts":36635,"fab":36636,"Ġunsur":36637,"Ġseasoning":36638,"Ty":36639,"KB":36640,"Ġposit":36641,"Ġlocality":36642,"1200":36643,"cour":36644,"izons":36645,"hh":36646,"506":36647,"ĠDLC":36648,"iago":36649,"Ġcorpses":36650,"iddling":36651,"Mayor":36652,"Ġsimplistic":36653,"Ġlibel":36654,"Ġalmonds":36655,"Ġswast":36656,"Change":36657,"ĠJoker":36658,"MAR":36659,"ĠScully":36660,"Ġmailbox":36661,"VIDEO":36662,"ĠKyoto":36663,"esley":36664,"ĠIncredible":36665,"youtube":36666,"Ġinequalities":36667,"Ġbolts":36668,"Ġbothering":36669,"Ġattentive":36670,"ĠSparrow":36671,"Ġdiaper":36672,"Ġfanbase":36673,"Ġuncont":36674,"Ap":36675,"ĠQi":36676,"Price":36677,"471":36678,"Ġpearl":36679,"wid":36680,"899":36681,"ĠPony":36682,"casting":36683,"Ġinhabit":36684,"Ġunve":36685,"Ġinsur":36686,"ĠWee":36687,"658":36688,"Ġeffected":36689,"gger":36690,"Ġinstallments":36691,"imilar":36692,"FU":36693,"Ġinfertility":36694,"climate":36695,"HEAD":36696,"fashion":36697,"ĠTHEY":36698,"jc":36699,"Ġsatisf":36700,"ĠGuidelines":36701,"Ġinsure":36702,"ĠRSA":36703,"Ġvirt":36704,"Ġinterpre":36705,"Joshua":36706,"ĠShut":36707,"Ġtestimonies":36708,"Ñģ":36709,"untary":36710,"417":36711,"Ġbeck":36712,"ĠMilky":36713,"ç":36714,"Ġsequels":36715,"Ġ281":36716,"ĠRibbon":36717,"Ġroomm":36718,"Ġsynchron":36719,"452":36720,"Ġ1926":36721,"Ġhawk":36722,"ĠDisorder":36723,"Ġbackstory":36724,"ĠNum":36725,"Ġoverheard":36726,"technical":36727,"Jud":36728,"aii":36729,"Ġdecon":36730,"ĠRape":36731,"ĠWarrant":36732,"Ġpoop":36733,"spir":36734,"Country":36735,"Ġweld":36736,"Ġabuser":36737,"Ġ------":36738,"material":36739,"Ġpreserves":36740,"spring":36741,"Ġpuzzled":36742,"ĠDebate":36743,"Joseph":36744,"Ġ272":36745,"Blood":36746,"antry":36747,"Ġconverge":36748,"Ġimaginable":36749,"oward":36750,"545":36751,"Ġfug":36752,"Vision":36753,"075":36754,"Ġadoptive":36755,"Ġunknow":36756,"Stream":36757,"Ġaffili":36758,"ĠPUR":36759,"ĠWally":36760,"Ġgamer":36761,"Ġfart":36762,"stice":36763,"Ġcongen":36764,"н":36765,"685":36766,"orst":36767,"ĠATF":36768,"Ġml":36769,"ĠMozilla":36770,"Ġcalmed":36771,"bage":36772,"ĠVault":36773,"arkable":36774,"ĠGuan":36775,"Ġclueless":36776,"umatic":36777,"Ġshameless":36778,"Ġpreached":36779,"Ġmisconceptions":36780,"Ġanthology":36781,"Ġbiomass":36782,"ĠPs":36783,"tails":36784,"Ġexcessively":36785,"Ġextr":36786,"Davis":36787,"Ġgrounding":36788,"Ġshortcuts":36789,"ĠShift":36790,"ĠRew":36791,"ĠIllum":36792,"Ġincite":36793,"sense":36794,"ĠScouting":36795,"otos":36796,"respond":36797,"Ġbeware":36798,"gran":36799,"ĠXV":36800,"JM":36801,"ĠSounders":36802,"Ġ276":36803,"Ġshockingly":36804,"Ġgastrointestinal":36805,"erences":36806,"df":36807,"ĠNG":36808,"Ġdiscredited":36809,"Ġdemoral":36810,"Ġgladly":36811,"Tal":36812,"ĠPredator":36813,"708":36814,"Ġdoi":36815,"Ġdecentral":36816,"illin":36817,"printed":36818,"Ġinflicting":36819,"ribes":36820,"Ġsupper":36821,"abc":36822,"Ġgraz":36823,"980":36824,"Bull":36825,"Ġmillionaires":36826,"Ġvanity":36827,"imony":36828,"Ġbiologists":36829,"Ġalternating":36830,"Ġsleeps":36831,"Force":36832,"ĠPrinc":36833,"ĠTransgender":36834,"Ġ314":36835,"ĠProvide":36836,"enthal":36837,"Ġplum":36838,"Ġresurrect":36839,"CW":36840,"Ġinjure":36841,"ĠPerspective":36842,"ĠBei":36843,"Ġrestless":36844,"aciously":36845,"Ġchlor":36846,"catch":36847,"ĠLuigi":36848,"Ġinconsistency":36849,"Ġwhiff":36850,"Arizona":36851,"ustration":36852,"ĠRaid":36853,"ĠDemons":36854,"ĠVita":36855,":\"":36856,"Ġmigraine":36857,"ĠHamb":36858,"Ġwidget":36859,"451":36860,"Ġrandomized":36861,"etchup":36862,"ĠParticularly":36863,"Ġdiced":36864,"Ġperfected":36865,"roid":36866,"710":36867,"Ġreflections":36868,"Ġantioxidants":36869,"ĠLabel":36870,"Ġ326":36871,"igious":36872,"ĠEucl":36873,"608":36874,"Ġstrand":36875,"ĠDirt":36876,"ĠLift":36877,"suits":36878,"ĠControls":36879,"RAW":36880,"Ġcowardly":36881,"ĠUmb":36882,"Growing":36883,"mington":36884,"Ġ339":36885,"ĠCommit":36886,"Ġnonviolent":36887,"Ġcontaminants":36888,"Ġacrylic":36889,"ĠMAP":36890,"Ġ269":36891,"Ġdegrading":36892,"Ġmiracles":36893,"ĠEstablishment":36894,"despite":36895,"cry":36896,"Ġpauses":36897,"Ġmythical":36898,"Ġtwenties":36899,"Actually":36900,"phan":36901,"recorded":36902,"Ġunwillingness":36903,"engineering":36904,"avored":36905,"Ġdevout":36906,"item":36907,"Ġbunny":36908,"ĠMerchants":36909,"Ġconsumes":36910,"508":36911,"Ġlex":36912,"ĠClause":36913,"Ġchecklist":36914,"Sus":36915,"uther":36916,".#":36917,"Bit":36918,"uay":36919,"bf":36920,"Ġpopulace":36921,"Ġ316":36922,"Ġcombust":36923,"Ġnano":36924,"Ġpopul":36925,"Indust":36926,"Ġcapitalists":36927,"ĠFiles":36928,"Bang":36929,"Ġkosher":36930,"atile":36931,"Ġincrim":36932,"OVER":36933,"Ġmelee":36934,"ymph":36935,"ĠPupp":36936,"evin":36937,"ĠMolecular":36938,"Ġmisinterpret":36939,"vc":36940,"olithic":36941,"ĠSimpsons":36942,"Ġshrew":36943,"Ġselectively":36944,"ĠDrain":36945,"mittedly":36946,"conservative":36947,"True":36948,"Using":36949,"562":36950,"apon":36951,"Ġapprentice":36952,"Mas":36953,"ĠBattlefield":36954,"Ġfing":36955,"Ġconcoct":36956,"ĠVIS":36957,"ĠHuss":36958,"Ġdetects":36959,"ĠFriedrich":36960,"Ġlatitude":36961,"Custom":36962,"ĠÙ":36963,"ĠBones":36964,"whose":36965,"Ġredirected":36966,"aligned":36967,"ĠNeighbor":36968,"ĠAmen":36969,"ĠMarble":36970,"Beyond":36971,"Ġbiomark":36972,"Ġerroneous":36973,"Atlanta":36974,"Ġmasturb":36975,"ĠAssoci":36976,"Albert":36977,"Ġcigar":36978,"ĠFraz":36979,"ethe":36980,"skinned":36981,"Ford":36982,"throp":36983,"Acc":36984,"Ġtricked":36985,"Ġoverwhelm":36986,"Ġimplements":36987,"ĠGeForce":36988,"Ġbounces":36989,"Ġmoderator":36990,"910":36991,"ĠButterfly":36992,"ĠIllegal":36993,"ĠSubject":36994,"RET":36995,"ĠFreeze":36996,"ĠNewt":36997,"Ġuterus":36998,"696":36999,"Ġ267":37000,"tk":37001,"Ġdodged":37002,"liam":37003,"Ġparasite":37004,"obal":37005,"ĠHubble":37006,"Ġtheology":37007,"âĢĶ\"":37008,"height":37009,"Ale":37010,"employment":37011,"ĠWallet":37012,"cessive":37013,"Ġ404":37014,"Ġsimilarity":37015,"zens":37016,"Ġdumps":37017,"Ġdepress":37018,"Ġlifeless":37019,"535":37020,"oard":37021,"Scotland":37022,"Ġbelievable":37023,"Ġcalculator":37024,"ĠNaked":37025,"Ġremission":37026,"Ġoranges":37027,"ĠSections":37028,"Ġentangled":37029,"Ġuncanny":37030,"Ġteaspoons":37031,"vr":37032,"ĠPorn":37033,"Organ":37034,"Ġbund":37035,"Doug":37036,"ĠGHz":37037,"Major":37038,"abus":37039,"Bell":37040,"avier":37041,"Ġimplanted":37042,"RON":37043,"Fle":37044,"462":37045,"509":37046,"Ġgoggles":37047,"Ġmanuscript":37048,"NOT":37049,"ĠCanaveral":37050,"ĠDID":37051,"Season":37052,"HAEL":37053,"Edge":37054,"appiness":37055,"DIS":37056,"Ġplotted":37057,"Ġwrought":37058,"Ġquarantine":37059,"Ġrearr":37060,"itage":37061,"Ġsocket":37062,"Ġbrig":37063,"Ġunbelievably":37064,"abytes":37065,"TG":37066,"Ġ444":37067,"ĠOffic":37068,"Ġacquaintances":37069,"ĠComparison":37070,"Nine":37071,"ĠFeast":37072,"758":37073,"YC":37074,"Ġfiner":37075,"ĠStrawberry":37076,"Ġeternity":37077,"liament":37078,"urrency":37079,"ĠCortana":37080,"ĠSabbath":37081,"Ġsprinkle":37082,"unker":37083,"ĠUE":37084,"flies":37085,"Ġblender":37086,"Ġacutely":37087,"emark":37088,"ĠAffect":37089,"Politics":37090,"Ġsane":37091,"Ġcorrosion":37092,"Ġspirituality":37093,"Ġredeemed":37094,"Ġingrained":37095,"manager":37096,"joined":37097,"ĠDumb":37098,"ĠHeight":37099,"Ġseventeen":37100,"Ġ640":37101,"Ġreviewer":37102,"Ġwallpaper":37103,"Ġnurs":37104,"Ġsubset":37105,"703":37106,"Ġsymbolism":37107,"Ġdudes":37108,"Ġmismatch":37109,"gans":37110,"please":37111,"ĠKE":37112,"Ġatom":37113,"004":37114,"ionic":37115,"Ġservings":37116,"Ġproxies":37117,"Ġtranscription":37118,"yx":37119,"bowl":37120,"iscovery":37121,"ĠScotch":37122,"brace":37123,"riter":37124,"ĠDesktop":37125,"Ġlimestone":37126,"æ":37127,"Neg":37128,"013":37129,"Ġformulas":37130,"Ġeval":37131,"Ġzombies":37132,"GU":37133,"ĠHermes":37134,"Ġbrist":37135,"Mand":37136,"Ġmastery":37137,"Ġgoverns":37138,"Ġconstrued":37139,"region":37140,"Ġemitted":37141,"Vice":37142,"060":37143,"Jennifer":37144,"mol":37145,"Ġjealousy":37146,"Ġingenuity":37147,"bug":37148,"olitical":37149,"Ġperce":37150,"ĠSapp":37151,"dim":37152,"utral":37153,"Ġinterrogated":37154,"Gate":37155,"Ġamber":37156,"911":37157,"ĠEveryday":37158,"ĠDDR":37159,"ĠBlades":37160,"Ġnifty":37161,"Ġmurderers":37162,"Ġpresumption":37163,"Pitt":37164,"Div":37165,"ĠDestination":37166,"having":37167,"Ġprolifer":37168,"Ġbreaker":37169,"ĠBW":37170,"Ġcourier":37171,"Try":37172,"ĠBUR":37173,"itized":37174,"Ġcompress":37175,"Ġrepetition":37176,"ĠTik":37177,"Ġdivergence":37178,"Ġcube":37179,"everyone":37180,"ĠPoles":37181,"418":37182,"ĠHighly":37183,"468":37184,"Jeremy":37185,"Ġcontradictions":37186,"Ġmanure":37187,"Sad":37188,"pletion":37189,"626":37190,"Ġ279":37191,"Ġfrivolous":37192,"ĠCanaan":37193,"olor":37194,"Ġincapac":37195,"ĠGentle":37196,"Ġinsomnia":37197,"ĠJing":37198,"688":37199,"ĠViews":37200,"Ġsyll":37201,"486":37202,"antom":37203,"Ġcog":37204,"aintain":37205,"ĠDVDs":37206,"Ġ318":37207,"archy":37208,"Ġreprodu":37209,"Ġconcedes":37210,"Brook":37211,"Ġinterpreting":37212,"Ġextracting":37213,"Ġess":37214,"uning":37215,"ĠMathematics":37216,"iably":37217,"Ġmultit":37218,"ĠActs":37219,"iliated":37220,"Foreign":37221,"Ġflaming":37222,"ĠCoup":37223,"Ġglitches":37224,"Ġdifferentiation":37225,"ihadi":37226,"ĠDrone":37227,"Ġincompatible":37228,"asher":37229,"documented":37230,"agons":37231,"wark":37232,"Ġshielding":37233,"ĠCorrect":37234,"romising":37235,"uned":37236,"Ġconduit":37237,"ĠDiablo":37238,"Ġbeginner":37239,"Ġarchived":37240,"smanship":37241,"ĠTBD":37242,"digy":37243,"Ġ322":37244,"Ġ268":37245,"ĠTears":37246,"ĠPriority":37247,"Italy":37248,"Ġ^":37249,"annot":37250,"different":37251,"Joy":37252,"Ġbreathed":37253,"heon":37254,"Ġracists":37255,"Ġvascular":37256,"Between":37257,"etition":37258,"ĠLikely":37259,"icans":37260,"529":37261,"ĠMonsters":37262,"agy":37263,"Orange":37264,"hide":37265,"SIM":37266,"Ġdeceive":37267,"ĠDAR":37268,"Ġshattering":37269,"Ġow":37270,"peak":37271,"Ġpreferable":37272,"Ġpiping":37273,"ĠLEDs":37274,"ĠCOMMUN":37275,"ĠConstruct":37276,"008":37277,"Ġdissatisfied":37278,"ĠKNOW":37279,"ĠFrame":37280,"ĠToast":37281,"Ġadore":37282,"history":37283,"Soviet":37284,"reporting":37285,"Ġ266":37286,"pract":37287,"ĠSauce":37288,"686":37289,"ievers":37290,"ĠDomain":37291,"ousand":37292,"768":37293,"Cos":37294,"609":37295,"432":37296,"Ġtransl":37297,"oof":37298,"Ġ292":37299,"Turkish":37300,"ĠPOLIT":37301,"Harris":37302,"bj":37303,"Ġrodents":37304,"556":37305,"Ġintellectuals":37306,"Ġinteroper":37307,"ixt":37308,"Ġunbiased":37309,"itia":37310,"Ġ504":37311,"Ġbuttocks":37312,"ĠFlam":37313,"Ġchrom":37314,"Ġ259":37315,"shock":37316,"ĠRJ":37317,"ĠLich":37318,"422":37319,"Ġcondom":37320,"phen":37321,"Ġvigilante":37322,"Ġowl":37323,"Ġdwellings":37324,"Ġarchaeologists":37325,"Ġ680":37326,"RAY":37327,"Ġ1921":37328,"Ġ625":37329,"ĠPLAN":37330,"alde":37331,"030":37332,"abbling":37333,"Wave":37334,"Ni":37335,"Ġfurthe":37336,"JS":37337,"Ġpsycho":37338,"ĠFrançois":37339,"Ġundergrad":37340,"Ġsuccessors":37341,"Ġpadded":37342,"introdu":37343,"Ġreasoned":37344,"Ġvas":37345,"creen":37346,"onsequ":37347,"starter":37348,"Court":37349,"ĠHIS":37350,"Ġplaster":37351,"Ġranger":37352,"Ġ298":37353,"esters":37354,"Ġglare":37355,"ype":37356,"Ġcompute":37357,"Ali":37358,"mallow":37359,"Ġmasculine":37360,"ĠExamination":37361,"improve":37362,"Ġdeclass":37363,"Ġdecoration":37364,"ĠFIG":37365,"abre":37366,"Ġstale":37367,"abling":37368,"ĠRusty":37369,"ĠASAP":37370,"Ġadjusts":37371,"Ġbluff":37372,"density":37373,"Ġdisse":37374,"Ġcensor":37375,"ervatives":37376,"Ġkettle":37377,"Ġskeptics":37378,"fd":37379,"Imm":37380,"461":37381,"Ġadvantageous":37382,"419":37383,"ĠPresents":37384,"482":37385,"ĠRewards":37386,"Ġovershadow":37387,"Alabama":37388,"ĠCPC":37389,"Ġsock":37390,"ĠChurches":37391,"hidden":37392,"Ġcringe":37393,"ĠHOR":37394,"PB":37395,"Pretty":37396,"Hong":37397,"?),":37398,"687":37399,"Ġgrocer":37400,"472":37401,"565":37402,"itent":37403,"Ġpartake":37404,"wait":37405,"usters":37406,"Ġcones":37407,"Ġconcurrently":37408,"Ġlevers":37409,"Ġaroma":37410,"ĠDrill":37411,"498":37412,"804":37413,"ithering":37414,"Ġ355":37415,"Ġlegion":37416,"Ġvitri":37417,"Ġcondu":37418,"Angel":37419,"OWER":37420,"Ġ{*":37421,"Simon":37422,"Ġsynthesis":37423,"ĠContainer":37424,"sheet":37425,"Bi":37426,"ĠRaspberry":37427,"Ġ328":37428,"anders":37429,"ĠBlossom":37430,"ĠFINAL":37431,"acid":37432,"Ġborderline":37433,"Aut":37434,"Ġoriginate":37435,"Ġtransm":37436,"Ġbuffalo":37437,"atial":37438,"ĠCraigslist":37439,"Ġcredential":37440,"Ġdisbanded":37441,"Ġunprotected":37442,"ĠZer":37443,"waukee":37444,"diagn":37445,"1999":37446,"doc":37447,"ellig":37448,"Ġwarheads":37449,"ĠADS":37450,"verified":37451,"ĠHAM":37452,"785":37453,"Cu":37454,"Ġenorm":37455,"ĠSkill":37456,"\\":37457,"Ġbashing":37458,"Ġloudspe":37459,"during":37460,"Ġdebunked":37461,"adequ":37462,"Ġuh":37463,"Feed":37464,"ificial":37465,"pred":37466,"ĠPassing":37467,"Kyle":37468,"enance":37469,"ĠMex":37470,"itect":37471,"Ġcavern":37472,"Ġtrop":37473,"ĠEliot":37474,"753":37475,"Ġencountering":37476,"Ġsulf":37477,"Always":37478,"ĠGest":37479,"Ġadditive":37480,"Ġ278":37481,"Ġloops":37482,"liberal":37483,"urion":37484,"ĠRefresh":37485,"ĠDynasty":37486,"Ġsweaty":37487,"Ġsails":37488,"protection":37489,"ĠRooms":37490,"ĠEXT":37491,"few":37492,"ĠPaid":37493,"Ġ377":37494,"Ġcolonialism":37495,"Ġchuckle":37496,"Ġarmour":37497,"Ġsoftly":37498,"661":37499,"Building":37500,"ĠAMER":37501,"Ġbabe":37502,"Ġshif":37503,"Sem":37504,"Ġdisembark":37505,"ĠSubstance":37506,"Stone":37507,"Ġdialect":37508,"ĠAph":37509,"Ġspreadsheet":37510,"ierra":37511,"Ġlineage":37512,"ĠCust":37513,"ĠBabe":37514,"Ġwra":37515,"ĠMafia":37516,"Ġflakes":37517,"ĠEVER":37518,"cong":37519,"ĠCreation":37520,"loo":37521,"ĠAmpl":37522,"ĠSpectre":37523,"012":37524,"geons":37525,"Ġswarm":37526,"ĠPale":37527,"ĠSeek":37528,"itures":37529,"Ġarri":37530,"Ġredistribution":37531,"campaign":37532,"ĠAbility":37533,"579":37534,"ournament":37535,"locks":37536,"Ġnests":37537,"ĠConstantine":37538,"Ġwhisper":37539,"Ġshrouded":37540,"changed":37541,"ĠEnhanced":37542,"Ġ920":37543,"Ġglob":37544,"Tam":37545,"Ġoutwe":37546,"Ġilliter":37547,"Ġsurg":37548,"Nap":37549,"ĠAerial":37550,"iferation":37551,"Egypt":37552,"ERO":37553,"Ġantip":37554,"environment":37555,"machine":37556,"Ġrupture":37557,"treatment":37558,"internal":37559,"Ġinfiltrate":37560,"Ġgratification":37561,"Uber":37562,"Ġunequal":37563,"Ġflav":37564,"Lord":37565,"tein":37566,"ĠLOT":37567,"Ġbullshit":37568,"Ġoriginals":37569,"Ġminced":37570,"Ġmultiply":37571,"ayson":37572,"Ġrecomm":37573,"Ġreceptors":37574,"Ġflashlight":37575,"Ġinhuman":37576,"Future":37577,"Ġpuzzling":37578,"Ġrouters":37579,"Ġuncontroll":37580,"responsible":37581,"Ġcellul":37582,"ĠTablet":37583,"Ġbolted":37584,"Ġpermissible":37585,"adra":37586,"picture":37587,"ODY":37588,"BRE":37589,"Iraq":37590,"Total":37591,"rising":37592,"Ġ273":37593,"nv":37594,"Ġ327":37595,"alysed":37596,"infect":37597,"Ġ1912":37598,"ĠVT":37599,"ĠLazarus":37600,"ictive":37601,"Bu":37602,"ĠNEVER":37603,"ĠCODE":37604,"ĠModified":37605,"fetched":37606,"ĠTrap":37607,"mob":37608,"Ġupkeep":37609,"WARD":37610,"Ġbrewed":37611,"Ġsaliva":37612,"Ġ1923":37613,"Ġsteroid":37614,"rather":37615,"ĠVER":37616,"Ġcontextual":37617,"Ont":37618,"ĠLSD":37619,"agine":37620,"Ġaudible":37621,"ĠMeta":37622,"erek":37623,"aults":37624,"ĠOttoman":37625,"ĠIncludes":37626,"Ġocc":37627,"678":37628,"ipple":37629,"Ġcontrasted":37630,"014":37631,"ĠLenin":37632,"Ġomega":37633,"885":37634,"civil":37635,"Ġoverload":37636,"},\"":37637,"Ġprogrammers":37638,"Ġgeometry":37639,"?).":37640,"shift":37641,"ĠClancy":37642,"nr":37643,"verb":37644,"Ġ760":37645,"Ġstaggered":37646,"Playing":37647,"ĠSmile":37648,"Ġcomplains":37649,"ĠSloven":37650,"Ġdisobedience":37651,"creator":37652,"Ġly":37653,"incoln":37654,"emp":37655,"Ġcrate":37656,"ĠPledge":37657,"ĠGPUs":37658,"protected":37659,"Vo":37660,"medium":37661,"Ġacet":37662,"603":37663,"478":37664,"469":37665,"Further":37666,"Ġsensed":37667,"Lock":37668,"Ġcrabs":37669,"ĠChains":37670,"ĠNEO":37671,"Ġexperimented":37672,"ĠRhythm":37673,"802":37674,"Ġhormonal":37675,"491":37676,"ĠMedian":37677,"Ġevaluates":37678,"ippi":37679,"Ġremovable":37680,"Ġvector":37681,"ilant":37682,"TERN":37683,"Ġpurch":37684,"ĠBind":37685,"athering":37686,"Ġcords":37687,"Lib":37688,"Ġdamned":37689,"orc":37690,"ĠEverywhere":37691,"Ġgorilla":37692,"ystem":37693,"fail":37694,"Ġecstasy":37695,"allion":37696,"Sea":37697,"Ġuploading":37698,"ĠSpecific":37699,"Ġreinforcement":37700,"cerned":37701,"ĠDollars":37702,"Twenty":37703,"OX":37704,"ADD":37705,"Ġbraces":37706,"Ġraven":37707,"Ġ1890":37708,"Ġcirculate":37709,"udden":37710,"Disney":37711,"ĠNope":37712,"ĠBagg":37713,"ĠBuddha":37714,"rael":37715,"urus":37716,"ĠKarma":37717,"Ġcurl":37718,"Ġflips":37719,"Ġbearer":37720,"Ġmisunderstand":37721,"Ġabras":37722,"ĠAssassin":37723,"Fact":37724,"Ġinterf":37725,"Ġvantage":37726,"ĠGenocide":37727,"Ġdeducted":37728,"Sep":37729,"McC":37730,"Jessica":37731,"ĠBackup":37732,"Ian":37733,"urnal":37734,"Ġlaborers":37735,"438":37736,"ĠContinuous":37737,"ĠNBN":37738,"Cool":37739,"mitting":37740,"ĠNormandy":37741,"Ġpurchaser":37742,"Ġacquainted":37743,"Ġblogging":37744,"route":37745,"marine":37746,"Ġstartled":37747,"6000":37748,"ĠRadical":37749,"kiss":37750,"ĠBlitz":37751,"express":37752,"Ġ601":37753,"hent":37754,"Ġtink":37755,"pires":37756,"launch":37757,"sg":37758,"ĠEffects":37759,"Ġstiffness":37760,"ĠAllies":37761,"Ġthirsty":37762,"Ġmyst":37763,"Ġlogger":37764,"Ġstances":37765,"ĠEvaluation":37766,"090":37767,"Ġproclaiming":37768,"Ġhypocritical":37769,"496":37770,"Ġcaus":37771,"ĠKappa":37772,"ĠLann":37773,"ĠScientist":37774,"Ġempath":37775,"etrical":37776,"lege":37777,"Hom":37778,"Aud":37779,"ĠColors":37780,"ĠStraw":37781,"each":37782,"ĠPatron":37783,"Ġnuance":37784,"send":37785,"ourney":37786,"ĠPhen":37787,"Ġamino":37788,"ĠSeconds":37789,"Sn":37790,"ĠCiv":37791,"Ġconglomer":37792,"Ġ411":37793,"versely":37794,"487":37795,"prises":37796,"Ġ277":37797,"necessary":37798,"Ġdope":37799,"Late":37800,"Ġrake":37801,"ĠBrigham":37802,"ogun":37803,"ĠSTATES":37804,"ĠGaal":37805,"Ġintellig":37806,"Ġglacier":37807,"destruct":37808,"ĠZucker":37809,"484":37810,"Ġ332":37811,"ĠArist":37812,"Ġprotagonists":37813,"Ġgraveyard":37814,"names":37815,"ĠPax":37816,"Ġthresholds":37817,"Seeing":37818,"Ġmunitions":37819,"Ġcontradicts":37820,"684":37821,"Ġ529":37822,"ĠConcent":37823,"ĠBlessed":37824,"Hz":37825,"Ġinhibit":37826,"Ġshenanigans":37827,"ĠSpear":37828,"Ġoverlay":37829,"ritis":37830,"ilus":37831,"Ġvariance":37832,"Ġoverpower":37833,"viol":37834,"erning":37835,"Ġpolarization":37836,"aito":37837,"GV":37838,"493":37839,"Keeping":37840,"Ġpaternity":37841,"ĠHappiness":37842,"oops":37843,"sb":37844,"xit":37845,"ophysical":37846,"Ġconclusive":37847,"Arch":37848,"Ġmiser":37849,"Ġsuffice":37850,"ĠStout":37851,"Ġhrs":37852,"643":37853,"Ġprincipled":37854,"azine":37855,"atorium":37856,"ĠFairy":37857,"Ġinfiltrated":37858,"ĠHier":37859,"ĠMIA":37860,"inders":37861,"Ġrebutt":37862,"Ġxx":37863,"Ġfeats":37864,"izzle":37865,"Ġ780":37866,"668":37867,"Ġrepressive":37868,"ĠYugoslavia":37869,"sole":37870,"704":37871,"ĠRPG":37872,"ĠTroll":37873,"packing":37874,"ĠDatabase":37875,"ĠVelvet":37876,"ĠRELEASE":37877,"ablish":37878,"smoking":37879,"ĠBottle":37880,"ĠFully":37881,"ĠLean":37882,"Ġobjectively":37883,"ĠFounding":37884,"ĠClassics":37885,"Ġmosaic":37886,"473":37887,"Ġrooft":37888,"Ġcentrally":37889,"Ġdismissive":37890,"Ġparasites":37891,"009":37892,"Ġcursed":37893,"Ġvex":37894,"Ġeconom":37895,"ĠBore":37896,"enery":37897,"ĠFundamental":37898,"ĠOmni":37899,"489":37900,"714":37901,"Ġforegoing":37902,"Ġfragment":37903,"oros":37904,"070":37905,"ĠFaust":37906,"Ġsucking":37907,"Ġnode":37908,"Ġrighteous":37909,"ĠPowered":37910,"426":37911,"HQ":37912,"Ġchronically":37913,"ĠBAL":37914,"Ġprest":37915,"Ġrapists":37916,"ĠRelationship":37917,"ĠCHR":37918,"Ġlinen":37919,"Ġnumerical":37920,"oters":37921,"Ġiterations":37922,"ttes":37923,"ĠENTER":37924,"Ġrabbi":37925,"Ġhoard":37926,"Ġmerciless":37927,"Ġrobes":37928,"ĠSpray":37929,"Ġadvers":37930,"ilantro":37931,"483":37932,"Ġfungus":37933,"Ġalcoholism":37934,"anasia":37935,"ĠCruiser":37936,"Ġmorals":37937,"cision":37938,"measures":37939,"Ġsabot":37940,"Ġrecol":37941,"ĠSaur":37942,"ĠError":37943,"Ġmysteriously":37944,"sle":37945,"Ġfeminists":37946,"д":37947,"ackle":37948,"ĠMarxist":37949,"Ġselves":37950,"Ġdoorway":37951,"Ġdiscard":37952,"Ġbandits":37953,"ĠDive":37954,"ameless":37955,"TRY":37956,"Ġgull":37957,"Ġrepublican":37958,"sr":37959,"ĠDynamo":37960,"Ġembryo":37961,"MENTS":37962,"ĠLOW":37963,"Ġ319":37964,"Ġgly":37965,"Ġcowork":37966,"Coll":37967,"Ġcris":37968,"ĠBanana":37969,"reality":37970,"Ġmobilization":37971,"unal":37972,"Updated":37973,"Crew":37974,"ĠGideon":37975,"Ġvines":37976,"Ġknitting":37977,"Ġdag":37978,"ĠSurv":37979,"Ġvacc":37980,"Ġimpulses":37981,"Northern":37982,"Ġnanop":37983,"allows":37984,"UTH":37985,"Ġflashbacks":37986,"alsa":37987,"Ġ282":37988,"Ġtransmissions":37989,"ĠAlmighty":37990,"Office":37991,"ĠBride":37992,"ĠBeasts":37993,"othy":37994,"ĠClouds":37995,"ĠDyn":37996,"ĠJolly":37997,"District":37998,"Ġveget":37999,"Ġantit":38000,"ĠSmoking":38001,"hess":38002,"Ġcompose":38003,"Ġreligiously":38004,"ĠHY":38005,"Ġfluorescent":38006,"rame":38007,"ĠMeier":38008,"ĠSQ":38009,"benefit":38010,"Thirty":38011,"559":38012,"ĠCance":38013,"586":38014,"Ġgrouped":38015,"Ġphys":38016,"Ġrebellious":38017,"ĠBASE":38018,"chid":38019,"582":38020,"ĠLessons":38021,"ĠWonderful":38022,"ODE":38023,"uctions":38024,"Ġbarbaric":38025,"rahim":38026,"635":38027,"Ġcloves":38028,"ĠNIH":38029,"ossession":38030,"Employ":38031,"Ġliberate":38032,"Gro":38033,"Ġmagician":38034,"ountain":38035,"FORM":38036,"533":38037,"Ġunpredict":38038,"rity":38039,"Ġfaked":38040,"plets":38041,"ppelin":38042,"Living":38043,"Ġnearer":38044,"Ġsuperiors":38045,"Ur":38046,"Ġheroism":38047,"Ġbearded":38048,"006":38049,"Cole":38050,"1970":38051,"Ġsill":38052,"ĠReduce":38053,"OLOG":38054,"onel":38055,"Billy":38056,"ĠPainter":38057,"ansas":38058,"Ġintermediary":38059,"trump":38060,"ĠMith":38061,"otom":38062,"434":38063,"Ġterrit":38064,"Wa":38065,"Ġsuprem":38066,"Rh":38067,"liction":38068,"ĠDEAD":38069,"Ġbothers":38070,"503":38071,"Ġfrogs":38072,"Ġsprinkled":38073,"Ġnil":38074,"628":38075,"Private":38076,"ĠKGB":38077,"Ġoverriding":38078,"Ġdeceived":38079,"698":38080,"idium":38081,"Ġseeker":38082,"Final":38083,"Ġsubconscious":38084,"Ġwom":38085,"Ġcass":38086,"Ġchicks":38087,"Ġverifying":38088,"ective":38089,"inia":38090,"ĠDetection":38091,"MH":38092,"fortable":38093,"ĠISPs":38094,"Ġcrumble":38095,"ĠRecap":38096,"598":38097,"ummies":38098,"export":38099,"Irish":38100,"Ġlil":38101,"ĠRapt":38102,"ĠRIGHT":38103,"Ġanecdotal":38104,"Ġpiercing":38105,"deck":38106,"Liber":38107,"Books":38108,"Ġassassin":38109,"Tur":38110,"revolution":38111,"ĠSheep":38112,"ĠPublishers":38113,"EMS":38114,"iosis":38115,"finder":38116,"ĠCuriosity":38117,"ARB":38118,"ĠConvers":38119,"IVES":38120,"clave":38121,"ĠChaos":38122,"ĠMim":38123,"ĠCostume":38124,"Ġtwe":38125,"Ġintim":38126,"757":38127,"berto":38128,"Ġ261":38129,"VPN":38130,"cribed":38131,"ĠVerb":38132,"cb":38133,"Ġaxle":38134,"Ġsandwic":38135,"Ice":38136,"ĠThermal":38137,"654":38138,"709":38139,"ĠPact":38140,"ĠEnsure":38141,"izable":38142,"497":38143,"Ġbloodstream":38144,"Aw":38145,"Ġleakage":38146,"Ġalleg":38147,"ĠMelody":38148,"681":38149,"Austin":38150,"428":38151,"Ġsummarized":38152,"ĠDefendants":38153,"ĠVader":38154,"Ê":38155,"Ġ1880":38156,"Ġassemb":38157,"YOU":38158,"GREEN":38159,"jury":38160,"4000":38161,"Ġvenerable":38162,"Ġcomputational":38163,"Ġperpetuate":38164,"Ġtorpedo":38165,"Ġaborted":38166,"Ġrhetorical":38167,"ĠOvert":38168,"Ġacknowledgment":38169,"essment":38170,"ĠIGN":38171,"ĠSheen":38172,"571":38173,"Ġcontag":38174,"Ġcultiv":38175,"Ġspawn":38176,"mess":38177,"Dur":38178,"Ġvortex":38179,"ixties":38180,"ĠBlow":38181,"Sum":38182,"Åį":38183,"Rom":38184,"ĠRadeon":38185,"Fed":38186,"Ġameric":38187,"ĠAnth":38188,"Ġantic":38189,"Ġfortress":38190,"Cold":38191,"ĠPredict":38192,"Fake":38193,"Ġilluminate":38194,"Find":38195,"Ġintellectually":38196,"Ġgon":38197,"alker":38198,"Ġinvoice":38199,"IELD":38200,"Ġfools":38201,"ĠEnding":38202,"-(":38203,"Ġalk":38204,"ĠControlled":38205,"Ġpurposefully":38206,"ĠChronic":38207,"Ġrele":38208,"ĠOps":38209,"Party":38210,"ethnic":38211,"ĠSpecifications":38212,"ffee":38213,"ĠTeach":38214,"ulas":38215,"Ġenslaved":38216,"onomy":38217,"Ġtenets":38218,"Ġammonia":38219,"Ġ1913":38220,"Ġdripping":38221,"612":38222,"659":38223,"ĠSagan":38224,"Ġinaccur":38225,"Ġabol":38226,"ĠLIKE":38227,"Ġvisualization":38228,"learn":38229,"anon":38230,"cipline":38231,"Ġadaptations":38232,"Ġwaiter":38233,"nergy":38234,"507":38235,"ĠDK":38236,"YD":38237,"Ġpedest":38238,"Sense":38239,"ĠObst":38240,"Ġresurrection":38241,"ĠSPECIAL":38242,"Unlike":38243,"Ġlia":38244,"Ġpersuasive":38245,"iatrics":38246,"ONEY":38247,"esthetic":38248,"494":38249,"zik":38250,"Ġfract":38251,"ĠOutput":38252,"ĠBers":38253,"rozen":38254,"ĠRevis":38255,"Ġdraconian":38256,"Words":38257,"asions":38258,"ĠClintons":38259,"CU":38260,"History":38261,"Ġtwilight":38262,"iform":38263,"Ġdispl":38264,"progress":38265,"ĠIO":38266,"Ġcannibal":38267,"Michelle":38268,"Ġnerv":38269,"Ġcontexts":38270,"ĠHorses":38271,"Ġanatomy":38272,"ĠLegislation":38273,"ĠBloody":38274,"Ġunwittingly":38275,"Ġinquired":38276,"ĠZip":38277,"ĠDesigns":38278,"Ġirritating":38279,"Ġunison":38280,"ĠRG":38281,"aviour":38282,"Ġpseudo":38283,"ĠVenom":38284,"Ġobscured":38285,"Ġner":38286,"uked":38287,"ORGE":38288,"Ġmomentarily":38289,"olyn":38290,"Syrian":38291,"Ġmicroscopic":38292,"Ġmistress":38293,"Less":38294,"Ġawoke":38295,"Ġtutor":38296,"esome":38297,"ollar":38298,"egg":38299,"UTE":38300,"Buzz":38301,"Ġattainment":38302,"Ġdiscriminating":38303,"::":38304,"Ġ525":38305,"azard":38306,"ĠBrist":38307,"oras":38308,"Ġveterin":38309,"jing":38310,"idon":38311,"ĠAustral":38312,"arious":38313,"ĠGrav":38314,"anol":38315,"ĠQuran":38316,"Ġbleach":38317,"588":38318,"ĠOsw":38319,"Ġdiffered":38320,"typ":38321,"ĠSIL":38322,"failed":38323,"436":38324,"Ġpalms":38325,"ĠFail":38326,"idespread":38327,"Ġchap":38328,"ĠIMAGES":38329,"ACP":38330,"matched":38331,"Ġjaws":38332,"MHz":38333,"Nik":38334,"ĠHume":38335,"OSH":38336,"Ġpresume":38337,"secut":38338,"ĠDied":38339,"ĠBreat":38340,"gins":38341,"prison":38342,"ĠUR":38343,"ĠROS":38344,"isitions":38345,"Ġpelvic":38346,"exclusive":38347,"522":38348,"689":38349,"FN":38350,"Ġener":38351,"Ġdispers":38352,"Ġcohorts":38353,"shut":38354,"ĠLoad":38355,"needs":38356,"azaki":38357,"inoa":38358,"Inside":38359,"usra":38360,"ighters":38361,"Ġ271":38362,"Ġsubordinate":38363,"ĠHOL":38364,"ĠGlow":38365,"Ġincred":38366,"ĠMadame":38367,"Ġoats":38368,"Ġdeviation":38369,"ĠApproach":38370,"Ġnarc":38371,"bart":38372,"bole":38373,"ĠSHE":38374,"effects":38375,"ĠADA":38376,"Ġmuse":38377,"Squ":38378,"Ġneuroscience":38379,"ĠValues":38380,"engu":38381,"Ġdosage":38382,"Ġwhispers":38383,"Ġnaughty":38384,"ĠFarming":38385,"Recently":38386,"Ġrelapse":38387,"rentice":38388,"UGH":38389,"Ġdarkened":38390,"appings":38391,"ĠSlaughter":38392,"ĠAnim":38393,"Ġovertly":38394,"poses":38395,"Ġdeficient":38396,"Ġnecks":38397,"Iron":38398,"Ġphysiological":38399,"ĠLiang":38400,"Ġlear":38401,"Ġcelestial":38402,"Ġpistols":38403,"Ġeyebrow":38404,"915":38405,"ratch":38406,"cephal":38407,"ĠPSU":38408,"Ġphotograp":38409,"ĠGaul":38410,"Ġuncontrolled":38411,"ĠJoined":38412,"652":38413,"itory":38414,"Ġ274":38415,"GAN":38416,"imester":38417,"essional":38418,"Ø©":38419,"Ġuncons":38420,"THER":38421,"Ġpaternal":38422,"Zero":38423,"ugen":38424,"538":38425,"Ġende":38426,"Ġ505":38427,"movie":38428,"Lind":38429,"Ġscorn":38430,"ulty":38431,"Ġpesky":38432,"Ġ8000":38433,"677":38434,"Ġhomophobia":38435,"ranch":38436,"Ġnarciss":38437,"ĠVoyager":38438,"ĠHELP":38439,"528":38440,"edly":38441,"Ġdetract":38442,"Hope":38443,"787":38444,"ĠMerlin":38445,"Ġgrids":38446,"KI":38447,"Mu":38448,"ĠSelected":38449,"select":38450,"ĠModer":38451,"ĠFeet":38452,"Ġrename":38453,"intensity":38454,"Wilson":38455,"Ġ414":38456,"leave":38457,"Ready":38458,"intuitive":38459,"Ġmeager":38460,"Franc":38461,"DH":38462,"Ġrhy":38463,"ĠPillar":38464,"ĠDOE":38465,"minist":38466,"ĠGrave":38467,"isible":38468,"Ess":38469,"Ġempt":38470,"Ġpatched":38471,"ĠAbortion":38472,"rals":38473,"Ġdow":38474,"Ġcrawled":38475,"igrate":38476,"Virginia":38477,"Ġconting":38478,"Ġorphans":38479,"ĠCrimean":38480,"Ġdyn":38481,"Ġshadowy":38482,"sound":38483,"ailable":38484,"Ġ293":38485,"vm":38486,"Ġaccompanies":38487,"Meanwhile":38488,"JR":38489,"ĠDirections":38490,"Ġadolescence":38491,"Ġpenetrated":38492,"bars":38493,"Rev":38494,"Ta":38495,"ĠSkywalker":38496,"ĠFires":38497,"concept":38498,"ĠSIG":38499,"554":38500,"currently":38501,"Ġ----------------":38502,"ĠWHITE":38503,"767":38504,"rors":38505,"PDF":38506,"Ġcasing":38507,"673":38508,"Ġdisapprove":38509,"1800":38510,"ĠWeed":38511,"Ġinhib":38512,"Ġmorbid":38513,"433":38514,"Ġawfully":38515,"Ts":38516,"Maria":38517,"Ġillusions":38518,"Ġtotalitarian":38519,"ollo":38520,"Ġsuppl":38521,"Ġsarc":38522,"ĠRGB":38523,"Ġlauncher":38524,"Ġbadass":38525,"ĠSyd":38526,"Ġscrape":38527,"ĠCLA":38528,"Ġcircum":38529,"657":38530,"Ġnucleus":38531,"ĠUkip":38532,"Ġmodem":38533,"ĠJou":38534,"adders":38535,"Ġwiser":38536,"thereal":38537,"Ġdemocr":38538,"ĠInvalid":38539,"Mine":38540,"Ġmanifested":38541,"meat":38542,"MORE":38543,"Larry":38544,"acements":38545,"Ġspecimen":38546,"results":38547,"Ġswallowing":38548,"Ġpigeon":38549,"tons":38550,"ĠLose":38551,"Ġquartz":38552,"Ġintraven":38553,"Ġ412":38554,"alyst":38555,"Ġengraved":38556,"client":38557,"ĠADV":38558,"ĠShared":38559,"Ġrites":38560,"Ġhysterical":38561,"ĠHUM":38562,"Cow":38563,"orously":38564,"Ġpleasures":38565,"democratic":38566,"Ġamph":38567,"Ġnib":38568,"rieg":38569,"Ġcalculates":38570,"Ġfrying":38571,"favorite":38572,"Ġantim":38573,"ĠDoom":38574,"monitor":38575,"Want":38576,"Ġtemplates":38577,"558":38578,"iever":38579,"Photos":38580,",,":38581,"ĠSync":38582,"Ġconfronts":38583,"kept":38584,"dt":38585,"ĠERROR":38586,"ETF":38587,"578":38588,"Ġspor":38589,"718":38590,"ivation":38591,"ĠHaskell":38592,"Ca":38593,"Ġdick":38594,"Ġcivilized":38595,"Ġblah":38596,"enough":38597,"Ġoccup":38598,"Ġ334":38599,"antically":38600,"584":38601,"ĠDolphin":38602,"ĠStarts":38603,"Ġfanatic":38604,"ت":38605,"imag":38606,"Ġmicrobial":38607,"freedom":38608,"cult":38609,"wra":38610,"Ġ423":38611,"RIPT":38612,"601":38613,"BTC":38614,"atmeal":38615,"653":38616,"agogue":38617,"Ġderives":38618,"Wolf":38619,"466":38620,"Susan":38621,"ĠPassage":38622,"ARDS":38623,"Guy":38624,"Council":38625,"Ġerotic":38626,"pure":38627,"ĠMemories":38628,"ĠWikileaks":38629,"elines":38630,"Ġanth":38631,"Capital":38632,"807":38633,"ĠEggs":38634,"cv":38635,"ctors":38636,"Ġshatter":38637,"Ġesteem":38638,"vity":38639,"ĠVulcan":38640,"effic":38641,"ĠBELOW":38642,"Ġplatoon":38643,"Commun":38644,"oustic":38645,"Amy":38646,"Freedom":38647,"ppo":38648,"Ja":38649,"ĠConan":38650,"Ġinsepar":38651,"scene":38652,"Ġurinary":38653,"gain":38654,"Hillary":38655,"ĠTAM":38656,"Hist":38657,"Ġmechan":38658,"ĠRobots":38659,"Leader":38660,"Ġcartridges":38661,"Ġwhistleblowers":38662,"ĠSPL":38663,"Labour":38664,"unction":38665,"Ġfaithfully":38666,"Ġcoarse":38667,"Ġsynth":38668,"ĠLV":38669,"Ġjustifying":38670,"439":38671,"Victoria":38672,"ĠProceedings":38673,"alogy":38674,"Ġmorph":38675,"Ġcove":38676,"Ġlaughable":38677,"ECA":38678,"Ġ670":38679,"aturated":38680,"ĠSouls":38681,"ĠSleeping":38682,"Ly":38683,"ĠRetro":38684,"Ġastroph":38685,"Ġseism":38686,"atherine":38687,"ĠHercules":38688,"Ġfuse":38689,"ĠHL":38690,"Ġunintentionally":38691,"ĠRé":38692,"iery":38693,"Ġconco":38694,"Ġeras":38695,"recent":38696,"Ġlaunchers":38697,"ĠVolcano":38698,"ĠJace":38699,"Ġterminating":38700,"ĠIde":38701,"zee":38702,"asonic":38703,"itone":38704,"Ġnutshell":38705,"Ġbip":38706,"dies":38707,"Ġ286":38708,"Ġnood":38709,"ĠFathers":38710,"alys":38711,"Ġtheor":38712,"???":38713,"548":38714,"674":38715,"efined":38716,"806":38717,"âĻ":38718,"697":38719,"Ġdecap":38720,"ĠFN":38721,"Ġbureaucr":38722,"ĠGoat":38723,"ĠShang":38724,"Ġsemin":38725,"Ġthroats":38726,"Ġmoth":38727,"herer":38728,"Democratic":38729,"ixtures":38730,"impl":38731,"ĠLogo":38732,"ortunate":38733,"Ġclumsy":38734,"Ġinnocuous":38735,"ĠBlend":38736,"abulary":38737,"ĠFaces":38738,"Ġpornographic":38739,"px":38740,"Information":38741,"Ġfluoride":38742,"Ġatroc":38743,"Ġdelta":38744,"whatever":38745,"ossier":38746,"ĠNoir":38747,"ĠYao":38748,"551":38749,"undred":38750,"Ġmillennium":38751,"Ġferal":38752,"Ġconvinc":38753,"cano":38754,"imsy":38755,"angles":38756,"Ġsterile":38757,"ĠMenu":38758,"779":38759,"ĠCrack":38760,"Ġabundantly":38761,"ĠmL":38762,"Ġinfiltration":38763,"ĠDefinition":38764,"733":38765,"oubt":38766,"Ġorbital":38767,"Ġpiss":38768,"Ġbeet":38769,"679":38770,"Ġcounteract":38771,"ĠALE":38772,"ulative":38773,"crew":38774,"Ġliberating":38775,"ĠDull":38776,"Speaking":38777,"Sadly":38778,"Ġmisfortune":38779,"Ġdolphin":38780,"557":38781,"Ġbould":38782,"ĠTorah":38783,"ĠConfederacy":38784,"421":38785,"Ġorbits":38786,"ocused":38787,"beer":38788,"Rand":38789,"ĠORIG":38790,"Ġmuc":38791,"LER":38792,"ĠMisty":38793,"Ġinexpl":38794,"Ġreptiles":38795,"Ġaven":38796,"blocking":38797,"ĠPASS":38798,"Ġarisen":38799,"ĠMock":38800,"Ġops":38801,"Ġshin":38802,"524":38803,"Ġdigestion":38804,"Soft":38805,"irect":38806,"POL":38807,"ĠSpell":38808,"Level":38809,"Ġhex":38810,"Ġbitcoins":38811,"ĠHungry":38812,"VL":38813,"ĠRealm":38814,"RELATED":38815,"Delta":38816,"Pri":38817,"Ġrejoice":38818,"ĠLatter":38819,"LG":38820,"Ġstupidity":38821,"Ġdonkey":38822,"nova":38823,"Vill":38824,"Ġdecomp":38825,"Ġexternally":38826,"Ġsequest":38827,"815":38828,"Ġshortcut":38829,"riminal":38830,"Hun":38831,"EH":38832,"Ġregiment":38833,"Case":38834,"definition":38835,"Ġappendix":38836,"ĠPlayed":38837,"associated":38838,"izens":38839,"ĠVag":38840,"Ġflung":38841,"Ġfru":38842,"Ġcoil":38843,"________________________":38844,"Ġselects":38845,"Ġsolves":38846,"aea":38847,"985":38848,"Tomorrow":38849,"Ġsear":38850,"APE":38851,"492":38852,"Ġenlightened":38853,"Ġnonexistent":38854,"ĠPotato":38855,"Ghost":38856,"Ġrichness":38857,"ĠKarin":38858,"Ġfamilial":38859,"ĠJA":38860,"Regardless":38861,"Ġepis":38862,"GD":38863,"Ġinsanely":38864,"ĠPhill":38865,"Block":38866,"Finding":38867,"omal":38868,"Ġdecipher":38869,"ĠSwap":38870,"derived":38871,"ĠOFFIC":38872,"Support":38873,"Ġnylon":38874,"Ġexaggeration":38875,"Ġevangelicals":38876,"Ġbearings":38877,"587":38878,"Ġlocale":38879,"Ġpowerfully":38880,"Ġappropriated":38881,"itates":38882,"irlfriend":38883,"cule":38884,"ĠSomewhere":38885,"747":38886,"ĠInteresting":38887,"464":38888,"Ġelong":38889,"Ġdegrade":38890,"rafted":38891,"Ġtutorials":38892,"905":38893,"ĠIntervention":38894,"Ġuniqueness":38895,"Ġ284":38896,"Ġexplorers":38897,"Ġnucle":38898,"ĠMillenn":38899,"511":38900,"ĠReneg":38901,"Ġexecut":38902,"urai":38903,"leon":38904,"Ġdeserts":38905,"ĠCig":38906,"Ġsuggestive":38907,"instead":38908,"Ġlousy":38909,"Ġenigmatic":38910,"594":38911,"Know":38912,"rollment":38913,"ipher":38914,"Ġhumanities":38915,"Ġmodifying":38916,".....":38917,"Ġdegraded":38918,"Ġsuppressing":38919,"Ġeman":38920,"abouts":38921,"functional":38922,"ĠOU":38923,"ĠRelax":38924,"786":38925,"esses":38926,"ĠLogin":38927,"spec":38928,"ĠWWF":38929,"Ġ364":38930,"ĠIsis":38931,"Wisconsin":38932,"Ġequival":38933,"ĠCollector":38934,"ibilities":38935,"malink":38936,"acea":38937,"Ġchained":38938,"Ġarist":38939,"Ġdisadvantages":38940,"ĠBrus":38941,"limits":38942,"ĠDmit":38943,"544":38944,"ĠRecipe":38945,"Ġhabitual":38946,".):":38947,"ĠPRODUCT":38948,"772":38949,"Ġrept":38950,"Ġpathology":38951,"Ġresurrected":38952,"uders":38953,"Ġlingu":38954,"Ġdenomination":38955,"Ġfirewall":38956,"scient":38957,"Ġvaliant":38958,"Kansas":38959,"516":38960,"Ġcontemporaries":38961,"Roman":38962,"Ġaccompan":38963,"Ġantennas":38964,"ĠXan":38965,"Ġelectromagnetic":38966,"ĠNek":38967,"alien":38968,"indle":38969,"Ġgraphene":38970,"Ġgraceful":38971,"syn":38972,"ĠBosh":38973,"Ġ1908":38974,"Ġsuccumb":38975,"Technology":38976,"Ġtoxin":38977,"myra":38978,"essert":38979,"Hell":38980,"Gil":38981,"Ġdiarr":38982,"imeters":38983,"Ġexplo":38984,"Ġgeometric":38985,"ĠNavigation":38986,"cern":38987,"Ġprogrammer":38988,"oÄŁan":38989,"Ġdodging":38990,"ĠLU":38991,"573":38992,"inters":38993,"Ġserum":38994,"Ġuber":38995,"Ġmanga":38996,"762":38997,"ĠOccasionally":38998,"437":38999,"ĠTheme":39000,"Ġimmature":39001,"Ġactivating":39002,"ĠTruly":39003,"د":39004,"osion":39005,"Age":39006,"TIME":39007,"Silver":39008,"sand":39009,"ulnerable":39010,"Ġcram":39011,"Large":39012,"ĠAnger":39013,"icators":39014,"431":39015,"ĠHonest":39016,"zip":39017,"Ġdism":39018,"Ġfades":39019,"ĠPik":39020,"Ast":39021,"sequent":39022,"Ġunsigned":39023,"xious":39024,"creation":39025,"Ġ395":39026,"ottenham":39027,"Ġundesirable":39028,"ugal":39029,"ĠDivide":39030,"lp":39031,"563":39032,"ĠPOP":39033,"ĠCET":39034,"session":39035,"Ġoccurrences":39036,"chu":39037,"ĠACS":39038,"ĠProsecut":39039,"Ġhypnot":39040,"rely":39041,"ERG":39042,"Ven":39043,"Republicans":39044,"inez":39045,"ĠImplementation":39046,"Ġsprang":39047,"Ġobs":39048,"Defense":39049,"Ġunexpl":39050,"ĠPAGE":39051,"ĠTent":39052,"ĠNeurolog":39053,"Ġintuition":39054,"759":39055,"Ġterrestrial":39056,"Ġmorphine":39057,"Ġ.\"":39058,"ĠHydra":39059,"651":39060,"Ġneoliberal":39061,"683":39062,"Ġabnormalities":39063,"quant":39064,"Ġmonastery":39065,"jac":39066,"ĠReaction":39067,"Ġcontraceptive":39068,"ĠBalls":39069,"Ġapost":39070,"676":39071,"ĠHELL":39072,"approximately":39073,"Ġvibrations":39074,"COR":39075,"ĠCPUs":39076,"Ġcontin":39077,"Ġsemblance":39078,"Ġshorth":39079,"tip":39080,"ĠChips":39081,"makes":39082,"Ġprett":39083,"Ġconspicuous":39084,"ĠAmp":39085,"Ġvisualize":39086,"Hu":39087,"sorry":39088,"nai":39089,"ĠArcade":39090,"rimination":39091,"obin":39092,"Ġvampire":39093,"773":39094,"ĠCaucasus":39095,"Medic":39096,"ĠGitHub":39097,"ĠWicked":39098,"ĠFet":39099,"Krist":39100,"998":39101,"Ġfrontal":39102,"Ġ283":39103,"ndum":39104,"Ġidols":39105,"ĠMSG":39106,"ĠShuttle":39107,"ĠTowards":39108,"Ġsaturation":39109,"Ġ®":39110,"Ġcradle":39111,"eteen":39112,"Ġprejudices":39113,"separ":39114,"ĠSoda":39115,"ynam":39116,"Ġnause":39117,"Ġpenetrating":39118,"ĠVampire":39119,"Ġmole":39120,"Ġgoogle":39121,"earance":39122,"583":39123,"Ġdomin":39124,"727":39125,"Kind":39126,"Ġcust":39127,"manuel":39128,"ĠAstro":39129,"Roger":39130,"JO":39131,"killed":39132,"ĠDisapp":39133,"833":39134,"ĠEQU":39135,"Ġprecedence":39136,"mberg":39137,"641":39138,"ĠRoller":39139,"Ġspecifying":39140,"035":39141,"phil":39142,"Ġpowdered":39143,"Ġblot":39144,"Ġdeline":39145,"Bruce":39146,"536":39147,"Ġpim":39148,"leasing":39149,"vacc":39150,"RN":39151,"Ġspacing":39152,"Ġhangar":39153,"ĠPlot":39154,"537":39155,"legraph":39156,"596":39157,"Ġpolyg":39158,"doi":39159,"ĠNerd":39160,"installed":39161,"ĠSeeds":39162,"ĠPlays":39163,"ĠRomance":39164,"layer":39165,"Ġunsu":39166,"Ġcurric":39167,"Mi":39168,"restrial":39169,"ĠNiño":39170,"ĠProper":39171,"Ġpores":39172,"Giving":39173,"aeus":39174,"Middle":39175,"liber":39176,"Ġcombatants":39177,"ĠBulk":39178,"Ġ502":39179,"Ġstru":39180,"ĠLonely":39181,"Companies":39182,"inence":39183,"Autom":39184,"Ġfearsome":39185,"Ġsummar":39186,"Ġrotated":39187,"ĠPLA":39188,"ĠFAT":39189,"572":39190,"ĠSkies":39191,"iour":39192,"Ġintimately":39193,"amera":39194,"Ġ475":39195,"623":39196,"Ġirrig":39197,"Ġboosters":39198,"Ġtransmitting":39199,"DOWN":39200,"ĠAble":39201,"Ġfuriously":39202,"spirit":39203,"Ġgrun":39204,"Ġbible":39205,"ĠAdmir":39206,"Ġ§":39207,"ĠRaise":39208,"Ġflowering":39209,"uxe":39210,"ravis":39211,"urther":39212,"ĠScientology":39213,"pathy":39214,"Ġruth":39215,"Ġtempor":39216,"Ġwhispered":39217,"ogly":39218,"coord":39219,"chlor":39220,"processing":39221,"iott":39222,"ĠTY":39223,"wik":39224,"abolic":39225,"ĠUnable":39226,"ĠLiterary":39227,"ĠpH":39228,"Eastern":39229,"Craig":39230,"Fear":39231,"Ġinventions":39232,"ĠNost":39233,"Ġafflicted":39234,"ĠSwamp":39235,"INST":39236,"Jerry":39237,"Ġprope":39238,"ĠLancet":39239,"Ġrefres":39240,"ĠPrinciples":39241,"ĠLys":39242,"ERAL":39243,"addock":39244,"Ġcynicism":39245,"Ġmassacres":39246,"roo":39247,"Ġcollagen":39248,"Johnny":39249,"Keith":39250,"Italian":39251,"553":39252,"Dad":39253,"Neither":39254,"cler":39255,"ilers":39256,"Ġassass":39257,"Travel":39258,"672":39259,"Ġeaves":39260,"ATOR":39261,"Ġoily":39262,"581":39263,"ateful":39264,"728":39265,"Ġchiefly":39266,"tical":39267,"enes":39268,"ĠWouldn":39269,"ĠJacket":39270,"ĠSuit":39271,"Ġindustrialized":39272,"ĠNose":39273,"ĠSECTION":39274,"Ġredd":39275,"Ġcavity":39276,"Ġconn":39277,"Shield":39278,"Ġtongues":39279,"Ġsuccinct":39280,"views":39281,"ĠMUST":39282,"oliath":39283,"Ġlimitless":39284,"Ġapocalyptic":39285,"ĠAtlantis":39286,"DNA":39287,"ilded":39288,"ĠDresden":39289,"nit":39290,"Ġsubdiv":39291,"gressive":39292,"701":39293,"hops":39294,"alist":39295,"Ġunintentional":39296,"Ġpsychic":39297,"Ġcontrovers":39298,"Ġforeground":39299,"Ġnaïve":39300,"Ġfolders":39301,"icist":39302,"Ġdrawbacks":39303,"ĠToxic":39304,"ophy":39305,"ĠMasonic":39306,"Ġcis":39307,"olated":39308,"Ġdepletion":39309,"Rap":39310,"692":39311,"Ġinver":39312,"ĠFAQ":39313,"Ġmeanings":39314,"Ġbisc":39315,"ĠRage":39316,"Ġresear":39317,"Ep":39318,"Ġunbeat":39319,"ĠComponents":39320,"bub":39321,"ĠInterface":39322,"Isa":39323,"ĠArgon":39324,"Ġdenomin":39325,"Ġmammal":39326,"519":39327,"Ġsizing":39328,"imbabwe":39329,"ĠReplacement":39330,"Georgia":39331,"ĠParticipation":39332,"Ġmelts":39333,"Ġfemin":39334,"514":39335,"Ġseams":39336,"513":39337,"ĠGaw":39338,"Ġbrood":39339,"Mit":39340,"Ġannoyance":39341,"Ġequilibrium":39342,"Ġpatri":39343,"Ġ338":39344,"561":39345,"mentioned":39346,"ĠVotes":39347,"Ġintoler":39348,"Ġstrikingly":39349,"Ġ352":39350,"Ġskeletal":39351,"616":39352,"isition":39353,"Ġfluor":39354,"provided":39355,"517":39356,"Ġclimates":39357,"Ġsensibilities":39358,"ĠFrequ":39359,"onite":39360,"Kenn":39361,"Ġmagnets":39362,"assis":39363,"Ġprerequisite":39364,"Ġ>>>":39365,"Ġscree":39366,"google":39367,"ĠMirage":39368,"Ġevict":39369,"Peace":39370,"Ġmissionaries":39371,"617":39372,"748":39373,"rient":39374,"ĠSTATS":39375,"Bird":39376,"ĠShiva":39377,"ĠBlessing":39378,"Ġredundancy":39379,"Ġphotoc":39380,"ĠOnes":39381,"754":39382,"alert":39383,"urous":39384,"Ġfolklore":39385,"ĠIdeal":39386,"sheets":39387,"according":39388,"Hor":39389,"Cle":39390,"ĠEdit":39391,"671":39392,"olitics":39393,"ĠESC":39394,"Ġparaly":39395,"Ġorgasm":39396,"speak":39397,"ð":39398,"Ġsneaky":39399,"Ġswords":39400,"Ġfandom":39401,"776":39402,"ĠScandinav":39403,"Ġdarts":39404,"546":39405,"cerpt":39406,"ĠGifts":39407,"Ġmagically":39408,"phys":39409,"Laughs":39410,"ĠSour":39411,"ources":39412,"789":39413,"ĠEps":39414,"ository":39415,"uality":39416,"literally":39417,"Ġheavens":39418,"FUL":39419,"Ġie":39420,"ĠISP":39421,"Ġwink":39422,"Ġweeping":39423,"Ġdocking":39424,"ACY":39425,"iece":39426,"Ġsignifies":39427,"guns":39428,"Sac":39429,"Leave":39430,"imation":39431,"Ġunex":39432,"uctive":39433,"ĠFees":39434,"ĠPortable":39435,"ĠInvestigator":39436,"pill":39437,"rehensible":39438,"Ġpotency":39439,"803":39440,"Ġembodiment":39441,"overty":39442,"shine":39443,"REL":39444,"ĠMPH":39445,"ĠPatriarch":39446,"Ġaspirin":39447,"Ġrinse":39448,"Ġinher":39449,"ograms":39450,"ĠTHREE":39451,"qt":39452,"ipples":39453,"Ġdehuman":39454,"Ġslander":39455,"Ġflora":39456,"brow":39457,"Ġblindly":39458,"ectar":39459,"endish":39460,"Ġpigment":39461,"cellent":39462,"Ġyells":39463,"ĠLust":39464,"ĠAttacks":39465,"ĠSyndicate":39466,"otin":39467,"gress":39468,"reenshot":39469,"picking":39470,"Ġacupuncture":39471,"images":39472,"glas":39473,"ĠPolicies":39474,"Ġintestinal":39475,"1998":39476,"ULE":39477,"runs":39478,"ĠNing":39479,"ĠAsuka":39480,"ĠSkull":39481,"Motor":39482,"Ġdefund":39483,"Ġattaching":39484,"ĠBAD":39485,"Ġquarrel":39486,"Child":39487,"Dog":39488,"issan":39489,"irmation":39490,"Ġinline":39491,"ĠLover":39492,"Ġcyan":39493,"entary":39494,"awareness":39495,"Ġtraveller":39496,"âĢIJ":39497,"Ġbeasts":39498,"Ġboobs":39499,"ĠDeadly":39500,"Ġplutonium":39501,"ĠIntellectual":39502,"Jam":39503,"Ġconsec":39504,"663":39505,"ĠVegan":39506,"Ġ331":39507,"uron":39508,"ĠHEL":39509,"reements":39510,"Ġclone":39511,"Ġoutputs":39512,"oult":39513,"ĠDOM":39514,"ĠNX":39515,"Ze":39516,"909":39517,"brate":39518,"arations":39519,"ĠJindal":39520,"Ġbooklet":39521,"amide":39522,"Ġscraping":39523,"Sol":39524,"Date":39525,"796":39526,"Ġfulf":39527,"Ġskeletons":39528,"Ġsaints":39529,"ĠCurious":39530,"Han":39531,"Ġrepud":39532,"osity":39533,"ĠGravity":39534,"Ġmetadata":39535,"Focus":39536,"Ġthrott":39537,"ĠProgramming":39538,"Break":39539,"erver":39540,"Ġknight":39541,"yrs":39542,"Ġ376":39543,"sat":39544,"auto":39545,"Ġbroom":39546,"Ġnerd":39547,"Political":39548,"022":39549,"-------------":39550,"oulos":39551,"Ġrelic":39552,"Ġenactment":39553,"rious":39554,"ĠUniform":39555,"Teen":39556,"Colorado":39557,"055":39558,"Ġangled":39559,"bolt":39560,"ĠNeander":39561,"ĠDism":39562,"thanks":39563,"Polit":39564,"ersion":39565,"dro":39566,"install":39567,"Jake":39568,"hz":39569,"Ġ770":39570,"ĠCommodore":39571,"lahoma":39572,"Ġshri":39573,"Ġ....":39574,"Ġ7000":39575,"scope":39576,"Ġgenesis":39577,"Ġresided":39578,"ĠRivals":39579,"Ġsarcastic":39580,"Ġelicit":39581,"Ġmultiplied":39582,"uitous":39583,"Ġoppress":39584,"ĠPROT":39585,"Ġperpetually":39586,"ĠAdds":39587,"Ġbuffers":39588,"Ġmush":39589,"Ġ354":39590,"Ġpresc":39591,"ĠKung":39592,"682":39593,"Education":39594,"Ġpled":39595,"bsp":39596,"Ġconfessions":39597,"Ġrevocation":39598,"Micro":39599,"ĠHobby":39600,"ĠFatal":39601,"STAR":39602,"Ġworkspace":39603,"Ġtransformations":39604,"Ġportals":39605,"orned":39606,"figured":39607,"Ġlinguistic":39608,"pperc":39609,"ergus":39610,"Fel":39611,"ĠIntent":39612,"Ġ289":39613,"Ġdelinquent":39614,"Ġhandwriting":39615,"Ġvap":39616,"576":39617,"redited":39618,"736":39619,"Ġpsychiatry":39620,"GMT":39621,"Ġdisingen":39622,"Ġcrou":39623,"801":39624,"Ġmalice":39625,"itutes":39626,"ĠTiff":39627,"Ġstink":39628,"574":39629,"Story":39630,"Modern":39631,"ĠGly":39632,"Jamie":39633,"Ġadvertis":39634,"Ġhiber":39635,"Ġinfiltr":39636,"Ġelector":39637,"rovers":39638,"ĠFist":39639,"peed":39640,"ĠClassical":39641,"592":39642,"Ġconscientious":39643,"Surv":39644,"Text":39645,"ĠDrunk":39646,"Ġsupplemented":39647,"THIS":39648,"Ġtimid":39649,"Ġstacking":39650,"rites":39651,"Ġrebirth":39652,"Ġbalcon":39653,"Ġyawn":39654,"rosc":39655,"axy":39656,"Hart":39657,"ĠOPER":39658,"996":39659,"Ġrabid":39660,"ĠTick":39661,"Ġgrinning":39662,"elfth":39663,"045":39664,"Ġjustifies":39665,"ĠPirate":39666,"ĠSalary":39667,"Ġmirac":39668,"613":39669,"inately":39670,"ĠLIN":39671,"Ġinadequ":39672,"NPR":39673,"iddled":39674,"storage":39675,"Ġseventy":39676,"onet":39677,"Ġgastro":39678,"FIR":39679,"Ġrodent":39680,"629":39681,"ĠInclude":39682,"ĠCategories":39683,"ĠLiterally":39684,"Ġpree":39685,"aunder":39686,"ĠLOL":39687,"694":39688,"Ġindef":39689,"Ped":39690,"Ġmenstru":39691,"Ġcensored":39692,"Ġconfigure":39693,"Ġoverest":39694,"igenous":39695,"Ġrectangular":39696,"ĠMIS":39697,"ĠMub":39698,"Ġwitches":39699,"izards":39700,"Ġobnoxious":39701,"ĠLoll":39702,"ĠSEM":39703,"Ġspiritually":39704,"Ġcoer":39705,"Ġmodesty":39706,"butt":39707,"Ġedits":39708,"ĠShall":39709,"sburgh":39710,"Ġ1911":39711,"Rex":39712,"manent":39713,"ĠLithuan":39714,"Ġpointers":39715,"ativity":39716,"retch":39717,"Ġcascade":39718,"ĠRagnarok":39719,"ĠPainting":39720,"ĠATL":39721,"Born":39722,"Ġpadding":39723,"whel":39724,"Ġgrotesque":39725,"Ġtheorists":39726,"forcer":39727,"ĠJinn":39728,"Ġrenal":39729,"jamin":39730,"ĠFEC":39731,".\"\"":39732,"redict":39733,"Ġoppos":39734,"opted":39735,"Sel":39736,"ipment":39737,"752":39738,"792":39739,"Pur":39740,"Ġvolt":39741,"Ġflap":39742,"ĠCASE":39743,"Ġdyed":39744,"orers":39745,"becca":39746,",.":39747,"ifice":39748,"ubes":39749,"Ġyr":39750,"DW":39751,"Ġalteration":39752,"ĠSimpl":39753,"Ġunequiv":39754,"756":39755,"Dou":39756,"Ġplunder":39757,"Ġcommons":39758,"Ġstag":39759,"ĠZeal":39760,"avanaugh":39761,"Self":39762,"none":39763,"EGIN":39764,"Ġflashback":39765,"VAL":39766,"Gab":39767,"ĠCapture":39768,"ĠBrilliant":39769,"ĠDisk":39770,"ĠMood":39771,"Ġhaun":39772,"Ġrotting":39773,"ĠCobra":39774,"Ġpsychopath":39775,"Ġhelper":39776,"Starting":39777,"ĠOrbit":39778,"Ġcaf":39779,"Half":39780,"Volume":39781,"aptop":39782,"ĠSaga":39783,"azor":39784,"593":39785,"774":39786,"ĠCaucasian":39787,"compan":39788,"ĠVERY":39789,"GES":39790,"Ġvomit":39791,"Ġdispro":39792,"ĠMechanics":39793,"Ġ385":39794,"Ġmystical":39795,"AFTA":39796,"Ġbacter":39797,"availability":39798,"Ġhairc":39799,"ĠVec":39800,"rypt":39801,"Ġmanipulative":39802,"shell":39803,"ĠWeird":39804,"jab":39805,"ĠByr":39806,"Bow":39807,"uin":39808,"Ġquot":39809,"MX":39810,"Ġ960":39811,"ĠSharia":39812,"ĠWeapon":39813,"ĠPowerPoint":39814,"Ġstitching":39815,"Ġconstraint":39816,"âľ":39817,"ulic":39818,"597":39819,"omedical":39820,"ĠSupplemental":39821,"ĠSurve":39822,"ĠSubcommittee":39823,"ĠDarkness":39824,"Ġpython":39825,"LU":39826,"Ġ402":39827,"ĠQuan":39828,"ĠModerate":39829,"clusively":39830,"Ġextrap":39831,"Ġlatt":39832,"ĠSTUD":39833,"oslav":39834,"Ġsymb":39835,"battle":39836,"flash":39837,"ĠDeploy":39838,"Ġmicrobiome":39839,"Ġingested":39840,"Ġdistort":39841,"Ġassimil":39842,"Ġmobs":39843,"illet":39844,"Gre":39845,"Ġ294":39846,"Ġforbids":39847,"ĠEfficiency":39848,"ĠClan":39849,"763":39850,"Ġdragons":39851,"States":39852,"ĠMAKE":39853,"ĠBOOK":39854,"ĠRuns":39855,"ĠUX":39856,"EED":39857,"Whoever":39858,"ionics":39859,"worldly":39860,"ĠMermaid":39861,"Ġbenz":39862,"Info":39863,"523":39864,"Ġbiod":39865,"ĠPoison":39866,"ceivable":39867,"Services":39868,"ATIVE":39869,"ĠItem":39870,"Ġdisav":39871,"Ġheter":39872,"Ġasteroids":39873,"ĠWooden":39874,"Ġelectroly":39875,"assadors":39876,"nance":39877,"reflect":39878,"Ġattent":39879,"iphany":39880,"Ġspaceship":39881,"Ġbegg":39882,"algia":39883,"Ax":39884,"Ġidiosyncr":39885,"Ġinserting":39886,"ĠCSS":39887,"ĠLET":39888,"ĠStrikes":39889,"ossibly":39890,"Exp":39891,"Opp":39892,"dden":39893,"Ġplayable":39894,"ĠJM":39895,"Ġlawfully":39896,"ĠBlink":39897,"Ġ413":39898,"Ġoverpowered":39899,"Ġcommenter":39900,"Track":39901,"Ġmethyl":39902,"Ġfermented":39903,"Ġinvaders":39904,"ĠMoves":39905,"Ġcommunicates":39906,"rint":39907,"ĠTray":39908,"jug":39909,"Ġsuperf":39910,"ochet":39911,"ĠJelly":39912,"Ġestrogen":39913,"Dom":39914,"mix":39915,"Gun":39916,"ochemistry":39917,"952":39918,"Ġovere":39919,"ĠPlaintiff":39920,"ĠPilgrim":39921,"ĠSERVICES":39922,"ĠExpend":39923,"ĠFRE":39924,"Ġsmelling":39925,"ĠSpaces":39926,"bris":39927,"Mission":39928,"Ġarter":39929,"Ġautonom":39930,"Lisa":39931,"ĠPercent":39932,"NK":39933,"ĠLimits":39934,"Ġ356":39935,"Recent":39936,"ĠSiberian":39937,"etermin":39938,"nets":39939,"ĠSword":39940,"essee":39941,"Ùĩ":39942,"icycle":39943,"Ġparas":39944,"Ġrud":39945,"Ġscrib":39946,"Ġ1860":39947,"Shop":39948,"orld":39949,"Ġpept":39950,"ENSE":39951,"Ġanimations":39952,"ership":39953,"Search":39954,"ĠUSSR":39955,"washed":39956,"Ġpromulg":39957,"Ġdetainee":39958,"Ġunderest":39959,"ĠAppropri":39960,"Left":39961,"Update":39962,"Wallet":39963,"idently":39964,"ĠBicycle":39965,"Ġgorge":39966,"abyte":39967,"ĠMinecraft":39968,"rike":39969,"997":39970,"Tesla":39971,"Often":39972,"ĠTHESE":39973,"Ġregression":39974,"Hen":39975,"Ġsnippets":39976,"irds":39977,"Ġprinces":39978,"Ġwastes":39979,"ĠWond":39980,"itimate":39981,"ĠMongol":39982,"ĠkW":39983,"Ġidiots":39984,"Ġforeigner":39985,"Upon":39986,"Ġbackdoor":39987,"umph":39988,"ĠSquirrel":39989,"Ġtyped":39990,"Ġblockers":39991,"Vote":39992,"ĠPossibly":39993,"geist":39994,"ĠTRANS":39995,"Ġtitan":39996,"VG":39997,"Ġmicrobi":39998,"Ġinteracts":39999,"Ġmasc":40000,"Ġfinite":40001,"Ġcutoff":40002,"ornings":40003,"Ġprototyp":40004,"Ġcompan":40005,"mology":40006,"ĠBOX":40007,"Cre":40008,"Bot":40009,"grading":40010,"PET":40011,"Ġinsidious":40012,"ĠFranch":40013,"orians":40014,"ĠAUT":40015,"ĠCrush":40016,"589":40017,"question":40018,"anguard":40019,"Ġabsurdity":40020,"?\",":40021,"Hum":40022,"Ġliberalism":40023,"Ġpostwar":40024,"Gener":40025,"Personally":40026,"889":40027,"Bul":40028,"Ġlighthouse":40029,"Ġ291":40030,"VK":40031,"ĠExposure":40032,"Ġsubtract":40033,"ometime":40034,"arbon":40035,"ĠThieves":40036,"anus":40037,"ĠLibertarian":40038,"Raw":40039,"Ġsolvent":40040,"Ġcorros":40041,"Ġsignific":40042,"Ġscholarly":40043,"024":40044,"Ġfetish":40045,"Ġlarvae":40046,"Ġcatast":40047,"Ġtraitor":40048,"ijing":40049,"Demand":40050,"math":40051,"Ġconceivable":40052,"either":40053,"acl":40054,"ĠArrows":40055,"627":40056,"ĠFrankenstein":40057,"entious":40058,"Ġimitation":40059,"amn":40060,"ĠSTOP":40061,"Ġcripp":40062,"zag":40063,"ĠZed":40064,"797":40065,"Along":40066,"Ġwont":40067,"Ġfolds":40068,"Shar":40069,"ĠCommentary":40070,"ĠLibraries":40071,"ĠThunderbolt":40072,"itud":40073,"Toy":40074,"Ġincidentally":40075,"ĠResp":40076,"Ġordinarily":40077,"Ġvanish":40078,"acterial":40079,"Minnesota":40080,"rank":40081,"614":40082,"ĠExam":40083,"Got":40084,"Ġsnipers":40085,"ETHOD":40086,"dirty":40087,"igsaw":40088,"Obs":40089,"ĠAuthors":40090,"Ġillustrating":40091,"782":40092,"864":40093,"Ġblinded":40094,"transfer":40095,"Ġspawning":40096,"ĠDiary":40097,"ĠDNS":40098,"CG":40099,"someone":40100,"Ġcruc":40101,"Morgan":40102,"Learn":40103,"API":40104,"toc":40105,"STAT":40106,"ĠFlame":40107,"aganda":40108,"ĠBenef":40109,"stuff":40110,"SEA":40111,"Ġincest":40112,"Normally":40113,"ĠRU":40114,"Ġarsenic":40115,"isine":40116,"ĠTG":40117,"Type":40118,"regn":40119,"Cass":40120,"Touch":40121,"Site":40122,"Ġpict":40123,"Ġcorrupted":40124,"729":40125,"Ġnineteen":40126,"Ġparaph":40127,"Ġtavern":40128,"Ġretard":40129,"ĠKaf":40130,"Ġcolleg":40131,"bucks":40132,"imum":40133,"ĠCandle":40134,"ĠMisc":40135,"ĠAwesome":40136,"edited":40137,"ĠDN":40138,"otomy":40139,"Ġdisclaimer":40140,"798":40141,"ĠGoodbye":40142,"ucle":40143,"atom":40144,"Judge":40145,"cipl":40146,"Ġinexplicable":40147,"iddler":40148,"781":40149,"Ġempirical":40150,"Veter":40151,"Ġascert":40152,"Ġaest":40153,"Ġlaz":40154,"binary":40155,"Ġ358":40156,"contained":40157,"Ġmultipl":40158,"ocado":40159,"Ġdelusional":40160,"Ġaeros":40161,"udence":40162,"Ġjargon":40163,"estine":40164,"Ġarbitrarily":40165,"Ġprick":40166,"BACK":40167,"amines":40168,"Mess":40169,"Knowing":40170,"ublic":40171,"ĠWarfare":40172,"Ġsignify":40173,"Ġfragmentation":40174,"Tex":40175,"Ġnin":40176,"Ġdise":40177,"882":40178,"hospital":40179,"volent":40180,"Need":40181,"Ġinfer":40182,"Sony":40183,"783":40184,"YING":40185,"Ġinfinity":40186,"ĠFortress":40187,"Ġmustache":40188,"Ġcorresponds":40189,"DX":40190,"Ġunmarried":40191,"ĠCruel":40192,"Ġ1901":40193,"Ġappropri":40194,"ZI":40195,"Ġphosph":40196,"901":40197,"IFE":40198,"Ġ347":40199,"Ġconvoluted":40200,"ĠApost":40201,"htm":40202,"Ġilluminating":40203,"568":40204,"Ġassassinate":40205,"Ġparam":40206,"Ġimpractical":40207,"cedes":40208,"ĠProcedure":40209,"ĠMouth":40210,"Battle":40211,"Ġ451":40212,"Sand":40213,"Ġcontamin":40214,"Hour":40215,"Cell":40216,"BIL":40217,"Ġprecon":40218,"ĠScor":40219,"Ġconfig":40220,"ĠMuscle":40221,"Ġhive":40222,"Ġunderworld":40223,"plement":40224,"Ġpostage":40225,"Ġinterpersonal":40226,"Ġpierced":40227,"Ġcharms":40228,"oscopic":40229,"ASC":40230,"ĠDex":40231,"render":40232,"png":40233,"Ġcritiques":40234,"992":40235,"ĠVinyl":40236,"Bear":40237,"idia":40238,"ĠTemp":40239,"Ġcyn":40240,"ĠBCE":40241,"Ġpatriarchal":40242,"Ġantagonist":40243,"ĠGMO":40244,"Ġunnatural":40245,"Race":40246,"imeo":40247,"ĠUkrainians":40248,"Train":40249,"Ġ329":40250,"ritten":40251,"igil":40252,"Lin":40253,"alus":40254,"*****":40255,"olded":40256,"ĠPegasus":40257,"Bas":40258,"photos":40259,"Ġ820":40260,"Ġsquadron":40261,"ESE":40262,"Ġ373":40263,"Uk":40264,"Lost":40265,"Store":40266,"ĠScenes":40267,"JJ":40268,"Ġlick":40269,"Tyler":40270,"cius":40271,"lishing":40272,"ocl":40273,"Ġassoci":40274,"ensitivity":40275,"entanyl":40276,"Rum":40277,"Ġ443":40278,"onding":40279,"Ġpedals":40280,"ĠPsychological":40281,"Ġthro":40282,"Network":40283,"591":40284,"Pick":40285,"Ġchords":40286,"ĠHound":40287,"entials":40288,"faces":40289,"ĠYin":40290,"ugi":40291,"bows":40292,"ĠForms":40293,"886":40294,"Ox":40295,"Ġ351":40296,"Ġmating":40297,"Ġchirop":40298,"916":40299,"Ġexpend":40300,"Ġusefulness":40301,"Marvel":40302,"ĠStretch":40303,"omez":40304,"ĠJS":40305,"Hal":40306,"fle":40307,"ĠCountdown":40308,"ĠLH":40309,"assian":40310,"vd":40311,"ĠTranscript":40312,"ĠExtrem":40313,"idine":40314,"ustainable":40315,"ederal":40316,"ĠOwl":40317,"Ġcreed":40318,"ĠGrateful":40319,"Ġprenatal":40320,"________________________________":40321,"ĠElements":40322,"â̦)":40323,"nesia":40324,"ARGET":40325,"Ġboredom":40326,"Ġdepictions":40327,"verbal":40328,"ĠeSports":40329,"Laura":40330,"ilage":40331,"ĠGalactic":40332,"Investigators":40333,"Ġscattering":40334,"instein":40335,"ĠExperiment":40336,"ĠRecre":40337,"Ġregul":40338,"Ġrelent":40339,"STE":40340,"Ġslicing":40341,"igans":40342,"raped":40343,"ĠDeter":40344,"Ġsmoker":40345,"ĠWikimedia":40346,"pages":40347,"Ted":40348,"713":40349,"Ġpuberty":40350,"Ġhars":40351,"ĠStarter":40352,"patch":40353,"leeve":40354,"Ġ346":40355,"ĠAccessories":40356,"ventions":40357,"ĠSTAND":40358,"ĠUrug":40359,"ĠOccupy":40360,"Ġbinds":40361,"ĠBubble":40362,"Ġincorporation":40363,"Ġstereotypical":40364,"Ġgor":40365,"987":40366,"Ġevils":40367,"tower":40368,"Ġastronomer":40369,"Ble":40370,"ĠNid":40371,"ĠWidow":40372,"Ġpaw":40373,"Ġinnoc":40374,"ĠOWN":40375,"Ġtofu":40376,"drops":40377,"ĠEval":40378,"693":40379,"Collins":40380,"penter":40381,"ĠNib":40382,"Ġsmokes":40383,"Ġ1850":40384,"Ġtechno":40385,"oooo":40386,"ĠUnic":40387,"ĠKirin":40388,"\":[\"":40389,"Ġincrements":40390,"989":40391,"oodoo":40392,"ĠCyborg":40393,"Ġcures":40394,"ĠOW":40395,"ĠAnnex":40396,"behavior":40397,"/-":40398,"Ġbuggy":40399,"onent":40400,"Bey":40401,"Ġsummarize":40402,"putable":40403,"Ġfri":40404,"Gi":40405,"urances":40406,"ĠAppalach":40407,"Ġhegemony":40408,"ĠOrigins":40409,"Ġconnectors":40410,"ĠAST":40411,"object":40412,"ĠSlay":40413,"Arm":40414,"oston":40415,"ĠEVEN":40416,"Ġprophecy":40417,"Bright":40418,"ĠVector":40419,"Marg":40420,"omical":40421,"Holy":40422,"ĠRPM":40423,"ĠReceiver":40424,"Ġtracts":40425,"boss":40426,"Ġblurry":40427,"aspx":40428,"DES":40429,"Ġcess":40430,"ĠAster":40431,"anything":40432,"levard":40433,"unciation":40434,"jong":40435,"Ġiv":40436,"Common":40437,"ĠDistance":40438,"imus":40439,"outheast":40440,"Ġcir":40441,"ĠCato":40442,"Ġinscribed":40443,"ersed":40444,"Ġanarchy":40445,"Ġplagiar":40446,"Ġthug":40447,"Actor":40448,"ĠTant":40449,"Researchers":40450,"remember":40451,"Ġitch":40452,"Ġrefill":40453,"Ġsucker":40454,"ĠWANT":40455,"RAG":40456,"rencies":40457,"ĠTape":40458,"Ġattaches":40459,"nb":40460,"Tan":40461,"Ġappend":40462,"Ġalas":40463,"951":40464,"panel":40465,"Climate":40466,"icrobial":40467,"Brandon":40468,"ĠFreud":40469,"Ġfungi":40470,"Ġcommenters":40471,"ĠDelicious":40472,"Ġhitherto":40473,"conv":40474,"Ġchemist":40475,"Ġdenominations":40476,"ĠBehavior":40477,"comed":40478,"ĠLantern":40479,"ĠFloating":40480,"magic":40481,"ĠBarbar":40482,"bender":40483,"iliar":40484,"unny":40485,"Ġretracted":40486,"atars":40487,"ĠLovely":40488,"Ġinfinitely":40489,"Ġhumili":40490,"Ġinterestingly":40491,"Ġmunicip":40492,"ĠPanic":40493,"Ġcomprehension":40494,"ĠMassacre":40495,"Ġpersuasion":40496,"enf":40497,"Ġcoded":40498,"higher":40499,"chart":40500,"umbered":40501,"ĠIndigo":40502,"Ġthinker":40503,"Ġgoof":40504,"ĠPetition":40505,"fascist":40506,"absor":40507,"Ġassay":40508,"ĠClassification":40509,"Ġhalluc":40510,"speech":40511,"issues":40512,"Ġinexper":40513,"ĠLibre":40514,"Ġsling":40515,"zech":40516,"Ġpouch":40517,"ĠOffense":40518,"ĠHF":40519,"Fight":40520,"026":40521,"ĠTrident":40522,"fm":40523,"Ġintox":40524,"Ġ465":40525,"colonial":40526,"ovies":40527,"794":40528,"Techn":40529,"undreds":40530,"Ġchildish":40531,"arenthood":40532,"ĠShade":40533,"Host":40534,"Ġdirectional":40535,"reader":40536,"rimp":40537,"ĠEater":40538,"prep":40539,"Ġmeas":40540,"Ġlatch":40541,"inant":40542,"nels":40543,"finished":40544,"application":40545,"Board":40546,"Ġfiller":40547,"ivably":40548,"CAST":40549,"Ġstereotyp":40550,"Ġwarranties":40551,"ĠProbe":40552,"Ġspontaneously":40553,"Ġtropes":40554,"Meg":40555,"ĠHandling":40556,"hemer":40557,"986":40558,"ĠSly":40559,"plates":40560,"Ġmolten":40561,"ĠHIT":40562,"strings":40563,"Ġcentrif":40564,"ĠENG":40565,"Indeed":40566,"Ġ429":40567,"Ġsly":40568,"Ġ490":40569,"Ġhordes":40570,"boot":40571,"691":40572,"ihara":40573,"Ġsubversive":40574,"Russell":40575,"aceous":40576,"wk":40577,"Ġreverence":40578,"Ġingenious":40579,"holiday":40580,"eligible":40581,"ĠTactical":40582,"978":40583,"herence":40584,"Ġgimm":40585,"Ġarchaic":40586,"Ġadam":40587,"Ġ297":40588,"Father":40589,"ĠLerner":40590,"Ġhesitated":40591,"Safety":40592,"Ġawakened":40593,"ueller":40594,"Ġextrater":40595,"Ġmummy":40596,"ĠBuddhism":40597,"Ġ359":40598,"Ġlegions":40599,"Ġprehistoric":40600,"ancouver":40601,"Ġmelancholy":40602,"ĠEnemy":40603,"ĠSyl":40604,"ĠRobo":40605,"verting":40606,"ĠBullets":40607,"essler":40608,"Ġmarvelous":40609,"ĠBened":40610,"Ġsavior":40611,"omever":40612,"Bee":40613,"Ġrapp":40614,"Ġpredomin":40615,"ĠScripture":40616,"Ġsnapshots":40617,"Ġunrem":40618,"Ġsquid":40619,"ĠBuddh":40620,"ĠSantorum":40621,"Internet":40622,"avoid":40623,"Ġunamb":40624,"Ġ296":40625,"Ġnexus":40626,"Ġinterchangeable":40627,"ockets":40628,"Ġfoll":40629,"ĠOPT":40630,"023":40631,"²":40632,"Ġhereditary":40633,"Ġvape":40634,"=\"":40635,"1996":40636,"س":40637,"Emergency":40638,"Ġneb":40639,"Ġisot":40640,"Ġdiam":40641,"stairs":40642,"ĠAppendix":40643,"venient":40644,"Ġinvol":40645,"Ġtheorist":40646,"Ġconqu":40647,"Mich":40648,"ĠSort":40649,"antasy":40650,"dating":40651,"771":40652,"Ġape":40653,"Ġindemn":40654,"ween":40655,"Games":40656,"ascal":40657,"Muslims":40658,"Ġleaflets":40659,"Ġtraverse":40660,"Ġtransgress":40661,"Ġflushed":40662,"893":40663,"lasses":40664,"obos":40665,"ooming":40666,"Ġtou":40667,"mast":40668,"âģ":40669,"751":40670,"Either":40671,"Ġgrate":40672,"urgy":40673,"Ġendowed":40674,"ĠRasm":40675,"Nat":40676,"odka":40677,"olon":40678,"iants":40679,"Ġsensations":40680,"Ġsituational":40681,"pox":40682,"Figure":40683,"Ġslime":40684,"Ġ421":40685,"ollow":40686,"Ġanesthesia":40687,"adult":40688,"ĠPiece":40689,"994":40690,"ĠAnalog":40691,"Iv":40692,"flo":40693,"Ġdomest":40694,"Ġcabal":40695,"Ġgarg":40696,"Ġrabb":40697,"REC":40698,"ISTORY":40699,"Friend":40700,"Ġancestor":40701,"ĠLets":40702,"Ġelf":40703,"Ġlobb":40704,"ĠAdren":40705,"silver":40706,"astical":40707,"Ġstitch":40708,"028":40709,"Hug":40710,"Ġmoss":40711,"ompl":40712,"Ġunob":40713,"883":40714,"Ġcortex":40715,"olutely":40716,"052":40717,"Seattle":40718,"restling":40719,"endment":40720,"Ġ366":40721,"ventus":40722,"ĠRated":40723,"ĠClever":40724,"Ġcloak":40725,"phrase":40726,"flake":40727,"Ġphilosophies":40728,"784":40729,"Ġskulls":40730,"wake":40731,"oru":40732,"ĠACTION":40733,"Ġcomprom":40734,"ĠManufacturer":40735,"ĠImprove":40736,"Ns":40737,"ĠRevenge":40738,"lords":40739,"Ġ417":40740,"iddles":40741,"Ġcondesc":40742,"tiny":40743,"Ġchloride":40744,"greg":40745,"ĠREST":40746,"subject":40747,"Ġundes":40748,"ftime":40749,"Ġbottleneck":40750,"ĠZombie":40751,"Ġhabitable":40752,"Ġcigars":40753,"Ġenlarg":40754,"icester":40755,"ðĿ":40756,"regulation":40757,"arters":40758,"Ġformulations":40759,"Ġadhesive":40760,"Ġ344":40761,"pod":40762,"etitive":40763,"Ġcontinuum":40764,"aghd":40765,"Ġ701":40766,"Ġdisband":40767,"Tu":40768,"Ġcivilisation":40769,"ĠPCI":40770,"Ġcrooked":40771,"ammy":40772,"Ġbrim":40773,"Jr":40774,"ĠBunker":40775,"plot":40776,"Ġwielded":40777,"Ġcaricature":40778,"ĠInfinite":40779,"piracy":40780,"aretz":40781,"Ġstares":40782,"incinnati":40783,"agents":40784,"ĠObamaCare":40785,"asuring":40786,"ansion":40787,"Ġastonished":40788,"iovascular":40789,"Bio":40790,"Ġadvisable":40791,"Ġsender":40792,"887":40793,"Led":40794,"DN":40795,"Ġaggregation":40796,"ĠInnocent":40797,"ĠTransactions":40798,"worms":40799,"ĠWorm":40800,"Ġ363":40801,"ĠBiblical":40802,"rared":40803,"Ġgazing":40804,"chant":40805,"Ġsubordinates":40806,"1600":40807,"actually":40808,"olition":40809,"ĠRTX":40810,"ĠPyramid":40811,"alph":40812,"ĠFPS":40813,"Ġerrone":40814,"ĠLR":40815,"Scientists":40816,"Ġincons":40817,"Ġbrittle":40818,"027":40819,"ĠBowser":40820,"Rub":40821,"links":40822,"ĠWik":40823,"ussion":40824,"Marsh":40825,"resents":40826,"Clean":40827,"Ġbrute":40828,"ĠInventory":40829,"1100":40830,"ĠATK":40831,"793":40832,"Ġcaveats":40833,"ĠKnot":40834,"IRT":40835,"ĠCanad":40836,"isma":40837,"entin":40838,"Own":40839,"Ġ455":40840,"Ġlesions":40841,"ĠAres":40842,"ĠKali":40843,"Ġpaws":40844,"Auto":40845,"Ġdiscrim":40846,"044":40847,"ĠCOUN":40848,"Ġ1905":40849,"Ġexperien":40850,"Ġ406":40851,"achelor":40852,"Ġscarcely":40853,"Ġsynchronized":40854,"Rat":40855,"Blake":40856,"Ġrewriting":40857,"Ġcannons":40858,"stem":40859,"Apparently":40860,"Ġleveling":40861,"?]":40862,"Ġfins":40863,"ĠTone":40864,"ogether":40865,"Sound":40866,"Ġmicrosc":40867,"ĠAsylum":40868,"Ġindividuality":40869,"Ġ432":40870,"lease":40871,"Chuck":40872,"Ġhating":40873,"Ġleftists":40874,"ĠPersonality":40875,"ĠBundle":40876,"Dutch":40877,"Ġtransformer":40878,"iami":40879,"ĠTradition":40880,"ĠRecipes":40881,"Ġdiscour":40882,"Viol":40883,"Ext":40884,"ĠOliv":40885,"ashington":40886,"Ġmillennia":40887,"Ġpsychiatrists":40888,"ĠTrilogy":40889,"inction":40890,"Ġdisliked":40891,"088":40892,"954":40893,"Ġoverloaded":40894,"Ġopium":40895,"acus":40896,"resources":40897,"mud":40898,"ometry":40899,"Hit":40900,"Ġguild":40901,"Ġabyss":40902,"884":40903,"ensity":40904,"ĠDifference":40905,"Electric":40906,"authent":40907,"Ġdownloadable":40908,"ellar":40909,"ĠSavior":40910,"ĠFRI":40911,"Ġ445":40912,"Ġincidental":40913,"Ġanalogue":40914,"ounters":40915,"ĠBuilder":40916,"Ġnarration":40917,"ategor":40918,"raise":40919,"Ġindoctr":40920,"Aren":40921,"Ġbaptism":40922,"Ġobe":40923,"Ġtubing":40924,"apsed":40925,"Fortunately":40926,"gered":40927,"Pict":40928,"Ġmastering":40929,"ĠHIM":40930,"ĠObesity":40931,"Ġornament":40932,"advant":40933,"ĠCous":40934,"032":40935,"cells":40936,"Ġpreclude":40937,"Ġanecdote":40938,"Ġpatriarchy":40939,"ĠSending":40940,"Pie":40941,"Ġdepressive":40942,"ĠEnds":40943,"712":40944,"zos":40945,"icka":40946,"Ġ1906":40947,"Anti":40948,"vana":40949,"ĠRestrict":40950,"Ġprotr":40951,"Ġusername":40952,"Ġparach":40953,"1997":40954,"imental":40955,"rower":40956,"carb":40957,"033":40958,"Ġobligatory":40959,"Ġwillful":40960,"Ġsnail":40961,"json":40962,"izarre":40963,"Ġmiscar":40964,"Ġdopamine":40965,"л":40966,"Ġapplic":40967,"Ġnervously":40968,"YY":40969,"alez":40970,"ĠSoviets":40971,"ĠMister":40972,"Ġcrates":40973,"Ġheavenly":40974,"Ġdoct":40975,"048":40976,"Ġ2400":40977,"ivia":40978,"adies":40979,"Phone":40980,"asks":40981,"Ġperenn":40982,"Ġcomposing":40983,"Ġraiding":40984,"requent":40985,"ibli":40986,"ĠFeedback":40987,"cellaneous":40988,"ĠContracts":40989,"ĠCasting":40990,"vim":40991,"Cut":40992,"Ġabbrevi":40993,"Ġintest":40994,"ricted":40995,"969":40996,"nostic":40997,"Ġinverted":40998,"ĠEG":40999,"aiden":41000,"ĠClaud":41001,"ĠiP":41002,"urized":41003,"Emily":41004,"Ġ353":41005,"Ġ((":41006,"ammad":41007,"Reb":41008,"plom":41009,"YES":41010,"connection":41011,"ĠWra":41012,"ĠMerch":41013,"Ġether":41014,"Elizabeth":41015,"Chip":41016,"relevant":41017,"URA":41018,"Ġantioxidant":41019,"ĠChron":41020,"Ġtheological":41021,"HCR":41022,"ruits":41023,"Body":41024,"enezuel":41025,"Few":41026,"adder":41027,"Ġinducing":41028,"ĠDarth":41029,"Ġimplicitly":41030,"Ġoverfl":41031,"Ġrelics":41032,"Must":41033,"ĠAnswers":41034,"Ġretina":41035,"ĠSlowly":41036,"ĠShib":41037,"software":41038,"Ġ\"\"":41039,"hack":41040,"Apart":41041,"told":41042,"Ger":41043,"Civil":41044,"problem":41045,"Ġslang":41046,"Ġtactile":41047,"Ġtabl":41048,"ĠAscension":41049,"Ġhumankind":41050,"Howard":41051,"rescent":41052,"ĠReleases":41053,"arijuana":41054,"Christopher":41055,"ĠWarden":41056,"blogspot":41057,"ĠVari":41058,"idency":41059,"ĠHandler":41060,"Round":41061,"MJ":41062,"Ġrhyth":41063,"Tai":41064,"terson":41065,"Ġ,\"":41066,"portation":41067,"ĠOrbital":41068,"Ġfantas":41069,"Ġattribut":41070,"Ġdiagram":41071,"atech":41072,"1992":41073,"ibl":41074,"Woman":41075,"ternally":41076,"Days":41077,"Ġdebunk":41078,"ĠPhant":41079,"ĠOath":41080,"sharp":41081,"Ġclaws":41082,"Lots":41083,"Incre":41084,"Aff":41085,"hooting":41086,"rect":41087,"Ġaltru":41088,"Ġwors":41089,"Ġtho":41090,"Ġ349":41091,"clusions":41092,"Ġpseudonym":41093,"Bec":41094,"Ġphosphorus":41095,"ivic":41096,"Ġ348":41097,"otent":41098,"Ġub":41099,"Ġcoales":41100,"regate":41101,"Ġ1870":41102,"Ġglide":41103,"treated":41104,"ĠSymb":41105,"Ġenchant":41106,"Besides":41107,"stocks":41108,"Ġ388":41109,"--------------":41110,"interpret":41111,"ouple":41112,"Ġdrawback":41113,"ĠRevised":41114,"Ġanat":41115,"Ġpsychosis":41116,"ب":41117,"Ġdiffuse":41118,"Ġaffidav":41119,"elve":41120,"amination":41121,"ĠTackle":41122,"hunter":41123,"env":41124,"Ġchests":41125,"Ġsubter":41126,"Ġconquest":41127,"Ġfidelity":41128,"Ġinfringing":41129,"opathic":41130,"ĠGrip":41131,"ĠKeyboard":41132,"Ġobjectionable":41133,"Ġmetabol":41134,"ĠGö":41135,"Room":41136,"...)":41137,"KEN":41138,"assic":41139,"Ġgeop":41140,"Tro":41141,"Ġcursing":41142,"Ġdile":41143,"Ġultraviolet":41144,"inarily":41145,"Ġdistilled":41146,"sect":41147,"ĠShooter":41148,"uckles":41149,"Ġdistortions":41150,"Map":41151,"Doctor":41152,"Ġinstalls":41153,"oire":41154,"Ġstarch":41155,"ociation":41156,"Lev":41157,"Ġscripture":41158,"Ġsalient":41159,"ilitating":41160,"wb":41161,"ĠSov":41162,"ĠDamn":41163,"Grey":41164,"Ġ980":41165,"Ġjung":41166,"Ġlicking":41167,"029":41168,"ĠDian":41169,"ĠBabylon":41170,"к":41171,"ĠRomantic":41172,"Ġguesses":41173,"ĠFren":41174,"Generally":41175,"ultural":41176,"istence":41177,"Ġiniti":41178,"Ġ341":41179,"ĠSlave":41180,"ultan":41181,"ĠTrash":41182,"ĠEmpty":41183,"ĠHundred":41184,"ĠDirective":41185,"Anderson":41186,"Advertisement":41187,"RH":41188,"ĠOo":41189,"ĠHik":41190,"peg":41191,"Sup":41192,"ĠXT":41193,"Ġencrypt":41194,"selage":41195,"ĠThrone":41196,"Ġconsecut":41197,"Li":41198,"ĠVirus":41199,"ĠCookies":41200,"SHIP":41201,"Ġflavorful":41202,"odynamics":41203,"animal":41204,"spread":41205,"ĠIPCC":41206,"jobs":41207,"ernand":41208,"ĠHaunted":41209,"Ġintolerable":41210,"ĠLAR":41211,"ixtape":41212,"Ġneur":41213,"Ġcausal":41214,"ĠPsychiatry":41215,"ĠVim":41216,"Ġgenomic":41217,"duration":41218,"ĠUsername":41219,"ategy":41220,"Ġunic":41221,"ĠKILL":41222,"blooded":41223,"Ġcaucuses":41224,"ĠPOLITICO":41225,"Spanish":41226,"Ġobedience":41227,"Ġinconven":41228,"MAT":41229,"Ġbends":41230,"ĠImprovements":41231,"Ġrelig":41232,"ĠForth":41233,"ĠLumia":41234,"uces":41235,"Ġunim":41236,"ĠStatistical":41237,"kb":41238,"auntlet":41239,"ĠDisco":41240,"ĠInstruction":41241,"ooo":41242,"ĠDictionary":41243,"culated":41244,"Adv":41245,"ĠAvatar":41246,"ictional":41247,"Ġcentr":41248,"ifles":41249,"orks":41250,"skill":41251,"Ġlatex":41252,"ĠPagan":41253,"Ġdevast":41254,"Ġprol":41255,"896":41256,"Product":41257,"968":41258,"Ġfrench":41259,"083":41260,"ĠCluster":41261,"cloth":41262,"ĠFilter":41263,"ĠDisorders":41264,"etimes":41265,"Ġinstinctively":41266,"ĠBritann":41267,"Ġaft":41268,"ĠVict":41269,"Ġâĺħ":41270,"Ġperverse":41271,"Ġcontraceptives":41272,"ĠHannibal":41273,"escap":41274,"ĠApostle":41275,"ĠXiao":41276,"ĠMagnum":41277,"Ġphosphate":41278,"Ġ399":41279,"utable":41280,"Ġsten":41281,"Ġwearer":41282,"Ġsmug":41283,"ĠInfluence":41284,"Ġ384":41285,"Truth":41286,"struction":41287,"Ġmaniac":41288,"ĠMagnetic":41289,"ousands":41290,"Ġsemen":41291,"dir":41292,"ĠTornado":41293,"Ġexplos":41294,"1995":41295,"Xi":41296,"Steel":41297,"057":41298,"Barn":41299,"Fan":41300,"ĠChatt":41301,"Chem":41302,"ĠFold":41303,"bees":41304,"1080":41305,"ĠMaze":41306,"ierre":41307,"oeuv":41308,"Cand":41309,"odium":41310,"mmm":41311,"ereo":41312,"Ġreactionary":41313,"Ġacidic":41314,"ĠRemoval":41315,"Ġnont":41316,"031":41317,"ĠTerminator":41318,"ĠVendor":41319,"enemy":41320,"Ġreconstructed":41321,"ĠGalileo":41322,"Ġtesters":41323,"albeit":41324,"uminium":41325,"Ġrite":41326,"ĠInput":41327,"committee":41328,"Ġjour":41329,"gements":41330,"Ġgerm":41331,"Dick":41332,"ĠRequirements":41333,"omsday":41334,"Î":41335,"ISSION":41336,"Ġmolded":41337,"Ġrye":41338,"Attorney":41339,"population":41340,"Ġrepet":41341,"Sync":41342,"breaks":41343,"Ġbanished":41344,"Ġraspberry":41345,"Ġammo":41346,"Ġorthodox":41347,"Ġwebcam":41348,"ĠAsc":41349,"vl":41350,"1989":41351,"Ġdiscipl":41352,"Ġmoreover":41353,"Ġexplodes":41354,"1960":41355,"Ġpropositions":41356,"Protect":41357,"Ġsexes":41358,"physical":41359,"ĠAthena":41360,"ocent":41361,"ĠGothic":41362,"ĠRacial":41363,"istani":41364,"Ġhelium":41365,"ĠPresumably":41366,"Ġperman":41367,"becue":41368,"ĠHW":41369,"rued":41370,"ĠCNS":41371,"DEP":41372,"ĠManifest":41373,"2500":41374,"ĠMyst":41375,"Economic":41376,"Prot":41377,"Ġledge":41378,"Ġimitate":41379,"ĠTotally":41380,"ĠBeaut":41381,"OIL":41382,"Ġ1440":41383,"Moscow":41384,"ĠSets":41385,"merga":41386,"Ġlesbians":41387,"Walker":41388,"Move":41389,"ĠSOM":41390,"ĠPsy":41391,"strument":41392,"Ġiter":41393,"ĠTosh":41394,"oola":41395,"ĠAntiqu":41396,"ĠShining":41397,"Ġobservational":41398,"VW":41399,"rophe":41400,"034":41401,"Ġcontiguous":41402,"Ġstarve":41403,"sure":41404,"Ġnegate":41405,"Ġmindless":41406,"tf":41407,"Ġdownwards":41408,"046":41409,"riors":41410,"Ġreverted":41411,"ĠAthe":41412,"Bra":41413,"eah":41414,"Rachel":41415,"Hung":41416,"Join":41417,"ĠRaces":41418,"Ġmutant":41419,"Ġuncond":41420,"Ġusability":41421,"NESS":41422,"haust":41423,"036":41424,"Ġobscurity":41425,"Ġimperialism":41426,"Ġemitting":41427,"Ġideologically":41428,"ĠIro":41429,"erva":41430,"ĠIzzy":41431,"ĠLevels":41432,"onym":41433,"ĠConspiracy":41434,"ĠSapphire":41435,"Ul":41436,"Ġhuh":41437,"ochem":41438,"Ġbehaves":41439,"ĠMesh":41440,"Ark":41441,"Ġvec":41442,"ĠActions":41443,"Ġdistinguishing":41444,"ĠTsarnaev":41445,"ĠEndurance":41446,"ederation":41447,"itant":41448,"Ġstreetcar":41449,"041":41450,"ĠAval":41451,"ĠCompanion":41452,"ĠCartoon":41453,"Ġcalculus":41454,"993":41455,"eq":41456,"ĠVanilla":41457,"MAC":41458,"wolves":41459,"fg":41460,"Ġfermentation":41461,"Ġinformants":41462,"Ġsudo":41463,"Ġperipher":41464,"Ġindign":41465,"parts":41466,"detail":41467,"femin":41468,"blade":41469,"Ġinserts":41470,"Ġoffsets":41471,"Ġantidepressants":41472,"Ġphr":41473,"Ġresultant":41474,"biology":41475,"Ġacquies":41476,"UFF":41477,"****************":41478,"ĠPenalty":41479,"Ġrever":41480,"heric":41481,"ĠShadows":41482,"command":41483,"Ġreprint":41484,"089":41485,"empty":41486,"ĠTAG":41487,"stim":41488,"FK":41489,"Ġkins":41490,"uggle":41491,"imura":41492,"wit":41493,"Kill":41494,"Beck":41495,"Ocean":41496,"Ġlabyrinth":41497,"ĠNorse":41498,"IENCE":41499,"Ġ+++":41500,"DoS":41501,"gm":41502,"Ġbarbar":41503,"ĠCeres":41504,"Ġhashing":41505,"eworthy":41506,"Ġrecite":41507,"Ġelectrodes":41508,"Ġconformity":41509,"response":41510,"olate":41511,"Ġ357":41512,"Snap":41513,"Crime":41514,"Ġpointer":41515,"ĠTIT":41516,"Ġdistinctions":41517,"Ġ427":41518,"ĠÙĪ":41519,"abases":41520,"Mars":41521,"ĠSpiritual":41522,"Ġimpuls":41523,"Philadelphia":41524,"1994":41525,"Ġcunning":41526,"Ġfram":41527,"Ġinco":41528,"Ġomnip":41529,"imize":41530,"ervative":41531,"Gy":41532,"Drug":41533,"Ġcarniv":41534,"ĠSailor":41535,"download":41536,"ĠBeetle":41537,"ĠEarthqu":41538,"izontal":41539,"Alan":41540,"Nice":41541,"Prior":41542,"MAG":41543,"Ġautobi":41544,"ĠBrill":41545,"Ġpredominant":41546,"ĠMessiah":41547,"REM":41548,"ĠSlip":41549,"ĠWebs":41550,"ademic":41551,"<":41552,"ĠVessel":41553,"vari":41554,"Code":41555,"Ġbeetle":41556,"projects":41557,"BAT":41558,"Ġpsychotic":41559,"Ġunderside":41560,"Ġrefute":41561,"Considering":41562,"kees":41563,"wd":41564,"priority":41565,"Ġtwentieth":41566,"Ġatheist":41567,"amina":41568,"Ġeuphem":41569,"Ġtripod":41570,"ĠTrayvon":41571,"ĠNON":41572,"2200":41573,"ĠNPC":41574,"ependence":41575,"ĠMHz":41576,"ĠBung":41577,"Ġpane":41578,"Ġaboriginal":41579,"ĠPLUS":41580,"igers":41581,"ĠSexy":41582,"MF":41583,"Chall":41584,"Ay":41585,"ilingual":41586,"adj":41587,"Ġfrown":41588,"successful":41589,"stack":41590,"Ġic":41591,"ĠSeah":41592,"Ġconsequ":41593,"bugs":41594,"ĠScand":41595,"ĠCurve":41596,"Nob":41597,"ĠHoo":41598,"ĠKissinger":41599,"ĠTimeline":41600,"Ġmt":41601,"Description":41602,"YP":41603,"ĠInstallation":41604,"levision":41605,"Ġanthropology":41606,"itzerland":41607,"iaries":41608,"kward":41609,"robat":41610,"Ġcarbohydrate":41611,"Phot":41612,"оÐ":41613,"ĠSQL":41614,"Disc":41615,"Ġdataset":41616,"ynski":41617,"Ġfiat":41618,"ĠDres":41619,"ĠFavor":41620,"ĠHalls":41621,"Alt":41622,"PART":41623,"Spider":41624,"Ġdisabling":41625,"RG":41626,"Ward":41627,"aturation":41628,"Ġwillfully":41629,"Ġlockout":41630,"ĠShutdown":41631,"956":41632,"Ġcommunists":41633,"Against":41634,"Ore":41635,"ĠRik":41636,"ĠASD":41637,"ĠOnion":41638,"Ġparticulars":41639,"Analy":41640,"checked":41641,"selected":41642,"romy":41643,"ĠAkira":41644,"Ġcongr":41645,"Choice":41646,"Ġbos":41647,"organisms":41648,"Ġfrowned":41649,"Tok":41650,"Bir":41651,"ĠScrib":41652,"Ġrealms":41653,"Ġcoercive":41654,"1993":41655,"021":41656,"âĢĵâĢĵ":41657,"athetic":41658,"rior":41659,"Ġfolly":41660,"ĠAMERICA":41661,"Ġcassette":41662,"953":41663,"Ġabsorbs":41664,"043":41665,"quad":41666,"''.":41667,"ĠExtract":41668,"Ġ424":41669,"Whit":41670,"Dun":41671,"Ġexerted":41672,"Ġbrethren":41673,"ĠChronicles":41674,"eric":41675,"Mot":41676,"Ġendings":41677,"piration":41678,"Ġpredetermined":41679,"ĠAirl":41680,"Ġgasp":41681,"Ġ367":41682,"Ġexclaim":41683,"cation":41684,"sort":41685,"idden":41686,"missive":41687,"ع":41688,"oice":41689,"same":41690,"Ott":41691,"Ġscatter":41692,"Flight":41693,"ĠTOD":41694,"Stra":41695,"amia":41696,"IZE":41697,"Ġcompressor":41698,"ixels":41699,"lethal":41700,"ĠExperimental":41701,"Ing":41702,"knife":41703,"Ġvanishing":41704,"ĠRequired":41705,"Stat":41706,"ĠPlex":41707,"spection":41708,"ĠBakr":41709,"Amazing":41710,"Ġbreaths":41711,"rots":41712,"OSP":41713,"Ġ840":41714,"Wars":41715,"OGR":41716,"Ġ372":41717,"ĠKhe":41718,"inous":41719,"lightly":41720,"ĠRounds":41721,"Ġrefinement":41722,"property":41723,"Ġmetaph":41724,"oultry":41725,"istor":41726,"Ġintestine":41727,"eus":41728,"ĠWilhelm":41729,"ĠBane":41730,"emption":41731,"oubtedly":41732,"ĠVirtue":41733,"'),":41734,"Ħ¢":41735,"Ġappar":41736,"ĠTranslation":41737,"Quite":41738,"Ġphysicists":41739,"Ġpriesthood":41740,"Ġallowable":41741,"Saint":41742,"OSED":41743,"bind":41744,"Ġtorches":41745,"osexual":41746,"Cruz":41747,"ertility":41748,"ĠAES":41749,"Ġascended":41750,"Ġmuzzle":41751,"Ġelectors":41752,"ĠKrug":41753,"Ġcc":41754,"classic":41755,"ĠMace":41756,"Å«":41757,"Ġâ̦\"":41758,"ĠTEST":41759,"gomery":41760,"Person":41761,"Ġtranslations":41762,"ĠDys":41763,"ĠConsent":41764,"Ġ361":41765,"alos":41766,"Ġallerg":41767,"ĠWast":41768,"ĠChecks":41769,"cerning":41770,"Ġlizard":41771,"Ġrevolutions":41772,"Ġtether":41773,"Ġminimized":41774,"ĠReverse":41775,"itely":41776,"iguous":41777,"athing":41778,"Flow":41779,"Moving":41780,"Ġ409":41781,"047":41782,"Ġsnug":41783,"Nich":41784,"Ġcartridge":41785,"YL":41786,"Ġforwarding":41787,"umerous":41788,"ĠAbedin":41789,"iolet":41790,"tick":41791,"ĠTransform":41792,"Grant":41793,"Ġsubtitles":41794,"ĠEmin":41795,"ghost":41796,"ĠKurd":41797,"Ġfireball":41798,"compatible":41799,"Ġprojectiles":41800,"amorph":41801,"ĠSatisf":41802,"Ġquirks":41803,"Ġrecept":41804,"spective":41805,"Ġgraphical":41806,"ĠPicard":41807,"ĠAuthent":41808,"ĠSponge":41809,"Army":41810,"ĠLumin":41811,"ĠSOME":41812,"Ġsolitude":41813,"ĠSHOULD":41814,"ĠFasc":41815,"opez":41816,"types":41817,"gallery":41818,"OLOGY":41819,"shake":41820,"Ġ369":41821,"Ġreused":41822,"Ġ378":41823,"Ġexorc":41824,"Ġdocs":41825,"Yu":41826,"ĠGOD":41827,"ocrine":41828,"location":41829,"fif":41830,"Grid":41831,"Ġpowd":41832,"Ġ'[":41833,"Ġposterior":41834,"Thompson":41835,"Table":41836,"oslov":41837,"ĠGoddess":41838,"odon":41839,"ĠSTD":41840,"Ġresponsiveness":41841,"stab":41842,"absolute":41843,"Enough":41844,"ĠEssence":41845,"ĠUpgrade":41846,"hematically":41847,"Subscribe":41848,"alsh":41849,"repl":41850,"Ġselector":41851,"ĠLength":41852,"Ġtemporal":41853,"Tele":41854,"ocalyptic":41855,"ĠDeaths":41856,"rl":41857,"Target":41858,"ĠOrn":41859,"ongh":41860,"Ġ1909":41861,"Quest":41862,"Place":41863,"ĠDisabled":41864,"Ġascending":41865,"giene":41866,"ĠMSI":41867,"ivil":41868,"Ġcaval":41869,"Ġintermitt":41870,"Ġsalts":41871,"Apr":41872,"059":41873,"ĠKeeper":41874,"emis":41875,"ĠEternal":41876,"SER":41877,"estones":41878,"Ġrudimentary":41879,"Ġpooled":41880,"ĠAlright":41881,"Ġdiagrams":41882,"ydia":41883,"Jacob":41884,"Ġarchitectures":41885,"ĠUSPS":41886,"Ġfootnote":41887,"ĠBrav":41888,"ĠLeopard":41889,"Ġvirtuous":41890,"ploma":41891,"ĠHIP":41892,"Ġhorizontally":41893,"olith":41894,"Prop":41895,"ĠApocalypse":41896,"Syria":41897,"ĠShowdown":41898,"constitutional":41899,"Independent":41900,"ĠMiliband":41901,"ĠTracks":41902,"adle":41903,"ĠESL":41904,"ĠFIGHT":41905,"Ġjohn":41906,"é":41907,"benef":41908,"eware":41909,"ĠTABLE":41910,"ĠVeg":41911,"ainers":41912,"Ġresolves":41913,"Warren":41914,"ĠRanked":41915,"possibly":41916,"bian":41917,"simple":41918,"Ġuniformly":41919,"ĠSlash":41920,"otton":41921,"ĠAbsent":41922,"agically":41923,"ĠPieces":41924,"Station":41925,"ĠBeware":41926,"ĠDiscrimination":41927,"Ġponies":41928,"Import":41929,"utory":41930,"ĠParas":41931,"Phoenix":41932,"Lat":41933,"UTC":41934,"push":41935,"astically":41936,"urrent":41937,"untarily":41938,"Ġparanormal":41939,"Ġglanced":41940,"Ġmanifestations":41941,"ĠNeuroscience":41942,"irgin":41943,"ROM":41944,"Ġ($)":41945,"Ġ379":41946,"missing":41947,"Ġmercenaries":41948,"Ġenumer":41949,"ĠShant":41950,"Ws":41951,"wered":41952,"Ġbuffs":41953,"ultane":41954,"ĠRohing":41955,"igger":41956,"Ring":41957,"Ġmanifests":41958,"Fat":41959,"ĠReduced":41960,"ĠMinerva":41961,"uart":41962,"ĠArmory":41963,"orange":41964,"igible":41965,"Ġphysiology":41966,"Ut":41967,"Ġparchment":41968,"ĠFired":41969,"trap":41970,"oggle":41971,"mson":41972,"ĠPoster":41973,"Ġbount":41974,"import":41975,"maximum":41976,"Ġ422":41977,"ĠFemin":41978,"Ġnodding":41979,"Ġinscription":41980,"Results":41981,"GRE":41982,"icative":41983,"Ġcognition":41984,"Ġions":41985,"ĠBite":41986,"Ġneutron":41987,"Ġduplication":41988,"ĠZIP":41989,"ĠQuit":41990,"Ġgrasping":41991,"ĠDaylight":41992,"Ġlayouts":41993,"CLA":41994,"reason":41995,"ĠHuh":41996,"Ġpige":41997,"ĠBomber":41998,"Produ":41999,"Ġgland":42000,"ĠAbsolute":42001,"writ":42002,"Ġmassac":42003,"Ġfixation":42004,"device":42005,"yz":42006,"ĠGOT":42007,"ĠDying":42008,"adjust":42009,"grain":42010,"Ġdeform":42011,"Ġtypew":42012,"Ġdagger":42013,"ĠTuring":42014,"ĠBucc":42015,"Heavy":42016,"Ġcommod":42017,"files":42018,"ogeneous":42019,"roth":42020,"Buff":42021,"Ġbookmark":42022,"porary":42023,"Medical":42024,"Um":42025,"Ġtranslucent":42026,"ĠAnxiety":42027,"ĠCorinthians":42028,"optional":42029,"PUT":42030,"Ġcrucifix":42031,"alloween":42032,"ĠVK":42033,"Ġblu":42034,"ĠCorinth":42035,"Mount":42036,"Ġmembranes":42037,"particip":42038,"Ġextraord":42039,"Ġstimulated":42040,"leneck":42041,"Ġspecifies":42042,"Sin":42043,"lash":42044,"Edited":42045,"Ġfused":42046,"Nin":42047,"ĠBungie":42048,"ĠTooth":42049,"WATCH":42050,"Nav":42051,"Initially":42052,"+)":42053,"ĠAncest":42054,"Ġtransmitter":42055,"ĠVolks":42056,"ezvous":42057,"ĠNirvana":42058,"ĠCald":42059,"font":42060,"Und":42061,"remlin":42062,"ichever":42063,"ĠHeal":42064,"shall":42065,"Ġattribution":42066,"authorized":42067,"ĠINTO":42068,"acteria":42069,"ĠTsu":42070,"ĠPlane":42071,"iphate":42072,"igraph":42073,"chev":42074,"Ġinverse":42075,"ifest":42076,"Players":42077,"!!\"":42078,"ĠContrast":42079,"1984":42080,"Ġsevent":42081,"colour":42082,"ĠRational":42083,"virtual":42084,"Ġfec":42085,"ĠETH":42086,"ĠPru":42087,"Õ":42088,"asma":42089,"Cur":42090,"Ġassigns":42091,"Ġridic":42092,"Todd":42093,"ulton":42094,"ĠDefendant":42095,"opsis":42096,"Ġpercentile":42097,"shr":42098,"wagen":42099,"Ġ368":42100,"SIGN":42101,"Screen":42102,"reprene":42103,"Ġerection":42104,"ĠFreak":42105,"ĠStard":42106,"stained":42107,"Ġcla":42108,"fet":42109,"ramids":42110,"QL":42111,"avorable":42112,"ĠTCP":42113,"nown":42114,"ulence":42115,"similar":42116,"Ġlinkage":42117,"ercise":42118,"Path":42119,"LECT":42120,"ĠCollections":42121,"ĠModule":42122,"Ġcs":42123,"Current":42124,"Ġmono":42125,"ĠAlv":42126,"ĠDude":42127,"Ġhypers":42128,"Ġ2600":42129,"surface":42130,"Ġpredictor":42131,"ĠColomb":42132,"Prof":42133,"anqu":42134,"natal":42135,"Ġadultery":42136,"ĠGenerations":42137,"clerosis":42138,"Ġ371":42139,"Ġenlightenment":42140,"onomic":42141,"Ġsatir":42142,"ĠBasics":42143,"Graham":42144,"ĠRove":42145,"Ġadul":42146,"Shut":42147,"ocious":42148,"Ġhandc":42149,"BW":42150,"ĠCognitive":42151,"visible":42152,"Ġinev":42153,"Ġ978":42154,"ĠSupported":42155,"Ġarrays":42156,"Ġalienation":42157,"Weight":42158,"ĠkWh":42159,"Ġwarped":42160,"Ġ386":42161,"lance":42162,"Ġherpes":42163,"ĠPHP":42164,"Ġclaimant":42165,"uitive":42166,"Ġpussy":42167,"Ġcorpus":42168,"ĠAo":42169,"Qual":42170,"ĠXVI":42171,"requ":42172,"Ġsympt":42173,"mination":42174,"Ġhairy":42175,"ĠBattles":42176,"owntown":42177,"Roberts":42178,"Ġnec":42179,"ablo":42180,"AMD":42181,"internet":42182,"Tar":42183,"direction":42184,"ouston":42185,"ĠGlock":42186,"ĠYanukovych":42187,"ogens":42188,"rogram":42189,"otype":42190,"ĠPt":42191,"tenance":42192,"Ġaromatic":42193,"oxin":42194,"Vert":42195,"Ġsociop":42196,"cible":42197,"Db":42198,"________________":42199,"Third":42200,"ĠShips":42201,"!.":42202,"expensive":42203,"WOR":42204,"primary":42205,"Ġ666":42206,"Ġdecaying":42207,"Ġclustered":42208,"Ġbeetles":42209,"ĠHogwarts":42210,"Ġheaders":42211,"ĠJudah":42212,"Ġscen":42213,"Ġcosmos":42214,"ĠGenetic":42215,"blems":42216,"Ġfeeble":42217,"NOW":42218,"NSA":42219,"Ġadminist":42220,"ĠDocker":42221,"portion":42222,"gression":42223,"Ġ1904":42224,"heard":42225,"Ġinhab":42226,"ĠLeaves":42227,"Ġcortisol":42228,"atinum":42229,"unknown":42230,"ĠObserv":42231,"ĠPhilosophy":42232,"Ide":42233,"Ġcopyrighted":42234,"surv":42235,"ĠLocations":42236,"Ġglands":42237,"ĠKnife":42238,"ĠEmber":42239,"ĠUnicorn":42240,"Ġhaste":42241,"Ġkinderg":42242,"ĠTerrit":42243,"ĠKoran":42244,"Ġaval":42245,"addon":42246,"ĠNero":42247,"\"]":42248,"Ġ392":42249,"comfort":42250,"Ġclothed":42251,"ashtra":42252,"mode":42253,"Ġ??":42254,"!\",":42255,"Ġknob":42256,"EMP":42257,"norm":42258,"ĠAgo":42259,"RECT":42260,"Denver":42261,"Ġ1907":42262,"ĠBombs":42263,"Sche":42264,"Ġtriangular":42265,"Ġperv":42266,"rises":42267,"Jes":42268,"Ġcalibration":42269,"Ġts":42270,"Same":42271,"ĠAxe":42272,"ĠMei":42273,"multi":42274,"Ġexerc":42275,"orney":42276,"Ware":42277,"abul":42278,"ĠFior":42279,"Eventually":42280,"ĠGrizz":42281,"Past":42282,"married":42283,"Ġscram":42284,"ĠCache":42285,"posure":42286,"Ġheav":42287,"ĠShirt":42288,"powder":42289,"complex":42290,"Doc":42291,"arus":42292,"Pi":42293,"Ġcurv":42294,"ĠTopic":42295,"Ġ.)":42296,"Ġwills":42297,"philis":42298,"gui":42299,"leground":42300,"Eth":42301,"Strike":42302,"Kid":42303,"Ġdelegated":42304,"Soon":42305,"Ġwast":42306,"gage":42307,"Ġprosecut":42308,"Ġ374":42309,"opolis":42310,"chest":42311,"ensation":42312,"Ġredes":42313,"Ġpresum":42314,"Portland":42315,"Ġannihil":42316,"yssey":42317,"Ġforks":42318,"Ġvitro":42319,"walker":42320,"ĠPsal":42321,"ĠStealth":42322,"Quick":42323,"ĠBaghd":42324,"ĠDrift":42325,"//":42326,"Ġinvincible":42327,"ĠGAM":42328,"Ġcastles":42329,"Ġbondage":42330,"ĠBalloon":42331,"Amid":42332,"individual":42333,"tis":42334,"ĠGuides":42335,"xe":42336,"Cong":42337,"URI":42338,"ĠHH":42339,"PHOTOS":42340,"ĠASIC":42341,"burst":42342,"ahon":42343,"ĠFIX":42344,"ilib":42345,"Ġ457":42346,"ĠLogged":42347,"à¹":42348,"Creat":42349,"inatory":42350,"column":42351,"ĠAugustus":42352,"suggest":42353,"pret":42354,"ĠParan":42355,"Ġsubsistence":42356,"wx":42357,"×":42358,"aleigh":42359,"dash":42360,"ĠMana":42361,"Ko":42362,"opausal":42363,"Ġbene":42364,"ĠSabb":42365,"ĠGhosts":42366,"Ġ1830":42367,"ĠHats":42368,"ĠHive":42369,"Perfect":42370,"Ġsocialists":42371,"Ġtumult":42372,"EGA":42373,"ĠNAME":42374,"Android":42375,"assembled":42376,"phis":42377,"Stage":42378,"Char":42379,"Double":42380,"Ġinsign":42381,"IED":42382,"perial":42383,"ĠEMP":42384,"mx":42385,"Ġskept":42386,"Ġwifi":42387,"Ġparad":42388,"ĠFrequency":42389,"Dist":42390,"nil":42391,"iots":42392,"å":42393,"Message":42394,"Furthermore":42395,"Ġhideous":42396,"ĠLDL":42397,"ĠFault":42398,"ĠDimensions":42399,"ĠImplement":42400,"fram":42401,"Ġamaz":42402,"ĠIndones":42403,"ĠTile":42404,"Ġlar":42405,"gc":42406,"Ġcorrelate":42407,"Ġensl":42408,"mite":42409,"Ġhomosexuals":42410,"Ġagric":42411,"8000":42412,"Ġcuring":42413,"rament":42414,"Ġrecons":42415,"ocene":42416,"ENTION":42417,"Ġcommunion":42418,"ĠFunction":42419,"iple":42420,"Ġredund":42421,"Ġcalibrated":42422,"Ġcontribut":42423,"ĠHuck":42424,"limit":42425,"ĠFedora":42426,"ĠTsuk":42427,"brates":42428,"Ġ1903":42429,"ozo":42430,"visual":42431,"ĠDiscipline":42432,"chains":42433,"ĠOCD":42434,"Ġexpended":42435,"0002":42436,"Ġsty":42437,"ĠNightmare":42438,"ĠReplace":42439,"ounty":42440,"fn":42441,"1900":42442,"ĠEpidem":42443,"ĠFW":42444,"Ġgul":42445,"ĠTomato":42446,"ĠPerse":42447,"wl":42448,"ĠFormation":42449,"Scan":42450,"cosystem":42451,"Brand":42452,"Ġ398":42453,"Ġcaptives":42454,"Ġ×":42455,"ESCO":42456,"ĠEnder":42457,"lesh":42458,"ĠAscend":42459,"poly":42460,"eous":42461,"Ġhyster":42462,"Murray":42463,"phe":42464,"Ġradiator":42465,"esthes":42466,"Ġopin":42467,"Ġconspic":42468,"intosh":42469,"Ġwitchcraft":42470,"ĠCFR":42471,"ussian":42472,"escent":42473,"locking":42474,"Ġnonsensical":42475,"uala":42476,"ĠSerial":42477,"1991":42478,"ĠCalm":42479,"containing":42480,"Ġstimulates":42481,"Ġ448":42482,"Pir":42483,"ĠâĨĴ":42484,"ĠDiver":42485,"Ġmanuscripts":42486,"ĠGaia":42487,"Ñĥ":42488,"Learning":42489,"Ġnipple":42490,"reads":42491,"Ġandroid":42492,"ĠMeditation":42493,"Ġincomprehensible":42494,"edded":42495,"Ġdescendant":42496,"ĠMorty":42497,"Luckily":42498,"ARCH":42499,"ausible":42500,"Dig":42501,"shared":42502,"ĠClip":42503,"Ġtrope":42504,"Ġnarcissistic":42505,"ventures":42506,"Ġcuriously":42507,"ĠCosmos":42508,"Aust":42509,"Lay":42510,"ĠShard":42511,"ĠRecorded":42512,"Ġ458":42513,"........":42514,"Ġperish":42515,"ĠExample":42516,"luent":42517,"Ġapes":42518,"ĠHitch":42519,"Ġholiest":42520,"Ġamplifier":42521,"minent":42522,"xxxxxxxx":42523,"inite":42524,"Ġgenomes":42525,"ĠGuilty":42526,"mult":42527,"Ġorc":42528,"Ġnipples":42529,"Side":42530,"Ġlogically":42531,"Ġdatasets":42532,"ĠTitanium":42533,"Ġrotor":42534,"undle":42535,"handled":42536,"nexpected":42537,"Ġdw":42538,"Ġdiagonal":42539,"ĠAnimated":42540,"Ġnumbering":42541,"Forest":42542,"ĠâĨ":42543,"Prin":42544,"Ġchemically":42545,"ĠGithub":42546,"Ġaph":42547,"ĠFaster":42548,"ĠTinker":42549,"ikini":42550,"Dest":42551,"dri":42552,"Manufact":42553,"isance":42554,"Return":42555,"Alert":42556,"elcome":42557,"ĠMMR":42558,"Ġresid":42559,"ĠLIC":42560,"Ġspecificity":42561,"zanne":42562,"Ġanyways":42563,"Ġ426":42564,"Scot":42565,"astery":42566,"Via":42567,"ĠBlocks":42568,"Ġactivates":42569,"Ġabstinence":42570,"Ġchronological":42571,"Soul":42572,"ĠSchne":42573,"Ġwatts":42574,"AUT":42575,"Ġcalcul":42576,"Simply":42577,"Emb":42578,"ceptive":42579,"ĠCatholicism":42580,"obook":42581,"ĠBits":42582,"ĠMbps":42583,"Ġindignation":42584,"Ġshorthand":42585,"Active":42586,"ĠLimbaugh":42587,"ĠCapcom":42588,"adesh":42589,"Ġclipping":42590,"ĠInstructor":42591,"Secret":42592,"___":42593,"Fer":42594,"rawling":42595,"ĠReward":42596,"Ġweep":42597,"Ġmotherboard":42598,"Above":42599,"metry":42600,"ĠPTS":42601,"Ġbombard":42602,"abetes":42603,".--":42604,"Lens":42605,"Comb":42606,"basic":42607,"ĠREALLY":42608,"Later":42609,"Ġ383":42610,"Ġpositional":42611,"olesc":42612,"Ġcrotch":42613,"ĠMDMA":42614,"requently":42615,"ĠPants":42616,"Ġ433":42617,"uctor":42618,"Ġillumination":42619,"ĠÙħ":42620,"ocrin":42621,"Ġpamph":42622,"atio":42623,"etc":42624,"Ġrestores":42625,"ĠProtector":42626,"Develop":42627,"ĠMew":42628,"trop":42629,"ĠSlayer":42630,"Ti":42631,"ĠNotwithstanding":42632,"Match":42633,"LIST":42634,"IDES":42635,"ĠThick":42636,"Ġdisks":42637,"Kin":42638,"Ġghetto":42639,"ĠObjects":42640,"Ġprism":42641,"ĠNether":42642,"Ġvul":42643,"iky":42644,"]:":42645,"ĠDetail":42646,"Ġfucked":42647,"!?":42648,"anium":42649,"Ġlords":42650,"ilities":42651,"ĠEthnic":42652,"static":42653,"$$":42654,"evidence":42655,"Ġmainline":42656,"Ġpeasant":42657,"ĠEnhance":42658,"ĠForced":42659,"virt":42660,"Ġii":42661,"Ġsymm":42662,"Ġconverter":42663,"ularity":42664,"Ġrepent":42665,"num":42666,"ĠScrew":42667,"ĠFTA":42668,"Ġmarines":42669,"hetto":42670,"blow":42671,"Ġado":42672,"ĠTypical":42673,"Ġoverw":42674,"ĠBerm":42675,"keley":42676,"Song":42677,"hao":42678,"valid":42679,"EXT":42680,"ĠProvides":42681,"âĺħâĺħ":42682,"ĠOdin":42683,"Shot":42684,"Ġgamma":42685,"Princ":42686,"asonry":42687,"ĠAccuracy":42688,"Ġcriterion":42689,"Ġdescriptive":42690,"Gall":42691,"gray":42692,"ĠCalcul":42693,"Ġaxes":42694,"ĠCommunists":42695,"ĠRebellion":42696,"Success":42697,"tg":42698,"Ġâĺ":42699,"Ġmultiplier":42700,"ravity":42701,"Thus":42702,"URL":42703,"Ġalternatively":42704,"duction":42705,"Ġsarcast":42706,"ĠCarth":42707,"ĠUSL":42708,"ĠInvisible":42709,"larg":42710,"pleted":42711,"pathic":42712,"Additionally":42713,"ĠCao":42714,"Ġlatent":42715,"ĠSurge":42716,"MEN":42717,"communications":42718,"ĠArray":42719,"Pink":42720,"commit":42721,"isodes":42722,"earcher":42723,"Ukraine":42724,"ĠAnthrop":42725,"incial":42726,"Ġquotations":42727,"adena":42728,"Ġwhining":42729,"Ġretri":42730,"ĠAssass":42731,"elligent":42732,"ĠPERSON":42733,"Py":42734,"Send":42735,"ĠâĪĴ":42736,"DON":42737,"Ġwatt":42738,"description":42739,"POS":42740,"Ġrepro":42741,"destroy":42742,"icidal":42743,"Ġmidrange":42744,"Ġinfographic":42745,"interesting":42746,"category":42747,"Flash":42748,"ĠInvasion":42749,"ĠExodus":42750,"restricted":42751,"Ġinference":42752,"dding":42753,"mingham":42754,"Ġcircumst":42755,"Wi":42756,"ĠHast":42757,"Ġsubjug":42758,"Ġwhispering":42759,"-.":42760,"Ġadren":42761,"ĠPattern":42762,"BOX":42763,"ĠEnhancement":42764,"Exc":42765,"ĠBucket":42766,"ĠGUN":42767,"deen":42768,"ĠHomo":42769,"1985":42770,"Ġclo":42771,"Ġsnippet":42772,"Ġ1896":42773,"TPP":42774,"Seg":42775,"success":42776,";\"":42777,"ĠMUCH":42778,"Author":42779,"Ġreplication":42780,"Ġhallucinations":42781,"Inv":42782,"ĠAware":42783,"ĠViper":42784,"kai":42785,"frames":42786,"ĠTHANK":42787,"ĠSHA":42788,"wordpress":42789,"Ġbc":42790,"CIA":42791,"arrison":42792,"Ġalloc":42793,"ĠAlz":42794,"letcher":42795,"ĠDaredevil":42796,"iversary":42797,"Ġmanuals":42798,"Catholic":42799,"feat":42800,"Ġkinetic":42801,"JB":42802,"yeah":42803,"ĠLDS":42804,"Ġppm":42805,"ĠADC":42806,"pring":42807,"cence":42808,"Ġclasp":42809,"Ġsetups":42810,"Ġdeity":42811,"ĠIndra":42812,"ĠWander":42813,"Ġantib":42814,"Otherwise":42815,"ombie":42816,"Bitcoin":42817,"ipop":42818,"expression":42819,"Animal":42820,"ĠResurrection":42821,"ĠMoral":42822,"ĠSDK":42823,"Ġwretched":42824,"ogenous":42825,"species":42826,"Ġchuckled":42827,"Thor":42828,"Ġ428":42829,"avery":42830,"ĠPry":42831,"asures":42832,"ĠErn":42833,"apor":42834,"Ġinnumerable":42835,"Ġbaptized":42836,"ĠExplosive":42837,"Ġelves":42838,"idges":42839,"ĠParadox":42840,"Close":42841,"aldehyde":42842,"construct":42843,"Ġvirginity":42844,"Poll":42845,"assin":42846,"Doctors":42847,"Pos":42848,"NECT":42849,"Moreover":42850,"Commercial":42851,"cknowled":42852,"1988":42853,"Ġquotation":42854,"marriage":42855,"ĠBapt":42856,"ĠSina":42857,"ĠGloves":42858,"gian":42859,"Ġconfounding":42860,"URRENT":42861,"Dean":42862,"Brew":42863,"thur":42864,"pty":42865,"immune":42866,"ĠSQU":42867,"Ġcounterfe":42868,"rider":42869,"Ġinferred":42870,"ĠDimension":42871,"ĠToad":42872,"Ġafterlife":42873,"ĠHERO":42874,"Indiana":42875,"seek":42876,"Ġdistinguishes":42877,"ĠQur":42878,"ĠMethods":42879,"combat":42880,"Ġcateg":42881,"ĠStruggle":42882,"teness":42883,"liquid":42884,"Ġblinking":42885,"ĠCONTIN":42886,"iae":42887,"Ġaerobic":42888,"Ġstrugg":42889,"Ġegalitarian":42890,"hello":42891,"orrect":42892,"ĠAbandon":42893,"Ġferment":42894,"Area":42895,"idem":42896,"ĠMania":42897,"Ġjs":42898,"ĠBALL":42899,"Running":42900,"Ġregenerate":42901,"iquid":42902,"Uh":42903,"Crystal":42904,"ĠItal":42905,"ĠHeavenly":42906,"в":42907,"CRIPTION":42908,"Consumer":42909,"dust":42910,"amiliar":42911,"ĠRhino":42912,"Rocket":42913,"Ġreversible":42914,"kok":42915,"ĠSketch":42916,"Ġshotguns":42917,"apses":42918,"Ġdetach":42919,"ĠCells":42920,"artist":42921,"rily":42922,"ĠRestore":42923,"Scar":42924,"Ġevid":42925,"Ġspaced":42926,"ĠContributions":42927,"Ġ418":42928,"ĠMystic":42929,"Ġobfusc":42930,"Russ":42931,"wings":42932,"Pear":42933,"osite":42934,"Nusra":42935,"urations":42936,"ovie":42937,"icago":42938,"ĠConcepts":42939,"Ġstimuli":42940,"Ġaroused":42941,"aughty":42942,"Talking":42943,"ĠPrompt":42944,"Across":42945,"ĠPlaint":42946,"Ġbranching":42947,"Thankfully":42948,"Original":42949,"Esc":42950,"ĠTechnician":42951,"fleet":42952,"usher":42953,"Mos":42954,"livion":42955,"oenix":42956,"Ġhr":42957,"ibble":42958,"Ġindent":42959,"ĠFinished":42960,"Department":42961,"ĠINFO":42962,"Movie":42963,"++":42964,"THING":42965,"Ġtimers":42966,"rocket":42967,"Natural":42968,"lime":42969,"Ġangular":42970,"osure":42971,"Ġdynamically":42972,"Ġpacif":42973,"ĠProcessor":42974,"Ġdisgu":42975,"Ġmoderators":42976,"Ġceases":42977,"Ġinertia":42978,"Ġpaperback":42979,"yton":42980,"ĠHuma":42981,"Ġprohibitions":42982,"Ġgestation":42983,"Bomb":42984,"termin":42985,"Ġcaric":42986,"oS":42987,"tc":42988,"Cop":42989,"raved":42990,"Ġeighty":42991,"ĠEnable":42992,"Ġimplementations":42993,"Ġconquering":42994,"ĠFinder":42995,"window":42996,"Gra":42997,"Ġfonts":42998,"laughter":42999,"Ġcolonization":43000,"ĠDOD":43001,")!":43002,",)":43003,"ĠGeral":43004,"ĠSpoiler":43005,"ĠComponent":43006,"Ġgist":43007,"hiro":43008,"Ġlicens":43009,"nesses":43010,"Ġkarma":43011,"?\".":43012,"OPA":43013,"Ġsquats":43014,"ĠRAND":43015,"Ġorally":43016,"document":43017,"olars":43018,"Ġpresumptive":43019,"Pers":43020,"OAD":43021,"ufficient":43022,"LESS":43023,"Hidden":43024,"ORK":43025,"xs":43026,"Ġmathematician":43027,"ĠGloss":43028,"Ġannihilation":43029,"Ġmanifold":43030,"Ry":43031,"Thunder":43032,"Yan":43033,"Activ":43034,"Ġworldly":43035,"TED":43036,"marg":43037,"ĠStun":43038,"ryce":43039,"ĠVG":43040,"Isn":43041,"ĠCyn":43042,"Expl":43043,"IRED":43044,"Ġcompr":43045,"Ġindisc":43046,"Boss":43047,"()":43048,"berman":43049,"ĠBegins":43050,"ujah":43051,"ornia":43052,"hetical":43053,"Ġcivilizations":43054,"Ġfundamentalist":43055,"strap":43056,"Forward":43057,"ettlement":43058,"Ġprophetic":43059,"glers":43060,"bending":43061,"Terry":43062,"Ġidi":43063,"Ġtrunc":43064,"Ġcreeps":43065,"intel":43066,"switch":43067,"ailand":43068,"Ġinstaller":43069,"GOP":43070,"Ġ499":43071,"ĠParallel":43072,"Cru":43073,"Ġ\"@":43074,"Ġ396":43075,"ĠUnlock":43076,"Raven":43077,"Corn":43078,"Ġcircadian":43079,"Ġ********************************":43080,"iliate":43081,"ĠFunctional":43082,"Ġpronouns":43083,"ĠSatoshi":43084,"Ġstim":43085,"Gay":43086,"Iss":43087,"ĠThief":43088,"atellite":43089,"Ġshards":43090,"Ġphil":43091,"protein":43092,"Ġalters":43093,"Poor":43094,"Typically":43095,"KER":43096,"ociate":43097,"Ġemits":43098,"recy":43099,"Ġmechanically":43100,"Ġ...\"":43101,"nature":43102,"sys":43103,"ysc":43104,"Ġwavelengths":43105,"pattern":43106,"insured":43107,"Ġparasitic":43108,"ĠLCS":43109,"ĠPACs":43110,"Ġheals":43111,"ĠCCP":43112,"ĠHacker":43113,"Ġpsy":43114,"ĠBeans":43115,"Ġdemonic":43116,"JV":43117,"Ġatmosp":43118,"equality":43119,"Ġairst":43120,"Ġincarn":43121,"ynthesis":43122,"Ġequations":43123,"tch":43124,"ĠHUGE":43125,"ĠChanged":43126,"itatively":43127,"Job":43128,"gaming":43129,"Ġ1899":43130,"ĠMorsi":43131,"Ġconjecture":43132,"riad":43133,"Ġprimates":43134,"ĠArtemis":43135,"ĠThro":43136,"Ġbiologically":43137,"Church":43138,"topia":43139,"recomm":43140,"Ġgradient":43141,"Ġful":43142,"Ġbastard":43143,"CHO":43144,"IUM":43145,"sleep":43146,"Construction":43147,"raints":43148,"vable":43149,"ionage":43150,"Ġcomrade":43151,"Ġpopulate":43152,"Ġnerds":43153,"ĠXie":43154,"result":43155,"ĠImper":43156,"Ġpamphlet":43157,"Ku":43158,"Ġbackend":43159,"ificent":43160,"etus":43161,"Ġdisson":43162,"config":43163,"Ġsuc":43164,"Ġwavelength":43165,"external":43166,"owder":43167,"Ġpredis":43168,"eenth":43169,"Det":43170,"andem":43171,"Ġ1865":43172,"ĠDefeat":43173,"Individual":43174,"Ġretrieving":43175,"stories":43176,"Ġdesolate":43177,"Ġlett":43178,"Ġunpublished":43179,"Ġpassively":43180,"Ġdissertation":43181,"raits":43182,"abee":43183,"ĠResist":43184,"Robin":43185,"Ġbenevolent":43186,"blast":43187,"Offic":43188,"snap":43189,"vernment":43190,"Ġextermin":43191,"wt":43192,"bitious":43193,"hibited":43194,"Insp":43195,"posted":43196,"ĠYugoslav":43197,"rational":43198,"adapt":43199,"ĠAtari":43200,"Ġplugin":43201,"oglobin":43202,"efeated":43203,"ĠHRC":43204,"cko":43205,"ilver":43206,"ĠDestruction":43207,"gewater":43208,"ĠRadiation":43209,"Ġimprison":43210,"origin":43211,"antine":43212,"ĠPublication":43213,"Ġhealer":43214,"istered":43215,"ĠTHEIR":43216,"hazard":43217,"Contract":43218,"Ġmediated":43219,"Ġindexed":43220,"ĠSYSTEM":43221,"Labor":43222,"Blade":43223,"Ġyog":43224,"Champ":43225,"Gordon":43226,"IAS":43227,"Ġnineteenth":43228,"animous":43229,"begin":43230,"ĠHolo":43231,"Planet":43232,"udding":43233,"default":43234,"ĠOMG":43235,"Ġwond":43236,"wm":43237,"pend":43238,"Extreme":43239,"Ġinterstellar":43240,"ASED":43241,"ĠBerks":43242,"Ġprimal":43243,"Foot":43244,"Ġinadvert":43245,"amboo":43246,"ĠLeica":43247,"Events":43248,"ĠPigs":43249,"RAFT":43250,"ï":43251,"ĠGentleman":43252,"Multiple":43253,"ĠPsychiatric":43254,"Ġdespise":43255,"ĠZionism":43256,"ĠSSL":43257,"shit":43258,"Ġthreaded":43259,"Ġartifact":43260,"Ġmitochondrial":43261,"ĠLayer":43262,"inus":43263,"podcast":43264,"Ġawaken":43265,"Management":43266,"Ġdelusions":43267,"grey":43268,"Ġpseud":43269,"agonal":43270,"ĠHirosh":43271,"Georg":43272,"Dragon":43273,"Stack":43274,"ohm":43275,"Ġvener":43276,"Row":43277,"Ġsandbox":43278,"Ġblinding":43279,"razen":43280,"Ġ389":43281,"Ġcrappy":43282,"Ġlith":43283,"antha":43284,"Ġplurality":43285,"ĠDAC":43286,"inently":43287,"intage":43288,"Ġ1902":43289,"ĠDepend":43290,"Ġelapsed":43291,"==":43292,"ĠGenie":43293,"Bush":43294,"ĠPlanetary":43295,"Bah":43296,"ĠKira":43297,"emn":43298,"Month":43299,"allic":43300,"coded":43301,"VOL":43302,"Ġ[...]":43303,"ĠRampage":43304,"Ġ(*":43305,"Production":43306,"licts":43307,"Ġinoc":43308,"Cour":43309,"Ġspurious":43310,"Ġultras":43311,"ggles":43312,"Ġdelusion":43313,"ĠRacer":43314,"ĠPrism":43315,"FH":43316,"uppet":43317,"Ġcultured":43318,"Ġ436":43319,"aneously":43320,"اÙĦ":43321,"ĠMissions":43322,"monton":43323,"criptions":43324,"ificate":43325,"Cause":43326,"Ġ1898":43327,"ocaust":43328,"Ġbri":43329,"ĠShoals":43330,"ommod":43331,"alted":43332,"ogenesis":43333,"warn":43334,"illus":43335,"vv":43336,"Ġcontam":43337,"ĠLesbian":43338,"Ġcavalry":43339,"ĠPresence":43340,"rehens":43341,"tool":43342,"accessible":43343,"Ġ(~":43344,"ĠLicensed":43345,"Ġprophets":43346,"Ġboulder":43347,"mean":43348,"akura":43349,"Ġunres":43350,"ĠCinnamon":43351,"Leaks":43352,"........................":43353,"Contact":43354,"Ġassassins":43355,"ĠGreenwald":43356,"dk":43357,"amazon":43358,"Ġagreeable":43359,"ernandez":43360,"Easy":43361,"PLA":43362,"ĠBigfoot":43363,"Ġconvent":43364,"Ġempires":43365,"Ġ387":43366,"Ġgrasped":43367,"Ġruby":43368,"Ġreconc":43369,"Warning":43370,"atem":43371,"Ġretrieval":43372,"ĠFDR":43373,"ĠReaper":43374,"orem":43375,"ĠLuo":43376,"hig":43377,"ĠArmor":43378,"tp":43379,"ĠInterpret":43380,"Conservative":43381,"ĠSodium":43382,"Ġbead":43383,"Ġpropagate":43384,"claw":43385,"href":43386,"ĠPaste":43387,"Ġomit":43388,"Boost":43389,"Diamond":43390,"goo":43391,"Ġanomal":43392,"ĠDISTRICT":43393,"Greek":43394,"warning":43395,"Ġdespised":43396,"Karl":43397,"AGES":43398,"Ġserotonin":43399,"ESSION":43400,"_______":43401,"ĠCollider":43402,"auldron":43403,"Ġsquee":43404,"Control":43405,"ffield":43406,"cycles":43407,"Legal":43408,"xa":43409,"minimum":43410,"ĠGeneric":43411,"Circ":43412,"·":43413,"Behind":43414,"guide":43415,"Ground":43416,"roying":43417,"ĠGrail":43418,"Ġthee":43419,"Ġ9000":43420,"Batman":43421,"Brother":43422,"Ġnons":43423,"RW":43424,"saf":43425,"ĠCroat":43426,"tainment":43427,"sci":43428,"Ye":43429,"Range":43430,"Ey":43431,"perature":43432,"ĠDracula":43433,"oreal":43434,"Fighting":43435,"Ġreleg":43436,"Ġcoupling":43437,"Tracker":43438,"tyard":43439,"Mut":43440,"Military":43441,"lamm":43442,"ittens":43443,"ĠCRC":43444,"ĠXiang":43445,"Ġorthodoxy":43446,"ĠGoth":43447,"Ġalgorith":43448,"ĠAthen":43449,"Ġtyrann":43450,"ĠTorrent":43451,"IDs":43452,"ĠGENERAL":43453,"ĠASUS":43454,"rastructure":43455,"Faith":43456,"models":43457,"rentices":43458,"ĠCurse":43459,"Ġcalibr":43460,"attled":43461,"monary":43462,"Ġpenet":43463,"aclysm":43464,"album":43465,"Ġremnant":43466,"Ġfung":43467,"itiveness":43468,"thodox":43469,"Ġunlocks":43470,"Ġprobabilities":43471,"Ġster":43472,"Ġscrim":43473,"Ġanalytic":43474,"Urban":43475,"âĢĶâĢĶâĢĶâĢĶ":43476,"Craft":43477,"Ġbrut":43478,"1986":43479,"Section":43480,"raged":43481,"arij":43482,"Hero":43483,"ĠHebdo":43484,"ĠEmpress":43485,"Ġvivo":43486,"ĠPublications":43487,"Ġcannabinoids":43488,"arrett":43489,"Ġbounded":43490,"Ġquests":43491,"Ġomin":43492,"ĠRuler":43493,"ĠYue":43494,"ridges":43495,"Ġpeasants":43496,"ĠAlloy":43497,"Desk":43498,"ULAR":43499,"Ġthor":43500,"ĠOvers":43501,"ĠTome":43502,"mk":43503,"Ġ1050":43504,"Ġshroud":43505,"Ġdistribut":43506,"weapons":43507,"ĠAuthorization":43508,"ĠPoke":43509,"ĠAlternate":43510,"scan":43511,"artisan":43512,"ĠGems":43513,"ĠForums":43514,"atonin":43515,"viron":43516,"Rog":43517,"duct":43518,"Ġtabletop":43519,"crow":43520,"/)":43521,"ĠStainless":43522,"ottest":43523,"Ġreborn":43524,"anchez":43525,"cium":43526,"ĠNicarag":43527,"elfare":43528,"Ġupd":43529,"ritic":43530,"bm":43531,"Ġ608":43532,"ĠSlightly":43533,"ĠDrops":43534,"ISO":43535,"ĠiT":43536,"xiety":43537,"ĠGawker":43538,"omination":43539,"ĠReached":43540,"Student":43541,"Drop":43542,"MET":43543,"ĠKubrick":43544,"1950":43545,"ĠTuls":43546,"Ġcomputed":43547,"depending":43548,"ĠCosmetic":43549,"udget":43550,"Lex":43551,"icut":43552,"ĠDepth":43553,"Ġ1893":43554,"ahah":43555,"Ġath":43556,"fights":43557,"thia":43558,"Ġoccult":43559,"Wheel":43560,"ĠSega":43561,"Ġtheolog":43562,"reement":43563,")--":43564,"Ġunus":43565,"ĠGamma":43566,"Looks":43567,"Ġellipt":43568,"Ġairflow":43569,"ĠHimself":43570,"Ġpagan":43571,"ĠRei":43572,"Ġpilgr":43573,"ĠSubmission":43574,"Region":43575,"Ġinsertion":43576,"Ġsket":43577,"Ġsatisfies":43578,"ĠPixie":43579,"Ġcontempl":43580,"abbit":43581,"ĠReplay":43582,"ĠGalile":43583,"ĠGodzilla":43584,"Ġarithmetic":43585,"iasm":43586,"1987":43587,"ĠFeminist":43588,"Liter":43589,"ĠDisable":43590,"ouble":43591,"essors":43592,"Ġfors":43593,"Ġensu":43594,"Putting":43595,"ĠMSM":43596,"Cond":43597,"emade":43598,"Ġindistinguishable":43599,"Magn":43600,"Ġms":43601,"MAL":43602,"ĠBF":43603,"dm":43604,"iltration":43605,"irection":43606,"ĠSpir":43607,"Gb":43608,"ĠIbn":43609,"Abs":43610,"imens":43611,"RNA":43612,"============":43613,"Ġ655":43614,"ĠConversion":43615,"imilation":43616,"igion":43617,"ĠSomew":43618,"mL":43619,"Border":43620,"Ë":43621,"Factor":43622,"Number":43623,"Ġejac":43624,"Cho":43625,"Ġrighteousness":43626,"ĠPATH":43627,"ĠElys":43628,"ouched":43629,"Ġmultic":43630,"Ġfaculties":43631,"ĠEarthquake":43632,"ĠReferences":43633,"ensitive":43634,"Ġimpat":43635,"Ġ................":43636,"buff":43637,"Ġ1895":43638,"colo":43639,"Vi":43640,"Ġubiqu":43641,"ĠChev":43642,"Fish":43643,"ĠBlueprint":43644,"CHQ":43645,"Ġlinem":43646,"ĠFlavor":43647,"Ġcrimson":43648,"ĠAbstract":43649,"arette":43650,"plete":43651,"ranean":43652,"Dash":43653,"Ġdimensional":43654,"Cub":43655,"ttle":43656,"ĠDSM":43657,"Ġinstantaneous":43658,"esy":43659,"Ġepoch":43660,"Brit":43661,"ĠÎ":43662,"ECD":43663,"Ġwarp":43664,"obyl":43665,"ubric":43666,"Ġutilitarian":43667,"Ġsummarizes":43668,"letal":43669,"Ord":43670,"opath":43671,"tained":43672,"ghai":43673,"Ġwhis":43674,"insert":43675,"Ġphon":43676,"rils":43677,"Ġearthly":43678,"ĠAlic":43679,"ĠPCIe":43680,"Ġfurthermore":43681,"ocard":43682,"Ġuter":43683,"ĠAdmin":43684,"ographics":43685,"ĠConstantin":43686,"gravity":43687,"iPhone":43688,"Ġwasteland":43689,"Ġfps":43690,"Tip":43691,"Ġmurm":43692,"paces":43693,"ĠSamurai":43694,"ĠFOIA":43695,"ĠRadiant":43696,"ĠUnreal":43697,"Ġmicrow":43698,"usterity":43699,"zyme":43700,"itbart":43701,"metadata":43702,"Dat":43703,"ĠMoons":43704,"ĠProtestants":43705,"ungle":43706,"Ġvideog":43707,"pid":43708,"Ġdisple":43709,"aucus":43710,"Ġcoils":43711,"ĠDwar":43712,"fixed":43713,"Alice":43714,"Ġgarrison":43715,"ĠVelocity":43716,"ĠJehovah":43717,"Ġfascists":43718,"ĠCHO":43719,"jl":43720,"Ġmetaphors":43721,"ĠSiege":43722,"scientific":43723,"Ä«":43724,"Slow":43725,"hex":43726,"ĠBlaz":43727,"mediated":43728,"esthesia":43729,"ĠAvg":43730,"Ġbelie":43731,"Carter":43732,"Ġexposition":43733,"azeera":43734,"dial":43735,"Ġbask":43736,"Scale":43737,"Ġdisob":43738,"Ġgore":43739,"Ġhypocr":43740,"Ġphantom":43741,"ĠSynd":43742,"BLIC":43743,"pter":43744,"ĠScorpion":43745,"eor":43746,"ĠRecover":43747,"Ġsummoning":43748,"Ġorb":43749,"jump":43750,"Ġ768":43751,"ĠEnix":43752,"Spons":43753,",...":43754,"Wide":43755,"Ġparse":43756,"Ġdebtor":43757,"Ġpathological":43758,"Ġserpent":43759,"ĠFranç":43760,"reetings":43761,"Ġdeletion":43762,"Ġvolunt":43763,"ĠNotification":43764,"liga":43765,"Disk":43766,"Account":43767,"1979":43768,"Ġsymmetry":43769,"ĠBearing":43770,"ĠABV":43771,"ĠORDER":43772,"rpm":43773,"ĠFuck":43774,"?!\"":43775,"mask":43776,"Grade":43777,"neath":43778,"ocom":43779,"Detect":43780,"ryption":43781,"ĠAura":43782,"Ġinert":43783,"PLAY":43784,"gres":43785,"INTON":43786,"Deal":43787,"fficient":43788,"ĠVoid":43789,"gement":43790,"Ġscorp":43791,"Ġreincarn":43792,"ĠVapor":43793,"Ġ1840":43794,"Yellow":43795,"......":43796,"Ġparameter":43797,"ĠDISTR":43798,"ĠForgotten":43799,"Eat":43800,"izational":43801,"Witness":43802,"ĠDupl":43803,"Ġdogma":43804,"Ġzipper":43805,"ĠZeus":43806,"mage":43807,"ormal":43808,"Ġ\".":43809,"Ġecc":43810,"ĠSlot":43811,"ĠRegist":43812,"Others":43813,"VID":43814,"Windows":43815,"Ġshitty":43816,"ĠLethal":43817,"Monster":43818,"ĠExpression":43819,"tx":43820,"ythm":43821,"Were":43822,"ivalry":43823,"atcher":43824,"ĠFormat":43825,"ĠPlasma":43826,"Phys":43827,"laugh":43828,"Fu":43829,"java":43830,"roma":43831,"ĠIncreases":43832,"Ġlicensee":43833,"Ġmystic":43834,"Ġproto":43835,"ĠLoki":43836,"forcing":43837,"hots":43838,"Ġ->":43839,"Outside":43840,"ĠEndless":43841,"Ġachie":43842,"ĠTurtles":43843,"Ġconvin":43844,"JUST":43845,"Ġimmobil":43846,"ĠCauses":43847,"Ġclich":43848,"xes":43849,"ffiti":43850,"Ġhypot":43851,"Bat":43852,"Ġbigot":43853,"Personal":43854,"ĠPharmac":43855,"Lot":43856,"VERT":43857,"Ġbapt":43858,"idelines":43859,"Ġprox":43860,"MAP":43861,"Spirit":43862,"ĠSlug":43863,"Ġebook":43864,"eches":43865,"ĠAndromeda":43866,"Ġceremon":43867,"1975":43868,"PRE":43869,"Ġasshole":43870,"linear":43871,"Nevertheless":43872,"Ġwillpower":43873,"azel":43874,"Fif":43875,"andise":43876,"Ġextravag":43877,"ĠBuffy":43878,"Ġcorrelations":43879,"ptr":43880,"Progress":43881,"shape":43882,"ĠSymbol":43883,"arag":43884,"ĠContext":43885,"ucer":43886,"1983":43887,"ĠMyster":43888,"Pain":43889,"Login":43890,"mbol":43891,"codes":43892,"RANT":43893,"Ġoverse":43894,"opot":43895,"STEM":43896,"enser":43897,"ĠCosmic":43898,"Spl":43899,"ritional":43900,"ĠPharaoh":43901,"ĠRemix":43902,"xon":43903,"ĠXII":43904,"Ġunman":43905,"Ġimmedi":43906,"Ġmonog":43907,"ĠLX":43908,"Ġabstraction":43909,"ocolate":43910,"ĠDonkey":43911,"Ġ!!":43912,"ĠLIA":43913,"shed":43914,"rules":43915,"Ġcalc":43916,"ĠAutob":43917,"anmar":43918,"eworks":43919,"notations":43920,"Ġtenancy":43921,"ĠPetraeus":43922,"dp":43923,"amphetamine":43924,"ĠCortex":43925,"rw":43926,"Ġprojectile":43927,"Ġintrinsically":43928,"Route":43929,"Ġnegoti":43930,"anuts":43931,"Analysis":43932,"redits":43933,"ĠGG":43934,"thread":43935,"ĠChosen":43936,"Years":43937,"otyp":43938,"ĠNCT":43939,"udic":43940,"ochemical":43941,"Neigh":43942,"Ġfishes":43943,"ĠFloat":43944,"Print":43945,"okia":43946,"Ġbarb":43947,"quote":43948,"Lew":43949,"Ġannoun":43950,"istors":43951,"Reading":43952,"ACTION":43953,"Ġintakes":43954,"ĠBeet":43955,"matter":43956,"Swe":43957,"Ther":43958,"Ġtyrant":43959,"ĠPsycho":43960,"ĠDestroy":43961,"Ġesoteric":43962,"Ġbiom":43963,"idious":43964,"Merc":43965,"hran":43966,"ĠBaal":43967,"seconds":43968,"Ġsuperhuman":43969,"ancel":43970,"Ġworshipped":43971,"Ġwebs":43972,"Ġviolet":43973,"ĠMetallic":43974,"eday":43975,"ordering":43976,"Nut":43977,"Ġconstructs":43978,"olescent":43979,"Unit":43980,"otypes":43981,"Ġembryonic":43982,"perm":43983,"Nature":43984,"ĠDecre":43985,"levant":43986,"Ġss":43987,"+(":43988,"ĠDoctrine":43989,"puters":43990,"Ġsaline":43991,"orsche":43992,"1111":43993,"values":43994,"Ġutopian":43995,"ĠBooster":43996,"Technical":43997,"ì":43998,"ĠLIMITED":43999,"nir":44000,"Ġclones":44001,"Performance":44002,"aple":44003,"Ġshudder":44004,"Ġcontempor":44005,"lator":44006,"ĠOops":44007,"Ġammon":44008,"Ġdavid":44009,"Ġbom":44010,"bish":44011,"Ġdetectable":44012,"Ġmultiplying":44013,"Ġreddit":44014,"Prim":44015,"Ġmedial":44016,"Ġsubstrate":44017,"ĠSanskrit":44018,"Spect":44019,"ĠMagical":44020,"Ġarcane":44021,"align":44022,"Ġ1861":44023,"Ġneocons":44024,"Ì":44025,"ĠBounty":44026,"ĠContinent":44027,"Ġhurd":44028,"alions":44029,"Ġgeneralized":44030,"ĠInsect":44031,"Ġsimul":44032,"actual":44033,"advert":44034,"ukong":44035,"Resp":44036,"ĠWarcraft":44037,"Hunter":44038,"hyper":44039,"ĠBreach":44040,"ught":44041,"Ġcomputation":44042,"react":44043,"Feel":44044,"ĠCheong":44045,"Ġslut":44046,"Ġgalactic":44047,"Ġtaunt":44048,"Enjoy":44049,"Ġreprinted":44050,"Word":44051,"ĠHandbook":44052,"amins":44053,"exit":44054,"Wo":44055,"Ġadherents":44056,"Counter":44057,"ĠNode":44058,"ĠTwisted":44059,"Ġgrinned":44060,"universal":44061,"ĠAmon":44062,"Ġaster":44063,"ĠEquip":44064,"!\".":44065,"Ġanalogous":44066,"rients":44067,"alky":44068,"ĠQian":44069,"Ġspont":44070,"docs":44071,"Ġcontemplation":44072,"Ġrevolutionaries":44073,"Ġpreset":44074,"ĠAmendments":44075,"Ġexecutes":44076,"ĠDuration":44077,"Ġcompulsion":44078,"Ġstagger":44079,"ynamic":44080,"blem":44081,"];":44082,"Higher":44083,"Balt":44084,"heast":44085,"Ġcorp":44086,"awei":44087,"Motion":44088,"Mis":44089,"Ġadventurer":44090,"eger":44091,"Ġarsen":44092,"ĠVoltage":44093,"ĠEVENTS":44094,"Salt":44095,"issance":44096,"DK":44097,"Ship":44098,"Ġunwitting":44099,"Ton":44100,"ĠPROGRAM":44101,"Ġtentacles":44102,"erness":44103,"thirst":44104,"Fig":44105,"fty":44106,"ĠTolkien":44107,"Sleep":44108,"ĠExplain":44109,"Pub":44110,"ĠBounce":44111,"ĠDemo":44112,"Ġ1897":44113,"ĠSPI":44114,"intern":44115,"********":44116,"ĠKills":44117,"ĠZombies":44118,"Single":44119,"ratom":44120,"ĠClaw":44121,"hid":44122,"asel":44123,"Shock":44124,"erential":44125,"Ġupgr":44126,"holy":44127,"Ġ\\":44128,"aghetti":44129,"Ġthence":44130,"genic":44131,"papers":44132,"1982":44133,"ravel":44134,"ĠUNIVERS":44135,"Charge":44136,"ĠDelay":44137,"ibrary":44138,"ĠHDD":44139,"olson":44140,"Ġenchanted":44141,"Wr":44142,"graph":44143,"Ġcorro":44144,"ept":44145,"etsu":44146,"ĠQin":44147,"Û":44148,"Ġantidepressant":44149,"ĠCerberus":44150,"Ġappe":44151,"ĠDEFENSE":44152,"Ġdysph":44153,"split":44154,"zilla":44155,"attr":44156,"Clar":44157,"Äĵ":44158,"hov":44159,"IRC":44160,"hibition":44161,"'/":44162,"ĠURLs":44163,"Draft":44164,"Prep":44165,"ĠLanguages":44166,"ĠTravels":44167,"ceiver":44168,"aturally":44169,"pair":44170,"ĠALWAYS":44171,"aaaa":44172,"ĠTenth":44173,"ĠNAD":44174,"Serv":44175,"ĠUID":44176,"cens":44177,"ĠLearned":44178,"Ġtraject":44179,"Ġmoaning":44180,"ĠNare":44181,"Ġingen":44182,"Ġsurn":44183,"Ġfloppy":44184,"breeding":44185,"uph":44186,"rossover":44187,"Understanding":44188,"Glass":44189,"Ġruntime":44190,"gp":44191,"Ġâľĵ":44192,"Ġcyt":44193,"bley":44194,"agall":44195,"Ġunworthy":44196,"otine":44197,"Ġchromosome":44198,"utters":44199,"Ġµ":44200,"Ġexpans":44201,"Ġdement":44202,"Ġinsurrection":44203,"Ġsurviv":44204,"genre":44205,"ospital":44206,"ĠPlato":44207,"ĠTrigger":44208,"selection":44209,"ilege":44210,"Ġsegreg":44211,"itizens":44212,"ĠRAID":44213,"Pure":44214,"hetti":44215,"ĠFailed":44216,"ĠCharacters":44217,"ĠCreep":44218,"akra":44219,"Ec":44220,"ĠAristotle":44221,"Lim":44222,"error":44223,"yrus":44224,"umably":44225,">>":44226,"Ġtsun":44227,"knowledge":44228,"Cert":44229,"bable":44230,"hesion":44231,"ĠProcedures":44232,"Ġmarkup":44233,"ideo":44234,"Ġrhet":44235,"ĠChapters":44236,"ĠChecking":44237,"mega":44238,"Ġphotons":44239,"required":44240,"Unknown":44241,"ĠDrawn":44242,"Ġvari":44243,"EEK":44244,"Ġcompuls":44245,"Ġcloning":44246,"ccoli":44247,"Ġ1070":44248,"Ġkindred":44249,"Ġdiscl":44250,"ĠCind":44251,"Collect":44252,"Ġchromosomes":44253,"phant":44254,"ĠKafka":44255,"Ġeverlasting":44256,"Ġmercenary":44257,"ĠHmm":44258,"----":44259,"riber":44260,"Ġdoubtless":44261,"Ġsusceptibility":44262,"beta":44263,"notice":44264,"Ġcrochet":44265,"Ġrespir":44266,"Ġphilosophers":44267,"ĠExtras":44268,"Ġseparat":44269,"shown":44270,"iblings":44271,"Hispanic":44272,"copy":44273,"Tang":44274,"Knight":44275,"Ġpursu":44276,"ĠAnime":44277,"Ġlipid":44278,"ggies":44279,"levels":44280,"phalt":44281,"ĠCompleted":44282,"bral":44283,"Ġcerv":44284,"ĠAfric":44285,"ĠPhar":44286,"Color":44287,"ogene":44288,"ĠCompan":44289,"memory":44290,"Dust":44291,"ĠXIV":44292,"ĠConsole":44293,"').":44294,"Ġ1888":44295,"byn":44296,"Ġpolygamy":44297,"Auth":44298,"BUT":44299,"istine":44300,"Ġsacr":44301,"Ġabsor":44302,"ijah":44303,"ĠNeural":44304,"olester":44305,"ql":44306,"Already":44307,"Creating":44308,"ĠStarg":44309,"ĠPhilos":44310,"Consider":44311,"Ġrepositories":44312,"cludes":44313,"ĠBuffer":44314,"ĠPerspect":44315,"Ġcomput":44316,"Stew":44317,"iamond":44318,"ĠJudgment":44319,"OVA":44320,"angible":44321,"Ġoxid":44322,"Ġepigen":44323,"Ġsidel":44324,"ĠEag":44325,"devices":44326,"icone":44327,"1920":44328,"atism":44329,"beard":44330,"ĠGujar":44331,"ĠPlaystation":44332,"Ġglances":44333,"ĠCOMPLE":44334,"VERTIS":44335,"ukemia":44336,"Edit":44337,"Tickets":44338,"Square":44339,"ĠSerpent":44340,"Ġtransporter":44341,"MQ":44342,"ĠMongo":44343,"1967":44344,"ibaba":44345,"Ġtimet":44346,"sylvania":44347,"Latin":44348,"osaurs":44349,"Ġhumanoid":44350,"Ġcannabinoid":44351,"Ġdisciple":44352,"Psych":44353,"Ġimpro":44354,"Ġmc":44355,"Raid":44356,"Letter":44357,"ificant":44358,"ĠPortug":44359,"ĠFreem":44360,"Ġappell":44361,"ĠMushroom":44362,"Ġclans":44363,"Ġsinful":44364,"Ġingestion":44365,"ĠDirectory":44366,"abetic":44367,"Ġantigen":44368,"Ġimagin":44369,"mitter":44370,"!!!!!":44371,"ĠDPR":44372,"leness":44373,"\":\"\",\"":44374,"ĠAUTHOR":44375,"Ġgrunt":44376,"Ġflickering":44377,"Cath":44378,"asury":44379,"Ġnozzle":44380,"Secure":44381,"Stre":44382,"ĠBIT":44383,"Ġdeviations":44384,"Professor":44385,"bilt":44386,"ĠConscious":44387,"Ġinterrupts":44388,"ĠMormons":44389,"ĠCutter":44390,"Bed":44391,"ipient":44392,"ĠGhostbusters":44393,"Cart":44394,"endas":44395,"ĠExecution":44396,"ycle":44397,"Ġwedd":44398,"Sold":44399,"Ġvanquished":44400,"Regarding":44401,"Depending":44402,"']":44403,"atron":44404,"oidal":44405,"Cube":44406,"Studio":44407,":/":44408,"ĠExplosion":44409,"activate":44410,"pport":44411,"fuck":44412,"Whe":44413,"Ġsmir":44414,"Ġwidgets":44415,"urses":44416,"izard":44417,")*":44418,"icho":44419,"ĠVersus":44420,"ĠIntroduced":44421,"osaurus":44422,"1977":44423,"forum":44424,"Gray":44425,"Program":44426,"righteous":44427,"endum":44428,"ĠScare":44429,"Ġresists":44430,"*)":44431,"ĠCombo":44432,"Ġsockets":44433,"Ġaston":44434,"LAB":44435,"Ġmutated":44436,"eworld":44437,"DEF":44438,"Trend":44439,"âĢĶ-":44440,"Ġpropagation":44441,"Ġemancipation":44442,"collection":44443,"ĠDifferences":44444,"Tweet":44445,"Ġmajesty":44446,")...":44447,"sylv":44448,"Ġadapters":44449,"Ġmilliseconds":44450,"Jews":44451,"ĠPatreon":44452,"phasis":44453,"ĠHTTP":44454,"onnaissance":44455,"ENDED":44456,"ĠIntro":44457,"qs":44458,"Ġsuperflu":44459,"*.":44460,"Ġminions":44461,"ĠStupid":44462,"Ġspecialization":44463,"ĠPikachu":44464,"Ġappellant":44465,"Training":44466,"circle":44467,"Interest":44468,"Ġfallacy":44469,"ĠDinosaur":44470,"ĠTHEM":44471,"Ġdirectories":44472,"Ġmasturbation":44473,"ĠStain":44474,"1978":44475,"odied":44476,"Ġexqu":44477,"ĠRats":44478,"swick":44479,"Ġemptiness":44480,"ĠXeon":44481,"Ġthereto":44482,"ĠEngels":44483,"ĠSupplement":44484,"Chan":44485,"Ġundead":44486,"ĠNoct":44487,"erest":44488,"ĠQuery":44489,"ĠSOLD":44490,"thritis":44491,"ĠEncounter":44492,"Ġvectors":44493,"Econom":44494,"Rogue":44495,"Ġgelatin":44496,"Rot":44497,"Flickr":44498,"Ġcaching":44499,"Ġloader":44500,"ĠELE":44501,"Ġcamoufl":44502,"Commission":44503,"Ġ1886":44504,"Ġcombos":44505,"ĠAwakening":44506,"Ġfeudal":44507,"Ġasses":44508,"ASY":44509,"atalie":44510,"Ġpanties":44511,"ĠMono":44512,"selves":44513,"Download":44514,"Ġvampires":44515,"------":44516,"ishop":44517,"User":44518,"Ġimperialist":44519,"ĠGOODMAN":44520,"1973":44521,"Vel":44522,"Struct":44523,"ĠUFOs":44524,"drivers":44525,"ĠOptional":44526,"uably":44527,"ĠPrinciple":44528,"verett":44529,"taining":44530,"Ġ1889":44531,"ĠCommunism":44532,"auder":44533,"Keys":44534,"lore":44535,"ĠMedieval":44536,"Hyd":44537,"weapon":44538,"Register":44539,"ĠHighlander":44540,"ĠRFC":44541,"Demon":44542,"ardless":44543,"ĠOrche":44544,"Kick":44545,"pixel":44546,"address":44547,"OUP":44548,"Brain":44549,"ĠMorph":44550,"bash":44551,"ĠANG":44552,"ĠIdle":44553,"ĠLucifer":44554,"Ġcorrelates":44555,"Ġgazed":44556,"colm":44557,"ĠKard":44558,"Solar":44559,"ĠVariable":44560,"ĠPACK":44561,"Ġfuzz":44562,"Ġanonym":44563,"ĠECO":44564,"feature":44565,"ĠEsports":44566,"ĠAnthropology":44567,"cise":44568,"manac":44569,"ĠSupports":44570,"rists":44571,"Quant":44572,"istical":44573,"çļĦ":44574,"Ġdexterity":44575,"monster":44576,"ordial":44577,"Mob":44578,"DEC":44579,"ĠConj":44580,"entric":44581,"1981":44582,"ECTION":44583,"ietal":44584,"ĠUses":44585,"ĠArmageddon":44586,"ĠCapitalism":44587,"Ub":44588,"iazep":44589,"helps":44590,"ouls":44591,"grim":44592,"ĠEthiop":44593,"tesy":44594,"Ġclipboard":44595,"Ġchimpanzees":44596,"PLIC":44597,"Sexual":44598,"wallet":44599,"ĠRect":44600,"ocytes":44601,"ĠHels":44602,"lace":44603,"Damn":44604,"Ġblasp":44605,"ildo":44606,"ĠRober":44607,"APD":44608,"ĠWCS":44609,"ippery":44610,"ellectual":44611,"Ġ$(":44612,"Ġuniverses":44613,"Ġholster":44614,"Ġshading":44615,"Ġinflic":44616,"else":44617,"ĠShiny":44618,"ĠAVG":44619,"Lower":44620,"ĠMayhem":44621,"Originally":44622,"Crypt":44623,"SHARE":44624,"ĠBeir":44625,"!:":44626,"Ġrepentance":44627,"WHAT":44628,".......":44629,"Ġauditory":44630,"aaa":44631,"ĠLoot":44632,"ciples":44633,"Ġcontem":44634,"Ġphoton":44635,"æľ":44636,"omach":44637,"ĠWhedon":44638,"ĠValid":44639,"asonable":44640,"pha":44641,"assad":44642,"ĠPse":44643,"Heat":44644,"Ġplugins":44645,"Ġclenched":44646,"ĠAmeric":44647,"transform":44648,"ĠEnh":44649,"agnetic":44650,"usalem":44651,"sych":44652,"Wed":44653,"replace":44654,"ĠKinect":44655,"shield":44656,"Sax":44657,"ividually":44658,"Ġfunctionally":44659,"Ġ:)":44660,"typically":44661,"Opening":44662,"Fa":44663,"ĠSELECT":44664,"Ġsamurai":44665,"Ġhorde":44666,"entle":44667,"sth":44668,"Changes":44669,"Pin":44670,"ithing":44671,"illance":44672,"ĠEmblem":44673,"ĠMicha":44674,"crypt":44675,"ĠObjective":44676,"ophys":44677,"Ġavg":44678,"poon":44679,"Ġreadable":44680,"ĠRx":44681,"allel":44682,"Sit":44683,"gom":44684,"ureau":44685,"ĠDoodle":44686,"Ġdungeon":44687,"($":44688,"Nintendo":44689,"\"],\"":44690,"Notes":44691,"Grab":44692,"Prosecutors":44693,"Advanced":44694,"Ġ1862":44695,"ĠVeter":44696,"Ġjurisd":44697,"ĠLauncher":44698,"Catal":44699,"udder":44700,"Ġresidues":44701,"Ġregress":44702,"ĠConquer":44703,"osal":44704,"ĠDice":44705,"************":44706,"braska":44707,"ipolar":44708,"Ġathe":44709,"bringing":44710,"Suddenly":44711,"ĠIEEE":44712,"verbs":44713,"Ġdelet":44714,"ipeg":44715,"Previous":44716,"]\"":44717,"Ġsidebar":44718,"illac":44719,"Property":44720,"α":44721,"REP":44722,"Ġauthenticated":44723,"gypt":44724,"uilding":44725,"ĠGing":44726,"Ġwart":44727,"Birth":44728,"Ġobedient":44729,"ĠXuan":44730,"ĠTYPE":44731,"Ġinhibits":44732,"1972":44733,"humans":44734,"IENT":44735,"Ġyoutube":44736,"Shortly":44737,"ophen":44738,"ĠWinc":44739,"ĠWrit":44740,"AUD":44741,"ĠHobbit":44742,"emphasis":44743,"ĠWonders":44744,"Ġtwitch":44745,"ĠProphe":44746,"Berry":44747,"ĠGinny":44748,"ĠBurst":44749,"ĠGenerator":44750,"Ġepile":44751,"ĠBalanced":44752,"GPU":44753,"maps":44754,"Ġneurotrans":44755,"ĠIRC":44756,"Ġ\"$":44757,"Create":44758,"Particip":44759,"ĠMarxism":44760,"Ġthou":44761,"ĠMortal":44762,"Ġ�":44763,"Ġninja":44764,"inburgh":44765,"Ġappro":44766,"ĠPistol":44767,"Jar":44768,"Ġprophes":44769,"classes":44770,"Ġanarchist":44771,"Ġextant":44772,"message":44773,"itaire":44774,"Ġ1863":44775,"ĠProl":44776,"Ġpropell":44777,"Ġimpossibility":44778,"Ġpropos":44779,"itamin":44780,"Rating":44781,"olphin":44782,"Ġmitochond":44783,"versions":44784,"Liberal":44785,"ishy":44786,"Ġspherical":44787,"ĠSurvive":44788,"FREE":44789,"rawler":44790,"Metal":44791,"ĠStarship":44792,"Ġ=================================================================":44793,"ĠDharma":44794,"ĠSeller":44795,"Ġwrapper":44796,"Experience":44797,"Integ":44798,"Customer":44799,"hammad":44800,"Ġunanim":44801,"Jenn":44802,"Ġschizophren":44803,"agree":44804,"ĠEVENT":44805,"Shell":44806,"Ġfractions":44807,"1968":44808,"Ġextermination":44809,"ĠSniper":44810,"Ġpronoun":44811,"ĠHitman":44812,"xp":44813,"resource":44814,"WIND":44815,"Ġhierarchical":44816,"Ġted":44817,"Changing":44818,"Ġplaus":44819,"Transform":44820,"Ġbicy":44821,"imentary":44822,"Fuck":44823,"Mini":44824,"Ġoverc":44825,"ĠOptimus":44826,"outer":44827,"helial":44828,"akening":44829,"fx":44830,"Ġnig":44831,"Ġ+/-":44832,"ĠVICE":44833,"Ġnm":44834,"1976":44835,"ĠRitual":44836,"ĠTyrann":44837,"Ġscriptures":44838,"inical":44839,"ĠNull":44840,"ourgeois":44841,"dra":44842,"Ġpious":44843,"Ġneuron":44844,"Ġcolonists":44845,"ĠNebula":44846,"apply":44847,"Sah":44848,"Marx":44849,"Ġhypotheses":44850,"notation":44851,"acists":44852,"Math":44853,"Manager":44854,"Library":44855,"audi":44856,"Ġmp":44857,"ergic":44858,"Ġwizards":44859,"fw":44860,"DVD":44861,"ĠScala":44862,"Different":44863,"ampoo":44864,"ĠDread":44865,"abbage":44866,"Rus":44867,"ĠDumbledore":44868,"keleton":44869,"elsh":44870,"esian":44871,"ĠCorsair":44872,"Tier":44873,"ĠCelest":44874,"Ġnoun":44875,"Ġlucid":44876,"requisites":44877,"Ġgenus":44878,"Event":44879,"1974":44880,"ĠSatanic":44881,"iox":44882,"ĠHandle":44883,"ĠDestroyer":44884,"Ġinvocation":44885,"ĠXD":44886,"modified":44887,"Gam":44888,"ĠRPC":44889,"Ġsubsystem":44890,"Compared":44891,"odan":44892,"ĠPassive":44893,"ĠHelmet":44894,"nutrition":44895,"riction":44896,"HOW":44897,"Jess":44898,"Ġpiston":44899,"imately":44900,"Ġhypoc":44901,"ĠCelestial":44902,"MRI":44903,"Ġcompiler":44904,"ĠBadge":44905,"ĠRevelation":44906,"Ġintrig":44907,"Grad":44908,"ĠSPACE":44909,"Poly":44910,"ĠVul":44911,"Ġtrembling":44912,"Ġindepend":44913,"doctor":44914,"Certain":44915,"emet":44916,"Password":44917,"Ġgasped":44918,"Ġpronunciation":44919,"Fuel":44920,"ĠSPEC":44921,"assets":44922,"Extra":44923,"Ġformatting":44924,"Ġmods":44925,"\"!":44926,"akedown":44927,"Ġcircuitry":44928,"ĠTRUE":44929,"ĠVeil":44930,"Ġsighed":44931,"Charg":44932,"eals":44933,"Ġworkaround":44934,"Ġank":44935,"ĠScrolls":44936,"Ġdiffusion":44937,"Ġamps":44938,"ĠTempest":44939,"adata":44940,"Ġphenomen":44941,"Ġ???":44942,"Ġpopup":44943,"Ġinhibition":44944,"Ġaliases":44945,"erity":44946,"agraph":44947,"Jew":44948,"Ġbec":44949,"Classic":44950,"comment":44951,"usable":44952,"rodu":44953,"ĠEnlightenment":44954,"Ġinvis":44955,"Ġbiochemical":44956,"latest":44957,"ĠGMOs":44958,"ĠSocialism":44959,"Ġpollut":44960,"Ġeluc":44961,"Js":44962,"orthern":44963,"PDATED":44964,"alyses":44965,"Experts":44966,"Blog":44967,"ĠDemocr":44968,"etooth":44969,"pause":44970,"âĢ¢âĢ¢":44971,"ĠShinji":44972,"Ġdystop":44973,"Sources":44974,"ĠBrach":44975,"np":44976,"ĠXY":44977,"Ġneurot":44978,"assembly":44979,"Ġbourgeois":44980,"ĠReson":44981,"ĠIDE":44982,"Ġrecoil":44983,"raq":44984,"ĠAvenger":44985,"Paper":44986,"UTF":44987,"ĠWrest":44988,"ĠSimulation":44989,"elaide":44990,"ĠDMCA":44991,"utm":44992,"1963":44993,"Ġarcs":44994,"Ġmaximal":44995,"Ġcyl":44996,"Ġphilosoph":44997,"enium":44998,"Ġrelativity":44999,"ĠMacintosh":45000,"Ġpneum":45001,"LOC":45002,"Ġgoddamn":45003,"SHA":45004,"Ġlocalization":45005,"ĠPHI":45006,"Ġhierarch":45007,"Ġatheists":45008,"±":45009,"Luck":45010,"ĠJugg":45011,"options":45012,"alore":45013,"Edward":45014,"Monitor":45015,"Ġneoc":45016,"numbered":45017,"Arc":45018,"ĠCodes":45019,"ĠHallow":45020,"olitan":45021,"sections":45022,"ĠEzek":45023,"Ġamy":45024,"task":45025,"ĠCLS":45026,"ĠValkyrie":45027,"Ġcircumference":45028,"amac":45029,"ĠNotting":45030,"Ġproverb":45031,"Spec":45032,"Ġelemental":45033,"ĠBitcoins":45034,"Except":45035,"Release":45036,"ADVERTISEMENT":45037,"Complete":45038,"phrine":45039,"Ġspores":45040,"random":45041,"neum":45042,"trigger":45043,"ocide":45044,"Ġlongitudinal":45045,"isec":45046,"peat":45047,"Ġprecept":45048,"Wing":45049,"ĠâĹ":45050,"otropic":45051,"mouse":45052,"ĠWitcher":45053,"ĠAppearance":45054,"ROR":45055,"Ġ||":45056,"aird":45057,"Blu":45058,"Ġincomp":45059,"ĠFirefly":45060,"update":45061,"Loc":45062,"Ġnihil":45063,"hesive":45064,"Quality":45065,"youtu":45066,"Seriously":45067,"Ġannot":45068,"ĠCoins":45069,"Visit":45070,"lc":45071,"----------":45072,"Ġdiction":45073,"Ġafore":45074,"Ġimmortality":45075,"ĠForbidden":45076,"Allah":45077,"ĠPartial":45078,"ĠGears":45079,"Ġtrance":45080,"Hat":45081,"irez":45082,"ĠSATA":45083,"Ġelectrode":45084,"ĠLinear":45085,"rikes":45086,"Ġderiv":45087,"ĠXue":45088,"Fine":45089,"ĠIgnore":45090,"desc":45091,"DOM":45092,"Simple":45093,"orescence":45094,"Previously":45095,"Ġcircumcision":45096,"Sphere":45097,"Ġrenown":45098,"SET":45099,"ilight":45100,"ĠByzantine":45101,"EXP":45102,"Ġwhine":45103,"Missing":45104,"Lt":45105,"Guide":45106,"Ġhippocampus":45107,"Ġwip":45108,"yrights":45109,"Ġsubmer":45110,"Maker":45111,"Switch":45112,"Ġspectral":45113,"nect":45114,"Ãį":45115,"Ġreven":45116,"WER":45117,"Adding":45118,"ĠCONTROL":45119,"asper":45120,"0000000":45121,"ynt":45122,"annabin":45123,"ĠAliens":45124,"ĠPCR":45125,"asketball":45126,"ricia":45127,"ĠUnch":45128,"Tap":45129,"Ġpracticable":45130,"ĠUsage":45131,"Ġsoluble":45132,"Scroll":45133,"Random":45134,"Ġmoan":45135,"ĠPuppet":45136,"Dim":45137,"Attack":45138,"Ġspears":45139,"Ġrectangle":45140,"Ġamuse":45141,"ĠDoct":45142,"reon":45143,"ĠReset":45144,"vag":45145,"unin":45146,"ĠBris":45147,"ĠSwarm":45148,"Model":45149,"Standing":45150,"Ġdenotes":45151,"{":45152,"ĠLizard":45153,"nesty":45154,"Ġwor":45155,"Ġamplification":45156,"ĠInferno":45157,"Cover":45158,"SAM":45159,"respective":45160,"Shift":45161,"Ġlibertarians":45162,"Runner":45163,"ĠRevelations":45164,"Spr":45165,"ĠCrusader":45166,"Ġcaffe":45167,"Patch":45168,"stros":45169,"ĠImmortal":45170,"Ġinsofar":45171,"itance":45172,"ĠValhalla":45173,"Ġradial":45174,"Beast":45175,"sync":45176,"Ġ--------":45177,"ĠPathfinder":45178,"iless":45179,"operator":45180,"Choose":45181,"Ġdecode":45182,"Ġvou":45183,"ĠMutant":45184,"ĠCVE":45185,"Female":45186,"Ġoxidation":45187,"inational":45188,"dB":45189,"Scope":45190,"Wan":45191,"ĠBought":45192,"ĠDietary":45193,"rotein":45194,"Present":45195,"aukee":45196,"Ġtotem":45197,"Ġsatur":45198,"wagon":45199,"Builder":45200,"ĠBulg":45201,"Ġsects":45202,"Flo":45203,"ombat":45204,"ĠHermione":45205,"aughs":45206,"Ġhydra":45207,"paren":45208,"ë":45209,"Whereas":45210,"tsky":45211,"Ġchall":45212,"WORK":45213,"opian":45214,"rican":45215,"vati":45216,"ĠHTTPS":45217,"Ġwrink":45218,"Ġthrob":45219,"habi":45220,"Ġiodine":45221,"omorph":45222,"ĠScion":45223,"Hunt":45224,"Written":45225,"iosity":45226,"ĠBrowser":45227,"Ġsinners":45228,"culosis":45229,"Ġunconsciously":45230,"0100":45231,"Ġanarchists":45232,"Pull":45233,"FFER":45234,"Ġpandemonium":45235,"matically":45236,"Rush":45237,"Ġpurified":45238,"ĠCyan":45239,"ĠDifficulty":45240,"«":45241,"Aside":45242,"oggles":45243,"untu":45244,"iege":45245,"iberal":45246,"ĠCOUR":45247,"eteenth":45248,"weeney":45249,"biased":45250,"ĠDecay":45251,"quart":45252,"alysis":45253,"Ġstere":45254,"ellect":45255,"Ġkernels":45256,"juven":45257,"ĠJPEG":45258,"indal":45259,"topic":45260,"Ġidentifier":45261,"åı":45262,"Ġepid":45263,"1969":45264,"Ġpoisons":45265,"sym":45266,"mop":45267,"LOCK":45268,"axe":45269,"cohol":45270,"ctory":45271,"Ġadject":45272,"Skin":45273,"ĠFract":45274,"ĠSHAR":45275,"echo":45276,"thood":45277,"Ġencoding":45278,"Ġrelational":45279,"Len":45280,"Bone":45281,"agara":45282,"uggish":45283,"ĠTanks":45284,"Stats":45285,"lihood":45286,"Mult":45287,"Graph":45288,"ĠCannot":45289,"ĠSpac":45290,"handler":45291,"ĠShit":45292,"Ġmorp":45293,"controller":45294,"udeau":45295,"Screenshot":45296,"Development":45297,"Gear":45298,"Ġtong":45299,"ĠColossus":45300,"rylic":45301,"STRUCT":45302,"capitalist":45303,"Ġsupplementation":45304,"Parts":45305,"pb":45306,"oppy":45307,"pite":45308,"processor":45309,"Ġexplanatory":45310,"Environmental":45311,"Compl":45312,"Gaming":45313,"arently":45314,"Ġconcess":45315,"Ġathlet":45316,"forestation":45317,"orsi":45318,"igmat":45319,"Ġencoded":45320,"misc":45321,"Ġproofs":45322,"ĠRevision":45323,"Ġmathematic":45324,"Ġconstitu":45325,"fficiency":45326,"Ġlightsaber":45327,"gz":45328,"erate":45329,"ournals":45330,"Comment":45331,"Ġpercept":45332,".\"[":45333,"ĠTechniques":45334,"coins":45335,"Shape":45336,"venant":45337,"ĠPrinted":45338,"Native":45339,"ĠGors":45340,"pecting":45341,"ĠDuel":45342,"Ġadmins":45343,"Flor":45344,"ĠDeus":45345,"cham":45346,"ĠRails":45347,"ceptor":45348,"naire":45349,"ĠSquid":45350,"ĠWarranty":45351,"SPEC":45352,"ensis":45353,"FUN":45354,"stellar":45355,"Select":45356,"llular":45357,"arget":45358,"ĠUncharted":45359,"Details":45360,"rison":45361,"Ġsyntax":45362,"chanted":45363,"Ġ-----":45364,"Ġthats":45365,"Registration":45366,"ĠSaber":45367,"ethical":45368,"Ġcryptography":45369,"atown":45370,"Ġdependencies":45371,"nw":45372,"Ġvehement":45373,"Ġrationality":45374,"ĠThou":45375,"Ġ----":45376,"rador":45377,"Ġenh":45378,"ĠCrate":45379,"STATE":45380,"/(":45381,"Ġdelim":45382,"CEPT":45383,"monkey":45384,"pai":45385,"uracy":45386,"Ġmortals":45387,"Sanders":45388,"ĠSeraph":45389,"-\"":45390,"1945":45391,"endix":45392,":'":45393,"ĠLegs":45394,"Exper":45395,"ĠKrypt":45396,"clinton":45397,"Ġuphe":45398,"Vers":45399,"Similarly":45400,"ressor":45401,"leans":45402,"LOG":45403,"cific":45404,"Ġ].":45405,"-)":45406,"resist":45407,"Pred":45408,"Latest":45409,"ilyn":45410,"Ġblob":45411,"Ġdevils":45412,"ĠIllusion":45413,"erella":45414,"Ġyak":45415,"method":45416,"Ġ698":45417,"Shadow":45418,"velt":45419,"Ġsomet":45420,"xc":45421,"Ġtriangles":45422,"netic":45423,"Calling":45424,"ĠDRM":45425,"Ġtriglycer":45426,"Ġinhibited":45427,"Ġnep":45428,"Ġalgebra":45429,"ascar":45430,"laim":45431,"Ġappl":45432,"1971":45433,"Bernie":45434,"Eh":45435,"Ġundefined":45436,"âĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶ":45437,"Sys":45438,"ournaments":45439,"Solid":45440,"Ġhep":45441,"ĠMales":45442,"Agent":45443,"Ġpsychedel":45444,"Wik":45445,"Ġdoctrines":45446,"rection":45447,"Compare":45448,"âĺ":45449,"Ġcertific":45450,"Ġsubstr":45451,"ĠCitation":45452,"ĠAFB":45453,"ĠBecame":45454,"Ġaristocracy":45455,"aryl":45456,"Ġanatomical":45457,"ocumented":45458,"ĠAssy":45459,"ĠFORM":45460,"Traditional":45461,"azines":45462,"Content":45463,"furt":45464,"Ġscripting":45465,"Ġcloaked":45466,"Ġunint":45467,"ĠCivilization":45468,"Desktop":45469,"ĠRagnar":45470,"Ġcurses":45471,"Ġobservable":45472,"ĠSpock":45473,"ĠPyr":45474,"Ġelectrom":45475,"ĠLump":45476,"oresc":45477,"ĠAttribution":45478,"egal":45479,"achusetts":45480,"Ġmarqu":45481,"âϦ":45482,"Ġcursor":45483,"ascist":45484,"1966":45485,"edit":45486,"lisher":45487,"ocyte":45488,"Writer":45489,"BILITIES":45490,"ĠUpload":45491,"Ġtreacher":45492,"Ġrecomb":45493,"Ġknights":45494,"Ġimmutable":45495,"ĠPly":45496,"Ġatten":45497,"ĠPassed":45498,"Flying":45499,"icipated":45500,"querade":45501,"ĠZot":45502,"CRE":45503,"ĠCursed":45504,"ickr":45505,"ĠDroid":45506,"thereum":45507,"Ġadjective":45508,"DIT":45509,"Ġtob":45510,"Ġinit":45511,"ĠPenet":45512,"Ġignor":45513,"Ġexalted":45514,"ĠDwell":45515,"assemb":45516,"Ġsentient":45517,"Ġ``":45518,"ĠGoo":45519,"Professional":45520,"othing":45521,"rupted":45522,"olics":45523,"ĠSetup":45524,"Thu":45525,"Campaign":45526,"Secondly":45527,"clipse":45528,"hibit":45529,"amate":45530,"SUP":45531,"ĠSuppose":45532,"submit":45533,"ĠDebian":45534,"Ġantid":45535,"Ġentert":45536,"ysical":45537,"ĠGladiator":45538,"ĠSTL":45539,"ĠBugs":45540,"ĠMech":45541,"ĠCoffin":45542,"itored":45543,"ICLE":45544,"Mist":45545,"Ġinfall":45546,"votes":45547,"actly":45548,"Occ":45549,"ĠConquest":45550,"alach":45551,"Ġintertw":45552,"reverse":45553,"amiya":45554,"icularly":45555,"edom":45556,"ĠLuxem":45557,"Fra":45558,"urrencies":45559,"Ġnobility":45560,"Tab":45561,"Beer":45562,"Ġ10000":45563,"Ġincor":45564,"Ġmelanch":45565,"Depth":45566,"Firstly":45567,"usr":45568,"ĠWiki":45569,"hhhh":45570,"ĠProxy":45571,"Ġantagonists":45572,"Ġtransistor":45573,"ĠRelic":45574,"ĠPrometheus":45575,"Ġ1280":45576,"Coun":45577,"ĠMedals":45578,"stats":45579,"Assembly":45580,"inished":45581,"cemic":45582,"Ġadventurers":45583,"Ġcd":45584,"Supporters":45585,"ĠYs":45586,"])":45587,"Ġneglig":45588,"Request":45589,"Ġwhore":45590,"Ġovercl":45591,"_-":45592,"partial":45593,"amd":45594,"Ġfructose":45595,"Ġdivid":45596,"Administ":45597,"amples":45598,"Boo":45599,"akery":45600,"owered":45601,"hester":45602,"Links":45603,"GROUND":45604,"ethy":45605,"Ġincarcer":45606,"Ġincap":45607,"Drag":45608,"ĠElastic":45609,"âĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶ":45610,"Ultra":45611,"AAAA":45612,"Order":45613,"ĠMysteries":45614,"Ġcanonical":45615,"Ign":45616,"Ġanimate":45617,"wegian":45618,"ggle":45619,"Hash":45620,"Arg":45621,"verty":45622,"Ġanalges":45623,"ouver":45624,"ittees":45625,"ĠAsgard":45626,"______":45627,"Mix":45628,"1964":45629,"Rate":45630,"Ġarousal":45631,"pheus":45632,"undai":45633,"hetamine":45634,"ĠMysterious":45635,"Alright":45636,"ĠHerod":45637,"riott":45638,"ĠAnarchy":45639,"ĠArche":45640,"Question":45641,"Chapter":45642,"Token":45643,"ĠSphere":45644,"Ġinduces":45645,"Audio":45646,"Normal":45647,"Ġprophe":45648,"ĠValiant":45649,"Tag":45650,"Relations":45651,"Ġblinked":45652,"onyms":45653,"ĠVortex":45654,"Ġdb":45655,"emonic":45656,"Phase":45657,"Ġkingdoms":45658,"Twe":45659,"ĠLORD":45660,"plementation":45661,"ĠConstantinople":45662,"helm":45663,"ĠFlesh":45664,"Ġthumbnail":45665,"ledged":45666,"ĠPROG":45667,"Ġdisbel":45668,"ĠLikes":45669,"ĠGamer":45670,"renches":45671,"hattan":45672,"Index":45673,"pecially":45674,"ĠJiu":45675,"Ġwhats":45676,"erion":45677,"xf":45678,"ĠPerception":45679,"Alien":45680,"Capt":45681,"ãĢĤ":45682,"joining":45683,"nesium":45684,"ĠSocrates":45685,"Icon":45686,"animate":45687,"ocalypse":45688,"ĠTactics":45689,"assador":45690,"Veh":45691,"src":45692,",-":45693,"Ġvisc":45694,"ĠDiscord":45695,"initial":45696,"atana":45697,"Size":45698,"Claim":45699,"ffect":45700,"iciary":45701,"Ġturret":45702,"reset":45703,"Ï":45704,"wrap":45705,"ulnerability":45706,"ĠInsert":45707,"Ġirrad":45708,"ognitive":45709,"clips":45710,"uncle":45711,"chemy":45712,"ottesville":45713,"Write":45714,"earances":45715,"1965":45716,"MIC":45717,"Ġmanag":45718,"Ġtelesc":45719,"Termin":45720,"Guest":45721,"Ġdenote":45722,"Failure":45723,"ograp":45724,"âĢķ":45725,"Ġscrolls":45726,"ĠArmored":45727,"Ġrecomp":45728,"Ġplaceholder":45729,"ĠISBN":45730,"ĠBelief":45731,"emporary":45732,"Asset":45733,"arcer":45734,"haar":45735,"assium":45736,"%:":45737,"ernal":45738,"ĠLv":45739,"atible":45740,"Pand":45741,"oubted":45742,"Lie":45743,"bial":45744,"STEP":45745,"Ġpresets":45746,"Ġstatist":45747,"Sund":45748,"reshold":45749,"endium":45750,"\");":45751,"Software":45752,"Ġbasal":45753,"ĠYose":45754,"Ġmortg":45755,"ocry":45756,"Ġsubreddit":45757,"omorphic":45758,"ĠLoaded":45759,"berra":45760,"vg":45761,"orkshire":45762,"ĠChrys":45763,"Repeat":45764,"ĠSimulator":45765,"rx":45766,"gex":45767,"Linux":45768,"ĠInstruct":45769,"irable":45770,"Ġmosquit":45771,"ĠManga":45772,"iOS":45773,"Ġsynt":45774,"Ġclitor":45775,"Ġlobe":45776,"ĠDelete":45777,"CVE":45778,"fortunately":45779,"Enc":45780,"vertising":45781,"Ġanten":45782,"Ġfif":45783,"Study":45784,"prev":45785,"ossus":45786,"Nar":45787,"Decl":45788,"erala":45789,"ĠPrototype":45790,"UGE":45791,"1001":45792,"Ġ---------":45793,"deals":45794,"odcast":45795,"TPS":45796,"Ġcodec":45797,"ittee":45798,"isexual":45799,"ĠBreaker":45800,"menu":45801,"ĠURI":45802,"('":45803,"ĠFiorina":45804,"ĠApostles":45805,"ĠWitches":45806,"raint":45807,"addafi":45808,"ersive":45809,"yrim":45810,"Ġmosa":45811,"Ġrog":45812,"Ear":45813,"âĺħ":45814,"Ġcaloric":45815,"matical":45816,"yrics":45817,"ĠKrugman":45818,"axter":45819,"1016":45820,"Ġsep":45821,"ĠExtend":45822,"ropolitan":45823,"thren":45824,"ologne":45825,"atomic":45826,"Naturally":45827,"Pros":45828,"gencies":45829,"akens":45830,"Male":45831,"Ġcausation":45832,"omnia":45833,"Comments":45834,"eeee":45835,"iquette":45836,"Ġcytok":45837,"ename":45838,"details":45839,"Ġdestruct":45840,"leep":45841,"ĠCavern":45842,"ĠInvention":45843,"ueless":45844,"Ġsubsection":45845,"outhern":45846,"metic":45847,"blogs":45848,"ĠPacks":45849,"ĠArduino":45850,"hhh":45851,"elligence":45852,"imity":45853,"ĠUltron":45854,"astrous":45855,"Ġbiome":45856,"ĠHover":45857,"Ġprivile":45858,"igham":45859,"apest":45860,"ĠYoshi":45861,"Artist":45862,".\",":45863,"gamer":45864,"Virgin":45865,"Tea":45866,"ĠDoomsday":45867,"ĠðŁĻĤ":45868,"terday":45869,"ĠCommando":45870,"ĠAchieve":45871,"chrom":45872,"Ġcryptographic":45873,"Ġrebell":45874,"Specifically":45875,"â̦â̦â̦â̦":45876,"ĠEternity":45877,"Ġemulation":45878,"ĠSERV":45879,"ĠMiscellaneous":45880,"ĠParticipant":45881,"duc":45882,"vp":45883,"ĠSparkle":45884,"ategories":45885,"Ġdecrypt":45886,"ĠGNOME":45887,"activation":45888,"Ġanarch":45889,"owler":45890,"adiator":45891,"itars":45892,"ĠTHEN":45893,")\",":45894,"åħ":45895,"Ġembod":45896,"vae":45897,"âĺĨ":45898,"Member":45899,"Ġrm":45900,"nyder":45901,"ĠLeviathan":45902,"Gaza":45903,"erenn":45904,"Chicken":45905,"ĠDefinitive":45906,"ĠBolshe":45907,"ĠJagu":45908,"gorith":45909,"loader":45910,"exe":45911,".........":45912,"ĠReceived":45913,"ĠProto":45914,"ĠLocked":45915,"Posts":45916,"ankind":45917,"Clock":45918,"ĠCLI":45919,"Throw":45920,"dL":45921,"epad":45922,"ĠAtmosp":45923,"Ġmk":45924,"ĠSteal":45925,"uple":45926,"reference":45927,"ĠGNU":45928,"adelphia":45929,"scripts":45930,"ilaterally":45931,"ĠMods":45932,"odus":45933,"ignty":45934,"REF":45935,"Ġhypothesized":45936,"issors":45937,"Ġanus":45938,"HUD":45939,"rices":45940,"Draw":45941,"Computer":45942,"Below":45943,"uthor":45944,"ĠTact":45945,"=$":45946,"00000000":45947,"Ġcaut":45948,"Sharp":45949,"depend":45950,"Ġtatt":45951,"Goal":45952,"Sounds":45953,"zona":45954,"anyon":45955,"ricanes":45956,"ĠUSAF":45957,"Jump":45958,"Bottom":45959,"etermination":45960,"ĠPles":45961,"Ġhypothes":45962,"Reference":45963,"Ġswall":45964,"Ġmaneu":45965,"rifice":45966,"ĠVeh":45967,"Ġtex":45968,"geoning":45969,"ĠâľĶ":45970,"Mach":45971,"eanor":45972,"%);":45973,"archives":45974,"Ġencyclopedia":45975,"ĠPreferences":45976,"damage":45977,"Done":45978,"Ġcoefficient":45979,"ĠCreatures":45980,"Ġital":45981,"ivari":45982,"Revolution":45983,"Ġnob":45984,"Diff":45985,"Ġabbre":45986,"Writ":45987,"ĠDOS":45988,"redd":45989,"Ġsplend":45990,"orest":45991,"flame":45992,"Ġdevs":45993,"Ġ==":45994,"ĠPuzzle":45995,"Ġgit":45996,"MOD":45997,"ĠArgument":45998,"ĠAbyss":45999,"Studies":46000,"ophob":46001,"uild":46002,"scill":46003,"fp":46004,"Ġplur":46005,"Delete":46006,"ĠFALSE":46007,"FIL":46008,"Ġmicrobiota":46009,"ĠIPv":46010,"Stud":46011,"ortal":46012,"ĠDivinity":46013,"ounter":46014,"ä¸":46015,"Naz":46016,"stals":46017,"ihilation":46018,"Ġpersecut":46019,"ĠPlanes":46020,"viation":46021,"Driver":46022,"ĠEEG":46023,"Unity":46024,"Premium":46025,"ĠSiren":46026,"ĠPaleo":46027,"earchers":46028,"Pract":46029,"Ö":46030,"VII":46031,"mosp":46032,"Ġidentifiers":46033,"Near":46034,"achu":46035,"Apps":46036,"tackle":46037,"COLOR":46038,"Ġperpendicular":46039,"viks":46040,"ecided":46041,"ĠDota":46042,"icons":46043,"Ġpsi":46044,"Brave":46045,"Ġunimagin":46046,"ĠATI":46047,"OOL":46048,"Gender":46049,"ĠSwords":46050,"oples":46051,"Rank":46052,"olphins":46053,"Ġdeities":46054,"ĠXIII":46055,"м":46056,"ĠKraken":46057,"ĠLEVEL":46058,"stasy":46059,"ĠBabel":46060,"Hours":46061,"Avoid":46062,"Mech":46063,"Multi":46064,"Ġect":46065,"Occup":46066,"panic":46067,"Ġmutants":46068,"Evidence":46069,"Tips":46070,"Ġvolts":46071,"Exit":46072,"xb":46073,"planet":46074,"avez":46075,"features":46076,")]":46077,"lol":46078,"ĠNeph":46079,"ĠSanct":46080,"Ġimpover":46081,"................................":46082,"Sty":46083,"Email":46084,"Torrent":46085,"Ġgluc":46086,"ĠSins":46087,"ĠIncarn":46088,"ĠWITHOUT":46089,"ĠPanzer":46090,"ĠAssignment":46091,"versible":46092,"Strange":46093,"ITNESS":46094,"incible":46095,"ZX":46096,"ĠMySQL":46097,"Ġconson":46098,"Ġoxidative":46099,"Machine":46100,"Impro":46101,"Parent":46102,"ĠMetroid":46103,"Educ":46104,"Ġdismant":46105,"dx":46106,"ĠPersona":46107,"ĠHDL":46108,"Americ":46109,"Users":46110,"Ġeighteenth":46111,"WARNING":46112,"ĠLists":46113,"ĠCanter":46114,"ĠTrotsky":46115,"Ġhaha":46116,"]'":46117,"ĠEncyclopedia":46118,"admin":46119,"ĠACTIONS":46120,"idav":46121,"ο":46122,"ĠFTP":46123,"Ġquar":46124,"ongyang":46125,"â̦â̦â̦â̦â̦â̦â̦â̦":46126,"Ġsynchronization":46127,"DEM":46128,"riched":46129,"Ġnegro":46130,"Bench":46131,"Ġfilament":46132,"Ġdecoding":46133,"obj":46134,"Ġjoystick":46135,"Decre":46136,"ĠBolshevik":46137,"Virtual":46138,"ĠSacrament":46139,"xd":46140,"BILL":46141,"-+-+":46142,"¶":46143,"anchester":46144,"Pokemon":46145,"Ġslic":46146,"iameter":46147,"errilla":46148,"Exactly":46149,"\"'":46150,"getic":46151,"3333":46152,"solete":46153,"Ġincorpor":46154,"Ġio":46155,"------------":46156,"Ġantiquity":46157,"ATURES":46158,"Policy":46159,"oppable":46160,"Ġ=>":46161,"ODUCT":46162,"otide":46163,"Ú":46164,"Ġnormative":46165,"Fac":46166,"Ġshaman":46167,"element":46168,"Plex":46169,"INTER":46170,"etsk":46171,"ĠGauntlet":46172,"ĠBIOS":46173,"×ķ":46174,"riet":46175,"Rew":46176,"uristic":46177,"urches":46178,"ĠChomsky":46179,"ixir":46180,"package":46181,"Owner":46182,"Ġschematic":46183,"Assistant":46184,"Ġemanc":46185,"Ġarchetype":46186,"Initial":46187,"intent":46188,"Ġfilib":46189,"ispers":46190,"Flag":46191,"Tank":46192,"Ġinsurg":46193,"Ġapproximation":46194,"Ġsemantic":46195,"Ġsubtitle":46196,"Font":46197,"Ġintimid":46198,"Ġhath":46199,"tools":46200,"gob":46201,"Process":46202,"slave":46203,"ĠJUSTICE":46204,"âĻ¥":46205,"ĠHardcore":46206,"Discover":46207,"Ġexch":46208,"ptive":46209,"units":46210,"ĠDjango":46211,"itudinal":46212,"Ġpc":46213,"akespeare":46214,"ospace":46215,"Ġhorny":46216,"auth":46217,"ĠSkyrim":46218,"ENGTH":46219,"perors":46220,"ĠVulkan":46221,"Ġchimpan":46222,"Ġremem":46223,"Ġopacity":46224,"Ġ:(":46225,"ushima":46226,"Ġawoken":46227,"Ġsacrament":46228,"Beginning":46229,"escape":46230,"Anim":46231,"Ġadvant":46232,"ĠRequires":46233,"output":46234,"Ġdroid":46235,"Yep":46236,"rieving":46237,"Ġpt":46238,"ĠShotgun":46239,"ĠOsiris":46240,"disabled":46241,"ĠRadius":46242,"Medium":46243,"ĠScient":46244,"ĠRept":46245,"ymm":46246,"Ġcp":46247,"ĠLabyrinth":46248,"poral":46249,"Ġ'(":46250,"Hack":46251,"ĠTechnique":46252,"/,":46253,"Ġambig":46254,"Basic":46255,"Ġretrie":46256,"VICE":46257,"BIP":46258,"ragon":46259,"phies":46260,"uminum":46261,"ĠFei":46262,"lesi":46263,"Ġsemantics":46264,"ĠHz":46265,"ĠUnderworld":46266,"Ġendot":46267,"olesterol":46268,"ourning":46269,"Ġcaches":46270,"ĠYug":46271,"Legendary":46272,"ĠDocumentation":46273,"ĠSpiral":46274,"ĠClone":46275,"bnb":46276,"ĠâĶ":46277,"ustom":46278,"Mp":46279,"gettable":46280,"agonist":46281,"Ġneuronal":46282,"culus":46283,"enum":46284,"cules":46285,"Ġmuttered":46286,"ctica":46287,"necess":46288,"ĠSubtle":46289,"Ġsolder":46290,"Environment":46291,"oneliness":46292,"orage":46293,"â̦.\"":46294,"nesota":46295,"agements":46296,"Ùİ":46297,"WHERE":46298,"ĠGDDR":46299,"Scient":46300,"ĠMulcair":46301,"ĠRena":46302,"________________________________________________________________":46303,"antics":46304,"Ġtorped":46305,"Brow":46306,"ossal":46307,"Category":46308,"Regular":46309,"remote":46310,"ãģ":46311,"ĠCoil":46312,"ritch":46313,"specified":46314,"Average":46315,"Ġfingert":46316,"entity":46317,"atibility":46318,"ampunk":46319,"ĠScriptures":46320,"Ġunequ":46321,"arettes":46322,"arching":46323,"Ġastron":46324,"Ġnumeric":46325,"ĠeBook":46326,"remove":46327,"onday":46328,"Ġmetaphysical":46329,"ĠGoku":46330,"Element":46331,"ĠRuin":46332,"Norm":46333,"Ġtox":46334,"puff":46335,"Ġharmonic":46336,"ĠAgility":46337,"ĠHearthstone":46338,"Ġmana":46339,"Points":46340,"Ġconduc":46341,"ĠPersia":46342,"-----":46343,"license":46344,"Application":46345,"assert":46346,"Reader":46347,"ĠSacrifice":46348,"float":46349,"inctions":46350,"byter":46351,"Ġfundament":46352,"\"â̦":46353,"Fourth":46354,"Effective":46355,"ĠMeow":46356,"ĠErrors":46357,"ĠIcar":46358,"ĠMMO":46359,"Ġapostles":46360,"Ġfaintly":46361,"component":46362,"bably":46363,"uggage":46364,"ĠMPG":46365,"krit":46366,"container":46367,"ixture":46368,"ĠPOV":46369,"izabeth":46370,"onut":46371,"isdom":46372,"trace":46373,"ĠSDL":46374,"Interestingly":46375,"ĠExplan":46376,"lesiastical":46377,"ternal":46378,"Bug":46379,"Ġmetabolites":46380,"geries":46381,"Ġsupra":46382,"ĠMakoto":46383,"orget":46384,"racuse":46385,"][":46386,"ĠPrelude":46387,"peria":46388,"tube":46389,"ĠCatalog":46390,"ĠGoblin":46391,"QUEST":46392,"ĠINCLUD":46393,"ĠVERS":46394,"erguson":46395,"Ġcommandments":46396,"ĠUDP":46397,"itle":46398,"ι":46399,"domain":46400,"roximately":46401,"ĠTLS":46402,"ongevity":46403,"Ġmodulation":46404,"Ġdidnt":46405,"ĠCalories":46406,"Applications":46407,"ormon":46408,"Ġsd":46409,"dullah":46410,"Ġcous":46411,"ĠDARK":46412,"clip":46413,"ĠPsychiat":46414,"ĠTanz":46415,"ĠCharisma":46416,"ĠMerge":46417,"ĠKDE":46418,"requires":46419,"urdue":46420,"Ġdecimal":46421,"Ġâī¥":46422,"ĠAuth":46423,"ebted":46424,"ĠTempl":46425,"ĠâĢº":46426,"Ultimate":46427,"Ġmammalian":46428,"advertising":46429,"Ġdominion":46430,"Ġacron":46431,"ĠWem":46432,"ĠHeist":46433,"oiler":46434,"FLAG":46435,"ovember":46436,"Syn":46437,"Ġgodd":46438,"ĠPyth":46439,"Ġglyc":46440,"ĠHelpful":46441,"Ġgad":46442,"chedel":46443,"Similar":46444,"Ġ¶":46445,"Ġnp":46446,"ĠREPL":46447,"Fill":46448,"ĠSunder":46449,"etsy":46450,"ĠPAX":46451,"ĠFemales":46452,"ĠKingdoms":46453,"Ġwhistlebl":46454,"Hide":46455,"serial":46456,"ĠEnemies":46457,"ĠPeb":46458,"Ġpiety":46459,"ifact":46460,"esity":46461,"bsite":46462,"esides":46463,"Ġported":46464,"Ġamygdala":46465,"ĠGerr":46466,"afety":46467,"Ġadip":46468,"(\"":46469,"Ġcf":46470,"Ġurl":46471,"unia":46472,"icro":46473,"Austral":46474,"ĠConfig":46475,"accompanied":46476,"isite":46477,"Ġtextual":46478,"\">":46479,"Ġanecd":46480,"Ġ\",":46481,"angular":46482,"ĠUnicode":46483,"Proof":46484,"Ġmultiplication":46485,"Address":46486,"Ġbytes":46487,"lems":46488,"uterte":46489,"Episode":46490,"oshop":46491,"ritical":46492,"Adjust":46493,"argument":46494,"\\'":46495,"Rober":46496,"pection":46497,"Agg":46498,"äº":46499,"interrupted":46500,"ĠDebor":46501,"Ġlair":46502,"Various":46503,"isively":46504,"ĠStatic":46505,"ohyd":46506,"ĠEchoes":46507,"UID":46508,"raught":46509,"Bott":46510,"Ġapostle":46511,"ĠCentauri":46512,"oxicity":46513,"ibling":46514,"Ġparalle":46515,"inav":46516,"Crit":46517,"ĠTyph":46518,"Ġhig":46519,"ĠEDITION":46520,"Ġcoord":46521,"uish":46522,"sectional":46523,"inki":46524,"Title":46525,"anyahu":46526,"osterone":46527,"Ġdesper":46528,"ribly":46529,"Legend":46530,"afort":46531,"Org":46532,"Ġempir":46533,"ĠQuake":46534,"SSL":46535,"ioxide":46536,"åľ":46537,"Ġenz":46538,"urtle":46539,"BSD":46540,"Rust":46541,"ospels":46542,"Rare":46543,"Ġpartitions":46544,"Ġheresy":46545,"overy":46546,"Ġmonop":46547,"Pixel":46548,"odder":46549,"Option":46550,"withstanding":46551,"Transfer":46552,"Ġarrog":46553,"skip":46554,"ĠSSH":46555,"ĠSph":46556,"Ġcallback":46557,"PIN":46558,"Ġpdf":46559,"Ġplaint":46560,"cipled":46561,"reenshots":46562,"Ġparsing":46563,"::::::::":46564,"ioxid":46565,"Ġhereafter":46566,"ĠFunctions":46567,"ĠBulgar":46568,"Ġintu":46569,"DOC":46570,"Location":46571,"Hyper":46572,"ageddon":46573,"Evil":46574,"illions":46575,"Introduction":46576,"Physical":46577,"ĠLayout":46578,"âķ":46579,"------------------------":46580,"ĠRodham":46581,"ĠPatterns":46582,"Delivery":46583,"Ġdistur":46584,"ĠVolunte":46585,"ĠGUI":46586,"Ġclen":46587,"Ġinacc":46588,"ĠBallistic":46589,"ĠSprite":46590,"Privacy":46591,"theme":46592,"dump":46593,"ĠByte":46594,"ĠIncre":46595,"apult":46596,"ĠWrath":46597,"ensibly":46598,"NOTE":46599,"ounge":46600,"ustomed":46601,"ochond":46602,"ĠQt":46603,"Primary":46604,"Ġsidew":46605,"Root":46606,"gregation":46607,"SQL":46608,"ĠSOFTWARE":46609,"Gallery":46610,"ĠDungeon":46611,"ĠVengeance":46612,"->":46613,"steam":46614,"Ġfrivol":46615,"Ġpid":46616,"filter":46617,"Ġfacult":46618,"doms":46619,"Tool":46620,"1959":46621,"Ġprefix":46622,"Ġcomma":46623,"relative":46624,"Ġformatted":46625,"appropriately":46626,"Ġmd":46627,"xxx":46628,"ĠAuthentication":46629,"ĠWTC":46630,"Ġvulner":46631,"reditary":46632,"Steam":46633,"Tx":46634,"ĠGHC":46635,"Increased":46636,"forcement":46637,"ĠGuant":46638,"bernatorial":46639,"Entry":46640,"ĠWarp":46641,"ĠCreature":46642,"ĠAmmunition":46643,"Ġclust":46644,"ĠInher":46645,"Ġunbel":46646,"RGB":46647,"ĠMankind":46648,"ĠPlague":46649,"Ġ=================================":46650,"psc":46651,"Intern":46652,"tml":46653,"ĠCrusade":46654,"inflamm":46655,"Storage":46656,"token":46657,"inse":46658,"False":46659,"Adult":46660,"Pokémon":46661,"PLIED":46662,"Ġglac":46663,"ĠDwarf":46664,"sequence":46665,"Ġmagnification":46666,"ĠIlluminati":46667,"hedral":46668,"param":46669,"regon":46670,".\",\"":46671,"Eva":46672,"igree":46673,"Object":46674,"Ġoptimizations":46675,"uador":46676,"mmmm":46677,"ullivan":46678,"Ġ[\"":46679,"ĠDusk":46680,"Ġtrig":46681,"Ġiss":46682,"Ġhypert":46683,"Ġperspect":46684,"Ġassum":46685,":,":46686,"Ġinterpol":46687,"Asked":46688,"Boot":46689,"LIB":46690,"Loading":46691,"Ident":46692,"upuncture":46693,"ioch":46694,"Ġprefrontal":46695,"delay":46696,"ĠPoké":46697,"bestos":46698,"overe":46699,"Elf":46700,"eteria":46701,"ĠSneak":46702,"bians":46703,"ĠARTICLE":46704,"Xbox":46705,"encrypted":46706,"ync":46707,"ĠNietzsche":46708,"Nonetheless":46709,"Ġ±":46710,"ĠPrimal":46711,"ĠFlare":46712,"Ġconflic":46713,"ĠRune":46714,"Tes":46715,"cellence":46716,"Mega":46717,"ĠEntity":46718,"chrome":46719,"iatures":46720,"Ġuninstall":46721,"Winner":46722,"aimon":46723,"Ġhomebrew":46724,"Ruby":46725,"araoh":46726,"itime":46727,"Ġpotion":46728,"ĠAllows":46729,"ogyn":46730,"osuke":46731,"Limited":46732,"Ġmacros":46733,"ERROR":46734,"gling":46735,"Ġtodd":46736,"repre":46737,"ĠSakura":46738,"erker":46739,"items":46740,"FIG":46741,"ĠUnle":46742,"Ġhardness":46743,"Split":46744,"Ġarous":46745,"ocally":46746,"Ġì":46747,"ĠEVE":46748,"pleasant":46749,"ihil":46750,"ĠRouter":46751,"ĠLucius":46752,"readable":46753,"Ġtremb":46754,"Dro":46755,"Ġblaster":46756,"Ġbourgeoisie":46757,"NUM":46758,"Alternative":46759,"flags":46760,"GAME":46761,"ebook":46762,"ĠIPM":46763,"Ġcorrel":46764,"Setting":46765,"Frame":46766,"Ġatheism":46767,"Interested":46768,"Liquid":46769,"stanbul":46770,"Lv":46771,"Ġtits":46772,"Ġdc":46773,"×Ļ×":46774,"Ġdoctr":46775,"background":46776,"tsy":46777,"ĠCtrl":46778,"ĠCompatibility":46779,"idae":46780,"example":46781,"perture":46782,"Ġguid":46783,"ĠWinged":46784,"Command":46785,"ridor":46786,"bool":46787,"comments":46788,"ĠImmunity":46789,"Nit":46790,"Statement":46791,"Ġmanif":46792,"ĠIntake":46793,"Bloom":46794,"txt":46795,"context":46796,"input":46797,"achus":46798,"proc":46799,"Ñĭ":46800,"Ġdisemb":46801,"ospons":46802,"utical":46803,"ĠRender":46804,"Ironically":46805,"ursday":46806,"ĠExile":46807,"lishes":46808,"iets":46809,"orescent":46810,"cair":46811,"ĠSubjects":46812,"ĠDungeons":46813,"Ġiii":46814,"neapolis":46815,"ĠBlaster":46816,"Ġphp":46817,"ORED":46818,"ĠSLI":46819,"Ġelig":46820,"ĠIdentified":46821,"ĠBrawl":46822,"bytes":46823,"ĠCTR":46824,"Ġsched":46825,"Assuming":46826,"Bound":46827,"ĠMathemat":46828,"razil":46829,"ĠAstral":46830,"mble":46831,"untled":46832,"Ġmech":46833,"ĠDagger":46834,"ĠUseful":46835,"nesday":46836,"tarians":46837,"AMY":46838,"Camera":46839,"node":46840,"pict":46841,"ginx":46842,"Ġyea":46843,">>>>>>>>":46844,"paragraph":46845,"ĠSupplementary":46846,"9999":46847,"ĠAlchemist":46848,"uzzle":46849,"igun":46850,"ĠCalculator":46851,"ĠApplicant":46852,"hift":46853,"ĠGPL":46854,"Ġencode":46855,"Crash":46856,"ĠNutr":46857,"kHz":46858,"TABLE":46859,"intestinal":46860,"andom":46861,"archive":46862,"Ëľ":46863,"Registered":46864,"Questions":46865,"Remote":46866,"ethyst":46867,"Ġgren":46868,"ĠTexture":46869,"Ġseiz":46870,"Anyway":46871,"ĠVariant":46872,"ê":46873,"Adapt":46874,"ittered":46875,"meta":46876,"ambers":46877,"ĠRuins":46878,"ĠChimera":46879,"password":46880,"ĠReboot":46881,"Ġcaster":46882,"Ġamplitude":46883,"Position":46884,"Ġnotation":46885,"Ġsecretion":46886,"Excellent":46887,"delete":46888,"aminer":46889,"ä»":46890,"Exec":46891,"ĠKenobi":46892,"Interview":46893,"ontent":46894,"ospel":46895,"Ġtuber":46896,"CONT":46897,"roups":46898,"Ġemulator":46899,"Ġjava":46900,"0200":46901,"Ġnested":46902,"Ġfert":46903,")).":46904,"Dex":46905,"ĠSora":46906,"Ġpotions":46907,"ĠAnon":46908,"aah":46909,"Ġdunno":46910,"Ġμ":46911,"Ġmethodological":46912,"itles":46913,"phia":46914,"Beg":46915,"Rules":46916,"ĠXML":46917,"Ġflask":46918,"ĠShogun":46919,"Ġ2048":46920,"atchewan":46921,"Ġfuckin":46922,"Built":46923,"Ġbour":46924,"Ġdisag":46925,"yss":46926,"ĠÏ":46927,"Spoiler":46928,"Wiki":46929,"Ġmorphology":46930,"Ġendors":46931,"Ġdungeons":46932,"dragon":46933,")),":46934,"Ġhous":46935,"Ġoverwhel":46936,"SAY":46937,"abwe":46938,"--------------------------------":46939,"Ġepist":46940,"Ġpalp":46941,"ĠExtensions":46942,"ĠMistress":46943,"ĠUkrain":46944,"================":46945,"edience":46946,"abama":46947,"ĠLua":46948,"ĠOffline":46949,"ĠKonami":46950,"unicip":46951,"ĠMachina":46952,"Specific":46953,"Ġpresupp":46954,"ĠGEAR":46955,"rition":46956,"rences":46957,"successfully":46958,"Ġ1024":46959,"Platform":46960,"}}":46961,"clude":46962,"roxy":46963,"Ġpromot":46964,"ĠAdapter":46965,"rocal":46966,"ĠMasquerade":46967,"Panel":46968,"Language":46969,"elsius":46970,"Push":46971,"abase":46972,"ĠdB":46973,"argon":46974,"ĠRemoved":46975,"amph":46976,"ĠWyr":46977,"Ġindisp":46978,"ĠOkin":46979,"aepernick":46980,"moil":46981,"Continue":46982,"00007":46983,"ĠJournals":46984,"TAG":46985,"ĠRemastered":46986,"Ġsymp":46987,"methyl":46988,"Overview":46989,"umeric":46990,"ĠCodex":46991,".$":46992,"ranged":46993,"Sym":46994,"ĠVerse":46995,"ĠEnabled":46996,"ĠFUCK":46997,"ĠHearth":46998,"Ġbrill":46999,"ĠChaser":47000,"Beh":47001,"ĠAlchemy":47002,"Oracle":47003,"roleum":47004,"ĠVoldemort":47005,"();":47006,"Ġcollaps":47007,"Visual":47008,"ĠAngular":47009,"ĠOsc":47010,"ichita":47011,"Ġcig":47012,"Ġtoolbar":47013,"ĠEnlight":47014,"ÑĮ":47015,"ε":47016,"aliation":47017,"ĠLovecraft":47018,"jri":47019,"ĠInterstellar":47020,"Ġdebugging":47021,"Ġparentheses":47022,"ĠInit":47023,"Located":47024,"Weak":47025,"ĠPvP":47026,"ĠCloak":47027,"uture":47028,"iths":47029,"asionally":47030,"FACE":47031,"Introdu":47032,"');":47033,"slot":47034,"aturday":47035,"ĠNiet":47036,"Ġpuzz":47037,"!!!!!!!!":47038,"folios":47039,"Ç":47040,"Ġverbs":47041,"ĠFrames":47042,"ĠAmbro":47043,"Ġmillisec":47044,"ĠRebell":47045,"ylum":47046,"PASS":47047,"ĠConfiguration":47048,"μ":47049,"brids":47050,"vantage":47051,"Ġ['":47052,"ĠScy":47053,"Benef":47054,"gradation":47055,"ĠOrc":47056,"Resources":47057,"Awesome":47058,"ĠMilitia":47059,"POST":47060,"Ġbinaries":47061,"Mode":47062,"Ġkb":47063,"ĠWARRANT":47064,"hemy":47065,"Desc":47066,"alion":47067,"Ġwiki":47068,"Ġcommer":47069,"Serial":47070,"ĠUncommon":47071,"ignore":47072,"Ġconstructor":47073,"ctl":47074,"Ġ):":47075,"ĠVerify":47076,"Notice":47077,"ĠRPGs":47078,"uckland":47079,"Ġincre":47080,"Pinterest":47081,"ĠDefinitions":47082,"iband":47083,"Ġtd":47084,"Ġsubscrib":47085,"Shin":47086,"ĠGadget":47087,"Document":47088,"å®":47089,"Requ":47090,"QUIRE":47091,"ĠQuadro":47092,"ĠUnix":47093,"Enlarge":47094,"thens":47095,"\"...":47096,"gebra":47097,"pload":47098,"alogue":47099,"vironments":47100,"Strength":47101,"ĠPID":47102,"ĠInvaders":47103,"HOME":47104,"Atl":47105,"ĠBlizz":47106,"ĠWidth":47107,"ĠOpenGL":47108,"zx":47109,"$,":47110,"Ġå":47111,"cig":47112,"lectic":47113,"relation":47114,"Ġfeas":47115,"undown":47116,"Said":47117,"ν":47118,"��":47119,"english":47120,"ĠTokens":47121,"ĠALEC":47122,"OOOO":47123,"isconsin":47124,"Ġconstants":47125,"ĠTemplar":47126,"Accept":47127,"Ġmascul":47128,"enegger":47129,"ampires":47130,"Rated":47131,"lua":47132,"ucl":47133,"ĠSequence":47134,"ĠNRS":47135,"STD":47136,"Cra":47137,"autions":47138,"ĠKernel":47139,"oleon":47140,"htaking":47141,"ancial":47142,"Pages":47143,"orthodox":47144,"ropy":47145,"EEE":47146,"Ġtranssexual":47147,"?????":47148,"Ġsurpr":47149,"arthy":47150,"ĠPsychic":47151,"Ġdorsal":47152,"cember":47153,"joice":47154,"/+":47155,"verend":47156,"uint":47157,"Ġderog":47158,"Subject":47159,"hemat":47160,"!]":47161,"Ġ);":47162,"Ġmeshes":47163,"Ġreperc":47164,"ĠTerran":47165,"åĪ":47166,"Load":47167,"å¹":47168,"ikarp":47169,"rompt":47170,"Ġgoblins":47171,"ĠShattered":47172,"tests":47173,"Spread":47174,"ĠNaruto":47175,"Ġpredic":47176,"Hyp":47177,"ĠArkham":47178,"ĠNASL":47179,"Material":47180,"Rule":47181,"raviolet":47182,"ĠKlingon":47183,"Memory":47184,"acers":47185,"Known":47186,"Important":47187,"Ġα":47188,"Ġtraged":47189,"Ġshalt":47190,"Ġiso":47191,"ĠJSON":47192,"Instant":47193,"Ġpg":47194,"Ġexponent":47195,"formance":47196,"bitcoin":47197,"DOS":47198,"cheat":47199,"Ġrook":47200,"ĠBiol":47201,"noticed":47202,"Ġtwent":47203,"ĠRedux":47204,"ĠBorderlands":47205,"Supported":47206,"TRUMP":47207,"Ġturrets":47208,"include":47209,"Effect":47210,"Ġdisg":47211,"ophical":47212,"ĠFaction":47213,"wiki":47214,"Ġsrc":47215,"Laun":47216,"TIT":47217,"Ġorbs":47218,"Ġincompet":47219,"Ġdescriptor":47220,"ĠTrog":47221,"Contribut":47222,"ĠGodd":47223,"inances":47224,"Ult":47225,"lyak":47226,"âĢ¢âĢ¢âĢ¢âĢ¢":47227,"stitial":47228,"essim":47229,"Graphics":47230,"ubis":47231,"Ġegreg":47232,"DEV":47233,"Ġannotations":47234,"Yang":47235,"ĠDruid":47236,"ĠInquisition":47237,"ohydrate":47238,"Critical":47239,"æĸ":47240,"Sample":47241,"ĠPref":47242,"ĠUnleashed":47243,"ĠAccessed":47244,"Ġconceptions":47245,"Minor":47246,"pard":47247,"prus":47248,"Factory":47249,"thinkable":47250,"Ġexecutable":47251,"chapter":47252,"inyl":47253,"Display":47254,"ilater":47255,"Released":47256,"ĠDirectX":47257,"aneers":47258,"Ġ______":47259,"ĠHilbert":47260,"Options":47261,"Ġsorcery":47262,"esm":47263,"ÏĦ":47264,"Ġdescript":47265,"ĠTycoon":47266,"psons":47267,"Ġcov":47268,"Launch":47269,"ogeneity":47270,"Ġsacrific":47271,"ADRA":47272,"netflix":47273,"flix":47274,"usage":47275,"properties":47276,"attach":47277,"req":47278,"Resource":47279,"requisite":47280,"1007":47281,"ĠMIDI":47282,"ĠZoro":47283,"Tue":47284,"hower":47285,"dds":47286,"ynasty":47287,"headers":47288,"Ġdisproportion":47289,"omaly":47290,"Ġvim":47291,"inces":47292,"edient":47293,"ĠWraith":47294,"ilibrium":47295,"Hig":47296,"ĠFrie":47297,"Meat":47298,"ldom":47299,"KNOWN":47300,"orgetown":47301,"Improve":47302,"10000":47303,"Ġretarded":47304,"Disclaimer":47305,"Ġunfocused":47306,"ĠUnsure":47307,"ĠElixir":47308,"idth":47309,"atural":47310,"ĠErr":47311,"Critics":47312,"ĠBows":47313,"ifferent":47314,"proxy":47315,"Lic":47316,"aucas":47317,"rolet":47318,"ĠCoC":47319,"Ġdoesnt":47320,"phabet":47321,"Version":47322,"Ġhepat":47323,"gif":47324,"izophren":47325,"ãĥ»":47326,"ĠGutenberg":47327,"β":47328,"phans":47329,"Scene":47330,"Ġaccomp":47331,"ilings":47332,"rypted":47333,"aceae":47334,"arantine":47335,"heses":47336,"iasco":47337,"lopp":47338,"ĠGSL":47339,"disk":47340,"ãĢģ":47341,"0010":47342,"ĠOutbreak":47343,"Column":47344,"odox":47345,"atform":47346,"ĠThrust":47347,"ĠSVG":47348,"Enhanced":47349,"¯":47350,"Tools":47351,"rogens":47352,"xus":47353,"Available":47354,"zbollah":47355,"è¡":47356,"osate":47357,"usb":47358,"ordes":47359,"Matrix":47360,"ĠBlazing":47361,"ascus":47362,"ĠSovere":47363,"hement":47364,"*:":47365,"amaru":47366,"Ġparsed":47367,"Bonus":47368,"otrop":47369,"spell":47370,"ancock":47371,"ĠEnchant":47372,"vP":47373,"ĠReferred":47374,"Ġalot":47375,"ĠRuntime":47376,"ĠFn":47377,"CPU":47378,"ĠNicotine":47379,"External":47380,"ĠNightmares":47381,"Ġentropy":47382,"kB":47383,"ĠRealms":47384,"Ġ##":47385,"Ġsubmar":47386,"ĠSlime":47387,"itual":47388,"ĠBastard":47389,"Ġacknowled":47390,"Magazine":47391,"rendered":47392,"ircraft":47393,"CSS":47394,"Numbers":47395,"Pg":47396,"utenant":47397,"ĠPalest":47398,"ĠRoose":47399,"udicrous":47400,"anooga":47401,"Unt":47402,"Ġcapacitor":47403,"Ġschema":47404,"hematic":47405,"ĠPinball":47406,"endars":47407,"Ġ===":47408,"nsic":47409,"ipedia":47410,"Ġchromos":47411,"ĠmRNA":47412,"Ct":47413,"ĠPaladin":47414,"sonian":47415,"Ġæ":47416,"ajor":47417,"repeat":47418,"ortex":47419,"ĠHeroic":47420,"ĠHera":47421,"ociated":47422,"Ġdebug":47423,"osher":47424,"upiter":47425,"_.":47426,"Ġsys":47427,"ĠDownloads":47428,"','":47429,"Adventure":47430,"FORE":47431,"ocument":47432,"arning":47433,"Ġmiscon":47434,"vidia":47435,"Cod":47436,"ibraries":47437,"buffer":47438,"cdn":47439,"ĠModes":47440,"tarian":47441,"ĠPyro":47442,"ĠFixes":47443,"ĠâĪ":47444,"ĠCf":47445,"Testing":47446,"Byte":47447,"nants":47448,"oufl":47449,"ĠCipher":47450,"Aim":47451,"ĠAfgh":47452,"ĠStarCraft":47453,"intendent":47454,"akespe":47455,"Apply":47456,">>>":47457,"Lenin":47458,"ĠShaman":47459,"%\"":47460,"ĠFrenzy":47461,"illusion":47462,"===":47463,"Website":47464,"Allow":47465,"ĠBinary":47466,"ensable":47467,"ĠEmpires":47468,"Ġpromul":47469,"ormonal":47470,"ileaks":47471,"ĠAmmo":47472,"assies":47473,"atican":47474,"avior":47475,"ĠIter":47476,"1024":47477,"uesday":47478,"ĠAppears":47479,"achine":47480,"Problem":47481,"ousy":47482,"ramid":47483,"nox":47484,"··":47485,"omething":47486,"ĠPurg":47487,"artney":47488,"Ġ0000":47489,"psey":47490,"Ġglutamate":47491,"ĠActivate":47492,"Repl":47493,"Priv":47494,"cyclop":47495,"ĠHispan":47496,"atsuki":47497,"Likewise":47498,"JOHN":47499,"POSE":47500,"pherd":47501,"schild":47502,"Ġsuffix":47503,"åIJ":47504,"Ġoptionally":47505,"ĠRecomm":47506,"ĠSpawn":47507,"ARDIS":47508,"Ġinconsist":47509,"Ġenglish":47510,"Beta":47511,"ĠContains":47512,"uddenly":47513,"Ġls":47514,"Dynamic":47515,"åĽ":47516,"Ġ{{":47517,"dq":47518,"Hmm":47519,"oliberal":47520,"ĠCarnage":47521,"ĠRebirth":47522,"incerity":47523,"Ġproletariat":47524,"ĠCrafting":47525,"Explore":47526,"Ġeld":47527,"ĠAnarch":47528,"Ġ(>":47529,"ĠClockwork":47530,"ĠProced":47531,"APTER":47532,"ĠSorcerer":47533,"âĶ":47534,"ĠSnape":47535,"elist":47536,"Balance":47537,"Tube":47538,"Ġ--------------------":47539,"Ġnostalg":47540,"ACTED":47541,"ĠVID":47542,"soever":47543,"ignt":47544,"Ġhypothal":47545,"ĠObj":47546,"igure":47547,"ĠElves":47548,"gorithm":47549,"Romney":47550,"idable":47551,"renheit":47552,"aptic":47553,"Ġnonex":47554,"Profile":47555,"Ġscient":47556,"ĠAchievements":47557,"ĠReload":47558,"Products":47559,"ampire":47560,"pread":47561,"ĠYamato":47562,"Thread":47563,"ĠFML":47564,"ĠForsaken":47565,"Statistics":47566,"Ġ([":47567,"utsu":47568,"nces":47569,"...?":47570,"upload":47571,"Typ":47572,"ĠReflex":47573,"Dial":47574,"Ġspawns":47575,"Server":47576,"Ġacquaint":47577,"iterranean":47578,"='":47579,"Device":47580,"ר":47581,"ocaly":47582,"Remove":47583,"Ġ=====":47584,"Ġabdom":47585,"ideos":47586,"Dual":47587,"Fax":47588,"Ġbesie":47589,"ĠAdin":47590,"Ġdescrib":47591,"Ġiod":47592,"Limit":47593,"aunders":47594,"ĠAssassins":47595,"xxxx":47596,"ulner":47597,"Shipping":47598,"Item":47599,"fortune":47600,"Ġcipher":47601,"mA":47602,"acerb":47603,"ebus":47604,"Ġmodifiers":47605,"Added":47606,"prisingly":47607,"Dir":47608,"ĠArchangel":47609,"umbnails":47610,"Huh":47611,"ĠWARN":47612,"Role":47613,"usional":47614,"Ġcortical":47615,"ĠSCP":47616,"ĠException":47617,"ĠWarhammer":47618,")))":47619,"](":47620,"Ġsynaptic":47621,"Ġcached":47622,"archment":47623,"Ġtarg":47624,"Filter":47625,"ĠHades":47626,"Ġprinc":47627,"halla":47628,"ptoms":47629,"Ïģ":47630,"ructose":47631,"termination":47632,"Ġcompe":47633,"define":47634,"Ġprosec":47635,"require":47636,"ĠCorpse":47637,"Abstract":47638,"********************************":47639,"Used":47640,"ĠIbid":47641,"trak":47642,"ä¸Ń":47643,"ĠGABA":47644,"åĬ":47645,"ĠHegel":47646,"Jere":47647,"odore":47648,"í":47649,"namese":47650,"Origin":47651,"ĠMastery":47652,"gerald":47653,"Charges":47654,"--------------------":47655,"Forge":47656,"comings":47657,"åį":47658,"Ġ(&":47659,"Ġgrap":47660,"Mask":47661,"ĠGundam":47662,"generic":47663,"ĠMalf":47664,"raphics":47665,"Internal":47666,"ourge":47667,"Ġirresist":47668,"sterdam":47669,"Ġendogenous":47670,"Export":47671,"Ġë":47672,"poons":47673,"Ġabund":47674,"ĠQuantity":47675,"Issue":47676,"âĪĴ":47677,"cknow":47678,"Anonymous":47679,"ĠDRAG":47680,"Wikipedia":47681,"Ġsubdu":47682,"iverpool":47683,"apesh":47684,"Ability":47685,"ĠCentOS":47686,"iseum":47687,"lycer":47688,"Untitled":47689,"Ġlineback":47690,"Ġtomat":47691,"byte":47692,"tile":47693,"linux":47694,"Palest":47695,"canon":47696,"FAULT":47697,"ĠkHz":47698,"Ġhelic":47699,"ĠIGF":47700,"WARE":47701,"Feature":47702,"ĠGraveyard":47703,"ĠNemesis":47704,"akuya":47705,"inement":47706,"Ġwhence":47707,"ractical":47708,"Ping":47709,"tesque":47710,"scroll":47711,"espie":47712,"Ġasynchronous":47713,"ocre":47714,"Measure":47715,"morph":47716,"std":47717,"Settings":47718,"Course":47719,"Ġ],":47720,"Ïĥ":47721,"Documents":47722,"estern":47723,"Ġtf":47724,"Ġcircumcised":47725,"geant":47726,"Ġconject":47727,"ĠFolder":47728,"outube":47729,"ĠMedline":47730,"Status":47731,"ctr":47732,"anoia":47733,"ĠPowerShell":47734,"Chel":47735,"Loop":47736,"Ġresize":47737,"aphael":47738,"workshop":47739,"velength":47740,"hover":47741,"flush":47742,"Ġβ":47743,"Task":47744,"pedia":47745,"ptin":47746,"bidden":47747,"windows":47748,"ĠCaucas":47749,"aml":47750,"isoft":47751,"Ġrs":47752,"cgi":47753,"urrection":47754,"miah":47755,"ÏĤ":47756,"Ġplaythrough":47757,"Reddit":47758,"׾":47759,"Ġannotation":47760,"Ġnobles":47761,"seq":47762,"mares":47763,"Ġwik":47764,"foreseen":47765,"RPG":47766,"Ġreper":47767,"aredevil":47768,"arcity":47769,"/\"":47770,"Ġ});":47771,"Ġdiscont":47772,"ĠBinding":47773,"answered":47774,"Mesh":47775,"ĠMPEG":47776,"Ġperceptual":47777,"OTAL":47778,"ursive":47779,"ãģĦ":47780,"Ġplun":47781,"onential":47782,"ãĤ":47783,"ĠReloaded":47784,"iscopal":47785,"ĠDespair":47786,"FIX":47787,"Ġheterogeneity":47788,",[":47789,"ichick":47790,"DCS":47791,"Ġcooldown":47792,"................":47793,"Ġsomew":47794,"Battery":47795,"stract":47796,"Attempt":47797,"allery":47798,"ĠNept":47799,"Ġtac":47800,"ĠElemental":47801,"Function":47802,"Ġbindings":47803,"versive":47804,"ĠWarlock":47805,"Response":47806,"ĠNPCs":47807,"ollower":47808,"ĠReborn":47809,"Ġphenotype":47810,"uscript":47811,"Ġpecul":47812,"!/":47813,"Unique":47814,"ĠFreeBSD":47815,"ĠChero":47816,"Ġcolle":47817,"gently":47818,"Empty":47819,"rss":47820,"Ġdd":47821,"forge":47822,"ĠTraps":47823,"×Ķ":47824,"iblical":47825,"---------":47826,"uminati":47827,"login":47828,"asus":47829,"xual":47830,"ĠMiko":47831,"ĠDrac":47832,"ssh":47833,"Submit":47834,"ĠMultiplayer":47835,"leanor":47836,"Orig":47837,"anism":47838,"peror":47839,"ĠESV":47840,"Ġencour":47841,"å°":47842,"ĠPLoS":47843,"ĠCrusher":47844,"ocrates":47845,"ynchronous":47846,"§":47847,"ĠLuffy":47848,"Lastly":47849,"Ġdiffere":47850,"okane":47851,"Enh":47852,"ursor":47853,"Ġapopt":47854,"ĠTotem":47855,"ä½":47856,"Honest":47857,"xml":47858,"Created":47859,"Ġteleport":47860,"NRS":47861,"ccess":47862,"ilitary":47863,"ackets":47864,"Ġenchantment":47865,"ĠCunning":47866,"ortmund":47867,"Altern":47868,"Alternatively":47869,"ĠLuthor":47870,"Publisher":47871,"GBT":47872,"çĶ":47873,"Activity":47874,"Ġleptin":47875,"æĪ":47876,"ĠStarfleet":47877,"å¸":47878,"oooooooo":47879,"Ġlawy":47880,"Frag":47881,"ת":47882,"yright":47883,"cookie":47884,"Finish":47885,"wikipedia":47886,"ĠAbilities":47887,"interface":47888,"Ġglared":47889,"Engineers":47890,"ĠAtk":47891,"oteric":47892,"Ġbyte":47893,"ossibility":47894,"Label":47895,"ĠCSV":47896,"Ġè":47897,"ĠOblivion":47898,"android":47899,"rehensive":47900,"ĠCommands":47901,"clud":47902,"ĠTutorial":47903,"retched":47904,"irlwind":47905,"conserv":47906,"ministic":47907,"void":47908,"ernels":47909,"alias":47910,"ĠDraco":47911,"desktop":47912,"ĠMormonism":47913,"oÄŁ":47914,"kef":47915,"Ġtimestamp":47916,"WAYS":47917,"ãģĹ":47918,"\"(":47919,"eneg":47920,"CHAT":47921,"Ġnpm":47922,"ĠGrenade":47923,"rongh":47924,"dinand":47925,"Definition":47926,"ĠInteger":47927,"Ġmodifier":47928,"Ġdex":47929,"ĠParameters":47930,"andestine":47931,"ĠSHALL":47932,"Purchase":47933,"enaries":47934,"Ġstarship":47935,"Armor":47936,"Skill":47937,"Ġlookup":47938,"verages":47939,"Minimum":47940,"ĠBleach":47941,"Ġdf":47942,"inosaur":47943,"ixel":47944,"Zip":47945,"temp":47946,"ruby":47947,"Fram":47948,"sword":47949,"Minecraft":47950,"strous":47951,"Client":47952,"ĠBarbarian":47953,"æĹ":47954,"USER":47955,"ĠMehran":47956,"axies":47957,"ermanent":47958,"ĠHeader":47959,"ablishment":47960,"hyde":47961,"Snake":47962,"ĠTelesc":47963,"Pocket":47964,"Ġ........":47965,"Destroy":47966,"Method":47967,"ĠZup":47968,"olulu":47969,"Ġunemploy":47970,"Temp":47971,"ĠExplicit":47972,"人":47973,"cache":47974,"innamon":47975,"Ġunavoid":47976,"Summary":47977,"Ġappre":47978,"Ġtaxp":47979,"XXX":47980,"ieval":47981,"ĠSummon":47982,"å¤":47983,"Lear":47984,"ibliography":47985,"CLASS":47986,"dimension":47987,"ĠHorde":47988,"Ġfilesystem":47989,"ĠQiao":47990,"obbies":47991,"DIR":47992,"Ġimpedance":47993,"éĩ":47994,"Names":47995,"ĠDrupal":47996,"Applic":47997,"imei":47998,"ynchron":47999,"Ire":48000,"ĠMinion":48001,"ĠHaste":48002,"ä¿":48003,"Ġ(=":48004,"LinkedIn":48005,"Maps":48006,"ifacts":48007,"Damage":48008,"odynam":48009,"ĠShroud":48010,"Ancient":48011,"enhagen":48012,"Tact":48013,"anship":48014,"aturdays":48015,"ãģ«":48016,"ikhail":48017,"ãģ®":48018,"framework":48019,"lication":48020,"â̦]":48021,"Plug":48022,"ĠLilith":48023,"browser":48024,"offset":48025,"ĠJuda":48026,"ciating":48027,"console":48028,"Ġ=================":48029,"._":48030,"ĠPuzz":48031,"OPLE":48032,"erial":48033,"OHN":48034,"ĠGolem":48035,"ierrez":48036,"Ġ},":48037,"inition":48038,"insula":48039,"ĠEntered":48040,"greSQL":48041,"ĠFlask":48042,"ĠXCOM":48043,"fixes":48044,"ĠWeasley":48045,"arser":48046,"Ġrc":48047,"microsoft":48048,"HHHH":48049,"INFO":48050,"rehend":48051,"Ġpolymorph":48052,"Button":48053,"âī":48054,"QUI":48055,"twitch":48056,"jriwal":48057,"ĠSaiyan":48058,"Ġadherent":48059,"acters":48060,"arthed":48061,"âĢł":48062,"Ġfoss":48063,"ã":48064,"Quote":48065,"ependent":48066,"Ġhorr":48067,"UGC":48068,"Weiss":48069,"styles":48070,"advertisement":48071,"Credits":48072,"Lua":48073,"ĠUCH":48074,"Ġhorrend":48075,"Ġminion":48076,">,":48077,"ãĥ³":48078,"Ġinclud":48079,"Compar":48080,"Ġ[]":48081,"Ġ(<":48082,"Phones":48083,"paralleled":48084,"HTML":48085,"Ġ(%":48086,"raltar":48087,"Ġamd":48088,"Maximum":48089,"ĠSolitaire":48090,"SCP":48091,"ĠVaugh":48092,"ĠCLR":48093,"database":48094,"module":48095,"̶":48096,"Capture":48097,"Window":48098,"ubuntu":48099,"Includes":48100,"ĠUriel":48101,"ORPG":48102,"κ":48103,"âĪ":48104,"ä¸Ģ":48105,"Ġdexter":48106,"ĠGlac":48107,"slice":48108,"HAHAHAHA":48109,"\\\"":48110,"lations":48111,"ÙIJ":48112,"ĠAUTH":48113,"earch":48114,"ĠSocket":48115,"Character":48116,"Sort":48117,"Ġindist":48118,"/_":48119,"ĠAntar":48120,"ifix":48121,"Ġlich":48122,"variable":48123,"_(":48124,"Ġgui":48125,"Herm":48126,"elvet":48127,"è¯":48128,"Developer":48129,"Ġkcal":48130,"ciation":48131,"Transaction":48132,"Ġdocker":48133,"###":48134,"ĠVegeta":48135,"Result":48136,"ocamp":48137,"aughtered":48138,"Increase":48139,"aples":48140,"iannopoulos":48141,"zbek":48142,"estyles":48143,"emonium":48144,"è¿":48145,"ĠFANT":48146,"Reason":48147,"Elsewhere":48148,"\"\"":48149,"ĠArtifact":48150,"Authent":48151,"herical":48152,"Ġmembr":48153,"socket":48154,"Elsa":48155,"Condition":48156,"Ġlapt":48157,"Ġsorcerer":48158,"Layer":48159,"apters":48160,"Ġveter":48161,"Myth":48162,"ensical":48163,"ÏĢ":48164,"noxious":48165,"Ġunpre":48166,"Flags":48167,"OOOOOOOO":48168,"Ġincent":48169,"Combat":48170,"Session":48171,"Ġteleportation":48172,"éĢ":48173,"ortment":48174,"Admin":48175,"Fixed":48176,"×Ļ":48177,"Ġconfir":48178,"ãģŁ":48179,"morrow":48180,"osponsors":48181,"\\/":48182,"ictionary":48183,"Num":48184,"Ġquir":48185,"åº":48186,"à¨":48187,"Ġ<<":48188,"Attempts":48189,"ãģ§":48190,"λ":48191,"Features":48192,"XXXX":48193,"Ġinflamm":48194,"VERSION":48195,"ortality":48196,"spawn":48197,"ratulations":48198,"Ġcharism":48199,"Ġ&&":48200,"Dialogue":48201,"luster":48202,"<<":48203,"args":48204,"redients":48205,"Ġpredicate":48206,"qqa":48207,"etheus":48208,"Ġ(!":48209,"Ġshowc":48210,"cmd":48211,"bringer":48212,"Ġcoh":48213,"Input":48214,"ĠFANTASY":48215,"Ġfict":48216,"Blocks":48217,"Install":48218,"vector":48219,"umblr":48220,"agnar":48221,"Array":48222,"Ġembry":48223,"Ġtheoret":48224,"Ġhref":48225,"irrel":48226,"irements":48227,"iations":48228,"Ġ(/":48229,"Thumbnail":48230,"Ġhashes":48231,"^^":48232,"Copy":48233,"Ġeq":48234,"translation":48235,"Favorite":48236,"Fail":48237,"Ġogre":48238,"isites":48239,"Merit":48240,"ãģ¦":48241,"DATA":48242,"rarily":48243,"igmatic":48244,"Sequ":48245,"Els":48246,"ãģª":48247,"lehem":48248,"requency":48249,"aughed":48250,"Ġdistingu":48251,"Ġartific":48252,"Ġdwarves":48253,"Í":48254,"resy":48255,"~~":48256,"sofar":48257,"ideon":48258,"ozyg":48259,"EEEE":48260,"ĠMelee":48261,"大":48262,"tumblr":48263,"ssl":48264,"Wra":48265,"ONSORED":48266,"Ġvowel":48267,"},":48268,"Vari":48269,"cientious":48270,"Node":48271,"Ġsorce":48272,"========":48273,"perse":48274,"Detailed":48275,"isphere":48276,"Background":48277,"ĺħ":48278,"Redd":48279,"ìĿ":48280,"ãģ¨":48281,"ĠCTRL":48282,"Ġç":48283,"iculty":48284,"ername":48285,"Ġns":48286,"Deploy":48287,"Ġhapp":48288,"Ġ///":48289,"Begin":48290,"Ġgp":48291,"$.":48292,"Output":48293,"Suggest":48294,"×IJ":48295,"ĠToggle":48296,"Ġnutrit":48297,"Ġ\\\"":48298,"Ġpreval":48299,"Ġsubreddits":48300,"Menu":48301,"Amount":48302,"ĠWasteland":48303,"Ġsprites":48304,"Ġshader":48305,"Ġ;)":48306,"NAME":48307,"CLUD":48308,"Ġgoblin":48309,"Refer":48310,"ÙĴ":48311,"á¹":48312,"Improved":48313,"endiary":48314,"Ġassail":48315,"chieve":48316,"reply":48317,"Ġcontrad":48318,"cients":48319,"GROUP":48320,"Controller":48321,"omsky":48322,"chemist":48323,"packages":48324,"ombies":48325,"scl":48326,"Ġibn":48327,"çĽ":48328,":(":48329,"ĠMinotaur":48330,"niper":48331,"====":48332,"Ġsubsc":48333,"è¦":48334,"Ġinteger":48335,"Ġ\"-":48336,"Ġtheorem":48337,"utenberg":48338,"Trigger":48339,"github":48340,"ä¼":48341,"##":48342,"xtap":48343,"oké":48344,"ilial":48345,"idepress":48346,":\\":48347,"Param":48348,"Correction":48349,"ïve":48350,"Chest":48351,"ש":48352,"ĠÏĦ":48353,"Ġrespawn":48354,"Ġrall":48355,"Ġcreatine":48356,"umsy":48357,"ĠTemplate":48358,"foo":48359,"query":48360,"Ġmanufact":48361,"Hardware":48362,"iframe":48363,"Ġ-------":48364,"Ġrecip":48365,"ĠAttributes":48366,"Ġforeskin":48367,"ãĤĭ":48368,"ãĥĦ":48369,"uania":48370,"................................................................":48371,"Ġphylogen":48372,"eaturing":48373,"Ġsprite":48374,"Ġinvari":48375,"DonaldTrump":48376,"({":48377,"ĠMalfoy":48378,"Gamer":48379,"ĠPlugin":48380,"γ":48381,"Query":48382,"ĠPuzzles":48383,"inventory":48384,"trl":48385,"Insert":48386,"Ġawa":48387,"ĠWerewolf":48388,"Ġhorizont":48389,"×ŀ":48390,"Ġcunt":48391,"]]":48392,"ĠByz":48393,"Mouse":48394,"Ġ[[":48395,"ĠCthulhu":48396,"ĠDRAGON":48397,"Default":48398,"ĠPresbyter":48399,"Ġff":48400,"Ġorcs":48401,"Construct":48402,"ĠDebug":48403,"Ġ*/":48404,"×ij":48405,"Ġembr":48406,"License":48407,"css":48408,"incinn":48409,"Prosecut":48410,"Ġsugg":48411,"å¾":48412,"ĠUndead":48413,"æĿ":48414,"Ġfs":48415,"Ġthw":48416,"Vector":48417,"åĮ":48418,"settings":48419,"å¯":48420,"Ġssh":48421,"ĠConverted":48422,"ãĤĴ":48423,"risome":48424,"Ġagre":48425,"Collection":48426,"cmp":48427,"puter":48428,"alloc":48429,"Ġé":48430,"ascade":48431,"ĠSpells":48432,"Ġ:-)":48433,"Haunted":48434,"Ġadolesc":48435,"FORMATION":48436,"ĠImperium":48437,"ãĥ¼":48438,"Supplement":48439,"Render":48440,"Theme":48441,"ĠTorment":48442,"([":48443,"ëĭ":48444,"Ġhtml":48445,"Ġjuven":48446,"ĠSiber":48447,"Ġdaemon":48448,"ivariate":48449,"objects":48450,"negie":48451,"Ġindu":48452,"landish":48453,"Meta":48454,"Impl":48455,"Ġglyph":48456,"Ġ-->":48457,"Ġstreng":48458,"agascar":48459,"guyen":48460,"((":48461,")[":48462,"ĠNorn":48463,"Ġhippocamp":48464,"Ġ¯":48465,"îĢ":48466,"Connection":48467,"PATH":48468,"mbuds":48469,"ĠShards":48470,"Ġadvoc":48471,"Ġsimulac":48472,"âĸij":48473,"!?\"":48474,"ĠPotion":48475,"Ġamulet":48476,"ĠFnatic":48477,"Ġcryptoc":48478,"wav":48479,"radius":48480,"pkg":48481,"ĠMFT":48482,"æĢ":48483,"Ġtoile":48484,"Items":48485,"ifference":48486,"errors":48487,"ĠCelt":48488,"Ġunpop":48489,"ilogy":48490,"6666":48491,"hesda":48492,"Instruct":48493,"å·":48494,"Materials":48495,"ettings":48496,"Percent":48497,"Ġresistor":48498,"tymology":48499,"Ġdeprecated":48500,"Ġgrep":48501,"ĠWRITE":48502,"Ġtriv":48503,"Ġscrut":48504,"[/":48505,"anyl":48506,"skirts":48507,"MSN":48508,"ĠCodec":48509,"ecd":48510,"Anth":48511,"){":48512,"%]":48513,"veyard":48514,"aspberry":48515,"ãĢ":48516,"Reward":48517,"rha":48518,"Stretch":48519,"]-":48520,"Prev":48521,"Context":48522,"Ġlinux":48523,"HAHA":48524,"perties":48525,"ĠVIDE":48526,"Domain":48527,"Ġmurd":48528,"ĠLegions":48529,"apache":48530,"æŃ":48531,"Pause":48532,"Temperature":48533,"ufact":48534,"igslist":48535,"ĠRetrieved":48536,"èª":48537,"ãģĮ":48538,"Ingredients":48539,"ruary":48540,"dyl":48541,"Alias":48542,"ĠÎĶ":48543,"Ġinval":48544,"amsung":48545,"!--":48546,"olean":48547,"æī":48548,"ãģ¯":48549,"Ġcoefficients":48550,"ĠDHCP":48551,"âĨĴ":48552,"utonium":48553,":[":48554,"âĹ":48555,"cli":48556,"Container":48557,"å¼":48558,"nexus":48559,"SOURCE":48560,"Ò":48561,"=/":48562,"Ġmysql":48563,"ĠGained":48564,"Ġ/*":48565,"uncture":48566,"Ġstatically":48567,"âĸł":48568,"æĺ¯":48569,"æ°":48570,"estamp":48571,"Cache":48572,"ulkan":48573,"staking":48574,"apter":48575,"ãģ¾":48576,"Ġμg":48577,"Ġtremend":48578,"ĠPiercing":48579,"naissance":48580,"ĠHealer":48581,"Enabled":48582,"éģ":48583,"âĸ":48584,"ĠThumbnails":48585,"Ġhither":48586,"Format":48587,"utherland":48588,"íķ":48589,"Ġdestro":48590,"fff":48591,"execute":48592,"msg":48593,"romancer":48594,"ĠCanaver":48595,"ĠVaults":48596,"oided":48597,"iage":48598,"Ġimg":48599,"summary":48600,"]);":48601,"ĠABE":48602,"ĠGamergate":48603,"utherford":48604,"Ġoverwrite":48605,"enment":48606,"æķ":48607,"Ġsystemd":48608,"tif":48609,"]).":48610,"ãĤ¤":48611,"Widget":48612,"======":48613,"(-":48614,"Ġ\"+":48615,"ĠIncarnation":48616,"æĥ":48617,"���":48618,"GUI":48619,"èĥ":48620,"forums":48621,"Ġrunes":48622,"Ġâī¤":48623,"Ġdefic":48624,"Distance":48625,"directory":48626,"ĠHorus":48627,"iltr":48628,"ortium":48629,"Ġ./":48630,"bda":48631,"owship":48632,"ĠâĨij":48633,"}.":48634,"åĩ":48635,"1027":48636,"Weapons":48637,"lucent":48638,"Ġauth":48639,";;":48640,"Recommended":48641,"Ġsurv":48642,"Ġvm":48643,"ĠStronghold":48644,"Ġparan":48645,"ĠTrance":48646,"æĺ":48647,"Ġsovere":48648,"Ġcorrid":48649,"ĠPwr":48650,"Ġ[/":48651,"Ġseq":48652,"Population":48653,"Ġ[];":48654,"Ġreferen":48655,"ĠInstr":48656,"ĠStamina":48657,"kernel":48658,"Python":48659,"-+":48660,"Ġallele":48661,"éĽ":48662,"isode":48663,"ä¸į":48664,"otonin":48665,"modules":48666,"Notable":48667,"Spell":48668,"\\\\":48669,"Pref":48670,"Ġdatas":48671,"setup":48672,"Ġhapl":48673,"Height":48674,"åĭ":48675,"ãģ£":48676,"]),":48677,"Handle":48678,"umenthal":48679,"Package":48680,"Ġenthus":48681,"Ġunsus":48682,"Narr":48683,"Examples":48684,"FAQ":48685,"REDACTED":48686,"Ġnotor":48687,"Enable":48688,"Pattern":48689,"aeda":48690,">.":48691,"CHECK":48692,"Ġ����":48693,"Ġ'.":48694,"Ġãĥ":48695,"append":48696,"����":48697,"gemony":48698,"terness":48699,"ĠHaku":48700,"NVIDIA":48701,"queue":48702,"Bind":48703,"Ġneigh":48704,"armor":48705,"retty":48706,"LOD":48707,"plugins":48708,"Ġ/>":48709,"TYPE":48710,"Ġ4096":48711,"-------":48712,"Preview":48713,"FML":48714,"Ġproletarian":48715,"zees":48716,"enfranch":48717,"ãģĨ":48718,"Ctrl":48719,"Module":48720,"ĠSurviv":48721,"ĠStarcraft":48722,"rored":48723,"reddit":48724,"Ġrul":48725,"Ġtx":48726,"Ġmage":48727,"Sword":48728,"Ġ~/":48729,"Effects":48730,"éļ":48731,"ä¹":48732,"Sensor":48733,"Solution":48734,"ãģĻ":48735,"Arcade":48736,"Ġpredec":48737,"Values":48738,"Length":48739,"Ġfortun":48740,"ttp":48741,"\"[":48742,"tmp":48743,"ĠBerserker":48744,"åĨ":48745,"ositories":48746,"Ġcouncill":48747,"ffff":48748,"));":48749,"Recipe":48750,"ĠASCII":48751,"âĦ¢:":48752,"ä":48753,"Ġhorm":48754,"=>":48755,"sers":48756,"ãģĭ":48757,"Recommend":48758,"['":48759,"agame":48760,"Animation":48761,"aucuses":48762,"Discussion":48763,"Ġhelicop":48764,"å¿":48765,"Float":48766,"Component":48767,"instance":48768,"Ġfoo":48769,"localhost":48770,"=-":48771,"Offset":48772,"Psy":48773,"ĠGohan":48774,"buquerque":48775,"Ġdefe":48776,"chwitz":48777,"parse":48778,"Ġdors":48779,"Ġspons":48780,"Ġasync":48781,"agonists":48782,"Ġindo":48783,".>>":48784,"ĠDisciple":48785,"Ġfilename":48786,"rency":48787,"ĠDise":48788,"Ġ\"/":48789,"template":48790,"ãĤ¹":48791,"swers":48792,"Ġ++":48793,"Ġ[(":48794,"thora":48795,"ĠDepths":48796,"livious":48797,"Ġdisadvant":48798,"foundland":48799,"Upload":48800,"Ġ§§":48801,"Ġsophistic":48802,";}":48803,"izont":48804,"\"}":48805,"estial":48806,"Ranked":48807,"ĠOccupations":48808,"LEASE":48809,"ĠOgre":48810,"folder":48811,"Plot":48812,"farious":48813,"Ġsuscept":48814,"Types":48815,"Discuss":48816,"Ġ'/":48817,"æµ":48818,"earable":48819,"æ³":48820,"Tile":48821,"iatus":48822,"åŃ":48823,"Ġreperto":48824,"Helper":48825,"Returns":48826,"ä¸Ĭ":48827,"imaru":48828,"Ġreq":48829,"Ġdissatisf":48830,"multipl":48831,"}{":48832,"-[":48833,"itial":48834,"*/":48835,"Config":48836,"Example":48837,"ĠjQuery":48838,"Mods":48839,"ĠGPIO":48840,"Ġlaun":48841,"layout":48842,"cised":48843,"Ġ......":48844,"+++":48845,"prototype":48846,"Exception":48847,"Ġsubsections":48848,"Ġresemb":48849,"Ġâĩ":48850,"ĠPubMed":48851,"username":48852,"Ġaggro":48853,"éĥ":48854,"Ġ};":48855,"ĠMages":48856,"ryu":48857,"apons":48858,"Optional":48859,"ĠAncients":48860,"ãĤĬ":48861,"Quotes":48862,"oaded":48863,"Ġsuspic":48864,"inline":48865,"omial":48866,"ĠMahjong":48867,"auntlets":48868,"Ġanarchism":48869,"Ġsubclass":48870,"ĠMLG":48871,"...]":48872,"Dialog":48873,"uphem":48874,"Ġrecursive":48875,"7601":48876,"frac":48877,"Else":48878,"ĠSeverus":48879,"},{\"":48880,"ĠCLIENT":48881,"Ġjavascript":48882,"sama":48883,"ĠLearns":48884,"ãĤĤ":48885,"Upgrade":48886,"Listener":48887,"Ġsnipp":48888,"Ġrune":48889,"ĠTTL":48890,"ertation":48891,"olicy":48892,"=\"\"":48893,"«ĺ":48894,"Ġexpr":48895,"ovych":48896,"Ġãģ":48897,"_-_":48898,"munition":48899,"////":48900,"func":48901,">>>>":48902,"Provider":48903,"Ïī":48904,"BUG":48905,"Ġ[-":48906,"Ġarrang":48907,"merce":48908,"ãĥ":48909,"incarn":48910,"Valid":48911,"ĠAether":48912,"ãĤĵ":48913,"ĠUTF":48914,"ĠMonstrous":48915,"ãĤĮ":48916,"hedon":48917,"áµ":48918,":#":48919,"ĠFrieza":48920,"padding":48921,"Reviewer":48922,"Ġpsychiat":48923,"yrinth":48924,"ĠâĶĤ":48925,"hillary":48926,"Static":48927,"Newsletter":48928,"Avg":48929,"Ġfn":48930,"Topic":48931,"choes":48932,"Ġnewsp":48933,"á¸":48934,"Ġ[+":48935,"~~~~~~~~~~~~~~~~":48936,":]":48937,"apego":48938,"buf":48939,"Translation":48940,"ById":48941,"Ġmmol":48942,"ãĥ¼ãĥ":48943,"å½":48944,"ãĤī":48945,"Ġparser":48946,"ãĥª":48947,"`,":48948,"Lair":48949,")}":48950,"ypes":48951,"adobe":48952,"Ġancest":48953,"ernel":48954,"ĠNULL":48955,"ç«":48956,"anguages":48957,"Increases":48958,"æĦ":48959,"utorial":48960,"ithmetic":48961,"dll":48962,"ĠArcane":48963,"çī":48964,"Ġtc":48965,"urtles":48966,"èĪ":48967,"Bytes":48968,"Slot":48969,"ĠBahá":48970,"Weapon":48971,"widget":48972,"querque":48973,"Ġembodiments":48974,"å¥":48975,"WARN":48976,"swer":48977,"thumbnails":48978,"FFFF":48979,"inguishable":48980,"Ġâī":48981,"Ġ${":48982,"AAAAAAAA":48983,"Conclusion":48984,"ĻĤ":48985,"disable":48986,"Rect":48987,"Ġsubp":48988,"Ġ().":48989,"ĠDetected":48990,"èĢ":48991,"[]":48992,"Ġcoerc":48993,"ĠmM":48994,"recated":48995,"fusc":48996,"ĠSorce":48997,"çĶŁ":48998,").[":48999,"Ġ})":49000,"mobi":49001,"yip":49002,"Acknowled":49003,"ternity":49004,"iqueness":49005,"ython":49006,"><":49007,"Ġstd":49008,"Url":49009,"Ġnamespace":49010,"Ġtion":49011,"oother":49012,"Ó":49013,"Ġhemor":49014,"Ġrg":49015,"ventory":49016,"ãĤ¢":49017,"anamo":49018,"Socket":49019,"Topics":49020,"apeshifter":49021,"gnu":49022,"Ġdetrim":49023,"`.":49024,"romeda":49025,"çIJ":49026,"Ġlambda":49027,"Compan":49028,"Variable":49029,"Ġusb":49030,"ĠAdamant":49031,"ournal":49032,"Ġcovari":49033,"ãĥ©":49034,"éĸ":49035,"åİ":49036,"otaur":49037,"Ġ(),":49038,"Marginal":49039,"ãģı":49040,"Ġphysic":49041,"adeon":49042,"RESULTS":49043,"200000":49044,"ãģį":49045,"udeb":49046,"ãģĵ":49047,"COMPLE":49048,"Ġmsg":49049,"ghazi":49050,"/*":49051,"ĠDeity":49052,"Ġdisapp":49053,"Availability":49054,"Ġillum":49055,"à©":49056,"ptives":49057,",âĢĶ":49058,"chnology":49059,"Ġaccur":49060,"Ġapi":49061,"Obj":49062,"ãĤ«":49063,"ãĤ¸":49064,"ä¹ĭ":49065,"ËĪ":49066,"Ġtcp":49067,"Required":49068,".<":49069,"\".[":49070,"Ġ~/.":49071,"Ġobser":49072,"RFC":49073,"Ġintegers":49074,"åī":49075,"Installation":49076,"Ô":49077,"ó":49078,"csv":49079,"ãĥ«":49080,"ĠNoticed":49081,"âĸĵ":49082,"Tumblr":49083,"Reply":49084,"||":49085,"Ġconclud":49086,"Ġ))":49087,"ebin":49088,"sql":49089,"Closure":49090,"++++":49091,"],[":49092,"âĹı":49093,"Ġprolet":49094,"Ġ>=":49095,"estinal":49096,"Ġ[*":49097,"ĠInquisitor":49098,"Ġcmd":49099,"FINE":49100,"CRIP":49101,"Ġvertex":49102,"TeX":49103,"///":49104,"Ö¼":49105,"iscons":49106,"Ġmyster":49107,"Changed":49108,"timeout":49109,"irtual":49110,"Methods":49111,"Ġcerts":49112,"texture":49113,"Roaming":49114,"Proxy":49115,"Override":49116,"éĹ":49117,"utf":49118,"python":49119,"ĠRarity":49120,"ilitarian":49121,"çľ":49122,"().":49123,"æł":49124,"Ġbuf":49125,"åij":49126,"çķ":49127,"Ġ*.":49128,"umerable":49129,"~~~~":49130,"å¦":49131,"Ġsimultane":49132,"Ġjson":49133,"Requires":49134,"Ġperl":49135,"Interface":49136,"rupal":49137,"":49138,"uilt":49139,"mercial":49140,"ĠPalestin":49141,"theless":49142,")=":49143,"Generic":49144,"&&":49145,"ALSE":49146,"Ġdebugger":49147,"paralle":49148,"acly":49149,"ĠScourge":49150,")].":49151,"Ġinstr":49152,"Ġ{}":49153,"]+":49154,"Ġdilig":49155,"åŃIJ":49156,"Ġcaptcha":49157,"kefeller":49158,"iosyncr":49159,"Ġchars":49160,"Ġinitialize":49161,"Width":49162,"Ġgithub":49163,"Ġinitialization":49164,"ĠGamerGate":49165,"Ġþ":49166,"drm":49167,"slaught":49168,"Ġtiss":49169,".............":49170,"Ĥ¬":49171,"Ġplent":49172,"ãģķ":49173,"cfg":49174,"âĨ":49175,"Ġpokemon":49176,"\"],":49177,"Ġtyr":49178,"SELECT":49179,"othal":49180,"Tags":49181,"ĠMarketable":49182,"-----------":49183,"icter":49184,"irlf":49185,"ormons":49186,"Database":49187,"ĠãĤ":49188,"Ġ{\"":49189,"î":49190,"Handler":49191,"âĶĢ":49192,"$$$$":49193,"ĠJaune":49194,"ãĤ³":49195,"(),":49196,")+":49197,"--------":49198,"Ġshenan":49199,"Ġwelf":49200,"Ġ',":49201,"attribute":49202,"Uncommon":49203,"maxwell":49204,"Browser":49205,"ĠPastebin":49206,"uberty":49207,"debug":49208,"Ġmosqu":49209,"ĠBoolean":49210,"wcs":49211,"é£":49212,"/âĢĭ":49213,"çĦ":49214,"(){":49215,"////////////////////////////////":49216,"ĠGleaming":49217,"regor":49218,"ĠMercenary":49219,"ensional":49220,"mpeg":49221,"sudo":49222,"ãģ®å":49223,"iggurat":49224,"vironment":49225,"Directory":49226,"ĠDecoder":49227,"SPONSORED":49228,"intendo":49229,"Ġ<=":49230,"btn":49231,"ï¸":49232,"ä½ľ":49233,"paio":49234,"Tokens":49235,"ãĢį":49236,"params":49237,"Offline":49238,"Ġmetab":49239,"ĠLisp":49240,"anwhile":49241,">:":49242,"itialized":49243,"HTTP":49244,"Trivia":49245,"Sov":49246,"wrapper":49247,"={":49248,"ĠAzerb":49249,"aeper":49250,"Ġneighb":49251,"initions":49252,"Ġsts":49253,"ĠSasuke":49254,"#$":49255,"uliffe":49256,"æĸ¹":49257,"++++++++++++++++":49258,"ĠElven":49259,"ãģĤ":49260,"Ġartif":49261,"Folder":49262,"Ġà¨":49263,"åĤ":49264,"Ġphyl":49265,"uggest":49266,"blance":49267,"ãģł":49268,"Requirements":49269,"Usage":49270,"Ġinitialized":49271,"ã쮿":49272,"conservancy":49273,"ĠReincarn":49274,")|":49275,"Ġantioxid":49276,"ĠClicker":49277,"Ġunlaw":49278,"Ġ\\(":49279,"ãĥĪ":49280,"Ġ[*]":49281,"Characters":49282,"////////":49283,"ãĢIJ":49284,"ãĤ·":49285,"webkit":49286,"ãĢij":49287,"Ġxp":49288,"alkyrie":49289,"Console":49290,"());":49291,"ĠKorra":49292,"\"))":49293,"oooooooooooooooo":49294,"Timer":49295,"////////////////":49296,"yout":49297,"engeance":49298,"emetery":49299,"Ġmages":49300,"mods":49301,"Null":49302,"Ġphilos":49303,"ascript":49304,"Ġaddon":49305,"ĠâĸĪ":49306,"emale":49307,"----------------------------------------------------------------":49308,"Ġ\\\\":49309,"=[":49310,"ĠParables":49311,"ãĥĨ":49312,"VALUE":49313,"Ġ@@":49314,"Ġuint":49315,"${":49316,"cpp":49317,"%%":49318,"Ġ(âĪĴ":49319,"utils":49320,"prefix":49321,"å°Ĩ":49322,"ãĥŃ":49323,"Completed":49324,"Ġgoto":49325,"ãĤ¯":49326,"Winged":49327,"perty":49328,"[\"":49329,"ãĥİ":49330,"ĠScythe":49331,"Ġæľ":49332,"Ġ!=":49333,"Buffer":49334,"docker":49335,"ĠWATCHED":49336,"èĢħ":49337,"())":49338,"Ġdst":49339,"SIZE":49340,"ĠDemonic":49341,"Ġresil":49342,"ãĤ¿":49343,"Ġpione":49344,"cpu":49345,"++)":49346,"TEXT":49347,"Ġdiscrep":49348,"debian":49349,"quished":49350,"Ġacknow":49351,"Ġtrave":49352,"Ġgcc":49353,"Catalog":49354,"ctrl":49355,"ĠMoroc":49356,"Ġcpu":49357,"Ġ];":49358,"ĠSorceress":49359,"Introduced":49360,"Frames":49361,"Ġcondem":49362,"¶æ":49363,"~~~~~~~~":49364,"ĠEmacs":49365,"][/":49366,"Ġglim":49367,"Init":49368,"ĠPrimordial":49369,"ãĥĥ":49370,"Ġ+=":49371,"Ġblat":49372,"à¼":49373,"------------------------------------------------":49374,"gpu":49375,"ãĥĥãĥĪ":49376,"Ġxml":49377,"Ġboolean":49378,"References":49379,"Ġ?)":49380,"Ġsatell":49381,"Queue":49382,"Ġpestic":49383,"Ġ}}":49384,"Attribute":49385,"Ġdx":49386,"ĠDefin":49387,"Synopsis":49388,"..................":49389,"ãĥ¬":49390,"plugin":49391,"Disable":49392,"0000000000000000":49393,")\\":49394,"ĠIchigo":49395,"println":49396,"rontal":49397,"Setup":49398,"Ġ��������":49399,"å§":49400,"âĸº":49401,"ĠPengu":49402,"ailability":49403,"Duration":49404,"Timeout":49405,"ãĢĮ":49406,"Ġbehav":49407,"Reviewed":49408,"Ġtoget":49409,"\\.":49410,"lished":49411,"Ġthous":49412,"Ġperpend":49413,"ecause":49414,"Layout":49415,"è»":49416,"ĠDexterity":49417,"unsigned":49418,"+=":49419,"[[":49420,"ĠRunes":49421,"ãĤ¦":49422,"};":49423,"})":49424,"FTWARE":49425,"ength":49426,"milo":49427,"duino":49428,"天":49429,"ĠClojure":49430,"ļé":49431,"ãĥ¥":49432,"gradient":49433,"Ġ\"\"\"":49434,"âĨij":49435,"@#":49436,"JSON":49437,"Ġproport":49438,"addr":49439,"});":49440,"ãĥIJ":49441,"ä¸ī":49442,"Ġtmp":49443,"å£":49444,"../":49445,"zsche":49446,"Ġâμ":49447,"Entity":49448,"æ©Ł":49449,"ĠâĶľâĶĢâĶĢ":49450,"filename":49451,"{{":49452,"@@":49453,"ĠSeym":49454,"Ġ/**":49455,"ĠSummoner":49456,"Quantity":49457,"ç·":49458,"Attach":49459,"Ġbool":49460,"Texture":49461,"Ġopio":49462,".}":49463,"ãĥĭ":49464,"integer":49465,"Ġregex":49466,"Ġnomine":49467,"ription":49468,"ãģ®ç":49469,"ãĥķ":49470,"Ġsubparagraph":49471,"GGGG":49472,"Ġexplan":49473,"Header":49474,"Spawn":49475,"toggle":49476,"²¾":49477,"Abyss":49478,"expr":49479,"ĠZerg":49480,"ĠGrimoire":49481,"Contents":49482,"Instance":49483,"cyclopedia":49484,"ãĥĹ":49485,"ĠTakeru":49486,"=(":49487,"代":49488,"\\)":49489,"Ġrgb":49490,"htt":49491,"bryce":49492,"Ġlivest":49493,"ĠAnnotations":49494,"âĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢ":49495,"berus":49496,"ntil":49497,"Ġskelet":49498,"callback":49499,"åħī":49500,"Joined":49501,"ãĤª":49502,"Ġargs":49503,"artifacts":49504,"Ġå¤":49505,"ÃĽ":49506,"ãĥŀ":49507,"Streamer":49508,"}\"":49509,"Ġunden":49510,"ãĥģ":49511,"Īè":49512,"ãĥ£":49513,"Ġ0004":49514,"Ġ\\'":49515,"ãĤ°":49516,"ĠCONFIG":49517,"Ġ#####":49518,"``":49519,"anguage":49520,"Ġ*)":49521,"Template":49522,"MODE":49523,"Ġ00000000":49524,"'';":49525,">":49526,"士":49527,"essage":49528,"ntax":49529,"Cmd":49530,"ividual":49531,"Unix":49532,"è£":49533,"çĭ":49534,"使":49535,"():":49536,"ãĥī":49537,"gdala":49538,"etheless":49539,"ktop":49540,"ĠACPI":49541,"ãĥĸ":49542,"Ġsshd":49543,"Ġ000000":49544,"Ġchalleng":49545,"âĶĢâĶĢ":49546,"ĠFlavoring":49547,"çİĭ":49548,"Http":49549,"Ĭ±":49550,"Accessory":49551,"oldemort":49552,"ĠIzan":49553,"galitarian":49554,"ĠChocobo":49555,"edIn":49556,"++++++++":49557,"Ġprintf":49558,"çīĪ":49559,"izoph":49560,"ruciating":49561,"Ġenum":49562,",,,,":49563,"Ġpregn":49564,"sembly":49565,"Ġtherap":49566,"Ġingred":49567,"ãĤµ":49568,"Ġsql":49569,"(*":49570,"Appearance":49571,"ngth":49572,"invoke":49573,"ãĥĥãĤ¯":49574,"ctx":49575,"Ġdmg":49576,"Plugin":49577,"ãĥ¡":49578,"ulhu":49579,"ãĤ§":49580,"Ġwarr":49581,"Ġmetic":49582,"女":49583,"Ġoun":49584,"ð":49585,"Ġtooltip":49586,"ãĤŃ":49587,"Ġvolunte":49588,"imgur":49589,"accompan":49590,"aterasu":49591,"olkien":49592,"ãĤº":49593,"Ġnodd":49594,"ĠMetatron":49595,"javascript":49596,"umbledore":49597,"ãĥł":49598,"--------------------------------------------------------":49599,"runtime":49600,"ĠLeban":49601,"Configuration":49602,"emort":49603,"(_":49604,"Connector":49605,"iosyn":49606,"reddits":49607,"Ġ\"%":49608,"Ġ[&":49609,"ĠSwordsman":49610,"ĠAwoken":49611,"Ġ;;":49612,"ãĥ¼ãĥ«":49613,"Ġ:=":49614,"ãĤ¹ãĥĪ":49615,"Ġcomr":49616,"Adapter":49617,"sbm":49618,"âķIJâķIJ":49619,"çļ":49620,"Loader":49621,"ãĥĵ":49622,"okemon":49623,"ãģ®é":49624,"-->":49625,"Ġlvl":49626,"Footnote":49627,"Iter":49628,"####":49629,"ãĥij":49630,"ĠCarbuncle":49631,"Ġ[+]":49632,"Ġmathemat":49633,"Allows":49634,"Ġ4090":49635,"Async":49636,"ģ«":49637,"Ͻ":49638,"))))":49639,"á½":49640,"Ġcx":49641,"Ġansw":49642,"{\"":49643,"ãĥŁ":49644,"addons":49645,"Filename":49646,"Appearances":49647,"ĠãĢĮ":49648,"Ġaddr":49649,"Ġcharact":49650,"glomer":49651,"Advertisements":49652,"Ġdracon":49653,"ĠFenrir":49654,"Ġ();":49655,"ĠCitiz":49656,"acebook":49657,"Ġparams":49658,"]=":49659,"Ġsubscript":49660,"Ġentreprene":49661,"tnc":49662,"iversal":49663,"Ġmillenn":49664,"ithub":49665,"/>":49666,"Ġ\"{":49667,"Frameworks":49668,"avorite":49669,"Ġ])":49670,"Constructed":49671,"fml":49672,"ãĥį":49673,"################################":49674,"-|":49675,"¥ŀ":49676,"Ġwithd":49677,"ĠCth":49678,"AppData":49679,"Msg":49680,":{":49681,"ãĤ¨":49682,"Ġtuple":49683,"ç¥ŀ":49684,"Ġintrins":49685,"ĠCooldown":49686,"ategory":49687,"^{":49688,"ãĥĬ":49689,"''''":49690,"çͰ":49691,"ĠDEBUG":49692,"Ġcannabin":49693,"ocobo":49694,"Invalid":49695,"ãĥĢ":49696,"Compat":49697,"Ġ({":49698,"Removed":49699,"Ġconvol":49700,"}:":49701,"interstitial":49702,"Ġ":49703,"Ġcontrace":49704,"uyomi":49705,"Callback":49706,"Parser":49707,"äºĶ":49708,"Versions":49709,"::::":49710,"Recomm":49711,"}\\":49712,"Ġ\"_":49713,"Debug":49714,"ĠAoE":49715,"atever":49716,"ĠTradable":49717,"Reloaded":49718,"ĠReincarnated":49719,"ĠStrongh":49720,">\"":49721,"initialized":49722,"Ġexting":49723,"Poké":49724,"Parameters":49725,"¶ħ":49726,"########":49727,"NULL":49728,"ãĥĩ":49729,"groupon":49730,"\\-":49731,"ãĥı":49732,"ãĤ±":49733,"Ġsubsequ":49734,"ccording":49735,"ĠMODULE":49736,"ĠProtoss":49737,"\"},{\"":49738,"Ġ..............":49739,"Integer":49740,"endif":49741,"ãĥĻ":49742,"parser":49743,"lambda":49744,"Ġcarbohyd":49745,"ĠUnloaded":49746,"_{":49747,"âĸ¬âĸ¬":49748,"Ġdebian":49749,"]}":49750,"ãĤ¶":49751,"Parameter":49752,"ãĤ£":49753,"ãĤ»":49754,"Ġ$_":49755,"İĭ":49756,"Ġiterator":49757,"ãĤ¬":49758,"WINDOWS":49759,"CONCLUS":49760,"Ġ\"\\":49761,"umbn":49762,"(&":49763,"ãĥ©ãĥ³":49764,"usercontent":49765,"ometimes":49766,"METHOD":49767,"ãĥ¢":49768,"potion":49769,"ãĥ¯":49770,"everal":49771,"Ġweap":49772,"minecraft":49773,"================================":49774,"printf":49775,"ĠShinra":49776,"Ġreluct":49777,"\\\",":49778,"Runtime":49779,"xff":49780,"ĠAbyssal":49781,"akeru":49782,"Ġ\\(\\":49783,"\"/>":49784,"efficients":49785,"Ü":49786,"avascript":49787,"Ġbehavi":49788,"++;":49789,"=#":49790,"Attributes":49791,"âĵĺ":49792,"lvl":49793,"¬¼":49794,"/**":49795,"Gameplay":49796,"ĠLeilan":49797,">)":49798,"=\"/":49799,"Ġ));":49800,"ãĥĨãĤ£":49801,"ġ":49802,".":49803,"Ġantidepress":49804,"Ġhtt":49805,"################":49806,"arnaev":49807,"ãĤ½":49808,"DERR":49809,"¥µ":49810,"âĸĪ":49811,"Ġ|--":49812,"Ġundermin":49813,"Ġ)))":49814,"ãĥĩãĤ£":49815,"awaru":49816,"\":[{\"":49817,"aution":49818,"ãĤ¤ãĥĪ":49819,"ô":49820,"ĠILCS":49821,"dfx":49822,"ĨĴ":49823,"âĸĴ":49824,"Ġcitiz":49825,"Ġ-=":49826,"ĠAllaah":49827,"Ġ(_":49828,"ĸļ":49829,"Ġ{\\":49830,"Ġsrf":49831,"ãĤ´":49832,"æŃ¦":49833,"»Ĵ":49834,"Ptr":49835,"'>":49836,"DEBUG":49837,"âĶģ":49838,"ãĢı":49839,"WithNo":49840,"Redditor":49841,"ĠâĶľ":49842,"Ġfmt":49843,"ãĢİ":49844,"Ġmsec":49845,"ĪĴ":49846,"eatures":49847,"itially":49848,"\"\"\"":49849,"ãĥ¼ãĤ¯":49850,"Textures":49851,"\"},":49852,"\">":49853,"Ġenthusi":49854,"CHAPTER":49855,"Ġunbeliev":49856,"Ġearthqu":49857,"Ġ><":49858,"||||":49859,"ß":49860,"iterator":49861,"è£ħ":49862,"Ĥª":49863,"ojure":49864,"ãħĭãħĭ":49865,"ãĥ¼ãĥ³":49866,"Ġprintln":49867,"Ġ][":49868,"âĸĪâĸĪ":49869,"âķIJ":49870,"\\\":":49871,"senal":49872,"é¾į":49873,"é¾":49874,"Ġcryst":49875,"ãĥķãĤ¡":49876,"ĠCosponsors":49877,"ãĤ·ãĥ£":49878,"Magikarp":49879,"ĠMagicka":49880,"âĸĪâĸĪâĸĪâĸĪ":49881,",,,,,,,,":49882,"vertisement":49883,"âĶĢâĶĢâĶĢâĶĢ":49884,"ãĥķãĤ©":49885,"luaj":49886,"CLASSIFIED":49887,".''.":49888,"byss":49889,"Ġ{:":49890,"ĠNanto":49891,"Ġptr":49892,"Ġ%%":49893,"Ġteasp":49894,"[_":49895,"ãĥ¤":49896,"ħĭ":49897,"ŃĶ":49898,"Ġpci":49899,"Ġ\"<":49900,"GGGGGGGG":49901,"æĪ¦":49902,"--+":49903,"ãĤ®":49904,"Ġ())":49905,"âĸ¬":49906,"Ġsizeof":49907,"}}}":49908,";;;;;;;;":49909,">]":49910,"âĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪ":49911,"Vaults":49912,"Ġistg":49913,"Ġnewcom":49914,"=]":49915,"¿½":49916,"ĵĺ":49917,"{\\":49918,"Args":49919,"Ġexha":49920,"(\\":49921,"Ġunnecess":49922,"\"}],\"":49923,"ĠUNCLASSIFIED":49924,">(":49925,"ãĤ¢ãĥ«":49926,"æ©":49927,"70710":49928,"Ń·":49929,"ãĥ¼ãĥĨãĤ£":49930,"ĠSakuya":49931,"ãĥĥãĥī":49932,"ĠPyrrha":49933,"escription":49934,"VIDIA":49935,"================================================================":49936,"Ġlooph":49937,"=~":49938,"Ġcumbers":49939,"Ġ)]":49940,"govtrack":49941,"ĠãĤµ":49942,"Ġsubur":49943,"Þ":49944,"Ġâī¡":49945,"Interstitial":49946,"ãĥ¼ãĥĨ":49947,"Ġgobl":49948,"ãĥīãĥ©":49949,"oldown":49950,"ģĸ":49951,"Depths":49952,"Ġ());":49953,"Ġ._":49954,"20439":49955,"Ġç¥ŀ":49956,"ãģ®å®":49957,"ãĤ¼":49958,"Ġ$\\":49959,"âĹ¼":49960,"Ġencount":49961,"Ġ": 48457,
+ "Ġstreng": 48458,
+ "agascar": 48459,
+ "guyen": 48460,
+ "((": 48461,
+ ")[": 48462,
+ "ĠNorn": 48463,
+ "Ġhippocamp": 48464,
+ "Ġ¯": 48465,
+ "îĢ": 48466,
+ "Connection": 48467,
+ "PATH": 48468,
+ "mbuds": 48469,
+ "ĠShards": 48470,
+ "Ġadvoc": 48471,
+ "Ġsimulac": 48472,
+ "âĸij": 48473,
+ "!?\"": 48474,
+ "ĠPotion": 48475,
+ "Ġamulet": 48476,
+ "ĠFnatic": 48477,
+ "Ġcryptoc": 48478,
+ "wav": 48479,
+ "radius": 48480,
+ "pkg": 48481,
+ "ĠMFT": 48482,
+ "æĢ": 48483,
+ "Ġtoile": 48484,
+ "Items": 48485,
+ "ifference": 48486,
+ "errors": 48487,
+ "ĠCelt": 48488,
+ "Ġunpop": 48489,
+ "ilogy": 48490,
+ "6666": 48491,
+ "hesda": 48492,
+ "Instruct": 48493,
+ "å·": 48494,
+ "Materials": 48495,
+ "ettings": 48496,
+ "Percent": 48497,
+ "Ġresistor": 48498,
+ "tymology": 48499,
+ "Ġdeprecated": 48500,
+ "Ġgrep": 48501,
+ "ĠWRITE": 48502,
+ "Ġtriv": 48503,
+ "Ġscrut": 48504,
+ "[/": 48505,
+ "anyl": 48506,
+ "skirts": 48507,
+ "MSN": 48508,
+ "ĠCodec": 48509,
+ "ecd": 48510,
+ "Anth": 48511,
+ "){": 48512,
+ "%]": 48513,
+ "veyard": 48514,
+ "aspberry": 48515,
+ "ãĢ": 48516,
+ "Reward": 48517,
+ "rha": 48518,
+ "Stretch": 48519,
+ "]-": 48520,
+ "Prev": 48521,
+ "Context": 48522,
+ "Ġlinux": 48523,
+ "HAHA": 48524,
+ "perties": 48525,
+ "ĠVIDE": 48526,
+ "Domain": 48527,
+ "Ġmurd": 48528,
+ "ĠLegions": 48529,
+ "apache": 48530,
+ "æŃ": 48531,
+ "Pause": 48532,
+ "Temperature": 48533,
+ "ufact": 48534,
+ "igslist": 48535,
+ "ĠRetrieved": 48536,
+ "èª": 48537,
+ "ãģĮ": 48538,
+ "Ingredients": 48539,
+ "ruary": 48540,
+ "dyl": 48541,
+ "Alias": 48542,
+ "ĠÎĶ": 48543,
+ "Ġinval": 48544,
+ "amsung": 48545,
+ "!--": 48546,
+ "olean": 48547,
+ "æī": 48548,
+ "ãģ¯": 48549,
+ "Ġcoefficients": 48550,
+ "ĠDHCP": 48551,
+ "âĨĴ": 48552,
+ "utonium": 48553,
+ ":[": 48554,
+ "âĹ": 48555,
+ "cli": 48556,
+ "Container": 48557,
+ "å¼": 48558,
+ "nexus": 48559,
+ "SOURCE": 48560,
+ "Ò": 48561,
+ "=/": 48562,
+ "Ġmysql": 48563,
+ "ĠGained": 48564,
+ "Ġ/*": 48565,
+ "uncture": 48566,
+ "Ġstatically": 48567,
+ "âĸł": 48568,
+ "æĺ¯": 48569,
+ "æ°": 48570,
+ "estamp": 48571,
+ "Cache": 48572,
+ "ulkan": 48573,
+ "staking": 48574,
+ "apter": 48575,
+ "ãģ¾": 48576,
+ "Ġμg": 48577,
+ "Ġtremend": 48578,
+ "ĠPiercing": 48579,
+ "naissance": 48580,
+ "ĠHealer": 48581,
+ "Enabled": 48582,
+ "éģ": 48583,
+ "âĸ": 48584,
+ "ĠThumbnails": 48585,
+ "Ġhither": 48586,
+ "Format": 48587,
+ "utherland": 48588,
+ "íķ": 48589,
+ "Ġdestro": 48590,
+ "fff": 48591,
+ "execute": 48592,
+ "msg": 48593,
+ "romancer": 48594,
+ "ĠCanaver": 48595,
+ "ĠVaults": 48596,
+ "oided": 48597,
+ "iage": 48598,
+ "Ġimg": 48599,
+ "summary": 48600,
+ "]);": 48601,
+ "ĠABE": 48602,
+ "ĠGamergate": 48603,
+ "utherford": 48604,
+ "Ġoverwrite": 48605,
+ "enment": 48606,
+ "æķ": 48607,
+ "Ġsystemd": 48608,
+ "tif": 48609,
+ "]).": 48610,
+ "ãĤ¤": 48611,
+ "Widget": 48612,
+ "======": 48613,
+ "(-": 48614,
+ "Ġ\"+": 48615,
+ "ĠIncarnation": 48616,
+ "æĥ": 48617,
+ "���": 48618,
+ "GUI": 48619,
+ "èĥ": 48620,
+ "forums": 48621,
+ "Ġrunes": 48622,
+ "Ġâī¤": 48623,
+ "Ġdefic": 48624,
+ "Distance": 48625,
+ "directory": 48626,
+ "ĠHorus": 48627,
+ "iltr": 48628,
+ "ortium": 48629,
+ "Ġ./": 48630,
+ "bda": 48631,
+ "owship": 48632,
+ "ĠâĨij": 48633,
+ "}.": 48634,
+ "åĩ": 48635,
+ "1027": 48636,
+ "Weapons": 48637,
+ "lucent": 48638,
+ "Ġauth": 48639,
+ ";;": 48640,
+ "Recommended": 48641,
+ "Ġsurv": 48642,
+ "Ġvm": 48643,
+ "ĠStronghold": 48644,
+ "Ġparan": 48645,
+ "ĠTrance": 48646,
+ "æĺ": 48647,
+ "Ġsovere": 48648,
+ "Ġcorrid": 48649,
+ "ĠPwr": 48650,
+ "Ġ[/": 48651,
+ "Ġseq": 48652,
+ "Population": 48653,
+ "Ġ[];": 48654,
+ "Ġreferen": 48655,
+ "ĠInstr": 48656,
+ "ĠStamina": 48657,
+ "kernel": 48658,
+ "Python": 48659,
+ "-+": 48660,
+ "Ġallele": 48661,
+ "éĽ": 48662,
+ "isode": 48663,
+ "ä¸į": 48664,
+ "otonin": 48665,
+ "modules": 48666,
+ "Notable": 48667,
+ "Spell": 48668,
+ "\\\\": 48669,
+ "Pref": 48670,
+ "Ġdatas": 48671,
+ "setup": 48672,
+ "Ġhapl": 48673,
+ "Height": 48674,
+ "åĭ": 48675,
+ "ãģ£": 48676,
+ "]),": 48677,
+ "Handle": 48678,
+ "umenthal": 48679,
+ "Package": 48680,
+ "Ġenthus": 48681,
+ "Ġunsus": 48682,
+ "Narr": 48683,
+ "Examples": 48684,
+ "FAQ": 48685,
+ "REDACTED": 48686,
+ "Ġnotor": 48687,
+ "Enable": 48688,
+ "Pattern": 48689,
+ "aeda": 48690,
+ ">.": 48691,
+ "CHECK": 48692,
+ "Ġ����": 48693,
+ "Ġ'.": 48694,
+ "Ġãĥ": 48695,
+ "append": 48696,
+ "����": 48697,
+ "gemony": 48698,
+ "terness": 48699,
+ "ĠHaku": 48700,
+ "NVIDIA": 48701,
+ "queue": 48702,
+ "Bind": 48703,
+ "Ġneigh": 48704,
+ "armor": 48705,
+ "retty": 48706,
+ "LOD": 48707,
+ "plugins": 48708,
+ "Ġ/>": 48709,
+ "TYPE": 48710,
+ "Ġ4096": 48711,
+ "-------": 48712,
+ "Preview": 48713,
+ "FML": 48714,
+ "Ġproletarian": 48715,
+ "zees": 48716,
+ "enfranch": 48717,
+ "ãģĨ": 48718,
+ "Ctrl": 48719,
+ "Module": 48720,
+ "ĠSurviv": 48721,
+ "ĠStarcraft": 48722,
+ "rored": 48723,
+ "reddit": 48724,
+ "Ġrul": 48725,
+ "Ġtx": 48726,
+ "Ġmage": 48727,
+ "Sword": 48728,
+ "Ġ~/": 48729,
+ "Effects": 48730,
+ "éļ": 48731,
+ "ä¹": 48732,
+ "Sensor": 48733,
+ "Solution": 48734,
+ "ãģĻ": 48735,
+ "Arcade": 48736,
+ "Ġpredec": 48737,
+ "Values": 48738,
+ "Length": 48739,
+ "Ġfortun": 48740,
+ "ttp": 48741,
+ "\"[": 48742,
+ "tmp": 48743,
+ "ĠBerserker": 48744,
+ "åĨ": 48745,
+ "ositories": 48746,
+ "Ġcouncill": 48747,
+ "ffff": 48748,
+ "));": 48749,
+ "Recipe": 48750,
+ "ĠASCII": 48751,
+ "âĦ¢:": 48752,
+ "ä": 48753,
+ "Ġhorm": 48754,
+ "=>": 48755,
+ "sers": 48756,
+ "ãģĭ": 48757,
+ "Recommend": 48758,
+ "['": 48759,
+ "agame": 48760,
+ "Animation": 48761,
+ "aucuses": 48762,
+ "Discussion": 48763,
+ "Ġhelicop": 48764,
+ "å¿": 48765,
+ "Float": 48766,
+ "Component": 48767,
+ "instance": 48768,
+ "Ġfoo": 48769,
+ "localhost": 48770,
+ "=-": 48771,
+ "Offset": 48772,
+ "Psy": 48773,
+ "ĠGohan": 48774,
+ "buquerque": 48775,
+ "Ġdefe": 48776,
+ "chwitz": 48777,
+ "parse": 48778,
+ "Ġdors": 48779,
+ "Ġspons": 48780,
+ "Ġasync": 48781,
+ "agonists": 48782,
+ "Ġindo": 48783,
+ ".>>": 48784,
+ "ĠDisciple": 48785,
+ "Ġfilename": 48786,
+ "rency": 48787,
+ "ĠDise": 48788,
+ "Ġ\"/": 48789,
+ "template": 48790,
+ "ãĤ¹": 48791,
+ "swers": 48792,
+ "Ġ++": 48793,
+ "Ġ[(": 48794,
+ "thora": 48795,
+ "ĠDepths": 48796,
+ "livious": 48797,
+ "Ġdisadvant": 48798,
+ "foundland": 48799,
+ "Upload": 48800,
+ "Ġ§§": 48801,
+ "Ġsophistic": 48802,
+ ";}": 48803,
+ "izont": 48804,
+ "\"}": 48805,
+ "estial": 48806,
+ "Ranked": 48807,
+ "ĠOccupations": 48808,
+ "LEASE": 48809,
+ "ĠOgre": 48810,
+ "folder": 48811,
+ "Plot": 48812,
+ "farious": 48813,
+ "Ġsuscept": 48814,
+ "Types": 48815,
+ "Discuss": 48816,
+ "Ġ'/": 48817,
+ "æµ": 48818,
+ "earable": 48819,
+ "æ³": 48820,
+ "Tile": 48821,
+ "iatus": 48822,
+ "åŃ": 48823,
+ "Ġreperto": 48824,
+ "Helper": 48825,
+ "Returns": 48826,
+ "ä¸Ĭ": 48827,
+ "imaru": 48828,
+ "Ġreq": 48829,
+ "Ġdissatisf": 48830,
+ "multipl": 48831,
+ "}{": 48832,
+ "-[": 48833,
+ "itial": 48834,
+ "*/": 48835,
+ "Config": 48836,
+ "Example": 48837,
+ "ĠjQuery": 48838,
+ "Mods": 48839,
+ "ĠGPIO": 48840,
+ "Ġlaun": 48841,
+ "layout": 48842,
+ "cised": 48843,
+ "Ġ......": 48844,
+ "+++": 48845,
+ "prototype": 48846,
+ "Exception": 48847,
+ "Ġsubsections": 48848,
+ "Ġresemb": 48849,
+ "Ġâĩ": 48850,
+ "ĠPubMed": 48851,
+ "username": 48852,
+ "Ġaggro": 48853,
+ "éĥ": 48854,
+ "Ġ};": 48855,
+ "ĠMages": 48856,
+ "ryu": 48857,
+ "apons": 48858,
+ "Optional": 48859,
+ "ĠAncients": 48860,
+ "ãĤĬ": 48861,
+ "Quotes": 48862,
+ "oaded": 48863,
+ "Ġsuspic": 48864,
+ "inline": 48865,
+ "omial": 48866,
+ "ĠMahjong": 48867,
+ "auntlets": 48868,
+ "Ġanarchism": 48869,
+ "Ġsubclass": 48870,
+ "ĠMLG": 48871,
+ "...]": 48872,
+ "Dialog": 48873,
+ "uphem": 48874,
+ "Ġrecursive": 48875,
+ "7601": 48876,
+ "frac": 48877,
+ "Else": 48878,
+ "ĠSeverus": 48879,
+ "},{\"": 48880,
+ "ĠCLIENT": 48881,
+ "Ġjavascript": 48882,
+ "sama": 48883,
+ "ĠLearns": 48884,
+ "ãĤĤ": 48885,
+ "Upgrade": 48886,
+ "Listener": 48887,
+ "Ġsnipp": 48888,
+ "Ġrune": 48889,
+ "ĠTTL": 48890,
+ "ertation": 48891,
+ "olicy": 48892,
+ "=\"\"": 48893,
+ "«ĺ": 48894,
+ "Ġexpr": 48895,
+ "ovych": 48896,
+ "Ġãģ": 48897,
+ "_-_": 48898,
+ "munition": 48899,
+ "////": 48900,
+ "func": 48901,
+ ">>>>": 48902,
+ "Provider": 48903,
+ "Ïī": 48904,
+ "BUG": 48905,
+ "Ġ[-": 48906,
+ "Ġarrang": 48907,
+ "merce": 48908,
+ "ãĥ": 48909,
+ "incarn": 48910,
+ "Valid": 48911,
+ "ĠAether": 48912,
+ "ãĤĵ": 48913,
+ "ĠUTF": 48914,
+ "ĠMonstrous": 48915,
+ "ãĤĮ": 48916,
+ "hedon": 48917,
+ "áµ": 48918,
+ ":#": 48919,
+ "ĠFrieza": 48920,
+ "padding": 48921,
+ "Reviewer": 48922,
+ "Ġpsychiat": 48923,
+ "yrinth": 48924,
+ "ĠâĶĤ": 48925,
+ "hillary": 48926,
+ "Static": 48927,
+ "Newsletter": 48928,
+ "Avg": 48929,
+ "Ġfn": 48930,
+ "Topic": 48931,
+ "choes": 48932,
+ "Ġnewsp": 48933,
+ "á¸": 48934,
+ "Ġ[+": 48935,
+ "~~~~~~~~~~~~~~~~": 48936,
+ ":]": 48937,
+ "apego": 48938,
+ "buf": 48939,
+ "Translation": 48940,
+ "ById": 48941,
+ "Ġmmol": 48942,
+ "ãĥ¼ãĥ": 48943,
+ "å½": 48944,
+ "ãĤī": 48945,
+ "Ġparser": 48946,
+ "ãĥª": 48947,
+ "`,": 48948,
+ "Lair": 48949,
+ ")}": 48950,
+ "ypes": 48951,
+ "adobe": 48952,
+ "Ġancest": 48953,
+ "ernel": 48954,
+ "ĠNULL": 48955,
+ "ç«": 48956,
+ "anguages": 48957,
+ "Increases": 48958,
+ "æĦ": 48959,
+ "utorial": 48960,
+ "ithmetic": 48961,
+ "dll": 48962,
+ "ĠArcane": 48963,
+ "çī": 48964,
+ "Ġtc": 48965,
+ "urtles": 48966,
+ "èĪ": 48967,
+ "Bytes": 48968,
+ "Slot": 48969,
+ "ĠBahá": 48970,
+ "Weapon": 48971,
+ "widget": 48972,
+ "querque": 48973,
+ "Ġembodiments": 48974,
+ "å¥": 48975,
+ "WARN": 48976,
+ "swer": 48977,
+ "thumbnails": 48978,
+ "FFFF": 48979,
+ "inguishable": 48980,
+ "Ġâī": 48981,
+ "Ġ${": 48982,
+ "AAAAAAAA": 48983,
+ "Conclusion": 48984,
+ "ĻĤ": 48985,
+ "disable": 48986,
+ "Rect": 48987,
+ "Ġsubp": 48988,
+ "Ġ().": 48989,
+ "ĠDetected": 48990,
+ "èĢ": 48991,
+ "[]": 48992,
+ "Ġcoerc": 48993,
+ "ĠmM": 48994,
+ "recated": 48995,
+ "fusc": 48996,
+ "ĠSorce": 48997,
+ "çĶŁ": 48998,
+ ").[": 48999,
+ "Ġ})": 49000,
+ "mobi": 49001,
+ "yip": 49002,
+ "Acknowled": 49003,
+ "ternity": 49004,
+ "iqueness": 49005,
+ "ython": 49006,
+ "><": 49007,
+ "Ġstd": 49008,
+ "Url": 49009,
+ "Ġnamespace": 49010,
+ "Ġtion": 49011,
+ "oother": 49012,
+ "Ó": 49013,
+ "Ġhemor": 49014,
+ "Ġrg": 49015,
+ "ventory": 49016,
+ "ãĤ¢": 49017,
+ "anamo": 49018,
+ "Socket": 49019,
+ "Topics": 49020,
+ "apeshifter": 49021,
+ "gnu": 49022,
+ "Ġdetrim": 49023,
+ "`.": 49024,
+ "romeda": 49025,
+ "çIJ": 49026,
+ "Ġlambda": 49027,
+ "Compan": 49028,
+ "Variable": 49029,
+ "Ġusb": 49030,
+ "ĠAdamant": 49031,
+ "ournal": 49032,
+ "Ġcovari": 49033,
+ "ãĥ©": 49034,
+ "éĸ": 49035,
+ "åİ": 49036,
+ "otaur": 49037,
+ "Ġ(),": 49038,
+ "Marginal": 49039,
+ "ãģı": 49040,
+ "Ġphysic": 49041,
+ "adeon": 49042,
+ "RESULTS": 49043,
+ "200000": 49044,
+ "ãģį": 49045,
+ "udeb": 49046,
+ "ãģĵ": 49047,
+ "COMPLE": 49048,
+ "Ġmsg": 49049,
+ "ghazi": 49050,
+ "/*": 49051,
+ "ĠDeity": 49052,
+ "Ġdisapp": 49053,
+ "Availability": 49054,
+ "Ġillum": 49055,
+ "à©": 49056,
+ "ptives": 49057,
+ ",âĢĶ": 49058,
+ "chnology": 49059,
+ "Ġaccur": 49060,
+ "Ġapi": 49061,
+ "Obj": 49062,
+ "ãĤ«": 49063,
+ "ãĤ¸": 49064,
+ "ä¹ĭ": 49065,
+ "ËĪ": 49066,
+ "Ġtcp": 49067,
+ "Required": 49068,
+ ".<": 49069,
+ "\".[": 49070,
+ "Ġ~/.": 49071,
+ "Ġobser": 49072,
+ "RFC": 49073,
+ "Ġintegers": 49074,
+ "åī": 49075,
+ "Installation": 49076,
+ "Ô": 49077,
+ "ó": 49078,
+ "csv": 49079,
+ "ãĥ«": 49080,
+ "ĠNoticed": 49081,
+ "âĸĵ": 49082,
+ "Tumblr": 49083,
+ "Reply": 49084,
+ "||": 49085,
+ "Ġconclud": 49086,
+ "Ġ))": 49087,
+ "ebin": 49088,
+ "sql": 49089,
+ "Closure": 49090,
+ "++++": 49091,
+ "],[": 49092,
+ "âĹı": 49093,
+ "Ġprolet": 49094,
+ "Ġ>=": 49095,
+ "estinal": 49096,
+ "Ġ[*": 49097,
+ "ĠInquisitor": 49098,
+ "Ġcmd": 49099,
+ "FINE": 49100,
+ "CRIP": 49101,
+ "Ġvertex": 49102,
+ "TeX": 49103,
+ "///": 49104,
+ "Ö¼": 49105,
+ "iscons": 49106,
+ "Ġmyster": 49107,
+ "Changed": 49108,
+ "timeout": 49109,
+ "irtual": 49110,
+ "Methods": 49111,
+ "Ġcerts": 49112,
+ "texture": 49113,
+ "Roaming": 49114,
+ "Proxy": 49115,
+ "Override": 49116,
+ "éĹ": 49117,
+ "utf": 49118,
+ "python": 49119,
+ "ĠRarity": 49120,
+ "ilitarian": 49121,
+ "çľ": 49122,
+ "().": 49123,
+ "æł": 49124,
+ "Ġbuf": 49125,
+ "åij": 49126,
+ "çķ": 49127,
+ "Ġ*.": 49128,
+ "umerable": 49129,
+ "~~~~": 49130,
+ "å¦": 49131,
+ "Ġsimultane": 49132,
+ "Ġjson": 49133,
+ "Requires": 49134,
+ "Ġperl": 49135,
+ "Interface": 49136,
+ "rupal": 49137,
+ "": 49138,
+ "uilt": 49139,
+ "mercial": 49140,
+ "ĠPalestin": 49141,
+ "theless": 49142,
+ ")=": 49143,
+ "Generic": 49144,
+ "&&": 49145,
+ "ALSE": 49146,
+ "Ġdebugger": 49147,
+ "paralle": 49148,
+ "acly": 49149,
+ "ĠScourge": 49150,
+ ")].": 49151,
+ "Ġinstr": 49152,
+ "Ġ{}": 49153,
+ "]+": 49154,
+ "Ġdilig": 49155,
+ "åŃIJ": 49156,
+ "Ġcaptcha": 49157,
+ "kefeller": 49158,
+ "iosyncr": 49159,
+ "Ġchars": 49160,
+ "Ġinitialize": 49161,
+ "Width": 49162,
+ "Ġgithub": 49163,
+ "Ġinitialization": 49164,
+ "ĠGamerGate": 49165,
+ "Ġþ": 49166,
+ "drm": 49167,
+ "slaught": 49168,
+ "Ġtiss": 49169,
+ ".............": 49170,
+ "Ĥ¬": 49171,
+ "Ġplent": 49172,
+ "ãģķ": 49173,
+ "cfg": 49174,
+ "âĨ": 49175,
+ "Ġpokemon": 49176,
+ "\"],": 49177,
+ "Ġtyr": 49178,
+ "SELECT": 49179,
+ "othal": 49180,
+ "Tags": 49181,
+ "ĠMarketable": 49182,
+ "-----------": 49183,
+ "icter": 49184,
+ "irlf": 49185,
+ "ormons": 49186,
+ "Database": 49187,
+ "ĠãĤ": 49188,
+ "Ġ{\"": 49189,
+ "î": 49190,
+ "Handler": 49191,
+ "âĶĢ": 49192,
+ "$$$$": 49193,
+ "ĠJaune": 49194,
+ "ãĤ³": 49195,
+ "(),": 49196,
+ ")+": 49197,
+ "--------": 49198,
+ "Ġshenan": 49199,
+ "Ġwelf": 49200,
+ "Ġ',": 49201,
+ "attribute": 49202,
+ "Uncommon": 49203,
+ "maxwell": 49204,
+ "Browser": 49205,
+ "ĠPastebin": 49206,
+ "uberty": 49207,
+ "debug": 49208,
+ "Ġmosqu": 49209,
+ "ĠBoolean": 49210,
+ "wcs": 49211,
+ "é£": 49212,
+ "/âĢĭ": 49213,
+ "çĦ": 49214,
+ "(){": 49215,
+ "////////////////////////////////": 49216,
+ "ĠGleaming": 49217,
+ "regor": 49218,
+ "ĠMercenary": 49219,
+ "ensional": 49220,
+ "mpeg": 49221,
+ "sudo": 49222,
+ "ãģ®å": 49223,
+ "iggurat": 49224,
+ "vironment": 49225,
+ "Directory": 49226,
+ "ĠDecoder": 49227,
+ "SPONSORED": 49228,
+ "intendo": 49229,
+ "Ġ<=": 49230,
+ "btn": 49231,
+ "ï¸": 49232,
+ "ä½ľ": 49233,
+ "paio": 49234,
+ "Tokens": 49235,
+ "ãĢį": 49236,
+ "params": 49237,
+ "Offline": 49238,
+ "Ġmetab": 49239,
+ "ĠLisp": 49240,
+ "anwhile": 49241,
+ ">:": 49242,
+ "itialized": 49243,
+ "HTTP": 49244,
+ "Trivia": 49245,
+ "Sov": 49246,
+ "wrapper": 49247,
+ "={": 49248,
+ "ĠAzerb": 49249,
+ "aeper": 49250,
+ "Ġneighb": 49251,
+ "initions": 49252,
+ "Ġsts": 49253,
+ "ĠSasuke": 49254,
+ "#$": 49255,
+ "uliffe": 49256,
+ "æĸ¹": 49257,
+ "++++++++++++++++": 49258,
+ "ĠElven": 49259,
+ "ãģĤ": 49260,
+ "Ġartif": 49261,
+ "Folder": 49262,
+ "Ġà¨": 49263,
+ "åĤ": 49264,
+ "Ġphyl": 49265,
+ "uggest": 49266,
+ "blance": 49267,
+ "ãģł": 49268,
+ "Requirements": 49269,
+ "Usage": 49270,
+ "Ġinitialized": 49271,
+ "ã쮿": 49272,
+ "conservancy": 49273,
+ "ĠReincarn": 49274,
+ ")|": 49275,
+ "Ġantioxid": 49276,
+ "ĠClicker": 49277,
+ "Ġunlaw": 49278,
+ "Ġ\\(": 49279,
+ "ãĥĪ": 49280,
+ "Ġ[*]": 49281,
+ "Characters": 49282,
+ "////////": 49283,
+ "ãĢIJ": 49284,
+ "ãĤ·": 49285,
+ "webkit": 49286,
+ "ãĢij": 49287,
+ "Ġxp": 49288,
+ "alkyrie": 49289,
+ "Console": 49290,
+ "());": 49291,
+ "ĠKorra": 49292,
+ "\"))": 49293,
+ "oooooooooooooooo": 49294,
+ "Timer": 49295,
+ "////////////////": 49296,
+ "yout": 49297,
+ "engeance": 49298,
+ "emetery": 49299,
+ "Ġmages": 49300,
+ "mods": 49301,
+ "Null": 49302,
+ "Ġphilos": 49303,
+ "ascript": 49304,
+ "Ġaddon": 49305,
+ "ĠâĸĪ": 49306,
+ "emale": 49307,
+ "----------------------------------------------------------------": 49308,
+ "Ġ\\\\": 49309,
+ "=[": 49310,
+ "ĠParables": 49311,
+ "ãĥĨ": 49312,
+ "VALUE": 49313,
+ "Ġ@@": 49314,
+ "Ġuint": 49315,
+ "${": 49316,
+ "cpp": 49317,
+ "%%": 49318,
+ "Ġ(âĪĴ": 49319,
+ "utils": 49320,
+ "prefix": 49321,
+ "å°Ĩ": 49322,
+ "ãĥŃ": 49323,
+ "Completed": 49324,
+ "Ġgoto": 49325,
+ "ãĤ¯": 49326,
+ "Winged": 49327,
+ "perty": 49328,
+ "[\"": 49329,
+ "ãĥİ": 49330,
+ "ĠScythe": 49331,
+ "Ġæľ": 49332,
+ "Ġ!=": 49333,
+ "Buffer": 49334,
+ "docker": 49335,
+ "ĠWATCHED": 49336,
+ "èĢħ": 49337,
+ "())": 49338,
+ "Ġdst": 49339,
+ "SIZE": 49340,
+ "ĠDemonic": 49341,
+ "Ġresil": 49342,
+ "ãĤ¿": 49343,
+ "Ġpione": 49344,
+ "cpu": 49345,
+ "++)": 49346,
+ "TEXT": 49347,
+ "Ġdiscrep": 49348,
+ "debian": 49349,
+ "quished": 49350,
+ "Ġacknow": 49351,
+ "Ġtrave": 49352,
+ "Ġgcc": 49353,
+ "Catalog": 49354,
+ "ctrl": 49355,
+ "ĠMoroc": 49356,
+ "Ġcpu": 49357,
+ "Ġ];": 49358,
+ "ĠSorceress": 49359,
+ "Introduced": 49360,
+ "Frames": 49361,
+ "Ġcondem": 49362,
+ "¶æ": 49363,
+ "~~~~~~~~": 49364,
+ "ĠEmacs": 49365,
+ "][/": 49366,
+ "Ġglim": 49367,
+ "Init": 49368,
+ "ĠPrimordial": 49369,
+ "ãĥĥ": 49370,
+ "Ġ+=": 49371,
+ "Ġblat": 49372,
+ "à¼": 49373,
+ "------------------------------------------------": 49374,
+ "gpu": 49375,
+ "ãĥĥãĥĪ": 49376,
+ "Ġxml": 49377,
+ "Ġboolean": 49378,
+ "References": 49379,
+ "Ġ?)": 49380,
+ "Ġsatell": 49381,
+ "Queue": 49382,
+ "Ġpestic": 49383,
+ "Ġ}}": 49384,
+ "Attribute": 49385,
+ "Ġdx": 49386,
+ "ĠDefin": 49387,
+ "Synopsis": 49388,
+ "..................": 49389,
+ "ãĥ¬": 49390,
+ "plugin": 49391,
+ "Disable": 49392,
+ "0000000000000000": 49393,
+ ")\\": 49394,
+ "ĠIchigo": 49395,
+ "println": 49396,
+ "rontal": 49397,
+ "Setup": 49398,
+ "Ġ��������": 49399,
+ "å§": 49400,
+ "âĸº": 49401,
+ "ĠPengu": 49402,
+ "ailability": 49403,
+ "Duration": 49404,
+ "Timeout": 49405,
+ "ãĢĮ": 49406,
+ "Ġbehav": 49407,
+ "Reviewed": 49408,
+ "Ġtoget": 49409,
+ "\\.": 49410,
+ "lished": 49411,
+ "Ġthous": 49412,
+ "Ġperpend": 49413,
+ "ecause": 49414,
+ "Layout": 49415,
+ "è»": 49416,
+ "ĠDexterity": 49417,
+ "unsigned": 49418,
+ "+=": 49419,
+ "[[": 49420,
+ "ĠRunes": 49421,
+ "ãĤ¦": 49422,
+ "};": 49423,
+ "})": 49424,
+ "FTWARE": 49425,
+ "ength": 49426,
+ "milo": 49427,
+ "duino": 49428,
+ "天": 49429,
+ "ĠClojure": 49430,
+ "ļé": 49431,
+ "ãĥ¥": 49432,
+ "gradient": 49433,
+ "Ġ\"\"\"": 49434,
+ "âĨij": 49435,
+ "@#": 49436,
+ "JSON": 49437,
+ "Ġproport": 49438,
+ "addr": 49439,
+ "});": 49440,
+ "ãĥIJ": 49441,
+ "ä¸ī": 49442,
+ "Ġtmp": 49443,
+ "å£": 49444,
+ "../": 49445,
+ "zsche": 49446,
+ "Ġâμ": 49447,
+ "Entity": 49448,
+ "æ©Ł": 49449,
+ "ĠâĶľâĶĢâĶĢ": 49450,
+ "filename": 49451,
+ "{{": 49452,
+ "@@": 49453,
+ "ĠSeym": 49454,
+ "Ġ/**": 49455,
+ "ĠSummoner": 49456,
+ "Quantity": 49457,
+ "ç·": 49458,
+ "Attach": 49459,
+ "Ġbool": 49460,
+ "Texture": 49461,
+ "Ġopio": 49462,
+ ".}": 49463,
+ "ãĥĭ": 49464,
+ "integer": 49465,
+ "Ġregex": 49466,
+ "Ġnomine": 49467,
+ "ription": 49468,
+ "ãģ®ç": 49469,
+ "ãĥķ": 49470,
+ "Ġsubparagraph": 49471,
+ "GGGG": 49472,
+ "Ġexplan": 49473,
+ "Header": 49474,
+ "Spawn": 49475,
+ "toggle": 49476,
+ "²¾": 49477,
+ "Abyss": 49478,
+ "expr": 49479,
+ "ĠZerg": 49480,
+ "ĠGrimoire": 49481,
+ "Contents": 49482,
+ "Instance": 49483,
+ "cyclopedia": 49484,
+ "ãĥĹ": 49485,
+ "ĠTakeru": 49486,
+ "=(": 49487,
+ "代": 49488,
+ "\\)": 49489,
+ "Ġrgb": 49490,
+ "htt": 49491,
+ "bryce": 49492,
+ "Ġlivest": 49493,
+ "ĠAnnotations": 49494,
+ "âĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢ": 49495,
+ "berus": 49496,
+ "ntil": 49497,
+ "Ġskelet": 49498,
+ "callback": 49499,
+ "åħī": 49500,
+ "Joined": 49501,
+ "ãĤª": 49502,
+ "Ġargs": 49503,
+ "artifacts": 49504,
+ "Ġå¤": 49505,
+ "ÃĽ": 49506,
+ "ãĥŀ": 49507,
+ "Streamer": 49508,
+ "}\"": 49509,
+ "Ġunden": 49510,
+ "ãĥģ": 49511,
+ "Īè": 49512,
+ "ãĥ£": 49513,
+ "Ġ0004": 49514,
+ "Ġ\\'": 49515,
+ "ãĤ°": 49516,
+ "ĠCONFIG": 49517,
+ "Ġ#####": 49518,
+ "``": 49519,
+ "anguage": 49520,
+ "Ġ*)": 49521,
+ "Template": 49522,
+ "MODE": 49523,
+ "Ġ00000000": 49524,
+ "'';": 49525,
+ ">": 49526,
+ "士": 49527,
+ "essage": 49528,
+ "ntax": 49529,
+ "Cmd": 49530,
+ "ividual": 49531,
+ "Unix": 49532,
+ "è£": 49533,
+ "çĭ": 49534,
+ "使": 49535,
+ "():": 49536,
+ "ãĥī": 49537,
+ "gdala": 49538,
+ "etheless": 49539,
+ "ktop": 49540,
+ "ĠACPI": 49541,
+ "ãĥĸ": 49542,
+ "Ġsshd": 49543,
+ "Ġ000000": 49544,
+ "Ġchalleng": 49545,
+ "âĶĢâĶĢ": 49546,
+ "ĠFlavoring": 49547,
+ "çİĭ": 49548,
+ "Http": 49549,
+ "Ĭ±": 49550,
+ "Accessory": 49551,
+ "oldemort": 49552,
+ "ĠIzan": 49553,
+ "galitarian": 49554,
+ "ĠChocobo": 49555,
+ "edIn": 49556,
+ "++++++++": 49557,
+ "Ġprintf": 49558,
+ "çīĪ": 49559,
+ "izoph": 49560,
+ "ruciating": 49561,
+ "Ġenum": 49562,
+ ",,,,": 49563,
+ "Ġpregn": 49564,
+ "sembly": 49565,
+ "Ġtherap": 49566,
+ "Ġingred": 49567,
+ "ãĤµ": 49568,
+ "Ġsql": 49569,
+ "(*": 49570,
+ "Appearance": 49571,
+ "ngth": 49572,
+ "invoke": 49573,
+ "ãĥĥãĤ¯": 49574,
+ "ctx": 49575,
+ "Ġdmg": 49576,
+ "Plugin": 49577,
+ "ãĥ¡": 49578,
+ "ulhu": 49579,
+ "ãĤ§": 49580,
+ "Ġwarr": 49581,
+ "Ġmetic": 49582,
+ "女": 49583,
+ "Ġoun": 49584,
+ "ð": 49585,
+ "Ġtooltip": 49586,
+ "ãĤŃ": 49587,
+ "Ġvolunte": 49588,
+ "imgur": 49589,
+ "accompan": 49590,
+ "aterasu": 49591,
+ "olkien": 49592,
+ "ãĤº": 49593,
+ "Ġnodd": 49594,
+ "ĠMetatron": 49595,
+ "javascript": 49596,
+ "umbledore": 49597,
+ "ãĥł": 49598,
+ "--------------------------------------------------------": 49599,
+ "runtime": 49600,
+ "ĠLeban": 49601,
+ "Configuration": 49602,
+ "emort": 49603,
+ "(_": 49604,
+ "Connector": 49605,
+ "iosyn": 49606,
+ "reddits": 49607,
+ "Ġ\"%": 49608,
+ "Ġ[&": 49609,
+ "ĠSwordsman": 49610,
+ "ĠAwoken": 49611,
+ "Ġ;;": 49612,
+ "ãĥ¼ãĥ«": 49613,
+ "Ġ:=": 49614,
+ "ãĤ¹ãĥĪ": 49615,
+ "Ġcomr": 49616,
+ "Adapter": 49617,
+ "sbm": 49618,
+ "âķIJâķIJ": 49619,
+ "çļ": 49620,
+ "Loader": 49621,
+ "ãĥĵ": 49622,
+ "okemon": 49623,
+ "ãģ®é": 49624,
+ "-->": 49625,
+ "Ġlvl": 49626,
+ "Footnote": 49627,
+ "Iter": 49628,
+ "####": 49629,
+ "ãĥij": 49630,
+ "ĠCarbuncle": 49631,
+ "Ġ[+]": 49632,
+ "Ġmathemat": 49633,
+ "Allows": 49634,
+ "Ġ4090": 49635,
+ "Async": 49636,
+ "ģ«": 49637,
+ "Ͻ": 49638,
+ "))))": 49639,
+ "á½": 49640,
+ "Ġcx": 49641,
+ "Ġansw": 49642,
+ "{\"": 49643,
+ "ãĥŁ": 49644,
+ "addons": 49645,
+ "Filename": 49646,
+ "Appearances": 49647,
+ "ĠãĢĮ": 49648,
+ "Ġaddr": 49649,
+ "Ġcharact": 49650,
+ "glomer": 49651,
+ "Advertisements": 49652,
+ "Ġdracon": 49653,
+ "ĠFenrir": 49654,
+ "Ġ();": 49655,
+ "ĠCitiz": 49656,
+ "acebook": 49657,
+ "Ġparams": 49658,
+ "]=": 49659,
+ "Ġsubscript": 49660,
+ "Ġentreprene": 49661,
+ "tnc": 49662,
+ "iversal": 49663,
+ "Ġmillenn": 49664,
+ "ithub": 49665,
+ "/>": 49666,
+ "Ġ\"{": 49667,
+ "Frameworks": 49668,
+ "avorite": 49669,
+ "Ġ])": 49670,
+ "Constructed": 49671,
+ "fml": 49672,
+ "ãĥį": 49673,
+ "################################": 49674,
+ "-|": 49675,
+ "¥ŀ": 49676,
+ "Ġwithd": 49677,
+ "ĠCth": 49678,
+ "AppData": 49679,
+ "Msg": 49680,
+ ":{": 49681,
+ "ãĤ¨": 49682,
+ "Ġtuple": 49683,
+ "ç¥ŀ": 49684,
+ "Ġintrins": 49685,
+ "ĠCooldown": 49686,
+ "ategory": 49687,
+ "^{": 49688,
+ "ãĥĬ": 49689,
+ "''''": 49690,
+ "çͰ": 49691,
+ "ĠDEBUG": 49692,
+ "Ġcannabin": 49693,
+ "ocobo": 49694,
+ "Invalid": 49695,
+ "ãĥĢ": 49696,
+ "Compat": 49697,
+ "Ġ({": 49698,
+ "Removed": 49699,
+ "Ġconvol": 49700,
+ "}:": 49701,
+ "interstitial": 49702,
+ "Ġ": 49703,
+ "Ġcontrace": 49704,
+ "uyomi": 49705,
+ "Callback": 49706,
+ "Parser": 49707,
+ "äºĶ": 49708,
+ "Versions": 49709,
+ "::::": 49710,
+ "Recomm": 49711,
+ "}\\": 49712,
+ "Ġ\"_": 49713,
+ "Debug": 49714,
+ "ĠAoE": 49715,
+ "atever": 49716,
+ "ĠTradable": 49717,
+ "Reloaded": 49718,
+ "ĠReincarnated": 49719,
+ "ĠStrongh": 49720,
+ ">\"": 49721,
+ "initialized": 49722,
+ "Ġexting": 49723,
+ "Poké": 49724,
+ "Parameters": 49725,
+ "¶ħ": 49726,
+ "########": 49727,
+ "NULL": 49728,
+ "ãĥĩ": 49729,
+ "groupon": 49730,
+ "\\-": 49731,
+ "ãĥı": 49732,
+ "ãĤ±": 49733,
+ "Ġsubsequ": 49734,
+ "ccording": 49735,
+ "ĠMODULE": 49736,
+ "ĠProtoss": 49737,
+ "\"},{\"": 49738,
+ "Ġ..............": 49739,
+ "Integer": 49740,
+ "endif": 49741,
+ "ãĥĻ": 49742,
+ "parser": 49743,
+ "lambda": 49744,
+ "Ġcarbohyd": 49745,
+ "ĠUnloaded": 49746,
+ "_{": 49747,
+ "âĸ¬âĸ¬": 49748,
+ "Ġdebian": 49749,
+ "]}": 49750,
+ "ãĤ¶": 49751,
+ "Parameter": 49752,
+ "ãĤ£": 49753,
+ "ãĤ»": 49754,
+ "Ġ$_": 49755,
+ "İĭ": 49756,
+ "Ġiterator": 49757,
+ "ãĤ¬": 49758,
+ "WINDOWS": 49759,
+ "CONCLUS": 49760,
+ "Ġ\"\\": 49761,
+ "umbn": 49762,
+ "(&": 49763,
+ "ãĥ©ãĥ³": 49764,
+ "usercontent": 49765,
+ "ometimes": 49766,
+ "METHOD": 49767,
+ "ãĥ¢": 49768,
+ "potion": 49769,
+ "ãĥ¯": 49770,
+ "everal": 49771,
+ "Ġweap": 49772,
+ "minecraft": 49773,
+ "================================": 49774,
+ "printf": 49775,
+ "ĠShinra": 49776,
+ "Ġreluct": 49777,
+ "\\\",": 49778,
+ "Runtime": 49779,
+ "xff": 49780,
+ "ĠAbyssal": 49781,
+ "akeru": 49782,
+ "Ġ\\(\\": 49783,
+ "\"/>": 49784,
+ "efficients": 49785,
+ "Ü": 49786,
+ "avascript": 49787,
+ "Ġbehavi": 49788,
+ "++;": 49789,
+ "=#": 49790,
+ "Attributes": 49791,
+ "âĵĺ": 49792,
+ "lvl": 49793,
+ "¬¼": 49794,
+ "/**": 49795,
+ "Gameplay": 49796,
+ "ĠLeilan": 49797,
+ ">)": 49798,
+ "=\"/": 49799,
+ "Ġ));": 49800,
+ "ãĥĨãĤ£": 49801,
+ "ġ": 49802,
+ ".": 49803,
+ "Ġantidepress": 49804,
+ "Ġhtt": 49805,
+ "################": 49806,
+ "arnaev": 49807,
+ "ãĤ½": 49808,
+ "DERR": 49809,
+ "¥µ": 49810,
+ "âĸĪ": 49811,
+ "Ġ|--": 49812,
+ "Ġundermin": 49813,
+ "Ġ)))": 49814,
+ "ãĥĩãĤ£": 49815,
+ "awaru": 49816,
+ "\":[{\"": 49817,
+ "aution": 49818,
+ "ãĤ¤ãĥĪ": 49819,
+ "ô": 49820,
+ "ĠILCS": 49821,
+ "dfx": 49822,
+ "ĨĴ": 49823,
+ "âĸĴ": 49824,
+ "Ġcitiz": 49825,
+ "Ġ-=": 49826,
+ "ĠAllaah": 49827,
+ "Ġ(_": 49828,
+ "ĸļ": 49829,
+ "Ġ{\\": 49830,
+ "Ġsrf": 49831,
+ "ãĤ´": 49832,
+ "æŃ¦": 49833,
+ "»Ĵ": 49834,
+ "Ptr": 49835,
+ "'>": 49836,
+ "DEBUG": 49837,
+ "âĶģ": 49838,
+ "ãĢı": 49839,
+ "WithNo": 49840,
+ "Redditor": 49841,
+ "ĠâĶľ": 49842,
+ "Ġfmt": 49843,
+ "ãĢİ": 49844,
+ "Ġmsec": 49845,
+ "ĪĴ": 49846,
+ "eatures": 49847,
+ "itially": 49848,
+ "\"\"\"": 49849,
+ "ãĥ¼ãĤ¯": 49850,
+ "Textures": 49851,
+ "\"},": 49852,
+ "\">": 49853,
+ "Ġenthusi": 49854,
+ "CHAPTER": 49855,
+ "Ġunbeliev": 49856,
+ "Ġearthqu": 49857,
+ "Ġ><": 49858,
+ "||||": 49859,
+ "ß": 49860,
+ "iterator": 49861,
+ "è£ħ": 49862,
+ "Ĥª": 49863,
+ "ojure": 49864,
+ "ãħĭãħĭ": 49865,
+ "ãĥ¼ãĥ³": 49866,
+ "Ġprintln": 49867,
+ "Ġ][": 49868,
+ "âĸĪâĸĪ": 49869,
+ "âķIJ": 49870,
+ "\\\":": 49871,
+ "senal": 49872,
+ "é¾į": 49873,
+ "é¾": 49874,
+ "Ġcryst": 49875,
+ "ãĥķãĤ¡": 49876,
+ "ĠCosponsors": 49877,
+ "ãĤ·ãĥ£": 49878,
+ "Magikarp": 49879,
+ "ĠMagicka": 49880,
+ "âĸĪâĸĪâĸĪâĸĪ": 49881,
+ ",,,,,,,,": 49882,
+ "vertisement": 49883,
+ "âĶĢâĶĢâĶĢâĶĢ": 49884,
+ "ãĥķãĤ©": 49885,
+ "luaj": 49886,
+ "CLASSIFIED": 49887,
+ ".''.": 49888,
+ "byss": 49889,
+ "Ġ{:": 49890,
+ "ĠNanto": 49891,
+ "Ġptr": 49892,
+ "Ġ%%": 49893,
+ "Ġteasp": 49894,
+ "[_": 49895,
+ "ãĥ¤": 49896,
+ "ħĭ": 49897,
+ "ŃĶ": 49898,
+ "Ġpci": 49899,
+ "Ġ\"<": 49900,
+ "GGGGGGGG": 49901,
+ "æĪ¦": 49902,
+ "--+": 49903,
+ "ãĤ®": 49904,
+ "Ġ())": 49905,
+ "âĸ¬": 49906,
+ "Ġsizeof": 49907,
+ "}}}": 49908,
+ ";;;;;;;;": 49909,
+ ">]": 49910,
+ "âĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪ": 49911,
+ "Vaults": 49912,
+ "Ġistg": 49913,
+ "Ġnewcom": 49914,
+ "=]": 49915,
+ "¿½": 49916,
+ "ĵĺ": 49917,
+ "{\\": 49918,
+ "Args": 49919,
+ "Ġexha": 49920,
+ "(\\": 49921,
+ "Ġunnecess": 49922,
+ "\"}],\"": 49923,
+ "ĠUNCLASSIFIED": 49924,
+ ">(": 49925,
+ "ãĤ¢ãĥ«": 49926,
+ "æ©": 49927,
+ "70710": 49928,
+ "Ń·": 49929,
+ "ãĥ¼ãĥĨãĤ£": 49930,
+ "ĠSakuya": 49931,
+ "ãĥĥãĥī": 49932,
+ "ĠPyrrha": 49933,
+ "escription": 49934,
+ "VIDIA": 49935,
+ "================================================================": 49936,
+ "Ġlooph": 49937,
+ "=~": 49938,
+ "Ġcumbers": 49939,
+ "Ġ)]": 49940,
+ "govtrack": 49941,
+ "ĠãĤµ": 49942,
+ "Ġsubur": 49943,
+ "Þ": 49944,
+ "Ġâī¡": 49945,
+ "Interstitial": 49946,
+ "ãĥ¼ãĥĨ": 49947,
+ "Ġgobl": 49948,
+ "ãĥīãĥ©": 49949,
+ "oldown": 49950,
+ "ģĸ": 49951,
+ "Depths": 49952,
+ "Ġ());": 49953,
+ "Ġ._": 49954,
+ "20439": 49955,
+ "Ġç¥ŀ": 49956,
+ "ãģ®å®": 49957,
+ "ãĤ¼": 49958,
+ "Ġ$\\": 49959,
+ "âĹ¼": 49960,
+ "Ġencount": 49961,
+ "Ġ": 48457,
+ "Ġstreng": 48458,
+ "agascar": 48459,
+ "guyen": 48460,
+ "((": 48461,
+ ")[": 48462,
+ "ĠNorn": 48463,
+ "Ġhippocamp": 48464,
+ "Ġ¯": 48465,
+ "îĢ": 48466,
+ "Connection": 48467,
+ "PATH": 48468,
+ "mbuds": 48469,
+ "ĠShards": 48470,
+ "Ġadvoc": 48471,
+ "Ġsimulac": 48472,
+ "âĸij": 48473,
+ "!?\"": 48474,
+ "ĠPotion": 48475,
+ "Ġamulet": 48476,
+ "ĠFnatic": 48477,
+ "Ġcryptoc": 48478,
+ "wav": 48479,
+ "radius": 48480,
+ "pkg": 48481,
+ "ĠMFT": 48482,
+ "æĢ": 48483,
+ "Ġtoile": 48484,
+ "Items": 48485,
+ "ifference": 48486,
+ "errors": 48487,
+ "ĠCelt": 48488,
+ "Ġunpop": 48489,
+ "ilogy": 48490,
+ "6666": 48491,
+ "hesda": 48492,
+ "Instruct": 48493,
+ "å·": 48494,
+ "Materials": 48495,
+ "ettings": 48496,
+ "Percent": 48497,
+ "Ġresistor": 48498,
+ "tymology": 48499,
+ "Ġdeprecated": 48500,
+ "Ġgrep": 48501,
+ "ĠWRITE": 48502,
+ "Ġtriv": 48503,
+ "Ġscrut": 48504,
+ "[/": 48505,
+ "anyl": 48506,
+ "skirts": 48507,
+ "MSN": 48508,
+ "ĠCodec": 48509,
+ "ecd": 48510,
+ "Anth": 48511,
+ "){": 48512,
+ "%]": 48513,
+ "veyard": 48514,
+ "aspberry": 48515,
+ "ãĢ": 48516,
+ "Reward": 48517,
+ "rha": 48518,
+ "Stretch": 48519,
+ "]-": 48520,
+ "Prev": 48521,
+ "Context": 48522,
+ "Ġlinux": 48523,
+ "HAHA": 48524,
+ "perties": 48525,
+ "ĠVIDE": 48526,
+ "Domain": 48527,
+ "Ġmurd": 48528,
+ "ĠLegions": 48529,
+ "apache": 48530,
+ "æŃ": 48531,
+ "Pause": 48532,
+ "Temperature": 48533,
+ "ufact": 48534,
+ "igslist": 48535,
+ "ĠRetrieved": 48536,
+ "èª": 48537,
+ "ãģĮ": 48538,
+ "Ingredients": 48539,
+ "ruary": 48540,
+ "dyl": 48541,
+ "Alias": 48542,
+ "ĠÎĶ": 48543,
+ "Ġinval": 48544,
+ "amsung": 48545,
+ "!--": 48546,
+ "olean": 48547,
+ "æī": 48548,
+ "ãģ¯": 48549,
+ "Ġcoefficients": 48550,
+ "ĠDHCP": 48551,
+ "âĨĴ": 48552,
+ "utonium": 48553,
+ ":[": 48554,
+ "âĹ": 48555,
+ "cli": 48556,
+ "Container": 48557,
+ "å¼": 48558,
+ "nexus": 48559,
+ "SOURCE": 48560,
+ "Ò": 48561,
+ "=/": 48562,
+ "Ġmysql": 48563,
+ "ĠGained": 48564,
+ "Ġ/*": 48565,
+ "uncture": 48566,
+ "Ġstatically": 48567,
+ "âĸł": 48568,
+ "æĺ¯": 48569,
+ "æ°": 48570,
+ "estamp": 48571,
+ "Cache": 48572,
+ "ulkan": 48573,
+ "staking": 48574,
+ "apter": 48575,
+ "ãģ¾": 48576,
+ "Ġμg": 48577,
+ "Ġtremend": 48578,
+ "ĠPiercing": 48579,
+ "naissance": 48580,
+ "ĠHealer": 48581,
+ "Enabled": 48582,
+ "éģ": 48583,
+ "âĸ": 48584,
+ "ĠThumbnails": 48585,
+ "Ġhither": 48586,
+ "Format": 48587,
+ "utherland": 48588,
+ "íķ": 48589,
+ "Ġdestro": 48590,
+ "fff": 48591,
+ "execute": 48592,
+ "msg": 48593,
+ "romancer": 48594,
+ "ĠCanaver": 48595,
+ "ĠVaults": 48596,
+ "oided": 48597,
+ "iage": 48598,
+ "Ġimg": 48599,
+ "summary": 48600,
+ "]);": 48601,
+ "ĠABE": 48602,
+ "ĠGamergate": 48603,
+ "utherford": 48604,
+ "Ġoverwrite": 48605,
+ "enment": 48606,
+ "æķ": 48607,
+ "Ġsystemd": 48608,
+ "tif": 48609,
+ "]).": 48610,
+ "ãĤ¤": 48611,
+ "Widget": 48612,
+ "======": 48613,
+ "(-": 48614,
+ "Ġ\"+": 48615,
+ "ĠIncarnation": 48616,
+ "æĥ": 48617,
+ "���": 48618,
+ "GUI": 48619,
+ "èĥ": 48620,
+ "forums": 48621,
+ "Ġrunes": 48622,
+ "Ġâī¤": 48623,
+ "Ġdefic": 48624,
+ "Distance": 48625,
+ "directory": 48626,
+ "ĠHorus": 48627,
+ "iltr": 48628,
+ "ortium": 48629,
+ "Ġ./": 48630,
+ "bda": 48631,
+ "owship": 48632,
+ "ĠâĨij": 48633,
+ "}.": 48634,
+ "åĩ": 48635,
+ "1027": 48636,
+ "Weapons": 48637,
+ "lucent": 48638,
+ "Ġauth": 48639,
+ ";;": 48640,
+ "Recommended": 48641,
+ "Ġsurv": 48642,
+ "Ġvm": 48643,
+ "ĠStronghold": 48644,
+ "Ġparan": 48645,
+ "ĠTrance": 48646,
+ "æĺ": 48647,
+ "Ġsovere": 48648,
+ "Ġcorrid": 48649,
+ "ĠPwr": 48650,
+ "Ġ[/": 48651,
+ "Ġseq": 48652,
+ "Population": 48653,
+ "Ġ[];": 48654,
+ "Ġreferen": 48655,
+ "ĠInstr": 48656,
+ "ĠStamina": 48657,
+ "kernel": 48658,
+ "Python": 48659,
+ "-+": 48660,
+ "Ġallele": 48661,
+ "éĽ": 48662,
+ "isode": 48663,
+ "ä¸į": 48664,
+ "otonin": 48665,
+ "modules": 48666,
+ "Notable": 48667,
+ "Spell": 48668,
+ "\\\\": 48669,
+ "Pref": 48670,
+ "Ġdatas": 48671,
+ "setup": 48672,
+ "Ġhapl": 48673,
+ "Height": 48674,
+ "åĭ": 48675,
+ "ãģ£": 48676,
+ "]),": 48677,
+ "Handle": 48678,
+ "umenthal": 48679,
+ "Package": 48680,
+ "Ġenthus": 48681,
+ "Ġunsus": 48682,
+ "Narr": 48683,
+ "Examples": 48684,
+ "FAQ": 48685,
+ "REDACTED": 48686,
+ "Ġnotor": 48687,
+ "Enable": 48688,
+ "Pattern": 48689,
+ "aeda": 48690,
+ ">.": 48691,
+ "CHECK": 48692,
+ "Ġ����": 48693,
+ "Ġ'.": 48694,
+ "Ġãĥ": 48695,
+ "append": 48696,
+ "����": 48697,
+ "gemony": 48698,
+ "terness": 48699,
+ "ĠHaku": 48700,
+ "NVIDIA": 48701,
+ "queue": 48702,
+ "Bind": 48703,
+ "Ġneigh": 48704,
+ "armor": 48705,
+ "retty": 48706,
+ "LOD": 48707,
+ "plugins": 48708,
+ "Ġ/>": 48709,
+ "TYPE": 48710,
+ "Ġ4096": 48711,
+ "-------": 48712,
+ "Preview": 48713,
+ "FML": 48714,
+ "Ġproletarian": 48715,
+ "zees": 48716,
+ "enfranch": 48717,
+ "ãģĨ": 48718,
+ "Ctrl": 48719,
+ "Module": 48720,
+ "ĠSurviv": 48721,
+ "ĠStarcraft": 48722,
+ "rored": 48723,
+ "reddit": 48724,
+ "Ġrul": 48725,
+ "Ġtx": 48726,
+ "Ġmage": 48727,
+ "Sword": 48728,
+ "Ġ~/": 48729,
+ "Effects": 48730,
+ "éļ": 48731,
+ "ä¹": 48732,
+ "Sensor": 48733,
+ "Solution": 48734,
+ "ãģĻ": 48735,
+ "Arcade": 48736,
+ "Ġpredec": 48737,
+ "Values": 48738,
+ "Length": 48739,
+ "Ġfortun": 48740,
+ "ttp": 48741,
+ "\"[": 48742,
+ "tmp": 48743,
+ "ĠBerserker": 48744,
+ "åĨ": 48745,
+ "ositories": 48746,
+ "Ġcouncill": 48747,
+ "ffff": 48748,
+ "));": 48749,
+ "Recipe": 48750,
+ "ĠASCII": 48751,
+ "âĦ¢:": 48752,
+ "ä": 48753,
+ "Ġhorm": 48754,
+ "=>": 48755,
+ "sers": 48756,
+ "ãģĭ": 48757,
+ "Recommend": 48758,
+ "['": 48759,
+ "agame": 48760,
+ "Animation": 48761,
+ "aucuses": 48762,
+ "Discussion": 48763,
+ "Ġhelicop": 48764,
+ "å¿": 48765,
+ "Float": 48766,
+ "Component": 48767,
+ "instance": 48768,
+ "Ġfoo": 48769,
+ "localhost": 48770,
+ "=-": 48771,
+ "Offset": 48772,
+ "Psy": 48773,
+ "ĠGohan": 48774,
+ "buquerque": 48775,
+ "Ġdefe": 48776,
+ "chwitz": 48777,
+ "parse": 48778,
+ "Ġdors": 48779,
+ "Ġspons": 48780,
+ "Ġasync": 48781,
+ "agonists": 48782,
+ "Ġindo": 48783,
+ ".>>": 48784,
+ "ĠDisciple": 48785,
+ "Ġfilename": 48786,
+ "rency": 48787,
+ "ĠDise": 48788,
+ "Ġ\"/": 48789,
+ "template": 48790,
+ "ãĤ¹": 48791,
+ "swers": 48792,
+ "Ġ++": 48793,
+ "Ġ[(": 48794,
+ "thora": 48795,
+ "ĠDepths": 48796,
+ "livious": 48797,
+ "Ġdisadvant": 48798,
+ "foundland": 48799,
+ "Upload": 48800,
+ "Ġ§§": 48801,
+ "Ġsophistic": 48802,
+ ";}": 48803,
+ "izont": 48804,
+ "\"}": 48805,
+ "estial": 48806,
+ "Ranked": 48807,
+ "ĠOccupations": 48808,
+ "LEASE": 48809,
+ "ĠOgre": 48810,
+ "folder": 48811,
+ "Plot": 48812,
+ "farious": 48813,
+ "Ġsuscept": 48814,
+ "Types": 48815,
+ "Discuss": 48816,
+ "Ġ'/": 48817,
+ "æµ": 48818,
+ "earable": 48819,
+ "æ³": 48820,
+ "Tile": 48821,
+ "iatus": 48822,
+ "åŃ": 48823,
+ "Ġreperto": 48824,
+ "Helper": 48825,
+ "Returns": 48826,
+ "ä¸Ĭ": 48827,
+ "imaru": 48828,
+ "Ġreq": 48829,
+ "Ġdissatisf": 48830,
+ "multipl": 48831,
+ "}{": 48832,
+ "-[": 48833,
+ "itial": 48834,
+ "*/": 48835,
+ "Config": 48836,
+ "Example": 48837,
+ "ĠjQuery": 48838,
+ "Mods": 48839,
+ "ĠGPIO": 48840,
+ "Ġlaun": 48841,
+ "layout": 48842,
+ "cised": 48843,
+ "Ġ......": 48844,
+ "+++": 48845,
+ "prototype": 48846,
+ "Exception": 48847,
+ "Ġsubsections": 48848,
+ "Ġresemb": 48849,
+ "Ġâĩ": 48850,
+ "ĠPubMed": 48851,
+ "username": 48852,
+ "Ġaggro": 48853,
+ "éĥ": 48854,
+ "Ġ};": 48855,
+ "ĠMages": 48856,
+ "ryu": 48857,
+ "apons": 48858,
+ "Optional": 48859,
+ "ĠAncients": 48860,
+ "ãĤĬ": 48861,
+ "Quotes": 48862,
+ "oaded": 48863,
+ "Ġsuspic": 48864,
+ "inline": 48865,
+ "omial": 48866,
+ "ĠMahjong": 48867,
+ "auntlets": 48868,
+ "Ġanarchism": 48869,
+ "Ġsubclass": 48870,
+ "ĠMLG": 48871,
+ "...]": 48872,
+ "Dialog": 48873,
+ "uphem": 48874,
+ "Ġrecursive": 48875,
+ "7601": 48876,
+ "frac": 48877,
+ "Else": 48878,
+ "ĠSeverus": 48879,
+ "},{\"": 48880,
+ "ĠCLIENT": 48881,
+ "Ġjavascript": 48882,
+ "sama": 48883,
+ "ĠLearns": 48884,
+ "ãĤĤ": 48885,
+ "Upgrade": 48886,
+ "Listener": 48887,
+ "Ġsnipp": 48888,
+ "Ġrune": 48889,
+ "ĠTTL": 48890,
+ "ertation": 48891,
+ "olicy": 48892,
+ "=\"\"": 48893,
+ "«ĺ": 48894,
+ "Ġexpr": 48895,
+ "ovych": 48896,
+ "Ġãģ": 48897,
+ "_-_": 48898,
+ "munition": 48899,
+ "////": 48900,
+ "func": 48901,
+ ">>>>": 48902,
+ "Provider": 48903,
+ "Ïī": 48904,
+ "BUG": 48905,
+ "Ġ[-": 48906,
+ "Ġarrang": 48907,
+ "merce": 48908,
+ "ãĥ": 48909,
+ "incarn": 48910,
+ "Valid": 48911,
+ "ĠAether": 48912,
+ "ãĤĵ": 48913,
+ "ĠUTF": 48914,
+ "ĠMonstrous": 48915,
+ "ãĤĮ": 48916,
+ "hedon": 48917,
+ "áµ": 48918,
+ ":#": 48919,
+ "ĠFrieza": 48920,
+ "padding": 48921,
+ "Reviewer": 48922,
+ "Ġpsychiat": 48923,
+ "yrinth": 48924,
+ "ĠâĶĤ": 48925,
+ "hillary": 48926,
+ "Static": 48927,
+ "Newsletter": 48928,
+ "Avg": 48929,
+ "Ġfn": 48930,
+ "Topic": 48931,
+ "choes": 48932,
+ "Ġnewsp": 48933,
+ "á¸": 48934,
+ "Ġ[+": 48935,
+ "~~~~~~~~~~~~~~~~": 48936,
+ ":]": 48937,
+ "apego": 48938,
+ "buf": 48939,
+ "Translation": 48940,
+ "ById": 48941,
+ "Ġmmol": 48942,
+ "ãĥ¼ãĥ": 48943,
+ "å½": 48944,
+ "ãĤī": 48945,
+ "Ġparser": 48946,
+ "ãĥª": 48947,
+ "`,": 48948,
+ "Lair": 48949,
+ ")}": 48950,
+ "ypes": 48951,
+ "adobe": 48952,
+ "Ġancest": 48953,
+ "ernel": 48954,
+ "ĠNULL": 48955,
+ "ç«": 48956,
+ "anguages": 48957,
+ "Increases": 48958,
+ "æĦ": 48959,
+ "utorial": 48960,
+ "ithmetic": 48961,
+ "dll": 48962,
+ "ĠArcane": 48963,
+ "çī": 48964,
+ "Ġtc": 48965,
+ "urtles": 48966,
+ "èĪ": 48967,
+ "Bytes": 48968,
+ "Slot": 48969,
+ "ĠBahá": 48970,
+ "Weapon": 48971,
+ "widget": 48972,
+ "querque": 48973,
+ "Ġembodiments": 48974,
+ "å¥": 48975,
+ "WARN": 48976,
+ "swer": 48977,
+ "thumbnails": 48978,
+ "FFFF": 48979,
+ "inguishable": 48980,
+ "Ġâī": 48981,
+ "Ġ${": 48982,
+ "AAAAAAAA": 48983,
+ "Conclusion": 48984,
+ "ĻĤ": 48985,
+ "disable": 48986,
+ "Rect": 48987,
+ "Ġsubp": 48988,
+ "Ġ().": 48989,
+ "ĠDetected": 48990,
+ "èĢ": 48991,
+ "[]": 48992,
+ "Ġcoerc": 48993,
+ "ĠmM": 48994,
+ "recated": 48995,
+ "fusc": 48996,
+ "ĠSorce": 48997,
+ "çĶŁ": 48998,
+ ").[": 48999,
+ "Ġ})": 49000,
+ "mobi": 49001,
+ "yip": 49002,
+ "Acknowled": 49003,
+ "ternity": 49004,
+ "iqueness": 49005,
+ "ython": 49006,
+ "><": 49007,
+ "Ġstd": 49008,
+ "Url": 49009,
+ "Ġnamespace": 49010,
+ "Ġtion": 49011,
+ "oother": 49012,
+ "Ó": 49013,
+ "Ġhemor": 49014,
+ "Ġrg": 49015,
+ "ventory": 49016,
+ "ãĤ¢": 49017,
+ "anamo": 49018,
+ "Socket": 49019,
+ "Topics": 49020,
+ "apeshifter": 49021,
+ "gnu": 49022,
+ "Ġdetrim": 49023,
+ "`.": 49024,
+ "romeda": 49025,
+ "çIJ": 49026,
+ "Ġlambda": 49027,
+ "Compan": 49028,
+ "Variable": 49029,
+ "Ġusb": 49030,
+ "ĠAdamant": 49031,
+ "ournal": 49032,
+ "Ġcovari": 49033,
+ "ãĥ©": 49034,
+ "éĸ": 49035,
+ "åİ": 49036,
+ "otaur": 49037,
+ "Ġ(),": 49038,
+ "Marginal": 49039,
+ "ãģı": 49040,
+ "Ġphysic": 49041,
+ "adeon": 49042,
+ "RESULTS": 49043,
+ "200000": 49044,
+ "ãģį": 49045,
+ "udeb": 49046,
+ "ãģĵ": 49047,
+ "COMPLE": 49048,
+ "Ġmsg": 49049,
+ "ghazi": 49050,
+ "/*": 49051,
+ "ĠDeity": 49052,
+ "Ġdisapp": 49053,
+ "Availability": 49054,
+ "Ġillum": 49055,
+ "à©": 49056,
+ "ptives": 49057,
+ ",âĢĶ": 49058,
+ "chnology": 49059,
+ "Ġaccur": 49060,
+ "Ġapi": 49061,
+ "Obj": 49062,
+ "ãĤ«": 49063,
+ "ãĤ¸": 49064,
+ "ä¹ĭ": 49065,
+ "ËĪ": 49066,
+ "Ġtcp": 49067,
+ "Required": 49068,
+ ".<": 49069,
+ "\".[": 49070,
+ "Ġ~/.": 49071,
+ "Ġobser": 49072,
+ "RFC": 49073,
+ "Ġintegers": 49074,
+ "åī": 49075,
+ "Installation": 49076,
+ "Ô": 49077,
+ "ó": 49078,
+ "csv": 49079,
+ "ãĥ«": 49080,
+ "ĠNoticed": 49081,
+ "âĸĵ": 49082,
+ "Tumblr": 49083,
+ "Reply": 49084,
+ "||": 49085,
+ "Ġconclud": 49086,
+ "Ġ))": 49087,
+ "ebin": 49088,
+ "sql": 49089,
+ "Closure": 49090,
+ "++++": 49091,
+ "],[": 49092,
+ "âĹı": 49093,
+ "Ġprolet": 49094,
+ "Ġ>=": 49095,
+ "estinal": 49096,
+ "Ġ[*": 49097,
+ "ĠInquisitor": 49098,
+ "Ġcmd": 49099,
+ "FINE": 49100,
+ "CRIP": 49101,
+ "Ġvertex": 49102,
+ "TeX": 49103,
+ "///": 49104,
+ "Ö¼": 49105,
+ "iscons": 49106,
+ "Ġmyster": 49107,
+ "Changed": 49108,
+ "timeout": 49109,
+ "irtual": 49110,
+ "Methods": 49111,
+ "Ġcerts": 49112,
+ "texture": 49113,
+ "Roaming": 49114,
+ "Proxy": 49115,
+ "Override": 49116,
+ "éĹ": 49117,
+ "utf": 49118,
+ "python": 49119,
+ "ĠRarity": 49120,
+ "ilitarian": 49121,
+ "çľ": 49122,
+ "().": 49123,
+ "æł": 49124,
+ "Ġbuf": 49125,
+ "åij": 49126,
+ "çķ": 49127,
+ "Ġ*.": 49128,
+ "umerable": 49129,
+ "~~~~": 49130,
+ "å¦": 49131,
+ "Ġsimultane": 49132,
+ "Ġjson": 49133,
+ "Requires": 49134,
+ "Ġperl": 49135,
+ "Interface": 49136,
+ "rupal": 49137,
+ "": 49138,
+ "uilt": 49139,
+ "mercial": 49140,
+ "ĠPalestin": 49141,
+ "theless": 49142,
+ ")=": 49143,
+ "Generic": 49144,
+ "&&": 49145,
+ "ALSE": 49146,
+ "Ġdebugger": 49147,
+ "paralle": 49148,
+ "acly": 49149,
+ "ĠScourge": 49150,
+ ")].": 49151,
+ "Ġinstr": 49152,
+ "Ġ{}": 49153,
+ "]+": 49154,
+ "Ġdilig": 49155,
+ "åŃIJ": 49156,
+ "Ġcaptcha": 49157,
+ "kefeller": 49158,
+ "iosyncr": 49159,
+ "Ġchars": 49160,
+ "Ġinitialize": 49161,
+ "Width": 49162,
+ "Ġgithub": 49163,
+ "Ġinitialization": 49164,
+ "ĠGamerGate": 49165,
+ "Ġþ": 49166,
+ "drm": 49167,
+ "slaught": 49168,
+ "Ġtiss": 49169,
+ ".............": 49170,
+ "Ĥ¬": 49171,
+ "Ġplent": 49172,
+ "ãģķ": 49173,
+ "cfg": 49174,
+ "âĨ": 49175,
+ "Ġpokemon": 49176,
+ "\"],": 49177,
+ "Ġtyr": 49178,
+ "SELECT": 49179,
+ "othal": 49180,
+ "Tags": 49181,
+ "ĠMarketable": 49182,
+ "-----------": 49183,
+ "icter": 49184,
+ "irlf": 49185,
+ "ormons": 49186,
+ "Database": 49187,
+ "ĠãĤ": 49188,
+ "Ġ{\"": 49189,
+ "î": 49190,
+ "Handler": 49191,
+ "âĶĢ": 49192,
+ "$$$$": 49193,
+ "ĠJaune": 49194,
+ "ãĤ³": 49195,
+ "(),": 49196,
+ ")+": 49197,
+ "--------": 49198,
+ "Ġshenan": 49199,
+ "Ġwelf": 49200,
+ "Ġ',": 49201,
+ "attribute": 49202,
+ "Uncommon": 49203,
+ "maxwell": 49204,
+ "Browser": 49205,
+ "ĠPastebin": 49206,
+ "uberty": 49207,
+ "debug": 49208,
+ "Ġmosqu": 49209,
+ "ĠBoolean": 49210,
+ "wcs": 49211,
+ "é£": 49212,
+ "/âĢĭ": 49213,
+ "çĦ": 49214,
+ "(){": 49215,
+ "////////////////////////////////": 49216,
+ "ĠGleaming": 49217,
+ "regor": 49218,
+ "ĠMercenary": 49219,
+ "ensional": 49220,
+ "mpeg": 49221,
+ "sudo": 49222,
+ "ãģ®å": 49223,
+ "iggurat": 49224,
+ "vironment": 49225,
+ "Directory": 49226,
+ "ĠDecoder": 49227,
+ "SPONSORED": 49228,
+ "intendo": 49229,
+ "Ġ<=": 49230,
+ "btn": 49231,
+ "ï¸": 49232,
+ "ä½ľ": 49233,
+ "paio": 49234,
+ "Tokens": 49235,
+ "ãĢį": 49236,
+ "params": 49237,
+ "Offline": 49238,
+ "Ġmetab": 49239,
+ "ĠLisp": 49240,
+ "anwhile": 49241,
+ ">:": 49242,
+ "itialized": 49243,
+ "HTTP": 49244,
+ "Trivia": 49245,
+ "Sov": 49246,
+ "wrapper": 49247,
+ "={": 49248,
+ "ĠAzerb": 49249,
+ "aeper": 49250,
+ "Ġneighb": 49251,
+ "initions": 49252,
+ "Ġsts": 49253,
+ "ĠSasuke": 49254,
+ "#$": 49255,
+ "uliffe": 49256,
+ "æĸ¹": 49257,
+ "++++++++++++++++": 49258,
+ "ĠElven": 49259,
+ "ãģĤ": 49260,
+ "Ġartif": 49261,
+ "Folder": 49262,
+ "Ġà¨": 49263,
+ "åĤ": 49264,
+ "Ġphyl": 49265,
+ "uggest": 49266,
+ "blance": 49267,
+ "ãģł": 49268,
+ "Requirements": 49269,
+ "Usage": 49270,
+ "Ġinitialized": 49271,
+ "ã쮿": 49272,
+ "conservancy": 49273,
+ "ĠReincarn": 49274,
+ ")|": 49275,
+ "Ġantioxid": 49276,
+ "ĠClicker": 49277,
+ "Ġunlaw": 49278,
+ "Ġ\\(": 49279,
+ "ãĥĪ": 49280,
+ "Ġ[*]": 49281,
+ "Characters": 49282,
+ "////////": 49283,
+ "ãĢIJ": 49284,
+ "ãĤ·": 49285,
+ "webkit": 49286,
+ "ãĢij": 49287,
+ "Ġxp": 49288,
+ "alkyrie": 49289,
+ "Console": 49290,
+ "());": 49291,
+ "ĠKorra": 49292,
+ "\"))": 49293,
+ "oooooooooooooooo": 49294,
+ "Timer": 49295,
+ "////////////////": 49296,
+ "yout": 49297,
+ "engeance": 49298,
+ "emetery": 49299,
+ "Ġmages": 49300,
+ "mods": 49301,
+ "Null": 49302,
+ "Ġphilos": 49303,
+ "ascript": 49304,
+ "Ġaddon": 49305,
+ "ĠâĸĪ": 49306,
+ "emale": 49307,
+ "----------------------------------------------------------------": 49308,
+ "Ġ\\\\": 49309,
+ "=[": 49310,
+ "ĠParables": 49311,
+ "ãĥĨ": 49312,
+ "VALUE": 49313,
+ "Ġ@@": 49314,
+ "Ġuint": 49315,
+ "${": 49316,
+ "cpp": 49317,
+ "%%": 49318,
+ "Ġ(âĪĴ": 49319,
+ "utils": 49320,
+ "prefix": 49321,
+ "å°Ĩ": 49322,
+ "ãĥŃ": 49323,
+ "Completed": 49324,
+ "Ġgoto": 49325,
+ "ãĤ¯": 49326,
+ "Winged": 49327,
+ "perty": 49328,
+ "[\"": 49329,
+ "ãĥİ": 49330,
+ "ĠScythe": 49331,
+ "Ġæľ": 49332,
+ "Ġ!=": 49333,
+ "Buffer": 49334,
+ "docker": 49335,
+ "ĠWATCHED": 49336,
+ "èĢħ": 49337,
+ "())": 49338,
+ "Ġdst": 49339,
+ "SIZE": 49340,
+ "ĠDemonic": 49341,
+ "Ġresil": 49342,
+ "ãĤ¿": 49343,
+ "Ġpione": 49344,
+ "cpu": 49345,
+ "++)": 49346,
+ "TEXT": 49347,
+ "Ġdiscrep": 49348,
+ "debian": 49349,
+ "quished": 49350,
+ "Ġacknow": 49351,
+ "Ġtrave": 49352,
+ "Ġgcc": 49353,
+ "Catalog": 49354,
+ "ctrl": 49355,
+ "ĠMoroc": 49356,
+ "Ġcpu": 49357,
+ "Ġ];": 49358,
+ "ĠSorceress": 49359,
+ "Introduced": 49360,
+ "Frames": 49361,
+ "Ġcondem": 49362,
+ "¶æ": 49363,
+ "~~~~~~~~": 49364,
+ "ĠEmacs": 49365,
+ "][/": 49366,
+ "Ġglim": 49367,
+ "Init": 49368,
+ "ĠPrimordial": 49369,
+ "ãĥĥ": 49370,
+ "Ġ+=": 49371,
+ "Ġblat": 49372,
+ "à¼": 49373,
+ "------------------------------------------------": 49374,
+ "gpu": 49375,
+ "ãĥĥãĥĪ": 49376,
+ "Ġxml": 49377,
+ "Ġboolean": 49378,
+ "References": 49379,
+ "Ġ?)": 49380,
+ "Ġsatell": 49381,
+ "Queue": 49382,
+ "Ġpestic": 49383,
+ "Ġ}}": 49384,
+ "Attribute": 49385,
+ "Ġdx": 49386,
+ "ĠDefin": 49387,
+ "Synopsis": 49388,
+ "..................": 49389,
+ "ãĥ¬": 49390,
+ "plugin": 49391,
+ "Disable": 49392,
+ "0000000000000000": 49393,
+ ")\\": 49394,
+ "ĠIchigo": 49395,
+ "println": 49396,
+ "rontal": 49397,
+ "Setup": 49398,
+ "Ġ��������": 49399,
+ "å§": 49400,
+ "âĸº": 49401,
+ "ĠPengu": 49402,
+ "ailability": 49403,
+ "Duration": 49404,
+ "Timeout": 49405,
+ "ãĢĮ": 49406,
+ "Ġbehav": 49407,
+ "Reviewed": 49408,
+ "Ġtoget": 49409,
+ "\\.": 49410,
+ "lished": 49411,
+ "Ġthous": 49412,
+ "Ġperpend": 49413,
+ "ecause": 49414,
+ "Layout": 49415,
+ "è»": 49416,
+ "ĠDexterity": 49417,
+ "unsigned": 49418,
+ "+=": 49419,
+ "[[": 49420,
+ "ĠRunes": 49421,
+ "ãĤ¦": 49422,
+ "};": 49423,
+ "})": 49424,
+ "FTWARE": 49425,
+ "ength": 49426,
+ "milo": 49427,
+ "duino": 49428,
+ "天": 49429,
+ "ĠClojure": 49430,
+ "ļé": 49431,
+ "ãĥ¥": 49432,
+ "gradient": 49433,
+ "Ġ\"\"\"": 49434,
+ "âĨij": 49435,
+ "@#": 49436,
+ "JSON": 49437,
+ "Ġproport": 49438,
+ "addr": 49439,
+ "});": 49440,
+ "ãĥIJ": 49441,
+ "ä¸ī": 49442,
+ "Ġtmp": 49443,
+ "å£": 49444,
+ "../": 49445,
+ "zsche": 49446,
+ "Ġâμ": 49447,
+ "Entity": 49448,
+ "æ©Ł": 49449,
+ "ĠâĶľâĶĢâĶĢ": 49450,
+ "filename": 49451,
+ "{{": 49452,
+ "@@": 49453,
+ "ĠSeym": 49454,
+ "Ġ/**": 49455,
+ "ĠSummoner": 49456,
+ "Quantity": 49457,
+ "ç·": 49458,
+ "Attach": 49459,
+ "Ġbool": 49460,
+ "Texture": 49461,
+ "Ġopio": 49462,
+ ".}": 49463,
+ "ãĥĭ": 49464,
+ "integer": 49465,
+ "Ġregex": 49466,
+ "Ġnomine": 49467,
+ "ription": 49468,
+ "ãģ®ç": 49469,
+ "ãĥķ": 49470,
+ "Ġsubparagraph": 49471,
+ "GGGG": 49472,
+ "Ġexplan": 49473,
+ "Header": 49474,
+ "Spawn": 49475,
+ "toggle": 49476,
+ "²¾": 49477,
+ "Abyss": 49478,
+ "expr": 49479,
+ "ĠZerg": 49480,
+ "ĠGrimoire": 49481,
+ "Contents": 49482,
+ "Instance": 49483,
+ "cyclopedia": 49484,
+ "ãĥĹ": 49485,
+ "ĠTakeru": 49486,
+ "=(": 49487,
+ "代": 49488,
+ "\\)": 49489,
+ "Ġrgb": 49490,
+ "htt": 49491,
+ "bryce": 49492,
+ "Ġlivest": 49493,
+ "ĠAnnotations": 49494,
+ "âĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢ": 49495,
+ "berus": 49496,
+ "ntil": 49497,
+ "Ġskelet": 49498,
+ "callback": 49499,
+ "åħī": 49500,
+ "Joined": 49501,
+ "ãĤª": 49502,
+ "Ġargs": 49503,
+ "artifacts": 49504,
+ "Ġå¤": 49505,
+ "ÃĽ": 49506,
+ "ãĥŀ": 49507,
+ "Streamer": 49508,
+ "}\"": 49509,
+ "Ġunden": 49510,
+ "ãĥģ": 49511,
+ "Īè": 49512,
+ "ãĥ£": 49513,
+ "Ġ0004": 49514,
+ "Ġ\\'": 49515,
+ "ãĤ°": 49516,
+ "ĠCONFIG": 49517,
+ "Ġ#####": 49518,
+ "``": 49519,
+ "anguage": 49520,
+ "Ġ*)": 49521,
+ "Template": 49522,
+ "MODE": 49523,
+ "Ġ00000000": 49524,
+ "'';": 49525,
+ ">": 49526,
+ "士": 49527,
+ "essage": 49528,
+ "ntax": 49529,
+ "Cmd": 49530,
+ "ividual": 49531,
+ "Unix": 49532,
+ "è£": 49533,
+ "çĭ": 49534,
+ "使": 49535,
+ "():": 49536,
+ "ãĥī": 49537,
+ "gdala": 49538,
+ "etheless": 49539,
+ "ktop": 49540,
+ "ĠACPI": 49541,
+ "ãĥĸ": 49542,
+ "Ġsshd": 49543,
+ "Ġ000000": 49544,
+ "Ġchalleng": 49545,
+ "âĶĢâĶĢ": 49546,
+ "ĠFlavoring": 49547,
+ "çİĭ": 49548,
+ "Http": 49549,
+ "Ĭ±": 49550,
+ "Accessory": 49551,
+ "oldemort": 49552,
+ "ĠIzan": 49553,
+ "galitarian": 49554,
+ "ĠChocobo": 49555,
+ "edIn": 49556,
+ "++++++++": 49557,
+ "Ġprintf": 49558,
+ "çīĪ": 49559,
+ "izoph": 49560,
+ "ruciating": 49561,
+ "Ġenum": 49562,
+ ",,,,": 49563,
+ "Ġpregn": 49564,
+ "sembly": 49565,
+ "Ġtherap": 49566,
+ "Ġingred": 49567,
+ "ãĤµ": 49568,
+ "Ġsql": 49569,
+ "(*": 49570,
+ "Appearance": 49571,
+ "ngth": 49572,
+ "invoke": 49573,
+ "ãĥĥãĤ¯": 49574,
+ "ctx": 49575,
+ "Ġdmg": 49576,
+ "Plugin": 49577,
+ "ãĥ¡": 49578,
+ "ulhu": 49579,
+ "ãĤ§": 49580,
+ "Ġwarr": 49581,
+ "Ġmetic": 49582,
+ "女": 49583,
+ "Ġoun": 49584,
+ "ð": 49585,
+ "Ġtooltip": 49586,
+ "ãĤŃ": 49587,
+ "Ġvolunte": 49588,
+ "imgur": 49589,
+ "accompan": 49590,
+ "aterasu": 49591,
+ "olkien": 49592,
+ "ãĤº": 49593,
+ "Ġnodd": 49594,
+ "ĠMetatron": 49595,
+ "javascript": 49596,
+ "umbledore": 49597,
+ "ãĥł": 49598,
+ "--------------------------------------------------------": 49599,
+ "runtime": 49600,
+ "ĠLeban": 49601,
+ "Configuration": 49602,
+ "emort": 49603,
+ "(_": 49604,
+ "Connector": 49605,
+ "iosyn": 49606,
+ "reddits": 49607,
+ "Ġ\"%": 49608,
+ "Ġ[&": 49609,
+ "ĠSwordsman": 49610,
+ "ĠAwoken": 49611,
+ "Ġ;;": 49612,
+ "ãĥ¼ãĥ«": 49613,
+ "Ġ:=": 49614,
+ "ãĤ¹ãĥĪ": 49615,
+ "Ġcomr": 49616,
+ "Adapter": 49617,
+ "sbm": 49618,
+ "âķIJâķIJ": 49619,
+ "çļ": 49620,
+ "Loader": 49621,
+ "ãĥĵ": 49622,
+ "okemon": 49623,
+ "ãģ®é": 49624,
+ "-->": 49625,
+ "Ġlvl": 49626,
+ "Footnote": 49627,
+ "Iter": 49628,
+ "####": 49629,
+ "ãĥij": 49630,
+ "ĠCarbuncle": 49631,
+ "Ġ[+]": 49632,
+ "Ġmathemat": 49633,
+ "Allows": 49634,
+ "Ġ4090": 49635,
+ "Async": 49636,
+ "ģ«": 49637,
+ "Ͻ": 49638,
+ "))))": 49639,
+ "á½": 49640,
+ "Ġcx": 49641,
+ "Ġansw": 49642,
+ "{\"": 49643,
+ "ãĥŁ": 49644,
+ "addons": 49645,
+ "Filename": 49646,
+ "Appearances": 49647,
+ "ĠãĢĮ": 49648,
+ "Ġaddr": 49649,
+ "Ġcharact": 49650,
+ "glomer": 49651,
+ "Advertisements": 49652,
+ "Ġdracon": 49653,
+ "ĠFenrir": 49654,
+ "Ġ();": 49655,
+ "ĠCitiz": 49656,
+ "acebook": 49657,
+ "Ġparams": 49658,
+ "]=": 49659,
+ "Ġsubscript": 49660,
+ "Ġentreprene": 49661,
+ "tnc": 49662,
+ "iversal": 49663,
+ "Ġmillenn": 49664,
+ "ithub": 49665,
+ "/>": 49666,
+ "Ġ\"{": 49667,
+ "Frameworks": 49668,
+ "avorite": 49669,
+ "Ġ])": 49670,
+ "Constructed": 49671,
+ "fml": 49672,
+ "ãĥį": 49673,
+ "################################": 49674,
+ "-|": 49675,
+ "¥ŀ": 49676,
+ "Ġwithd": 49677,
+ "ĠCth": 49678,
+ "AppData": 49679,
+ "Msg": 49680,
+ ":{": 49681,
+ "ãĤ¨": 49682,
+ "Ġtuple": 49683,
+ "ç¥ŀ": 49684,
+ "Ġintrins": 49685,
+ "ĠCooldown": 49686,
+ "ategory": 49687,
+ "^{": 49688,
+ "ãĥĬ": 49689,
+ "''''": 49690,
+ "çͰ": 49691,
+ "ĠDEBUG": 49692,
+ "Ġcannabin": 49693,
+ "ocobo": 49694,
+ "Invalid": 49695,
+ "ãĥĢ": 49696,
+ "Compat": 49697,
+ "Ġ({": 49698,
+ "Removed": 49699,
+ "Ġconvol": 49700,
+ "}:": 49701,
+ "interstitial": 49702,
+ "Ġ": 49703,
+ "Ġcontrace": 49704,
+ "uyomi": 49705,
+ "Callback": 49706,
+ "Parser": 49707,
+ "äºĶ": 49708,
+ "Versions": 49709,
+ "::::": 49710,
+ "Recomm": 49711,
+ "}\\": 49712,
+ "Ġ\"_": 49713,
+ "Debug": 49714,
+ "ĠAoE": 49715,
+ "atever": 49716,
+ "ĠTradable": 49717,
+ "Reloaded": 49718,
+ "ĠReincarnated": 49719,
+ "ĠStrongh": 49720,
+ ">\"": 49721,
+ "initialized": 49722,
+ "Ġexting": 49723,
+ "Poké": 49724,
+ "Parameters": 49725,
+ "¶ħ": 49726,
+ "########": 49727,
+ "NULL": 49728,
+ "ãĥĩ": 49729,
+ "groupon": 49730,
+ "\\-": 49731,
+ "ãĥı": 49732,
+ "ãĤ±": 49733,
+ "Ġsubsequ": 49734,
+ "ccording": 49735,
+ "ĠMODULE": 49736,
+ "ĠProtoss": 49737,
+ "\"},{\"": 49738,
+ "Ġ..............": 49739,
+ "Integer": 49740,
+ "endif": 49741,
+ "ãĥĻ": 49742,
+ "parser": 49743,
+ "lambda": 49744,
+ "Ġcarbohyd": 49745,
+ "ĠUnloaded": 49746,
+ "_{": 49747,
+ "âĸ¬âĸ¬": 49748,
+ "Ġdebian": 49749,
+ "]}": 49750,
+ "ãĤ¶": 49751,
+ "Parameter": 49752,
+ "ãĤ£": 49753,
+ "ãĤ»": 49754,
+ "Ġ$_": 49755,
+ "İĭ": 49756,
+ "Ġiterator": 49757,
+ "ãĤ¬": 49758,
+ "WINDOWS": 49759,
+ "CONCLUS": 49760,
+ "Ġ\"\\": 49761,
+ "umbn": 49762,
+ "(&": 49763,
+ "ãĥ©ãĥ³": 49764,
+ "usercontent": 49765,
+ "ometimes": 49766,
+ "METHOD": 49767,
+ "ãĥ¢": 49768,
+ "potion": 49769,
+ "ãĥ¯": 49770,
+ "everal": 49771,
+ "Ġweap": 49772,
+ "minecraft": 49773,
+ "================================": 49774,
+ "printf": 49775,
+ "ĠShinra": 49776,
+ "Ġreluct": 49777,
+ "\\\",": 49778,
+ "Runtime": 49779,
+ "xff": 49780,
+ "ĠAbyssal": 49781,
+ "akeru": 49782,
+ "Ġ\\(\\": 49783,
+ "\"/>": 49784,
+ "efficients": 49785,
+ "Ü": 49786,
+ "avascript": 49787,
+ "Ġbehavi": 49788,
+ "++;": 49789,
+ "=#": 49790,
+ "Attributes": 49791,
+ "âĵĺ": 49792,
+ "lvl": 49793,
+ "¬¼": 49794,
+ "/**": 49795,
+ "Gameplay": 49796,
+ "ĠLeilan": 49797,
+ ">)": 49798,
+ "=\"/": 49799,
+ "Ġ));": 49800,
+ "ãĥĨãĤ£": 49801,
+ "ġ": 49802,
+ ".": 49803,
+ "Ġantidepress": 49804,
+ "Ġhtt": 49805,
+ "################": 49806,
+ "arnaev": 49807,
+ "ãĤ½": 49808,
+ "DERR": 49809,
+ "¥µ": 49810,
+ "âĸĪ": 49811,
+ "Ġ|--": 49812,
+ "Ġundermin": 49813,
+ "Ġ)))": 49814,
+ "ãĥĩãĤ£": 49815,
+ "awaru": 49816,
+ "\":[{\"": 49817,
+ "aution": 49818,
+ "ãĤ¤ãĥĪ": 49819,
+ "ô": 49820,
+ "ĠILCS": 49821,
+ "dfx": 49822,
+ "ĨĴ": 49823,
+ "âĸĴ": 49824,
+ "Ġcitiz": 49825,
+ "Ġ-=": 49826,
+ "ĠAllaah": 49827,
+ "Ġ(_": 49828,
+ "ĸļ": 49829,
+ "Ġ{\\": 49830,
+ "Ġsrf": 49831,
+ "ãĤ´": 49832,
+ "æŃ¦": 49833,
+ "»Ĵ": 49834,
+ "Ptr": 49835,
+ "'>": 49836,
+ "DEBUG": 49837,
+ "âĶģ": 49838,
+ "ãĢı": 49839,
+ "WithNo": 49840,
+ "Redditor": 49841,
+ "ĠâĶľ": 49842,
+ "Ġfmt": 49843,
+ "ãĢİ": 49844,
+ "Ġmsec": 49845,
+ "ĪĴ": 49846,
+ "eatures": 49847,
+ "itially": 49848,
+ "\"\"\"": 49849,
+ "ãĥ¼ãĤ¯": 49850,
+ "Textures": 49851,
+ "\"},": 49852,
+ "\">": 49853,
+ "Ġenthusi": 49854,
+ "CHAPTER": 49855,
+ "Ġunbeliev": 49856,
+ "Ġearthqu": 49857,
+ "Ġ><": 49858,
+ "||||": 49859,
+ "ß": 49860,
+ "iterator": 49861,
+ "è£ħ": 49862,
+ "Ĥª": 49863,
+ "ojure": 49864,
+ "ãħĭãħĭ": 49865,
+ "ãĥ¼ãĥ³": 49866,
+ "Ġprintln": 49867,
+ "Ġ][": 49868,
+ "âĸĪâĸĪ": 49869,
+ "âķIJ": 49870,
+ "\\\":": 49871,
+ "senal": 49872,
+ "é¾į": 49873,
+ "é¾": 49874,
+ "Ġcryst": 49875,
+ "ãĥķãĤ¡": 49876,
+ "ĠCosponsors": 49877,
+ "ãĤ·ãĥ£": 49878,
+ "Magikarp": 49879,
+ "ĠMagicka": 49880,
+ "âĸĪâĸĪâĸĪâĸĪ": 49881,
+ ",,,,,,,,": 49882,
+ "vertisement": 49883,
+ "âĶĢâĶĢâĶĢâĶĢ": 49884,
+ "ãĥķãĤ©": 49885,
+ "luaj": 49886,
+ "CLASSIFIED": 49887,
+ ".''.": 49888,
+ "byss": 49889,
+ "Ġ{:": 49890,
+ "ĠNanto": 49891,
+ "Ġptr": 49892,
+ "Ġ%%": 49893,
+ "Ġteasp": 49894,
+ "[_": 49895,
+ "ãĥ¤": 49896,
+ "ħĭ": 49897,
+ "ŃĶ": 49898,
+ "Ġpci": 49899,
+ "Ġ\"<": 49900,
+ "GGGGGGGG": 49901,
+ "æĪ¦": 49902,
+ "--+": 49903,
+ "ãĤ®": 49904,
+ "Ġ())": 49905,
+ "âĸ¬": 49906,
+ "Ġsizeof": 49907,
+ "}}}": 49908,
+ ";;;;;;;;": 49909,
+ ">]": 49910,
+ "âĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪ": 49911,
+ "Vaults": 49912,
+ "Ġistg": 49913,
+ "Ġnewcom": 49914,
+ "=]": 49915,
+ "¿½": 49916,
+ "ĵĺ": 49917,
+ "{\\": 49918,
+ "Args": 49919,
+ "Ġexha": 49920,
+ "(\\": 49921,
+ "Ġunnecess": 49922,
+ "\"}],\"": 49923,
+ "ĠUNCLASSIFIED": 49924,
+ ">(": 49925,
+ "ãĤ¢ãĥ«": 49926,
+ "æ©": 49927,
+ "70710": 49928,
+ "Ń·": 49929,
+ "ãĥ¼ãĥĨãĤ£": 49930,
+ "ĠSakuya": 49931,
+ "ãĥĥãĥī": 49932,
+ "ĠPyrrha": 49933,
+ "escription": 49934,
+ "VIDIA": 49935,
+ "================================================================": 49936,
+ "Ġlooph": 49937,
+ "=~": 49938,
+ "Ġcumbers": 49939,
+ "Ġ)]": 49940,
+ "govtrack": 49941,
+ "ĠãĤµ": 49942,
+ "Ġsubur": 49943,
+ "Þ": 49944,
+ "Ġâī¡": 49945,
+ "Interstitial": 49946,
+ "ãĥ¼ãĥĨ": 49947,
+ "Ġgobl": 49948,
+ "ãĥīãĥ©": 49949,
+ "oldown": 49950,
+ "ģĸ": 49951,
+ "Depths": 49952,
+ "Ġ());": 49953,
+ "Ġ._": 49954,
+ "20439": 49955,
+ "Ġç¥ŀ": 49956,
+ "ãģ®å®": 49957,
+ "ãĤ¼": 49958,
+ "Ġ$\\": 49959,
+ "âĹ¼": 49960,
+ "Ġencount": 49961,
+ "Ġ":48457,"Ġstreng":48458,"agascar":48459,"guyen":48460,"((":48461,")[":48462,"ĠNorn":48463,"Ġhippocamp":48464,"Ġ¯":48465,"îĢ":48466,"Connection":48467,"PATH":48468,"mbuds":48469,"ĠShards":48470,"Ġadvoc":48471,"Ġsimulac":48472,"âĸij":48473,"!?\"":48474,"ĠPotion":48475,"Ġamulet":48476,"ĠFnatic":48477,"Ġcryptoc":48478,"wav":48479,"radius":48480,"pkg":48481,"ĠMFT":48482,"æĢ":48483,"Ġtoile":48484,"Items":48485,"ifference":48486,"errors":48487,"ĠCelt":48488,"Ġunpop":48489,"ilogy":48490,"6666":48491,"hesda":48492,"Instruct":48493,"å·":48494,"Materials":48495,"ettings":48496,"Percent":48497,"Ġresistor":48498,"tymology":48499,"Ġdeprecated":48500,"Ġgrep":48501,"ĠWRITE":48502,"Ġtriv":48503,"Ġscrut":48504,"[/":48505,"anyl":48506,"skirts":48507,"MSN":48508,"ĠCodec":48509,"ecd":48510,"Anth":48511,"){":48512,"%]":48513,"veyard":48514,"aspberry":48515,"ãĢ":48516,"Reward":48517,"rha":48518,"Stretch":48519,"]-":48520,"Prev":48521,"Context":48522,"Ġlinux":48523,"HAHA":48524,"perties":48525,"ĠVIDE":48526,"Domain":48527,"Ġmurd":48528,"ĠLegions":48529,"apache":48530,"æŃ":48531,"Pause":48532,"Temperature":48533,"ufact":48534,"igslist":48535,"ĠRetrieved":48536,"èª":48537,"ãģĮ":48538,"Ingredients":48539,"ruary":48540,"dyl":48541,"Alias":48542,"ĠÎĶ":48543,"Ġinval":48544,"amsung":48545,"!--":48546,"olean":48547,"æī":48548,"ãģ¯":48549,"Ġcoefficients":48550,"ĠDHCP":48551,"âĨĴ":48552,"utonium":48553,":[":48554,"âĹ":48555,"cli":48556,"Container":48557,"å¼":48558,"nexus":48559,"SOURCE":48560,"Ò":48561,"=/":48562,"Ġmysql":48563,"ĠGained":48564,"Ġ/*":48565,"uncture":48566,"Ġstatically":48567,"âĸł":48568,"æĺ¯":48569,"æ°":48570,"estamp":48571,"Cache":48572,"ulkan":48573,"staking":48574,"apter":48575,"ãģ¾":48576,"Ġμg":48577,"Ġtremend":48578,"ĠPiercing":48579,"naissance":48580,"ĠHealer":48581,"Enabled":48582,"éģ":48583,"âĸ":48584,"ĠThumbnails":48585,"Ġhither":48586,"Format":48587,"utherland":48588,"íķ":48589,"Ġdestro":48590,"fff":48591,"execute":48592,"msg":48593,"romancer":48594,"ĠCanaver":48595,"ĠVaults":48596,"oided":48597,"iage":48598,"Ġimg":48599,"summary":48600,"]);":48601,"ĠABE":48602,"ĠGamergate":48603,"utherford":48604,"Ġoverwrite":48605,"enment":48606,"æķ":48607,"Ġsystemd":48608,"tif":48609,"]).":48610,"ãĤ¤":48611,"Widget":48612,"======":48613,"(-":48614,"Ġ\"+":48615,"ĠIncarnation":48616,"æĥ":48617,"���":48618,"GUI":48619,"èĥ":48620,"forums":48621,"Ġrunes":48622,"Ġâī¤":48623,"Ġdefic":48624,"Distance":48625,"directory":48626,"ĠHorus":48627,"iltr":48628,"ortium":48629,"Ġ./":48630,"bda":48631,"owship":48632,"ĠâĨij":48633,"}.":48634,"åĩ":48635,"1027":48636,"Weapons":48637,"lucent":48638,"Ġauth":48639,";;":48640,"Recommended":48641,"Ġsurv":48642,"Ġvm":48643,"ĠStronghold":48644,"Ġparan":48645,"ĠTrance":48646,"æĺ":48647,"Ġsovere":48648,"Ġcorrid":48649,"ĠPwr":48650,"Ġ[/":48651,"Ġseq":48652,"Population":48653,"Ġ[];":48654,"Ġreferen":48655,"ĠInstr":48656,"ĠStamina":48657,"kernel":48658,"Python":48659,"-+":48660,"Ġallele":48661,"éĽ":48662,"isode":48663,"ä¸į":48664,"otonin":48665,"modules":48666,"Notable":48667,"Spell":48668,"\\\\":48669,"Pref":48670,"Ġdatas":48671,"setup":48672,"Ġhapl":48673,"Height":48674,"åĭ":48675,"ãģ£":48676,"]),":48677,"Handle":48678,"umenthal":48679,"Package":48680,"Ġenthus":48681,"Ġunsus":48682,"Narr":48683,"Examples":48684,"FAQ":48685,"REDACTED":48686,"Ġnotor":48687,"Enable":48688,"Pattern":48689,"aeda":48690,">.":48691,"CHECK":48692,"Ġ����":48693,"Ġ'.":48694,"Ġãĥ":48695,"append":48696,"����":48697,"gemony":48698,"terness":48699,"ĠHaku":48700,"NVIDIA":48701,"queue":48702,"Bind":48703,"Ġneigh":48704,"armor":48705,"retty":48706,"LOD":48707,"plugins":48708,"Ġ/>":48709,"TYPE":48710,"Ġ4096":48711,"-------":48712,"Preview":48713,"FML":48714,"Ġproletarian":48715,"zees":48716,"enfranch":48717,"ãģĨ":48718,"Ctrl":48719,"Module":48720,"ĠSurviv":48721,"ĠStarcraft":48722,"rored":48723,"reddit":48724,"Ġrul":48725,"Ġtx":48726,"Ġmage":48727,"Sword":48728,"Ġ~/":48729,"Effects":48730,"éļ":48731,"ä¹":48732,"Sensor":48733,"Solution":48734,"ãģĻ":48735,"Arcade":48736,"Ġpredec":48737,"Values":48738,"Length":48739,"Ġfortun":48740,"ttp":48741,"\"[":48742,"tmp":48743,"ĠBerserker":48744,"åĨ":48745,"ositories":48746,"Ġcouncill":48747,"ffff":48748,"));":48749,"Recipe":48750,"ĠASCII":48751,"âĦ¢:":48752,"ä":48753,"Ġhorm":48754,"=>":48755,"sers":48756,"ãģĭ":48757,"Recommend":48758,"['":48759,"agame":48760,"Animation":48761,"aucuses":48762,"Discussion":48763,"Ġhelicop":48764,"å¿":48765,"Float":48766,"Component":48767,"instance":48768,"Ġfoo":48769,"localhost":48770,"=-":48771,"Offset":48772,"Psy":48773,"ĠGohan":48774,"buquerque":48775,"Ġdefe":48776,"chwitz":48777,"parse":48778,"Ġdors":48779,"Ġspons":48780,"Ġasync":48781,"agonists":48782,"Ġindo":48783,".>>":48784,"ĠDisciple":48785,"Ġfilename":48786,"rency":48787,"ĠDise":48788,"Ġ\"/":48789,"template":48790,"ãĤ¹":48791,"swers":48792,"Ġ++":48793,"Ġ[(":48794,"thora":48795,"ĠDepths":48796,"livious":48797,"Ġdisadvant":48798,"foundland":48799,"Upload":48800,"Ġ§§":48801,"Ġsophistic":48802,";}":48803,"izont":48804,"\"}":48805,"estial":48806,"Ranked":48807,"ĠOccupations":48808,"LEASE":48809,"ĠOgre":48810,"folder":48811,"Plot":48812,"farious":48813,"Ġsuscept":48814,"Types":48815,"Discuss":48816,"Ġ'/":48817,"æµ":48818,"earable":48819,"æ³":48820,"Tile":48821,"iatus":48822,"åŃ":48823,"Ġreperto":48824,"Helper":48825,"Returns":48826,"ä¸Ĭ":48827,"imaru":48828,"Ġreq":48829,"Ġdissatisf":48830,"multipl":48831,"}{":48832,"-[":48833,"itial":48834,"*/":48835,"Config":48836,"Example":48837,"ĠjQuery":48838,"Mods":48839,"ĠGPIO":48840,"Ġlaun":48841,"layout":48842,"cised":48843,"Ġ......":48844,"+++":48845,"prototype":48846,"Exception":48847,"Ġsubsections":48848,"Ġresemb":48849,"Ġâĩ":48850,"ĠPubMed":48851,"username":48852,"Ġaggro":48853,"éĥ":48854,"Ġ};":48855,"ĠMages":48856,"ryu":48857,"apons":48858,"Optional":48859,"ĠAncients":48860,"ãĤĬ":48861,"Quotes":48862,"oaded":48863,"Ġsuspic":48864,"inline":48865,"omial":48866,"ĠMahjong":48867,"auntlets":48868,"Ġanarchism":48869,"Ġsubclass":48870,"ĠMLG":48871,"...]":48872,"Dialog":48873,"uphem":48874,"Ġrecursive":48875,"7601":48876,"frac":48877,"Else":48878,"ĠSeverus":48879,"},{\"":48880,"ĠCLIENT":48881,"Ġjavascript":48882,"sama":48883,"ĠLearns":48884,"ãĤĤ":48885,"Upgrade":48886,"Listener":48887,"Ġsnipp":48888,"Ġrune":48889,"ĠTTL":48890,"ertation":48891,"olicy":48892,"=\"\"":48893,"«ĺ":48894,"Ġexpr":48895,"ovych":48896,"Ġãģ":48897,"_-_":48898,"munition":48899,"////":48900,"func":48901,">>>>":48902,"Provider":48903,"Ïī":48904,"BUG":48905,"Ġ[-":48906,"Ġarrang":48907,"merce":48908,"ãĥ":48909,"incarn":48910,"Valid":48911,"ĠAether":48912,"ãĤĵ":48913,"ĠUTF":48914,"ĠMonstrous":48915,"ãĤĮ":48916,"hedon":48917,"áµ":48918,":#":48919,"ĠFrieza":48920,"padding":48921,"Reviewer":48922,"Ġpsychiat":48923,"yrinth":48924,"ĠâĶĤ":48925,"hillary":48926,"Static":48927,"Newsletter":48928,"Avg":48929,"Ġfn":48930,"Topic":48931,"choes":48932,"Ġnewsp":48933,"á¸":48934,"Ġ[+":48935,"~~~~~~~~~~~~~~~~":48936,":]":48937,"apego":48938,"buf":48939,"Translation":48940,"ById":48941,"Ġmmol":48942,"ãĥ¼ãĥ":48943,"å½":48944,"ãĤī":48945,"Ġparser":48946,"ãĥª":48947,"`,":48948,"Lair":48949,")}":48950,"ypes":48951,"adobe":48952,"Ġancest":48953,"ernel":48954,"ĠNULL":48955,"ç«":48956,"anguages":48957,"Increases":48958,"æĦ":48959,"utorial":48960,"ithmetic":48961,"dll":48962,"ĠArcane":48963,"çī":48964,"Ġtc":48965,"urtles":48966,"èĪ":48967,"Bytes":48968,"Slot":48969,"ĠBahá":48970,"Weapon":48971,"widget":48972,"querque":48973,"Ġembodiments":48974,"å¥":48975,"WARN":48976,"swer":48977,"thumbnails":48978,"FFFF":48979,"inguishable":48980,"Ġâī":48981,"Ġ${":48982,"AAAAAAAA":48983,"Conclusion":48984,"ĻĤ":48985,"disable":48986,"Rect":48987,"Ġsubp":48988,"Ġ().":48989,"ĠDetected":48990,"èĢ":48991,"[]":48992,"Ġcoerc":48993,"ĠmM":48994,"recated":48995,"fusc":48996,"ĠSorce":48997,"çĶŁ":48998,").[":48999,"Ġ})":49000,"mobi":49001,"yip":49002,"Acknowled":49003,"ternity":49004,"iqueness":49005,"ython":49006,"><":49007,"Ġstd":49008,"Url":49009,"Ġnamespace":49010,"Ġtion":49011,"oother":49012,"Ó":49013,"Ġhemor":49014,"Ġrg":49015,"ventory":49016,"ãĤ¢":49017,"anamo":49018,"Socket":49019,"Topics":49020,"apeshifter":49021,"gnu":49022,"Ġdetrim":49023,"`.":49024,"romeda":49025,"çIJ":49026,"Ġlambda":49027,"Compan":49028,"Variable":49029,"Ġusb":49030,"ĠAdamant":49031,"ournal":49032,"Ġcovari":49033,"ãĥ©":49034,"éĸ":49035,"åİ":49036,"otaur":49037,"Ġ(),":49038,"Marginal":49039,"ãģı":49040,"Ġphysic":49041,"adeon":49042,"RESULTS":49043,"200000":49044,"ãģį":49045,"udeb":49046,"ãģĵ":49047,"COMPLE":49048,"Ġmsg":49049,"ghazi":49050,"/*":49051,"ĠDeity":49052,"Ġdisapp":49053,"Availability":49054,"Ġillum":49055,"à©":49056,"ptives":49057,",âĢĶ":49058,"chnology":49059,"Ġaccur":49060,"Ġapi":49061,"Obj":49062,"ãĤ«":49063,"ãĤ¸":49064,"ä¹ĭ":49065,"ËĪ":49066,"Ġtcp":49067,"Required":49068,".<":49069,"\".[":49070,"Ġ~/.":49071,"Ġobser":49072,"RFC":49073,"Ġintegers":49074,"åī":49075,"Installation":49076,"Ô":49077,"ó":49078,"csv":49079,"ãĥ«":49080,"ĠNoticed":49081,"âĸĵ":49082,"Tumblr":49083,"Reply":49084,"||":49085,"Ġconclud":49086,"Ġ))":49087,"ebin":49088,"sql":49089,"Closure":49090,"++++":49091,"],[":49092,"âĹı":49093,"Ġprolet":49094,"Ġ>=":49095,"estinal":49096,"Ġ[*":49097,"ĠInquisitor":49098,"Ġcmd":49099,"FINE":49100,"CRIP":49101,"Ġvertex":49102,"TeX":49103,"///":49104,"Ö¼":49105,"iscons":49106,"Ġmyster":49107,"Changed":49108,"timeout":49109,"irtual":49110,"Methods":49111,"Ġcerts":49112,"texture":49113,"Roaming":49114,"Proxy":49115,"Override":49116,"éĹ":49117,"utf":49118,"python":49119,"ĠRarity":49120,"ilitarian":49121,"çľ":49122,"().":49123,"æł":49124,"Ġbuf":49125,"åij":49126,"çķ":49127,"Ġ*.":49128,"umerable":49129,"~~~~":49130,"å¦":49131,"Ġsimultane":49132,"Ġjson":49133,"Requires":49134,"Ġperl":49135,"Interface":49136,"rupal":49137,"":49138,"uilt":49139,"mercial":49140,"ĠPalestin":49141,"theless":49142,")=":49143,"Generic":49144,"&&":49145,"ALSE":49146,"Ġdebugger":49147,"paralle":49148,"acly":49149,"ĠScourge":49150,")].":49151,"Ġinstr":49152,"Ġ{}":49153,"]+":49154,"Ġdilig":49155,"åŃIJ":49156,"Ġcaptcha":49157,"kefeller":49158,"iosyncr":49159,"Ġchars":49160,"Ġinitialize":49161,"Width":49162,"Ġgithub":49163,"Ġinitialization":49164,"ĠGamerGate":49165,"Ġþ":49166,"drm":49167,"slaught":49168,"Ġtiss":49169,".............":49170,"Ĥ¬":49171,"Ġplent":49172,"ãģķ":49173,"cfg":49174,"âĨ":49175,"Ġpokemon":49176,"\"],":49177,"Ġtyr":49178,"SELECT":49179,"othal":49180,"Tags":49181,"ĠMarketable":49182,"-----------":49183,"icter":49184,"irlf":49185,"ormons":49186,"Database":49187,"ĠãĤ":49188,"Ġ{\"":49189,"î":49190,"Handler":49191,"âĶĢ":49192,"$$$$":49193,"ĠJaune":49194,"ãĤ³":49195,"(),":49196,")+":49197,"--------":49198,"Ġshenan":49199,"Ġwelf":49200,"Ġ',":49201,"attribute":49202,"Uncommon":49203,"maxwell":49204,"Browser":49205,"ĠPastebin":49206,"uberty":49207,"debug":49208,"Ġmosqu":49209,"ĠBoolean":49210,"wcs":49211,"é£":49212,"/âĢĭ":49213,"çĦ":49214,"(){":49215,"////////////////////////////////":49216,"ĠGleaming":49217,"regor":49218,"ĠMercenary":49219,"ensional":49220,"mpeg":49221,"sudo":49222,"ãģ®å":49223,"iggurat":49224,"vironment":49225,"Directory":49226,"ĠDecoder":49227,"SPONSORED":49228,"intendo":49229,"Ġ<=":49230,"btn":49231,"ï¸":49232,"ä½ľ":49233,"paio":49234,"Tokens":49235,"ãĢį":49236,"params":49237,"Offline":49238,"Ġmetab":49239,"ĠLisp":49240,"anwhile":49241,">:":49242,"itialized":49243,"HTTP":49244,"Trivia":49245,"Sov":49246,"wrapper":49247,"={":49248,"ĠAzerb":49249,"aeper":49250,"Ġneighb":49251,"initions":49252,"Ġsts":49253,"ĠSasuke":49254,"#$":49255,"uliffe":49256,"æĸ¹":49257,"++++++++++++++++":49258,"ĠElven":49259,"ãģĤ":49260,"Ġartif":49261,"Folder":49262,"Ġà¨":49263,"åĤ":49264,"Ġphyl":49265,"uggest":49266,"blance":49267,"ãģł":49268,"Requirements":49269,"Usage":49270,"Ġinitialized":49271,"ã쮿":49272,"conservancy":49273,"ĠReincarn":49274,")|":49275,"Ġantioxid":49276,"ĠClicker":49277,"Ġunlaw":49278,"Ġ\\(":49279,"ãĥĪ":49280,"Ġ[*]":49281,"Characters":49282,"////////":49283,"ãĢIJ":49284,"ãĤ·":49285,"webkit":49286,"ãĢij":49287,"Ġxp":49288,"alkyrie":49289,"Console":49290,"());":49291,"ĠKorra":49292,"\"))":49293,"oooooooooooooooo":49294,"Timer":49295,"////////////////":49296,"yout":49297,"engeance":49298,"emetery":49299,"Ġmages":49300,"mods":49301,"Null":49302,"Ġphilos":49303,"ascript":49304,"Ġaddon":49305,"ĠâĸĪ":49306,"emale":49307,"----------------------------------------------------------------":49308,"Ġ\\\\":49309,"=[":49310,"ĠParables":49311,"ãĥĨ":49312,"VALUE":49313,"Ġ@@":49314,"Ġuint":49315,"${":49316,"cpp":49317,"%%":49318,"Ġ(âĪĴ":49319,"utils":49320,"prefix":49321,"å°Ĩ":49322,"ãĥŃ":49323,"Completed":49324,"Ġgoto":49325,"ãĤ¯":49326,"Winged":49327,"perty":49328,"[\"":49329,"ãĥİ":49330,"ĠScythe":49331,"Ġæľ":49332,"Ġ!=":49333,"Buffer":49334,"docker":49335,"ĠWATCHED":49336,"èĢħ":49337,"())":49338,"Ġdst":49339,"SIZE":49340,"ĠDemonic":49341,"Ġresil":49342,"ãĤ¿":49343,"Ġpione":49344,"cpu":49345,"++)":49346,"TEXT":49347,"Ġdiscrep":49348,"debian":49349,"quished":49350,"Ġacknow":49351,"Ġtrave":49352,"Ġgcc":49353,"Catalog":49354,"ctrl":49355,"ĠMoroc":49356,"Ġcpu":49357,"Ġ];":49358,"ĠSorceress":49359,"Introduced":49360,"Frames":49361,"Ġcondem":49362,"¶æ":49363,"~~~~~~~~":49364,"ĠEmacs":49365,"][/":49366,"Ġglim":49367,"Init":49368,"ĠPrimordial":49369,"ãĥĥ":49370,"Ġ+=":49371,"Ġblat":49372,"à¼":49373,"------------------------------------------------":49374,"gpu":49375,"ãĥĥãĥĪ":49376,"Ġxml":49377,"Ġboolean":49378,"References":49379,"Ġ?)":49380,"Ġsatell":49381,"Queue":49382,"Ġpestic":49383,"Ġ}}":49384,"Attribute":49385,"Ġdx":49386,"ĠDefin":49387,"Synopsis":49388,"..................":49389,"ãĥ¬":49390,"plugin":49391,"Disable":49392,"0000000000000000":49393,")\\":49394,"ĠIchigo":49395,"println":49396,"rontal":49397,"Setup":49398,"Ġ��������":49399,"å§":49400,"âĸº":49401,"ĠPengu":49402,"ailability":49403,"Duration":49404,"Timeout":49405,"ãĢĮ":49406,"Ġbehav":49407,"Reviewed":49408,"Ġtoget":49409,"\\.":49410,"lished":49411,"Ġthous":49412,"Ġperpend":49413,"ecause":49414,"Layout":49415,"è»":49416,"ĠDexterity":49417,"unsigned":49418,"+=":49419,"[[":49420,"ĠRunes":49421,"ãĤ¦":49422,"};":49423,"})":49424,"FTWARE":49425,"ength":49426,"milo":49427,"duino":49428,"天":49429,"ĠClojure":49430,"ļé":49431,"ãĥ¥":49432,"gradient":49433,"Ġ\"\"\"":49434,"âĨij":49435,"@#":49436,"JSON":49437,"Ġproport":49438,"addr":49439,"});":49440,"ãĥIJ":49441,"ä¸ī":49442,"Ġtmp":49443,"å£":49444,"../":49445,"zsche":49446,"Ġâμ":49447,"Entity":49448,"æ©Ł":49449,"ĠâĶľâĶĢâĶĢ":49450,"filename":49451,"{{":49452,"@@":49453,"ĠSeym":49454,"Ġ/**":49455,"ĠSummoner":49456,"Quantity":49457,"ç·":49458,"Attach":49459,"Ġbool":49460,"Texture":49461,"Ġopio":49462,".}":49463,"ãĥĭ":49464,"integer":49465,"Ġregex":49466,"Ġnomine":49467,"ription":49468,"ãģ®ç":49469,"ãĥķ":49470,"Ġsubparagraph":49471,"GGGG":49472,"Ġexplan":49473,"Header":49474,"Spawn":49475,"toggle":49476,"²¾":49477,"Abyss":49478,"expr":49479,"ĠZerg":49480,"ĠGrimoire":49481,"Contents":49482,"Instance":49483,"cyclopedia":49484,"ãĥĹ":49485,"ĠTakeru":49486,"=(":49487,"代":49488,"\\)":49489,"Ġrgb":49490,"htt":49491,"bryce":49492,"Ġlivest":49493,"ĠAnnotations":49494,"âĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢ":49495,"berus":49496,"ntil":49497,"Ġskelet":49498,"callback":49499,"åħī":49500,"Joined":49501,"ãĤª":49502,"Ġargs":49503,"artifacts":49504,"Ġå¤":49505,"ÃĽ":49506,"ãĥŀ":49507,"Streamer":49508,"}\"":49509,"Ġunden":49510,"ãĥģ":49511,"Īè":49512,"ãĥ£":49513,"Ġ0004":49514,"Ġ\\'":49515,"ãĤ°":49516,"ĠCONFIG":49517,"Ġ#####":49518,"``":49519,"anguage":49520,"Ġ*)":49521,"Template":49522,"MODE":49523,"Ġ00000000":49524,"'';":49525,">":49526,"士":49527,"essage":49528,"ntax":49529,"Cmd":49530,"ividual":49531,"Unix":49532,"è£":49533,"çĭ":49534,"使":49535,"():":49536,"ãĥī":49537,"gdala":49538,"etheless":49539,"ktop":49540,"ĠACPI":49541,"ãĥĸ":49542,"Ġsshd":49543,"Ġ000000":49544,"Ġchalleng":49545,"âĶĢâĶĢ":49546,"ĠFlavoring":49547,"çİĭ":49548,"Http":49549,"Ĭ±":49550,"Accessory":49551,"oldemort":49552,"ĠIzan":49553,"galitarian":49554,"ĠChocobo":49555,"edIn":49556,"++++++++":49557,"Ġprintf":49558,"çīĪ":49559,"izoph":49560,"ruciating":49561,"Ġenum":49562,",,,,":49563,"Ġpregn":49564,"sembly":49565,"Ġtherap":49566,"Ġingred":49567,"ãĤµ":49568,"Ġsql":49569,"(*":49570,"Appearance":49571,"ngth":49572,"invoke":49573,"ãĥĥãĤ¯":49574,"ctx":49575,"Ġdmg":49576,"Plugin":49577,"ãĥ¡":49578,"ulhu":49579,"ãĤ§":49580,"Ġwarr":49581,"Ġmetic":49582,"女":49583,"Ġoun":49584,"ð":49585,"Ġtooltip":49586,"ãĤŃ":49587,"Ġvolunte":49588,"imgur":49589,"accompan":49590,"aterasu":49591,"olkien":49592,"ãĤº":49593,"Ġnodd":49594,"ĠMetatron":49595,"javascript":49596,"umbledore":49597,"ãĥł":49598,"--------------------------------------------------------":49599,"runtime":49600,"ĠLeban":49601,"Configuration":49602,"emort":49603,"(_":49604,"Connector":49605,"iosyn":49606,"reddits":49607,"Ġ\"%":49608,"Ġ[&":49609,"ĠSwordsman":49610,"ĠAwoken":49611,"Ġ;;":49612,"ãĥ¼ãĥ«":49613,"Ġ:=":49614,"ãĤ¹ãĥĪ":49615,"Ġcomr":49616,"Adapter":49617,"sbm":49618,"âķIJâķIJ":49619,"çļ":49620,"Loader":49621,"ãĥĵ":49622,"okemon":49623,"ãģ®é":49624,"-->":49625,"Ġlvl":49626,"Footnote":49627,"Iter":49628,"####":49629,"ãĥij":49630,"ĠCarbuncle":49631,"Ġ[+]":49632,"Ġmathemat":49633,"Allows":49634,"Ġ4090":49635,"Async":49636,"ģ«":49637,"Ͻ":49638,"))))":49639,"á½":49640,"Ġcx":49641,"Ġansw":49642,"{\"":49643,"ãĥŁ":49644,"addons":49645,"Filename":49646,"Appearances":49647,"ĠãĢĮ":49648,"Ġaddr":49649,"Ġcharact":49650,"glomer":49651,"Advertisements":49652,"Ġdracon":49653,"ĠFenrir":49654,"Ġ();":49655,"ĠCitiz":49656,"acebook":49657,"Ġparams":49658,"]=":49659,"Ġsubscript":49660,"Ġentreprene":49661,"tnc":49662,"iversal":49663,"Ġmillenn":49664,"ithub":49665,"/>":49666,"Ġ\"{":49667,"Frameworks":49668,"avorite":49669,"Ġ])":49670,"Constructed":49671,"fml":49672,"ãĥį":49673,"################################":49674,"-|":49675,"¥ŀ":49676,"Ġwithd":49677,"ĠCth":49678,"AppData":49679,"Msg":49680,":{":49681,"ãĤ¨":49682,"Ġtuple":49683,"ç¥ŀ":49684,"Ġintrins":49685,"ĠCooldown":49686,"ategory":49687,"^{":49688,"ãĥĬ":49689,"''''":49690,"çͰ":49691,"ĠDEBUG":49692,"Ġcannabin":49693,"ocobo":49694,"Invalid":49695,"ãĥĢ":49696,"Compat":49697,"Ġ({":49698,"Removed":49699,"Ġconvol":49700,"}:":49701,"interstitial":49702,"Ġ":49703,"Ġcontrace":49704,"uyomi":49705,"Callback":49706,"Parser":49707,"äºĶ":49708,"Versions":49709,"::::":49710,"Recomm":49711,"}\\":49712,"Ġ\"_":49713,"Debug":49714,"ĠAoE":49715,"atever":49716,"ĠTradable":49717,"Reloaded":49718,"ĠReincarnated":49719,"ĠStrongh":49720,">\"":49721,"initialized":49722,"Ġexting":49723,"Poké":49724,"Parameters":49725,"¶ħ":49726,"########":49727,"NULL":49728,"ãĥĩ":49729,"groupon":49730,"\\-":49731,"ãĥı":49732,"ãĤ±":49733,"Ġsubsequ":49734,"ccording":49735,"ĠMODULE":49736,"ĠProtoss":49737,"\"},{\"":49738,"Ġ..............":49739,"Integer":49740,"endif":49741,"ãĥĻ":49742,"parser":49743,"lambda":49744,"Ġcarbohyd":49745,"ĠUnloaded":49746,"_{":49747,"âĸ¬âĸ¬":49748,"Ġdebian":49749,"]}":49750,"ãĤ¶":49751,"Parameter":49752,"ãĤ£":49753,"ãĤ»":49754,"Ġ$_":49755,"İĭ":49756,"Ġiterator":49757,"ãĤ¬":49758,"WINDOWS":49759,"CONCLUS":49760,"Ġ\"\\":49761,"umbn":49762,"(&":49763,"ãĥ©ãĥ³":49764,"usercontent":49765,"ometimes":49766,"METHOD":49767,"ãĥ¢":49768,"potion":49769,"ãĥ¯":49770,"everal":49771,"Ġweap":49772,"minecraft":49773,"================================":49774,"printf":49775,"ĠShinra":49776,"Ġreluct":49777,"\\\",":49778,"Runtime":49779,"xff":49780,"ĠAbyssal":49781,"akeru":49782,"Ġ\\(\\":49783,"\"/>":49784,"efficients":49785,"Ü":49786,"avascript":49787,"Ġbehavi":49788,"++;":49789,"=#":49790,"Attributes":49791,"âĵĺ":49792,"lvl":49793,"¬¼":49794,"/**":49795,"Gameplay":49796,"ĠLeilan":49797,">)":49798,"=\"/":49799,"Ġ));":49800,"ãĥĨãĤ£":49801,"ġ":49802,".":49803,"Ġantidepress":49804,"Ġhtt":49805,"################":49806,"arnaev":49807,"ãĤ½":49808,"DERR":49809,"¥µ":49810,"âĸĪ":49811,"Ġ|--":49812,"Ġundermin":49813,"Ġ)))":49814,"ãĥĩãĤ£":49815,"awaru":49816,"\":[{\"":49817,"aution":49818,"ãĤ¤ãĥĪ":49819,"ô":49820,"ĠILCS":49821,"dfx":49822,"ĨĴ":49823,"âĸĴ":49824,"Ġcitiz":49825,"Ġ-=":49826,"ĠAllaah":49827,"Ġ(_":49828,"ĸļ":49829,"Ġ{\\":49830,"Ġsrf":49831,"ãĤ´":49832,"æŃ¦":49833,"»Ĵ":49834,"Ptr":49835,"'>":49836,"DEBUG":49837,"âĶģ":49838,"ãĢı":49839,"WithNo":49840,"Redditor":49841,"ĠâĶľ":49842,"Ġfmt":49843,"ãĢİ":49844,"Ġmsec":49845,"ĪĴ":49846,"eatures":49847,"itially":49848,"\"\"\"":49849,"ãĥ¼ãĤ¯":49850,"Textures":49851,"\"},":49852,"\">":49853,"Ġenthusi":49854,"CHAPTER":49855,"Ġunbeliev":49856,"Ġearthqu":49857,"Ġ><":49858,"||||":49859,"ß":49860,"iterator":49861,"è£ħ":49862,"Ĥª":49863,"ojure":49864,"ãħĭãħĭ":49865,"ãĥ¼ãĥ³":49866,"Ġprintln":49867,"Ġ][":49868,"âĸĪâĸĪ":49869,"âķIJ":49870,"\\\":":49871,"senal":49872,"é¾į":49873,"é¾":49874,"Ġcryst":49875,"ãĥķãĤ¡":49876,"ĠCosponsors":49877,"ãĤ·ãĥ£":49878,"Magikarp":49879,"ĠMagicka":49880,"âĸĪâĸĪâĸĪâĸĪ":49881,",,,,,,,,":49882,"vertisement":49883,"âĶĢâĶĢâĶĢâĶĢ":49884,"ãĥķãĤ©":49885,"luaj":49886,"CLASSIFIED":49887,".''.":49888,"byss":49889,"Ġ{:":49890,"ĠNanto":49891,"Ġptr":49892,"Ġ%%":49893,"Ġteasp":49894,"[_":49895,"ãĥ¤":49896,"ħĭ":49897,"ŃĶ":49898,"Ġpci":49899,"Ġ\"<":49900,"GGGGGGGG":49901,"æĪ¦":49902,"--+":49903,"ãĤ®":49904,"Ġ())":49905,"âĸ¬":49906,"Ġsizeof":49907,"}}}":49908,";;;;;;;;":49909,">]":49910,"âĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪ":49911,"Vaults":49912,"Ġistg":49913,"Ġnewcom":49914,"=]":49915,"¿½":49916,"ĵĺ":49917,"{\\":49918,"Args":49919,"Ġexha":49920,"(\\":49921,"Ġunnecess":49922,"\"}],\"":49923,"ĠUNCLASSIFIED":49924,">(":49925,"ãĤ¢ãĥ«":49926,"æ©":49927,"70710":49928,"Ń·":49929,"ãĥ¼ãĥĨãĤ£":49930,"ĠSakuya":49931,"ãĥĥãĥī":49932,"ĠPyrrha":49933,"escription":49934,"VIDIA":49935,"================================================================":49936,"Ġlooph":49937,"=~":49938,"Ġcumbers":49939,"Ġ)]":49940,"govtrack":49941,"ĠãĤµ":49942,"Ġsubur":49943,"Þ":49944,"Ġâī¡":49945,"Interstitial":49946,"ãĥ¼ãĥĨ":49947,"Ġgobl":49948,"ãĥīãĥ©":49949,"oldown":49950,"ģĸ":49951,"Depths":49952,"Ġ());":49953,"Ġ._":49954,"20439":49955,"Ġç¥ŀ":49956,"ãģ®å®":49957,"ãĤ¼":49958,"Ġ$\\":49959,"âĹ¼":49960,"Ġencount":49961,"Ġ